ipvtap.c 5.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240
  1. #include <linux/etherdevice.h>
  2. #include "ipvlan.h"
  3. #include <linux/if_vlan.h>
  4. #include <linux/if_tap.h>
  5. #include <linux/interrupt.h>
  6. #include <linux/nsproxy.h>
  7. #include <linux/compat.h>
  8. #include <linux/if_tun.h>
  9. #include <linux/module.h>
  10. #include <linux/skbuff.h>
  11. #include <linux/cache.h>
  12. #include <linux/sched.h>
  13. #include <linux/types.h>
  14. #include <linux/slab.h>
  15. #include <linux/wait.h>
  16. #include <linux/cdev.h>
  17. #include <linux/idr.h>
  18. #include <linux/fs.h>
  19. #include <linux/uio.h>
  20. #include <net/net_namespace.h>
  21. #include <net/rtnetlink.h>
  22. #include <net/sock.h>
  23. #include <linux/virtio_net.h>
/* Offload feature bits that ipvtap_newlink() assigns to tap.tap_features. */
#define TUN_OFFLOADS (NETIF_F_HW_CSUM | NETIF_F_TSO_ECN | NETIF_F_TSO | \
		      NETIF_F_TSO6)

/* Device number filled in by tap_create_cdev() in ipvtap_init(); its major
 * is combined with each tap's minor when device nodes are created/destroyed.
 */
static dev_t ipvtap_major;
/* cdev handed to tap_create_cdev() at init and tap_destroy_cdev() at exit. */
static struct cdev ipvtap_cdev;
  28. static const void *ipvtap_net_namespace(struct device *d)
  29. {
  30. struct net_device *dev = to_net_dev(d->parent);
  31. return dev_net(dev);
  32. }
  33. static struct class ipvtap_class = {
  34. .name = "ipvtap",
  35. .owner = THIS_MODULE,
  36. .ns_type = &net_ns_type_operations,
  37. .namespace = ipvtap_net_namespace,
  38. };
/* Private data of an ipvtap net_device (see .priv_size in ipvtap_link_ops):
 * the ipvlan device state followed by the tap state. The tap callbacks use
 * container_of() on the @tap member to get back to this structure.
 *
 * NOTE(review): @vlan presumably has to stay the first member so that code
 * treating netdev_priv() as a struct ipvl_dev keeps working - confirm
 * against the ipvlan core before reordering.
 */
struct ipvtap_dev {
	struct ipvl_dev vlan;	/* ipvlan side of the device */
	struct tap_dev tap;	/* tap (character device) side */
};
  43. static void ipvtap_count_tx_dropped(struct tap_dev *tap)
  44. {
  45. struct ipvtap_dev *vlantap = container_of(tap, struct ipvtap_dev, tap);
  46. struct ipvl_dev *vlan = &vlantap->vlan;
  47. this_cpu_inc(vlan->pcpu_stats->tx_drps);
  48. }
  49. static void ipvtap_count_rx_dropped(struct tap_dev *tap)
  50. {
  51. struct ipvtap_dev *vlantap = container_of(tap, struct ipvtap_dev, tap);
  52. struct ipvl_dev *vlan = &vlantap->vlan;
  53. ipvlan_count_rx(vlan, 0, 0, 0);
  54. }
  55. static void ipvtap_update_features(struct tap_dev *tap,
  56. netdev_features_t features)
  57. {
  58. struct ipvtap_dev *vlantap = container_of(tap, struct ipvtap_dev, tap);
  59. struct ipvl_dev *vlan = &vlantap->vlan;
  60. vlan->sfeatures = features;
  61. netdev_update_features(vlan->dev);
  62. }
  63. static int ipvtap_newlink(struct net *src_net, struct net_device *dev,
  64. struct nlattr *tb[], struct nlattr *data[],
  65. struct netlink_ext_ack *extack)
  66. {
  67. struct ipvtap_dev *vlantap = netdev_priv(dev);
  68. int err;
  69. INIT_LIST_HEAD(&vlantap->tap.queue_list);
  70. /* Since macvlan supports all offloads by default, make
  71. * tap support all offloads also.
  72. */
  73. vlantap->tap.tap_features = TUN_OFFLOADS;
  74. vlantap->tap.count_tx_dropped = ipvtap_count_tx_dropped;
  75. vlantap->tap.update_features = ipvtap_update_features;
  76. vlantap->tap.count_rx_dropped = ipvtap_count_rx_dropped;
  77. err = netdev_rx_handler_register(dev, tap_handle_frame, &vlantap->tap);
  78. if (err)
  79. return err;
  80. /* Don't put anything that may fail after macvlan_common_newlink
  81. * because we can't undo what it does.
  82. */
  83. err = ipvlan_link_new(src_net, dev, tb, data, extack);
  84. if (err) {
  85. netdev_rx_handler_unregister(dev);
  86. return err;
  87. }
  88. vlantap->tap.dev = vlantap->vlan.dev;
  89. return err;
  90. }
  91. static void ipvtap_dellink(struct net_device *dev,
  92. struct list_head *head)
  93. {
  94. struct ipvtap_dev *vlan = netdev_priv(dev);
  95. netdev_rx_handler_unregister(dev);
  96. tap_del_queues(&vlan->tap);
  97. ipvlan_link_delete(dev, head);
  98. }
  99. static void ipvtap_setup(struct net_device *dev)
  100. {
  101. ipvlan_link_setup(dev);
  102. dev->tx_queue_len = TUN_READQ_SIZE;
  103. dev->priv_flags &= ~IFF_NO_QUEUE;
  104. }
  105. static struct rtnl_link_ops ipvtap_link_ops __read_mostly = {
  106. .kind = "ipvtap",
  107. .setup = ipvtap_setup,
  108. .newlink = ipvtap_newlink,
  109. .dellink = ipvtap_dellink,
  110. .priv_size = sizeof(struct ipvtap_dev),
  111. };
  112. static int ipvtap_device_event(struct notifier_block *unused,
  113. unsigned long event, void *ptr)
  114. {
  115. struct net_device *dev = netdev_notifier_info_to_dev(ptr);
  116. struct ipvtap_dev *vlantap;
  117. struct device *classdev;
  118. dev_t devt;
  119. int err;
  120. char tap_name[IFNAMSIZ];
  121. if (dev->rtnl_link_ops != &ipvtap_link_ops)
  122. return NOTIFY_DONE;
  123. snprintf(tap_name, IFNAMSIZ, "tap%d", dev->ifindex);
  124. vlantap = netdev_priv(dev);
  125. switch (event) {
  126. case NETDEV_REGISTER:
  127. /* Create the device node here after the network device has
  128. * been registered but before register_netdevice has
  129. * finished running.
  130. */
  131. err = tap_get_minor(ipvtap_major, &vlantap->tap);
  132. if (err)
  133. return notifier_from_errno(err);
  134. devt = MKDEV(MAJOR(ipvtap_major), vlantap->tap.minor);
  135. classdev = device_create(&ipvtap_class, &dev->dev, devt,
  136. dev, tap_name);
  137. if (IS_ERR(classdev)) {
  138. tap_free_minor(ipvtap_major, &vlantap->tap);
  139. return notifier_from_errno(PTR_ERR(classdev));
  140. }
  141. err = sysfs_create_link(&dev->dev.kobj, &classdev->kobj,
  142. tap_name);
  143. if (err)
  144. return notifier_from_errno(err);
  145. break;
  146. case NETDEV_UNREGISTER:
  147. /* vlan->minor == 0 if NETDEV_REGISTER above failed */
  148. if (vlantap->tap.minor == 0)
  149. break;
  150. sysfs_remove_link(&dev->dev.kobj, tap_name);
  151. devt = MKDEV(MAJOR(ipvtap_major), vlantap->tap.minor);
  152. device_destroy(&ipvtap_class, devt);
  153. tap_free_minor(ipvtap_major, &vlantap->tap);
  154. break;
  155. case NETDEV_CHANGE_TX_QUEUE_LEN:
  156. if (tap_queue_resize(&vlantap->tap))
  157. return NOTIFY_BAD;
  158. break;
  159. }
  160. return NOTIFY_DONE;
  161. }
/* Notifier registered in ipvtap_init() so that ipvtap_device_event() is
 * called for netdevice events.
 */
static struct notifier_block ipvtap_notifier_block __read_mostly = {
	.notifier_call = ipvtap_device_event,
};
  165. static int ipvtap_init(void)
  166. {
  167. int err;
  168. err = tap_create_cdev(&ipvtap_cdev, &ipvtap_major, "ipvtap",
  169. THIS_MODULE);
  170. if (err)
  171. goto out1;
  172. err = class_register(&ipvtap_class);
  173. if (err)
  174. goto out2;
  175. err = register_netdevice_notifier(&ipvtap_notifier_block);
  176. if (err)
  177. goto out3;
  178. err = ipvlan_link_register(&ipvtap_link_ops);
  179. if (err)
  180. goto out4;
  181. return 0;
  182. out4:
  183. unregister_netdevice_notifier(&ipvtap_notifier_block);
  184. out3:
  185. class_unregister(&ipvtap_class);
  186. out2:
  187. tap_destroy_cdev(ipvtap_major, &ipvtap_cdev);
  188. out1:
  189. return err;
  190. }
  191. module_init(ipvtap_init);
  192. static void ipvtap_exit(void)
  193. {
  194. rtnl_link_unregister(&ipvtap_link_ops);
  195. unregister_netdevice_notifier(&ipvtap_notifier_block);
  196. class_unregister(&ipvtap_class);
  197. tap_destroy_cdev(ipvtap_major, &ipvtap_cdev);
  198. }
  199. module_exit(ipvtap_exit);
  200. MODULE_ALIAS_RTNL_LINK("ipvtap");
  201. MODULE_AUTHOR("Sainath Grandhi <sainath.grandhi@intel.com>");
  202. MODULE_LICENSE("GPL");