/* sockex2_kern.c */
  1. #include <uapi/linux/bpf.h>
  2. #include "bpf_helpers.h"
  3. #include <uapi/linux/in.h>
  4. #include <uapi/linux/if.h>
  5. #include <uapi/linux/if_ether.h>
  6. #include <uapi/linux/ip.h>
  7. #include <uapi/linux/ipv6.h>
  8. #include <uapi/linux/if_tunnel.h>
  /* Bits of the IPv4 frag_off field that ip_is_fragment() tests. */
  #define IP_MF 0x2000      /* "more fragments" flag */
  #define IP_OFFSET 0x1FFF  /* mask for the fragment offset */
  /*
   * VLAN tag header.  flow_dissector() reads h_vlan_encapsulated_proto to
   * learn which protocol the tag carries, then skips sizeof(struct vlan_hdr)
   * bytes.
   */
  struct vlan_hdr {
      __be16 h_vlan_TCI;                /* tag control information */
      __be16 h_vlan_encapsulated_proto; /* protocol carried inside the tag */
  };
  /*
   * Flow description filled in by flow_dissector().
   *
   * For IPv4 packets src/dst are the words loaded from the header's address
   * fields; for IPv6 they are the 32-bit folds produced by ipv6_addr_hash().
   */
  struct flow_key_record {
      __be32 src;           /* source address (or IPv6 address fold) */
      __be32 dst;           /* destination address (or IPv6 address fold) */
      union {
          __be32 ports;     /* 32-bit word loaded at the ports offset */
          __be16 port16[2]; /* the same word viewed as two 16-bit halves */
      };
      __u16 thoff;          /* offset stored by flow_dissector() on success */
      __u8 ip_proto;        /* innermost IP protocol number that was parsed */
  };
  /*
   * Return the byte offset, measured from the start of the transport header,
   * of the 32-bit word that flow_dissector() stores in flow->ports.
   *
   * @proto: IP protocol number.
   *
   * Returns 0 for TCP, UDP, DCCP, ESP, SCTP and UDP-Lite, 4 for AH, and a
   * negative value for every other protocol.  The negative return lets the
   * caller's "poff >= 0" check skip the load for protocols that have no
   * such word; previously the default case returned 0, so that check could
   * never fail and a 4-byte load was attempted for every protocol.
   */
  static inline int proto_ports_offset(__u64 proto)
  {
      switch (proto) {
      case IPPROTO_TCP:
      case IPPROTO_UDP:
      case IPPROTO_DCCP:
      case IPPROTO_ESP:
      case IPPROTO_SCTP:
      case IPPROTO_UDPLITE:
          return 0;
      case IPPROTO_AH:
          /* AH: the word of interest starts 4 bytes into the header. */
          return 4;
      default:
          /* No ports/SPI word for this protocol. */
          return -1;
      }
  }
  41. static inline int ip_is_fragment(struct __sk_buff *ctx, __u64 nhoff)
  42. {
  43. return load_half(ctx, nhoff + offsetof(struct iphdr, frag_off))
  44. & (IP_MF | IP_OFFSET);
  45. }
  46. static inline __u32 ipv6_addr_hash(struct __sk_buff *ctx, __u64 off)
  47. {
  48. __u64 w0 = load_word(ctx, off);
  49. __u64 w1 = load_word(ctx, off + 4);
  50. __u64 w2 = load_word(ctx, off + 8);
  51. __u64 w3 = load_word(ctx, off + 12);
  52. return (__u32)(w0 ^ w1 ^ w2 ^ w3);
  53. }
  54. static inline __u64 parse_ip(struct __sk_buff *skb, __u64 nhoff, __u64 *ip_proto,
  55. struct flow_key_record *flow)
  56. {
  57. __u64 verlen;
  58. if (unlikely(ip_is_fragment(skb, nhoff)))
  59. *ip_proto = 0;
  60. else
  61. *ip_proto = load_byte(skb, nhoff + offsetof(struct iphdr, protocol));
  62. if (*ip_proto != IPPROTO_GRE) {
  63. flow->src = load_word(skb, nhoff + offsetof(struct iphdr, saddr));
  64. flow->dst = load_word(skb, nhoff + offsetof(struct iphdr, daddr));
  65. }
  66. verlen = load_byte(skb, nhoff + 0/*offsetof(struct iphdr, ihl)*/);
  67. if (likely(verlen == 0x45))
  68. nhoff += 20;
  69. else
  70. nhoff += (verlen & 0xF) << 2;
  71. return nhoff;
  72. }
  73. static inline __u64 parse_ipv6(struct __sk_buff *skb, __u64 nhoff, __u64 *ip_proto,
  74. struct flow_key_record *flow)
  75. {
  76. *ip_proto = load_byte(skb,
  77. nhoff + offsetof(struct ipv6hdr, nexthdr));
  78. flow->src = ipv6_addr_hash(skb,
  79. nhoff + offsetof(struct ipv6hdr, saddr));
  80. flow->dst = ipv6_addr_hash(skb,
  81. nhoff + offsetof(struct ipv6hdr, daddr));
  82. nhoff += sizeof(struct ipv6hdr);
  83. return nhoff;
  84. }
  85. static inline bool flow_dissector(struct __sk_buff *skb,
  86. struct flow_key_record *flow)
  87. {
  88. __u64 nhoff = ETH_HLEN;
  89. __u64 ip_proto;
  90. __u64 proto = load_half(skb, 12);
  91. int poff;
  92. if (proto == ETH_P_8021AD) {
  93. proto = load_half(skb, nhoff + offsetof(struct vlan_hdr,
  94. h_vlan_encapsulated_proto));
  95. nhoff += sizeof(struct vlan_hdr);
  96. }
  97. if (proto == ETH_P_8021Q) {
  98. proto = load_half(skb, nhoff + offsetof(struct vlan_hdr,
  99. h_vlan_encapsulated_proto));
  100. nhoff += sizeof(struct vlan_hdr);
  101. }
  102. if (likely(proto == ETH_P_IP))
  103. nhoff = parse_ip(skb, nhoff, &ip_proto, flow);
  104. else if (proto == ETH_P_IPV6)
  105. nhoff = parse_ipv6(skb, nhoff, &ip_proto, flow);
  106. else
  107. return false;
  108. switch (ip_proto) {
  109. case IPPROTO_GRE: {
  110. struct gre_hdr {
  111. __be16 flags;
  112. __be16 proto;
  113. };
  114. __u64 gre_flags = load_half(skb,
  115. nhoff + offsetof(struct gre_hdr, flags));
  116. __u64 gre_proto = load_half(skb,
  117. nhoff + offsetof(struct gre_hdr, proto));
  118. if (gre_flags & (GRE_VERSION|GRE_ROUTING))
  119. break;
  120. proto = gre_proto;
  121. nhoff += 4;
  122. if (gre_flags & GRE_CSUM)
  123. nhoff += 4;
  124. if (gre_flags & GRE_KEY)
  125. nhoff += 4;
  126. if (gre_flags & GRE_SEQ)
  127. nhoff += 4;
  128. if (proto == ETH_P_8021Q) {
  129. proto = load_half(skb,
  130. nhoff + offsetof(struct vlan_hdr,
  131. h_vlan_encapsulated_proto));
  132. nhoff += sizeof(struct vlan_hdr);
  133. }
  134. if (proto == ETH_P_IP)
  135. nhoff = parse_ip(skb, nhoff, &ip_proto, flow);
  136. else if (proto == ETH_P_IPV6)
  137. nhoff = parse_ipv6(skb, nhoff, &ip_proto, flow);
  138. else
  139. return false;
  140. break;
  141. }
  142. case IPPROTO_IPIP:
  143. nhoff = parse_ip(skb, nhoff, &ip_proto, flow);
  144. break;
  145. case IPPROTO_IPV6:
  146. nhoff = parse_ipv6(skb, nhoff, &ip_proto, flow);
  147. break;
  148. default:
  149. break;
  150. }
  151. flow->ip_proto = ip_proto;
  152. poff = proto_ports_offset(ip_proto);
  153. if (poff >= 0) {
  154. nhoff += poff;
  155. flow->ports = load_word(skb, nhoff);
  156. }
  157. flow->thoff = (__u16) nhoff;
  158. return true;
  159. }
  /* Per-key counters stored as the value of hash_map. */
  struct pair {
      long packets; /* number of packets accounted to the key */
      long bytes;   /* sum of skb->len over those packets */
  };
  164. struct bpf_map_def SEC("maps") hash_map = {
  165. .type = BPF_MAP_TYPE_HASH,
  166. .key_size = sizeof(__be32),
  167. .value_size = sizeof(struct pair),
  168. .max_entries = 1024,
  169. };
  170. SEC("socket2")
  171. int bpf_prog2(struct __sk_buff *skb)
  172. {
  173. struct flow_key_record flow = {};
  174. struct pair *value;
  175. u32 key;
  176. if (!flow_dissector(skb, &flow))
  177. return 0;
  178. key = flow.dst;
  179. value = bpf_map_lookup_elem(&hash_map, &key);
  180. if (value) {
  181. __sync_fetch_and_add(&value->packets, 1);
  182. __sync_fetch_and_add(&value->bytes, skb->len);
  183. } else {
  184. struct pair val = {1, skb->len};
  185. bpf_map_update_elem(&hash_map, &key, &val, BPF_ANY);
  186. }
  187. return 0;
  188. }
  189. char _license[] SEC("license") = "GPL";