123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291 |
- /* Copyright (c) 2015 PLUMgrid, http://plumgrid.com
- *
- * This program is free software; you can redistribute it and/or
- * modify it under the terms of version 2 of the GNU General Public
- * License as published by the Free Software Foundation.
- */
- #include <uapi/linux/bpf.h>
- #include "bpf_helpers.h"
- #include <uapi/linux/in.h>
- #include <uapi/linux/if.h>
- #include <uapi/linux/if_ether.h>
- #include <uapi/linux/ip.h>
- #include <uapi/linux/ipv6.h>
- #include <uapi/linux/if_tunnel.h>
- #include <uapi/linux/mpls.h>
/* Bits of the IPv4 frag_off field that ip_is_fragment() tests. */
#define IP_MF		0x2000
#define IP_OFFSET	0x1FFF

/*
 * Open the definition of one parser stage: the function is named
 * bpf_func_<F> and placed in an ELF section whose name is "socket/"
 * followed by the stringified F.
 */
#define PROG(F) SEC("socket/"__stringify(F)) int bpf_func_##F
- struct bpf_map_def SEC("maps") jmp_table = {
- .type = BPF_MAP_TYPE_PROG_ARRAY,
- .key_size = sizeof(u32),
- .value_size = sizeof(u32),
- .max_entries = 8,
- };
/*
 * jmp_table slot numbers, one per parser stage.
 * Keep these as plain #defines: PROG() feeds the name to __stringify(),
 * which presumably expands it to the number for the section name
 * (e.g. "socket/3") -- an enum constant would not expand that way.
 */
#define PARSE_VLAN	1
#define PARSE_MPLS	2
#define PARSE_IP	3
#define PARSE_IPV6	4
- /* protocol dispatch routine.
- * It tail-calls next BPF program depending on eth proto
- * Note, we could have used:
- * bpf_tail_call(skb, &jmp_table, proto);
- * but it would need large prog_array
- */
- static inline void parse_eth_proto(struct __sk_buff *skb, u32 proto)
- {
- switch (proto) {
- case ETH_P_8021Q:
- case ETH_P_8021AD:
- bpf_tail_call(skb, &jmp_table, PARSE_VLAN);
- break;
- case ETH_P_MPLS_UC:
- case ETH_P_MPLS_MC:
- bpf_tail_call(skb, &jmp_table, PARSE_MPLS);
- break;
- case ETH_P_IP:
- bpf_tail_call(skb, &jmp_table, PARSE_IP);
- break;
- case ETH_P_IPV6:
- bpf_tail_call(skb, &jmp_table, PARSE_IPV6);
- break;
- }
- }
- struct vlan_hdr {
- __be16 h_vlan_TCI;
- __be16 h_vlan_encapsulated_proto;
- };
- struct flow_key_record {
- __be32 src;
- __be32 dst;
- union {
- __be32 ports;
- __be16 port16[2];
- };
- __u32 ip_proto;
- };
- static inline int ip_is_fragment(struct __sk_buff *ctx, __u64 nhoff)
- {
- return load_half(ctx, nhoff + offsetof(struct iphdr, frag_off))
- & (IP_MF | IP_OFFSET);
- }
- static inline __u32 ipv6_addr_hash(struct __sk_buff *ctx, __u64 off)
- {
- __u64 w0 = load_word(ctx, off);
- __u64 w1 = load_word(ctx, off + 4);
- __u64 w2 = load_word(ctx, off + 8);
- __u64 w3 = load_word(ctx, off + 12);
- return (__u32)(w0 ^ w1 ^ w2 ^ w3);
- }
- struct globals {
- struct flow_key_record flow;
- };
- struct bpf_map_def SEC("maps") percpu_map = {
- .type = BPF_MAP_TYPE_ARRAY,
- .key_size = sizeof(__u32),
- .value_size = sizeof(struct globals),
- .max_entries = 32,
- };
- /* user poor man's per_cpu until native support is ready */
- static struct globals *this_cpu_globals(void)
- {
- u32 key = bpf_get_smp_processor_id();
- return bpf_map_lookup_elem(&percpu_map, &key);
- }
- /* some simple stats for user space consumption */
- struct pair {
- __u64 packets;
- __u64 bytes;
- };
- struct bpf_map_def SEC("maps") hash_map = {
- .type = BPF_MAP_TYPE_HASH,
- .key_size = sizeof(struct flow_key_record),
- .value_size = sizeof(struct pair),
- .max_entries = 1024,
- };
- static void update_stats(struct __sk_buff *skb, struct globals *g)
- {
- struct flow_key_record key = g->flow;
- struct pair *value;
- value = bpf_map_lookup_elem(&hash_map, &key);
- if (value) {
- __sync_fetch_and_add(&value->packets, 1);
- __sync_fetch_and_add(&value->bytes, skb->len);
- } else {
- struct pair val = {1, skb->len};
- bpf_map_update_elem(&hash_map, &key, &val, BPF_ANY);
- }
- }
- static __always_inline void parse_ip_proto(struct __sk_buff *skb,
- struct globals *g, __u32 ip_proto)
- {
- __u32 nhoff = skb->cb[0];
- int poff;
- switch (ip_proto) {
- case IPPROTO_GRE: {
- struct gre_hdr {
- __be16 flags;
- __be16 proto;
- };
- __u32 gre_flags = load_half(skb,
- nhoff + offsetof(struct gre_hdr, flags));
- __u32 gre_proto = load_half(skb,
- nhoff + offsetof(struct gre_hdr, proto));
- if (gre_flags & (GRE_VERSION|GRE_ROUTING))
- break;
- nhoff += 4;
- if (gre_flags & GRE_CSUM)
- nhoff += 4;
- if (gre_flags & GRE_KEY)
- nhoff += 4;
- if (gre_flags & GRE_SEQ)
- nhoff += 4;
- skb->cb[0] = nhoff;
- parse_eth_proto(skb, gre_proto);
- break;
- }
- case IPPROTO_IPIP:
- parse_eth_proto(skb, ETH_P_IP);
- break;
- case IPPROTO_IPV6:
- parse_eth_proto(skb, ETH_P_IPV6);
- break;
- case IPPROTO_TCP:
- case IPPROTO_UDP:
- g->flow.ports = load_word(skb, nhoff);
- case IPPROTO_ICMP:
- g->flow.ip_proto = ip_proto;
- update_stats(skb, g);
- break;
- default:
- break;
- }
- }
- PROG(PARSE_IP)(struct __sk_buff *skb)
- {
- struct globals *g = this_cpu_globals();
- __u32 nhoff, verlen, ip_proto;
- if (!g)
- return 0;
- nhoff = skb->cb[0];
- if (unlikely(ip_is_fragment(skb, nhoff)))
- return 0;
- ip_proto = load_byte(skb, nhoff + offsetof(struct iphdr, protocol));
- if (ip_proto != IPPROTO_GRE) {
- g->flow.src = load_word(skb, nhoff + offsetof(struct iphdr, saddr));
- g->flow.dst = load_word(skb, nhoff + offsetof(struct iphdr, daddr));
- }
- verlen = load_byte(skb, nhoff + 0/*offsetof(struct iphdr, ihl)*/);
- nhoff += (verlen & 0xF) << 2;
- skb->cb[0] = nhoff;
- parse_ip_proto(skb, g, ip_proto);
- return 0;
- }
- PROG(PARSE_IPV6)(struct __sk_buff *skb)
- {
- struct globals *g = this_cpu_globals();
- __u32 nhoff, ip_proto;
- if (!g)
- return 0;
- nhoff = skb->cb[0];
- ip_proto = load_byte(skb,
- nhoff + offsetof(struct ipv6hdr, nexthdr));
- g->flow.src = ipv6_addr_hash(skb,
- nhoff + offsetof(struct ipv6hdr, saddr));
- g->flow.dst = ipv6_addr_hash(skb,
- nhoff + offsetof(struct ipv6hdr, daddr));
- nhoff += sizeof(struct ipv6hdr);
- skb->cb[0] = nhoff;
- parse_ip_proto(skb, g, ip_proto);
- return 0;
- }
- PROG(PARSE_VLAN)(struct __sk_buff *skb)
- {
- __u32 nhoff, proto;
- nhoff = skb->cb[0];
- proto = load_half(skb, nhoff + offsetof(struct vlan_hdr,
- h_vlan_encapsulated_proto));
- nhoff += sizeof(struct vlan_hdr);
- skb->cb[0] = nhoff;
- parse_eth_proto(skb, proto);
- return 0;
- }
- PROG(PARSE_MPLS)(struct __sk_buff *skb)
- {
- __u32 nhoff, label;
- nhoff = skb->cb[0];
- label = load_word(skb, nhoff);
- nhoff += sizeof(struct mpls_label);
- skb->cb[0] = nhoff;
- if (label & MPLS_LS_S_MASK) {
- __u8 verlen = load_byte(skb, nhoff);
- if ((verlen & 0xF0) == 4)
- parse_eth_proto(skb, ETH_P_IP);
- else
- parse_eth_proto(skb, ETH_P_IPV6);
- } else {
- parse_eth_proto(skb, ETH_P_MPLS_UC);
- }
- return 0;
- }
- SEC("socket/0")
- int main_prog(struct __sk_buff *skb)
- {
- __u32 nhoff = ETH_HLEN;
- __u32 proto = load_half(skb, 12);
- skb->cb[0] = nhoff;
- parse_eth_proto(skb, proto);
- return 0;
- }
- char _license[] SEC("license") = "GPL";
|