1 // SPDX-License-Identifier: GPL-2.0-only 2 /* Copyright (c) 2016 Facebook 3 */ 4 #include <linux/bpf.h> 5 #include <linux/if_link.h> 6 #include <assert.h> 7 #include <errno.h> 8 #include <signal.h> 9 #include <stdio.h> 10 #include <stdlib.h> 11 #include <string.h> 12 #include <net/if.h> 13 #include <sys/resource.h> 14 #include <arpa/inet.h> 15 #include <netinet/ether.h> 16 #include <unistd.h> 17 #include <time.h> 18 #include <bpf/libbpf.h> 19 #include <bpf/bpf.h> 20 #include "bpf_util.h" 21 #include "xdp_tx_iptunnel_common.h" 22 23 #define STATS_INTERVAL_S 2U 24 25 static int ifindex = -1; 26 static __u32 xdp_flags = XDP_FLAGS_UPDATE_IF_NOEXIST; 27 static int rxcnt_map_fd; 28 static __u32 prog_id; 29 30 static void int_exit(int sig) 31 { 32 __u32 curr_prog_id = 0; 33 34 if (ifindex > -1) { 35 if (bpf_xdp_query_id(ifindex, xdp_flags, &curr_prog_id)) { 36 printf("bpf_xdp_query_id failed\n"); 37 exit(1); 38 } 39 if (prog_id == curr_prog_id) 40 bpf_xdp_detach(ifindex, xdp_flags, NULL); 41 else if (!curr_prog_id) 42 printf("couldn't find a prog id on a given iface\n"); 43 else 44 printf("program on interface changed, not removing\n"); 45 } 46 exit(0); 47 } 48 49 /* simple per-protocol drop counter 50 */ 51 static void poll_stats(unsigned int kill_after_s) 52 { 53 const unsigned int nr_protos = 256; 54 unsigned int nr_cpus = bpf_num_possible_cpus(); 55 time_t started_at = time(NULL); 56 __u64 values[nr_cpus], prev[nr_protos][nr_cpus]; 57 __u32 proto; 58 int i; 59 60 memset(prev, 0, sizeof(prev)); 61 62 while (!kill_after_s || time(NULL) - started_at <= kill_after_s) { 63 sleep(STATS_INTERVAL_S); 64 65 for (proto = 0; proto < nr_protos; proto++) { 66 __u64 sum = 0; 67 68 assert(bpf_map_lookup_elem(rxcnt_map_fd, &proto, 69 values) == 0); 70 for (i = 0; i < nr_cpus; i++) 71 sum += (values[i] - prev[proto][i]); 72 73 if (sum) 74 printf("proto %u: sum:%10llu pkts, rate:%10llu pkts/s\n", 75 proto, sum, sum / STATS_INTERVAL_S); 76 memcpy(prev[proto], values, sizeof(values)); 77 } 78 } 79 } 80 81 static void usage(const char *cmd) 82 { 83 printf("Start a XDP prog which encapsulates incoming packets\n" 84 "in an IPv4/v6 header and XDP_TX it out. The dst <VIP:PORT>\n" 85 "is used to select packets to encapsulate\n\n"); 86 printf("Usage: %s [...]\n", cmd); 87 printf(" -i <ifname|ifindex> Interface\n"); 88 printf(" -a <vip-service-address> IPv4 or IPv6\n"); 89 printf(" -p <vip-service-port> A port range (e.g. 433-444) is also allowed\n"); 90 printf(" -s <source-ip> Used in the IPTunnel header\n"); 91 printf(" -d <dest-ip> Used in the IPTunnel header\n"); 92 printf(" -m <dest-MAC> Used in sending the IP Tunneled pkt\n"); 93 printf(" -T <stop-after-X-seconds> Default: 0 (forever)\n"); 94 printf(" -P <IP-Protocol> Default is TCP\n"); 95 printf(" -S use skb-mode\n"); 96 printf(" -N enforce native mode\n"); 97 printf(" -F Force loading the XDP prog\n"); 98 printf(" -h Display this help\n"); 99 } 100 101 static int parse_ipstr(const char *ipstr, unsigned int *addr) 102 { 103 if (inet_pton(AF_INET6, ipstr, addr) == 1) { 104 return AF_INET6; 105 } else if (inet_pton(AF_INET, ipstr, addr) == 1) { 106 addr[1] = addr[2] = addr[3] = 0; 107 return AF_INET; 108 } 109 110 fprintf(stderr, "%s is an invalid IP\n", ipstr); 111 return AF_UNSPEC; 112 } 113 114 static int parse_ports(const char *port_str, int *min_port, int *max_port) 115 { 116 char *end; 117 long tmp_min_port; 118 long tmp_max_port; 119 120 tmp_min_port = strtol(optarg, &end, 10); 121 if (tmp_min_port < 1 || tmp_min_port > 65535) { 122 fprintf(stderr, "Invalid port(s):%s\n", optarg); 123 return 1; 124 } 125 126 if (*end == '-') { 127 end++; 128 tmp_max_port = strtol(end, NULL, 10); 129 if (tmp_max_port < 1 || tmp_max_port > 65535) { 130 fprintf(stderr, "Invalid port(s):%s\n", optarg); 131 return 1; 132 } 133 } else { 134 tmp_max_port = tmp_min_port; 135 } 136 137 if (tmp_min_port > tmp_max_port) { 138 fprintf(stderr, "Invalid port(s):%s\n", optarg); 139 return 1; 140 } 141 142 if (tmp_max_port - tmp_min_port + 1 > MAX_IPTNL_ENTRIES) { 143 fprintf(stderr, "Port range (%s) is larger than %u\n", 144 port_str, MAX_IPTNL_ENTRIES); 145 return 1; 146 } 147 *min_port = tmp_min_port; 148 *max_port = tmp_max_port; 149 150 return 0; 151 } 152 153 int main(int argc, char **argv) 154 { 155 int min_port = 0, max_port = 0, vip2tnl_map_fd; 156 const char *optstr = "i:a:p:s:d:m:T:P:FSNh"; 157 unsigned char opt_flags[256] = {}; 158 struct bpf_prog_info info = {}; 159 __u32 info_len = sizeof(info); 160 unsigned int kill_after_s = 0; 161 struct iptnl_info tnl = {}; 162 struct bpf_program *prog; 163 struct bpf_object *obj; 164 struct vip vip = {}; 165 char filename[256]; 166 int opt, prog_fd; 167 int i, err; 168 169 tnl.family = AF_UNSPEC; 170 vip.protocol = IPPROTO_TCP; 171 172 for (i = 0; i < strlen(optstr); i++) 173 if (optstr[i] != 'h' && 'a' <= optstr[i] && optstr[i] <= 'z') 174 opt_flags[(unsigned char)optstr[i]] = 1; 175 176 while ((opt = getopt(argc, argv, optstr)) != -1) { 177 unsigned short family; 178 unsigned int *v6; 179 180 switch (opt) { 181 case 'i': 182 ifindex = if_nametoindex(optarg); 183 if (!ifindex) 184 ifindex = atoi(optarg); 185 break; 186 case 'a': 187 vip.family = parse_ipstr(optarg, vip.daddr.v6); 188 if (vip.family == AF_UNSPEC) 189 return 1; 190 break; 191 case 'p': 192 if (parse_ports(optarg, &min_port, &max_port)) 193 return 1; 194 break; 195 case 'P': 196 vip.protocol = atoi(optarg); 197 break; 198 case 's': 199 case 'd': 200 if (opt == 's') 201 v6 = tnl.saddr.v6; 202 else 203 v6 = tnl.daddr.v6; 204 205 family = parse_ipstr(optarg, v6); 206 if (family == AF_UNSPEC) 207 return 1; 208 if (tnl.family == AF_UNSPEC) { 209 tnl.family = family; 210 } else if (tnl.family != family) { 211 fprintf(stderr, 212 "The IP version of the src and dst addresses used in the IP encapsulation does not match\n"); 213 return 1; 214 } 215 break; 216 case 'm': 217 if (!ether_aton_r(optarg, 218 (struct ether_addr *)tnl.dmac)) { 219 fprintf(stderr, "Invalid mac address:%s\n", 220 optarg); 221 return 1; 222 } 223 break; 224 case 'T': 225 kill_after_s = atoi(optarg); 226 break; 227 case 'S': 228 xdp_flags |= XDP_FLAGS_SKB_MODE; 229 break; 230 case 'N': 231 /* default, set below */ 232 break; 233 case 'F': 234 xdp_flags &= ~XDP_FLAGS_UPDATE_IF_NOEXIST; 235 break; 236 default: 237 usage(argv[0]); 238 return 1; 239 } 240 opt_flags[opt] = 0; 241 } 242 243 if (!(xdp_flags & XDP_FLAGS_SKB_MODE)) 244 xdp_flags |= XDP_FLAGS_DRV_MODE; 245 246 for (i = 0; i < strlen(optstr); i++) { 247 if (opt_flags[(unsigned int)optstr[i]]) { 248 fprintf(stderr, "Missing argument -%c\n", optstr[i]); 249 usage(argv[0]); 250 return 1; 251 } 252 } 253 254 if (!ifindex) { 255 fprintf(stderr, "Invalid ifname\n"); 256 return 1; 257 } 258 259 snprintf(filename, sizeof(filename), "%s_kern.o", argv[0]); 260 261 obj = bpf_object__open_file(filename, NULL); 262 if (libbpf_get_error(obj)) 263 return 1; 264 265 prog = bpf_object__next_program(obj, NULL); 266 bpf_program__set_type(prog, BPF_PROG_TYPE_XDP); 267 268 err = bpf_object__load(obj); 269 if (err) { 270 printf("bpf_object__load(): %s\n", strerror(errno)); 271 return 1; 272 } 273 prog_fd = bpf_program__fd(prog); 274 275 rxcnt_map_fd = bpf_object__find_map_fd_by_name(obj, "rxcnt"); 276 vip2tnl_map_fd = bpf_object__find_map_fd_by_name(obj, "vip2tnl"); 277 if (vip2tnl_map_fd < 0 || rxcnt_map_fd < 0) { 278 printf("bpf_object__find_map_fd_by_name failed\n"); 279 return 1; 280 } 281 282 signal(SIGINT, int_exit); 283 signal(SIGTERM, int_exit); 284 285 while (min_port <= max_port) { 286 vip.dport = htons(min_port++); 287 if (bpf_map_update_elem(vip2tnl_map_fd, &vip, &tnl, 288 BPF_NOEXIST)) { 289 perror("bpf_map_update_elem(&vip2tnl)"); 290 return 1; 291 } 292 } 293 294 if (bpf_xdp_attach(ifindex, prog_fd, xdp_flags, NULL) < 0) { 295 printf("link set xdp fd failed\n"); 296 return 1; 297 } 298 299 err = bpf_obj_get_info_by_fd(prog_fd, &info, &info_len); 300 if (err) { 301 printf("can't get prog info - %s\n", strerror(errno)); 302 return err; 303 } 304 prog_id = info.id; 305 306 poll_stats(kill_after_s); 307 308 bpf_xdp_detach(ifindex, xdp_flags, NULL); 309 310 return 0; 311 } 312