1 /* SPDX-License-Identifier: GPL-2.0
2 * Copyright (c) 2017 Jesper Dangaard Brouer, Red Hat Inc.
3 */
/* Help text printed by usage() under its "DOCUMENTATION:" heading. */
static const char *__doc__ = " XDP RX-queue info extract example\n\n"
	"Monitor how many packets per sec (pps) are received\n"
	"per NIC RX queue index and which CPU processed the packet\n"
	;
8
9 #include <errno.h>
10 #include <signal.h>
11 #include <stdio.h>
12 #include <stdlib.h>
13 #include <stdbool.h>
14 #include <string.h>
15 #include <unistd.h>
16 #include <locale.h>
17 #include <getopt.h>
18 #include <net/if.h>
19 #include <time.h>
20 #include <limits.h>
21 #include <arpa/inet.h>
22 #include <linux/if_link.h>
23
24 #include <bpf/bpf.h>
25 #include <bpf/libbpf.h>
26 #include "bpf_util.h"
27
/* Interface chosen with --dev; ifindex stays -1 until the option is parsed */
static int ifindex = -1;
static char ifname_buf[IF_NAMESIZE];
static char *ifname;	/* pointed at ifname_buf by the --dev handling in main() */
/* ID of the program attached by main(); int_exit() compares against it
 * before detaching so a program installed by someone else is left alone.
 */
static __u32 prog_id;

/* Flags handed to bpf_xdp_attach()/bpf_xdp_detach(); adjusted by -S and -F */
static __u32 xdp_flags = XDP_FLAGS_UPDATE_IF_NOEXIST;

/* Maps looked up by name in main() and read by the stats collection code */
static struct bpf_map *stats_global_map;
static struct bpf_map *rx_queue_index_map;
37
/* Exit return codes */
#define EXIT_OK			0
#define EXIT_FAIL		1
#define EXIT_FAIL_OPTION	2
#define EXIT_FAIL_XDP		3
#define EXIT_FAIL_BPF		4
#define EXIT_FAIL_MEM		5

/* Pseudo "signal" values passed to int_exit() by internal error paths;
 * int_exit() maps them to EXIT_FAIL_MEM and EXIT_FAIL respectively.
 */
#define FAIL_MEM_SIG		INT_MAX
#define FAIL_STAT_SIG		(INT_MAX - 1)
48
/* getopt_long() table; every entry has a NULL flag pointer, so
 * getopt_long() returns the short-option character in the last column,
 * which is what the switch in main() dispatches on.
 */
static const struct option long_options[] = {
	{"help",	no_argument,		NULL, 'h' },
	{"dev",		required_argument,	NULL, 'd' },
	{"skb-mode",	no_argument,		NULL, 'S' },
	{"sec",		required_argument,	NULL, 's' },
	{"no-separators", no_argument,		NULL, 'z' },
	{"action",	required_argument,	NULL, 'a' },
	{"readmem",	no_argument,		NULL, 'r' },
	{"swapmac",	no_argument,		NULL, 'm' },
	{"force",	no_argument,		NULL, 'F' },
	{0, 0, NULL,  0 }	/* terminator */
};
61
int_exit(int sig)62 static void int_exit(int sig)
63 {
64 __u32 curr_prog_id = 0;
65
66 if (ifindex > -1) {
67 if (bpf_xdp_query_id(ifindex, xdp_flags, &curr_prog_id)) {
68 printf("bpf_xdp_query_id failed\n");
69 exit(EXIT_FAIL);
70 }
71 if (prog_id == curr_prog_id) {
72 fprintf(stderr,
73 "Interrupted: Removing XDP program on ifindex:%d device:%s\n",
74 ifindex, ifname);
75 bpf_xdp_detach(ifindex, xdp_flags, NULL);
76 } else if (!curr_prog_id) {
77 printf("couldn't find a prog id on a given iface\n");
78 } else {
79 printf("program on interface changed, not removing\n");
80 }
81 }
82
83 if (sig == FAIL_MEM_SIG)
84 exit(EXIT_FAIL_MEM);
85 else if (sig == FAIL_STAT_SIG)
86 exit(EXIT_FAIL);
87
88 exit(EXIT_OK);
89 }
90
/* Configuration record that main() stores at key 0 of "config_map".
 * NOTE(review): presumably the layout must match the kernel-side program's
 * definition -- confirm against the _kern.c file before changing it.
 */
struct config {
	__u32 action;	/* XDP action code, default XDP_PASS or from --action */
	int ifindex;	/* interface index resolved from --dev */
	__u32 options;	/* bitmask of enum cfg_options_flags */
};
/* Bits stored in config.options */
enum cfg_options_flags {
	NO_TOUCH = 0x0U,	/* default set in main(): no option bits */
	READ_MEM = 0x1U,	/* set by --readmem */
	SWAP_MAC = 0x2U,	/* set by --swapmac, and forced by main() for XDP_TX */
};
/* Number of entries in the name table: action codes up to and including XDP_TX */
#define XDP_ACTION_MAX (XDP_TX + 1)
/* Length of the longest name in the table ("XDP_ABORTED"), without the NUL */
#define XDP_ACTION_MAX_STRLEN 11
/* Printable name of each supported XDP action, indexed by action code */
static const char *xdp_action_names[XDP_ACTION_MAX] = {
	[XDP_ABORTED]	= "XDP_ABORTED",
	[XDP_DROP]	= "XDP_DROP",
	[XDP_PASS]	= "XDP_PASS",
	[XDP_TX]	= "XDP_TX",
};
109
action2str(int action)110 static const char *action2str(int action)
111 {
112 if (action < XDP_ACTION_MAX)
113 return xdp_action_names[action];
114 return NULL;
115 }
116
parse_xdp_action(char * action_str)117 static int parse_xdp_action(char *action_str)
118 {
119 size_t maxlen;
120 __u64 action = -1;
121 int i;
122
123 for (i = 0; i < XDP_ACTION_MAX; i++) {
124 maxlen = XDP_ACTION_MAX_STRLEN;
125 if (strncmp(xdp_action_names[i], action_str, maxlen) == 0) {
126 action = i;
127 break;
128 }
129 }
130 return action;
131 }
132
list_xdp_actions(void)133 static void list_xdp_actions(void)
134 {
135 int i;
136
137 printf("Available XDP --action <options>\n");
138 for (i = 0; i < XDP_ACTION_MAX; i++)
139 printf("\t%s\n", xdp_action_names[i]);
140 printf("\n");
141 }
142
options2str(enum cfg_options_flags flag)143 static char* options2str(enum cfg_options_flags flag)
144 {
145 if (flag == NO_TOUCH)
146 return "no_touch";
147 if (flag & SWAP_MAC)
148 return "swapmac";
149 if (flag & READ_MEM)
150 return "read";
151 fprintf(stderr, "ERR: Unknown config option flags");
152 int_exit(FAIL_STAT_SIG);
153 return "unknown";
154 }
155
usage(char * argv[])156 static void usage(char *argv[])
157 {
158 int i;
159
160 printf("\nDOCUMENTATION:\n%s\n", __doc__);
161 printf(" Usage: %s (options-see-below)\n", argv[0]);
162 printf(" Listing options:\n");
163 for (i = 0; long_options[i].name != 0; i++) {
164 printf(" --%-12s", long_options[i].name);
165 if (long_options[i].flag != NULL)
166 printf(" flag (internal value:%d)",
167 *long_options[i].flag);
168 else
169 printf(" short-option: -%c",
170 long_options[i].val);
171 printf("\n");
172 }
173 printf("\n");
174 list_xdp_actions();
175 }
176
177 #define NANOSEC_PER_SEC 1000000000 /* 10^9 */
gettime(void)178 static __u64 gettime(void)
179 {
180 struct timespec t;
181 int res;
182
183 res = clock_gettime(CLOCK_MONOTONIC, &t);
184 if (res < 0) {
185 fprintf(stderr, "Error with gettimeofday! (%i)\n", res);
186 int_exit(FAIL_STAT_SIG);
187 }
188 return (__u64) t.tv_sec * NANOSEC_PER_SEC + t.tv_nsec;
189 }
190
/* Common stats data record shared with _kern.c */
struct datarec {
	__u64 processed;	/* counter used for the "pps" column */
	__u64 issue;		/* counter used for the "issue-pps" column */
};
/* One sample of a per-CPU map entry, filled in by map_collect_percpu() */
struct record {
	__u64 timestamp;	/* gettime() value taken right after the map read */
	struct datarec total;	/* sum of the per-CPU values */
	struct datarec *cpu;	/* array with one element per possible CPU */
};
/* Full snapshot: the global stats entry plus one record per RX queue slot */
struct stats_record {
	struct record stats;	/* from stats_global_map, key 0 */
	struct record *rxq;	/* array sized by rx_queue_index_map max_entries */
};
205
alloc_record_per_cpu(void)206 static struct datarec *alloc_record_per_cpu(void)
207 {
208 unsigned int nr_cpus = bpf_num_possible_cpus();
209 struct datarec *array;
210
211 array = calloc(nr_cpus, sizeof(struct datarec));
212 if (!array) {
213 fprintf(stderr, "Mem alloc error (nr_cpus:%u)\n", nr_cpus);
214 int_exit(FAIL_MEM_SIG);
215 }
216 return array;
217 }
218
alloc_record_per_rxq(void)219 static struct record *alloc_record_per_rxq(void)
220 {
221 unsigned int nr_rxqs = bpf_map__max_entries(rx_queue_index_map);
222 struct record *array;
223
224 array = calloc(nr_rxqs, sizeof(struct record));
225 if (!array) {
226 fprintf(stderr, "Mem alloc error (nr_rxqs:%u)\n", nr_rxqs);
227 int_exit(FAIL_MEM_SIG);
228 }
229 return array;
230 }
231
alloc_stats_record(void)232 static struct stats_record *alloc_stats_record(void)
233 {
234 unsigned int nr_rxqs = bpf_map__max_entries(rx_queue_index_map);
235 struct stats_record *rec;
236 int i;
237
238 rec = calloc(1, sizeof(struct stats_record));
239 if (!rec) {
240 fprintf(stderr, "Mem alloc error\n");
241 int_exit(FAIL_MEM_SIG);
242 }
243 rec->rxq = alloc_record_per_rxq();
244 for (i = 0; i < nr_rxqs; i++)
245 rec->rxq[i].cpu = alloc_record_per_cpu();
246
247 rec->stats.cpu = alloc_record_per_cpu();
248 return rec;
249 }
250
free_stats_record(struct stats_record * r)251 static void free_stats_record(struct stats_record *r)
252 {
253 unsigned int nr_rxqs = bpf_map__max_entries(rx_queue_index_map);
254 int i;
255
256 for (i = 0; i < nr_rxqs; i++)
257 free(r->rxq[i].cpu);
258
259 free(r->rxq);
260 free(r->stats.cpu);
261 free(r);
262 }
263
/*
 * Read one entry of a per-CPU map into @rec.
 *
 * @fd:  file descriptor of the map
 * @key: key of the entry to read
 * @rec: destination; rec->cpu must hold one element per possible CPU
 *
 * Stores every CPU's value in rec->cpu[], their sums in rec->total and
 * the time of the read in rec->timestamp.  Returns false, leaving @rec
 * untouched, when the lookup fails.
 */
static bool map_collect_percpu(int fd, __u32 key, struct record *rec)
{
	/* For percpu maps, userspace gets a value per possible CPU */
	unsigned int cpu_count = bpf_num_possible_cpus();
	struct datarec percpu[cpu_count];
	struct datarec sum = { 0 };
	unsigned int cpu;

	if (bpf_map_lookup_elem(fd, &key, percpu) != 0) {
		fprintf(stderr,
			"ERR: bpf_map_lookup_elem failed key:0x%X\n", key);
		return false;
	}

	/* Get time as close as possible to reading map contents */
	rec->timestamp = gettime();

	/* Copy each CPU's counters and accumulate the totals */
	for (cpu = 0; cpu < cpu_count; cpu++) {
		rec->cpu[cpu] = percpu[cpu];
		sum.processed += percpu[cpu].processed;
		sum.issue += percpu[cpu].issue;
	}
	rec->total = sum;
	return true;
}
292
stats_collect(struct stats_record * rec)293 static void stats_collect(struct stats_record *rec)
294 {
295 int fd, i, max_rxqs;
296
297 fd = bpf_map__fd(stats_global_map);
298 map_collect_percpu(fd, 0, &rec->stats);
299
300 fd = bpf_map__fd(rx_queue_index_map);
301 max_rxqs = bpf_map__max_entries(rx_queue_index_map);
302 for (i = 0; i < max_rxqs; i++)
303 map_collect_percpu(fd, i, &rec->rxq[i]);
304 }
305
calc_period(struct record * r,struct record * p)306 static double calc_period(struct record *r, struct record *p)
307 {
308 double period_ = 0;
309 __u64 period = 0;
310
311 period = r->timestamp - p->timestamp;
312 if (period > 0)
313 period_ = ((double) period / NANOSEC_PER_SEC);
314
315 return period_;
316 }
317
calc_pps(struct datarec * r,struct datarec * p,double period_)318 static __u64 calc_pps(struct datarec *r, struct datarec *p, double period_)
319 {
320 __u64 packets = 0;
321 __u64 pps = 0;
322
323 if (period_ > 0) {
324 packets = r->processed - p->processed;
325 pps = packets / period_;
326 }
327 return pps;
328 }
329
calc_errs_pps(struct datarec * r,struct datarec * p,double period_)330 static __u64 calc_errs_pps(struct datarec *r,
331 struct datarec *p, double period_)
332 {
333 __u64 packets = 0;
334 __u64 pps = 0;
335
336 if (period_ > 0) {
337 packets = r->issue - p->issue;
338 pps = packets / period_;
339 }
340 return pps;
341 }
342
/*
 * Print one stats report comparing the current and previous snapshots.
 *
 * @stats_rec:  newest snapshot
 * @stats_prev: snapshot taken one interval earlier
 * @action:     XDP action code shown in the header
 * @cfg_opt:    config option flags shown in the header
 *
 * Output has two tables: per-CPU rates from stats_global_map, then
 * per-RX-queue/per-CPU rates from rx_queue_index_map.  Rows are printed
 * only for CPUs with a non-zero packet rate.
 *
 * Fixes relative to the earlier version:
 *  - the total/sum rows now have a conversion for the issue-pps value
 *    that was always passed to printf() but never printed;
 *  - the error tag is decided per row, so a CPU without issues no longer
 *    inherits the tag of an earlier CPU;
 *  - a NULL action name is replaced by "unknown" rather than being
 *    handed to %s.
 * Format strings are now literals so the compiler can check them.
 */
static void stats_print(struct stats_record *stats_rec,
			struct stats_record *stats_prev,
			int action, __u32 cfg_opt)
{
	unsigned int nr_rxqs = bpf_map__max_entries(rx_queue_index_map);
	unsigned int nr_cpus = bpf_num_possible_cpus();
	const char *action_name = action2str(action);
	struct record *rec, *prev;
	double pps, err;
	double t;
	int rxq;
	int i;

	/* Header */
	printf("\nRunning XDP on dev:%s (ifindex:%d) action:%s options:%s\n",
	       ifname, ifindex, action_name ? action_name : "unknown",
	       options2str(cfg_opt));

	/* stats_global_map */
	printf("%-15s %-7s %-11s %-11s\n",
	       "XDP stats", "CPU", "pps", "issue-pps");

	rec  = &stats_rec->stats;
	prev = &stats_prev->stats;
	t = calc_period(rec, prev);
	for (i = 0; (unsigned int)i < nr_cpus; i++) {
		struct datarec *r = &rec->cpu[i];
		struct datarec *p = &prev->cpu[i];
		const char *errstr = "";

		pps = calc_pps(r, p, t);
		err = calc_errs_pps(r, p, t);
		if (err > 0)
			errstr = "invalid-ifindex";
		if (pps > 0)
			printf("%-15s %-7d %'-11.0f %'-10.0f %s\n",
			       "XDP-RX CPU", i, pps, err, errstr);
	}
	pps = calc_pps(&rec->total, &prev->total, t);
	err = calc_errs_pps(&rec->total, &prev->total, t);
	printf("%-15s %-7s %'-11.0f %'-10.0f\n",
	       "XDP-RX CPU", "total", pps, err);

	/* rx_queue_index_map */
	printf("\n%-15s %-7s %-11s %-11s\n",
	       "RXQ stats", "RXQ:CPU", "pps", "issue-pps");

	for (rxq = 0; (unsigned int)rxq < nr_rxqs; rxq++) {
		int rxq_ = rxq;

		/* Last RXQ in map catch overflows */
		if ((unsigned int)rxq == nr_rxqs - 1)
			rxq_ = -1;

		rec  = &stats_rec->rxq[rxq];
		prev = &stats_prev->rxq[rxq];
		t = calc_period(rec, prev);
		for (i = 0; (unsigned int)i < nr_cpus; i++) {
			struct datarec *r = &rec->cpu[i];
			struct datarec *p = &prev->cpu[i];
			const char *errstr = "";

			pps = calc_pps(r, p, t);
			err = calc_errs_pps(r, p, t);
			if (err > 0)
				errstr = (rxq_ == -1) ? "map-overflow-RXQ"
						      : "err";
			if (pps > 0)
				printf("%-15s %3d:%-3d %'-11.0f %'-10.0f %s\n",
				       "rx_queue_index",
				       rxq_, i, pps, err, errstr);
		}
		pps = calc_pps(&rec->total, &prev->total, t);
		err = calc_errs_pps(&rec->total, &prev->total, t);
		if (pps || err)
			printf("%-15s %3d:%-3s %'-11.0f %'-10.0f\n",
			       "rx_queue_index", rxq_, "sum", pps, err);
	}
}
427
428
/* Exchange the two snapshot pointers; the snapshots themselves are untouched */
static inline void swap(struct stats_record **a, struct stats_record **b)
{
	struct stats_record *old_a = *a;

	*a = *b;
	*b = old_a;
}
438
/*
 * Sample and print stats forever.
 *
 * @interval: seconds to sleep between reports
 * @action:   XDP action code, forwarded to stats_print()
 * @cfg_opt:  config option flags, forwarded to stats_print()
 *
 * Two snapshots are allocated once and reused: on each round the
 * pointers are exchanged so the previous "current" becomes "old", and
 * the other buffer is overwritten with a new sample.
 */
static void stats_poll(int interval, int action, __u32 cfg_opt)
{
	struct stats_record *cur = alloc_stats_record();
	struct stats_record *old = alloc_stats_record();

	stats_collect(cur);

	for (;;) {
		swap(&old, &cur);
		stats_collect(cur);
		stats_print(cur, old, action, cfg_opt);
		sleep(interval);
	}

	/* Not reached: the loop above has no exit */
	free_stats_record(cur);
	free_stats_record(old);
}
457
458
main(int argc,char ** argv)459 int main(int argc, char **argv)
460 {
461 __u32 cfg_options= NO_TOUCH ; /* Default: Don't touch packet memory */
462 struct bpf_prog_info info = {};
463 __u32 info_len = sizeof(info);
464 int prog_fd, map_fd, opt, err;
465 bool use_separators = true;
466 struct config cfg = { 0 };
467 struct bpf_program *prog;
468 struct bpf_object *obj;
469 struct bpf_map *map;
470 char filename[256];
471 int longindex = 0;
472 int interval = 2;
473 __u32 key = 0;
474
475
476 char action_str_buf[XDP_ACTION_MAX_STRLEN + 1 /* for \0 */] = { 0 };
477 int action = XDP_PASS; /* Default action */
478 char *action_str = NULL;
479
480 snprintf(filename, sizeof(filename), "%s_kern.o", argv[0]);
481
482 obj = bpf_object__open_file(filename, NULL);
483 if (libbpf_get_error(obj))
484 return EXIT_FAIL;
485
486 prog = bpf_object__next_program(obj, NULL);
487 bpf_program__set_type(prog, BPF_PROG_TYPE_XDP);
488
489 err = bpf_object__load(obj);
490 if (err)
491 return EXIT_FAIL;
492 prog_fd = bpf_program__fd(prog);
493
494 map = bpf_object__find_map_by_name(obj, "config_map");
495 stats_global_map = bpf_object__find_map_by_name(obj, "stats_global_map");
496 rx_queue_index_map = bpf_object__find_map_by_name(obj, "rx_queue_index_map");
497 if (!map || !stats_global_map || !rx_queue_index_map) {
498 printf("finding a map in obj file failed\n");
499 return EXIT_FAIL;
500 }
501 map_fd = bpf_map__fd(map);
502
503 if (!prog_fd) {
504 fprintf(stderr, "ERR: bpf_prog_load_xattr: %s\n", strerror(errno));
505 return EXIT_FAIL;
506 }
507
508 /* Parse commands line args */
509 while ((opt = getopt_long(argc, argv, "FhSrmzd:s:a:",
510 long_options, &longindex)) != -1) {
511 switch (opt) {
512 case 'd':
513 if (strlen(optarg) >= IF_NAMESIZE) {
514 fprintf(stderr, "ERR: --dev name too long\n");
515 goto error;
516 }
517 ifname = (char *)&ifname_buf;
518 strncpy(ifname, optarg, IF_NAMESIZE);
519 ifindex = if_nametoindex(ifname);
520 if (ifindex == 0) {
521 fprintf(stderr,
522 "ERR: --dev name unknown err(%d):%s\n",
523 errno, strerror(errno));
524 goto error;
525 }
526 break;
527 case 's':
528 interval = atoi(optarg);
529 break;
530 case 'S':
531 xdp_flags |= XDP_FLAGS_SKB_MODE;
532 break;
533 case 'z':
534 use_separators = false;
535 break;
536 case 'a':
537 action_str = (char *)&action_str_buf;
538 strncpy(action_str, optarg, XDP_ACTION_MAX_STRLEN);
539 break;
540 case 'r':
541 cfg_options |= READ_MEM;
542 break;
543 case 'm':
544 cfg_options |= SWAP_MAC;
545 break;
546 case 'F':
547 xdp_flags &= ~XDP_FLAGS_UPDATE_IF_NOEXIST;
548 break;
549 case 'h':
550 error:
551 default:
552 usage(argv);
553 return EXIT_FAIL_OPTION;
554 }
555 }
556
557 if (!(xdp_flags & XDP_FLAGS_SKB_MODE))
558 xdp_flags |= XDP_FLAGS_DRV_MODE;
559
560 /* Required option */
561 if (ifindex == -1) {
562 fprintf(stderr, "ERR: required option --dev missing\n");
563 usage(argv);
564 return EXIT_FAIL_OPTION;
565 }
566 cfg.ifindex = ifindex;
567
568 /* Parse action string */
569 if (action_str) {
570 action = parse_xdp_action(action_str);
571 if (action < 0) {
572 fprintf(stderr, "ERR: Invalid XDP --action: %s\n",
573 action_str);
574 list_xdp_actions();
575 return EXIT_FAIL_OPTION;
576 }
577 }
578 cfg.action = action;
579
580 /* XDP_TX requires changing MAC-addrs, else HW may drop */
581 if (action == XDP_TX)
582 cfg_options |= SWAP_MAC;
583 cfg.options = cfg_options;
584
585 /* Trick to pretty printf with thousands separators use %' */
586 if (use_separators)
587 setlocale(LC_NUMERIC, "en_US");
588
589 /* User-side setup ifindex in config_map */
590 err = bpf_map_update_elem(map_fd, &key, &cfg, 0);
591 if (err) {
592 fprintf(stderr, "Store config failed (err:%d)\n", err);
593 exit(EXIT_FAIL_BPF);
594 }
595
596 /* Remove XDP program when program is interrupted or killed */
597 signal(SIGINT, int_exit);
598 signal(SIGTERM, int_exit);
599
600 if (bpf_xdp_attach(ifindex, prog_fd, xdp_flags, NULL) < 0) {
601 fprintf(stderr, "link set xdp fd failed\n");
602 return EXIT_FAIL_XDP;
603 }
604
605 err = bpf_obj_get_info_by_fd(prog_fd, &info, &info_len);
606 if (err) {
607 printf("can't get prog info - %s\n", strerror(errno));
608 return err;
609 }
610 prog_id = info.id;
611
612 stats_poll(interval, action, cfg_options);
613 return EXIT_OK;
614 }
615