Path: blob/master/tools/testing/selftests/bpf/benchs/bench_sockmap.c
29270 views
// SPDX-License-Identifier: GPL-2.012#include <error.h>3#include <sys/types.h>4#include <sys/socket.h>5#include <netinet/in.h>6#include <sys/sendfile.h>7#include <arpa/inet.h>8#include <fcntl.h>9#include <argp.h>10#include "bench.h"11#include "bench_sockmap_prog.skel.h"12#include "bpf_util.h"1314#define FILE_SIZE (128 * 1024)15#define DATA_REPEAT_SIZE 101617static const char snd_data[DATA_REPEAT_SIZE] = {0, 1, 2, 3, 4, 5, 6, 7, 8, 9};1819/* c1 <-> [p1, p2] <-> c220* RX bench(BPF_SK_SKB_STREAM_VERDICT):21* ARG_FW_RX_PASS:22* send(p2) -> recv(c2) -> bpf skb passthrough -> recv(c2)23* ARG_FW_RX_VERDICT_EGRESS:24* send(c1) -> verdict skb to tx queuec of p2 -> recv(c2)25* ARG_FW_RX_VERDICT_INGRESS:26* send(c1) -> verdict skb to rx queuec of c2 -> recv(c2)27*28* TX bench(BPF_SK_MSG_VERDIC):29* ARG_FW_TX_PASS:30* send(p2) -> bpf msg passthrough -> send(p2) -> recv(c2)31* ARG_FW_TX_VERDICT_INGRESS:32* send(p2) -> verdict msg to rx queue of c2 -> recv(c2)33* ARG_FW_TX_VERDICT_EGRESS:34* send(p1) -> verdict msg to tx queue of p2 -> recv(c2)35*/36enum SOCKMAP_ARG_FLAG {37ARG_FW_RX_NORMAL = 11000,38ARG_FW_RX_PASS,39ARG_FW_RX_VERDICT_EGRESS,40ARG_FW_RX_VERDICT_INGRESS,41ARG_FW_TX_NORMAL,42ARG_FW_TX_PASS,43ARG_FW_TX_VERDICT_INGRESS,44ARG_FW_TX_VERDICT_EGRESS,45ARG_CTL_RX_STRP,46ARG_CONSUMER_DELAY_TIME,47ARG_PRODUCER_DURATION,48};4950#define TXMODE_NORMAL() \51((ctx.mode) == ARG_FW_TX_NORMAL)5253#define TXMODE_BPF_INGRESS() \54((ctx.mode) == ARG_FW_TX_VERDICT_INGRESS)5556#define TXMODE_BPF_EGRESS() \57((ctx.mode) == ARG_FW_TX_VERDICT_EGRESS)5859#define TXMODE_BPF_PASS() \60((ctx.mode) == ARG_FW_TX_PASS)6162#define TXMODE_BPF() ( \63TXMODE_BPF_PASS() || \64TXMODE_BPF_INGRESS() || \65TXMODE_BPF_EGRESS())6667#define TXMODE() ( \68TXMODE_NORMAL() || \69TXMODE_BPF())7071#define RXMODE_NORMAL() \72((ctx.mode) == ARG_FW_RX_NORMAL)7374#define RXMODE_BPF_PASS() \75((ctx.mode) == ARG_FW_RX_PASS)7677#define RXMODE_BPF_VERDICT_EGRESS() \78((ctx.mode) == ARG_FW_RX_VERDICT_EGRESS)7980#define RXMODE_BPF_VERDICT_INGRESS() \81((ctx.mode) == ARG_FW_RX_VERDICT_INGRESS)8283#define RXMODE_BPF_VERDICT() ( \84RXMODE_BPF_VERDICT_INGRESS() || \85RXMODE_BPF_VERDICT_EGRESS())8687#define RXMODE_BPF() ( \88RXMODE_BPF_PASS() || \89RXMODE_BPF_VERDICT())9091#define RXMODE() ( \92RXMODE_NORMAL() || \93RXMODE_BPF())9495static struct socmap_ctx {96struct bench_sockmap_prog *skel;97enum SOCKMAP_ARG_FLAG mode;98#define c1 fds[0]99#define p1 fds[1]100#define c2 fds[2]101#define p2 fds[3]102#define sfd fds[4]103int fds[5];104long send_calls;105long read_calls;106long prod_send;107long user_read;108int file_size;109int delay_consumer;110int prod_run_time;111int strp_size;112} ctx = {113.prod_send = 0,114.user_read = 0,115.file_size = FILE_SIZE,116.mode = ARG_FW_RX_VERDICT_EGRESS,117.fds = {0},118.delay_consumer = 0,119.prod_run_time = 0,120.strp_size = 0,121};122123static void bench_sockmap_prog_destroy(void)124{125int i;126127for (i = 0; i < ARRAY_SIZE(ctx.fds); i++) {128if (ctx.fds[i] > 0)129close(ctx.fds[i]);130}131132bench_sockmap_prog__destroy(ctx.skel);133}134135static void init_addr(struct sockaddr_storage *ss,136socklen_t *len)137{138struct sockaddr_in *addr4 = memset(ss, 0, sizeof(*ss));139140addr4->sin_family = AF_INET;141addr4->sin_port = 0;142addr4->sin_addr.s_addr = htonl(INADDR_LOOPBACK);143*len = sizeof(*addr4);144}145146static bool set_non_block(int fd, bool blocking)147{148int flags = fcntl(fd, F_GETFL, 0);149150if (flags == -1)151return false;152flags = blocking ? (flags | O_NONBLOCK) : (flags & ~O_NONBLOCK);153return (fcntl(fd, F_SETFL, flags) == 0);154}155156static int create_pair(int *c, int *p, int type)157{158struct sockaddr_storage addr;159int err, cfd, pfd;160socklen_t addr_len = sizeof(struct sockaddr_storage);161162err = getsockname(ctx.sfd, (struct sockaddr *)&addr, &addr_len);163if (err) {164fprintf(stderr, "getsockname error %d\n", errno);165return err;166}167cfd = socket(AF_INET, type, 0);168if (cfd < 0) {169fprintf(stderr, "socket error %d\n", errno);170return err;171}172173err = connect(cfd, (struct sockaddr *)&addr, addr_len);174if (err && errno != EINPROGRESS) {175fprintf(stderr, "connect error %d\n", errno);176return err;177}178179pfd = accept(ctx.sfd, NULL, NULL);180if (pfd < 0) {181fprintf(stderr, "accept error %d\n", errno);182return err;183}184*c = cfd;185*p = pfd;186return 0;187}188189static int create_sockets(void)190{191struct sockaddr_storage addr;192int err, one = 1;193socklen_t addr_len;194195init_addr(&addr, &addr_len);196ctx.sfd = socket(AF_INET, SOCK_STREAM, 0);197if (ctx.sfd < 0) {198fprintf(stderr, "socket error:%d\n", errno);199return ctx.sfd;200}201err = setsockopt(ctx.sfd, SOL_SOCKET, SO_REUSEPORT, &one, sizeof(one));202if (err) {203fprintf(stderr, "setsockopt error:%d\n", errno);204return err;205}206207err = bind(ctx.sfd, (struct sockaddr *)&addr, addr_len);208if (err) {209fprintf(stderr, "bind error:%d\n", errno);210return err;211}212213err = listen(ctx.sfd, SOMAXCONN);214if (err) {215fprintf(stderr, "listen error:%d\n", errno);216return err;217}218219err = create_pair(&ctx.c1, &ctx.p1, SOCK_STREAM);220if (err) {221fprintf(stderr, "create_pair 1 error\n");222return err;223}224225err = create_pair(&ctx.c2, &ctx.p2, SOCK_STREAM);226if (err) {227fprintf(stderr, "create_pair 2 error\n");228return err;229}230printf("create socket fd c1:%d p1:%d c2:%d p2:%d\n",231ctx.c1, ctx.p1, ctx.c2, ctx.p2);232return 0;233}234235static void validate(void)236{237if (env.consumer_cnt != 2 || env.producer_cnt != 1 ||238!env.affinity)239goto err;240return;241err:242fprintf(stderr, "argument '-c 2 -p 1 -a' is necessary");243exit(1);244}245246static int setup_rx_sockmap(void)247{248int verdict, pass, parser, map;249int zero = 0, one = 1;250int err;251252parser = bpf_program__fd(ctx.skel->progs.prog_skb_parser);253verdict = bpf_program__fd(ctx.skel->progs.prog_skb_verdict);254pass = bpf_program__fd(ctx.skel->progs.prog_skb_pass);255map = bpf_map__fd(ctx.skel->maps.sock_map_rx);256257if (ctx.strp_size != 0) {258ctx.skel->bss->pkt_size = ctx.strp_size;259err = bpf_prog_attach(parser, map, BPF_SK_SKB_STREAM_PARSER, 0);260if (err)261return err;262}263264if (RXMODE_BPF_VERDICT())265err = bpf_prog_attach(verdict, map, BPF_SK_SKB_STREAM_VERDICT, 0);266else if (RXMODE_BPF_PASS())267err = bpf_prog_attach(pass, map, BPF_SK_SKB_STREAM_VERDICT, 0);268if (err)269return err;270271if (RXMODE_BPF_PASS())272return bpf_map_update_elem(map, &zero, &ctx.c2, BPF_NOEXIST);273274err = bpf_map_update_elem(map, &zero, &ctx.p1, BPF_NOEXIST);275if (err < 0)276return err;277278if (RXMODE_BPF_VERDICT_INGRESS()) {279ctx.skel->bss->verdict_dir = BPF_F_INGRESS;280err = bpf_map_update_elem(map, &one, &ctx.c2, BPF_NOEXIST);281} else {282err = bpf_map_update_elem(map, &one, &ctx.p2, BPF_NOEXIST);283}284if (err < 0)285return err;286287return 0;288}289290static int setup_tx_sockmap(void)291{292int zero = 0, one = 1;293int prog, map;294int err;295296map = bpf_map__fd(ctx.skel->maps.sock_map_tx);297prog = TXMODE_BPF_PASS() ?298bpf_program__fd(ctx.skel->progs.prog_skmsg_pass) :299bpf_program__fd(ctx.skel->progs.prog_skmsg_verdict);300301err = bpf_prog_attach(prog, map, BPF_SK_MSG_VERDICT, 0);302if (err)303return err;304305if (TXMODE_BPF_EGRESS()) {306err = bpf_map_update_elem(map, &zero, &ctx.p1, BPF_NOEXIST);307err |= bpf_map_update_elem(map, &one, &ctx.p2, BPF_NOEXIST);308} else {309ctx.skel->bss->verdict_dir = BPF_F_INGRESS;310err = bpf_map_update_elem(map, &zero, &ctx.p2, BPF_NOEXIST);311err |= bpf_map_update_elem(map, &one, &ctx.c2, BPF_NOEXIST);312}313314if (err < 0)315return err;316317return 0;318}319320static void setup(void)321{322int err;323324ctx.skel = bench_sockmap_prog__open_and_load();325if (!ctx.skel) {326fprintf(stderr, "error loading skel\n");327exit(1);328}329330if (create_sockets()) {331fprintf(stderr, "create_net_mode error\n");332goto err;333}334335if (RXMODE_BPF()) {336err = setup_rx_sockmap();337if (err) {338fprintf(stderr, "setup_rx_sockmap error:%d\n", err);339goto err;340}341} else if (TXMODE_BPF()) {342err = setup_tx_sockmap();343if (err) {344fprintf(stderr, "setup_tx_sockmap error:%d\n", err);345goto err;346}347} else {348fprintf(stderr, "unknown sockmap bench mode: %d\n", ctx.mode);349goto err;350}351352return;353354err:355bench_sockmap_prog_destroy();356exit(1);357}358359static void measure(struct bench_res *res)360{361res->drops = atomic_swap(&ctx.prod_send, 0);362res->hits = atomic_swap(&ctx.skel->bss->process_byte, 0);363res->false_hits = atomic_swap(&ctx.user_read, 0);364res->important_hits = atomic_swap(&ctx.send_calls, 0);365res->important_hits |= atomic_swap(&ctx.read_calls, 0) << 32;366}367368static void verify_data(int *check_pos, char *buf, int rcv)369{370for (int i = 0 ; i < rcv; i++) {371if (buf[i] != snd_data[(*check_pos) % DATA_REPEAT_SIZE]) {372fprintf(stderr, "verify data fail");373exit(1);374}375(*check_pos)++;376if (*check_pos >= FILE_SIZE)377*check_pos = 0;378}379}380381static void *consumer(void *input)382{383int rcv, sent;384int check_pos = 0;385int tid = (long)input;386int recv_buf_size = FILE_SIZE;387char *buf = malloc(recv_buf_size);388int delay_read = ctx.delay_consumer;389390if (!buf) {391fprintf(stderr, "fail to init read buffer");392return NULL;393}394395while (true) {396if (tid == 1) {397/* consumer 1 is unused for tx test and stream verdict test */398if (RXMODE_BPF() || TXMODE())399return NULL;400/* it's only for RX_NORMAL which service as reserve-proxy mode */401rcv = read(ctx.p1, buf, recv_buf_size);402if (rcv < 0) {403fprintf(stderr, "fail to read p1");404return NULL;405}406407sent = send(ctx.p2, buf, recv_buf_size, 0);408if (sent < 0) {409fprintf(stderr, "fail to send p2");410return NULL;411}412} else {413if (delay_read != 0) {414if (delay_read < 0)415return NULL;416sleep(delay_read);417delay_read = 0;418}419/* read real endpoint by consumer 0 */420atomic_inc(&ctx.read_calls);421rcv = read(ctx.c2, buf, recv_buf_size);422if (rcv < 0 && errno != EAGAIN) {423fprintf(stderr, "%s fail to read c2 %d\n", __func__, errno);424return NULL;425}426verify_data(&check_pos, buf, rcv);427atomic_add(&ctx.user_read, rcv);428}429}430431return NULL;432}433434static void *producer(void *input)435{436int off = 0, fp, need_sent, sent;437int file_size = ctx.file_size;438struct timespec ts1, ts2;439int target;440FILE *file;441442file = tmpfile();443if (!file) {444fprintf(stderr, "create file for sendfile");445return NULL;446}447448/* we need simple verify */449for (int i = 0; i < file_size; i++) {450if (fwrite(&snd_data[off], sizeof(char), 1, file) != 1) {451fprintf(stderr, "init tmpfile error");452return NULL;453}454if (++off >= sizeof(snd_data))455off = 0;456}457fflush(file);458fseek(file, 0, SEEK_SET);459460fp = fileno(file);461need_sent = file_size;462clock_gettime(CLOCK_MONOTONIC, &ts1);463464if (RXMODE_BPF_VERDICT())465target = ctx.c1;466else if (TXMODE_BPF_EGRESS())467target = ctx.p1;468else469target = ctx.p2;470set_non_block(target, true);471while (true) {472if (ctx.prod_run_time) {473clock_gettime(CLOCK_MONOTONIC, &ts2);474if (ts2.tv_sec - ts1.tv_sec > ctx.prod_run_time)475return NULL;476}477478errno = 0;479atomic_inc(&ctx.send_calls);480sent = sendfile(target, fp, NULL, need_sent);481if (sent < 0) {482if (errno != EAGAIN && errno != ENOMEM && errno != ENOBUFS) {483fprintf(stderr, "sendfile return %d, errorno %d:%s\n",484sent, errno, strerror(errno));485return NULL;486}487continue;488} else if (sent < need_sent) {489need_sent -= sent;490atomic_add(&ctx.prod_send, sent);491continue;492}493atomic_add(&ctx.prod_send, need_sent);494need_sent = file_size;495lseek(fp, 0, SEEK_SET);496}497498return NULL;499}500501static void report_progress(int iter, struct bench_res *res, long delta_ns)502{503double speed_mbs, prod_mbs, bpf_mbs, send_hz, read_hz;504505prod_mbs = res->drops / 1000000.0 / (delta_ns / 1000000000.0);506speed_mbs = res->false_hits / 1000000.0 / (delta_ns / 1000000000.0);507bpf_mbs = res->hits / 1000000.0 / (delta_ns / 1000000000.0);508send_hz = (res->important_hits & 0xFFFFFFFF) / (delta_ns / 1000000000.0);509read_hz = (res->important_hits >> 32) / (delta_ns / 1000000000.0);510511printf("Iter %3d (%7.3lfus): ",512iter, (delta_ns - 1000000000) / 1000.0);513printf("Send Speed %8.3lf MB/s (%8.3lf calls/s), BPF Speed %8.3lf MB/s, "514"Rcv Speed %8.3lf MB/s (%8.3lf calls/s)\n",515prod_mbs, send_hz, bpf_mbs, speed_mbs, read_hz);516}517518static void report_final(struct bench_res res[], int res_cnt)519{520double verdict_mbs_mean = 0.0;521long verdict_total = 0;522int i;523524for (i = 0; i < res_cnt; i++) {525verdict_mbs_mean += res[i].hits / 1000000.0 / (0.0 + res_cnt);526verdict_total += res[i].hits / 1000000.0;527}528529printf("Summary: total trans %8.3lu MB \u00B1 %5.3lf MB/s\n",530verdict_total, verdict_mbs_mean);531}532533static const struct argp_option opts[] = {534{ "rx-normal", ARG_FW_RX_NORMAL, NULL, 0,535"simple reserve-proxy mode, no bfp enabled"},536{ "rx-pass", ARG_FW_RX_PASS, NULL, 0,537"run bpf prog but no redir applied"},538{ "rx-strp", ARG_CTL_RX_STRP, "Byte", 0,539"enable strparser and set the encapsulation size"},540{ "rx-verdict-egress", ARG_FW_RX_VERDICT_EGRESS, NULL, 0,541"forward data with bpf(stream verdict)"},542{ "rx-verdict-ingress", ARG_FW_RX_VERDICT_INGRESS, NULL, 0,543"forward data with bpf(stream verdict)"},544{ "tx-normal", ARG_FW_TX_NORMAL, NULL, 0,545"simple c-s mode, no bfp enabled"},546{ "tx-pass", ARG_FW_TX_PASS, NULL, 0,547"run bpf prog but no redir applied"},548{ "tx-verdict-ingress", ARG_FW_TX_VERDICT_INGRESS, NULL, 0,549"forward msg to ingress queue of another socket"},550{ "tx-verdict-egress", ARG_FW_TX_VERDICT_EGRESS, NULL, 0,551"forward msg to egress queue of another socket"},552{ "delay-consumer", ARG_CONSUMER_DELAY_TIME, "SEC", 0,553"delay consumer start"},554{ "producer-duration", ARG_PRODUCER_DURATION, "SEC", 0,555"producer duration"},556{},557};558559static error_t parse_arg(int key, char *arg, struct argp_state *state)560{561switch (key) {562case ARG_FW_RX_NORMAL...ARG_FW_TX_VERDICT_EGRESS:563ctx.mode = key;564break;565case ARG_CONSUMER_DELAY_TIME:566ctx.delay_consumer = strtol(arg, NULL, 10);567break;568case ARG_PRODUCER_DURATION:569ctx.prod_run_time = strtol(arg, NULL, 10);570break;571case ARG_CTL_RX_STRP:572ctx.strp_size = strtol(arg, NULL, 10);573break;574default:575return ARGP_ERR_UNKNOWN;576}577578return 0;579}580581/* exported into benchmark runner */582const struct argp bench_sockmap_argp = {583.options = opts,584.parser = parse_arg,585};586587/* Benchmark performance of creating bpf local storage */588const struct bench bench_sockmap = {589.name = "sockmap",590.argp = &bench_sockmap_argp,591.validate = validate,592.setup = setup,593.producer_thread = producer,594.consumer_thread = consumer,595.measure = measure,596.report_progress = report_progress,597.report_final = report_final,598};599600601