Path: blob/master/tools/testing/selftests/drivers/net/hw/iou-zcrx.c
53747 views
// SPDX-License-Identifier: GPL-2.01#include <assert.h>2#include <errno.h>3#include <error.h>4#include <fcntl.h>5#include <limits.h>6#include <stdbool.h>7#include <stdint.h>8#include <stdio.h>9#include <stdlib.h>10#include <string.h>11#include <unistd.h>1213#include <arpa/inet.h>14#include <linux/mman.h>15#include <linux/errqueue.h>16#include <linux/if_packet.h>17#include <linux/ipv6.h>18#include <linux/socket.h>19#include <linux/sockios.h>20#include <net/ethernet.h>21#include <net/if.h>22#include <netinet/in.h>23#include <netinet/ip.h>24#include <netinet/ip6.h>25#include <netinet/tcp.h>26#include <netinet/udp.h>27#include <sys/epoll.h>28#include <sys/ioctl.h>29#include <sys/mman.h>30#include <sys/resource.h>31#include <sys/socket.h>32#include <sys/stat.h>33#include <sys/time.h>34#include <sys/types.h>35#include <sys/un.h>36#include <sys/wait.h>3738#include <liburing.h>3940#define SKIP_CODE 424142struct t_io_uring_zcrx_ifq_reg {43__u32 if_idx;44__u32 if_rxq;45__u32 rq_entries;46__u32 flags;4748__u64 area_ptr; /* pointer to struct io_uring_zcrx_area_reg */49__u64 region_ptr; /* struct io_uring_region_desc * */5051struct io_uring_zcrx_offsets offsets;52__u32 zcrx_id;53__u32 rx_buf_len;54__u64 __resv[3];55};5657static long page_size;58#define AREA_SIZE (8192 * page_size)59#define SEND_SIZE (512 * 4096)60#define min(a, b) \61({ \62typeof(a) _a = (a); \63typeof(b) _b = (b); \64_a < _b ? _a : _b; \65})66#define min_t(t, a, b) \67({ \68t _ta = (a); \69t _tb = (b); \70min(_ta, _tb); \71})7273#define ALIGN_UP(v, align) (((v) + (align) - 1) & ~((align) - 1))7475static int cfg_server;76static int cfg_client;77static int cfg_port = 8000;78static int cfg_payload_len;79static const char *cfg_ifname;80static int cfg_queue_id = -1;81static bool cfg_oneshot;82static int cfg_oneshot_recvs;83static int cfg_send_size = SEND_SIZE;84static struct sockaddr_in6 cfg_addr;85static unsigned int cfg_rx_buf_len;86static bool cfg_dry_run;8788static char *payload;89static void *area_ptr;90static void *ring_ptr;91static size_t ring_size;92static struct io_uring_zcrx_rq rq_ring;93static unsigned long area_token;94static int connfd;95static bool stop;96static size_t received;9798static unsigned long gettimeofday_ms(void)99{100struct timeval tv;101102gettimeofday(&tv, NULL);103return (tv.tv_sec * 1000) + (tv.tv_usec / 1000);104}105106static int parse_address(const char *str, int port, struct sockaddr_in6 *sin6)107{108int ret;109110sin6->sin6_family = AF_INET6;111sin6->sin6_port = htons(port);112113ret = inet_pton(sin6->sin6_family, str, &sin6->sin6_addr);114if (ret != 1) {115/* fallback to plain IPv4 */116ret = inet_pton(AF_INET, str, &sin6->sin6_addr.s6_addr32[3]);117if (ret != 1)118return -1;119120/* add ::ffff prefix */121sin6->sin6_addr.s6_addr32[0] = 0;122sin6->sin6_addr.s6_addr32[1] = 0;123sin6->sin6_addr.s6_addr16[4] = 0;124sin6->sin6_addr.s6_addr16[5] = 0xffff;125}126127return 0;128}129130static inline size_t get_refill_ring_size(unsigned int rq_entries)131{132size_t size;133134ring_size = rq_entries * sizeof(struct io_uring_zcrx_rqe);135/* add space for the header (head/tail/etc.) */136ring_size += page_size;137return ALIGN_UP(ring_size, page_size);138}139140static void setup_zcrx(struct io_uring *ring)141{142unsigned int ifindex;143unsigned int rq_entries = 4096;144int ret;145146ifindex = if_nametoindex(cfg_ifname);147if (!ifindex)148error(1, 0, "bad interface name: %s", cfg_ifname);149150if (cfg_rx_buf_len && cfg_rx_buf_len != page_size) {151area_ptr = mmap(NULL,152AREA_SIZE,153PROT_READ | PROT_WRITE,154MAP_ANONYMOUS | MAP_PRIVATE |155MAP_HUGETLB | MAP_HUGE_2MB,156-1,1570);158if (area_ptr == MAP_FAILED) {159printf("Can't allocate huge pages\n");160exit(SKIP_CODE);161}162} else {163area_ptr = mmap(NULL,164AREA_SIZE,165PROT_READ | PROT_WRITE,166MAP_ANONYMOUS | MAP_PRIVATE,1670,1680);169if (area_ptr == MAP_FAILED)170error(1, 0, "mmap(): zero copy area");171}172173ring_size = get_refill_ring_size(rq_entries);174ring_ptr = mmap(NULL,175ring_size,176PROT_READ | PROT_WRITE,177MAP_ANONYMOUS | MAP_PRIVATE,1780,1790);180181struct io_uring_region_desc region_reg = {182.size = ring_size,183.user_addr = (__u64)(unsigned long)ring_ptr,184.flags = IORING_MEM_REGION_TYPE_USER,185};186187struct io_uring_zcrx_area_reg area_reg = {188.addr = (__u64)(unsigned long)area_ptr,189.len = AREA_SIZE,190.flags = 0,191};192193struct t_io_uring_zcrx_ifq_reg reg = {194.if_idx = ifindex,195.if_rxq = cfg_queue_id,196.rq_entries = rq_entries,197.area_ptr = (__u64)(unsigned long)&area_reg,198.region_ptr = (__u64)(unsigned long)®ion_reg,199.rx_buf_len = cfg_rx_buf_len,200};201202ret = io_uring_register_ifq(ring, (void *)®);203if (cfg_rx_buf_len && (ret == -EINVAL || ret == -EOPNOTSUPP ||204ret == -ERANGE)) {205printf("Large chunks are not supported %i\n", ret);206exit(SKIP_CODE);207} else if (ret) {208error(1, 0, "io_uring_register_ifq(): %d", ret);209}210211rq_ring.khead = (unsigned int *)((char *)ring_ptr + reg.offsets.head);212rq_ring.ktail = (unsigned int *)((char *)ring_ptr + reg.offsets.tail);213rq_ring.rqes = (struct io_uring_zcrx_rqe *)((char *)ring_ptr + reg.offsets.rqes);214rq_ring.rq_tail = 0;215rq_ring.ring_entries = reg.rq_entries;216217area_token = area_reg.rq_area_token;218}219220static void add_accept(struct io_uring *ring, int sockfd)221{222struct io_uring_sqe *sqe;223224sqe = io_uring_get_sqe(ring);225226io_uring_prep_accept(sqe, sockfd, NULL, NULL, 0);227sqe->user_data = 1;228}229230static void add_recvzc(struct io_uring *ring, int sockfd)231{232struct io_uring_sqe *sqe;233234sqe = io_uring_get_sqe(ring);235236io_uring_prep_rw(IORING_OP_RECV_ZC, sqe, sockfd, NULL, 0, 0);237sqe->ioprio |= IORING_RECV_MULTISHOT;238sqe->user_data = 2;239}240241static void add_recvzc_oneshot(struct io_uring *ring, int sockfd, size_t len)242{243struct io_uring_sqe *sqe;244245sqe = io_uring_get_sqe(ring);246247io_uring_prep_rw(IORING_OP_RECV_ZC, sqe, sockfd, NULL, len, 0);248sqe->ioprio |= IORING_RECV_MULTISHOT;249sqe->user_data = 2;250}251252static void process_accept(struct io_uring *ring, struct io_uring_cqe *cqe)253{254if (cqe->res < 0)255error(1, 0, "accept()");256if (connfd)257error(1, 0, "Unexpected second connection");258259connfd = cqe->res;260if (cfg_oneshot)261add_recvzc_oneshot(ring, connfd, page_size);262else263add_recvzc(ring, connfd);264}265266static void process_recvzc(struct io_uring *ring, struct io_uring_cqe *cqe)267{268unsigned rq_mask = rq_ring.ring_entries - 1;269struct io_uring_zcrx_cqe *rcqe;270struct io_uring_zcrx_rqe *rqe;271struct io_uring_sqe *sqe;272uint64_t mask;273char *data;274ssize_t n;275int i;276277if (cqe->res == 0 && cqe->flags == 0 && cfg_oneshot_recvs == 0) {278stop = true;279return;280}281282if (cqe->res < 0)283error(1, 0, "recvzc(): %d", cqe->res);284285if (cfg_oneshot) {286if (cqe->res == 0 && cqe->flags == 0 && cfg_oneshot_recvs) {287add_recvzc_oneshot(ring, connfd, page_size);288cfg_oneshot_recvs--;289}290} else if (!(cqe->flags & IORING_CQE_F_MORE)) {291add_recvzc(ring, connfd);292}293294rcqe = (struct io_uring_zcrx_cqe *)(cqe + 1);295296n = cqe->res;297mask = (1ULL << IORING_ZCRX_AREA_SHIFT) - 1;298data = (char *)area_ptr + (rcqe->off & mask);299300for (i = 0; i < n; i++) {301if (*(data + i) != payload[(received + i)])302error(1, 0, "payload mismatch at %d", i);303}304received += n;305306rqe = &rq_ring.rqes[(rq_ring.rq_tail & rq_mask)];307rqe->off = (rcqe->off & ~IORING_ZCRX_AREA_MASK) | area_token;308rqe->len = cqe->res;309io_uring_smp_store_release(rq_ring.ktail, ++rq_ring.rq_tail);310}311312static void server_loop(struct io_uring *ring)313{314struct io_uring_cqe *cqe;315unsigned int count = 0;316unsigned int head;317int i, ret;318319io_uring_submit_and_wait(ring, 1);320321io_uring_for_each_cqe(ring, head, cqe) {322if (cqe->user_data == 1)323process_accept(ring, cqe);324else if (cqe->user_data == 2)325process_recvzc(ring, cqe);326else327error(1, 0, "unknown cqe");328count++;329}330io_uring_cq_advance(ring, count);331}332333static void run_server(void)334{335unsigned int flags = 0;336struct io_uring ring;337int fd, enable, ret;338uint64_t tstop;339340fd = socket(AF_INET6, SOCK_STREAM, 0);341if (fd == -1)342error(1, 0, "socket()");343344enable = 1;345ret = setsockopt(fd, SOL_SOCKET, SO_REUSEADDR, &enable, sizeof(int));346if (ret < 0)347error(1, 0, "setsockopt(SO_REUSEADDR)");348349ret = bind(fd, (struct sockaddr *)&cfg_addr, sizeof(cfg_addr));350if (ret < 0)351error(1, 0, "bind()");352353if (listen(fd, 1024) < 0)354error(1, 0, "listen()");355356flags |= IORING_SETUP_COOP_TASKRUN;357flags |= IORING_SETUP_SINGLE_ISSUER;358flags |= IORING_SETUP_DEFER_TASKRUN;359flags |= IORING_SETUP_SUBMIT_ALL;360flags |= IORING_SETUP_CQE32;361362io_uring_queue_init(512, &ring, flags);363364setup_zcrx(&ring);365if (cfg_dry_run)366return;367368add_accept(&ring, fd);369370tstop = gettimeofday_ms() + 5000;371while (!stop && gettimeofday_ms() < tstop)372server_loop(&ring);373374if (!stop)375error(1, 0, "test failed\n");376}377378static void run_client(void)379{380ssize_t to_send = cfg_send_size;381ssize_t sent = 0;382ssize_t chunk, res;383int fd;384385fd = socket(AF_INET6, SOCK_STREAM, 0);386if (fd == -1)387error(1, 0, "socket()");388389if (connect(fd, (struct sockaddr *)&cfg_addr, sizeof(cfg_addr)))390error(1, 0, "connect()");391392while (to_send) {393void *src = &payload[sent];394395chunk = min_t(ssize_t, cfg_payload_len, to_send);396res = send(fd, src, chunk, 0);397if (res < 0)398error(1, 0, "send(): %zd", sent);399sent += res;400to_send -= res;401}402403close(fd);404}405406static void usage(const char *filepath)407{408error(1, 0, "Usage: %s (-4|-6) (-s|-c) -h<server_ip> -p<port> "409"-l<payload_size> -i<ifname> -q<rxq_id>", filepath);410}411412static void parse_opts(int argc, char **argv)413{414const int max_payload_len = SEND_SIZE -415sizeof(struct ipv6hdr) -416sizeof(struct tcphdr) -41740 /* max tcp options */;418struct sockaddr_in6 *addr6 = (void *) &cfg_addr;419char *addr = NULL;420int ret;421int c;422423if (argc <= 1)424usage(argv[0]);425cfg_payload_len = max_payload_len;426427while ((c = getopt(argc, argv, "sch:p:l:i:q:o:z:x:d")) != -1) {428switch (c) {429case 's':430if (cfg_client)431error(1, 0, "Pass one of -s or -c");432cfg_server = 1;433break;434case 'c':435if (cfg_server)436error(1, 0, "Pass one of -s or -c");437cfg_client = 1;438break;439case 'h':440addr = optarg;441break;442case 'p':443cfg_port = strtoul(optarg, NULL, 0);444break;445case 'l':446cfg_payload_len = strtoul(optarg, NULL, 0);447break;448case 'i':449cfg_ifname = optarg;450break;451case 'q':452cfg_queue_id = strtoul(optarg, NULL, 0);453break;454case 'o': {455cfg_oneshot = true;456cfg_oneshot_recvs = strtoul(optarg, NULL, 0);457break;458}459case 'z':460cfg_send_size = strtoul(optarg, NULL, 0);461break;462case 'x':463cfg_rx_buf_len = page_size * strtoul(optarg, NULL, 0);464break;465case 'd':466cfg_dry_run = true;467break;468}469}470471if (cfg_server && addr)472error(1, 0, "Receiver cannot have -h specified");473474memset(addr6, 0, sizeof(*addr6));475addr6->sin6_family = AF_INET6;476addr6->sin6_port = htons(cfg_port);477addr6->sin6_addr = in6addr_any;478if (addr) {479ret = parse_address(addr, cfg_port, addr6);480if (ret)481error(1, 0, "receiver address parse error: %s", addr);482}483484if (cfg_payload_len > max_payload_len)485error(1, 0, "-l: payload exceeds max (%d)", max_payload_len);486}487488int main(int argc, char **argv)489{490const char *cfg_test = argv[argc - 1];491int i;492493page_size = sysconf(_SC_PAGESIZE);494if (page_size < 0)495return 1;496497if (posix_memalign((void **)&payload, page_size, SEND_SIZE))498return 1;499500parse_opts(argc, argv);501502for (i = 0; i < SEND_SIZE; i++)503payload[i] = 'a' + (i % 26);504505if (cfg_server)506run_server();507else if (cfg_client)508run_client();509510return 0;511}512513514