Path: blob/master/tools/include/io_uring/mini_liburing.h
/* SPDX-License-Identifier: MIT */

#include <linux/io_uring.h>
#include <sys/mman.h>
#include <sys/syscall.h>
#include <errno.h>
#include <signal.h>
#include <stdio.h>
#include <string.h>
#include <unistd.h>
#include <sys/uio.h>

struct io_sq_ring {
	unsigned int *head;
	unsigned int *tail;
	unsigned int *ring_mask;
	unsigned int *ring_entries;
	unsigned int *flags;
	unsigned int *array;
};

struct io_cq_ring {
	unsigned int *head;
	unsigned int *tail;
	unsigned int *ring_mask;
	unsigned int *ring_entries;
	struct io_uring_cqe *cqes;
};

struct io_uring_sq {
	unsigned int *khead;
	unsigned int *ktail;
	unsigned int *kring_mask;
	unsigned int *kring_entries;
	unsigned int *kflags;
	unsigned int *kdropped;
	unsigned int *array;
	struct io_uring_sqe *sqes;

	unsigned int sqe_head;
	unsigned int sqe_tail;

	size_t ring_sz;
};

struct io_uring_cq {
	unsigned int *khead;
	unsigned int *ktail;
	unsigned int *kring_mask;
	unsigned int *kring_entries;
	unsigned int *koverflow;
	struct io_uring_cqe *cqes;

	size_t ring_sz;
};

struct io_uring {
	struct io_uring_sq sq;
	struct io_uring_cq cq;
	int ring_fd;
	unsigned flags;
};

/* x86 is strongly ordered, so a compiler barrier is sufficient here. */
#if defined(__x86_64) || defined(__i386__)
#define read_barrier()	__asm__ __volatile__("":::"memory")
#define write_barrier()	__asm__ __volatile__("":::"memory")
#else
#define read_barrier()	__sync_synchronize()
#define write_barrier()	__sync_synchronize()
#endif

/* Map the SQ/CQ rings and the SQE array from the ring fd. */
static inline int io_uring_mmap(int fd, struct io_uring_params *p,
				struct io_uring_sq *sq, struct io_uring_cq *cq)
{
	size_t size;
	void *ptr;
	int ret;

	if (p->flags & IORING_SETUP_NO_SQARRAY) {
		sq->ring_sz = p->cq_off.cqes;
		sq->ring_sz += p->cq_entries * sizeof(struct io_uring_cqe);
	} else {
		sq->ring_sz = p->sq_off.array;
		sq->ring_sz += p->sq_entries * sizeof(unsigned int);
	}

	ptr = mmap(0, sq->ring_sz, PROT_READ | PROT_WRITE,
		   MAP_SHARED | MAP_POPULATE, fd, IORING_OFF_SQ_RING);
	if (ptr == MAP_FAILED)
		return -errno;
	sq->khead = ptr + p->sq_off.head;
	sq->ktail = ptr + p->sq_off.tail;
	sq->kring_mask = ptr + p->sq_off.ring_mask;
	sq->kring_entries = ptr + p->sq_off.ring_entries;
	sq->kflags = ptr + p->sq_off.flags;
	sq->kdropped = ptr + p->sq_off.dropped;
	if (!(p->flags & IORING_SETUP_NO_SQARRAY))
		sq->array = ptr + p->sq_off.array;

	size = p->sq_entries * sizeof(struct io_uring_sqe);
	sq->sqes = mmap(0, size, PROT_READ | PROT_WRITE,
			MAP_SHARED | MAP_POPULATE, fd, IORING_OFF_SQES);
	if (sq->sqes == MAP_FAILED) {
		ret = -errno;
err:
		munmap(sq->khead, sq->ring_sz);
		return ret;
	}

	cq->ring_sz = p->cq_off.cqes + p->cq_entries * sizeof(struct io_uring_cqe);
	ptr = mmap(0, cq->ring_sz, PROT_READ | PROT_WRITE,
		   MAP_SHARED | MAP_POPULATE, fd, IORING_OFF_CQ_RING);
	if (ptr == MAP_FAILED) {
		ret = -errno;
		munmap(sq->sqes, p->sq_entries * sizeof(struct io_uring_sqe));
		goto err;
	}
	cq->khead = ptr + p->cq_off.head;
	cq->ktail = ptr + p->cq_off.tail;
	cq->kring_mask = ptr + p->cq_off.ring_mask;
	cq->kring_entries = ptr + p->cq_off.ring_entries;
	cq->koverflow = ptr + p->cq_off.overflow;
	cq->cqes = ptr + p->cq_off.cqes;
	return 0;
}

/* Raw system call wrappers. */
static inline int io_uring_setup(unsigned int entries,
				 struct io_uring_params *p)
{
	return syscall(__NR_io_uring_setup, entries, p);
}

static inline int io_uring_enter(int fd, unsigned int to_submit,
				 unsigned int min_complete,
				 unsigned int flags, sigset_t *sig)
{
	return syscall(__NR_io_uring_enter, fd, to_submit, min_complete,
		       flags, sig, _NSIG / 8);
}
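/*
 * Illustrative sketch (not part of the original header): the raw pair above
 * can be called directly, but the helpers below wrap the common sequence:
 *
 *	struct io_uring_params p;
 *	int fd;
 *
 *	memset(&p, 0, sizeof(p));
 *	fd = io_uring_setup(64, &p);	// ring fd, or -1 with errno set
 *	...				// map rings via io_uring_mmap()
 *	io_uring_enter(fd, to_submit, 0, IORING_ENTER_GETEVENTS, NULL);
 */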
static inline int io_uring_queue_init_params(unsigned int entries,
					     struct io_uring *ring,
					     struct io_uring_params *p)
{
	int fd, ret;

	memset(ring, 0, sizeof(*ring));

	fd = io_uring_setup(entries, p);
	if (fd < 0)
		return fd;
	ret = io_uring_mmap(fd, p, &ring->sq, &ring->cq);
	if (!ret) {
		ring->ring_fd = fd;
		ring->flags = p->flags;
	} else {
		close(fd);
	}
	return ret;
}

static inline int io_uring_queue_init(unsigned int entries,
				      struct io_uring *ring,
				      unsigned int flags)
{
	struct io_uring_params p;

	memset(&p, 0, sizeof(p));
	p.flags = flags;

	return io_uring_queue_init_params(entries, ring, &p);
}

/* Get a sqe */
static inline struct io_uring_sqe *io_uring_get_sqe(struct io_uring *ring)
{
	struct io_uring_sq *sq = &ring->sq;

	if (sq->sqe_tail + 1 - sq->sqe_head > *sq->kring_entries)
		return NULL;
	return &sq->sqes[sq->sqe_tail++ & *sq->kring_mask];
}

/* Spin on the CQ tail, entering the kernel to wait while the ring is empty. */
static inline int io_uring_wait_cqe(struct io_uring *ring,
				    struct io_uring_cqe **cqe_ptr)
{
	struct io_uring_cq *cq = &ring->cq;
	const unsigned int mask = *cq->kring_mask;
	unsigned int head = *cq->khead;
	int ret;

	*cqe_ptr = NULL;
	do {
		read_barrier();
		if (head != *cq->ktail) {
			*cqe_ptr = &cq->cqes[head & mask];
			break;
		}
		ret = io_uring_enter(ring->ring_fd, 0, 1,
				     IORING_ENTER_GETEVENTS, NULL);
		if (ret < 0)
			return -errno;
	} while (1);

	return 0;
}

static inline int io_uring_submit(struct io_uring *ring)
{
	struct io_uring_sq *sq = &ring->sq;
	const unsigned int mask = *sq->kring_mask;
	unsigned int ktail, submitted, to_submit;
	int ret;

	read_barrier();
	/* Entries are still pending in the kernel ring; just flush them. */
	if (*sq->khead != *sq->ktail) {
		submitted = *sq->kring_entries;
		goto submit;
	}
	if (sq->sqe_head == sq->sqe_tail)
		return 0;

	ktail = *sq->ktail;
	to_submit = sq->sqe_tail - sq->sqe_head;

	/* Fill the kernel SQ array with the indices of the queued sqes. */
	if (!(ring->flags & IORING_SETUP_NO_SQARRAY)) {
		for (submitted = 0; submitted < to_submit; submitted++) {
			read_barrier();
			sq->array[ktail++ & mask] = sq->sqe_head++ & mask;
		}
	} else {
		ktail += to_submit;
		sq->sqe_head += to_submit;
		submitted = to_submit;
	}

	if (!submitted)
		return 0;

	if (*sq->ktail != ktail) {
		write_barrier();
		*sq->ktail = ktail;
		write_barrier();
	}
submit:
	ret = io_uring_enter(ring->ring_fd, submitted, 0,
			     IORING_ENTER_GETEVENTS, NULL);
	return ret < 0 ? -errno : ret;
}

static inline void io_uring_queue_exit(struct io_uring *ring)
{
	struct io_uring_sq *sq = &ring->sq;

	munmap(sq->sqes, *sq->kring_entries * sizeof(struct io_uring_sqe));
	munmap(sq->khead, sq->ring_sz);
	close(ring->ring_fd);
}

/* Prepare and send the SQE */
static inline void io_uring_prep_cmd(struct io_uring_sqe *sqe, int op,
				     int sockfd,
				     int level, int optname,
				     const void *optval,
				     int optlen)
{
	memset(sqe, 0, sizeof(*sqe));
	sqe->opcode = (__u8)IORING_OP_URING_CMD;
	sqe->fd = sockfd;
	sqe->cmd_op = op;

	sqe->level = level;
	sqe->optname = optname;
	sqe->optval = (unsigned long long)optval;
	sqe->optlen = optlen;
}

static inline int io_uring_register_buffers(struct io_uring *ring,
					    const struct iovec *iovecs,
					    unsigned int nr_iovecs)
{
	int ret;

	ret = syscall(__NR_io_uring_register, ring->ring_fd,
		      IORING_REGISTER_BUFFERS, iovecs, nr_iovecs);
	return (ret < 0) ? -errno : ret;
}
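/*
 * Illustrative sketch (not part of the original header): registering a
 * single fixed buffer. "ring" and "buf" are assumed to exist in the caller.
 *
 *	struct iovec iov = {
 *		.iov_base = buf,
 *		.iov_len = sizeof(buf),
 *	};
 *
 *	if (io_uring_register_buffers(&ring, &iov, 1) < 0)
 *		perror("io_uring_register_buffers");
 */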
static inline void io_uring_prep_send(struct io_uring_sqe *sqe, int sockfd,
				      const void *buf, size_t len, int flags)
{
	memset(sqe, 0, sizeof(*sqe));
	sqe->opcode = (__u8)IORING_OP_SEND;
	sqe->fd = sockfd;
	sqe->addr = (unsigned long)buf;
	sqe->len = len;
	sqe->msg_flags = (__u32)flags;
}

static inline void io_uring_prep_sendzc(struct io_uring_sqe *sqe, int sockfd,
					const void *buf, size_t len, int flags,
					unsigned int zc_flags)
{
	io_uring_prep_send(sqe, sockfd, buf, len, flags);
	sqe->opcode = (__u8)IORING_OP_SEND_ZC;
	sqe->ioprio = zc_flags;
}

static inline void io_uring_cqe_seen(struct io_uring *ring)
{
	*(&ring->cq)->khead += 1;
	write_barrier();
}
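/*
 * End-to-end usage sketch (illustrative only, not part of the original
 * header): sending over an already-connected socket "sockfd" with this
 * mini API. Error handling is abbreviated.
 *
 *	struct io_uring ring;
 *	struct io_uring_sqe *sqe;
 *	struct io_uring_cqe *cqe;
 *	char buf[] = "hello";
 *
 *	if (io_uring_queue_init(8, &ring, 0) < 0)
 *		return -1;
 *	sqe = io_uring_get_sqe(&ring);
 *	io_uring_prep_send(sqe, sockfd, buf, sizeof(buf), 0);
 *	io_uring_submit(&ring);
 *	io_uring_wait_cqe(&ring, &cqe);
 *	if (cqe->res < 0)
 *		fprintf(stderr, "send failed: %d\n", cqe->res);
 *	io_uring_cqe_seen(&ring);
 *	io_uring_queue_exit(&ring);
 */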