Blame src/setup.c

Packit d3489f
/* SPDX-License-Identifier: MIT */
Packit d3489f
#include <sys/types.h>
Packit d3489f
#include <sys/stat.h>
Packit d3489f
#include <sys/mman.h>
Packit d3489f
#include <unistd.h>
Packit d3489f
#include <errno.h>
Packit d3489f
#include <string.h>
Packit d3489f
#include <stdlib.h>
Packit d3489f
Packit d3489f
#include "liburing/compat.h"
Packit d3489f
#include "liburing/io_uring.h"
Packit d3489f
#include "liburing.h"
Packit d3489f
Packit d3489f
#include "syscall.h"
Packit d3489f
Packit d3489f
static void io_uring_unmap_rings(struct io_uring_sq *sq, struct io_uring_cq *cq)
Packit d3489f
{
Packit d3489f
	munmap(sq->ring_ptr, sq->ring_sz);
Packit d3489f
	if (cq->ring_ptr && cq->ring_ptr != sq->ring_ptr)
Packit d3489f
		munmap(cq->ring_ptr, cq->ring_sz);
Packit d3489f
}
Packit d3489f
Packit d3489f
static int io_uring_mmap(int fd, struct io_uring_params *p,
Packit d3489f
			 struct io_uring_sq *sq, struct io_uring_cq *cq)
Packit d3489f
{
Packit d3489f
	size_t size;
Packit d3489f
	int ret;
Packit d3489f
Packit d3489f
	sq->ring_sz = p->sq_off.array + p->sq_entries * sizeof(unsigned);
Packit d3489f
	cq->ring_sz = p->cq_off.cqes + p->cq_entries * sizeof(struct io_uring_cqe);
Packit d3489f
Packit d3489f
	if (p->features & IORING_FEAT_SINGLE_MMAP) {
Packit d3489f
		if (cq->ring_sz > sq->ring_sz)
Packit d3489f
			sq->ring_sz = cq->ring_sz;
Packit d3489f
		cq->ring_sz = sq->ring_sz;
Packit d3489f
	}
Packit d3489f
	sq->ring_ptr = mmap(0, sq->ring_sz, PROT_READ | PROT_WRITE,
Packit d3489f
			MAP_SHARED | MAP_POPULATE, fd, IORING_OFF_SQ_RING);
Packit d3489f
	if (sq->ring_ptr == MAP_FAILED)
Packit d3489f
		return -errno;
Packit d3489f
Packit d3489f
	if (p->features & IORING_FEAT_SINGLE_MMAP) {
Packit d3489f
		cq->ring_ptr = sq->ring_ptr;
Packit d3489f
	} else {
Packit d3489f
		cq->ring_ptr = mmap(0, cq->ring_sz, PROT_READ | PROT_WRITE,
Packit d3489f
				MAP_SHARED | MAP_POPULATE, fd, IORING_OFF_CQ_RING);
Packit d3489f
		if (cq->ring_ptr == MAP_FAILED) {
Packit d3489f
			cq->ring_ptr = NULL;
Packit d3489f
			ret = -errno;
Packit d3489f
			goto err;
Packit d3489f
		}
Packit d3489f
	}
Packit d3489f
Packit d3489f
	sq->khead = sq->ring_ptr + p->sq_off.head;
Packit d3489f
	sq->ktail = sq->ring_ptr + p->sq_off.tail;
Packit d3489f
	sq->kring_mask = sq->ring_ptr + p->sq_off.ring_mask;
Packit d3489f
	sq->kring_entries = sq->ring_ptr + p->sq_off.ring_entries;
Packit d3489f
	sq->kflags = sq->ring_ptr + p->sq_off.flags;
Packit d3489f
	sq->kdropped = sq->ring_ptr + p->sq_off.dropped;
Packit d3489f
	sq->array = sq->ring_ptr + p->sq_off.array;
Packit d3489f
Packit d3489f
	size = p->sq_entries * sizeof(struct io_uring_sqe);
Packit d3489f
	sq->sqes = mmap(0, size, PROT_READ | PROT_WRITE,
Packit d3489f
				MAP_SHARED | MAP_POPULATE, fd,
Packit d3489f
				IORING_OFF_SQES);
Packit d3489f
	if (sq->sqes == MAP_FAILED) {
Packit d3489f
		ret = -errno;
Packit d3489f
err:
Packit d3489f
		io_uring_unmap_rings(sq, cq);
Packit d3489f
		return ret;
Packit d3489f
	}
Packit d3489f
Packit d3489f
	cq->khead = cq->ring_ptr + p->cq_off.head;
Packit d3489f
	cq->ktail = cq->ring_ptr + p->cq_off.tail;
Packit d3489f
	cq->kring_mask = cq->ring_ptr + p->cq_off.ring_mask;
Packit d3489f
	cq->kring_entries = cq->ring_ptr + p->cq_off.ring_entries;
Packit d3489f
	cq->koverflow = cq->ring_ptr + p->cq_off.overflow;
Packit d3489f
	cq->cqes = cq->ring_ptr + p->cq_off.cqes;
Packit d3489f
	if (p->cq_off.flags)
Packit d3489f
		cq->kflags = cq->ring_ptr + p->cq_off.flags;
Packit d3489f
	return 0;
Packit d3489f
}
Packit d3489f
Packit d3489f
/*
Packit d3489f
 * For users that want to specify sq_thread_cpu or sq_thread_idle, this
Packit d3489f
 * interface is a convenient helper for mmap()ing the rings.
Packit d3489f
 * Returns -errno on error, or zero on success.  On success, 'ring'
Packit d3489f
 * contains the necessary information to read/write to the rings.
Packit d3489f
 */
Packit d3489f
int io_uring_queue_mmap(int fd, struct io_uring_params *p, struct io_uring *ring)
Packit d3489f
{
Packit d3489f
	int ret;
Packit d3489f
Packit d3489f
	memset(ring, 0, sizeof(*ring));
Packit d3489f
	ret = io_uring_mmap(fd, p, &ring->sq, &ring->cq);
Packit d3489f
	if (!ret) {
Packit d3489f
		ring->flags = p->flags;
Packit d3489f
		ring->ring_fd = fd;
Packit d3489f
	}
Packit d3489f
	return ret;
Packit d3489f
}
Packit d3489f
Packit d3489f
/*
Packit d3489f
 * Ensure that the mmap'ed rings aren't available to a child after a fork(2).
Packit d3489f
 * This uses madvise(..., MADV_DONTFORK) on the mmap'ed ranges.
Packit d3489f
 */
Packit d3489f
int io_uring_ring_dontfork(struct io_uring *ring)
Packit d3489f
{
Packit d3489f
	size_t len;
Packit d3489f
	int ret;
Packit d3489f
Packit d3489f
	if (!ring->sq.ring_ptr || !ring->sq.sqes || !ring->cq.ring_ptr)
Packit d3489f
		return -EINVAL;
Packit d3489f
Packit d3489f
	len = *ring->sq.kring_entries * sizeof(struct io_uring_sqe);
Packit d3489f
	ret = madvise(ring->sq.sqes, len, MADV_DONTFORK);
Packit d3489f
	if (ret == -1)
Packit d3489f
		return -errno;
Packit d3489f
Packit d3489f
	len = ring->sq.ring_sz;
Packit d3489f
	ret = madvise(ring->sq.ring_ptr, len, MADV_DONTFORK);
Packit d3489f
	if (ret == -1)
Packit d3489f
		return -errno;
Packit d3489f
Packit d3489f
	if (ring->cq.ring_ptr != ring->sq.ring_ptr) {
Packit d3489f
		len = ring->cq.ring_sz;
Packit d3489f
		ret = madvise(ring->cq.ring_ptr, len, MADV_DONTFORK);
Packit d3489f
		if (ret == -1)
Packit d3489f
			return -errno;
Packit d3489f
	}
Packit d3489f
Packit d3489f
	return 0;
Packit d3489f
}
Packit d3489f
Packit d3489f
/*
 * Set up an io_uring instance with 'entries' entries and the parameters in
 * 'p', then map its rings into 'ring'.
 *
 * Returns 0 on success. Returns -errno if the setup call fails, or the error
 * from io_uring_queue_mmap() if mapping fails; in the latter case the newly
 * created descriptor is closed before returning.
 */
int io_uring_queue_init_params(unsigned entries, struct io_uring *ring,
			       struct io_uring_params *p)
{
	int ring_fd, err;

	ring_fd = __sys_io_uring_setup(entries, p);
	if (ring_fd < 0)
		return -errno;

	err = io_uring_queue_mmap(ring_fd, p, ring);
	if (err != 0)
		close(ring_fd);

	return err;
}
Packit d3489f
Packit d3489f
/*
Packit d3489f
 * Returns -errno on error, or zero on success. On success, 'ring'
Packit d3489f
 * contains the necessary information to read/write to the rings.
Packit d3489f
 */
Packit d3489f
int io_uring_queue_init(unsigned entries, struct io_uring *ring, unsigned flags)
Packit d3489f
{
Packit d3489f
	struct io_uring_params p;
Packit d3489f
Packit d3489f
	memset(&p, 0, sizeof(p));
Packit d3489f
	p.flags = flags;
Packit d3489f
Packit d3489f
	return io_uring_queue_init_params(entries, ring, &p);
Packit d3489f
}
Packit d3489f
Packit d3489f
void io_uring_queue_exit(struct io_uring *ring)
Packit d3489f
{
Packit d3489f
	struct io_uring_sq *sq = &ring->sq;
Packit d3489f
	struct io_uring_cq *cq = &ring->cq;
Packit d3489f
Packit d3489f
	munmap(sq->sqes, *sq->kring_entries * sizeof(struct io_uring_sqe));
Packit d3489f
	io_uring_unmap_rings(sq, cq);
Packit d3489f
	close(ring->ring_fd);
Packit d3489f
}
Packit d3489f
Packit d3489f
struct io_uring_probe *io_uring_get_probe_ring(struct io_uring *ring)
Packit d3489f
{
Packit d3489f
	struct io_uring_probe *probe;
Packit d3489f
	int r;
Packit d3489f
Packit d3489f
	size_t len = sizeof(*probe) + 256 * sizeof(struct io_uring_probe_op);
Packit d3489f
	probe = malloc(len);
Packit d3489f
	memset(probe, 0, len);
Packit d3489f
	r = io_uring_register_probe(ring, probe, 256);
Packit d3489f
	if (r < 0)
Packit d3489f
		goto fail;
Packit d3489f
Packit d3489f
	return probe;
Packit d3489f
fail:
Packit d3489f
	free(probe);
Packit d3489f
	return NULL;
Packit d3489f
}
Packit d3489f
Packit d3489f
struct io_uring_probe *io_uring_get_probe(void)
Packit d3489f
{
Packit d3489f
	struct io_uring ring;
Packit d3489f
	struct io_uring_probe* probe = NULL;
Packit d3489f
Packit d3489f
	int r = io_uring_queue_init(2, &ring, 0);
Packit d3489f
	if (r < 0)
Packit d3489f
		return NULL;
Packit d3489f
Packit d3489f
	probe = io_uring_get_probe_ring(&ring);
Packit d3489f
	io_uring_queue_exit(&ring);
Packit d3489f
	return probe;
Packit d3489f
}