1*25da2beaSAndroid Build Coastguard Worker /* SPDX-License-Identifier: MIT */
2*25da2beaSAndroid Build Coastguard Worker #define _DEFAULT_SOURCE
3*25da2beaSAndroid Build Coastguard Worker
4*25da2beaSAndroid Build Coastguard Worker #include "lib.h"
5*25da2beaSAndroid Build Coastguard Worker #include "syscall.h"
6*25da2beaSAndroid Build Coastguard Worker #include "liburing.h"
7*25da2beaSAndroid Build Coastguard Worker #include "int_flags.h"
8*25da2beaSAndroid Build Coastguard Worker #include "liburing/compat.h"
9*25da2beaSAndroid Build Coastguard Worker #include "liburing/io_uring.h"
10*25da2beaSAndroid Build Coastguard Worker
io_uring_unmap_rings(struct io_uring_sq * sq,struct io_uring_cq * cq)11*25da2beaSAndroid Build Coastguard Worker static void io_uring_unmap_rings(struct io_uring_sq *sq, struct io_uring_cq *cq)
12*25da2beaSAndroid Build Coastguard Worker {
13*25da2beaSAndroid Build Coastguard Worker __sys_munmap(sq->ring_ptr, sq->ring_sz);
14*25da2beaSAndroid Build Coastguard Worker if (cq->ring_ptr && cq->ring_ptr != sq->ring_ptr)
15*25da2beaSAndroid Build Coastguard Worker __sys_munmap(cq->ring_ptr, cq->ring_sz);
16*25da2beaSAndroid Build Coastguard Worker }
17*25da2beaSAndroid Build Coastguard Worker
io_uring_mmap(int fd,struct io_uring_params * p,struct io_uring_sq * sq,struct io_uring_cq * cq)18*25da2beaSAndroid Build Coastguard Worker static int io_uring_mmap(int fd, struct io_uring_params *p,
19*25da2beaSAndroid Build Coastguard Worker struct io_uring_sq *sq, struct io_uring_cq *cq)
20*25da2beaSAndroid Build Coastguard Worker {
21*25da2beaSAndroid Build Coastguard Worker size_t size;
22*25da2beaSAndroid Build Coastguard Worker int ret;
23*25da2beaSAndroid Build Coastguard Worker
24*25da2beaSAndroid Build Coastguard Worker size = sizeof(struct io_uring_cqe);
25*25da2beaSAndroid Build Coastguard Worker if (p->flags & IORING_SETUP_CQE32)
26*25da2beaSAndroid Build Coastguard Worker size += sizeof(struct io_uring_cqe);
27*25da2beaSAndroid Build Coastguard Worker
28*25da2beaSAndroid Build Coastguard Worker sq->ring_sz = p->sq_off.array + p->sq_entries * sizeof(unsigned);
29*25da2beaSAndroid Build Coastguard Worker cq->ring_sz = p->cq_off.cqes + p->cq_entries * size;
30*25da2beaSAndroid Build Coastguard Worker
31*25da2beaSAndroid Build Coastguard Worker if (p->features & IORING_FEAT_SINGLE_MMAP) {
32*25da2beaSAndroid Build Coastguard Worker if (cq->ring_sz > sq->ring_sz)
33*25da2beaSAndroid Build Coastguard Worker sq->ring_sz = cq->ring_sz;
34*25da2beaSAndroid Build Coastguard Worker cq->ring_sz = sq->ring_sz;
35*25da2beaSAndroid Build Coastguard Worker }
36*25da2beaSAndroid Build Coastguard Worker sq->ring_ptr = __sys_mmap(0, sq->ring_sz, PROT_READ | PROT_WRITE,
37*25da2beaSAndroid Build Coastguard Worker MAP_SHARED | MAP_POPULATE, fd,
38*25da2beaSAndroid Build Coastguard Worker IORING_OFF_SQ_RING);
39*25da2beaSAndroid Build Coastguard Worker if (IS_ERR(sq->ring_ptr))
40*25da2beaSAndroid Build Coastguard Worker return PTR_ERR(sq->ring_ptr);
41*25da2beaSAndroid Build Coastguard Worker
42*25da2beaSAndroid Build Coastguard Worker if (p->features & IORING_FEAT_SINGLE_MMAP) {
43*25da2beaSAndroid Build Coastguard Worker cq->ring_ptr = sq->ring_ptr;
44*25da2beaSAndroid Build Coastguard Worker } else {
45*25da2beaSAndroid Build Coastguard Worker cq->ring_ptr = __sys_mmap(0, cq->ring_sz, PROT_READ | PROT_WRITE,
46*25da2beaSAndroid Build Coastguard Worker MAP_SHARED | MAP_POPULATE, fd,
47*25da2beaSAndroid Build Coastguard Worker IORING_OFF_CQ_RING);
48*25da2beaSAndroid Build Coastguard Worker if (IS_ERR(cq->ring_ptr)) {
49*25da2beaSAndroid Build Coastguard Worker ret = PTR_ERR(cq->ring_ptr);
50*25da2beaSAndroid Build Coastguard Worker cq->ring_ptr = NULL;
51*25da2beaSAndroid Build Coastguard Worker goto err;
52*25da2beaSAndroid Build Coastguard Worker }
53*25da2beaSAndroid Build Coastguard Worker }
54*25da2beaSAndroid Build Coastguard Worker
55*25da2beaSAndroid Build Coastguard Worker sq->khead = sq->ring_ptr + p->sq_off.head;
56*25da2beaSAndroid Build Coastguard Worker sq->ktail = sq->ring_ptr + p->sq_off.tail;
57*25da2beaSAndroid Build Coastguard Worker sq->kring_mask = sq->ring_ptr + p->sq_off.ring_mask;
58*25da2beaSAndroid Build Coastguard Worker sq->kring_entries = sq->ring_ptr + p->sq_off.ring_entries;
59*25da2beaSAndroid Build Coastguard Worker sq->kflags = sq->ring_ptr + p->sq_off.flags;
60*25da2beaSAndroid Build Coastguard Worker sq->kdropped = sq->ring_ptr + p->sq_off.dropped;
61*25da2beaSAndroid Build Coastguard Worker sq->array = sq->ring_ptr + p->sq_off.array;
62*25da2beaSAndroid Build Coastguard Worker
63*25da2beaSAndroid Build Coastguard Worker size = sizeof(struct io_uring_sqe);
64*25da2beaSAndroid Build Coastguard Worker if (p->flags & IORING_SETUP_SQE128)
65*25da2beaSAndroid Build Coastguard Worker size += 64;
66*25da2beaSAndroid Build Coastguard Worker sq->sqes = __sys_mmap(0, size * p->sq_entries, PROT_READ | PROT_WRITE,
67*25da2beaSAndroid Build Coastguard Worker MAP_SHARED | MAP_POPULATE, fd, IORING_OFF_SQES);
68*25da2beaSAndroid Build Coastguard Worker if (IS_ERR(sq->sqes)) {
69*25da2beaSAndroid Build Coastguard Worker ret = PTR_ERR(sq->sqes);
70*25da2beaSAndroid Build Coastguard Worker err:
71*25da2beaSAndroid Build Coastguard Worker io_uring_unmap_rings(sq, cq);
72*25da2beaSAndroid Build Coastguard Worker return ret;
73*25da2beaSAndroid Build Coastguard Worker }
74*25da2beaSAndroid Build Coastguard Worker
75*25da2beaSAndroid Build Coastguard Worker cq->khead = cq->ring_ptr + p->cq_off.head;
76*25da2beaSAndroid Build Coastguard Worker cq->ktail = cq->ring_ptr + p->cq_off.tail;
77*25da2beaSAndroid Build Coastguard Worker cq->kring_mask = cq->ring_ptr + p->cq_off.ring_mask;
78*25da2beaSAndroid Build Coastguard Worker cq->kring_entries = cq->ring_ptr + p->cq_off.ring_entries;
79*25da2beaSAndroid Build Coastguard Worker cq->koverflow = cq->ring_ptr + p->cq_off.overflow;
80*25da2beaSAndroid Build Coastguard Worker cq->cqes = cq->ring_ptr + p->cq_off.cqes;
81*25da2beaSAndroid Build Coastguard Worker if (p->cq_off.flags)
82*25da2beaSAndroid Build Coastguard Worker cq->kflags = cq->ring_ptr + p->cq_off.flags;
83*25da2beaSAndroid Build Coastguard Worker return 0;
84*25da2beaSAndroid Build Coastguard Worker }
85*25da2beaSAndroid Build Coastguard Worker
86*25da2beaSAndroid Build Coastguard Worker /*
87*25da2beaSAndroid Build Coastguard Worker * For users that want to specify sq_thread_cpu or sq_thread_idle, this
88*25da2beaSAndroid Build Coastguard Worker * interface is a convenient helper for mmap()ing the rings.
89*25da2beaSAndroid Build Coastguard Worker * Returns -errno on error, or zero on success. On success, 'ring'
90*25da2beaSAndroid Build Coastguard Worker * contains the necessary information to read/write to the rings.
91*25da2beaSAndroid Build Coastguard Worker */
io_uring_queue_mmap(int fd,struct io_uring_params * p,struct io_uring * ring)92*25da2beaSAndroid Build Coastguard Worker int io_uring_queue_mmap(int fd, struct io_uring_params *p, struct io_uring *ring)
93*25da2beaSAndroid Build Coastguard Worker {
94*25da2beaSAndroid Build Coastguard Worker int ret;
95*25da2beaSAndroid Build Coastguard Worker
96*25da2beaSAndroid Build Coastguard Worker memset(ring, 0, sizeof(*ring));
97*25da2beaSAndroid Build Coastguard Worker ret = io_uring_mmap(fd, p, &ring->sq, &ring->cq);
98*25da2beaSAndroid Build Coastguard Worker if (!ret) {
99*25da2beaSAndroid Build Coastguard Worker ring->flags = p->flags;
100*25da2beaSAndroid Build Coastguard Worker ring->ring_fd = ring->enter_ring_fd = fd;
101*25da2beaSAndroid Build Coastguard Worker ring->int_flags = 0;
102*25da2beaSAndroid Build Coastguard Worker }
103*25da2beaSAndroid Build Coastguard Worker return ret;
104*25da2beaSAndroid Build Coastguard Worker }
105*25da2beaSAndroid Build Coastguard Worker
106*25da2beaSAndroid Build Coastguard Worker /*
107*25da2beaSAndroid Build Coastguard Worker * Ensure that the mmap'ed rings aren't available to a child after a fork(2).
108*25da2beaSAndroid Build Coastguard Worker * This uses madvise(..., MADV_DONTFORK) on the mmap'ed ranges.
109*25da2beaSAndroid Build Coastguard Worker */
io_uring_ring_dontfork(struct io_uring * ring)110*25da2beaSAndroid Build Coastguard Worker int io_uring_ring_dontfork(struct io_uring *ring)
111*25da2beaSAndroid Build Coastguard Worker {
112*25da2beaSAndroid Build Coastguard Worker size_t len;
113*25da2beaSAndroid Build Coastguard Worker int ret;
114*25da2beaSAndroid Build Coastguard Worker
115*25da2beaSAndroid Build Coastguard Worker if (!ring->sq.ring_ptr || !ring->sq.sqes || !ring->cq.ring_ptr)
116*25da2beaSAndroid Build Coastguard Worker return -EINVAL;
117*25da2beaSAndroid Build Coastguard Worker
118*25da2beaSAndroid Build Coastguard Worker len = sizeof(struct io_uring_sqe);
119*25da2beaSAndroid Build Coastguard Worker if (ring->flags & IORING_SETUP_SQE128)
120*25da2beaSAndroid Build Coastguard Worker len += 64;
121*25da2beaSAndroid Build Coastguard Worker len *= *ring->sq.kring_entries;
122*25da2beaSAndroid Build Coastguard Worker ret = __sys_madvise(ring->sq.sqes, len, MADV_DONTFORK);
123*25da2beaSAndroid Build Coastguard Worker if (ret < 0)
124*25da2beaSAndroid Build Coastguard Worker return ret;
125*25da2beaSAndroid Build Coastguard Worker
126*25da2beaSAndroid Build Coastguard Worker len = ring->sq.ring_sz;
127*25da2beaSAndroid Build Coastguard Worker ret = __sys_madvise(ring->sq.ring_ptr, len, MADV_DONTFORK);
128*25da2beaSAndroid Build Coastguard Worker if (ret < 0)
129*25da2beaSAndroid Build Coastguard Worker return ret;
130*25da2beaSAndroid Build Coastguard Worker
131*25da2beaSAndroid Build Coastguard Worker if (ring->cq.ring_ptr != ring->sq.ring_ptr) {
132*25da2beaSAndroid Build Coastguard Worker len = ring->cq.ring_sz;
133*25da2beaSAndroid Build Coastguard Worker ret = __sys_madvise(ring->cq.ring_ptr, len, MADV_DONTFORK);
134*25da2beaSAndroid Build Coastguard Worker if (ret < 0)
135*25da2beaSAndroid Build Coastguard Worker return ret;
136*25da2beaSAndroid Build Coastguard Worker }
137*25da2beaSAndroid Build Coastguard Worker
138*25da2beaSAndroid Build Coastguard Worker return 0;
139*25da2beaSAndroid Build Coastguard Worker }
140*25da2beaSAndroid Build Coastguard Worker
io_uring_queue_init_params(unsigned entries,struct io_uring * ring,struct io_uring_params * p)141*25da2beaSAndroid Build Coastguard Worker int io_uring_queue_init_params(unsigned entries, struct io_uring *ring,
142*25da2beaSAndroid Build Coastguard Worker struct io_uring_params *p)
143*25da2beaSAndroid Build Coastguard Worker {
144*25da2beaSAndroid Build Coastguard Worker int fd, ret;
145*25da2beaSAndroid Build Coastguard Worker
146*25da2beaSAndroid Build Coastguard Worker fd = ____sys_io_uring_setup(entries, p);
147*25da2beaSAndroid Build Coastguard Worker if (fd < 0)
148*25da2beaSAndroid Build Coastguard Worker return fd;
149*25da2beaSAndroid Build Coastguard Worker
150*25da2beaSAndroid Build Coastguard Worker ret = io_uring_queue_mmap(fd, p, ring);
151*25da2beaSAndroid Build Coastguard Worker if (ret) {
152*25da2beaSAndroid Build Coastguard Worker __sys_close(fd);
153*25da2beaSAndroid Build Coastguard Worker return ret;
154*25da2beaSAndroid Build Coastguard Worker }
155*25da2beaSAndroid Build Coastguard Worker
156*25da2beaSAndroid Build Coastguard Worker ring->features = p->features;
157*25da2beaSAndroid Build Coastguard Worker return 0;
158*25da2beaSAndroid Build Coastguard Worker }
159*25da2beaSAndroid Build Coastguard Worker
160*25da2beaSAndroid Build Coastguard Worker /*
161*25da2beaSAndroid Build Coastguard Worker * Returns -errno on error, or zero on success. On success, 'ring'
162*25da2beaSAndroid Build Coastguard Worker * contains the necessary information to read/write to the rings.
163*25da2beaSAndroid Build Coastguard Worker */
io_uring_queue_init(unsigned entries,struct io_uring * ring,unsigned flags)164*25da2beaSAndroid Build Coastguard Worker int io_uring_queue_init(unsigned entries, struct io_uring *ring, unsigned flags)
165*25da2beaSAndroid Build Coastguard Worker {
166*25da2beaSAndroid Build Coastguard Worker struct io_uring_params p;
167*25da2beaSAndroid Build Coastguard Worker
168*25da2beaSAndroid Build Coastguard Worker memset(&p, 0, sizeof(p));
169*25da2beaSAndroid Build Coastguard Worker p.flags = flags;
170*25da2beaSAndroid Build Coastguard Worker
171*25da2beaSAndroid Build Coastguard Worker return io_uring_queue_init_params(entries, ring, &p);
172*25da2beaSAndroid Build Coastguard Worker }
173*25da2beaSAndroid Build Coastguard Worker
io_uring_queue_exit(struct io_uring * ring)174*25da2beaSAndroid Build Coastguard Worker void io_uring_queue_exit(struct io_uring *ring)
175*25da2beaSAndroid Build Coastguard Worker {
176*25da2beaSAndroid Build Coastguard Worker struct io_uring_sq *sq = &ring->sq;
177*25da2beaSAndroid Build Coastguard Worker struct io_uring_cq *cq = &ring->cq;
178*25da2beaSAndroid Build Coastguard Worker size_t sqe_size;
179*25da2beaSAndroid Build Coastguard Worker
180*25da2beaSAndroid Build Coastguard Worker sqe_size = sizeof(struct io_uring_sqe);
181*25da2beaSAndroid Build Coastguard Worker if (ring->flags & IORING_SETUP_SQE128)
182*25da2beaSAndroid Build Coastguard Worker sqe_size += 64;
183*25da2beaSAndroid Build Coastguard Worker __sys_munmap(sq->sqes, sqe_size * *sq->kring_entries);
184*25da2beaSAndroid Build Coastguard Worker io_uring_unmap_rings(sq, cq);
185*25da2beaSAndroid Build Coastguard Worker /*
186*25da2beaSAndroid Build Coastguard Worker * Not strictly required, but frees up the slot we used now rather
187*25da2beaSAndroid Build Coastguard Worker * than at process exit time.
188*25da2beaSAndroid Build Coastguard Worker */
189*25da2beaSAndroid Build Coastguard Worker if (ring->int_flags & INT_FLAG_REG_RING)
190*25da2beaSAndroid Build Coastguard Worker io_uring_unregister_ring_fd(ring);
191*25da2beaSAndroid Build Coastguard Worker __sys_close(ring->ring_fd);
192*25da2beaSAndroid Build Coastguard Worker }
193*25da2beaSAndroid Build Coastguard Worker
io_uring_get_probe_ring(struct io_uring * ring)194*25da2beaSAndroid Build Coastguard Worker struct io_uring_probe *io_uring_get_probe_ring(struct io_uring *ring)
195*25da2beaSAndroid Build Coastguard Worker {
196*25da2beaSAndroid Build Coastguard Worker struct io_uring_probe *probe;
197*25da2beaSAndroid Build Coastguard Worker size_t len;
198*25da2beaSAndroid Build Coastguard Worker int r;
199*25da2beaSAndroid Build Coastguard Worker
200*25da2beaSAndroid Build Coastguard Worker len = sizeof(*probe) + 256 * sizeof(struct io_uring_probe_op);
201*25da2beaSAndroid Build Coastguard Worker probe = uring_malloc(len);
202*25da2beaSAndroid Build Coastguard Worker if (!probe)
203*25da2beaSAndroid Build Coastguard Worker return NULL;
204*25da2beaSAndroid Build Coastguard Worker memset(probe, 0, len);
205*25da2beaSAndroid Build Coastguard Worker
206*25da2beaSAndroid Build Coastguard Worker r = io_uring_register_probe(ring, probe, 256);
207*25da2beaSAndroid Build Coastguard Worker if (r >= 0)
208*25da2beaSAndroid Build Coastguard Worker return probe;
209*25da2beaSAndroid Build Coastguard Worker
210*25da2beaSAndroid Build Coastguard Worker uring_free(probe);
211*25da2beaSAndroid Build Coastguard Worker return NULL;
212*25da2beaSAndroid Build Coastguard Worker }
213*25da2beaSAndroid Build Coastguard Worker
io_uring_get_probe(void)214*25da2beaSAndroid Build Coastguard Worker struct io_uring_probe *io_uring_get_probe(void)
215*25da2beaSAndroid Build Coastguard Worker {
216*25da2beaSAndroid Build Coastguard Worker struct io_uring ring;
217*25da2beaSAndroid Build Coastguard Worker struct io_uring_probe *probe;
218*25da2beaSAndroid Build Coastguard Worker int r;
219*25da2beaSAndroid Build Coastguard Worker
220*25da2beaSAndroid Build Coastguard Worker r = io_uring_queue_init(2, &ring, 0);
221*25da2beaSAndroid Build Coastguard Worker if (r < 0)
222*25da2beaSAndroid Build Coastguard Worker return NULL;
223*25da2beaSAndroid Build Coastguard Worker
224*25da2beaSAndroid Build Coastguard Worker probe = io_uring_get_probe_ring(&ring);
225*25da2beaSAndroid Build Coastguard Worker io_uring_queue_exit(&ring);
226*25da2beaSAndroid Build Coastguard Worker return probe;
227*25da2beaSAndroid Build Coastguard Worker }
228*25da2beaSAndroid Build Coastguard Worker
io_uring_free_probe(struct io_uring_probe * probe)229*25da2beaSAndroid Build Coastguard Worker void io_uring_free_probe(struct io_uring_probe *probe)
230*25da2beaSAndroid Build Coastguard Worker {
231*25da2beaSAndroid Build Coastguard Worker uring_free(probe);
232*25da2beaSAndroid Build Coastguard Worker }
233*25da2beaSAndroid Build Coastguard Worker
__fls(int x)234*25da2beaSAndroid Build Coastguard Worker static inline int __fls(int x)
235*25da2beaSAndroid Build Coastguard Worker {
236*25da2beaSAndroid Build Coastguard Worker if (!x)
237*25da2beaSAndroid Build Coastguard Worker return 0;
238*25da2beaSAndroid Build Coastguard Worker return 8 * sizeof(x) - __builtin_clz(x);
239*25da2beaSAndroid Build Coastguard Worker }
240*25da2beaSAndroid Build Coastguard Worker
roundup_pow2(unsigned depth)241*25da2beaSAndroid Build Coastguard Worker static unsigned roundup_pow2(unsigned depth)
242*25da2beaSAndroid Build Coastguard Worker {
243*25da2beaSAndroid Build Coastguard Worker return 1UL << __fls(depth - 1);
244*25da2beaSAndroid Build Coastguard Worker }
245*25da2beaSAndroid Build Coastguard Worker
npages(size_t size,unsigned page_size)246*25da2beaSAndroid Build Coastguard Worker static size_t npages(size_t size, unsigned page_size)
247*25da2beaSAndroid Build Coastguard Worker {
248*25da2beaSAndroid Build Coastguard Worker size--;
249*25da2beaSAndroid Build Coastguard Worker size /= page_size;
250*25da2beaSAndroid Build Coastguard Worker return __fls(size);
251*25da2beaSAndroid Build Coastguard Worker }
252*25da2beaSAndroid Build Coastguard Worker
253*25da2beaSAndroid Build Coastguard Worker #define KRING_SIZE 320
254*25da2beaSAndroid Build Coastguard Worker
rings_size(struct io_uring_params * p,unsigned entries,unsigned cq_entries,unsigned page_size)255*25da2beaSAndroid Build Coastguard Worker static size_t rings_size(struct io_uring_params *p, unsigned entries,
256*25da2beaSAndroid Build Coastguard Worker unsigned cq_entries, unsigned page_size)
257*25da2beaSAndroid Build Coastguard Worker {
258*25da2beaSAndroid Build Coastguard Worker size_t pages, sq_size, cq_size;
259*25da2beaSAndroid Build Coastguard Worker
260*25da2beaSAndroid Build Coastguard Worker cq_size = sizeof(struct io_uring_cqe);
261*25da2beaSAndroid Build Coastguard Worker if (p->flags & IORING_SETUP_CQE32)
262*25da2beaSAndroid Build Coastguard Worker cq_size += sizeof(struct io_uring_cqe);
263*25da2beaSAndroid Build Coastguard Worker cq_size *= cq_entries;
264*25da2beaSAndroid Build Coastguard Worker cq_size += KRING_SIZE;
265*25da2beaSAndroid Build Coastguard Worker cq_size = (cq_size + 63) & ~63UL;
266*25da2beaSAndroid Build Coastguard Worker pages = (size_t) 1 << npages(cq_size, page_size);
267*25da2beaSAndroid Build Coastguard Worker
268*25da2beaSAndroid Build Coastguard Worker sq_size = sizeof(struct io_uring_sqe);
269*25da2beaSAndroid Build Coastguard Worker if (p->flags & IORING_SETUP_SQE128)
270*25da2beaSAndroid Build Coastguard Worker sq_size += 64;
271*25da2beaSAndroid Build Coastguard Worker sq_size *= entries;
272*25da2beaSAndroid Build Coastguard Worker pages += (size_t) 1 << npages(sq_size, page_size);
273*25da2beaSAndroid Build Coastguard Worker return pages * page_size;
274*25da2beaSAndroid Build Coastguard Worker }
275*25da2beaSAndroid Build Coastguard Worker
276*25da2beaSAndroid Build Coastguard Worker #define KERN_MAX_ENTRIES 32768
277*25da2beaSAndroid Build Coastguard Worker #define KERN_MAX_CQ_ENTRIES (2 * KERN_MAX_ENTRIES)
278*25da2beaSAndroid Build Coastguard Worker
279*25da2beaSAndroid Build Coastguard Worker /*
280*25da2beaSAndroid Build Coastguard Worker * Return the required ulimit -l memlock memory required for a given ring
281*25da2beaSAndroid Build Coastguard Worker * setup, in bytes. May return -errno on error. On newer (5.12+) kernels,
282*25da2beaSAndroid Build Coastguard Worker * io_uring no longer requires any memlock memory, and hence this function
283*25da2beaSAndroid Build Coastguard Worker * will return 0 for that case. On older (5.11 and prior) kernels, this will
284*25da2beaSAndroid Build Coastguard Worker * return the required memory so that the caller can ensure that enough space
285*25da2beaSAndroid Build Coastguard Worker * is available before setting up a ring with the specified parameters.
286*25da2beaSAndroid Build Coastguard Worker */
io_uring_mlock_size_params(unsigned entries,struct io_uring_params * p)287*25da2beaSAndroid Build Coastguard Worker ssize_t io_uring_mlock_size_params(unsigned entries, struct io_uring_params *p)
288*25da2beaSAndroid Build Coastguard Worker {
289*25da2beaSAndroid Build Coastguard Worker struct io_uring_params lp = { };
290*25da2beaSAndroid Build Coastguard Worker struct io_uring ring;
291*25da2beaSAndroid Build Coastguard Worker unsigned cq_entries;
292*25da2beaSAndroid Build Coastguard Worker long page_size;
293*25da2beaSAndroid Build Coastguard Worker ssize_t ret;
294*25da2beaSAndroid Build Coastguard Worker
295*25da2beaSAndroid Build Coastguard Worker /*
296*25da2beaSAndroid Build Coastguard Worker * We only really use this inited ring to see if the kernel is newer
297*25da2beaSAndroid Build Coastguard Worker * or not. Newer kernels don't require memlocked memory. If we fail,
298*25da2beaSAndroid Build Coastguard Worker * it's most likely because it's an older kernel and we have no
299*25da2beaSAndroid Build Coastguard Worker * available memlock space. Just continue on, lp.features will still
300*25da2beaSAndroid Build Coastguard Worker * be zeroed at this point and we'll do the right thing.
301*25da2beaSAndroid Build Coastguard Worker */
302*25da2beaSAndroid Build Coastguard Worker ret = io_uring_queue_init_params(entries, &ring, &lp);
303*25da2beaSAndroid Build Coastguard Worker if (!ret)
304*25da2beaSAndroid Build Coastguard Worker io_uring_queue_exit(&ring);
305*25da2beaSAndroid Build Coastguard Worker
306*25da2beaSAndroid Build Coastguard Worker /*
307*25da2beaSAndroid Build Coastguard Worker * Native workers imply using cgroup memory accounting, and hence no
308*25da2beaSAndroid Build Coastguard Worker * memlock memory is needed for the ring allocations.
309*25da2beaSAndroid Build Coastguard Worker */
310*25da2beaSAndroid Build Coastguard Worker if (lp.features & IORING_FEAT_NATIVE_WORKERS)
311*25da2beaSAndroid Build Coastguard Worker return 0;
312*25da2beaSAndroid Build Coastguard Worker
313*25da2beaSAndroid Build Coastguard Worker if (!entries)
314*25da2beaSAndroid Build Coastguard Worker return -EINVAL;
315*25da2beaSAndroid Build Coastguard Worker if (entries > KERN_MAX_ENTRIES) {
316*25da2beaSAndroid Build Coastguard Worker if (!(p->flags & IORING_SETUP_CLAMP))
317*25da2beaSAndroid Build Coastguard Worker return -EINVAL;
318*25da2beaSAndroid Build Coastguard Worker entries = KERN_MAX_ENTRIES;
319*25da2beaSAndroid Build Coastguard Worker }
320*25da2beaSAndroid Build Coastguard Worker
321*25da2beaSAndroid Build Coastguard Worker entries = roundup_pow2(entries);
322*25da2beaSAndroid Build Coastguard Worker if (p->flags & IORING_SETUP_CQSIZE) {
323*25da2beaSAndroid Build Coastguard Worker if (!p->cq_entries)
324*25da2beaSAndroid Build Coastguard Worker return -EINVAL;
325*25da2beaSAndroid Build Coastguard Worker cq_entries = p->cq_entries;
326*25da2beaSAndroid Build Coastguard Worker if (cq_entries > KERN_MAX_CQ_ENTRIES) {
327*25da2beaSAndroid Build Coastguard Worker if (!(p->flags & IORING_SETUP_CLAMP))
328*25da2beaSAndroid Build Coastguard Worker return -EINVAL;
329*25da2beaSAndroid Build Coastguard Worker cq_entries = KERN_MAX_CQ_ENTRIES;
330*25da2beaSAndroid Build Coastguard Worker }
331*25da2beaSAndroid Build Coastguard Worker cq_entries = roundup_pow2(cq_entries);
332*25da2beaSAndroid Build Coastguard Worker if (cq_entries < entries)
333*25da2beaSAndroid Build Coastguard Worker return -EINVAL;
334*25da2beaSAndroid Build Coastguard Worker } else {
335*25da2beaSAndroid Build Coastguard Worker cq_entries = 2 * entries;
336*25da2beaSAndroid Build Coastguard Worker }
337*25da2beaSAndroid Build Coastguard Worker
338*25da2beaSAndroid Build Coastguard Worker page_size = get_page_size();
339*25da2beaSAndroid Build Coastguard Worker return rings_size(p, entries, cq_entries, page_size);
340*25da2beaSAndroid Build Coastguard Worker }
341*25da2beaSAndroid Build Coastguard Worker
342*25da2beaSAndroid Build Coastguard Worker /*
343*25da2beaSAndroid Build Coastguard Worker * Return required ulimit -l memory space for a given ring setup. See
344*25da2beaSAndroid Build Coastguard Worker * @io_uring_mlock_size_params().
345*25da2beaSAndroid Build Coastguard Worker */
io_uring_mlock_size(unsigned entries,unsigned flags)346*25da2beaSAndroid Build Coastguard Worker ssize_t io_uring_mlock_size(unsigned entries, unsigned flags)
347*25da2beaSAndroid Build Coastguard Worker {
348*25da2beaSAndroid Build Coastguard Worker struct io_uring_params p = { .flags = flags, };
349*25da2beaSAndroid Build Coastguard Worker
350*25da2beaSAndroid Build Coastguard Worker return io_uring_mlock_size_params(entries, &p);
351*25da2beaSAndroid Build Coastguard Worker }
352