/* SPDX-License-Identifier: (GPL-2.0 WITH Linux-syscall-note) OR MIT */
/*
 * Header file for the io_uring interface.
 *
 * Copyright (C) 2019 Jens Axboe
 * Copyright (C) 2019 Christoph Hellwig
 */
#ifndef LINUX_IO_URING_H
#define LINUX_IO_URING_H

#include <linux/fs.h>
#include <linux/types.h>

/*
 * IO submission data structure (Submission Queue Entry)
 */
struct io_uring_sqe {
	__u8	opcode;		/* type of operation for this sqe */
	__u8	flags;		/* IOSQE_ flags */
	__u16	ioprio;		/* ioprio for the request */
	__s32	fd;		/* file descriptor to do IO on */
	union {
		__u64	off;	/* offset into file */
		__u64	addr2;
	};
	union {
		__u64	addr;	/* pointer to buffer or iovecs */
		__u64	splice_off_in;
	};
	__u32	len;		/* buffer size or number of iovecs */
	union {
		__kernel_rwf_t	rw_flags;
		__u32		fsync_flags;
		__u16		poll_events;	/* compatibility */
		__u32		poll32_events;	/* word-reversed for BE */
		__u32		sync_range_flags;
		__u32		msg_flags;
		__u32		timeout_flags;
		__u32		accept_flags;
		__u32		cancel_flags;
		__u32		open_flags;
		__u32		statx_flags;
		__u32		fadvise_advice;
		__u32		splice_flags;
		__u32		rename_flags;
		__u32		unlink_flags;
	};
	__u64	user_data;	/* data to be passed back at completion time */
	/* pack this to avoid bogus arm OABI complaints */
	union {
		/* index into fixed buffers, if used */
		__u16	buf_index;
		/* for grouped buffer selection */
		__u16	buf_group;
	} __attribute__((packed));
	/* personality to use, if used */
	__u16	personality;
	__s32	splice_fd_in;
	__u64	__pad2[2];
};
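
/*
 * Illustrative sketch (not part of the ABI): how an application might fill
 * an SQE for a vectored read.  "sqe" is assumed to point at a free entry in
 * the mmap'ed SQE array; publishing its index in the SQ ring and calling
 * io_uring_enter(2) are separate steps.
 *
 *	struct iovec iov = { .iov_base = buf, .iov_len = buflen };
 *
 *	memset(sqe, 0, sizeof(*sqe));
 *	sqe->opcode    = IORING_OP_READV;
 *	sqe->fd        = fd;
 *	sqe->addr      = (unsigned long) &iov;
 *	sqe->len       = 1;
 *	sqe->off       = 0;
 *	sqe->user_data = 0x1234;
 */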

enum {
	IOSQE_FIXED_FILE_BIT,
	IOSQE_IO_DRAIN_BIT,
	IOSQE_IO_LINK_BIT,
	IOSQE_IO_HARDLINK_BIT,
	IOSQE_ASYNC_BIT,
	IOSQE_BUFFER_SELECT_BIT,
};

/*
 * sqe->flags
 */
/* use fixed fileset */
#define IOSQE_FIXED_FILE	(1U << IOSQE_FIXED_FILE_BIT)
/* issue after inflight IO */
#define IOSQE_IO_DRAIN		(1U << IOSQE_IO_DRAIN_BIT)
/* links next sqe */
#define IOSQE_IO_LINK		(1U << IOSQE_IO_LINK_BIT)
/* like LINK, but stronger */
#define IOSQE_IO_HARDLINK	(1U << IOSQE_IO_HARDLINK_BIT)
/* always go async */
#define IOSQE_ASYNC		(1U << IOSQE_ASYNC_BIT)
/* select buffer from sqe->buf_group */
#define IOSQE_BUFFER_SELECT	(1U << IOSQE_BUFFER_SELECT_BIT)
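
/*
 * Illustrative sketch (assumed usage, not mandated by this header): chaining
 * a write and an fsync so the fsync only runs after the write completes.
 * Only the flag usage is shown; the rest of each SQE is filled as usual.
 *
 *	write_sqe->opcode = IORING_OP_WRITEV;
 *	write_sqe->flags |= IOSQE_IO_LINK;	link to the next SQE
 *
 *	fsync_sqe->opcode = IORING_OP_FSYNC;	runs only if the write succeeds
 */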

/*
 * io_uring_setup() flags
 */
#define IORING_SETUP_IOPOLL	(1U << 0)	/* io_context is polled */
#define IORING_SETUP_SQPOLL	(1U << 1)	/* SQ poll thread */
#define IORING_SETUP_SQ_AFF	(1U << 2)	/* sq_thread_cpu is valid */
#define IORING_SETUP_CQSIZE	(1U << 3)	/* app defines CQ size */
#define IORING_SETUP_CLAMP	(1U << 4)	/* clamp SQ/CQ ring sizes */
#define IORING_SETUP_ATTACH_WQ	(1U << 5)	/* attach to existing wq */
#define IORING_SETUP_R_DISABLED	(1U << 6)	/* start with ring disabled */
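
/*
 * Illustrative sketch: requesting a larger CQ ring at setup time.  A wrapper
 * around the raw io_uring_setup(2) syscall is assumed to be provided by the
 * application or a library such as liburing.
 *
 *	struct io_uring_params p = { 0 };
 *
 *	p.flags = IORING_SETUP_CQSIZE | IORING_SETUP_CLAMP;
 *	p.cq_entries = 4096;
 *	ring_fd = io_uring_setup(256, &p);	256 SQ entries requested
 */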

enum {
	IORING_OP_NOP,
	IORING_OP_READV,
	IORING_OP_WRITEV,
	IORING_OP_FSYNC,
	IORING_OP_READ_FIXED,
	IORING_OP_WRITE_FIXED,
	IORING_OP_POLL_ADD,
	IORING_OP_POLL_REMOVE,
	IORING_OP_SYNC_FILE_RANGE,
	IORING_OP_SENDMSG,
	IORING_OP_RECVMSG,
	IORING_OP_TIMEOUT,
	IORING_OP_TIMEOUT_REMOVE,
	IORING_OP_ACCEPT,
	IORING_OP_ASYNC_CANCEL,
	IORING_OP_LINK_TIMEOUT,
	IORING_OP_CONNECT,
	IORING_OP_FALLOCATE,
	IORING_OP_OPENAT,
	IORING_OP_CLOSE,
	IORING_OP_FILES_UPDATE,
	IORING_OP_STATX,
	IORING_OP_READ,
	IORING_OP_WRITE,
	IORING_OP_FADVISE,
	IORING_OP_MADVISE,
	IORING_OP_SEND,
	IORING_OP_RECV,
	IORING_OP_OPENAT2,
	IORING_OP_EPOLL_CTL,
	IORING_OP_SPLICE,
	IORING_OP_PROVIDE_BUFFERS,
	IORING_OP_REMOVE_BUFFERS,
	IORING_OP_TEE,
	IORING_OP_SHUTDOWN,
	IORING_OP_RENAMEAT,
	IORING_OP_UNLINKAT,
	IORING_OP_MKDIRAT,

	/* this goes last, obviously */
	IORING_OP_LAST,
};

/*
 * sqe->fsync_flags
 */
#define IORING_FSYNC_DATASYNC	(1U << 0)

/*
 * sqe->timeout_flags
 */
#define IORING_TIMEOUT_ABS	(1U << 0)
#define IORING_TIMEOUT_UPDATE	(1U << 1)

/*
 * sqe->splice_flags
 * extends splice(2) flags
 */
#define SPLICE_F_FD_IN_FIXED	(1U << 31) /* the last bit of __u32 */

/*
 * POLL_ADD flags. Note that since sqe->poll_events is the flag space, the
 * command flags for POLL_ADD are stored in sqe->len.
 *
 * IORING_POLL_ADD_MULTI	Multishot poll. Sets IORING_CQE_F_MORE if
 *				the poll handler will continue to report
 *				CQEs on behalf of the same SQE.
 *
 * IORING_POLL_UPDATE		Update existing poll request, matching
 *				sqe->addr as the old user_data field.
 */
#define IORING_POLL_ADD_MULTI	(1U << 0)
#define IORING_POLL_UPDATE_EVENTS	(1U << 1)
#define IORING_POLL_UPDATE_USER_DATA	(1U << 2)
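
/*
 * Illustrative sketch: arming a multishot poll on a socket.  poll32_events
 * is used here, which assumes the kernel advertises IORING_FEAT_POLL_32BITS;
 * older kernels take the events in the 16-bit poll_events field instead.
 * POLLIN comes from <poll.h>.
 *
 *	sqe->opcode        = IORING_OP_POLL_ADD;
 *	sqe->fd            = sockfd;
 *	sqe->poll32_events = POLLIN;
 *	sqe->len           = IORING_POLL_ADD_MULTI;
 *
 * Each readiness event then produces a CQE with IORING_CQE_F_MORE set until
 * the poll terminates or is cancelled.
 */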

/*
 * IO completion data structure (Completion Queue Entry)
 */
struct io_uring_cqe {
	__u64	user_data;	/* sqe->user_data value, passed back */
	__s32	res;		/* result code for this event */
	__u32	flags;
};

/*
 * cqe->flags
 *
 * IORING_CQE_F_BUFFER	If set, the upper 16 bits are the buffer ID
 * IORING_CQE_F_MORE	If set, parent SQE will generate more CQE entries
 */
#define IORING_CQE_F_BUFFER		(1U << 0)
#define IORING_CQE_F_MORE		(1U << 1)

enum {
	IORING_CQE_BUFFER_SHIFT		= 16,
};
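
/*
 * Illustrative sketch: recovering the provided-buffer ID from a completion
 * when IOSQE_BUFFER_SELECT was used on the submission side.
 *
 *	if (cqe->flags & IORING_CQE_F_BUFFER) {
 *		unsigned int bid = cqe->flags >> IORING_CQE_BUFFER_SHIFT;
 *		... data landed in the buffer provided under ID bid ...
 *	}
 */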

/*
 * Magic offsets for the application to mmap the data it needs
 */
#define IORING_OFF_SQ_RING		0ULL
#define IORING_OFF_CQ_RING		0x8000000ULL
#define IORING_OFF_SQES			0x10000000ULL

/*
 * Filled with the offset for mmap(2)
 */
struct io_sqring_offsets {
	__u32 head;
	__u32 tail;
	__u32 ring_mask;
	__u32 ring_entries;
	__u32 flags;
	__u32 dropped;
	__u32 array;
	__u32 resv1;
	__u64 resv2;
};
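
/*
 * Illustrative sketch: mapping the SQ ring and SQE array after setup.  "p"
 * is the io_uring_params filled in by io_uring_setup(2); error handling and
 * the IORING_FEAT_SINGLE_MMAP single-mapping optimisation are omitted.
 *
 *	sq_ptr = mmap(0, p.sq_off.array + p.sq_entries * sizeof(__u32),
 *		      PROT_READ | PROT_WRITE, MAP_SHARED | MAP_POPULATE,
 *		      ring_fd, IORING_OFF_SQ_RING);
 *	sqes   = mmap(0, p.sq_entries * sizeof(struct io_uring_sqe),
 *		      PROT_READ | PROT_WRITE, MAP_SHARED | MAP_POPULATE,
 *		      ring_fd, IORING_OFF_SQES);
 *
 *	sq_head = (unsigned *) ((char *) sq_ptr + p.sq_off.head);
 *	... likewise for tail, ring_mask, flags and array ...
 */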

/*
 * sq_ring->flags
 */
#define IORING_SQ_NEED_WAKEUP	(1U << 0) /* needs io_uring_enter wakeup */
#define IORING_SQ_CQ_OVERFLOW	(1U << 1) /* CQ ring is overflown */
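
/*
 * Illustrative sketch: with IORING_SETUP_SQPOLL, the application only needs
 * to enter the kernel once the poll thread has gone to sleep.  "sq_flags"
 * is assumed to point at the flags word in the mmap'ed SQ ring; a real
 * implementation reads it with the appropriate memory barriers, and a
 * wrapper around the io_uring_enter(2) syscall is assumed.
 *
 *	if (*sq_flags & IORING_SQ_NEED_WAKEUP)
 *		io_uring_enter(ring_fd, 0, 0, IORING_ENTER_SQ_WAKEUP, NULL);
 */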

struct io_cqring_offsets {
	__u32 head;
	__u32 tail;
	__u32 ring_mask;
	__u32 ring_entries;
	__u32 overflow;
	__u32 cqes;
	__u32 flags;
	__u32 resv1;
	__u64 resv2;
};

/*
 * cq_ring->flags
 */

/* disable eventfd notifications */
#define IORING_CQ_EVENTFD_DISABLED	(1U << 0)

/*
 * io_uring_enter(2) flags
 */
#define IORING_ENTER_GETEVENTS	(1U << 0)
#define IORING_ENTER_SQ_WAKEUP	(1U << 1)
#define IORING_ENTER_SQ_WAIT	(1U << 2)
#define IORING_ENTER_EXT_ARG	(1U << 3)
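
/*
 * Illustrative sketch: submitting pending SQEs and waiting for at least one
 * completion in a single call.  A thin wrapper around the io_uring_enter(2)
 * syscall (hypothetical name, as used by liburing) is assumed.
 *
 *	io_uring_enter(ring_fd, to_submit, 1, IORING_ENTER_GETEVENTS, NULL);
 */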

/*
 * Passed in for io_uring_setup(2). Copied back with updated info on success
 */
struct io_uring_params {
	__u32 sq_entries;
	__u32 cq_entries;
	__u32 flags;
	__u32 sq_thread_cpu;
	__u32 sq_thread_idle;
	__u32 features;
	__u32 wq_fd;
	__u32 resv[3];
	struct io_sqring_offsets sq_off;
	struct io_cqring_offsets cq_off;
};

/*
 * io_uring_params->features flags
 */
#define IORING_FEAT_SINGLE_MMAP		(1U << 0)
#define IORING_FEAT_NODROP		(1U << 1)
#define IORING_FEAT_SUBMIT_STABLE	(1U << 2)
#define IORING_FEAT_RW_CUR_POS		(1U << 3)
#define IORING_FEAT_CUR_PERSONALITY	(1U << 4)
#define IORING_FEAT_FAST_POLL		(1U << 5)
#define IORING_FEAT_POLL_32BITS		(1U << 6)
#define IORING_FEAT_SQPOLL_NONFIXED	(1U << 7)
#define IORING_FEAT_EXT_ARG		(1U << 8)
#define IORING_FEAT_NATIVE_WORKERS	(1U << 9)
#define IORING_FEAT_RSRC_TAGS		(1U << 10)
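
/*
 * Illustrative sketch: feature bits are reported in io_uring_params.features
 * after a successful io_uring_setup(2) and can gate optional behaviour.
 *
 *	if (p.features & IORING_FEAT_SINGLE_MMAP) {
 *		... map SQ and CQ rings with a single mmap() call ...
 *	}
 *	if (!(p.features & IORING_FEAT_FAST_POLL)) {
 *		... e.g. fall back to an explicit IORING_OP_POLL_ADD ...
 *	}
 */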

/*
 * io_uring_register(2) opcodes and arguments
 */
enum {
	IORING_REGISTER_BUFFERS			= 0,
	IORING_UNREGISTER_BUFFERS		= 1,
	IORING_REGISTER_FILES			= 2,
	IORING_UNREGISTER_FILES			= 3,
	IORING_REGISTER_EVENTFD			= 4,
	IORING_UNREGISTER_EVENTFD		= 5,
	IORING_REGISTER_FILES_UPDATE		= 6,
	IORING_REGISTER_EVENTFD_ASYNC		= 7,
	IORING_REGISTER_PROBE			= 8,
	IORING_REGISTER_PERSONALITY		= 9,
	IORING_UNREGISTER_PERSONALITY		= 10,
	IORING_REGISTER_RESTRICTIONS		= 11,
	IORING_REGISTER_ENABLE_RINGS		= 12,

	/* extended with tagging */
	IORING_REGISTER_FILES2			= 13,
	IORING_REGISTER_FILES_UPDATE2		= 14,
	IORING_REGISTER_BUFFERS2		= 15,
	IORING_REGISTER_BUFFERS_UPDATE		= 16,

	/* set/clear io-wq thread affinities */
	IORING_REGISTER_IOWQ_AFF		= 17,
	IORING_UNREGISTER_IOWQ_AFF		= 18,

	/* this goes last */
	IORING_REGISTER_LAST
};
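
/*
 * Illustrative sketch: registering a fixed file table, which SQEs can then
 * reference by index with IOSQE_FIXED_FILE.  A wrapper around the
 * io_uring_register(2) syscall is assumed.
 *
 *	int fds[2] = { fd_a, fd_b };
 *
 *	io_uring_register(ring_fd, IORING_REGISTER_FILES, fds, 2);
 *	...
 *	sqe->fd = 1;			index of fd_b in the fixed table
 *	sqe->flags |= IOSQE_FIXED_FILE;
 */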

/* deprecated, see struct io_uring_rsrc_update */
struct io_uring_files_update {
	__u32 offset;
	__u32 resv;
	__aligned_u64 /* __s32 * */ fds;
};

struct io_uring_rsrc_register {
	__u32 nr;
	__u32 resv;
	__u64 resv2;
	__aligned_u64 data;
	__aligned_u64 tags;
};
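
/*
 * Illustrative sketch: the "2" register variants take this struct so
 * resources can be registered together with user-supplied tags (buffer i is
 * tagged with tags[i]; a tag of 0 requests no completion when that resource
 * is released).  "iovecs" and "tags" are hypothetical application arrays.
 *
 *	struct io_uring_rsrc_register reg = { 0 };
 *
 *	reg.nr   = nr_bufs;
 *	reg.data = (__u64) (unsigned long) iovecs;
 *	reg.tags = (__u64) (unsigned long) tags;
 *	io_uring_register(ring_fd, IORING_REGISTER_BUFFERS2, &reg, sizeof(reg));
 */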

struct io_uring_rsrc_update {
	__u32 offset;
	__u32 resv;
	__aligned_u64 data;
};

struct io_uring_rsrc_update2 {
	__u32 offset;
	__u32 resv;
	__aligned_u64 data;
	__aligned_u64 tags;
	__u32 nr;
	__u32 resv2;
};

/* Skip updating fd indexes set to this value in the fd table */
#define IORING_REGISTER_FILES_SKIP	(-2)

#define IO_URING_OP_SUPPORTED	(1U << 0)

struct io_uring_probe_op {
	__u8 op;
	__u8 resv;
	__u16 flags;	/* IO_URING_OP_* flags */
	__u32 resv2;
};

struct io_uring_probe {
	__u8 last_op;	/* last opcode supported */
	__u8 ops_len;	/* length of ops[] array below */
	__u16 resv;
	__u32 resv2[3];
	struct io_uring_probe_op ops[0];
};
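
/*
 * Illustrative sketch: probing which opcodes the running kernel supports.
 * The probe structure is followed by "ops_len" entries, so it is allocated
 * with room for every opcode up to IORING_OP_LAST.
 *
 *	struct io_uring_probe *probe;
 *
 *	probe = calloc(1, sizeof(*probe) +
 *			  IORING_OP_LAST * sizeof(struct io_uring_probe_op));
 *	io_uring_register(ring_fd, IORING_REGISTER_PROBE, probe, IORING_OP_LAST);
 *
 *	supported = probe->ops_len > IORING_OP_OPENAT2 &&
 *		    (probe->ops[IORING_OP_OPENAT2].flags & IO_URING_OP_SUPPORTED);
 */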

struct io_uring_restriction {
	__u16 opcode;
	union {
		__u8 register_op; /* IORING_RESTRICTION_REGISTER_OP */
		__u8 sqe_op;      /* IORING_RESTRICTION_SQE_OP */
		__u8 sqe_flags;   /* IORING_RESTRICTION_SQE_FLAGS_* */
	};
	__u8 resv;
	__u32 resv2[3];
};

/*
 * io_uring_restriction->opcode values
 */
enum {
	/* Allow an io_uring_register(2) opcode */
	IORING_RESTRICTION_REGISTER_OP		= 0,

	/* Allow an sqe opcode */
	IORING_RESTRICTION_SQE_OP		= 1,

	/* Allow sqe flags */
	IORING_RESTRICTION_SQE_FLAGS_ALLOWED	= 2,

	/* Require sqe flags (these flags must be set on each submission) */
	IORING_RESTRICTION_SQE_FLAGS_REQUIRED	= 3,

	IORING_RESTRICTION_LAST
};
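
/*
 * Illustrative sketch: restrictions can only be installed while the ring is
 * still disabled (IORING_SETUP_R_DISABLED), after which the ring is enabled
 * with IORING_REGISTER_ENABLE_RINGS.  Here submissions are limited to the
 * vectored read/write opcodes.
 *
 *	struct io_uring_restriction res[2] = { };
 *
 *	res[0].opcode = IORING_RESTRICTION_SQE_OP;
 *	res[0].sqe_op = IORING_OP_READV;
 *	res[1].opcode = IORING_RESTRICTION_SQE_OP;
 *	res[1].sqe_op = IORING_OP_WRITEV;
 *
 *	io_uring_register(ring_fd, IORING_REGISTER_RESTRICTIONS, res, 2);
 *	io_uring_register(ring_fd, IORING_REGISTER_ENABLE_RINGS, NULL, 0);
 */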

struct io_uring_getevents_arg {
	__u64	sigmask;
	__u32	sigmask_sz;
	__u32	pad;
	__u64	ts;
};
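
/*
 * Illustrative sketch: with IORING_ENTER_EXT_ARG (advertised via
 * IORING_FEAT_EXT_ARG), the final argument of io_uring_enter(2) is this
 * struct instead of a bare sigset_t, which allows passing a wait timeout.
 * A syscall wrapper taking the argument pointer and its size as the last
 * two parameters is assumed (hypothetical name).
 *
 *	struct __kernel_timespec ts = { .tv_sec = 1 };
 *	struct io_uring_getevents_arg arg = { 0 };
 *
 *	arg.ts = (__u64) (unsigned long) &ts;
 *	io_uring_enter2(ring_fd, 0, 1,
 *			IORING_ENTER_GETEVENTS | IORING_ENTER_EXT_ARG,
 *			&arg, sizeof(arg));
 */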

#endif