/* SPDX-License-Identifier: GPL-2.0 WITH Linux-syscall-note */
#ifndef _UAPI_LINUX_FS_H
#define _UAPI_LINUX_FS_H

/*
 * This file has definitions for some important file table structures
 * and constants and structures used by various generic file system
 * ioctl's.  Please do not make any changes in this file before
 * sending patches for review to linux-fsdevel@vger.kernel.org and
 * linux-api@vger.kernel.org.
 */

#include <linux/limits.h>
#include <linux/ioctl.h>
#include <linux/types.h>
#ifndef __KERNEL__
#include <linux/fscrypt.h>
#endif

/* Use of MS_* flags within the kernel is restricted to core mount(2) code. */
#if !defined(__KERNEL__)
#include <linux/mount.h>
#endif

/*
 * It's silly to have NR_OPEN bigger than NR_FILE, but you can change
 * the file limit at runtime and only root can increase the per-process
 * nr_file rlimit, so it's safe to set up a ridiculously high absolute
 * upper limit on files-per-process.
 *
 * Some programs (notably those using select()) may have to be
 * recompiled to take full advantage of the new limits.
 */

/* Fixed constants first: */
#undef NR_OPEN
#define INR_OPEN_CUR 1024	/* Initial setting for nfile rlimits */
#define INR_OPEN_MAX 4096	/* Hard limit for nfile rlimits */

#define BLOCK_SIZE_BITS 10
#define BLOCK_SIZE (1<<BLOCK_SIZE_BITS)

/* flags for integrity meta */
#define IO_INTEGRITY_CHK_GUARD		(1U << 0) /* enforce guard check */
#define IO_INTEGRITY_CHK_REFTAG		(1U << 1) /* enforce ref check */
#define IO_INTEGRITY_CHK_APPTAG		(1U << 2) /* enforce app check */

/* Union of every IO_INTEGRITY_CHK_* flag defined above. */
#define IO_INTEGRITY_VALID_FLAGS (IO_INTEGRITY_CHK_GUARD | \
				  IO_INTEGRITY_CHK_REFTAG | \
				  IO_INTEGRITY_CHK_APPTAG)

#define SEEK_SET	0	/* seek relative to beginning of file */
#define SEEK_CUR	1	/* seek relative to current file position */
#define SEEK_END	2	/* seek relative to end of file */
#define SEEK_DATA	3	/* seek to the next data */
#define SEEK_HOLE	4	/* seek to the next hole */
#define SEEK_MAX	SEEK_HOLE

#define RENAME_NOREPLACE	(1 << 0)	/* Don't overwrite target */
#define RENAME_EXCHANGE		(1 << 1)	/* Exchange source and dest */
#define RENAME_WHITEOUT		(1 << 2)	/* Whiteout source */

/*
 * The root inode of procfs is guaranteed to always have the same inode number.
 * For programs that make heavy use of procfs, verifying that the root is a
 * real procfs root and using openat2(RESOLVE_{NO_{XDEV,MAGICLINKS},BENEATH})
 * will allow you to make sure you are never tricked into operating on the
 * wrong procfs file.
 */
enum procfs_ino {
	PROCFS_ROOT_INO = 1,
};

/* Argument structure of the FICLONERANGE ioctl (see its definition below). */
struct file_clone_range {
	__s64 src_fd;
	__u64 src_offset;
	__u64 src_length;
	__u64 dest_offset;
};

/* Argument structure of the FITRIM ioctl (see its definition below). */
struct fstrim_range {
	__u64 start;
	__u64 len;
	__u64 minlen;
};

/*
 * We include a length field because some filesystems (vfat) have an identifier
 * that we do want to expose as a UUID, but doesn't have the standard length.
 *
 * We use a fixed size buffer because this interface will, by fiat, never
 * support "UUIDs" longer than 16 bytes; we don't want to force all downstream
 * users to have to deal with that.
 *
 * This is the payload type of FS_IOC_GETFSUUID.
 */
struct fsuuid2 {
	__u8	len;
	__u8	uuid[16];
};

/* Payload type of FS_IOC_GETFSSYSFSPATH: a length plus a fixed-size name buffer. */
struct fs_sysfs_path {
	__u8			len;
	__u8			name[128];
};

/* Protection info capability flags */
#define	LBMD_PI_CAP_INTEGRITY		(1 << 0)
#define	LBMD_PI_CAP_REFTAG		(1 << 1)

/* Checksum types for Protection Information */
#define LBMD_PI_CSUM_NONE		0
#define LBMD_PI_CSUM_IP			1
#define LBMD_PI_CSUM_CRC16_T10DIF	2
#define LBMD_PI_CSUM_CRC64_NVME		4

/* sizeof first published struct */
#define LBMD_SIZE_VER0			16

/*
 * Logical block metadata capability descriptor
 * If the device does not support metadata, all the fields will be zero.
 * Applications must check lbmd_flags to determine whether metadata is
 * supported or not.
 *
 * This is the payload type of FS_IOC_GETLBMD_CAP.
 */
struct logical_block_metadata_cap {
	/* Bitmask of logical block metadata capability flags */
	__u32	lbmd_flags;
	/*
	 * The amount of data described by each unit of logical block
	 * metadata
	 */
	__u16	lbmd_interval;
	/*
	 * Size in bytes of the logical block metadata associated with each
	 * interval
	 */
	__u8	lbmd_size;
	/*
	 * Size in bytes of the opaque block tag associated with each
	 * interval
	 */
	__u8	lbmd_opaque_size;
	/*
	 * Offset in bytes of the opaque block tag within the logical block
	 * metadata
	 */
	__u8	lbmd_opaque_offset;
	/* Size in bytes of the T10 PI tuple associated with each interval */
	__u8	lbmd_pi_size;
	/* Offset in bytes of T10 PI tuple within the logical block metadata */
	__u8	lbmd_pi_offset;
	/* T10 PI guard tag type */
	__u8	lbmd_guard_tag_type;
	/* Size in bytes of the T10 PI application tag */
	__u8	lbmd_app_tag_size;
	/* Size in bytes of the T10 PI reference tag */
	__u8	lbmd_ref_tag_size;
	/* Size in bytes of the T10 PI storage tag */
	__u8	lbmd_storage_tag_size;
	__u8	pad;
};

/* extent-same (dedupe) ioctls; these MUST match the btrfs ioctl definitions */
#define FILE_DEDUPE_RANGE_SAME		0
#define FILE_DEDUPE_RANGE_DIFFERS	1

/* from struct btrfs_ioctl_file_extent_same_info */
struct file_dedupe_range_info {
	__s64 dest_fd;		/* in - destination file */
	__u64 dest_offset;	/* in - start of extent in destination */
	__u64 bytes_deduped;	/* out - total # of bytes we were able
				 * to dedupe from this file. */
	/* status of this dedupe operation:
	 * < 0 for error
	 * == FILE_DEDUPE_RANGE_SAME if dedupe succeeds
	 * == FILE_DEDUPE_RANGE_DIFFERS if data differs
	 */
	__s32 status;		/* out - see above description */
	__u32 reserved;		/* must be zero */
};

/* from struct btrfs_ioctl_file_extent_same_args */
struct file_dedupe_range {
	__u64 src_offset;	/* in - start of extent in source */
	__u64 src_length;	/* in - length of extent */
	__u16 dest_count;	/* in - total elements in info array */
	__u16 reserved1;	/* must be zero */
	__u32 reserved2;	/* must be zero */
	struct file_dedupe_range_info info[];
};

/* And dynamically-tunable limits and defaults: */
struct files_stat_struct {
	unsigned long nr_files;		/* read only */
	unsigned long nr_free_files;	/* read only */
	unsigned long max_files;		/* tunable */
};

struct inodes_stat_t {
	long nr_inodes;
	long nr_unused;
	long dummy[5];		/* padding for sysctl ABI compatibility */
};


#define NR_FILE  8192	/* this can well be larger on a larger system */

/*
 * Structure for FS_IOC_FSGETXATTR[A] and FS_IOC_FSSETXATTR.
 */
struct fsxattr {
	__u32		fsx_xflags;	/* xflags field value (get/set) */
	__u32		fsx_extsize;	/* extsize field value (get/set)*/
	__u32		fsx_nextents;	/* nextents field value (get)	*/
	__u32		fsx_projid;	/* project identifier (get/set) */
	__u32		fsx_cowextsize;	/* CoW extsize field value (get/set)*/
	unsigned char	fsx_pad[8];
};

/*
 * Variable size structure for file_[sg]et_attr().
 *
 * Note. This is alternative to the structure 'struct file_kattr'/'struct fsxattr'.
 * As this structure is passed to/from userspace with its size, this can
 * be versioned based on the size.
 */
struct file_attr {
	__u64 fa_xflags;	/* xflags field value (get/set) */
	__u32 fa_extsize;	/* extsize field value (get/set)*/
	__u32 fa_nextents;	/* nextents field value (get)   */
	__u32 fa_projid;	/* project identifier (get/set) */
	__u32 fa_cowextsize;	/* CoW extsize field value (get/set) */
};

/* Size in bytes of the first published layout of struct file_attr. */
#define FILE_ATTR_SIZE_VER0 24
#define FILE_ATTR_SIZE_LATEST FILE_ATTR_SIZE_VER0

/*
 * Flags for the fsx_xflags field
 */
#define FS_XFLAG_REALTIME	0x00000001	/* data in realtime volume */
#define FS_XFLAG_PREALLOC	0x00000002	/* preallocated file extents */
#define FS_XFLAG_IMMUTABLE	0x00000008	/* file cannot be modified */
#define FS_XFLAG_APPEND		0x00000010	/* all writes append */
#define FS_XFLAG_SYNC		0x00000020	/* all writes synchronous */
#define FS_XFLAG_NOATIME	0x00000040	/* do not update access time */
#define FS_XFLAG_NODUMP		0x00000080	/* do not include in backups */
#define FS_XFLAG_RTINHERIT	0x00000100	/* create with rt bit set */
#define FS_XFLAG_PROJINHERIT	0x00000200	/* create with parents projid */
#define FS_XFLAG_NOSYMLINKS	0x00000400	/* disallow symlink creation */
#define FS_XFLAG_EXTSIZE	0x00000800	/* extent size allocator hint */
#define FS_XFLAG_EXTSZINHERIT	0x00001000	/* inherit inode extent size */
#define FS_XFLAG_NODEFRAG	0x00002000	/* do not defragment */
#define FS_XFLAG_FILESTREAM	0x00004000	/* use filestream allocator */
#define FS_XFLAG_DAX		0x00008000	/* use DAX for IO */
#define FS_XFLAG_COWEXTSIZE	0x00010000	/* CoW extent size allocator hint */
#define FS_XFLAG_VERITY		0x00020000	/* fs-verity enabled */
#define FS_XFLAG_HASATTR	0x80000000	/* no DIFLAG for this	*/

/* the read-only stuff doesn't really belong here, but any other place is
   probably as bad and I don't want to create yet another include file. */

#define BLKROSET   _IO(0x12,93)	/* set device read-only (0 = read-write) */
#define BLKROGET   _IO(0x12,94)	/* get read-only status (0 = read-write) */
#define BLKRRPART  _IO(0x12,95)	/* re-read partition table */
#define BLKGETSIZE _IO(0x12,96)	/* return device size /512 (long *arg) */
#define BLKFLSBUF  _IO(0x12,97)	/* flush buffer cache */
#define BLKRASET   _IO(0x12,98)	/* set read ahead for block device */
#define BLKRAGET   _IO(0x12,99)	/* get current read ahead setting */
#define BLKFRASET  _IO(0x12,100)/* set filesystem (mm/filemap.c) read-ahead */
#define BLKFRAGET  _IO(0x12,101)/* get filesystem (mm/filemap.c) read-ahead */
#define BLKSECTSET _IO(0x12,102)/* set max sectors per request (ll_rw_blk.c) */
#define BLKSECTGET _IO(0x12,103)/* get max sectors per request (ll_rw_blk.c) */
#define BLKSSZGET  _IO(0x12,104)/* get block device sector size */
#if 0
#define BLKPG      _IO(0x12,105)/* See blkpg.h */

/* Some people are morons.  Do not use sizeof! */

#define BLKELVGET  _IOR(0x12,106,size_t)/* elevator get */
#define BLKELVSET  _IOW(0x12,107,size_t)/* elevator set */
/* This was here just to show that the number is taken -
   probably all these _IO(0x12,*) ioctls should be moved to blkpg.h. */
#endif
/* A jump here: 108-111 have been used for various private purposes. */
#define BLKBSZGET  _IOR(0x12,112,size_t)
#define BLKBSZSET  _IOW(0x12,113,size_t)
#define BLKGETSIZE64 _IOR(0x12,114,size_t)	/* return device size in bytes (u64 *arg) */
#define BLKTRACESETUP _IOWR(0x12,115,struct blk_user_trace_setup)
#define BLKTRACESTART _IO(0x12,116)
#define BLKTRACESTOP _IO(0x12,117)
#define BLKTRACETEARDOWN _IO(0x12,118)
#define BLKDISCARD _IO(0x12,119)
#define BLKIOMIN _IO(0x12,120)
#define BLKIOOPT _IO(0x12,121)
#define BLKALIGNOFF _IO(0x12,122)
#define BLKPBSZGET _IO(0x12,123)
#define BLKDISCARDZEROES _IO(0x12,124)
#define BLKSECDISCARD _IO(0x12,125)
#define BLKROTATIONAL _IO(0x12,126)
#define BLKZEROOUT _IO(0x12,127)
#define BLKGETDISKSEQ _IOR(0x12,128,__u64)
/* 130-136 and 142 are used by zoned block device ioctls (uapi/linux/blkzoned.h) */
/* 137-141 are used by blk-crypto ioctls (uapi/linux/blk-crypto.h) */
#define BLKTRACESETUP2 _IOWR(0x12, 142, struct blk_user_trace_setup2)

#define BMAP_IOCTL 1		/* obsolete - kept for compatibility */
#define FIBMAP	   _IO(0x00,1)	/* bmap access */
#define FIGETBSZ   _IO(0x00,2)	/* get the block size used for bmap */
#define FIFREEZE		_IOWR('X', 119, int)	/* Freeze */
#define FITHAW			_IOWR('X', 120, int)	/* Thaw */
#define FITRIM			_IOWR('X', 121, struct fstrim_range)	/* Trim */
#define FICLONE			_IOW(0x94, 9, int)
#define FICLONERANGE		_IOW(0x94, 13, struct file_clone_range)
#define FIDEDUPERANGE		_IOWR(0x94, 54, struct file_dedupe_range)

#define FSLABEL_MAX 256	/* Max chars for the interface; each fs may differ */

#define	FS_IOC_GETFLAGS			_IOR('f', 1, long)
#define	FS_IOC_SETFLAGS			_IOW('f', 2, long)
#define	FS_IOC_GETVERSION		_IOR('v', 1, long)
#define	FS_IOC_SETVERSION		_IOW('v', 2, long)
#define FS_IOC_FIEMAP			_IOWR('f', 11, struct fiemap)
#define FS_IOC32_GETFLAGS		_IOR('f', 1, int)
#define FS_IOC32_SETFLAGS		_IOW('f', 2, int)
#define FS_IOC32_GETVERSION		_IOR('v', 1, int)
#define FS_IOC32_SETVERSION		_IOW('v', 2, int)
#define FS_IOC_FSGETXATTR		_IOR('X', 31, struct fsxattr)
#define FS_IOC_FSSETXATTR		_IOW('X', 32, struct fsxattr)
#define FS_IOC_GETFSLABEL		_IOR(0x94, 49, char[FSLABEL_MAX])
#define FS_IOC_SETFSLABEL		_IOW(0x94, 50, char[FSLABEL_MAX])
/* Returns the external filesystem UUID, the same one blkid returns */
#define FS_IOC_GETFSUUID		_IOR(0x15, 0, struct fsuuid2)
/*
 * Returns the path component under /sys/fs/ that refers to this filesystem;
 * also /sys/kernel/debug/ for filesystems with debugfs exports
 */
#define FS_IOC_GETFSSYSFSPATH		_IOR(0x15, 1, struct fs_sysfs_path)
/* Get logical block metadata capability details */
#define FS_IOC_GETLBMD_CAP		_IOWR(0x15, 2, struct logical_block_metadata_cap)

/*
 * Inode flags (FS_IOC_GETFLAGS / FS_IOC_SETFLAGS)
 *
 * Note: for historical reasons, these flags were originally used and
 * defined for use by ext2/ext3, and then other file systems started
 * using these flags so they wouldn't need to write their own version
 * of chattr/lsattr (which was shipped as part of e2fsprogs).  You
 * should think twice before trying to use these flags in new
 * contexts, or trying to assign these flags, since they are used both
 * as the UAPI and the on-disk encoding for ext2/3/4.  Also, we are
 * almost out of 32-bit flags.  :-)
 *
 * We have recently hoisted FS_IOC_FSGETXATTR / FS_IOC_FSSETXATTR from
 * XFS to the generic FS level interface.  This uses a structure that
 * has padding and hence has more room to grow, so it may be more
 * appropriate for many new use cases.
 *
 * Please do not change these flags or interfaces before checking with
 * linux-fsdevel@vger.kernel.org and linux-api@vger.kernel.org.
 */
#define	FS_SECRM_FL			0x00000001 /* Secure deletion */
#define	FS_UNRM_FL			0x00000002 /* Undelete */
#define	FS_COMPR_FL			0x00000004 /* Compress file */
#define FS_SYNC_FL			0x00000008 /* Synchronous updates */
#define FS_IMMUTABLE_FL			0x00000010 /* Immutable file */
#define FS_APPEND_FL			0x00000020 /* writes to file may only append */
#define FS_NODUMP_FL			0x00000040 /* do not dump file */
#define FS_NOATIME_FL			0x00000080 /* do not update atime */
/* Reserved for compression usage... */
#define FS_DIRTY_FL			0x00000100
#define FS_COMPRBLK_FL			0x00000200 /* One or more compressed clusters */
#define FS_NOCOMP_FL			0x00000400 /* Don't compress */
/* End compression flags --- maybe not all used */
#define FS_ENCRYPT_FL			0x00000800 /* Encrypted file */
#define FS_BTREE_FL			0x00001000 /* btree format dir */
#define FS_INDEX_FL			0x00001000 /* hash-indexed directory */
#define FS_IMAGIC_FL			0x00002000 /* AFS directory */
#define FS_JOURNAL_DATA_FL		0x00004000 /* Reserved for ext3 */
#define FS_NOTAIL_FL			0x00008000 /* file tail should not be merged */
#define FS_DIRSYNC_FL			0x00010000 /* dirsync behaviour (directories only) */
#define FS_TOPDIR_FL			0x00020000 /* Top of directory hierarchies*/
#define FS_HUGE_FILE_FL			0x00040000 /* Reserved for ext4 */
#define FS_EXTENT_FL			0x00080000 /* Extents */
#define FS_VERITY_FL			0x00100000 /* Verity protected inode */
#define FS_EA_INODE_FL			0x00200000 /* Inode used for large EA */
#define FS_EOFBLOCKS_FL			0x00400000 /* Reserved for ext4 */
#define FS_NOCOW_FL			0x00800000 /* Do not cow file */
#define FS_DAX_FL			0x02000000 /* Inode is DAX */
#define FS_INLINE_DATA_FL		0x10000000 /* Reserved for ext4 */
#define FS_PROJINHERIT_FL		0x20000000 /* Create with parents projid */
#define FS_CASEFOLD_FL			0x40000000 /* Folder is case insensitive */
#define FS_RESERVED_FL			0x80000000 /* reserved for ext2 lib */

#define FS_FL_USER_VISIBLE		0x0003DFFF /* User visible flags */
#define FS_FL_USER_MODIFIABLE		0x000380FF /* User modifiable flags */


#define SYNC_FILE_RANGE_WAIT_BEFORE	1
#define SYNC_FILE_RANGE_WRITE		2
#define SYNC_FILE_RANGE_WAIT_AFTER	4
#define SYNC_FILE_RANGE_WRITE_AND_WAIT	(SYNC_FILE_RANGE_WRITE | \
					 SYNC_FILE_RANGE_WAIT_BEFORE | \
					 SYNC_FILE_RANGE_WAIT_AFTER)

/*
 * Flags for preadv2/pwritev2:
 */

typedef int __bitwise __kernel_rwf_t;

/* high priority request, poll if possible */
#define RWF_HIPRI	((__force __kernel_rwf_t)0x00000001)

/* per-IO O_DSYNC */
#define RWF_DSYNC	((__force __kernel_rwf_t)0x00000002)

/* per-IO O_SYNC */
#define RWF_SYNC	((__force __kernel_rwf_t)0x00000004)

/* per-IO, return -EAGAIN if operation would block */
#define RWF_NOWAIT	((__force __kernel_rwf_t)0x00000008)

/* per-IO O_APPEND */
#define RWF_APPEND	((__force __kernel_rwf_t)0x00000010)

/* per-IO negation of O_APPEND */
#define RWF_NOAPPEND	((__force __kernel_rwf_t)0x00000020)

/* Atomic Write */
#define RWF_ATOMIC	((__force __kernel_rwf_t)0x00000040)

/* buffered IO that drops the cache after reading or writing data */
#define RWF_DONTCACHE	((__force __kernel_rwf_t)0x00000080)

/* prevent pipe and socket writes from raising SIGPIPE */
#define RWF_NOSIGNAL	((__force __kernel_rwf_t)0x00000100)

/* mask of flags supported by the kernel */
#define RWF_SUPPORTED	(RWF_HIPRI | RWF_DSYNC | RWF_SYNC | RWF_NOWAIT |\
			 RWF_APPEND | RWF_NOAPPEND | RWF_ATOMIC |\
			 RWF_DONTCACHE | RWF_NOSIGNAL)

#define PROCFS_IOCTL_MAGIC 'f'

/* Pagemap ioctl */
#define PAGEMAP_SCAN	_IOWR(PROCFS_IOCTL_MAGIC, 16, struct pm_scan_arg)

/* Bitmasks provided in pm_scan_args masks and reported in page_region.categories. */
#define PAGE_IS_WPALLOWED	(1 << 0)
#define PAGE_IS_WRITTEN		(1 << 1)
#define PAGE_IS_FILE		(1 << 2)
#define PAGE_IS_PRESENT		(1 << 3)
#define PAGE_IS_SWAPPED		(1 << 4)
#define PAGE_IS_PFNZERO		(1 << 5)
#define PAGE_IS_HUGE		(1 << 6)
#define PAGE_IS_SOFT_DIRTY	(1 << 7)
#define PAGE_IS_GUARD		(1 << 8)

/*
 * struct page_region - Page region with flags
 * @start:	Start of the region
 * @end:	End of the region (exclusive)
 * @categories:	PAGE_IS_* category bitmask for the region
 */
struct page_region {
	__u64 start;
	__u64 end;
	__u64 categories;
};

/* Flags for PAGEMAP_SCAN ioctl */
#define PM_SCAN_WP_MATCHING	(1 << 0)	/* Write protect the pages matched. */
#define PM_SCAN_CHECK_WPASYNC	(1 << 1)	/* Abort the scan when a non-WP-enabled page is found. */

/*
 * struct pm_scan_arg - Pagemap ioctl argument
 * @size:		Size of the structure
 * @flags:		Flags for the IOCTL
 * @start:		Starting address of the region
 * @end:		Ending address of the region
 * @walk_end:		Address where the scan stopped (written by kernel).
 *			walk_end == end (address tags cleared) informs that the scan completed on entire range.
 * @vec:		Address of page_region struct array for output
 * @vec_len:		Length of the page_region struct array
 * @max_pages:		Optional limit for number of returned pages (0 = disabled)
 * @category_inverted:	PAGE_IS_* categories which values match if 0 instead of 1
 * @category_mask:	Skip pages for which any category doesn't match
 * @category_anyof_mask: Skip pages for which no category matches
 * @return_mask:	PAGE_IS_* categories that are to be reported in `page_region`s returned
 */
struct pm_scan_arg {
	__u64 size;
	__u64 flags;
	__u64 start;
	__u64 end;
	__u64 walk_end;
	__u64 vec;
	__u64 vec_len;
	__u64 max_pages;
	__u64 category_inverted;
	__u64 category_mask;
	__u64 category_anyof_mask;
	__u64 return_mask;
};

/* /proc/<pid>/maps ioctl */
#define PROCMAP_QUERY	_IOWR(PROCFS_IOCTL_MAGIC, 17, struct procmap_query)

enum procmap_query_flags {
	/*
	 * VMA permission flags.
	 *
	 * Can be used as part of procmap_query.query_flags field to look up
	 * only VMAs satisfying specified subset of permissions. E.g., specifying
	 * PROCMAP_QUERY_VMA_READABLE only will return both readable and read/write VMAs,
	 * while having PROCMAP_QUERY_VMA_READABLE | PROCMAP_QUERY_VMA_WRITABLE will only
	 * return read/write VMAs, though both executable/non-executable and
	 * private/shared will be ignored.
	 *
	 * PROCMAP_QUERY_VMA_* flags are also returned in procmap_query.vma_flags
	 * field to specify actual VMA permissions.
	 */
	PROCMAP_QUERY_VMA_READABLE		= 0x01,
	PROCMAP_QUERY_VMA_WRITABLE		= 0x02,
	PROCMAP_QUERY_VMA_EXECUTABLE		= 0x04,
	PROCMAP_QUERY_VMA_SHARED		= 0x08,
	/*
	 * Query modifier flags.
	 *
	 * By default VMA that covers provided address is returned, or -ENOENT
	 * is returned. With PROCMAP_QUERY_COVERING_OR_NEXT_VMA flag set, closest
	 * VMA with vma_start > addr will be returned if no covering VMA is
	 * found.
	 *
	 * PROCMAP_QUERY_FILE_BACKED_VMA instructs query to consider only VMAs that
	 * have file backing. Can be combined with PROCMAP_QUERY_COVERING_OR_NEXT_VMA
	 * to iterate all VMAs with file backing.
	 */
	PROCMAP_QUERY_COVERING_OR_NEXT_VMA	= 0x10,
	PROCMAP_QUERY_FILE_BACKED_VMA		= 0x20,
};

/*
 * Input/output argument structure passed into ioctl() call. It can be used
 * to query a set of VMAs (Virtual Memory Areas) of a process.
 *
 * Each field can be one of three kinds, marked in a short comment to the
 * right of the field:
 *   - "in", input argument, user has to provide this value, kernel doesn't modify it;
 *   - "out", output argument, kernel sets this field with VMA data;
 *   - "in/out", input and output argument; user provides initial value (used
 *     to specify maximum allowable buffer size), and kernel sets it to actual
 *     amount of data written (or zero, if there is no data).
 *
 * If matching VMA is found (according to criteria specified by
 * query_addr/query_flags), all the out fields are filled out, and ioctl()
 * returns 0. If there is no matching VMA, -ENOENT will be returned.
 * In case of any other error, negative error code other than -ENOENT is
 * returned.
 *
 * Most of the data is similar to the one returned as text in /proc/<pid>/maps
 * file, but procmap_query provides more querying flexibility. There are no
 * consistency guarantees between subsequent ioctl() calls, but data returned
 * for matched VMA is self-consistent.
 */
struct procmap_query {
	/* Query struct size, for backwards/forward compatibility */
	__u64 size;
	/*
	 * Query flags, a combination of enum procmap_query_flags values.
	 * Defines query filtering and behavior, see enum procmap_query_flags.
	 *
	 * Input argument, provided by user. Kernel doesn't modify it.
	 */
	__u64 query_flags;		/* in */
	/*
	 * Query address. By default, VMA that covers this address will
	 * be looked up. PROCMAP_QUERY_* flags above modify this default
	 * behavior further.
	 *
	 * Input argument, provided by user. Kernel doesn't modify it.
	 */
	__u64 query_addr;		/* in */
	/* VMA starting (inclusive) and ending (exclusive) address, if VMA is found. */
	__u64 vma_start;		/* out */
	__u64 vma_end;			/* out */
	/* VMA permissions flags. A combination of PROCMAP_QUERY_VMA_* flags. */
	__u64 vma_flags;		/* out */
	/* VMA backing page size granularity. */
	__u64 vma_page_size;		/* out */
	/*
	 * VMA file offset. If VMA has file backing, this specifies offset
	 * within the file that VMA's start address corresponds to.
	 * Is set to zero if VMA has no backing file.
	 */
	__u64 vma_offset;		/* out */
	/* Backing file's inode number, or zero, if VMA has no backing file. */
	__u64 inode;			/* out */
	/* Backing file's device major/minor number, or zero, if VMA has no backing file. */
	__u32 dev_major;		/* out */
	__u32 dev_minor;		/* out */
	/*
	 * If set to non-zero value, signals the request to return VMA name
	 * (i.e., VMA's backing file's absolute path, with " (deleted)" suffix
	 * appended, if file was unlinked from FS) for matched VMA. VMA name
	 * can also be some special name (e.g., "[heap]", "[stack]") or could
	 * be even user-supplied with prctl(PR_SET_VMA, PR_SET_VMA_ANON_NAME).
	 *
	 * Kernel will set this field to zero, if VMA has no associated name.
	 * Otherwise kernel will return actual amount of bytes filled in
	 * user-supplied buffer (see vma_name_addr field below), including the
	 * terminating zero.
	 *
	 * If VMA name is longer than user-supplied maximum buffer size,
	 * -E2BIG error is returned.
	 *
	 * If this field is set to non-zero value, vma_name_addr should point
	 * to valid user space memory buffer of at least vma_name_size bytes.
	 * If set to zero, vma_name_addr should be set to zero as well
	 */
	__u32 vma_name_size;		/* in/out */
	/*
	 * If set to non-zero value, signals the request to extract and return
	 * VMA's backing file's build ID, if the backing file is an ELF file
	 * and it contains embedded build ID.
	 *
	 * Kernel will set this field to zero, if VMA has no backing file,
	 * backing file is not an ELF file, or ELF file has no build ID
	 * embedded.
	 *
	 * Build ID is a binary value (not a string). Kernel will set
	 * build_id_size field to exact number of bytes used for build ID.
	 * If build ID is requested and present, but needs more bytes than
	 * user-supplied maximum buffer size (see build_id_addr field below),
	 * -E2BIG error will be returned.
	 *
	 * If this field is set to non-zero value, build_id_addr should point
	 * to valid user space memory buffer of at least build_id_size bytes.
	 * If set to zero, build_id_addr should be set to zero as well
	 */
	__u32 build_id_size;		/* in/out */
	/*
	 * User-supplied address of a buffer of at least vma_name_size bytes
	 * for kernel to fill with matched VMA's name (see vma_name_size field
	 * description above for details).
	 *
	 * Should be set to zero if VMA name should not be returned.
	 */
	__u64 vma_name_addr;		/* in */
	/*
	 * User-supplied address of a buffer of at least build_id_size bytes
	 * for kernel to fill with matched VMA's ELF build ID, if available
	 * (see build_id_size field description above for details).
	 *
	 * Should be set to zero if build ID should not be returned.
	 */
	__u64 build_id_addr;		/* in */
};

#endif /* _UAPI_LINUX_FS_H */