| 1 | /* SPDX-License-Identifier: GPL-2.0 WITH Linux-syscall-note */ | 
|---|
| 2 | #ifndef _UAPI_LINUX_FS_H | 
|---|
| 3 | #define _UAPI_LINUX_FS_H | 
|---|
| 4 |  | 
|---|
| 5 | /* | 
|---|
| 6 | * This file has definitions for some important file table structures | 
|---|
| 7 | * and constants and structures used by various generic file system | 
|---|
| 8 | * ioctl's.  Please do not make any changes in this file before | 
|---|
| 9 | * sending patches for review to linux-fsdevel@vger.kernel.org and | 
|---|
| 10 | * linux-api@vger.kernel.org. | 
|---|
| 11 | */ | 
|---|
| 12 |  | 
|---|
| 13 | #include <linux/limits.h> | 
|---|
| 14 | #include <linux/ioctl.h> | 
|---|
| 15 | #include <linux/types.h> | 
|---|
| 16 | #ifndef __KERNEL__ | 
|---|
| 17 | #include <linux/fscrypt.h> | 
|---|
| 18 | #endif | 
|---|
| 19 |  | 
|---|
| 20 | /* Use of MS_* flags within the kernel is restricted to core mount(2) code. */ | 
|---|
| 21 | #if !defined(__KERNEL__) | 
|---|
| 22 | #include <linux/mount.h> | 
|---|
| 23 | #endif | 
|---|
| 24 |  | 
|---|
| 25 | /* | 
|---|
| 26 | * It's silly to have NR_OPEN bigger than NR_FILE, but you can change | 
|---|
| 27 | * the file limit at runtime and only root can increase the per-process | 
|---|
| 28 | * nr_file rlimit, so it's safe to set up a ridiculously high absolute | 
|---|
| 29 | * upper limit on files-per-process. | 
|---|
| 30 | * | 
|---|
| 31 | * Some programs (notably those using select()) may have to be | 
|---|
| 32 | * recompiled to take full advantage of the new limits. | 
|---|
| 33 | */ | 
|---|
| 34 |  | 
|---|
| 35 | /* Fixed constants first: */ | 
|---|
#undef NR_OPEN

/* nfile rlimit settings */
#define INR_OPEN_CUR	1024	/* initial setting */
#define INR_OPEN_MAX	4096	/* hard limit */

/* BLOCK_SIZE is two raised to the power BLOCK_SIZE_BITS */
#define BLOCK_SIZE_BITS	10
#define BLOCK_SIZE	(1<<BLOCK_SIZE_BITS)
| 42 |  | 
|---|
/* Flags for integrity meta: each one enforces a single check */
#define IO_INTEGRITY_CHK_GUARD		(1U << 0) /* guard check */
#define IO_INTEGRITY_CHK_REFTAG		(1U << 1) /* ref check */
#define IO_INTEGRITY_CHK_APPTAG		(1U << 2) /* app check */

/* All IO_INTEGRITY_CHK_* flags defined above, OR-ed together */
#define IO_INTEGRITY_VALID_FLAGS (IO_INTEGRITY_CHK_GUARD | \
				  IO_INTEGRITY_CHK_REFTAG | \
				  IO_INTEGRITY_CHK_APPTAG)
| 51 |  | 
|---|
/* Seek origins; SEEK_MAX is the highest value defined here */
#define SEEK_SET	0	/* relative to beginning of file */
#define SEEK_CUR	1	/* relative to current file position */
#define SEEK_END	2	/* relative to end of file */
#define SEEK_DATA	3	/* move to the next data */
#define SEEK_HOLE	4	/* move to the next hole */
#define SEEK_MAX	SEEK_HOLE
| 58 |  | 
|---|
/* Rename flags */
#define RENAME_NOREPLACE	(1 << 0)	/* do not overwrite the target */
#define RENAME_EXCHANGE		(1 << 1)	/* swap source and destination */
#define RENAME_WHITEOUT		(1 << 2)	/* whiteout the source */
| 62 |  | 
|---|
| 63 | /* | 
|---|
| 64 | * The root inode of procfs is guaranteed to always have the same inode number. | 
|---|
| 65 | * For programs that make heavy use of procfs, verifying that the root is a | 
|---|
| 66 | * real procfs root and using openat2(RESOLVE_{NO_{XDEV,MAGICLINKS},BENEATH}) | 
|---|
| 67 | * will allow you to make sure you are never tricked into operating on the | 
|---|
| 68 | * wrong procfs file. | 
|---|
| 69 | */ | 
|---|
enum procfs_ino {
	/* Inode number of the procfs root inode */
	PROCFS_ROOT_INO = 1,
};
| 73 |  | 
|---|
| 74 | struct file_clone_range { | 
|---|
| 75 | __s64 src_fd; | 
|---|
| 76 | __u64 src_offset; | 
|---|
| 77 | __u64 src_length; | 
|---|
| 78 | __u64 dest_offset; | 
|---|
| 79 | }; | 
|---|
| 80 |  | 
|---|
| 81 | struct fstrim_range { | 
|---|
| 82 | __u64 start; | 
|---|
| 83 | __u64 len; | 
|---|
| 84 | __u64 minlen; | 
|---|
| 85 | }; | 
|---|
| 86 |  | 
|---|
| 87 | /* | 
|---|
| 88 | * We include a length field because some filesystems (vfat) have an identifier | 
|---|
| 89 | * that we do want to expose as a UUID, but doesn't have the standard length. | 
|---|
| 90 | * | 
|---|
| 91 | * We use a fixed size buffer because this interface will, by fiat, never | 
|---|
| 92 | * support "UUIDs" longer than 16 bytes; we don't want to force all downstream | 
|---|
| 93 | * users to have to deal with that. | 
|---|
| 94 | */ | 
|---|
| 95 | struct fsuuid2 { | 
|---|
| 96 | __u8	len; | 
|---|
| 97 | __u8	uuid[16]; | 
|---|
| 98 | }; | 
|---|
| 99 |  | 
|---|
| 100 | struct fs_sysfs_path { | 
|---|
| 101 | __u8			len; | 
|---|
| 102 | __u8			name[128]; | 
|---|
| 103 | }; | 
|---|
| 104 |  | 
|---|
/* Capability flags for protection info */
#define LBMD_PI_CAP_INTEGRITY		(1 << 0)
#define LBMD_PI_CAP_REFTAG		(1 << 1)

/* Protection Information checksum types */
#define LBMD_PI_CSUM_NONE		0
#define LBMD_PI_CSUM_IP			1
#define LBMD_PI_CSUM_CRC16_T10DIF	2
#define LBMD_PI_CSUM_CRC64_NVME		4

/* sizeof the first published struct */
#define LBMD_SIZE_VER0			16
| 117 |  | 
|---|
| 118 | /* | 
|---|
| 119 | * Logical block metadata capability descriptor | 
|---|
| 120 | * If the device does not support metadata, all the fields will be zero. | 
|---|
| 121 | * Applications must check lbmd_flags to determine whether metadata is | 
|---|
| 122 | * supported or not. | 
|---|
| 123 | */ | 
|---|
| 124 | struct logical_block_metadata_cap { | 
|---|
| 125 | /* Bitmask of logical block metadata capability flags */ | 
|---|
| 126 | __u32	lbmd_flags; | 
|---|
| 127 | /* | 
|---|
| 128 | * The amount of data described by each unit of logical block | 
|---|
| 129 | * metadata | 
|---|
| 130 | */ | 
|---|
| 131 | __u16	lbmd_interval; | 
|---|
| 132 | /* | 
|---|
| 133 | * Size in bytes of the logical block metadata associated with each | 
|---|
| 134 | * interval | 
|---|
| 135 | */ | 
|---|
| 136 | __u8	lbmd_size; | 
|---|
| 137 | /* | 
|---|
| 138 | * Size in bytes of the opaque block tag associated with each | 
|---|
| 139 | * interval | 
|---|
| 140 | */ | 
|---|
| 141 | __u8	lbmd_opaque_size; | 
|---|
| 142 | /* | 
|---|
| 143 | * Offset in bytes of the opaque block tag within the logical block | 
|---|
| 144 | * metadata | 
|---|
| 145 | */ | 
|---|
| 146 | __u8	lbmd_opaque_offset; | 
|---|
| 147 | /* Size in bytes of the T10 PI tuple associated with each interval */ | 
|---|
| 148 | __u8	lbmd_pi_size; | 
|---|
| 149 | /* Offset in bytes of T10 PI tuple within the logical block metadata */ | 
|---|
| 150 | __u8	lbmd_pi_offset; | 
|---|
| 151 | /* T10 PI guard tag type */ | 
|---|
| 152 | __u8	lbmd_guard_tag_type; | 
|---|
| 153 | /* Size in bytes of the T10 PI application tag */ | 
|---|
| 154 | __u8	lbmd_app_tag_size; | 
|---|
| 155 | /* Size in bytes of the T10 PI reference tag */ | 
|---|
| 156 | __u8	lbmd_ref_tag_size; | 
|---|
| 157 | /* Size in bytes of the T10 PI storage tag */ | 
|---|
| 158 | __u8	lbmd_storage_tag_size; | 
|---|
| 159 | __u8	pad; | 
|---|
| 160 | }; | 
|---|
| 161 |  | 
|---|
/*
 * extent-same (dedupe) ioctls.
 * These values MUST match the btrfs ioctl definitions.
 */
#define FILE_DEDUPE_RANGE_SAME		0
#define FILE_DEDUPE_RANGE_DIFFERS	1
| 165 |  | 
|---|
| 166 | /* from struct btrfs_ioctl_file_extent_same_info */ | 
|---|
| 167 | struct file_dedupe_range_info { | 
|---|
| 168 | __s64 dest_fd;		/* in - destination file */ | 
|---|
| 169 | __u64 dest_offset;	/* in - start of extent in destination */ | 
|---|
| 170 | __u64 bytes_deduped;	/* out - total # of bytes we were able | 
|---|
| 171 | * to dedupe from this file. */ | 
|---|
| 172 | /* status of this dedupe operation: | 
|---|
| 173 | * < 0 for error | 
|---|
| 174 | * == FILE_DEDUPE_RANGE_SAME if dedupe succeeds | 
|---|
| 175 | * == FILE_DEDUPE_RANGE_DIFFERS if data differs | 
|---|
| 176 | */ | 
|---|
| 177 | __s32 status;		/* out - see above description */ | 
|---|
| 178 | __u32 reserved;		/* must be zero */ | 
|---|
| 179 | }; | 
|---|
| 180 |  | 
|---|
| 181 | /* from struct btrfs_ioctl_file_extent_same_args */ | 
|---|
| 182 | struct file_dedupe_range { | 
|---|
| 183 | __u64 src_offset;	/* in - start of extent in source */ | 
|---|
| 184 | __u64 src_length;	/* in - length of extent */ | 
|---|
| 185 | __u16 dest_count;	/* in - total elements in info array */ | 
|---|
| 186 | __u16 reserved1;	/* must be zero */ | 
|---|
| 187 | __u32 reserved2;	/* must be zero */ | 
|---|
| 188 | struct file_dedupe_range_info info[]; | 
|---|
| 189 | }; | 
|---|
| 190 |  | 
|---|
/* Dynamically-tunable limits and defaults follow: */
struct files_stat_struct {
	unsigned long	nr_files;	/* read only */
	unsigned long	nr_free_files;	/* read only */
	unsigned long	max_files;	/* tunable */
};
| 197 |  | 
|---|
struct inodes_stat_t {
	long	nr_inodes;
	long	nr_unused;
	/* Padding kept for sysctl ABI compatibility */
	long	dummy[5];
};
| 203 |  | 
|---|
| 204 |  | 
|---|
/* This can well be larger on a larger system */
#define NR_FILE	8192
| 206 |  | 
|---|
| 207 | /* | 
|---|
| 208 | * Structure for FS_IOC_FSGETXATTR[A] and FS_IOC_FSSETXATTR. | 
|---|
| 209 | */ | 
|---|
| 210 | struct fsxattr { | 
|---|
| 211 | __u32		fsx_xflags;	/* xflags field value (get/set) */ | 
|---|
| 212 | __u32		fsx_extsize;	/* extsize field value (get/set)*/ | 
|---|
| 213 | __u32		fsx_nextents;	/* nextents field value (get)	*/ | 
|---|
| 214 | __u32		fsx_projid;	/* project identifier (get/set) */ | 
|---|
| 215 | __u32		fsx_cowextsize;	/* CoW extsize field value (get/set)*/ | 
|---|
| 216 | unsigned char	fsx_pad[8]; | 
|---|
| 217 | }; | 
|---|
| 218 |  | 
|---|
| 219 | /* | 
|---|
| 220 | * Variable size structure for file_[sg]et_attr(). | 
|---|
| 221 | * | 
|---|
| 222 | * Note: this is an alternative to 'struct file_kattr'/'struct fsxattr'. | 
|---|
| 223 | * As this structure is passed to/from userspace with its size, this can | 
|---|
| 224 | * be versioned based on the size. | 
|---|
| 225 | */ | 
|---|
| 226 | struct file_attr { | 
|---|
| 227 | __u64 fa_xflags;	/* xflags field value (get/set) */ | 
|---|
| 228 | __u32 fa_extsize;	/* extsize field value (get/set)*/ | 
|---|
| 229 | __u32 fa_nextents;	/* nextents field value (get)   */ | 
|---|
| 230 | __u32 fa_projid;	/* project identifier (get/set) */ | 
|---|
| 231 | __u32 fa_cowextsize;	/* CoW extsize field value (get/set) */ | 
|---|
| 232 | }; | 
|---|
| 233 |  | 
|---|
/* Size constants for struct file_attr; LATEST aliases the newest version */
#define FILE_ATTR_SIZE_VER0	24
#define FILE_ATTR_SIZE_LATEST	FILE_ATTR_SIZE_VER0
| 236 |  | 
|---|
/*
 * Flag bits carried in the fsx_xflags field
 */
#define FS_XFLAG_REALTIME	0x00000001	/* data in realtime volume */
#define FS_XFLAG_PREALLOC	0x00000002	/* preallocated file extents */
#define FS_XFLAG_IMMUTABLE	0x00000008	/* file cannot be modified */
#define FS_XFLAG_APPEND		0x00000010	/* all writes append */
#define FS_XFLAG_SYNC		0x00000020	/* all writes synchronous */
#define FS_XFLAG_NOATIME	0x00000040	/* do not update access time */
#define FS_XFLAG_NODUMP		0x00000080	/* do not include in backups */
#define FS_XFLAG_RTINHERIT	0x00000100	/* create with rt bit set */
#define FS_XFLAG_PROJINHERIT	0x00000200	/* create with parents projid */
#define FS_XFLAG_NOSYMLINKS	0x00000400	/* disallow symlink creation */
#define FS_XFLAG_EXTSIZE	0x00000800	/* extent size allocator hint */
#define FS_XFLAG_EXTSZINHERIT	0x00001000	/* inherit inode extent size */
#define FS_XFLAG_NODEFRAG	0x00002000	/* do not defragment */
#define FS_XFLAG_FILESTREAM	0x00004000	/* use filestream allocator */
#define FS_XFLAG_DAX		0x00008000	/* use DAX for IO */
#define FS_XFLAG_COWEXTSIZE	0x00010000	/* CoW extent size allocator hint */
#define FS_XFLAG_HASATTR	0x80000000	/* no DIFLAG for this */
| 257 |  | 
|---|
| 258 | /* the read-only stuff doesn't really belong here, but any other place is | 
|---|
| 259 | probably as bad and I don't want to create yet another include file. */ | 
|---|
| 260 |  | 
|---|
/* Block device ioctls, all in the 0x12 ioctl group */
#define BLKROSET	_IO(0x12,93)	/* set device read-only (0 = read-write) */
#define BLKROGET	_IO(0x12,94)	/* get read-only status (0 = read_write) */
#define BLKRRPART	_IO(0x12,95)	/* re-read partition table */
#define BLKGETSIZE	_IO(0x12,96)	/* return device size /512 (long *arg) */
#define BLKFLSBUF	_IO(0x12,97)	/* flush buffer cache */
#define BLKRASET	_IO(0x12,98)	/* set read ahead for block device */
#define BLKRAGET	_IO(0x12,99)	/* get current read ahead setting */
#define BLKFRASET	_IO(0x12,100)	/* set filesystem (mm/filemap.c) read-ahead */
#define BLKFRAGET	_IO(0x12,101)	/* get filesystem (mm/filemap.c) read-ahead */
#define BLKSECTSET	_IO(0x12,102)	/* set max sectors per request (ll_rw_blk.c) */
#define BLKSECTGET	_IO(0x12,103)	/* get max sectors per request (ll_rw_blk.c) */
#define BLKSSZGET	_IO(0x12,104)	/* get block device sector size */
#if 0
#define BLKPG		_IO(0x12,105)	/* See blkpg.h */

/* Do not use sizeof! */

#define BLKELVGET	_IOR(0x12,106,size_t)	/* elevator get */
#define BLKELVSET	_IOW(0x12,107,size_t)	/* elevator set */
/*
 * Listed here only to show that these numbers are taken - probably all
 * these _IO(0x12,*) ioctls should be moved to blkpg.h.
 */
#endif
/* Numbering jumps here: 108-111 have been used for various private purposes. */
#define BLKBSZGET	_IOR(0x12,112,size_t)
#define BLKBSZSET	_IOW(0x12,113,size_t)
#define BLKGETSIZE64	_IOR(0x12,114,size_t)	/* return device size in bytes (u64 *arg) */
#define BLKTRACESETUP	_IOWR(0x12,115,struct blk_user_trace_setup)
#define BLKTRACESTART	_IO(0x12,116)
#define BLKTRACESTOP	_IO(0x12,117)
#define BLKTRACETEARDOWN _IO(0x12,118)
#define BLKDISCARD	_IO(0x12,119)
#define BLKIOMIN	_IO(0x12,120)
#define BLKIOOPT	_IO(0x12,121)
#define BLKALIGNOFF	_IO(0x12,122)
#define BLKPBSZGET	_IO(0x12,123)
#define BLKDISCARDZEROES _IO(0x12,124)
#define BLKSECDISCARD	_IO(0x12,125)
#define BLKROTATIONAL	_IO(0x12,126)
#define BLKZEROOUT	_IO(0x12,127)
#define BLKGETDISKSEQ	_IOR(0x12,128,__u64)
/* 130-136 are used by zoned block device ioctls (uapi/linux/blkzoned.h) */
/* 137-141 are used by blk-crypto ioctls (uapi/linux/blk-crypto.h) */
| 303 |  | 
|---|
#define BMAP_IOCTL	1		/* obsolete - kept for compatibility */
#define FIBMAP		_IO(0x00,1)	/* bmap access */
#define FIGETBSZ	_IO(0x00,2)	/* get the block size used for bmap */
#define FIFREEZE	_IOWR('X', 119, int)	/* Freeze */
#define FITHAW		_IOWR('X', 120, int)	/* Thaw */
#define FITRIM		_IOWR('X', 121, struct fstrim_range)	/* Trim */
#define FICLONE		_IOW(0x94, 9, int)
#define FICLONERANGE	_IOW(0x94, 13, struct file_clone_range)
#define FIDEDUPERANGE	_IOWR(0x94, 54, struct file_dedupe_range)

/* Max chars for the label interface; each fs may differ */
#define FSLABEL_MAX	256
| 315 |  | 
|---|
/* Inode flag and version ioctls ('long' argument size) */
#define FS_IOC_GETFLAGS			_IOR('f', 1, long)
#define FS_IOC_SETFLAGS			_IOW('f', 2, long)
#define FS_IOC_GETVERSION		_IOR('v', 1, long)
#define FS_IOC_SETVERSION		_IOW('v', 2, long)
#define FS_IOC_FIEMAP			_IOWR('f', 11, struct fiemap)
/* Same numbers as above, encoded with an 'int' argument size */
#define FS_IOC32_GETFLAGS		_IOR('f', 1, int)
#define FS_IOC32_SETFLAGS		_IOW('f', 2, int)
#define FS_IOC32_GETVERSION		_IOR('v', 1, int)
#define FS_IOC32_SETVERSION		_IOW('v', 2, int)
#define FS_IOC_FSGETXATTR		_IOR('X', 31, struct fsxattr)
#define FS_IOC_FSSETXATTR		_IOW('X', 32, struct fsxattr)
#define FS_IOC_GETFSLABEL		_IOR(0x94, 49, char[FSLABEL_MAX])
#define FS_IOC_SETFSLABEL		_IOW(0x94, 50, char[FSLABEL_MAX])
/* Returns the external filesystem UUID, the same one blkid returns */
#define FS_IOC_GETFSUUID		_IOR(0x15, 0, struct fsuuid2)
/*
 * Returns the path component under /sys/fs/ that refers to this filesystem;
 * also /sys/kernel/debug/ for filesystems with debugfs exports
 */
#define FS_IOC_GETFSSYSFSPATH		_IOR(0x15, 1, struct fs_sysfs_path)
/* Get logical block metadata capability details */
#define FS_IOC_GETLBMD_CAP		_IOWR(0x15, 2, struct logical_block_metadata_cap)
| 338 |  | 
|---|
| 339 | /* | 
|---|
| 340 | * Inode flags (FS_IOC_GETFLAGS / FS_IOC_SETFLAGS) | 
|---|
| 341 | * | 
|---|
| 342 | * Note: for historical reasons, these flags were originally used and | 
|---|
| 343 | * defined for use by ext2/ext3, and then other file systems started | 
|---|
| 344 | * using these flags so they wouldn't need to write their own version | 
|---|
| 345 | * of chattr/lsattr (which was shipped as part of e2fsprogs).  You | 
|---|
| 346 | * should think twice before trying to use these flags in new | 
|---|
| 347 | * contexts, or trying to assign these flags, since they are used both | 
|---|
| 348 | * as the UAPI and the on-disk encoding for ext2/3/4.  Also, we are | 
|---|
| 349 | * almost out of 32-bit flags.  :-) | 
|---|
| 350 | * | 
|---|
| 351 | * We have recently hoisted FS_IOC_FSGETXATTR / FS_IOC_FSSETXATTR from | 
|---|
| 352 | * XFS to the generic FS level interface.  This uses a structure that | 
|---|
| 353 | * has padding and hence has more room to grow, so it may be more | 
|---|
| 354 | * appropriate for many new use cases. | 
|---|
| 355 | * | 
|---|
| 356 | * Please do not change these flags or interfaces before checking with | 
|---|
| 357 | * linux-fsdevel@vger.kernel.org and linux-api@vger.kernel.org. | 
|---|
| 358 | */ | 
|---|
#define FS_SECRM_FL			0x00000001 /* Secure deletion */
#define FS_UNRM_FL			0x00000002 /* Undelete */
#define FS_COMPR_FL			0x00000004 /* Compress file */
#define FS_SYNC_FL			0x00000008 /* Synchronous updates */
#define FS_IMMUTABLE_FL			0x00000010 /* Immutable file */
#define FS_APPEND_FL			0x00000020 /* writes to file may only append */
#define FS_NODUMP_FL			0x00000040 /* do not dump file */
#define FS_NOATIME_FL			0x00000080 /* do not update atime */
/* Start of flags reserved for compression usage */
#define FS_DIRTY_FL			0x00000100
#define FS_COMPRBLK_FL			0x00000200 /* One or more compressed clusters */
#define FS_NOCOMP_FL			0x00000400 /* Don't compress */
/* End of compression flags --- maybe not all used */
#define FS_ENCRYPT_FL			0x00000800 /* Encrypted file */
/* FS_BTREE_FL and FS_INDEX_FL share the same bit */
#define FS_BTREE_FL			0x00001000 /* btree format dir */
#define FS_INDEX_FL			0x00001000 /* hash-indexed directory */
#define FS_IMAGIC_FL			0x00002000 /* AFS directory */
#define FS_JOURNAL_DATA_FL		0x00004000 /* Reserved for ext3 */
#define FS_NOTAIL_FL			0x00008000 /* file tail should not be merged */
#define FS_DIRSYNC_FL			0x00010000 /* dirsync behaviour (directories only) */
#define FS_TOPDIR_FL			0x00020000 /* Top of directory hierarchies */
#define FS_HUGE_FILE_FL			0x00040000 /* Reserved for ext4 */
#define FS_EXTENT_FL			0x00080000 /* Extents */
#define FS_VERITY_FL			0x00100000 /* Verity protected inode */
#define FS_EA_INODE_FL			0x00200000 /* Inode used for large EA */
#define FS_EOFBLOCKS_FL			0x00400000 /* Reserved for ext4 */
#define FS_NOCOW_FL			0x00800000 /* Do not cow file */
#define FS_DAX_FL			0x02000000 /* Inode is DAX */
#define FS_INLINE_DATA_FL		0x10000000 /* Reserved for ext4 */
#define FS_PROJINHERIT_FL		0x20000000 /* Create with parents projid */
#define FS_CASEFOLD_FL			0x40000000 /* Folder is case insensitive */
#define FS_RESERVED_FL			0x80000000 /* reserved for ext2 lib */

/* Masks over the flags above */
#define FS_FL_USER_VISIBLE		0x0003DFFF /* User visible flags */
#define FS_FL_USER_MODIFIABLE		0x000380FF /* User modifiable flags */
| 394 |  | 
|---|
| 395 |  | 
|---|
#define SYNC_FILE_RANGE_WAIT_BEFORE	1
#define SYNC_FILE_RANGE_WRITE		2
#define SYNC_FILE_RANGE_WAIT_AFTER	4
/* All three SYNC_FILE_RANGE_* bits above combined */
#define SYNC_FILE_RANGE_WRITE_AND_WAIT	(SYNC_FILE_RANGE_WRITE | \
					 SYNC_FILE_RANGE_WAIT_BEFORE | \
					 SYNC_FILE_RANGE_WAIT_AFTER)
| 402 |  | 
|---|
| 403 | /* | 
|---|
| 404 | * Flags for preadv2/pwritev2: | 
|---|
| 405 | */ | 
|---|
| 406 |  | 
|---|
| 407 | typedef int __bitwise __kernel_rwf_t; | 
|---|
| 408 |  | 
|---|
| 409 | /* high priority request, poll if possible */ | 
|---|
| 410 | #define RWF_HIPRI	((__force __kernel_rwf_t)0x00000001) | 
|---|
| 411 |  | 
|---|
| 412 | /* per-IO O_DSYNC */ | 
|---|
| 413 | #define RWF_DSYNC	((__force __kernel_rwf_t)0x00000002) | 
|---|
| 414 |  | 
|---|
| 415 | /* per-IO O_SYNC */ | 
|---|
| 416 | #define RWF_SYNC	((__force __kernel_rwf_t)0x00000004) | 
|---|
| 417 |  | 
|---|
| 418 | /* per-IO, return -EAGAIN if operation would block */ | 
|---|
| 419 | #define RWF_NOWAIT	((__force __kernel_rwf_t)0x00000008) | 
|---|
| 420 |  | 
|---|
| 421 | /* per-IO O_APPEND */ | 
|---|
| 422 | #define RWF_APPEND	((__force __kernel_rwf_t)0x00000010) | 
|---|
| 423 |  | 
|---|
| 424 | /* per-IO negation of O_APPEND */ | 
|---|
| 425 | #define RWF_NOAPPEND	((__force __kernel_rwf_t)0x00000020) | 
|---|
| 426 |  | 
|---|
| 427 | /* Atomic Write */ | 
|---|
| 428 | #define RWF_ATOMIC	((__force __kernel_rwf_t)0x00000040) | 
|---|
| 429 |  | 
|---|
| 430 | /* buffered IO that drops the cache after reading or writing data */ | 
|---|
| 431 | #define RWF_DONTCACHE	((__force __kernel_rwf_t)0x00000080) | 
|---|
| 432 |  | 
|---|
| 433 | /* prevent pipe and socket writes from raising SIGPIPE */ | 
|---|
| 434 | #define RWF_NOSIGNAL	((__force __kernel_rwf_t)0x00000100) | 
|---|
| 435 |  | 
|---|
| 436 | /* mask of flags supported by the kernel */ | 
|---|
| 437 | #define RWF_SUPPORTED	(RWF_HIPRI | RWF_DSYNC | RWF_SYNC | RWF_NOWAIT |\ | 
|---|
| 438 | RWF_APPEND | RWF_NOAPPEND | RWF_ATOMIC |\ | 
|---|
| 439 | RWF_DONTCACHE | RWF_NOSIGNAL) | 
|---|
| 440 |  | 
|---|
/* ioctl group used by the procfs ioctls below */
#define PROCFS_IOCTL_MAGIC 'f'

/* Pagemap ioctl */
#define PAGEMAP_SCAN	_IOWR(PROCFS_IOCTL_MAGIC, 16, struct pm_scan_arg)

/*
 * Category bits: supplied in the pm_scan_args masks and reported back in
 * page_region.categories.
 */
#define PAGE_IS_WPALLOWED	(1 << 0)
#define PAGE_IS_WRITTEN		(1 << 1)
#define PAGE_IS_FILE		(1 << 2)
#define PAGE_IS_PRESENT		(1 << 3)
#define PAGE_IS_SWAPPED		(1 << 4)
#define PAGE_IS_PFNZERO		(1 << 5)
#define PAGE_IS_HUGE		(1 << 6)
#define PAGE_IS_SOFT_DIRTY	(1 << 7)
#define PAGE_IS_GUARD		(1 << 8)
| 456 |  | 
|---|
| 457 | /* | 
|---|
| 458 | * struct page_region - Page region with flags | 
|---|
| 459 | * @start:	Start of the region | 
|---|
| 460 | * @end:	End of the region (exclusive) | 
|---|
| 461 | * @categories:	PAGE_IS_* category bitmask for the region | 
|---|
| 462 | */ | 
|---|
| 463 | struct page_region { | 
|---|
| 464 | __u64 start; | 
|---|
| 465 | __u64 end; | 
|---|
| 466 | __u64 categories; | 
|---|
| 467 | }; | 
|---|
| 468 |  | 
|---|
/* Flags for the PAGEMAP_SCAN ioctl */
/* Write protect the pages matched. */
#define PM_SCAN_WP_MATCHING	(1 << 0)
/* Abort the scan when a non-WP-enabled page is found. */
#define PM_SCAN_CHECK_WPASYNC	(1 << 1)
| 472 |  | 
|---|
| 473 | /* | 
|---|
| 474 | * struct pm_scan_arg - Pagemap ioctl argument | 
|---|
| 475 | * @size:		Size of the structure | 
|---|
| 476 | * @flags:		Flags for the IOCTL | 
|---|
| 477 | * @start:		Starting address of the region | 
|---|
| 478 | * @end:		Ending address of the region | 
|---|
| 479 | * @walk_end		Address where the scan stopped (written by kernel). | 
|---|
| 480 | *			walk_end == end (address tags cleared) informs that the scan completed on entire range. | 
|---|
| 481 | * @vec:		Address of page_region struct array for output | 
|---|
| 482 | * @vec_len:		Length of the page_region struct array | 
|---|
| 483 | * @max_pages:		Optional limit for number of returned pages (0 = disabled) | 
|---|
| 484 | * @category_inverted:	PAGE_IS_* categories which values match if 0 instead of 1 | 
|---|
| 485 | * @category_mask:	Skip pages for which any category doesn't match | 
|---|
| 486 | * @category_anyof_mask: Skip pages for which no category matches | 
|---|
| 487 | * @return_mask:	PAGE_IS_* categories that are to be reported in `page_region`s returned | 
|---|
| 488 | */ | 
|---|
| 489 | struct pm_scan_arg { | 
|---|
| 490 | __u64 size; | 
|---|
| 491 | __u64 flags; | 
|---|
| 492 | __u64 start; | 
|---|
| 493 | __u64 end; | 
|---|
| 494 | __u64 walk_end; | 
|---|
| 495 | __u64 vec; | 
|---|
| 496 | __u64 vec_len; | 
|---|
| 497 | __u64 max_pages; | 
|---|
| 498 | __u64 category_inverted; | 
|---|
| 499 | __u64 category_mask; | 
|---|
| 500 | __u64 category_anyof_mask; | 
|---|
| 501 | __u64 return_mask; | 
|---|
| 502 | }; | 
|---|
| 503 |  | 
|---|
/* /proc/<pid>/maps ioctl */
#define PROCMAP_QUERY	_IOWR(PROCFS_IOCTL_MAGIC, 17, struct procmap_query)

enum procmap_query_flags {
	/*
	 * VMA permission flags.
	 *
	 * When placed in procmap_query.query_flags they restrict the lookup
	 * to VMAs satisfying the given subset of permissions. For example,
	 * PROCMAP_QUERY_VMA_READABLE on its own returns both readable and
	 * read/write VMAs, whereas
	 * PROCMAP_QUERY_VMA_READABLE | PROCMAP_QUERY_VMA_WRITABLE returns only
	 * read/write VMAs; in both cases executable/non-executable and
	 * private/shared are ignored.
	 *
	 * The same PROCMAP_QUERY_VMA_* flags are returned in
	 * procmap_query.vma_flags to specify the actual VMA permissions.
	 */
	PROCMAP_QUERY_VMA_READABLE		= 0x01,
	PROCMAP_QUERY_VMA_WRITABLE		= 0x02,
	PROCMAP_QUERY_VMA_EXECUTABLE		= 0x04,
	PROCMAP_QUERY_VMA_SHARED		= 0x08,
	/*
	 * Query modifier flags.
	 *
	 * By default the VMA covering the provided address is returned, or
	 * -ENOENT if there is none. With PROCMAP_QUERY_COVERING_OR_NEXT_VMA
	 * set, the closest VMA with vma_start > addr is returned when no
	 * covering VMA is found.
	 *
	 * PROCMAP_QUERY_FILE_BACKED_VMA makes the query consider only VMAs
	 * that have file backing. Combine it with
	 * PROCMAP_QUERY_COVERING_OR_NEXT_VMA to iterate all VMAs with file
	 * backing.
	 */
	PROCMAP_QUERY_COVERING_OR_NEXT_VMA	= 0x10,
	PROCMAP_QUERY_FILE_BACKED_VMA		= 0x20,
};
| 540 |  | 
|---|
| 541 | /* | 
|---|
| 542 | * Input/output argument structure passed into ioctl() call. It can be used | 
|---|
| 543 | * to query a set of VMAs (Virtual Memory Areas) of a process. | 
|---|
| 544 | * | 
|---|
| 545 | * Each field can be one of three kinds, marked in a short comment to the | 
|---|
| 546 | * right of the field: | 
|---|
| 547 | *   - "in", input argument, user has to provide this value, kernel doesn't modify it; | 
|---|
| 548 | *   - "out", output argument, kernel sets this field with VMA data; | 
|---|
| 549 | *   - "in/out", input and output argument; user provides initial value (used | 
|---|
| 550 | *     to specify maximum allowable buffer size), and kernel sets it to actual | 
|---|
| 551 | *     amount of data written (or zero, if there is no data). | 
|---|
| 552 | * | 
|---|
| 553 | * If matching VMA is found (according to criteria specified by | 
|---|
| 554 | * query_addr/query_flags), all the out fields are filled out, and ioctl() | 
|---|
| 555 | * returns 0. If there is no matching VMA, -ENOENT will be returned. | 
|---|
| 556 | * In case of any other error, negative error code other than -ENOENT is | 
|---|
| 557 | * returned. | 
|---|
| 558 | * | 
|---|
| 559 | * Most of the data is similar to the one returned as text in /proc/<pid>/maps | 
|---|
| 560 | * file, but procmap_query provides more querying flexibility. There are no | 
|---|
| 561 | * consistency guarantees between subsequent ioctl() calls, but data returned | 
|---|
| 562 | * for matched VMA is self-consistent. | 
|---|
| 563 | */ | 
|---|
| 564 | struct procmap_query { | 
|---|
| 565 | /* Query struct size, for backwards/forward compatibility */ | 
|---|
| 566 | __u64 size; | 
|---|
| 567 | /* | 
|---|
| 568 | * Query flags, a combination of enum procmap_query_flags values. | 
|---|
| 569 | * Defines query filtering and behavior, see enum procmap_query_flags. | 
|---|
| 570 | * | 
|---|
| 571 | * Input argument, provided by user. Kernel doesn't modify it. | 
|---|
| 572 | */ | 
|---|
| 573 | __u64 query_flags;		/* in */ | 
|---|
| 574 | /* | 
|---|
| 575 | * Query address. By default, VMA that covers this address will | 
|---|
| 576 | * be looked up. PROCMAP_QUERY_* flags above modify this default | 
|---|
| 577 | * behavior further. | 
|---|
| 578 | * | 
|---|
| 579 | * Input argument, provided by user. Kernel doesn't modify it. | 
|---|
| 580 | */ | 
|---|
| 581 | __u64 query_addr;		/* in */ | 
|---|
| 582 | /* VMA starting (inclusive) and ending (exclusive) address, if VMA is found. */ | 
|---|
| 583 | __u64 vma_start;		/* out */ | 
|---|
| 584 | __u64 vma_end;			/* out */ | 
|---|
| 585 | /* VMA permissions flags. A combination of PROCMAP_QUERY_VMA_* flags. */ | 
|---|
| 586 | __u64 vma_flags;		/* out */ | 
|---|
| 587 | /* VMA backing page size granularity. */ | 
|---|
| 588 | __u64 vma_page_size;		/* out */ | 
|---|
| 589 | /* | 
|---|
| 590 | * VMA file offset. If VMA has file backing, this specifies offset | 
|---|
| 591 | * within the file that VMA's start address corresponds to. | 
|---|
| 592 | * Is set to zero if VMA has no backing file. | 
|---|
| 593 | */ | 
|---|
| 594 | __u64 vma_offset;		/* out */ | 
|---|
| 595 | /* Backing file's inode number, or zero, if VMA has no backing file. */ | 
|---|
| 596 | __u64 inode;			/* out */ | 
|---|
| 597 | /* Backing file's device major/minor number, or zero, if VMA has no backing file. */ | 
|---|
| 598 | __u32 dev_major;		/* out */ | 
|---|
| 599 | __u32 dev_minor;		/* out */ | 
|---|
| 600 | /* | 
|---|
| 601 | * If set to non-zero value, signals the request to return VMA name | 
|---|
| 602 | * (i.e., VMA's backing file's absolute path, with " (deleted)" suffix | 
|---|
| 603 | * appended, if file was unlinked from FS) for matched VMA. VMA name | 
|---|
| 604 | * can also be some special name (e.g., "[heap]", "[stack]") or could | 
|---|
| 605 | * be even user-supplied with prctl(PR_SET_VMA, PR_SET_VMA_ANON_NAME). | 
|---|
| 606 | * | 
|---|
| 607 | * Kernel will set this field to zero, if VMA has no associated name. | 
|---|
| 608 | * Otherwise kernel will return actual amount of bytes filled in | 
|---|
| 609 | * user-supplied buffer (see vma_name_addr field below), including the | 
|---|
| 610 | * terminating zero. | 
|---|
| 611 | * | 
|---|
| 612 | * If VMA name is longer that user-supplied maximum buffer size, | 
|---|
| 613 | * -E2BIG error is returned. | 
|---|
| 614 | * | 
|---|
| 615 | * If this field is set to non-zero value, vma_name_addr should point | 
|---|
| 616 | * to valid user space memory buffer of at least vma_name_size bytes. | 
|---|
| 617 | * If set to zero, vma_name_addr should be set to zero as well | 
|---|
| 618 | */ | 
|---|
| 619 | __u32 vma_name_size;		/* in/out */ | 
|---|
| 620 | /* | 
|---|
| 621 | * If set to non-zero value, signals the request to extract and return | 
|---|
| 622 | * VMA's backing file's build ID, if the backing file is an ELF file | 
|---|
| 623 | * and it contains embedded build ID. | 
|---|
| 624 | * | 
|---|
| 625 | * Kernel will set this field to zero, if VMA has no backing file, | 
|---|
| 626 | * backing file is not an ELF file, or ELF file has no build ID | 
|---|
| 627 | * embedded. | 
|---|
| 628 | * | 
|---|
| 629 | * Build ID is a binary value (not a string). Kernel will set | 
|---|
| 630 | * build_id_size field to exact number of bytes used for build ID. | 
|---|
| 631 | * If build ID is requested and present, but needs more bytes than | 
|---|
| 632 | * user-supplied maximum buffer size (see build_id_addr field below), | 
|---|
| 633 | * -E2BIG error will be returned. | 
|---|
| 634 | * | 
|---|
| 635 | * If this field is set to non-zero value, build_id_addr should point | 
|---|
| 636 | * to valid user space memory buffer of at least build_id_size bytes. | 
|---|
| 637 | * If set to zero, build_id_addr should be set to zero as well | 
|---|
| 638 | */ | 
|---|
| 639 | __u32 build_id_size;		/* in/out */ | 
|---|
| 640 | /* | 
|---|
| 641 | * User-supplied address of a buffer of at least vma_name_size bytes | 
|---|
| 642 | * for kernel to fill with matched VMA's name (see vma_name_size field | 
|---|
| 643 | * description above for details). | 
|---|
| 644 | * | 
|---|
| 645 | * Should be set to zero if VMA name should not be returned. | 
|---|
| 646 | */ | 
|---|
| 647 | __u64 vma_name_addr;		/* in */ | 
|---|
| 648 | /* | 
|---|
| 649 | * User-supplied address of a buffer of at least build_id_size bytes | 
|---|
| 650 | * for kernel to fill with matched VMA's ELF build ID, if available | 
|---|
| 651 | * (see build_id_size field description above for details). | 
|---|
| 652 | * | 
|---|
| 653 | * Should be set to zero if build ID should not be returned. | 
|---|
| 654 | */ | 
|---|
| 655 | __u64 build_id_addr;		/* in */ | 
|---|
| 656 | }; | 
|---|
| 657 |  | 
|---|
| 658 | #endif /* _UAPI_LINUX_FS_H */ | 
|---|
| 659 |  | 
|---|