1/* SPDX-License-Identifier: GPL-2.0 */ 2#ifndef _BCACHEFS_IOCTL_H 3#define _BCACHEFS_IOCTL_H 4 5#include <linux/uuid.h> 6#include <asm/ioctl.h> 7#include "bcachefs_format.h" 8 9/* 10 * Flags common to multiple ioctls: 11 */ 12#define BCH_FORCE_IF_DATA_LOST (1 << 0) 13#define BCH_FORCE_IF_METADATA_LOST (1 << 1) 14#define BCH_FORCE_IF_DATA_DEGRADED (1 << 2) 15#define BCH_FORCE_IF_METADATA_DEGRADED (1 << 3) 16 17#define BCH_FORCE_IF_LOST \ 18 (BCH_FORCE_IF_DATA_LOST| \ 19 BCH_FORCE_IF_METADATA_LOST) 20#define BCH_FORCE_IF_DEGRADED \ 21 (BCH_FORCE_IF_DATA_DEGRADED| \ 22 BCH_FORCE_IF_METADATA_DEGRADED) 23 24/* 25 * If cleared, ioctl that refer to a device pass it as a pointer to a pathname 26 * (e.g. /dev/sda1); if set, the dev field is the device's index within the 27 * filesystem: 28 */ 29#define BCH_BY_INDEX (1 << 4) 30 31/* 32 * For BCH_IOCTL_READ_SUPER: get superblock of a specific device, not filesystem 33 * wide superblock: 34 */ 35#define BCH_READ_DEV (1 << 5) 36 37/* global control dev: */ 38 39/* These are currently broken, and probably unnecessary: */ 40#if 0 41#define BCH_IOCTL_ASSEMBLE _IOW(0xbc, 1, struct bch_ioctl_assemble) 42#define BCH_IOCTL_INCREMENTAL _IOW(0xbc, 2, struct bch_ioctl_incremental) 43 44struct bch_ioctl_assemble { 45 __u32 flags; 46 __u32 nr_devs; 47 __u64 pad; 48 __u64 devs[]; 49}; 50 51struct bch_ioctl_incremental { 52 __u32 flags; 53 __u64 pad; 54 __u64 dev; 55}; 56#endif 57 58/* filesystem ioctls: */ 59 60#define BCH_IOCTL_QUERY_UUID _IOR(0xbc, 1, struct bch_ioctl_query_uuid) 61 62/* These only make sense when we also have incremental assembly */ 63#if 0 64#define BCH_IOCTL_START _IOW(0xbc, 2, struct bch_ioctl_start) 65#define BCH_IOCTL_STOP _IO(0xbc, 3) 66#endif 67 68#define BCH_IOCTL_DISK_ADD _IOW(0xbc, 4, struct bch_ioctl_disk) 69#define BCH_IOCTL_DISK_REMOVE _IOW(0xbc, 5, struct bch_ioctl_disk) 70#define BCH_IOCTL_DISK_ONLINE _IOW(0xbc, 6, struct bch_ioctl_disk) 71#define BCH_IOCTL_DISK_OFFLINE _IOW(0xbc, 7, struct bch_ioctl_disk) 72#define BCH_IOCTL_DISK_SET_STATE _IOW(0xbc, 8, struct bch_ioctl_disk_set_state) 73#define BCH_IOCTL_DATA _IOW(0xbc, 10, struct bch_ioctl_data) 74#define BCH_IOCTL_FS_USAGE _IOWR(0xbc, 11, struct bch_ioctl_fs_usage) 75#define BCH_IOCTL_DEV_USAGE _IOWR(0xbc, 11, struct bch_ioctl_dev_usage) 76#define BCH_IOCTL_READ_SUPER _IOW(0xbc, 12, struct bch_ioctl_read_super) 77#define BCH_IOCTL_DISK_GET_IDX _IOW(0xbc, 13, struct bch_ioctl_disk_get_idx) 78#define BCH_IOCTL_DISK_RESIZE _IOW(0xbc, 14, struct bch_ioctl_disk_resize) 79#define BCH_IOCTL_DISK_RESIZE_JOURNAL _IOW(0xbc,15, struct bch_ioctl_disk_resize_journal) 80 81#define BCH_IOCTL_SUBVOLUME_CREATE _IOW(0xbc, 16, struct bch_ioctl_subvolume) 82#define BCH_IOCTL_SUBVOLUME_DESTROY _IOW(0xbc, 17, struct bch_ioctl_subvolume) 83 84#define BCH_IOCTL_DEV_USAGE_V2 _IOWR(0xbc, 18, struct bch_ioctl_dev_usage_v2) 85 86#define BCH_IOCTL_FSCK_OFFLINE _IOW(0xbc, 19, struct bch_ioctl_fsck_offline) 87#define BCH_IOCTL_FSCK_ONLINE _IOW(0xbc, 20, struct bch_ioctl_fsck_online) 88 89/* ioctl below act on a particular file, not the filesystem as a whole: */ 90 91#define BCHFS_IOC_REINHERIT_ATTRS _IOR(0xbc, 64, const char __user *) 92 93/* 94 * BCH_IOCTL_QUERY_UUID: get filesystem UUID 95 * 96 * Returns user visible UUID, not internal UUID (which may not ever be changed); 97 * the filesystem's sysfs directory may be found under /sys/fs/bcachefs with 98 * this UUID. 99 */ 100struct bch_ioctl_query_uuid { 101 __uuid_t uuid; 102}; 103 104#if 0 105struct bch_ioctl_start { 106 __u32 flags; 107 __u32 pad; 108}; 109#endif 110 111/* 112 * BCH_IOCTL_DISK_ADD: add a new device to an existing filesystem 113 * 114 * The specified device must not be open or in use. On success, the new device 115 * will be an online member of the filesystem just like any other member. 116 * 117 * The device must first be prepared by userspace by formatting with a bcachefs 118 * superblock, which is only used for passing in superblock options/parameters 119 * for that device (in struct bch_member). The new device's superblock should 120 * not claim to be a member of any existing filesystem - UUIDs on it will be 121 * ignored. 122 */ 123 124/* 125 * BCH_IOCTL_DISK_REMOVE: permanently remove a member device from a filesystem 126 * 127 * Any data present on @dev will be permanently deleted, and @dev will be 128 * removed from its slot in the filesystem's list of member devices. The device 129 * may be either offline or offline. 130 * 131 * Will fail removing @dev would leave us with insufficient read write devices 132 * or degraded/unavailable data, unless the approprate BCH_FORCE_IF_* flags are 133 * set. 134 */ 135 136/* 137 * BCH_IOCTL_DISK_ONLINE: given a disk that is already a member of a filesystem 138 * but is not open (e.g. because we started in degraded mode), bring it online 139 * 140 * all existing data on @dev will be available once the device is online, 141 * exactly as if @dev was present when the filesystem was first mounted 142 */ 143 144/* 145 * BCH_IOCTL_DISK_OFFLINE: offline a disk, causing the kernel to close that 146 * block device, without removing it from the filesystem (so it can be brought 147 * back online later) 148 * 149 * Data present on @dev will be unavailable while @dev is offline (unless 150 * replicated), but will still be intact and untouched if @dev is brought back 151 * online 152 * 153 * Will fail (similarly to BCH_IOCTL_DISK_SET_STATE) if offlining @dev would 154 * leave us with insufficient read write devices or degraded/unavailable data, 155 * unless the approprate BCH_FORCE_IF_* flags are set. 156 */ 157 158struct bch_ioctl_disk { 159 __u32 flags; 160 __u32 pad; 161 __u64 dev; 162}; 163 164/* 165 * BCH_IOCTL_DISK_SET_STATE: modify state of a member device of a filesystem 166 * 167 * @new_state - one of the bch_member_state states (rw, ro, failed, 168 * spare) 169 * 170 * Will refuse to change member state if we would then have insufficient devices 171 * to write to, or if it would result in degraded data (when @new_state is 172 * failed or spare) unless the appropriate BCH_FORCE_IF_* flags are set. 173 */ 174struct bch_ioctl_disk_set_state { 175 __u32 flags; 176 __u8 new_state; 177 __u8 pad[3]; 178 __u64 dev; 179}; 180 181#define BCH_DATA_OPS() \ 182 x(scrub, 0) \ 183 x(rereplicate, 1) \ 184 x(migrate, 2) \ 185 x(rewrite_old_nodes, 3) \ 186 x(drop_extra_replicas, 4) 187 188enum bch_data_ops { 189#define x(t, n) BCH_DATA_OP_##t = n, 190 BCH_DATA_OPS() 191#undef x 192 BCH_DATA_OP_NR 193}; 194 195/* 196 * BCH_IOCTL_DATA: operations that walk and manipulate filesystem data (e.g. 197 * scrub, rereplicate, migrate). 198 * 199 * This ioctl kicks off a job in the background, and returns a file descriptor. 200 * Reading from the file descriptor returns a struct bch_ioctl_data_event, 201 * indicating current progress, and closing the file descriptor will stop the 202 * job. The file descriptor is O_CLOEXEC. 203 */ 204struct bch_ioctl_data { 205 __u16 op; 206 __u8 start_btree; 207 __u8 end_btree; 208 __u32 flags; 209 210 struct bpos start_pos; 211 struct bpos end_pos; 212 213 union { 214 struct { 215 __u32 dev; 216 __u32 pad; 217 } migrate; 218 struct { 219 __u64 pad[8]; 220 }; 221 }; 222} __packed __aligned(8); 223 224enum bch_data_event { 225 BCH_DATA_EVENT_PROGRESS = 0, 226 /* XXX: add an event for reporting errors */ 227 BCH_DATA_EVENT_NR = 1, 228}; 229 230struct bch_ioctl_data_progress { 231 __u8 data_type; 232 __u8 btree_id; 233 __u8 pad[2]; 234 struct bpos pos; 235 236 __u64 sectors_done; 237 __u64 sectors_total; 238} __packed __aligned(8); 239 240struct bch_ioctl_data_event { 241 __u8 type; 242 __u8 pad[7]; 243 union { 244 struct bch_ioctl_data_progress p; 245 __u64 pad2[15]; 246 }; 247} __packed __aligned(8); 248 249struct bch_replicas_usage { 250 __u64 sectors; 251 struct bch_replicas_entry_v1 r; 252} __packed; 253 254static inline struct bch_replicas_usage * 255replicas_usage_next(struct bch_replicas_usage *u) 256{ 257 return (void *) u + replicas_entry_bytes(&u->r) + 8; 258} 259 260/* 261 * BCH_IOCTL_FS_USAGE: query filesystem disk space usage 262 * 263 * Returns disk space usage broken out by data type, number of replicas, and 264 * by component device 265 * 266 * @replica_entries_bytes - size, in bytes, allocated for replica usage entries 267 * 268 * On success, @replica_entries_bytes will be changed to indicate the number of 269 * bytes actually used. 270 * 271 * Returns -ERANGE if @replica_entries_bytes was too small 272 */ 273struct bch_ioctl_fs_usage { 274 __u64 capacity; 275 __u64 used; 276 __u64 online_reserved; 277 __u64 persistent_reserved[BCH_REPLICAS_MAX]; 278 279 __u32 replica_entries_bytes; 280 __u32 pad; 281 282 struct bch_replicas_usage replicas[]; 283}; 284 285/* 286 * BCH_IOCTL_DEV_USAGE: query device disk space usage 287 * 288 * Returns disk space usage broken out by data type - both by buckets and 289 * sectors. 290 */ 291struct bch_ioctl_dev_usage { 292 __u64 dev; 293 __u32 flags; 294 __u8 state; 295 __u8 pad[7]; 296 297 __u32 bucket_size; 298 __u64 nr_buckets; 299 300 __u64 buckets_ec; 301 302 struct bch_ioctl_dev_usage_type { 303 __u64 buckets; 304 __u64 sectors; 305 __u64 fragmented; 306 } d[10]; 307}; 308 309struct bch_ioctl_dev_usage_v2 { 310 __u64 dev; 311 __u32 flags; 312 __u8 state; 313 __u8 nr_data_types; 314 __u8 pad[6]; 315 316 __u32 bucket_size; 317 __u64 nr_buckets; 318 319 struct bch_ioctl_dev_usage_type d[]; 320}; 321 322/* 323 * BCH_IOCTL_READ_SUPER: read filesystem superblock 324 * 325 * Equivalent to reading the superblock directly from the block device, except 326 * avoids racing with the kernel writing the superblock or having to figure out 327 * which block device to read 328 * 329 * @sb - buffer to read into 330 * @size - size of userspace allocated buffer 331 * @dev - device to read superblock for, if BCH_READ_DEV flag is 332 * specified 333 * 334 * Returns -ERANGE if buffer provided is too small 335 */ 336struct bch_ioctl_read_super { 337 __u32 flags; 338 __u32 pad; 339 __u64 dev; 340 __u64 size; 341 __u64 sb; 342}; 343 344/* 345 * BCH_IOCTL_DISK_GET_IDX: give a path to a block device, query filesystem to 346 * determine if disk is a (online) member - if so, returns device's index 347 * 348 * Returns -ENOENT if not found 349 */ 350struct bch_ioctl_disk_get_idx { 351 __u64 dev; 352}; 353 354/* 355 * BCH_IOCTL_DISK_RESIZE: resize filesystem on a device 356 * 357 * @dev - member to resize 358 * @nbuckets - new number of buckets 359 */ 360struct bch_ioctl_disk_resize { 361 __u32 flags; 362 __u32 pad; 363 __u64 dev; 364 __u64 nbuckets; 365}; 366 367/* 368 * BCH_IOCTL_DISK_RESIZE_JOURNAL: resize journal on a device 369 * 370 * @dev - member to resize 371 * @nbuckets - new number of buckets 372 */ 373struct bch_ioctl_disk_resize_journal { 374 __u32 flags; 375 __u32 pad; 376 __u64 dev; 377 __u64 nbuckets; 378}; 379 380struct bch_ioctl_subvolume { 381 __u32 flags; 382 __u32 dirfd; 383 __u16 mode; 384 __u16 pad[3]; 385 __u64 dst_ptr; 386 __u64 src_ptr; 387}; 388 389#define BCH_SUBVOL_SNAPSHOT_CREATE (1U << 0) 390#define BCH_SUBVOL_SNAPSHOT_RO (1U << 1) 391 392/* 393 * BCH_IOCTL_FSCK_OFFLINE: run fsck from the 'bcachefs fsck' userspace command, 394 * but with the kernel's implementation of fsck: 395 */ 396struct bch_ioctl_fsck_offline { 397 __u64 flags; 398 __u64 opts; /* string */ 399 __u64 nr_devs; 400 __u64 devs[] __counted_by(nr_devs); 401}; 402 403/* 404 * BCH_IOCTL_FSCK_ONLINE: run fsck from the 'bcachefs fsck' userspace command, 405 * but with the kernel's implementation of fsck: 406 */ 407struct bch_ioctl_fsck_online { 408 __u64 flags; 409 __u64 opts; /* string */ 410}; 411 412#endif /* _BCACHEFS_IOCTL_H */ 413