]>
Commit | Line | Data |
---|---|---|
3dcf60bc | 1 | // SPDX-License-Identifier: GPL-2.0 |
c59ede7b | 2 | #include <linux/capability.h> |
ee6a129d | 3 | #include <linux/compat.h> |
1da177e4 | 4 | #include <linux/blkdev.h> |
d5decd3b | 5 | #include <linux/export.h> |
5a0e3ad6 | 6 | #include <linux/gfp.h> |
1da177e4 | 7 | #include <linux/blkpg.h> |
a885c8c4 | 8 | #include <linux/hdreg.h> |
1da177e4 | 9 | #include <linux/backing-dev.h> |
ff01bb48 | 10 | #include <linux/fs.h> |
2056a782 | 11 | #include <linux/blktrace_api.h> |
bbd3e064 | 12 | #include <linux/pr.h> |
7c0f6ba6 | 13 | #include <linux/uaccess.h> |
50c52250 PB |
14 | #include <linux/pagemap.h> |
15 | #include <linux/io_uring/cmd.h> | |
16 | #include <uapi/linux/blkdev.h> | |
581e2600 | 17 | #include "blk.h" |
1da177e4 | 18 | |
5fb889f5 AB |
19 | static int blkpg_do_ioctl(struct block_device *bdev, |
20 | struct blkpg_partition __user *upart, int op) | |
1da177e4 | 21 | { |
7f6be376 | 22 | struct gendisk *disk = bdev->bd_disk; |
1da177e4 | 23 | struct blkpg_partition p; |
b9355185 | 24 | sector_t start, length, capacity, end; |
1da177e4 LT |
25 | |
26 | if (!capable(CAP_SYS_ADMIN)) | |
27 | return -EACCES; | |
5fb889f5 | 28 | if (copy_from_user(&p, upart, sizeof(struct blkpg_partition))) |
1da177e4 | 29 | return -EFAULT; |
fa01b1e9 | 30 | if (bdev_is_partition(bdev)) |
1da177e4 | 31 | return -EINVAL; |
88e34126 | 32 | |
fa9156ae CH |
33 | if (p.pno <= 0) |
34 | return -EINVAL; | |
e71bf0d0 | 35 | |
fa9156ae | 36 | if (op == BLKPG_DEL_PARTITION) |
926fbb16 | 37 | return bdev_del_partition(disk, p.pno); |
e71bf0d0 | 38 | |
ccb326b5 | 39 | if (p.start < 0 || p.length <= 0 || LLONG_MAX - p.length < p.start) |
6f64f866 ML |
40 | return -EINVAL; |
41 | /* Check that the partition is aligned to the block size */ | |
42 | if (!IS_ALIGNED(p.start | p.length, bdev_logical_block_size(bdev))) | |
43 | return -EINVAL; | |
44 | ||
fa9156ae CH |
45 | start = p.start >> SECTOR_SHIFT; |
46 | length = p.length >> SECTOR_SHIFT; | |
b9355185 LL |
47 | capacity = get_capacity(disk); |
48 | ||
49 | if (check_add_overflow(start, length, &end)) | |
50 | return -EINVAL; | |
51 | ||
52 | if (start >= capacity || end > capacity) | |
53 | return -EINVAL; | |
e71bf0d0 | 54 | |
fa9156ae CH |
55 | switch (op) { |
56 | case BLKPG_ADD_PARTITION: | |
7f6be376 | 57 | return bdev_add_partition(disk, p.pno, start, length); |
fa9156ae | 58 | case BLKPG_RESIZE_PARTITION: |
3d2e7989 | 59 | return bdev_resize_partition(disk, p.pno, start, length); |
fa9156ae CH |
60 | default: |
61 | return -EINVAL; | |
1da177e4 LT |
62 | } |
63 | } | |
64 | ||
5fb889f5 AB |
65 | static int blkpg_ioctl(struct block_device *bdev, |
66 | struct blkpg_ioctl_arg __user *arg) | |
67 | { | |
68 | struct blkpg_partition __user *udata; | |
69 | int op; | |
70 | ||
71 | if (get_user(op, &arg->op) || get_user(udata, &arg->data)) | |
72 | return -EFAULT; | |
73 | ||
74 | return blkpg_do_ioctl(bdev, udata, op); | |
75 | } | |
76 | ||
77 | #ifdef CONFIG_COMPAT | |
78 | struct compat_blkpg_ioctl_arg { | |
79 | compat_int_t op; | |
80 | compat_int_t flags; | |
81 | compat_int_t datalen; | |
82 | compat_caddr_t data; | |
83 | }; | |
84 | ||
85 | static int compat_blkpg_ioctl(struct block_device *bdev, | |
86 | struct compat_blkpg_ioctl_arg __user *arg) | |
87 | { | |
88 | compat_caddr_t udata; | |
89 | int op; | |
90 | ||
91 | if (get_user(op, &arg->op) || get_user(udata, &arg->data)) | |
92 | return -EFAULT; | |
93 | ||
94 | return blkpg_do_ioctl(bdev, compat_ptr(udata), op); | |
95 | } | |
96 | #endif | |
97 | ||
7a07210b PB |
98 | /* |
99 | * Check that [start, start + len) is a valid range from the block device's | |
100 | * perspective, including verifying that it can be correctly translated into | |
101 | * logical block addresses. | |
102 | */ | |
103 | static int blk_validate_byte_range(struct block_device *bdev, | |
104 | uint64_t start, uint64_t len) | |
105 | { | |
106 | unsigned int bs_mask = bdev_logical_block_size(bdev) - 1; | |
107 | uint64_t end; | |
108 | ||
109 | if ((start | len) & bs_mask) | |
110 | return -EINVAL; | |
111 | if (!len) | |
112 | return -EINVAL; | |
113 | if (check_add_overflow(start, len, &end) || end > bdev_nr_bytes(bdev)) | |
114 | return -EINVAL; | |
115 | ||
116 | return 0; | |
117 | } | |
118 | ||
05bdb996 | 119 | static int blk_ioctl_discard(struct block_device *bdev, blk_mode_t mode, |
44abff2c | 120 | unsigned long arg) |
d30a2605 | 121 | { |
7a07210b | 122 | uint64_t range[2], start, len; |
719c15a7 CH |
123 | struct bio *prev = NULL, *bio; |
124 | sector_t sector, nr_sects; | |
125 | struct blk_plug plug; | |
384d87ef | 126 | int err; |
d8e4bb81 | 127 | |
d8e4bb81 CH |
128 | if (copy_from_user(range, (void __user *)arg, sizeof(range))) |
129 | return -EFAULT; | |
d8e4bb81 CH |
130 | start = range[0]; |
131 | len = range[1]; | |
8d57a98c | 132 | |
7a07210b PB |
133 | if (!bdev_max_discard_sectors(bdev)) |
134 | return -EOPNOTSUPP; | |
d30a2605 | 135 | |
7a07210b PB |
136 | if (!(mode & BLK_OPEN_WRITE)) |
137 | return -EBADF; | |
138 | if (bdev_read_only(bdev)) | |
139 | return -EPERM; | |
140 | err = blk_validate_byte_range(bdev, start, len); | |
141 | if (err) | |
142 | return err; | |
384d87ef | 143 | |
881494ed | 144 | filemap_invalidate_lock(bdev->bd_mapping); |
7a07210b | 145 | err = truncate_bdev_range(bdev, mode, start, start + len - 1); |
384d87ef | 146 | if (err) |
7607c44c | 147 | goto fail; |
719c15a7 CH |
148 | |
149 | sector = start >> SECTOR_SHIFT; | |
150 | nr_sects = len >> SECTOR_SHIFT; | |
151 | ||
152 | blk_start_plug(&plug); | |
153 | while (1) { | |
154 | if (fatal_signal_pending(current)) { | |
155 | if (prev) | |
156 | bio_await_chain(prev); | |
157 | err = -EINTR; | |
158 | goto out_unplug; | |
159 | } | |
160 | bio = blk_alloc_discard_bio(bdev, &sector, &nr_sects, |
161 | GFP_KERNEL); | |
162 | if (!bio) | |
163 | break; | |
164 | prev = bio_chain_and_submit(prev, bio); | |
165 | } | |
166 | if (prev) { | |
167 | err = submit_bio_wait(prev); | |
168 | if (err == -EOPNOTSUPP) | |
169 | err = 0; | |
170 | bio_put(prev); | |
171 | } | |
172 | out_unplug: | |
173 | blk_finish_plug(&plug); | |
7607c44c | 174 | fail: |
881494ed | 175 | filemap_invalidate_unlock(bdev->bd_mapping); |
7607c44c | 176 | return err; |
d30a2605 DW |
177 | } |
178 | ||
05bdb996 | 179 | static int blk_ioctl_secure_erase(struct block_device *bdev, blk_mode_t mode, |
44abff2c CH |
180 | void __user *argp) |
181 | { | |
697ba0b6 | 182 | uint64_t start, len, end; |
44abff2c CH |
183 | uint64_t range[2]; |
184 | int err; | |
185 | ||
05bdb996 | 186 | if (!(mode & BLK_OPEN_WRITE)) |
44abff2c CH |
187 | return -EBADF; |
188 | if (!bdev_max_secure_erase_sectors(bdev)) | |
189 | return -EOPNOTSUPP; | |
190 | if (copy_from_user(range, argp, sizeof(range))) | |
191 | return -EFAULT; | |
192 | ||
193 | start = range[0]; | |
194 | len = range[1]; | |
195 | if ((start & 511) || (len & 511)) | |
196 | return -EINVAL; | |
697ba0b6 AD |
197 | if (check_add_overflow(start, len, &end) || |
198 | end > bdev_nr_bytes(bdev)) | |
44abff2c CH |
199 | return -EINVAL; |
200 | ||
224941e8 | 201 | filemap_invalidate_lock(bdev->bd_mapping); |
697ba0b6 | 202 | err = truncate_bdev_range(bdev, mode, start, end - 1); |
44abff2c CH |
203 | if (!err) |
204 | err = blkdev_issue_secure_erase(bdev, start >> 9, len >> 9, | |
205 | GFP_KERNEL); | |
224941e8 | 206 | filemap_invalidate_unlock(bdev->bd_mapping); |
44abff2c CH |
207 | return err; |
208 | } | |
209 | ||
210 | ||
05bdb996 | 211 | static int blk_ioctl_zeroout(struct block_device *bdev, blk_mode_t mode, |
d8e4bb81 | 212 | unsigned long arg) |
66ba32dc | 213 | { |
d8e4bb81 | 214 | uint64_t range[2]; |
22dd6d35 | 215 | uint64_t start, end, len; |
384d87ef | 216 | int err; |
d8e4bb81 | 217 | |
05bdb996 | 218 | if (!(mode & BLK_OPEN_WRITE)) |
d8e4bb81 CH |
219 | return -EBADF; |
220 | ||
221 | if (copy_from_user(range, (void __user *)arg, sizeof(range))) | |
222 | return -EFAULT; | |
223 | ||
224 | start = range[0]; | |
225 | len = range[1]; | |
22dd6d35 | 226 | end = start + len - 1; |
d8e4bb81 | 227 | |
66ba32dc MP |
228 | if (start & 511) |
229 | return -EINVAL; | |
230 | if (len & 511) | |
231 | return -EINVAL; | |
946e9937 | 232 | if (end >= (uint64_t)bdev_nr_bytes(bdev)) |
22dd6d35 DW |
233 | return -EINVAL; |
234 | if (end < start) | |
66ba32dc MP |
235 | return -EINVAL; |
236 | ||
22dd6d35 | 237 | /* Invalidate the page cache, including dirty pages */ |
881494ed | 238 | filemap_invalidate_lock(bdev->bd_mapping); |
384d87ef JK |
239 | err = truncate_bdev_range(bdev, mode, start, end); |
240 | if (err) | |
35e4c6c1 SK |
241 | goto fail; |
242 | ||
243 | err = blkdev_issue_zeroout(bdev, start >> 9, len >> 9, GFP_KERNEL, | |
bf86bcdb | 244 | BLKDEV_ZERO_NOUNMAP | BLKDEV_ZERO_KILLABLE); |
22dd6d35 | 245 | |
35e4c6c1 | 246 | fail: |
881494ed | 247 | filemap_invalidate_unlock(bdev->bd_mapping); |
35e4c6c1 | 248 | return err; |
66ba32dc MP |
249 | } |
250 | ||
9b81648c | 251 | static int put_ushort(unsigned short __user *argp, unsigned short val) |
1da177e4 | 252 | { |
9b81648c | 253 | return put_user(val, argp); |
1da177e4 LT |
254 | } |
255 | ||
9b81648c | 256 | static int put_int(int __user *argp, int val) |
1da177e4 | 257 | { |
9b81648c | 258 | return put_user(val, argp); |
1da177e4 LT |
259 | } |
260 | ||
9b81648c | 261 | static int put_uint(unsigned int __user *argp, unsigned int val) |
ac481c20 | 262 | { |
9b81648c | 263 | return put_user(val, argp); |
ac481c20 MP |
264 | } |
265 | ||
9b81648c | 266 | static int put_long(long __user *argp, long val) |
1da177e4 | 267 | { |
9b81648c | 268 | return put_user(val, argp); |
1da177e4 LT |
269 | } |
270 | ||
9b81648c | 271 | static int put_ulong(unsigned long __user *argp, unsigned long val) |
1da177e4 | 272 | { |
9b81648c | 273 | return put_user(val, argp); |
1da177e4 LT |
274 | } |
275 | ||
9b81648c | 276 | static int put_u64(u64 __user *argp, u64 val) |
1da177e4 | 277 | { |
9b81648c | 278 | return put_user(val, argp); |
1da177e4 LT |
279 | } |
280 | ||
bdc1ddad | 281 | #ifdef CONFIG_COMPAT |
c8210a57 | 282 | static int compat_put_long(compat_long_t __user *argp, long val) |
bdc1ddad | 283 | { |
9b81648c | 284 | return put_user(val, argp); |
bdc1ddad AB |
285 | } |
286 | ||
c8210a57 | 287 | static int compat_put_ulong(compat_ulong_t __user *argp, compat_ulong_t val) |
bdc1ddad | 288 | { |
9b81648c | 289 | return put_user(val, argp); |
bdc1ddad AB |
290 | } |
291 | #endif | |
292 | ||
ee6a129d AB |
293 | #ifdef CONFIG_COMPAT |
294 | /* | |
295 | * This is the equivalent of compat_ptr_ioctl(), to be used by block | |
296 | * drivers that implement only commands that are completely compatible | |
297 | * between 32-bit and 64-bit user space | |
298 | */ | |
05bdb996 | 299 | int blkdev_compat_ptr_ioctl(struct block_device *bdev, blk_mode_t mode, |
ee6a129d AB |
300 | unsigned cmd, unsigned long arg) |
301 | { | |
302 | struct gendisk *disk = bdev->bd_disk; | |
303 | ||
304 | if (disk->fops->ioctl) | |
305 | return disk->fops->ioctl(bdev, mode, cmd, | |
306 | (unsigned long)compat_ptr(arg)); | |
307 | ||
308 | return -ENOIOCTLCMD; | |
309 | } | |
310 | EXPORT_SYMBOL(blkdev_compat_ptr_ioctl); | |
311 | #endif | |
312 | ||
9a72a024 | 313 | static bool blkdev_pr_allowed(struct block_device *bdev, blk_mode_t mode) |
12629621 JX |
314 | { |
315 | /* no sense to make reservations for partitions */ | |
316 | if (bdev_is_partition(bdev)) | |
317 | return false; | |
318 | ||
319 | if (capable(CAP_SYS_ADMIN)) | |
320 | return true; | |
9a72a024 JX |
321 | /* |
322 | * Only allow unprivileged reservations if the file descriptor is open | |
323 | * for writing. | |
324 | */ | |
325 | return mode & BLK_OPEN_WRITE; | |
12629621 JX |
326 | } |
327 | ||
9a72a024 | 328 | static int blkdev_pr_register(struct block_device *bdev, blk_mode_t mode, |
bbd3e064 CH |
329 | struct pr_registration __user *arg) |
330 | { | |
331 | const struct pr_ops *ops = bdev->bd_disk->fops->pr_ops; | |
332 | struct pr_registration reg; | |
333 | ||
9a72a024 | 334 | if (!blkdev_pr_allowed(bdev, mode)) |
bbd3e064 CH |
335 | return -EPERM; |
336 | if (!ops || !ops->pr_register) | |
337 | return -EOPNOTSUPP; | |
338 | if (copy_from_user(&reg, arg, sizeof(reg))) | |
339 | return -EFAULT; | |
340 | ||
341 | if (reg.flags & ~PR_FL_IGNORE_KEY) | |
342 | return -EOPNOTSUPP; | |
343 | return ops->pr_register(bdev, reg.old_key, reg.new_key, reg.flags); | |
344 | } | |
345 | ||
9a72a024 | 346 | static int blkdev_pr_reserve(struct block_device *bdev, blk_mode_t mode, |
bbd3e064 CH |
347 | struct pr_reservation __user *arg) |
348 | { | |
349 | const struct pr_ops *ops = bdev->bd_disk->fops->pr_ops; | |
350 | struct pr_reservation rsv; | |
351 | ||
9a72a024 | 352 | if (!blkdev_pr_allowed(bdev, mode)) |
bbd3e064 CH |
353 | return -EPERM; |
354 | if (!ops || !ops->pr_reserve) | |
355 | return -EOPNOTSUPP; | |
356 | if (copy_from_user(&rsv, arg, sizeof(rsv))) | |
357 | return -EFAULT; | |
358 | ||
359 | if (rsv.flags & ~PR_FL_IGNORE_KEY) | |
360 | return -EOPNOTSUPP; | |
361 | return ops->pr_reserve(bdev, rsv.key, rsv.type, rsv.flags); | |
362 | } | |
363 | ||
9a72a024 | 364 | static int blkdev_pr_release(struct block_device *bdev, blk_mode_t mode, |
bbd3e064 CH |
365 | struct pr_reservation __user *arg) |
366 | { | |
367 | const struct pr_ops *ops = bdev->bd_disk->fops->pr_ops; | |
368 | struct pr_reservation rsv; | |
369 | ||
9a72a024 | 370 | if (!blkdev_pr_allowed(bdev, mode)) |
bbd3e064 CH |
371 | return -EPERM; |
372 | if (!ops || !ops->pr_release) | |
373 | return -EOPNOTSUPP; | |
374 | if (copy_from_user(&rsv, arg, sizeof(rsv))) | |
375 | return -EFAULT; | |
376 | ||
377 | if (rsv.flags) | |
378 | return -EOPNOTSUPP; | |
379 | return ops->pr_release(bdev, rsv.key, rsv.type); | |
380 | } | |
381 | ||
9a72a024 | 382 | static int blkdev_pr_preempt(struct block_device *bdev, blk_mode_t mode, |
bbd3e064 CH |
383 | struct pr_preempt __user *arg, bool abort) |
384 | { | |
385 | const struct pr_ops *ops = bdev->bd_disk->fops->pr_ops; | |
386 | struct pr_preempt p; | |
387 | ||
9a72a024 | 388 | if (!blkdev_pr_allowed(bdev, mode)) |
bbd3e064 CH |
389 | return -EPERM; |
390 | if (!ops || !ops->pr_preempt) | |
391 | return -EOPNOTSUPP; | |
392 | if (copy_from_user(&p, arg, sizeof(p))) | |
393 | return -EFAULT; | |
394 | ||
395 | if (p.flags) | |
396 | return -EOPNOTSUPP; | |
397 | return ops->pr_preempt(bdev, p.old_key, p.new_key, p.type, abort); | |
398 | } | |
399 | ||
9a72a024 | 400 | static int blkdev_pr_clear(struct block_device *bdev, blk_mode_t mode, |
bbd3e064 CH |
401 | struct pr_clear __user *arg) |
402 | { | |
403 | const struct pr_ops *ops = bdev->bd_disk->fops->pr_ops; | |
404 | struct pr_clear c; | |
405 | ||
9a72a024 | 406 | if (!blkdev_pr_allowed(bdev, mode)) |
bbd3e064 CH |
407 | return -EPERM; |
408 | if (!ops || !ops->pr_clear) | |
409 | return -EOPNOTSUPP; | |
410 | if (copy_from_user(&c, arg, sizeof(c))) | |
411 | return -EFAULT; | |
412 | ||
413 | if (c.flags) | |
414 | return -EOPNOTSUPP; | |
415 | return ops->pr_clear(bdev, c.key); | |
416 | } | |
417 | ||
5e4ea834 CH |
418 | static int blkdev_flushbuf(struct block_device *bdev, unsigned cmd, |
419 | unsigned long arg) | |
bb93e3a5 | 420 | { |
d8e4bb81 CH |
421 | if (!capable(CAP_SYS_ADMIN)) |
422 | return -EACCES; | |
2142b88c CH |
423 | |
424 | mutex_lock(&bdev->bd_holder_lock); | |
425 | if (bdev->bd_holder_ops && bdev->bd_holder_ops->sync) | |
426 | bdev->bd_holder_ops->sync(bdev); | |
fd146410 JK |
427 | else { |
428 | mutex_unlock(&bdev->bd_holder_lock); | |
2142b88c | 429 | sync_blockdev(bdev); |
fd146410 | 430 | } |
2142b88c | 431 | |
d8e4bb81 CH |
432 | invalidate_bdev(bdev); |
433 | return 0; | |
434 | } | |
d30a2605 | 435 | |
5e4ea834 CH |
436 | static int blkdev_roset(struct block_device *bdev, unsigned cmd, |
437 | unsigned long arg) | |
d8e4bb81 CH |
438 | { |
439 | int ret, n; | |
d30a2605 | 440 | |
bb749b31 ID |
441 | if (!capable(CAP_SYS_ADMIN)) |
442 | return -EACCES; | |
443 | ||
d8e4bb81 CH |
444 | if (get_user(n, (int __user *)arg)) |
445 | return -EFAULT; | |
e00adcad CH |
446 | if (bdev->bd_disk->fops->set_read_only) { |
447 | ret = bdev->bd_disk->fops->set_read_only(bdev, n); | |
448 | if (ret) | |
449 | return ret; | |
450 | } | |
01e198f0 AV |
451 | if (n) |
452 | bdev_set_flag(bdev, BD_READ_ONLY); | |
453 | else | |
454 | bdev_clear_flag(bdev, BD_READ_ONLY); | |
d8e4bb81 CH |
455 | return 0; |
456 | } | |
d30a2605 | 457 | |
d8e4bb81 CH |
458 | static int blkdev_getgeo(struct block_device *bdev, |
459 | struct hd_geometry __user *argp) | |
460 | { | |
461 | struct gendisk *disk = bdev->bd_disk; | |
462 | struct hd_geometry geo; | |
463 | int ret; | |
d30a2605 | 464 | |
d8e4bb81 CH |
465 | if (!argp) |
466 | return -EINVAL; | |
467 | if (!disk->fops->getgeo) | |
468 | return -ENOTTY; | |
469 | ||
470 | /* | |
471 | * We need to set the startsect first, the driver may | |
472 | * want to override it. | |
473 | */ | |
474 | memset(&geo, 0, sizeof(geo)); | |
475 | geo.start = get_start_sect(bdev); | |
476 | ret = disk->fops->getgeo(bdev, &geo); | |
477 | if (ret) | |
478 | return ret; | |
479 | if (copy_to_user(argp, &geo, sizeof(geo))) | |
480 | return -EFAULT; | |
481 | return 0; | |
482 | } | |
66ba32dc | 483 | |
bdc1ddad AB |
484 | #ifdef CONFIG_COMPAT |
485 | struct compat_hd_geometry { | |
486 | unsigned char heads; | |
487 | unsigned char sectors; | |
488 | unsigned short cylinders; | |
489 | u32 start; | |
490 | }; | |
491 | ||
9b81648c AB |
492 | static int compat_hdio_getgeo(struct block_device *bdev, |
493 | struct compat_hd_geometry __user *ugeo) | |
bdc1ddad | 494 | { |
9b81648c | 495 | struct gendisk *disk = bdev->bd_disk; |
bdc1ddad AB |
496 | struct hd_geometry geo; |
497 | int ret; | |
498 | ||
499 | if (!ugeo) | |
500 | return -EINVAL; | |
501 | if (!disk->fops->getgeo) | |
502 | return -ENOTTY; | |
503 | ||
504 | memset(&geo, 0, sizeof(geo)); | |
505 | /* | |
506 | * We need to set the startsect first, the driver may | |
507 | * want to override it. | |
508 | */ | |
509 | geo.start = get_start_sect(bdev); | |
510 | ret = disk->fops->getgeo(bdev, &geo); | |
511 | if (ret) | |
512 | return ret; | |
513 | ||
514 | ret = copy_to_user(ugeo, &geo, 4); | |
515 | ret |= put_user(geo.start, &ugeo->start); | |
516 | if (ret) | |
517 | ret = -EFAULT; | |
518 | ||
519 | return ret; | |
520 | } | |
521 | #endif | |
522 | ||
d8e4bb81 | 523 | /* set the logical block size */ |
ead083ae | 524 | static int blkdev_bszset(struct file *file, blk_mode_t mode, |
d8e4bb81 CH |
525 | int __user *argp) |
526 | { | |
ead083ae AV |
527 | // this one might be file_inode(file)->i_rdev - a rare valid |
528 | // use of file_inode() for those. | |
529 | dev_t dev = I_BDEV(file->f_mapping->host)->bd_dev; | |
530 | struct file *excl_file; | |
d8e4bb81 | 531 | int ret, n; |
66ba32dc | 532 | |
d8e4bb81 CH |
533 | if (!capable(CAP_SYS_ADMIN)) |
534 | return -EACCES; | |
535 | if (!argp) | |
536 | return -EINVAL; | |
537 | if (get_user(n, argp)) | |
538 | return -EFAULT; | |
66ba32dc | 539 | |
05bdb996 | 540 | if (mode & BLK_OPEN_EXCL) |
ead083ae | 541 | return set_blocksize(file, n); |
d30a2605 | 542 | |
ead083ae AV |
543 | excl_file = bdev_file_open_by_dev(dev, mode, &dev, NULL); |
544 | if (IS_ERR(excl_file)) | |
47816282 | 545 | return -EBUSY; |
ead083ae AV |
546 | ret = set_blocksize(excl_file, n); |
547 | fput(excl_file); | |
d8e4bb81 CH |
548 | return ret; |
549 | } | |
a885c8c4 | 550 | |
d8e4bb81 | 551 | /* |
9b81648c AB |
552 | * Common commands that are handled the same way on native and compat |
553 | * user space. Note the separate arg/argp parameters that are needed | |
554 | * to deal with the compat_ptr() conversion. | |
d8e4bb81 | 555 | */ |
05bdb996 | 556 | static int blkdev_common_ioctl(struct block_device *bdev, blk_mode_t mode, |
0f77b29a YK |
557 | unsigned int cmd, unsigned long arg, |
558 | void __user *argp) | |
d8e4bb81 | 559 | { |
d8e4bb81 CH |
560 | unsigned int max_sectors; |
561 | ||
562 | switch (cmd) { | |
563 | case BLKFLSBUF: | |
5e4ea834 | 564 | return blkdev_flushbuf(bdev, cmd, arg); |
d8e4bb81 | 565 | case BLKROSET: |
5e4ea834 | 566 | return blkdev_roset(bdev, cmd, arg); |
d8e4bb81 | 567 | case BLKDISCARD: |
44abff2c | 568 | return blk_ioctl_discard(bdev, mode, arg); |
d8e4bb81 | 569 | case BLKSECDISCARD: |
44abff2c | 570 | return blk_ioctl_secure_erase(bdev, mode, argp); |
d8e4bb81 CH |
571 | case BLKZEROOUT: |
572 | return blk_ioctl_zeroout(bdev, mode, arg); | |
7957d93b MC |
573 | case BLKGETDISKSEQ: |
574 | return put_u64(argp, bdev->bd_disk->diskseq); | |
3ed05a98 | 575 | case BLKREPORTZONE: |
5e4ea834 | 576 | return blkdev_report_zones_ioctl(bdev, cmd, arg); |
3ed05a98 | 577 | case BLKRESETZONE: |
e876df1f AJ |
578 | case BLKOPENZONE: |
579 | case BLKCLOSEZONE: | |
580 | case BLKFINISHZONE: | |
581 | return blkdev_zone_mgmt_ioctl(bdev, mode, cmd, arg); | |
72cd8757 | 582 | case BLKGETZONESZ: |
9b81648c | 583 | return put_uint(argp, bdev_zone_sectors(bdev)); |
65e4e3ee | 584 | case BLKGETNRZONES: |
b623e347 | 585 | return put_uint(argp, bdev_nr_zones(bdev)); |
45048d09 | 586 | case BLKROGET: |
9b81648c | 587 | return put_int(argp, bdev_read_only(bdev) != 0); |
ac481c20 | 588 | case BLKSSZGET: /* get block device logical block size */ |
9b81648c | 589 | return put_int(argp, bdev_logical_block_size(bdev)); |
ac481c20 | 590 | case BLKPBSZGET: /* get block device physical block size */ |
9b81648c | 591 | return put_uint(argp, bdev_physical_block_size(bdev)); |
ac481c20 | 592 | case BLKIOMIN: |
9b81648c | 593 | return put_uint(argp, bdev_io_min(bdev)); |
ac481c20 | 594 | case BLKIOOPT: |
9b81648c | 595 | return put_uint(argp, bdev_io_opt(bdev)); |
ac481c20 | 596 | case BLKALIGNOFF: |
9b81648c | 597 | return put_int(argp, bdev_alignment_offset(bdev)); |
98262f27 | 598 | case BLKDISCARDZEROES: |
9b81648c | 599 | return put_uint(argp, 0); |
45048d09 | 600 | case BLKSECTGET: |
63f26496 AM |
601 | max_sectors = min_t(unsigned int, USHRT_MAX, |
602 | queue_max_sectors(bdev_get_queue(bdev))); | |
9b81648c | 603 | return put_ushort(argp, max_sectors); |
ef00f59c | 604 | case BLKROTATIONAL: |
10f0d2a5 | 605 | return put_ushort(argp, !bdev_nonrot(bdev)); |
45048d09 AV |
606 | case BLKRASET: |
607 | case BLKFRASET: | |
608 | if(!capable(CAP_SYS_ADMIN)) | |
609 | return -EACCES; | |
a11d7fc2 | 610 | bdev->bd_disk->bdi->ra_pages = (arg * 512) / PAGE_SIZE; |
45048d09 | 611 | return 0; |
45048d09 | 612 | case BLKRRPART: |
e16e506c CH |
613 | if (!capable(CAP_SYS_ADMIN)) |
614 | return -EACCES; | |
615 | if (bdev_is_partition(bdev)) | |
616 | return -EINVAL; | |
752863bd CH |
617 | return disk_scan_partitions(bdev->bd_disk, |
618 | mode | BLK_OPEN_STRICT_SCAN); | |
45048d09 AV |
619 | case BLKTRACESTART: |
620 | case BLKTRACESTOP: | |
45048d09 | 621 | case BLKTRACETEARDOWN: |
d8e4bb81 | 622 | return blk_trace_ioctl(bdev, cmd, argp); |
bbd3e064 | 623 | case IOC_PR_REGISTER: |
9a72a024 | 624 | return blkdev_pr_register(bdev, mode, argp); |
bbd3e064 | 625 | case IOC_PR_RESERVE: |
9a72a024 | 626 | return blkdev_pr_reserve(bdev, mode, argp); |
bbd3e064 | 627 | case IOC_PR_RELEASE: |
9a72a024 | 628 | return blkdev_pr_release(bdev, mode, argp); |
bbd3e064 | 629 | case IOC_PR_PREEMPT: |
9a72a024 | 630 | return blkdev_pr_preempt(bdev, mode, argp, false); |
bbd3e064 | 631 | case IOC_PR_PREEMPT_ABORT: |
9a72a024 | 632 | return blkdev_pr_preempt(bdev, mode, argp, true); |
bbd3e064 | 633 | case IOC_PR_CLEAR: |
9a72a024 | 634 | return blkdev_pr_clear(bdev, mode, argp); |
45048d09 | 635 | default: |
9b81648c | 636 | return -ENOIOCTLCMD; |
45048d09 | 637 | } |
1da177e4 | 638 | } |
9b81648c AB |
639 | |
640 | /* | |
641 | * Always keep this in sync with compat_blkdev_ioctl() | |
642 | * to handle all incompatible commands in both functions. | |
643 | * | |
644 | * New commands must be compatible and go into blkdev_common_ioctl | |
645 | */ | |
8a709512 | 646 | long blkdev_ioctl(struct file *file, unsigned cmd, unsigned long arg) |
9b81648c | 647 | { |
8a709512 | 648 | struct block_device *bdev = I_BDEV(file->f_mapping->host); |
9b81648c | 649 | void __user *argp = (void __user *)arg; |
05bdb996 | 650 | blk_mode_t mode = file_to_blk_mode(file); |
8a709512 CH |
651 | int ret; |
652 | ||
9b81648c AB |
653 | switch (cmd) { |
654 | /* These need separate implementations for the data structure */ | |
655 | case HDIO_GETGEO: | |
656 | return blkdev_getgeo(bdev, argp); | |
657 | case BLKPG: | |
658 | return blkpg_ioctl(bdev, argp); | |
659 | ||
660 | /* Compat mode returns 32-bit data instead of 'long' */ | |
661 | case BLKRAGET: | |
662 | case BLKFRAGET: | |
663 | if (!argp) | |
664 | return -EINVAL; | |
a11d7fc2 CH |
665 | return put_long(argp, |
666 | (bdev->bd_disk->bdi->ra_pages * PAGE_SIZE) / 512); | |
9b81648c | 667 | case BLKGETSIZE: |
946e9937 | 668 | if (bdev_nr_sectors(bdev) > ~0UL) |
9b81648c | 669 | return -EFBIG; |
946e9937 | 670 | return put_ulong(argp, bdev_nr_sectors(bdev)); |
9b81648c AB |
671 | |
672 | /* The data is compatible, but the command number is different */ | |
673 | case BLKBSZGET: /* get block device soft block size (cf. BLKSSZGET) */ | |
674 | return put_int(argp, block_size(bdev)); | |
675 | case BLKBSZSET: | |
ead083ae | 676 | return blkdev_bszset(file, mode, argp); |
9b81648c | 677 | case BLKGETSIZE64: |
946e9937 | 678 | return put_u64(argp, bdev_nr_bytes(bdev)); |
9b81648c AB |
679 | |
680 | /* Incompatible alignment on i386 */ | |
681 | case BLKTRACESETUP: | |
682 | return blk_trace_ioctl(bdev, cmd, argp); | |
683 | default: | |
684 | break; | |
685 | } | |
686 | ||
0f77b29a | 687 | ret = blkdev_common_ioctl(bdev, mode, cmd, arg, argp); |
a7cb3d2f CH |
688 | if (ret != -ENOIOCTLCMD) |
689 | return ret; | |
9b81648c | 690 | |
a7cb3d2f CH |
691 | if (!bdev->bd_disk->fops->ioctl) |
692 | return -ENOTTY; | |
693 | return bdev->bd_disk->fops->ioctl(bdev, mode, cmd, arg); | |
9b81648c | 694 | } |
bdc1ddad AB |
695 | |
696 | #ifdef CONFIG_COMPAT | |
9b81648c | 697 | |
bdc1ddad AB |
698 | #define BLKBSZGET_32 _IOR(0x12, 112, int) |
699 | #define BLKBSZSET_32 _IOW(0x12, 113, int) | |
700 | #define BLKGETSIZE64_32 _IOR(0x12, 114, int) | |
701 | ||
702 | /* Most of the generic ioctls are handled in the normal fallback path. | |
703 | This assumes the blkdev's low level compat_ioctl always returns | |
704 | ENOIOCTLCMD for unknown ioctls. */ | |
705 | long compat_blkdev_ioctl(struct file *file, unsigned cmd, unsigned long arg) | |
706 | { | |
9b81648c AB |
707 | int ret; |
708 | void __user *argp = compat_ptr(arg); | |
4e7b5671 | 709 | struct block_device *bdev = I_BDEV(file->f_mapping->host); |
bdc1ddad | 710 | struct gendisk *disk = bdev->bd_disk; |
05bdb996 | 711 | blk_mode_t mode = file_to_blk_mode(file); |
bdc1ddad AB |
712 | |
713 | switch (cmd) { | |
9b81648c | 714 | /* These need separate implementations for the data structure */ |
bdc1ddad | 715 | case HDIO_GETGEO: |
9b81648c | 716 | return compat_hdio_getgeo(bdev, argp); |
bdc1ddad | 717 | case BLKPG: |
9b81648c AB |
718 | return compat_blkpg_ioctl(bdev, argp); |
719 | ||
720 | /* Compat mode returns 32-bit data instead of 'long' */ | |
bdc1ddad AB |
721 | case BLKRAGET: |
722 | case BLKFRAGET: | |
9b81648c | 723 | if (!argp) |
bdc1ddad | 724 | return -EINVAL; |
9b81648c | 725 | return compat_put_long(argp, |
a11d7fc2 | 726 | (bdev->bd_disk->bdi->ra_pages * PAGE_SIZE) / 512); |
bdc1ddad | 727 | case BLKGETSIZE: |
ccf16413 | 728 | if (bdev_nr_sectors(bdev) > ~(compat_ulong_t)0) |
bdc1ddad | 729 | return -EFBIG; |
946e9937 | 730 | return compat_put_ulong(argp, bdev_nr_sectors(bdev)); |
bdc1ddad | 731 | |
9b81648c AB |
732 | /* The data is compatible, but the command number is different */ |
733 | case BLKBSZGET_32: /* get the logical block size (cf. BLKSSZGET) */ | |
734 | return put_int(argp, bdev_logical_block_size(bdev)); | |
735 | case BLKBSZSET_32: | |
ead083ae | 736 | return blkdev_bszset(file, mode, argp); |
bdc1ddad | 737 | case BLKGETSIZE64_32: |
946e9937 | 738 | return put_u64(argp, bdev_nr_bytes(bdev)); |
bdc1ddad | 739 | |
9b81648c | 740 | /* Incompatible alignment on i386 */ |
bdc1ddad | 741 | case BLKTRACESETUP32: |
9b81648c | 742 | return blk_trace_ioctl(bdev, cmd, argp); |
bdc1ddad | 743 | default: |
9b81648c | 744 | break; |
bdc1ddad | 745 | } |
9b81648c | 746 | |
0f77b29a | 747 | ret = blkdev_common_ioctl(bdev, mode, cmd, arg, argp); |
9b81648c AB |
748 | if (ret == -ENOIOCTLCMD && disk->fops->compat_ioctl) |
749 | ret = disk->fops->compat_ioctl(bdev, mode, cmd, arg); | |
750 | ||
751 | return ret; | |
bdc1ddad AB |
752 | } |
753 | #endif | |
50c52250 PB |
754 | |
755 | struct blk_iou_cmd { | |
756 | int res; | |
757 | bool nowait; | |
758 | }; | |
759 | ||
760 | static void blk_cmd_complete(struct io_uring_cmd *cmd, unsigned int issue_flags) | |
761 | { | |
762 | struct blk_iou_cmd *bic = io_uring_cmd_to_pdu(cmd, struct blk_iou_cmd); | |
763 | ||
764 | if (bic->res == -EAGAIN && bic->nowait) | |
765 | io_uring_cmd_issue_blocking(cmd); | |
766 | else | |
767 | io_uring_cmd_done(cmd, bic->res, 0, issue_flags); | |
768 | } | |
769 | ||
770 | static void bio_cmd_bio_end_io(struct bio *bio) | |
771 | { | |
772 | struct io_uring_cmd *cmd = bio->bi_private; | |
773 | struct blk_iou_cmd *bic = io_uring_cmd_to_pdu(cmd, struct blk_iou_cmd); | |
774 | ||
775 | if (unlikely(bio->bi_status) && !bic->res) | |
776 | bic->res = blk_status_to_errno(bio->bi_status); | |
777 | ||
778 | io_uring_cmd_do_in_task_lazy(cmd, blk_cmd_complete); | |
779 | bio_put(bio); | |
780 | } | |
781 | ||
782 | static int blkdev_cmd_discard(struct io_uring_cmd *cmd, | |
783 | struct block_device *bdev, | |
784 | uint64_t start, uint64_t len, bool nowait) | |
785 | { | |
786 | struct blk_iou_cmd *bic = io_uring_cmd_to_pdu(cmd, struct blk_iou_cmd); | |
787 | gfp_t gfp = nowait ? GFP_NOWAIT : GFP_KERNEL; | |
788 | sector_t sector = start >> SECTOR_SHIFT; | |
789 | sector_t nr_sects = len >> SECTOR_SHIFT; | |
790 | struct bio *prev = NULL, *bio; | |
791 | int err; | |
792 | ||
793 | if (!bdev_max_discard_sectors(bdev)) | |
794 | return -EOPNOTSUPP; | |
795 | if (!(file_to_blk_mode(cmd->file) & BLK_OPEN_WRITE)) | |
796 | return -EBADF; | |
797 | if (bdev_read_only(bdev)) | |
798 | return -EPERM; | |
799 | err = blk_validate_byte_range(bdev, start, len); | |
800 | if (err) | |
801 | return err; | |
802 | ||
803 | err = filemap_invalidate_pages(bdev->bd_mapping, start, | |
804 | start + len - 1, nowait); | |
805 | if (err) | |
806 | return err; | |
807 | ||
808 | while (true) { | |
809 | bio = blk_alloc_discard_bio(bdev, &sector, &nr_sects, gfp); | |
810 | if (!bio) | |
811 | break; | |
812 | if (nowait) { | |
813 | /* | |
814 | * Don't allow multi-bio non-blocking submissions as | |
815 | * subsequent bios may fail but we won't get a direct | |
816 | * indication of that. Normally, the caller should | |
817 | * retry from a blocking context. | |
818 | */ | |
819 | if (unlikely(nr_sects)) { | |
820 | bio_put(bio); | |
821 | return -EAGAIN; | |
822 | } | |
823 | bio->bi_opf |= REQ_NOWAIT; | |
824 | } | |
825 | ||
826 | prev = bio_chain_and_submit(prev, bio); | |
827 | } | |
828 | if (unlikely(!prev)) | |
829 | return -EAGAIN; | |
830 | if (unlikely(nr_sects)) | |
831 | bic->res = -EAGAIN; | |
832 | ||
833 | prev->bi_private = cmd; | |
834 | prev->bi_end_io = bio_cmd_bio_end_io; | |
835 | submit_bio(prev); | |
836 | return -EIOCBQUEUED; | |
837 | } | |
838 | ||
839 | int blkdev_uring_cmd(struct io_uring_cmd *cmd, unsigned int issue_flags) | |
840 | { | |
841 | struct block_device *bdev = I_BDEV(cmd->file->f_mapping->host); | |
842 | struct blk_iou_cmd *bic = io_uring_cmd_to_pdu(cmd, struct blk_iou_cmd); | |
843 | const struct io_uring_sqe *sqe = cmd->sqe; | |
844 | u32 cmd_op = cmd->cmd_op; | |
845 | uint64_t start, len; | |
846 | ||
847 | if (unlikely(sqe->ioprio || sqe->__pad1 || sqe->len || | |
848 | sqe->rw_flags || sqe->file_index)) | |
849 | return -EINVAL; | |
850 | ||
851 | bic->res = 0; | |
852 | bic->nowait = issue_flags & IO_URING_F_NONBLOCK; | |
853 | ||
854 | start = READ_ONCE(sqe->addr); | |
855 | len = READ_ONCE(sqe->addr3); | |
856 | ||
857 | switch (cmd_op) { | |
858 | case BLOCK_URING_CMD_DISCARD: | |
859 | return blkdev_cmd_discard(cmd, bdev, start, len, bic->nowait); | |
860 | } | |
861 | return -EINVAL; | |
862 | } |