/*
 * Functions related to generic helper functions
 */
#include <linux/kernel.h>
#include <linux/module.h>
#include <linux/bio.h>
#include <linux/blkdev.h>
#include <linux/scatterlist.h>

#include "blk.h"

struct bio_batch {
	atomic_t		done;
	int			error;
	struct completion	*wait;
};

static void bio_batch_end_io(struct bio *bio)
{
	struct bio_batch *bb = bio->bi_private;

	if (bio->bi_error && bio->bi_error != -EOPNOTSUPP)
		bb->error = bio->bi_error;
	if (atomic_dec_and_test(&bb->done))
		complete(bb->wait);
	bio_put(bio);
}

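/*
 * How the batch accounting works: "done" starts at 1, an extra
 * reference held by the submitter; each submitted bio adds one and
 * bio_batch_end_io() drops one.  After submitting, the caller drops its
 * own reference, so whichever side reaches zero last completes "wait".
 * A minimal submit-side sketch (hypothetical helper, not part of this
 * file; the callers below open-code the same two steps):
 */
static inline void bio_batch_submit(struct bio_batch *bb, int rw,
				    struct bio *bio)
{
	atomic_inc(&bb->done);	/* one reference per in-flight bio */
	submit_bio(rw, bio);	/* bio_batch_end_io() drops it on completion */
}
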
/**
 * blkdev_issue_discard - queue a discard
 * @bdev: blockdev to issue discard for
 * @sector: start sector
 * @nr_sects: number of sectors to discard
 * @gfp_mask: memory allocation flags (for bio_alloc)
 * @flags: BLKDEV_DISCARD_* flags to control behaviour
 *
 * Description:
 *    Issue a discard request for the sectors in question.
 */
int blkdev_issue_discard(struct block_device *bdev, sector_t sector,
		sector_t nr_sects, gfp_t gfp_mask, unsigned long flags)
{
	DECLARE_COMPLETION_ONSTACK(wait);
	struct request_queue *q = bdev_get_queue(bdev);
	int type = REQ_WRITE | REQ_DISCARD;
	unsigned int granularity;
	int alignment;
	struct bio_batch bb;
	struct bio *bio;
	int ret = 0;
	struct blk_plug plug;

	if (!q)
		return -ENXIO;

	if (!blk_queue_discard(q))
		return -EOPNOTSUPP;

	/* Zero-sector (unknown) and one-sector granularities are the same. */
	granularity = max(q->limits.discard_granularity >> 9, 1U);
	alignment = (bdev_discard_alignment(bdev) >> 9) % granularity;

	if (flags & BLKDEV_DISCARD_SECURE) {
		if (!blk_queue_secdiscard(q))
			return -EOPNOTSUPP;
		type |= REQ_SECURE;
	}

	atomic_set(&bb.done, 1);
	bb.error = 0;
	bb.wait = &wait;

	blk_start_plug(&plug);
	while (nr_sects) {
		unsigned int req_sects;
		sector_t end_sect, tmp;

		bio = bio_alloc(gfp_mask, 1);
		if (!bio) {
			ret = -ENOMEM;
			break;
		}

		/* Make sure bi_size doesn't overflow */
		req_sects = min_t(sector_t, nr_sects, UINT_MAX >> 9);

		/*
		 * If splitting a request, and the next starting sector would be
		 * misaligned, stop the discard at the previous aligned sector.
		 */
		end_sect = sector + req_sects;
		tmp = end_sect;
		if (req_sects < nr_sects &&
		    sector_div(tmp, granularity) != alignment) {
			end_sect = end_sect - alignment;
			sector_div(end_sect, granularity);
			end_sect = end_sect * granularity + alignment;
			req_sects = end_sect - sector;
		}
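		/*
		 * Worked example (illustrative numbers, not from the
		 * source): with granularity = 8 and alignment = 2, a
		 * split that would end at end_sect = 27 is pulled back
		 * to ((27 - 2) / 8) * 8 + 2 = 26, so the next chunk
		 * starts at a sector congruent to the alignment modulo
		 * the granularity.
		 */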

		bio->bi_iter.bi_sector = sector;
		bio->bi_end_io = bio_batch_end_io;
		bio->bi_bdev = bdev;
		bio->bi_private = &bb;

		bio->bi_iter.bi_size = req_sects << 9;
		nr_sects -= req_sects;
		sector = end_sect;

		atomic_inc(&bb.done);
		submit_bio(type, bio);

		/*
		 * We can loop for a long time in here, if someone does
		 * full device discards (like mkfs). Be nice and allow
		 * us to schedule out to avoid softlocking if preempt
		 * is disabled.
		 */
		cond_resched();
	}
	blk_finish_plug(&plug);

	/* Wait for bios in-flight */
	if (!atomic_dec_and_test(&bb.done))
		wait_for_completion_io(&wait);

	if (bb.error)
		return bb.error;
	return ret;
}
EXPORT_SYMBOL(blkdev_issue_discard);
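
/*
 * Usage sketch (hypothetical caller, not part of this file): discard a
 * range and treat "discard not supported" as a harmless no-op, a common
 * pattern for callers that discard opportunistically.
 */
static int example_discard_range(struct block_device *bdev, sector_t start,
				 sector_t len)
{
	int ret = blkdev_issue_discard(bdev, start, len, GFP_KERNEL, 0);

	if (ret == -EOPNOTSUPP)
		return 0;	/* device cannot discard; nothing to do */
	return ret;
}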

/**
 * blkdev_issue_write_same - queue a write same operation
 * @bdev: target blockdev
 * @sector: start sector
 * @nr_sects: number of sectors to write
 * @gfp_mask: memory allocation flags (for bio_alloc)
 * @page: page containing data to write
 *
 * Description:
 *    Issue a write same request for the sectors in question.
 */
int blkdev_issue_write_same(struct block_device *bdev, sector_t sector,
			    sector_t nr_sects, gfp_t gfp_mask,
			    struct page *page)
{
	DECLARE_COMPLETION_ONSTACK(wait);
	struct request_queue *q = bdev_get_queue(bdev);
	unsigned int max_write_same_sectors;
	struct bio_batch bb;
	struct bio *bio;
	int ret = 0;

	if (!q)
		return -ENXIO;

	/* Ensure that max_write_same_sectors doesn't overflow bi_size */
	max_write_same_sectors = UINT_MAX >> 9;

	atomic_set(&bb.done, 1);
	bb.error = 0;
	bb.wait = &wait;

	while (nr_sects) {
		bio = bio_alloc(gfp_mask, 1);
		if (!bio) {
			ret = -ENOMEM;
			break;
		}

		bio->bi_iter.bi_sector = sector;
		bio->bi_end_io = bio_batch_end_io;
		bio->bi_bdev = bdev;
		bio->bi_private = &bb;
		bio->bi_vcnt = 1;
		bio->bi_io_vec->bv_page = page;
		bio->bi_io_vec->bv_offset = 0;
		bio->bi_io_vec->bv_len = bdev_logical_block_size(bdev);

		if (nr_sects > max_write_same_sectors) {
			bio->bi_iter.bi_size = max_write_same_sectors << 9;
			nr_sects -= max_write_same_sectors;
			sector += max_write_same_sectors;
		} else {
			bio->bi_iter.bi_size = nr_sects << 9;
			nr_sects = 0;
		}

		atomic_inc(&bb.done);
		submit_bio(REQ_WRITE | REQ_WRITE_SAME, bio);
	}

	/* Wait for bios in-flight */
	if (!atomic_dec_and_test(&bb.done))
		wait_for_completion_io(&wait);

	if (bb.error)
		return bb.error;
	return ret;
}
EXPORT_SYMBOL(blkdev_issue_write_same);
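
/*
 * Usage sketch (hypothetical, for illustration): zero a range with a
 * single repeated block by pointing the helper at ZERO_PAGE(0), the
 * same trick blkdev_issue_zeroout() uses below.
 */
static int example_write_same_zero(struct block_device *bdev,
				   sector_t sector, sector_t nr_sects)
{
	if (!bdev_write_same(bdev))
		return -EOPNOTSUPP;	/* no WRITE SAME support */
	return blkdev_issue_write_same(bdev, sector, nr_sects, GFP_KERNEL,
				       ZERO_PAGE(0));
}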

/**
 * __blkdev_issue_zeroout - generate a number of zero-filled write bios
 * @bdev: blockdev to write
 * @sector: start sector
 * @nr_sects: number of sectors to write
 * @gfp_mask: memory allocation flags (for bio_alloc)
 *
 * Description:
 *    Generate and issue a number of bios with zero-filled pages.
 */

static int __blkdev_issue_zeroout(struct block_device *bdev, sector_t sector,
				  sector_t nr_sects, gfp_t gfp_mask)
{
	int ret;
	struct bio *bio;
	struct bio_batch bb;
	unsigned int sz;
	DECLARE_COMPLETION_ONSTACK(wait);

	atomic_set(&bb.done, 1);
	bb.error = 0;
	bb.wait = &wait;

	ret = 0;
	while (nr_sects != 0) {
		bio = bio_alloc(gfp_mask,
				min(nr_sects, (sector_t)BIO_MAX_PAGES));
		if (!bio) {
			ret = -ENOMEM;
			break;
		}

		bio->bi_iter.bi_sector = sector;
		bio->bi_bdev = bdev;
		bio->bi_end_io = bio_batch_end_io;
		bio->bi_private = &bb;

		/* Fill the bio with zero pages until it is full. */
		while (nr_sects != 0) {
			sz = min((sector_t) PAGE_SIZE >> 9, nr_sects);
			ret = bio_add_page(bio, ZERO_PAGE(0), sz << 9, 0);
			nr_sects -= ret >> 9;
			sector += ret >> 9;
			if (ret < (sz << 9))
				break;
		}
		ret = 0;	/* a short bio_add_page() is not an error */
		atomic_inc(&bb.done);
		submit_bio(WRITE, bio);
	}

	/* Wait for bios in-flight */
	if (!atomic_dec_and_test(&bb.done))
		wait_for_completion_io(&wait);

	if (bb.error)
		return bb.error;
	return ret;
}

/**
 * blkdev_issue_zeroout - zero-fill a block range
 * @bdev: blockdev to write
 * @sector: start sector
 * @nr_sects: number of sectors to write
 * @gfp_mask: memory allocation flags (for bio_alloc)
 * @discard: whether to discard the block range
 *
 * Description:
 *    Zero-fill a block range.  If the discard flag is set and the block
 *    device guarantees that subsequent READ operations to the block range
 *    in question will return zeroes, the blocks will be discarded.  Should
 *    the discard request fail, if the discard flag is not set, or if
 *    discard_zeroes_data is not supported, this function will resort to
 *    zeroing the blocks manually, thus provisioning (allocating,
 *    anchoring) them.  If the block device supports the WRITE SAME command,
 *    blkdev_issue_zeroout() will use it to optimize the process of
 *    clearing the block range.  Otherwise the zeroing will be performed
 *    using regular WRITE calls.
 */

int blkdev_issue_zeroout(struct block_device *bdev, sector_t sector,
			 sector_t nr_sects, gfp_t gfp_mask, bool discard)
{
	struct request_queue *q = bdev_get_queue(bdev);

	if (discard && blk_queue_discard(q) && q->limits.discard_zeroes_data &&
	    blkdev_issue_discard(bdev, sector, nr_sects, gfp_mask, 0) == 0)
		return 0;

	if (bdev_write_same(bdev) &&
	    blkdev_issue_write_same(bdev, sector, nr_sects, gfp_mask,
				    ZERO_PAGE(0)) == 0)
		return 0;

	return __blkdev_issue_zeroout(bdev, sector, nr_sects, gfp_mask);
}
EXPORT_SYMBOL(blkdev_issue_zeroout);
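
/*
 * Usage sketch (hypothetical caller, not part of this file): zero a
 * range, letting the helper pick the cheapest mechanism the device
 * offers (discard, WRITE SAME, or plain writes).
 */
static int example_zero_range(struct block_device *bdev, sector_t start,
			      sector_t len)
{
	/* discard=true allows the discard fast path when it zeroes data */
	return blkdev_issue_zeroout(bdev, start, len, GFP_KERNEL, true);
}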