]>
Commit | Line | Data |
---|---|---|
5442680f RK |
1 | /* |
2 | * alloc.c - NILFS dat/inode allocator | |
3 | * | |
4 | * Copyright (C) 2006-2008 Nippon Telegraph and Telephone Corporation. | |
5 | * | |
6 | * This program is free software; you can redistribute it and/or modify | |
7 | * it under the terms of the GNU General Public License as published by | |
8 | * the Free Software Foundation; either version 2 of the License, or | |
9 | * (at your option) any later version. | |
10 | * | |
11 | * This program is distributed in the hope that it will be useful, | |
12 | * but WITHOUT ANY WARRANTY; without even the implied warranty of | |
13 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
14 | * GNU General Public License for more details. | |
15 | * | |
4b420ab4 RK |
16 | * Originally written by Koji Sato. |
17 | * Two allocators were unified by Ryusuke Konishi and Amagai Yoshiji. | |
5442680f RK |
18 | */ |
19 | ||
20 | #include <linux/types.h> | |
21 | #include <linux/buffer_head.h> | |
22 | #include <linux/fs.h> | |
23 | #include <linux/bitops.h> | |
5a0e3ad6 | 24 | #include <linux/slab.h> |
5442680f RK |
25 | #include "mdt.h" |
26 | #include "alloc.h" | |
27 | ||
28 | ||
db55d922 RK |
29 | /** |
30 | * nilfs_palloc_groups_per_desc_block - get the number of groups that a group | |
31 | * descriptor block can maintain | |
32 | * @inode: inode of metadata file using this allocator | |
33 | */ | |
5442680f RK |
34 | static inline unsigned long |
35 | nilfs_palloc_groups_per_desc_block(const struct inode *inode) | |
36 | { | |
f3048d17 | 37 | return i_blocksize(inode) / |
5442680f RK |
38 | sizeof(struct nilfs_palloc_group_desc); |
39 | } | |
40 | ||
db55d922 RK |
41 | /** |
42 | * nilfs_palloc_groups_count - get maximum number of groups | |
43 | * @inode: inode of metadata file using this allocator | |
44 | */ | |
5442680f RK |
45 | static inline unsigned long |
46 | nilfs_palloc_groups_count(const struct inode *inode) | |
47 | { | |
48 | return 1UL << (BITS_PER_LONG - (inode->i_blkbits + 3 /* log2(8) */)); | |
49 | } | |
50 | ||
db55d922 RK |
51 | /** |
52 | * nilfs_palloc_init_blockgroup - initialize private variables for allocator | |
53 | * @inode: inode of metadata file using this allocator | |
54 | * @entry_size: size of the persistent object | |
55 | */ | |
0c6c44cb | 56 | int nilfs_palloc_init_blockgroup(struct inode *inode, unsigned int entry_size) |
5442680f RK |
57 | { |
58 | struct nilfs_mdt_info *mi = NILFS_MDT(inode); | |
59 | ||
60 | mi->mi_bgl = kmalloc(sizeof(*mi->mi_bgl), GFP_NOFS); | |
61 | if (!mi->mi_bgl) | |
62 | return -ENOMEM; | |
63 | ||
64 | bgl_lock_init(mi->mi_bgl); | |
65 | ||
66 | nilfs_mdt_set_entry_size(inode, entry_size, 0); | |
67 | ||
68 | mi->mi_blocks_per_group = | |
69 | DIV_ROUND_UP(nilfs_palloc_entries_per_group(inode), | |
70 | mi->mi_entries_per_block) + 1; | |
076a378b RK |
71 | /* |
72 | * Number of blocks in a group including entry blocks | |
73 | * and a bitmap block | |
74 | */ | |
5442680f RK |
75 | mi->mi_blocks_per_desc_block = |
76 | nilfs_palloc_groups_per_desc_block(inode) * | |
77 | mi->mi_blocks_per_group + 1; | |
076a378b RK |
78 | /* |
79 | * Number of blocks per descriptor including the | |
80 | * descriptor block | |
81 | */ | |
5442680f RK |
82 | return 0; |
83 | } | |
84 | ||
db55d922 RK |
85 | /** |
86 | * nilfs_palloc_group - get group number and offset from an entry number | |
87 | * @inode: inode of metadata file using this allocator | |
88 | * @nr: serial number of the entry (e.g. inode number) | |
89 | * @offset: pointer to store offset number in the group | |
90 | */ | |
5442680f RK |
91 | static unsigned long nilfs_palloc_group(const struct inode *inode, __u64 nr, |
92 | unsigned long *offset) | |
93 | { | |
94 | __u64 group = nr; | |
95 | ||
96 | *offset = do_div(group, nilfs_palloc_entries_per_group(inode)); | |
97 | return group; | |
98 | } | |
99 | ||
db55d922 RK |
100 | /** |
101 | * nilfs_palloc_desc_blkoff - get block offset of a group descriptor block | |
102 | * @inode: inode of metadata file using this allocator | |
103 | * @group: group number | |
104 | * | |
105 | * nilfs_palloc_desc_blkoff() returns block offset of the descriptor | |
106 | * block which contains a descriptor of the specified group. | |
107 | */ | |
5442680f RK |
108 | static unsigned long |
109 | nilfs_palloc_desc_blkoff(const struct inode *inode, unsigned long group) | |
110 | { | |
111 | unsigned long desc_block = | |
112 | group / nilfs_palloc_groups_per_desc_block(inode); | |
113 | return desc_block * NILFS_MDT(inode)->mi_blocks_per_desc_block; | |
114 | } | |
115 | ||
db55d922 RK |
116 | /** |
117 | * nilfs_palloc_bitmap_blkoff - get block offset of a bitmap block | |
118 | * @inode: inode of metadata file using this allocator | |
119 | * @group: group number | |
120 | * | |
121 | * nilfs_palloc_bitmap_blkoff() returns block offset of the bitmap | |
122 | * block used to allocate/deallocate entries in the specified group. | |
123 | */ | |
5442680f RK |
124 | static unsigned long |
125 | nilfs_palloc_bitmap_blkoff(const struct inode *inode, unsigned long group) | |
126 | { | |
127 | unsigned long desc_offset = | |
128 | group % nilfs_palloc_groups_per_desc_block(inode); | |
129 | return nilfs_palloc_desc_blkoff(inode, group) + 1 + | |
130 | desc_offset * NILFS_MDT(inode)->mi_blocks_per_group; | |
131 | } | |
132 | ||
db55d922 RK |
133 | /** |
134 | * nilfs_palloc_group_desc_nfrees - get the number of free entries in a group | |
db55d922 | 135 | * @desc: pointer to descriptor structure for the group |
4e9e63a6 | 136 | * @lock: spin lock protecting @desc |
db55d922 | 137 | */ |
5442680f | 138 | static unsigned long |
4e9e63a6 RK |
139 | nilfs_palloc_group_desc_nfrees(const struct nilfs_palloc_group_desc *desc, |
140 | spinlock_t *lock) | |
5442680f RK |
141 | { |
142 | unsigned long nfree; | |
143 | ||
4e9e63a6 | 144 | spin_lock(lock); |
5442680f | 145 | nfree = le32_to_cpu(desc->pg_nfrees); |
4e9e63a6 | 146 | spin_unlock(lock); |
5442680f RK |
147 | return nfree; |
148 | } | |
149 | ||
db55d922 RK |
150 | /** |
151 | * nilfs_palloc_group_desc_add_entries - adjust count of free entries | |
db55d922 | 152 | * @desc: pointer to descriptor structure for the group |
4e9e63a6 | 153 | * @lock: spin lock protecting @desc |
db55d922 RK |
154 | * @n: delta to be added |
155 | */ | |
d0c14a9e | 156 | static u32 |
4e9e63a6 RK |
157 | nilfs_palloc_group_desc_add_entries(struct nilfs_palloc_group_desc *desc, |
158 | spinlock_t *lock, u32 n) | |
5442680f | 159 | { |
d0c14a9e RK |
160 | u32 nfree; |
161 | ||
4e9e63a6 | 162 | spin_lock(lock); |
5442680f | 163 | le32_add_cpu(&desc->pg_nfrees, n); |
d0c14a9e | 164 | nfree = le32_to_cpu(desc->pg_nfrees); |
4e9e63a6 | 165 | spin_unlock(lock); |
d0c14a9e | 166 | return nfree; |
5442680f RK |
167 | } |
168 | ||
db55d922 RK |
169 | /** |
170 | * nilfs_palloc_entry_blkoff - get block offset of an entry block | |
171 | * @inode: inode of metadata file using this allocator | |
172 | * @nr: serial number of the entry (e.g. inode number) | |
173 | */ | |
5442680f RK |
174 | static unsigned long |
175 | nilfs_palloc_entry_blkoff(const struct inode *inode, __u64 nr) | |
176 | { | |
177 | unsigned long group, group_offset; | |
178 | ||
179 | group = nilfs_palloc_group(inode, nr, &group_offset); | |
180 | ||
181 | return nilfs_palloc_bitmap_blkoff(inode, group) + 1 + | |
182 | group_offset / NILFS_MDT(inode)->mi_entries_per_block; | |
183 | } | |
184 | ||
db55d922 RK |
185 | /** |
186 | * nilfs_palloc_desc_block_init - initialize buffer of a group descriptor block | |
187 | * @inode: inode of metadata file | |
188 | * @bh: buffer head of the buffer to be initialized | |
189 | * @kaddr: kernel address mapped for the page including the buffer | |
190 | */ | |
5442680f RK |
191 | static void nilfs_palloc_desc_block_init(struct inode *inode, |
192 | struct buffer_head *bh, void *kaddr) | |
193 | { | |
194 | struct nilfs_palloc_group_desc *desc = kaddr + bh_offset(bh); | |
195 | unsigned long n = nilfs_palloc_groups_per_desc_block(inode); | |
196 | __le32 nfrees; | |
197 | ||
198 | nfrees = cpu_to_le32(nilfs_palloc_entries_per_group(inode)); | |
199 | while (n-- > 0) { | |
200 | desc->pg_nfrees = nfrees; | |
201 | desc++; | |
202 | } | |
203 | } | |
204 | ||
70622a20 RK |
205 | static int nilfs_palloc_get_block(struct inode *inode, unsigned long blkoff, |
206 | int create, | |
207 | void (*init_block)(struct inode *, | |
208 | struct buffer_head *, | |
209 | void *), | |
210 | struct buffer_head **bhp, | |
211 | struct nilfs_bh_assoc *prev, | |
212 | spinlock_t *lock) | |
213 | { | |
214 | int ret; | |
215 | ||
216 | spin_lock(lock); | |
217 | if (prev->bh && blkoff == prev->blkoff) { | |
218 | get_bh(prev->bh); | |
219 | *bhp = prev->bh; | |
220 | spin_unlock(lock); | |
221 | return 0; | |
222 | } | |
223 | spin_unlock(lock); | |
224 | ||
225 | ret = nilfs_mdt_get_block(inode, blkoff, create, init_block, bhp); | |
226 | if (!ret) { | |
227 | spin_lock(lock); | |
228 | /* | |
229 | * The following code must be safe for change of the | |
230 | * cache contents during the get block call. | |
231 | */ | |
232 | brelse(prev->bh); | |
233 | get_bh(*bhp); | |
234 | prev->bh = *bhp; | |
235 | prev->blkoff = blkoff; | |
236 | spin_unlock(lock); | |
237 | } | |
238 | return ret; | |
239 | } | |
240 | ||
da019954 RK |
241 | /** |
242 | * nilfs_palloc_delete_block - delete a block on the persistent allocator file | |
243 | * @inode: inode of metadata file using this allocator | |
244 | * @blkoff: block offset | |
245 | * @prev: nilfs_bh_assoc struct of the last used buffer | |
246 | * @lock: spin lock protecting @prev | |
247 | */ | |
248 | static int nilfs_palloc_delete_block(struct inode *inode, unsigned long blkoff, | |
249 | struct nilfs_bh_assoc *prev, | |
250 | spinlock_t *lock) | |
251 | { | |
252 | spin_lock(lock); | |
253 | if (prev->bh && blkoff == prev->blkoff) { | |
254 | brelse(prev->bh); | |
255 | prev->bh = NULL; | |
256 | } | |
257 | spin_unlock(lock); | |
258 | return nilfs_mdt_delete_block(inode, blkoff); | |
259 | } | |
260 | ||
db55d922 RK |
261 | /** |
262 | * nilfs_palloc_get_desc_block - get buffer head of a group descriptor block | |
263 | * @inode: inode of metadata file using this allocator | |
264 | * @group: group number | |
265 | * @create: create flag | |
266 | * @bhp: pointer to store the resultant buffer head | |
267 | */ | |
5442680f RK |
268 | static int nilfs_palloc_get_desc_block(struct inode *inode, |
269 | unsigned long group, | |
270 | int create, struct buffer_head **bhp) | |
271 | { | |
70622a20 RK |
272 | struct nilfs_palloc_cache *cache = NILFS_MDT(inode)->mi_palloc_cache; |
273 | ||
274 | return nilfs_palloc_get_block(inode, | |
275 | nilfs_palloc_desc_blkoff(inode, group), | |
276 | create, nilfs_palloc_desc_block_init, | |
277 | bhp, &cache->prev_desc, &cache->lock); | |
5442680f RK |
278 | } |
279 | ||
db55d922 RK |
280 | /** |
281 | * nilfs_palloc_get_bitmap_block - get buffer head of a bitmap block | |
282 | * @inode: inode of metadata file using this allocator | |
283 | * @group: group number | |
284 | * @create: create flag | |
285 | * @bhp: pointer to store the resultant buffer head | |
286 | */ | |
5442680f RK |
287 | static int nilfs_palloc_get_bitmap_block(struct inode *inode, |
288 | unsigned long group, | |
289 | int create, struct buffer_head **bhp) | |
290 | { | |
70622a20 RK |
291 | struct nilfs_palloc_cache *cache = NILFS_MDT(inode)->mi_palloc_cache; |
292 | ||
293 | return nilfs_palloc_get_block(inode, | |
294 | nilfs_palloc_bitmap_blkoff(inode, group), | |
295 | create, NULL, bhp, | |
296 | &cache->prev_bitmap, &cache->lock); | |
5442680f RK |
297 | } |
298 | ||
da019954 RK |
299 | /** |
300 | * nilfs_palloc_delete_bitmap_block - delete a bitmap block | |
301 | * @inode: inode of metadata file using this allocator | |
302 | * @group: group number | |
303 | */ | |
304 | static int nilfs_palloc_delete_bitmap_block(struct inode *inode, | |
305 | unsigned long group) | |
306 | { | |
307 | struct nilfs_palloc_cache *cache = NILFS_MDT(inode)->mi_palloc_cache; | |
308 | ||
309 | return nilfs_palloc_delete_block(inode, | |
310 | nilfs_palloc_bitmap_blkoff(inode, | |
311 | group), | |
312 | &cache->prev_bitmap, &cache->lock); | |
313 | } | |
314 | ||
db55d922 RK |
315 | /** |
316 | * nilfs_palloc_get_entry_block - get buffer head of an entry block | |
317 | * @inode: inode of metadata file using this allocator | |
318 | * @nr: serial number of the entry (e.g. inode number) | |
319 | * @create: create flag | |
320 | * @bhp: pointer to store the resultant buffer head | |
321 | */ | |
5442680f RK |
322 | int nilfs_palloc_get_entry_block(struct inode *inode, __u64 nr, |
323 | int create, struct buffer_head **bhp) | |
324 | { | |
70622a20 RK |
325 | struct nilfs_palloc_cache *cache = NILFS_MDT(inode)->mi_palloc_cache; |
326 | ||
327 | return nilfs_palloc_get_block(inode, | |
328 | nilfs_palloc_entry_blkoff(inode, nr), | |
329 | create, NULL, bhp, | |
330 | &cache->prev_entry, &cache->lock); | |
5442680f RK |
331 | } |
332 | ||
da019954 RK |
333 | /** |
334 | * nilfs_palloc_delete_entry_block - delete an entry block | |
335 | * @inode: inode of metadata file using this allocator | |
336 | * @nr: serial number of the entry | |
337 | */ | |
338 | static int nilfs_palloc_delete_entry_block(struct inode *inode, __u64 nr) | |
339 | { | |
340 | struct nilfs_palloc_cache *cache = NILFS_MDT(inode)->mi_palloc_cache; | |
341 | ||
342 | return nilfs_palloc_delete_block(inode, | |
343 | nilfs_palloc_entry_blkoff(inode, nr), | |
344 | &cache->prev_entry, &cache->lock); | |
345 | } | |
346 | ||
db55d922 RK |
347 | /** |
348 | * nilfs_palloc_block_get_group_desc - get kernel address of a group descriptor | |
349 | * @inode: inode of metadata file using this allocator | |
350 | * @group: group number | |
351 | * @bh: buffer head of the buffer storing the group descriptor block | |
352 | * @kaddr: kernel address mapped for the page including the buffer | |
353 | */ | |
5442680f RK |
354 | static struct nilfs_palloc_group_desc * |
355 | nilfs_palloc_block_get_group_desc(const struct inode *inode, | |
356 | unsigned long group, | |
357 | const struct buffer_head *bh, void *kaddr) | |
358 | { | |
359 | return (struct nilfs_palloc_group_desc *)(kaddr + bh_offset(bh)) + | |
360 | group % nilfs_palloc_groups_per_desc_block(inode); | |
361 | } | |
362 | ||
db55d922 RK |
363 | /** |
364 | * nilfs_palloc_block_get_entry - get kernel address of an entry | |
365 | * @inode: inode of metadata file using this allocator | |
366 | * @nr: serial number of the entry (e.g. inode number) | |
367 | * @bh: buffer head of the buffer storing the entry block | |
368 | * @kaddr: kernel address mapped for the page including the buffer | |
369 | */ | |
5442680f RK |
370 | void *nilfs_palloc_block_get_entry(const struct inode *inode, __u64 nr, |
371 | const struct buffer_head *bh, void *kaddr) | |
372 | { | |
373 | unsigned long entry_offset, group_offset; | |
374 | ||
375 | nilfs_palloc_group(inode, nr, &group_offset); | |
376 | entry_offset = group_offset % NILFS_MDT(inode)->mi_entries_per_block; | |
377 | ||
378 | return kaddr + bh_offset(bh) + | |
379 | entry_offset * NILFS_MDT(inode)->mi_entry_size; | |
380 | } | |
381 | ||
db55d922 RK |
382 | /** |
383 | * nilfs_palloc_find_available_slot - find available slot in a group | |
db55d922 | 384 | * @bitmap: bitmap of the group |
4e9e63a6 | 385 | * @target: offset number of an entry in the group (start point) |
db55d922 | 386 | * @bsize: size in bits |
4e9e63a6 | 387 | * @lock: spin lock protecting @bitmap |
db55d922 | 388 | */ |
4e9e63a6 | 389 | static int nilfs_palloc_find_available_slot(unsigned char *bitmap, |
5442680f | 390 | unsigned long target, |
0c6c44cb | 391 | unsigned int bsize, |
4e9e63a6 | 392 | spinlock_t *lock) |
5442680f | 393 | { |
18c41b37 RK |
394 | int pos, end = bsize; |
395 | ||
396 | if (likely(target < bsize)) { | |
397 | pos = target; | |
398 | do { | |
399 | pos = nilfs_find_next_zero_bit(bitmap, end, pos); | |
400 | if (pos >= end) | |
401 | break; | |
402 | if (!nilfs_set_bit_atomic(lock, pos, bitmap)) | |
403 | return pos; | |
404 | } while (++pos < end); | |
405 | ||
406 | end = target; | |
4e9e63a6 | 407 | } |
5442680f | 408 | |
18c41b37 RK |
409 | /* wrap around */ |
410 | for (pos = 0; pos < end; pos++) { | |
411 | pos = nilfs_find_next_zero_bit(bitmap, end, pos); | |
412 | if (pos >= end) | |
413 | break; | |
414 | if (!nilfs_set_bit_atomic(lock, pos, bitmap)) | |
415 | return pos; | |
5442680f | 416 | } |
18c41b37 | 417 | |
5442680f RK |
418 | return -ENOSPC; |
419 | } | |
420 | ||
db55d922 RK |
421 | /** |
422 | * nilfs_palloc_rest_groups_in_desc_block - get the remaining number of groups | |
423 | * in a group descriptor block | |
424 | * @inode: inode of metadata file using this allocator | |
425 | * @curr: current group number | |
426 | * @max: maximum number of groups | |
427 | */ | |
5442680f RK |
428 | static unsigned long |
429 | nilfs_palloc_rest_groups_in_desc_block(const struct inode *inode, | |
430 | unsigned long curr, unsigned long max) | |
431 | { | |
432 | return min_t(unsigned long, | |
433 | nilfs_palloc_groups_per_desc_block(inode) - | |
434 | curr % nilfs_palloc_groups_per_desc_block(inode), | |
435 | max - curr + 1); | |
436 | } | |
437 | ||
c7ef972c VD |
438 | /** |
439 | * nilfs_palloc_count_desc_blocks - count descriptor blocks number | |
440 | * @inode: inode of metadata file using this allocator | |
441 | * @desc_blocks: descriptor blocks number [out] | |
442 | */ | |
443 | static int nilfs_palloc_count_desc_blocks(struct inode *inode, | |
444 | unsigned long *desc_blocks) | |
445 | { | |
3568a13f | 446 | __u64 blknum; |
c7ef972c VD |
447 | int ret; |
448 | ||
449 | ret = nilfs_bmap_last_key(NILFS_I(inode)->i_bmap, &blknum); | |
450 | if (likely(!ret)) | |
451 | *desc_blocks = DIV_ROUND_UP( | |
3568a13f RK |
452 | (unsigned long)blknum, |
453 | NILFS_MDT(inode)->mi_blocks_per_desc_block); | |
c7ef972c VD |
454 | return ret; |
455 | } | |
456 | ||
457 | /** | |
458 | * nilfs_palloc_mdt_file_can_grow - check potential opportunity for | |
459 | * MDT file growing | |
460 | * @inode: inode of metadata file using this allocator | |
461 | * @desc_blocks: known current descriptor blocks count | |
462 | */ | |
463 | static inline bool nilfs_palloc_mdt_file_can_grow(struct inode *inode, | |
464 | unsigned long desc_blocks) | |
465 | { | |
466 | return (nilfs_palloc_groups_per_desc_block(inode) * desc_blocks) < | |
467 | nilfs_palloc_groups_count(inode); | |
468 | } | |
469 | ||
470 | /** | |
471 | * nilfs_palloc_count_max_entries - count max number of entries that can be | |
472 | * described by descriptor blocks count | |
473 | * @inode: inode of metadata file using this allocator | |
474 | * @nused: current number of used entries | |
475 | * @nmaxp: max number of entries [out] | |
476 | */ | |
477 | int nilfs_palloc_count_max_entries(struct inode *inode, u64 nused, u64 *nmaxp) | |
478 | { | |
479 | unsigned long desc_blocks = 0; | |
480 | u64 entries_per_desc_block, nmax; | |
481 | int err; | |
482 | ||
483 | err = nilfs_palloc_count_desc_blocks(inode, &desc_blocks); | |
484 | if (unlikely(err)) | |
485 | return err; | |
486 | ||
487 | entries_per_desc_block = (u64)nilfs_palloc_entries_per_group(inode) * | |
488 | nilfs_palloc_groups_per_desc_block(inode); | |
489 | nmax = entries_per_desc_block * desc_blocks; | |
490 | ||
491 | if (nused == nmax && | |
492 | nilfs_palloc_mdt_file_can_grow(inode, desc_blocks)) | |
493 | nmax += entries_per_desc_block; | |
494 | ||
495 | if (nused > nmax) | |
496 | return -ERANGE; | |
497 | ||
498 | *nmaxp = nmax; | |
499 | return 0; | |
500 | } | |
501 | ||
db55d922 RK |
502 | /** |
503 | * nilfs_palloc_prepare_alloc_entry - prepare to allocate a persistent object | |
504 | * @inode: inode of metadata file using this allocator | |
505 | * @req: nilfs_palloc_req structure exchanged for the allocation | |
506 | */ | |
5442680f RK |
507 | int nilfs_palloc_prepare_alloc_entry(struct inode *inode, |
508 | struct nilfs_palloc_req *req) | |
509 | { | |
510 | struct buffer_head *desc_bh, *bitmap_bh; | |
511 | struct nilfs_palloc_group_desc *desc; | |
512 | unsigned char *bitmap; | |
513 | void *desc_kaddr, *bitmap_kaddr; | |
514 | unsigned long group, maxgroup, ngroups; | |
515 | unsigned long group_offset, maxgroup_offset; | |
09ef29e0 | 516 | unsigned long n, entries_per_group; |
5442680f | 517 | unsigned long i, j; |
4e9e63a6 | 518 | spinlock_t *lock; |
5442680f RK |
519 | int pos, ret; |
520 | ||
521 | ngroups = nilfs_palloc_groups_count(inode); | |
522 | maxgroup = ngroups - 1; | |
523 | group = nilfs_palloc_group(inode, req->pr_entry_nr, &group_offset); | |
524 | entries_per_group = nilfs_palloc_entries_per_group(inode); | |
5442680f RK |
525 | |
526 | for (i = 0; i < ngroups; i += n) { | |
527 | if (group >= ngroups) { | |
528 | /* wrap around */ | |
529 | group = 0; | |
530 | maxgroup = nilfs_palloc_group(inode, req->pr_entry_nr, | |
531 | &maxgroup_offset) - 1; | |
532 | } | |
533 | ret = nilfs_palloc_get_desc_block(inode, group, 1, &desc_bh); | |
534 | if (ret < 0) | |
535 | return ret; | |
536 | desc_kaddr = kmap(desc_bh->b_page); | |
537 | desc = nilfs_palloc_block_get_group_desc( | |
538 | inode, group, desc_bh, desc_kaddr); | |
539 | n = nilfs_palloc_rest_groups_in_desc_block(inode, group, | |
540 | maxgroup); | |
541 | for (j = 0; j < n; j++, desc++, group++) { | |
4e9e63a6 RK |
542 | lock = nilfs_mdt_bgl_lock(inode, group); |
543 | if (nilfs_palloc_group_desc_nfrees(desc, lock) > 0) { | |
5442680f RK |
544 | ret = nilfs_palloc_get_bitmap_block( |
545 | inode, group, 1, &bitmap_bh); | |
546 | if (ret < 0) | |
547 | goto out_desc; | |
548 | bitmap_kaddr = kmap(bitmap_bh->b_page); | |
141bbdba | 549 | bitmap = bitmap_kaddr + bh_offset(bitmap_bh); |
5442680f | 550 | pos = nilfs_palloc_find_available_slot( |
4e9e63a6 RK |
551 | bitmap, group_offset, |
552 | entries_per_group, lock); | |
5442680f RK |
553 | if (pos >= 0) { |
554 | /* found a free entry */ | |
555 | nilfs_palloc_group_desc_add_entries( | |
4e9e63a6 | 556 | desc, lock, -1); |
5442680f RK |
557 | req->pr_entry_nr = |
558 | entries_per_group * group + pos; | |
559 | kunmap(desc_bh->b_page); | |
560 | kunmap(bitmap_bh->b_page); | |
561 | ||
562 | req->pr_desc_bh = desc_bh; | |
563 | req->pr_bitmap_bh = bitmap_bh; | |
564 | return 0; | |
565 | } | |
566 | kunmap(bitmap_bh->b_page); | |
567 | brelse(bitmap_bh); | |
568 | } | |
569 | ||
570 | group_offset = 0; | |
571 | } | |
572 | ||
573 | kunmap(desc_bh->b_page); | |
574 | brelse(desc_bh); | |
575 | } | |
576 | ||
577 | /* no entries left */ | |
578 | return -ENOSPC; | |
579 | ||
580 | out_desc: | |
581 | kunmap(desc_bh->b_page); | |
582 | brelse(desc_bh); | |
583 | return ret; | |
584 | } | |
585 | ||
db55d922 RK |
586 | /** |
587 | * nilfs_palloc_commit_alloc_entry - finish allocation of a persistent object | |
588 | * @inode: inode of metadata file using this allocator | |
589 | * @req: nilfs_palloc_req structure exchanged for the allocation | |
590 | */ | |
5442680f RK |
591 | void nilfs_palloc_commit_alloc_entry(struct inode *inode, |
592 | struct nilfs_palloc_req *req) | |
593 | { | |
5fc7b141 RK |
594 | mark_buffer_dirty(req->pr_bitmap_bh); |
595 | mark_buffer_dirty(req->pr_desc_bh); | |
5442680f RK |
596 | nilfs_mdt_mark_dirty(inode); |
597 | ||
598 | brelse(req->pr_bitmap_bh); | |
599 | brelse(req->pr_desc_bh); | |
600 | } | |
601 | ||
db55d922 RK |
602 | /** |
603 | * nilfs_palloc_commit_free_entry - finish deallocating a persistent object | |
604 | * @inode: inode of metadata file using this allocator | |
605 | * @req: nilfs_palloc_req structure exchanged for the removal | |
606 | */ | |
5442680f RK |
607 | void nilfs_palloc_commit_free_entry(struct inode *inode, |
608 | struct nilfs_palloc_req *req) | |
609 | { | |
610 | struct nilfs_palloc_group_desc *desc; | |
611 | unsigned long group, group_offset; | |
612 | unsigned char *bitmap; | |
613 | void *desc_kaddr, *bitmap_kaddr; | |
4e9e63a6 | 614 | spinlock_t *lock; |
5442680f RK |
615 | |
616 | group = nilfs_palloc_group(inode, req->pr_entry_nr, &group_offset); | |
617 | desc_kaddr = kmap(req->pr_desc_bh->b_page); | |
618 | desc = nilfs_palloc_block_get_group_desc(inode, group, | |
619 | req->pr_desc_bh, desc_kaddr); | |
620 | bitmap_kaddr = kmap(req->pr_bitmap_bh->b_page); | |
141bbdba | 621 | bitmap = bitmap_kaddr + bh_offset(req->pr_bitmap_bh); |
4e9e63a6 | 622 | lock = nilfs_mdt_bgl_lock(inode, group); |
5442680f | 623 | |
4e9e63a6 | 624 | if (!nilfs_clear_bit_atomic(lock, group_offset, bitmap)) |
d6517deb RK |
625 | nilfs_msg(inode->i_sb, KERN_WARNING, |
626 | "%s (ino=%lu): entry number %llu already freed", | |
627 | __func__, inode->i_ino, | |
628 | (unsigned long long)req->pr_entry_nr); | |
9954e7af | 629 | else |
4e9e63a6 | 630 | nilfs_palloc_group_desc_add_entries(desc, lock, 1); |
5442680f RK |
631 | |
632 | kunmap(req->pr_bitmap_bh->b_page); | |
633 | kunmap(req->pr_desc_bh->b_page); | |
634 | ||
5fc7b141 RK |
635 | mark_buffer_dirty(req->pr_desc_bh); |
636 | mark_buffer_dirty(req->pr_bitmap_bh); | |
5442680f RK |
637 | nilfs_mdt_mark_dirty(inode); |
638 | ||
639 | brelse(req->pr_bitmap_bh); | |
640 | brelse(req->pr_desc_bh); | |
641 | } | |
642 | ||
db55d922 RK |
643 | /** |
644 | * nilfs_palloc_abort_alloc_entry - cancel allocation of a persistent object | |
645 | * @inode: inode of metadata file using this allocator | |
646 | * @req: nilfs_palloc_req structure exchanged for the allocation | |
647 | */ | |
5442680f RK |
648 | void nilfs_palloc_abort_alloc_entry(struct inode *inode, |
649 | struct nilfs_palloc_req *req) | |
650 | { | |
651 | struct nilfs_palloc_group_desc *desc; | |
652 | void *desc_kaddr, *bitmap_kaddr; | |
653 | unsigned char *bitmap; | |
654 | unsigned long group, group_offset; | |
4e9e63a6 | 655 | spinlock_t *lock; |
5442680f RK |
656 | |
657 | group = nilfs_palloc_group(inode, req->pr_entry_nr, &group_offset); | |
658 | desc_kaddr = kmap(req->pr_desc_bh->b_page); | |
659 | desc = nilfs_palloc_block_get_group_desc(inode, group, | |
660 | req->pr_desc_bh, desc_kaddr); | |
661 | bitmap_kaddr = kmap(req->pr_bitmap_bh->b_page); | |
141bbdba | 662 | bitmap = bitmap_kaddr + bh_offset(req->pr_bitmap_bh); |
4e9e63a6 RK |
663 | lock = nilfs_mdt_bgl_lock(inode, group); |
664 | ||
665 | if (!nilfs_clear_bit_atomic(lock, group_offset, bitmap)) | |
d6517deb RK |
666 | nilfs_msg(inode->i_sb, KERN_WARNING, |
667 | "%s (ino=%lu): entry number %llu already freed", | |
668 | __func__, inode->i_ino, | |
669 | (unsigned long long)req->pr_entry_nr); | |
9954e7af | 670 | else |
4e9e63a6 | 671 | nilfs_palloc_group_desc_add_entries(desc, lock, 1); |
5442680f RK |
672 | |
673 | kunmap(req->pr_bitmap_bh->b_page); | |
674 | kunmap(req->pr_desc_bh->b_page); | |
675 | ||
676 | brelse(req->pr_bitmap_bh); | |
677 | brelse(req->pr_desc_bh); | |
678 | ||
679 | req->pr_entry_nr = 0; | |
680 | req->pr_bitmap_bh = NULL; | |
681 | req->pr_desc_bh = NULL; | |
682 | } | |
683 | ||
db55d922 RK |
684 | /** |
685 | * nilfs_palloc_prepare_free_entry - prepare to deallocate a persistent object | |
686 | * @inode: inode of metadata file using this allocator | |
687 | * @req: nilfs_palloc_req structure exchanged for the removal | |
688 | */ | |
5442680f RK |
689 | int nilfs_palloc_prepare_free_entry(struct inode *inode, |
690 | struct nilfs_palloc_req *req) | |
691 | { | |
692 | struct buffer_head *desc_bh, *bitmap_bh; | |
693 | unsigned long group, group_offset; | |
694 | int ret; | |
695 | ||
696 | group = nilfs_palloc_group(inode, req->pr_entry_nr, &group_offset); | |
697 | ret = nilfs_palloc_get_desc_block(inode, group, 1, &desc_bh); | |
698 | if (ret < 0) | |
699 | return ret; | |
700 | ret = nilfs_palloc_get_bitmap_block(inode, group, 1, &bitmap_bh); | |
701 | if (ret < 0) { | |
702 | brelse(desc_bh); | |
703 | return ret; | |
704 | } | |
705 | ||
706 | req->pr_desc_bh = desc_bh; | |
707 | req->pr_bitmap_bh = bitmap_bh; | |
708 | return 0; | |
709 | } | |
710 | ||
db55d922 RK |
711 | /** |
712 | * nilfs_palloc_abort_free_entry - cancel deallocating a persistent object | |
713 | * @inode: inode of metadata file using this allocator | |
714 | * @req: nilfs_palloc_req structure exchanged for the removal | |
715 | */ | |
5442680f RK |
716 | void nilfs_palloc_abort_free_entry(struct inode *inode, |
717 | struct nilfs_palloc_req *req) | |
718 | { | |
719 | brelse(req->pr_bitmap_bh); | |
720 | brelse(req->pr_desc_bh); | |
721 | ||
722 | req->pr_entry_nr = 0; | |
723 | req->pr_bitmap_bh = NULL; | |
724 | req->pr_desc_bh = NULL; | |
725 | } | |
726 | ||
db55d922 RK |
727 | /** |
728 | * nilfs_palloc_freev - deallocate a set of persistent objects | |
729 | * @inode: inode of metadata file using this allocator | |
730 | * @entry_nrs: array of entry numbers to be deallocated | |
731 | * @nitems: number of entries stored in @entry_nrs | |
732 | */ | |
5442680f RK |
733 | int nilfs_palloc_freev(struct inode *inode, __u64 *entry_nrs, size_t nitems) |
734 | { | |
735 | struct buffer_head *desc_bh, *bitmap_bh; | |
736 | struct nilfs_palloc_group_desc *desc; | |
737 | unsigned char *bitmap; | |
738 | void *desc_kaddr, *bitmap_kaddr; | |
739 | unsigned long group, group_offset; | |
d0c14a9e | 740 | __u64 group_min_nr, last_nrs[8]; |
b2258094 | 741 | const unsigned long epg = nilfs_palloc_entries_per_group(inode); |
0c6c44cb RK |
742 | const unsigned int epb = NILFS_MDT(inode)->mi_entries_per_block; |
743 | unsigned int entry_start, end, pos; | |
4e9e63a6 | 744 | spinlock_t *lock; |
d0c14a9e RK |
745 | int i, j, k, ret; |
746 | u32 nfree; | |
5442680f | 747 | |
349dbc36 | 748 | for (i = 0; i < nitems; i = j) { |
d0c14a9e RK |
749 | int change_group = false; |
750 | int nempties = 0, n = 0; | |
751 | ||
5442680f RK |
752 | group = nilfs_palloc_group(inode, entry_nrs[i], &group_offset); |
753 | ret = nilfs_palloc_get_desc_block(inode, group, 0, &desc_bh); | |
754 | if (ret < 0) | |
755 | return ret; | |
756 | ret = nilfs_palloc_get_bitmap_block(inode, group, 0, | |
757 | &bitmap_bh); | |
758 | if (ret < 0) { | |
759 | brelse(desc_bh); | |
760 | return ret; | |
761 | } | |
b2258094 RK |
762 | |
763 | /* Get the first entry number of the group */ | |
764 | group_min_nr = (__u64)group * epg; | |
765 | ||
5442680f | 766 | bitmap_kaddr = kmap(bitmap_bh->b_page); |
141bbdba | 767 | bitmap = bitmap_kaddr + bh_offset(bitmap_bh); |
4e9e63a6 | 768 | lock = nilfs_mdt_bgl_lock(inode, group); |
d0c14a9e RK |
769 | |
770 | j = i; | |
771 | entry_start = rounddown(group_offset, epb); | |
772 | do { | |
4e9e63a6 RK |
773 | if (!nilfs_clear_bit_atomic(lock, group_offset, |
774 | bitmap)) { | |
d6517deb RK |
775 | nilfs_msg(inode->i_sb, KERN_WARNING, |
776 | "%s (ino=%lu): entry number %llu already freed", | |
777 | __func__, inode->i_ino, | |
778 | (unsigned long long)entry_nrs[j]); | |
9954e7af RK |
779 | } else { |
780 | n++; | |
5442680f | 781 | } |
d0c14a9e RK |
782 | |
783 | j++; | |
784 | if (j >= nitems || entry_nrs[j] < group_min_nr || | |
785 | entry_nrs[j] >= group_min_nr + epg) { | |
786 | change_group = true; | |
787 | } else { | |
788 | group_offset = entry_nrs[j] - group_min_nr; | |
789 | if (group_offset >= entry_start && | |
790 | group_offset < entry_start + epb) { | |
791 | /* This entry is in the same block */ | |
792 | continue; | |
793 | } | |
794 | } | |
795 | ||
796 | /* Test if the entry block is empty or not */ | |
797 | end = entry_start + epb; | |
798 | pos = nilfs_find_next_bit(bitmap, end, entry_start); | |
799 | if (pos >= end) { | |
800 | last_nrs[nempties++] = entry_nrs[j - 1]; | |
801 | if (nempties >= ARRAY_SIZE(last_nrs)) | |
802 | break; | |
803 | } | |
804 | ||
805 | if (change_group) | |
806 | break; | |
807 | ||
808 | /* Go on to the next entry block */ | |
809 | entry_start = rounddown(group_offset, epb); | |
810 | } while (true); | |
5442680f RK |
811 | |
812 | kunmap(bitmap_bh->b_page); | |
d0c14a9e RK |
813 | mark_buffer_dirty(bitmap_bh); |
814 | brelse(bitmap_bh); | |
5442680f | 815 | |
d0c14a9e RK |
816 | for (k = 0; k < nempties; k++) { |
817 | ret = nilfs_palloc_delete_entry_block(inode, | |
818 | last_nrs[k]); | |
d6517deb RK |
819 | if (ret && ret != -ENOENT) |
820 | nilfs_msg(inode->i_sb, KERN_WARNING, | |
821 | "error %d deleting block that object (entry=%llu, ino=%lu) belongs to", | |
822 | ret, (unsigned long long)last_nrs[k], | |
823 | inode->i_ino); | |
d0c14a9e RK |
824 | } |
825 | ||
826 | desc_kaddr = kmap_atomic(desc_bh->b_page); | |
827 | desc = nilfs_palloc_block_get_group_desc( | |
828 | inode, group, desc_bh, desc_kaddr); | |
829 | nfree = nilfs_palloc_group_desc_add_entries(desc, lock, n); | |
830 | kunmap_atomic(desc_kaddr); | |
5fc7b141 | 831 | mark_buffer_dirty(desc_bh); |
5442680f | 832 | nilfs_mdt_mark_dirty(inode); |
5442680f | 833 | brelse(desc_bh); |
d0c14a9e RK |
834 | |
835 | if (nfree == nilfs_palloc_entries_per_group(inode)) { | |
836 | ret = nilfs_palloc_delete_bitmap_block(inode, group); | |
d6517deb RK |
837 | if (ret && ret != -ENOENT) |
838 | nilfs_msg(inode->i_sb, KERN_WARNING, | |
839 | "error %d deleting bitmap block of group=%lu, ino=%lu", | |
840 | ret, group, inode->i_ino); | |
d0c14a9e | 841 | } |
5442680f RK |
842 | } |
843 | return 0; | |
844 | } | |
db38d5ad RK |
845 | |
846 | void nilfs_palloc_setup_cache(struct inode *inode, | |
847 | struct nilfs_palloc_cache *cache) | |
848 | { | |
849 | NILFS_MDT(inode)->mi_palloc_cache = cache; | |
850 | spin_lock_init(&cache->lock); | |
851 | } | |
852 | ||
853 | void nilfs_palloc_clear_cache(struct inode *inode) | |
854 | { | |
855 | struct nilfs_palloc_cache *cache = NILFS_MDT(inode)->mi_palloc_cache; | |
856 | ||
857 | spin_lock(&cache->lock); | |
858 | brelse(cache->prev_desc.bh); | |
859 | brelse(cache->prev_bitmap.bh); | |
860 | brelse(cache->prev_entry.bh); | |
861 | cache->prev_desc.bh = NULL; | |
862 | cache->prev_bitmap.bh = NULL; | |
863 | cache->prev_entry.bh = NULL; | |
864 | spin_unlock(&cache->lock); | |
865 | } | |
866 | ||
867 | void nilfs_palloc_destroy_cache(struct inode *inode) | |
868 | { | |
869 | nilfs_palloc_clear_cache(inode); | |
870 | NILFS_MDT(inode)->mi_palloc_cache = NULL; | |
871 | } |