]>
Commit | Line | Data |
---|---|---|
2b27bdcc | 1 | // SPDX-License-Identifier: GPL-2.0-only |
1e51764a AB |
2 | /* |
3 | * This file is part of UBIFS. | |
4 | * | |
5 | * Copyright (C) 2006-2008 Nokia Corporation. | |
6 | * | |
1e51764a AB |
7 | * Authors: Adrian Hunter |
8 | * Artem Bityutskiy (Битюцкий Артём) | |
9 | */ | |
10 | ||
11 | /* This file implements TNC functions for committing */ | |
12 | ||
2b1844a8 | 13 | #include <linux/random.h> |
8d7819b4 | 14 | #include "ubifs.h" |
1e51764a AB |
15 | |
16 | /** | |
17 | * make_idx_node - make an index node for fill-the-gaps method of TNC commit. | |
18 | * @c: UBIFS file-system description object | |
19 | * @idx: buffer in which to place new index node | |
20 | * @znode: znode from which to make new index node | |
21 | * @lnum: LEB number where new index node will be written | |
22 | * @offs: offset where new index node will be written | |
23 | * @len: length of new index node | |
24 | */ | |
25 | static int make_idx_node(struct ubifs_info *c, struct ubifs_idx_node *idx, | |
26 | struct ubifs_znode *znode, int lnum, int offs, int len) | |
27 | { | |
28 | struct ubifs_znode *zp; | |
16a26b20 | 29 | u8 hash[UBIFS_HASH_ARR_SZ]; |
1e51764a AB |
30 | int i, err; |
31 | ||
32 | /* Make index node */ | |
33 | idx->ch.node_type = UBIFS_IDX_NODE; | |
34 | idx->child_cnt = cpu_to_le16(znode->child_cnt); | |
35 | idx->level = cpu_to_le16(znode->level); | |
36 | for (i = 0; i < znode->child_cnt; i++) { | |
37 | struct ubifs_branch *br = ubifs_idx_branch(c, idx, i); | |
38 | struct ubifs_zbranch *zbr = &znode->zbranch[i]; | |
39 | ||
40 | key_write_idx(c, &zbr->key, &br->key); | |
41 | br->lnum = cpu_to_le32(zbr->lnum); | |
42 | br->offs = cpu_to_le32(zbr->offs); | |
43 | br->len = cpu_to_le32(zbr->len); | |
16a26b20 | 44 | ubifs_copy_hash(c, zbr->hash, ubifs_branch_hash(c, br)); |
1e51764a | 45 | if (!zbr->lnum || !zbr->len) { |
235c362b | 46 | ubifs_err(c, "bad ref in znode"); |
edf6be24 | 47 | ubifs_dump_znode(c, znode); |
1e51764a | 48 | if (zbr->znode) |
edf6be24 | 49 | ubifs_dump_znode(c, zbr->znode); |
df71b091 RW |
50 | |
51 | return -EINVAL; | |
1e51764a AB |
52 | } |
53 | } | |
54 | ubifs_prepare_node(c, idx, len, 0); | |
16a26b20 | 55 | ubifs_node_calc_hash(c, idx, hash); |
1e51764a | 56 | |
1e51764a AB |
57 | znode->lnum = lnum; |
58 | znode->offs = offs; | |
59 | znode->len = len; | |
1e51764a AB |
60 | |
61 | err = insert_old_idx_znode(c, znode); | |
62 | ||
63 | /* Update the parent */ | |
64 | zp = znode->parent; | |
65 | if (zp) { | |
66 | struct ubifs_zbranch *zbr; | |
67 | ||
68 | zbr = &zp->zbranch[znode->iip]; | |
69 | zbr->lnum = lnum; | |
70 | zbr->offs = offs; | |
71 | zbr->len = len; | |
16a26b20 | 72 | ubifs_copy_hash(c, hash, zbr->hash); |
1e51764a AB |
73 | } else { |
74 | c->zroot.lnum = lnum; | |
75 | c->zroot.offs = offs; | |
76 | c->zroot.len = len; | |
16a26b20 | 77 | ubifs_copy_hash(c, hash, c->zroot.hash); |
1e51764a AB |
78 | } |
79 | c->calc_idx_sz += ALIGN(len, 8); | |
80 | ||
81 | atomic_long_dec(&c->dirty_zn_cnt); | |
82 | ||
6eb61d58 RW |
83 | ubifs_assert(c, ubifs_zn_dirty(znode)); |
84 | ubifs_assert(c, ubifs_zn_cow(znode)); | |
1e51764a | 85 | |
06b282a4 AB |
86 | /* |
87 | * Note, unlike 'write_index()' we do not add memory barriers here | |
88 | * because this function is called with @c->tnc_mutex locked. | |
89 | */ | |
1e51764a AB |
90 | __clear_bit(DIRTY_ZNODE, &znode->flags); |
91 | __clear_bit(COW_ZNODE, &znode->flags); | |
92 | ||
93 | return err; | |
94 | } | |
95 | ||
96 | /** | |
97 | * fill_gap - make index nodes in gaps in dirty index LEBs. | |
98 | * @c: UBIFS file-system description object | |
99 | * @lnum: LEB number that gap appears in | |
100 | * @gap_start: offset of start of gap | |
101 | * @gap_end: offset of end of gap | |
102 | * @dirt: adds dirty space to this | |
103 | * | |
104 | * This function returns the number of index nodes written into the gap. | |
105 | */ | |
106 | static int fill_gap(struct ubifs_info *c, int lnum, int gap_start, int gap_end, | |
107 | int *dirt) | |
108 | { | |
109 | int len, gap_remains, gap_pos, written, pad_len; | |
110 | ||
6eb61d58 RW |
111 | ubifs_assert(c, (gap_start & 7) == 0); |
112 | ubifs_assert(c, (gap_end & 7) == 0); | |
113 | ubifs_assert(c, gap_end >= gap_start); | |
1e51764a AB |
114 | |
115 | gap_remains = gap_end - gap_start; | |
116 | if (!gap_remains) | |
117 | return 0; | |
118 | gap_pos = gap_start; | |
119 | written = 0; | |
120 | while (c->enext) { | |
121 | len = ubifs_idx_node_sz(c, c->enext->child_cnt); | |
122 | if (len < gap_remains) { | |
123 | struct ubifs_znode *znode = c->enext; | |
124 | const int alen = ALIGN(len, 8); | |
125 | int err; | |
126 | ||
6eb61d58 | 127 | ubifs_assert(c, alen <= gap_remains); |
1e51764a AB |
128 | err = make_idx_node(c, c->ileb_buf + gap_pos, znode, |
129 | lnum, gap_pos, len); | |
130 | if (err) | |
131 | return err; | |
132 | gap_remains -= alen; | |
133 | gap_pos += alen; | |
134 | c->enext = znode->cnext; | |
135 | if (c->enext == c->cnext) | |
136 | c->enext = NULL; | |
137 | written += 1; | |
138 | } else | |
139 | break; | |
140 | } | |
141 | if (gap_end == c->leb_size) { | |
142 | c->ileb_len = ALIGN(gap_pos, c->min_io_size); | |
143 | /* Pad to end of min_io_size */ | |
144 | pad_len = c->ileb_len - gap_pos; | |
145 | } else | |
146 | /* Pad to end of gap */ | |
147 | pad_len = gap_remains; | |
148 | dbg_gc("LEB %d:%d to %d len %d nodes written %d wasted bytes %d", | |
149 | lnum, gap_start, gap_end, gap_end - gap_start, written, pad_len); | |
150 | ubifs_pad(c, c->ileb_buf + gap_pos, pad_len); | |
151 | *dirt += pad_len; | |
152 | return written; | |
153 | } | |
154 | ||
155 | /** | |
156 | * find_old_idx - find an index node obsoleted since the last commit start. | |
157 | * @c: UBIFS file-system description object | |
158 | * @lnum: LEB number of obsoleted index node | |
159 | * @offs: offset of obsoleted index node | |
160 | * | |
161 | * Returns %1 if found and %0 otherwise. | |
162 | */ | |
163 | static int find_old_idx(struct ubifs_info *c, int lnum, int offs) | |
164 | { | |
165 | struct ubifs_old_idx *o; | |
166 | struct rb_node *p; | |
167 | ||
168 | p = c->old_idx.rb_node; | |
169 | while (p) { | |
170 | o = rb_entry(p, struct ubifs_old_idx, rb); | |
171 | if (lnum < o->lnum) | |
172 | p = p->rb_left; | |
173 | else if (lnum > o->lnum) | |
174 | p = p->rb_right; | |
175 | else if (offs < o->offs) | |
176 | p = p->rb_left; | |
177 | else if (offs > o->offs) | |
178 | p = p->rb_right; | |
179 | else | |
180 | return 1; | |
181 | } | |
182 | return 0; | |
183 | } | |
184 | ||
185 | /** | |
186 | * is_idx_node_in_use - determine if an index node can be overwritten. | |
187 | * @c: UBIFS file-system description object | |
188 | * @key: key of index node | |
189 | * @level: index node level | |
190 | * @lnum: LEB number of index node | |
191 | * @offs: offset of index node | |
192 | * | |
193 | * If @key / @lnum / @offs identify an index node that was not part of the old | |
194 | * index, then this function returns %0 (obsolete). Else if the index node was | |
195 | * part of the old index but is now dirty %1 is returned, else if it is clean %2 | |
196 | * is returned. A negative error code is returned on failure. | |
197 | */ | |
198 | static int is_idx_node_in_use(struct ubifs_info *c, union ubifs_key *key, | |
199 | int level, int lnum, int offs) | |
200 | { | |
201 | int ret; | |
202 | ||
203 | ret = is_idx_node_in_tnc(c, key, level, lnum, offs); | |
204 | if (ret < 0) | |
205 | return ret; /* Error code */ | |
206 | if (ret == 0) | |
207 | if (find_old_idx(c, lnum, offs)) | |
208 | return 1; | |
209 | return ret; | |
210 | } | |
211 | ||
212 | /** | |
213 | * layout_leb_in_gaps - layout index nodes using in-the-gaps method. | |
214 | * @c: UBIFS file-system description object | |
6abf5726 | 215 | * @p: return LEB number in @c->gap_lebs[p] |
1e51764a AB |
216 | * |
217 | * This function lays out new index nodes for dirty znodes using in-the-gaps | |
218 | * method of TNC commit. | |
219 | * This function merely puts the next znode into the next gap, making no attempt | |
220 | * to try to maximise the number of znodes that fit. | |
221 | * This function returns the number of index nodes written into the gaps, or a | |
222 | * negative error code on failure. | |
223 | */ | |
6abf5726 | 224 | static int layout_leb_in_gaps(struct ubifs_info *c, int p) |
1e51764a AB |
225 | { |
226 | struct ubifs_scan_leb *sleb; | |
227 | struct ubifs_scan_node *snod; | |
228 | int lnum, dirt = 0, gap_start, gap_end, err, written, tot_written; | |
229 | ||
230 | tot_written = 0; | |
231 | /* Get an index LEB with lots of obsolete index nodes */ | |
232 | lnum = ubifs_find_dirty_idx_leb(c); | |
233 | if (lnum < 0) | |
234 | /* | |
235 | * There also may be dirt in the index head that could be | |
236 | * filled, however we do not check there at present. | |
237 | */ | |
238 | return lnum; /* Error code */ | |
6abf5726 | 239 | c->gap_lebs[p] = lnum; |
1e51764a AB |
240 | dbg_gc("LEB %d", lnum); |
241 | /* | |
242 | * Scan the index LEB. We use the generic scan for this even though | |
243 | * it is more comprehensive and less efficient than is needed for this | |
244 | * purpose. | |
245 | */ | |
348709ba | 246 | sleb = ubifs_scan(c, lnum, 0, c->ileb_buf, 0); |
1e51764a AB |
247 | c->ileb_len = 0; |
248 | if (IS_ERR(sleb)) | |
249 | return PTR_ERR(sleb); | |
250 | gap_start = 0; | |
251 | list_for_each_entry(snod, &sleb->nodes, list) { | |
252 | struct ubifs_idx_node *idx; | |
253 | int in_use, level; | |
254 | ||
6eb61d58 | 255 | ubifs_assert(c, snod->type == UBIFS_IDX_NODE); |
1e51764a AB |
256 | idx = snod->node; |
257 | key_read(c, ubifs_idx_key(c, idx), &snod->key); | |
258 | level = le16_to_cpu(idx->level); | |
259 | /* Determine if the index node is in use (not obsolete) */ | |
260 | in_use = is_idx_node_in_use(c, &snod->key, level, lnum, | |
261 | snod->offs); | |
262 | if (in_use < 0) { | |
263 | ubifs_scan_destroy(sleb); | |
264 | return in_use; /* Error code */ | |
265 | } | |
266 | if (in_use) { | |
267 | if (in_use == 1) | |
268 | dirt += ALIGN(snod->len, 8); | |
269 | /* | |
270 | * The obsolete index nodes form gaps that can be | |
271 | * overwritten. This gap has ended because we have | |
272 | * found an index node that is still in use | |
273 | * i.e. not obsolete | |
274 | */ | |
275 | gap_end = snod->offs; | |
276 | /* Try to fill gap */ | |
277 | written = fill_gap(c, lnum, gap_start, gap_end, &dirt); | |
278 | if (written < 0) { | |
279 | ubifs_scan_destroy(sleb); | |
280 | return written; /* Error code */ | |
281 | } | |
282 | tot_written += written; | |
283 | gap_start = ALIGN(snod->offs + snod->len, 8); | |
284 | } | |
285 | } | |
286 | ubifs_scan_destroy(sleb); | |
287 | c->ileb_len = c->leb_size; | |
288 | gap_end = c->leb_size; | |
289 | /* Try to fill gap */ | |
290 | written = fill_gap(c, lnum, gap_start, gap_end, &dirt); | |
291 | if (written < 0) | |
292 | return written; /* Error code */ | |
293 | tot_written += written; | |
294 | if (tot_written == 0) { | |
295 | struct ubifs_lprops lp; | |
296 | ||
297 | dbg_gc("LEB %d wrote %d index nodes", lnum, tot_written); | |
298 | err = ubifs_read_one_lp(c, lnum, &lp); | |
299 | if (err) | |
300 | return err; | |
301 | if (lp.free == c->leb_size) { | |
302 | /* | |
303 | * We must have snatched this LEB from the idx_gc list | |
304 | * so we need to correct the free and dirty space. | |
305 | */ | |
306 | err = ubifs_change_one_lp(c, lnum, | |
307 | c->leb_size - c->ileb_len, | |
308 | dirt, 0, 0, 0); | |
309 | if (err) | |
310 | return err; | |
311 | } | |
312 | return 0; | |
313 | } | |
314 | err = ubifs_change_one_lp(c, lnum, c->leb_size - c->ileb_len, dirt, | |
315 | 0, 0, 0); | |
316 | if (err) | |
317 | return err; | |
b36a261e | 318 | err = ubifs_leb_change(c, lnum, c->ileb_buf, c->ileb_len); |
1e51764a AB |
319 | if (err) |
320 | return err; | |
321 | dbg_gc("LEB %d wrote %d index nodes", lnum, tot_written); | |
322 | return tot_written; | |
323 | } | |
324 | ||
325 | /** | |
326 | * get_leb_cnt - calculate the number of empty LEBs needed to commit. | |
327 | * @c: UBIFS file-system description object | |
328 | * @cnt: number of znodes to commit | |
329 | * | |
330 | * This function returns the number of empty LEBs needed to commit @cnt znodes | |
331 | * to the current index head. The number is not exact and may be more than | |
332 | * needed. | |
333 | */ | |
334 | static int get_leb_cnt(struct ubifs_info *c, int cnt) | |
335 | { | |
336 | int d; | |
337 | ||
338 | /* Assume maximum index node size (i.e. overestimate space needed) */ | |
339 | cnt -= (c->leb_size - c->ihead_offs) / c->max_idx_node_sz; | |
340 | if (cnt < 0) | |
341 | cnt = 0; | |
342 | d = c->leb_size / c->max_idx_node_sz; | |
343 | return DIV_ROUND_UP(cnt, d); | |
344 | } | |
345 | ||
346 | /** | |
347 | * layout_in_gaps - in-the-gaps method of committing TNC. | |
348 | * @c: UBIFS file-system description object | |
349 | * @cnt: number of dirty znodes to commit. | |
350 | * | |
351 | * This function lays out new index nodes for dirty znodes using in-the-gaps | |
352 | * method of TNC commit. | |
353 | * | |
354 | * This function returns %0 on success and a negative error code on failure. | |
355 | */ | |
356 | static int layout_in_gaps(struct ubifs_info *c, int cnt) | |
357 | { | |
6abf5726 | 358 | int err, leb_needed_cnt, written, p = 0, old_idx_lebs, *gap_lebs; |
1e51764a AB |
359 | |
360 | dbg_gc("%d znodes to write", cnt); | |
361 | ||
6da2ec56 KC |
362 | c->gap_lebs = kmalloc_array(c->lst.idx_lebs + 1, sizeof(int), |
363 | GFP_NOFS); | |
1e51764a AB |
364 | if (!c->gap_lebs) |
365 | return -ENOMEM; | |
366 | ||
6abf5726 | 367 | old_idx_lebs = c->lst.idx_lebs; |
1e51764a | 368 | do { |
6abf5726 | 369 | ubifs_assert(c, p < c->lst.idx_lebs); |
1e51764a AB |
370 | written = layout_leb_in_gaps(c, p); |
371 | if (written < 0) { | |
372 | err = written; | |
0010f18a AB |
373 | if (err != -ENOSPC) { |
374 | kfree(c->gap_lebs); | |
375 | c->gap_lebs = NULL; | |
376 | return err; | |
1e51764a | 377 | } |
8d7819b4 | 378 | if (!dbg_is_chk_index(c)) { |
0010f18a AB |
379 | /* |
380 | * Do not print scary warnings if the debugging | |
381 | * option which forces in-the-gaps is enabled. | |
382 | */ | |
235c362b | 383 | ubifs_warn(c, "out of space"); |
edf6be24 AB |
384 | ubifs_dump_budg(c, &c->bi); |
385 | ubifs_dump_lprops(c); | |
0010f18a AB |
386 | } |
387 | /* Try to commit anyway */ | |
0010f18a | 388 | break; |
1e51764a AB |
389 | } |
390 | p++; | |
391 | cnt -= written; | |
392 | leb_needed_cnt = get_leb_cnt(c, cnt); | |
393 | dbg_gc("%d znodes remaining, need %d LEBs, have %d", cnt, | |
394 | leb_needed_cnt, c->ileb_cnt); | |
6abf5726 ZC |
395 | /* |
396 | * Dynamically change the size of @c->gap_lebs to prevent | |
397 | * oob, because @c->lst.idx_lebs could be increased by | |
398 | * function @get_idx_gc_leb (called by layout_leb_in_gaps-> | |
399 | * ubifs_find_dirty_idx_leb) during loop. Only enlarge | |
400 | * @c->gap_lebs when needed. | |
401 | * | |
402 | */ | |
403 | if (leb_needed_cnt > c->ileb_cnt && p >= old_idx_lebs && | |
404 | old_idx_lebs < c->lst.idx_lebs) { | |
405 | old_idx_lebs = c->lst.idx_lebs; | |
406 | gap_lebs = krealloc(c->gap_lebs, sizeof(int) * | |
407 | (old_idx_lebs + 1), GFP_NOFS); | |
408 | if (!gap_lebs) { | |
409 | kfree(c->gap_lebs); | |
410 | c->gap_lebs = NULL; | |
411 | return -ENOMEM; | |
412 | } | |
413 | c->gap_lebs = gap_lebs; | |
414 | } | |
1e51764a AB |
415 | } while (leb_needed_cnt > c->ileb_cnt); |
416 | ||
6abf5726 | 417 | c->gap_lebs[p] = -1; |
1e51764a AB |
418 | return 0; |
419 | } | |
420 | ||
421 | /** | |
422 | * layout_in_empty_space - layout index nodes in empty space. | |
423 | * @c: UBIFS file-system description object | |
424 | * | |
425 | * This function lays out new index nodes for dirty znodes using empty LEBs. | |
426 | * | |
427 | * This function returns %0 on success and a negative error code on failure. | |
428 | */ | |
429 | static int layout_in_empty_space(struct ubifs_info *c) | |
430 | { | |
431 | struct ubifs_znode *znode, *cnext, *zp; | |
432 | int lnum, offs, len, next_len, buf_len, buf_offs, used, avail; | |
433 | int wlen, blen, err; | |
434 | ||
435 | cnext = c->enext; | |
436 | if (!cnext) | |
437 | return 0; | |
438 | ||
439 | lnum = c->ihead_lnum; | |
440 | buf_offs = c->ihead_offs; | |
441 | ||
442 | buf_len = ubifs_idx_node_sz(c, c->fanout); | |
443 | buf_len = ALIGN(buf_len, c->min_io_size); | |
444 | used = 0; | |
445 | avail = buf_len; | |
446 | ||
447 | /* Ensure there is enough room for first write */ | |
448 | next_len = ubifs_idx_node_sz(c, cnext->child_cnt); | |
449 | if (buf_offs + next_len > c->leb_size) | |
450 | lnum = -1; | |
451 | ||
452 | while (1) { | |
453 | znode = cnext; | |
454 | ||
455 | len = ubifs_idx_node_sz(c, znode->child_cnt); | |
456 | ||
457 | /* Determine the index node position */ | |
458 | if (lnum == -1) { | |
459 | if (c->ileb_nxt >= c->ileb_cnt) { | |
235c362b | 460 | ubifs_err(c, "out of space"); |
1e51764a AB |
461 | return -ENOSPC; |
462 | } | |
463 | lnum = c->ilebs[c->ileb_nxt++]; | |
464 | buf_offs = 0; | |
465 | used = 0; | |
466 | avail = buf_len; | |
467 | } | |
468 | ||
469 | offs = buf_offs + used; | |
470 | ||
1e51764a AB |
471 | znode->lnum = lnum; |
472 | znode->offs = offs; | |
473 | znode->len = len; | |
1e51764a AB |
474 | |
475 | /* Update the parent */ | |
476 | zp = znode->parent; | |
477 | if (zp) { | |
478 | struct ubifs_zbranch *zbr; | |
479 | int i; | |
480 | ||
481 | i = znode->iip; | |
482 | zbr = &zp->zbranch[i]; | |
483 | zbr->lnum = lnum; | |
484 | zbr->offs = offs; | |
485 | zbr->len = len; | |
486 | } else { | |
487 | c->zroot.lnum = lnum; | |
488 | c->zroot.offs = offs; | |
489 | c->zroot.len = len; | |
490 | } | |
491 | c->calc_idx_sz += ALIGN(len, 8); | |
492 | ||
493 | /* | |
494 | * Once lprops is updated, we can decrease the dirty znode count | |
495 | * but it is easier to just do it here. | |
496 | */ | |
497 | atomic_long_dec(&c->dirty_zn_cnt); | |
498 | ||
499 | /* | |
500 | * Calculate the next index node length to see if there is | |
501 | * enough room for it | |
502 | */ | |
503 | cnext = znode->cnext; | |
504 | if (cnext == c->cnext) | |
505 | next_len = 0; | |
506 | else | |
507 | next_len = ubifs_idx_node_sz(c, cnext->child_cnt); | |
508 | ||
1e51764a AB |
509 | /* Update buffer positions */ |
510 | wlen = used + len; | |
511 | used += ALIGN(len, 8); | |
512 | avail -= ALIGN(len, 8); | |
513 | ||
514 | if (next_len != 0 && | |
515 | buf_offs + used + next_len <= c->leb_size && | |
516 | avail > 0) | |
517 | continue; | |
518 | ||
519 | if (avail <= 0 && next_len && | |
520 | buf_offs + used + next_len <= c->leb_size) | |
521 | blen = buf_len; | |
522 | else | |
523 | blen = ALIGN(wlen, c->min_io_size); | |
524 | ||
525 | /* The buffer is full or there are no more znodes to do */ | |
526 | buf_offs += blen; | |
527 | if (next_len) { | |
528 | if (buf_offs + next_len > c->leb_size) { | |
529 | err = ubifs_update_one_lp(c, lnum, | |
530 | c->leb_size - buf_offs, blen - used, | |
531 | 0, 0); | |
532 | if (err) | |
533 | return err; | |
534 | lnum = -1; | |
535 | } | |
536 | used -= blen; | |
537 | if (used < 0) | |
538 | used = 0; | |
539 | avail = buf_len - used; | |
540 | continue; | |
541 | } | |
542 | err = ubifs_update_one_lp(c, lnum, c->leb_size - buf_offs, | |
543 | blen - used, 0, 0); | |
544 | if (err) | |
545 | return err; | |
546 | break; | |
547 | } | |
548 | ||
17c2f9f8 AB |
549 | c->dbg->new_ihead_lnum = lnum; |
550 | c->dbg->new_ihead_offs = buf_offs; | |
1e51764a AB |
551 | |
552 | return 0; | |
553 | } | |
554 | ||
555 | /** | |
556 | * layout_commit - determine positions of index nodes to commit. | |
557 | * @c: UBIFS file-system description object | |
558 | * @no_space: indicates that insufficient empty LEBs were allocated | |
559 | * @cnt: number of znodes to commit | |
560 | * | |
561 | * Calculate and update the positions of index nodes to commit. If there were | |
562 | * an insufficient number of empty LEBs allocated, then index nodes are placed | |
563 | * into the gaps created by obsolete index nodes in non-empty index LEBs. For | |
564 | * this purpose, an obsolete index node is one that was not in the index as at | |
565 | * the end of the last commit. To write "in-the-gaps" requires that those index | |
566 | * LEBs are updated atomically in-place. | |
567 | */ | |
568 | static int layout_commit(struct ubifs_info *c, int no_space, int cnt) | |
569 | { | |
570 | int err; | |
571 | ||
572 | if (no_space) { | |
573 | err = layout_in_gaps(c, cnt); | |
574 | if (err) | |
575 | return err; | |
576 | } | |
577 | err = layout_in_empty_space(c); | |
578 | return err; | |
579 | } | |
580 | ||
581 | /** | |
582 | * find_first_dirty - find first dirty znode. | |
583 | * @znode: znode to begin searching from | |
584 | */ | |
585 | static struct ubifs_znode *find_first_dirty(struct ubifs_znode *znode) | |
586 | { | |
587 | int i, cont; | |
588 | ||
589 | if (!znode) | |
590 | return NULL; | |
591 | ||
592 | while (1) { | |
593 | if (znode->level == 0) { | |
594 | if (ubifs_zn_dirty(znode)) | |
595 | return znode; | |
596 | return NULL; | |
597 | } | |
598 | cont = 0; | |
599 | for (i = 0; i < znode->child_cnt; i++) { | |
600 | struct ubifs_zbranch *zbr = &znode->zbranch[i]; | |
601 | ||
602 | if (zbr->znode && ubifs_zn_dirty(zbr->znode)) { | |
603 | znode = zbr->znode; | |
604 | cont = 1; | |
605 | break; | |
606 | } | |
607 | } | |
608 | if (!cont) { | |
609 | if (ubifs_zn_dirty(znode)) | |
610 | return znode; | |
611 | return NULL; | |
612 | } | |
613 | } | |
614 | } | |
615 | ||
616 | /** | |
617 | * find_next_dirty - find next dirty znode. | |
618 | * @znode: znode to begin searching from | |
619 | */ | |
620 | static struct ubifs_znode *find_next_dirty(struct ubifs_znode *znode) | |
621 | { | |
622 | int n = znode->iip + 1; | |
623 | ||
624 | znode = znode->parent; | |
625 | if (!znode) | |
626 | return NULL; | |
627 | for (; n < znode->child_cnt; n++) { | |
628 | struct ubifs_zbranch *zbr = &znode->zbranch[n]; | |
629 | ||
630 | if (zbr->znode && ubifs_zn_dirty(zbr->znode)) | |
631 | return find_first_dirty(zbr->znode); | |
632 | } | |
633 | return znode; | |
634 | } | |
635 | ||
636 | /** | |
637 | * get_znodes_to_commit - create list of dirty znodes to commit. | |
638 | * @c: UBIFS file-system description object | |
639 | * | |
640 | * This function returns the number of znodes to commit. | |
641 | */ | |
642 | static int get_znodes_to_commit(struct ubifs_info *c) | |
643 | { | |
644 | struct ubifs_znode *znode, *cnext; | |
645 | int cnt = 0; | |
646 | ||
647 | c->cnext = find_first_dirty(c->zroot.znode); | |
648 | znode = c->enext = c->cnext; | |
649 | if (!znode) { | |
650 | dbg_cmt("no znodes to commit"); | |
651 | return 0; | |
652 | } | |
653 | cnt += 1; | |
654 | while (1) { | |
6eb61d58 | 655 | ubifs_assert(c, !ubifs_zn_cow(znode)); |
1e51764a AB |
656 | __set_bit(COW_ZNODE, &znode->flags); |
657 | znode->alt = 0; | |
658 | cnext = find_next_dirty(znode); | |
659 | if (!cnext) { | |
660 | znode->cnext = c->cnext; | |
661 | break; | |
662 | } | |
16a26b20 SH |
663 | znode->cparent = znode->parent; |
664 | znode->ciip = znode->iip; | |
1e51764a AB |
665 | znode->cnext = cnext; |
666 | znode = cnext; | |
667 | cnt += 1; | |
668 | } | |
669 | dbg_cmt("committing %d znodes", cnt); | |
6eb61d58 | 670 | ubifs_assert(c, cnt == atomic_long_read(&c->dirty_zn_cnt)); |
1e51764a AB |
671 | return cnt; |
672 | } | |
673 | ||
674 | /** | |
675 | * alloc_idx_lebs - allocate empty LEBs to be used to commit. | |
676 | * @c: UBIFS file-system description object | |
677 | * @cnt: number of znodes to commit | |
678 | * | |
679 | * This function returns %-ENOSPC if it cannot allocate a sufficient number of | |
680 | * empty LEBs. %0 is returned on success, otherwise a negative error code | |
681 | * is returned. | |
682 | */ | |
683 | static int alloc_idx_lebs(struct ubifs_info *c, int cnt) | |
684 | { | |
685 | int i, leb_cnt, lnum; | |
686 | ||
687 | c->ileb_cnt = 0; | |
688 | c->ileb_nxt = 0; | |
689 | leb_cnt = get_leb_cnt(c, cnt); | |
690 | dbg_cmt("need about %d empty LEBS for TNC commit", leb_cnt); | |
691 | if (!leb_cnt) | |
692 | return 0; | |
6da2ec56 | 693 | c->ilebs = kmalloc_array(leb_cnt, sizeof(int), GFP_NOFS); |
1e51764a AB |
694 | if (!c->ilebs) |
695 | return -ENOMEM; | |
696 | for (i = 0; i < leb_cnt; i++) { | |
697 | lnum = ubifs_find_free_leb_for_idx(c); | |
698 | if (lnum < 0) | |
699 | return lnum; | |
700 | c->ilebs[c->ileb_cnt++] = lnum; | |
701 | dbg_cmt("LEB %d", lnum); | |
702 | } | |
8032bf12 | 703 | if (dbg_is_chk_index(c) && !get_random_u32_below(8)) |
1e51764a AB |
704 | return -ENOSPC; |
705 | return 0; | |
706 | } | |
707 | ||
708 | /** | |
709 | * free_unused_idx_lebs - free unused LEBs that were allocated for the commit. | |
710 | * @c: UBIFS file-system description object | |
711 | * | |
712 | * It is possible that we allocate more empty LEBs for the commit than we need. | |
713 | * This functions frees the surplus. | |
714 | * | |
715 | * This function returns %0 on success and a negative error code on failure. | |
716 | */ | |
717 | static int free_unused_idx_lebs(struct ubifs_info *c) | |
718 | { | |
719 | int i, err = 0, lnum, er; | |
720 | ||
721 | for (i = c->ileb_nxt; i < c->ileb_cnt; i++) { | |
722 | lnum = c->ilebs[i]; | |
723 | dbg_cmt("LEB %d", lnum); | |
724 | er = ubifs_change_one_lp(c, lnum, LPROPS_NC, LPROPS_NC, 0, | |
725 | LPROPS_INDEX | LPROPS_TAKEN, 0); | |
726 | if (!err) | |
727 | err = er; | |
728 | } | |
729 | return err; | |
730 | } | |
731 | ||
732 | /** | |
733 | * free_idx_lebs - free unused LEBs after commit end. | |
734 | * @c: UBIFS file-system description object | |
735 | * | |
736 | * This function returns %0 on success and a negative error code on failure. | |
737 | */ | |
738 | static int free_idx_lebs(struct ubifs_info *c) | |
739 | { | |
740 | int err; | |
741 | ||
742 | err = free_unused_idx_lebs(c); | |
743 | kfree(c->ilebs); | |
744 | c->ilebs = NULL; | |
745 | return err; | |
746 | } | |
747 | ||
748 | /** | |
749 | * ubifs_tnc_start_commit - start TNC commit. | |
750 | * @c: UBIFS file-system description object | |
751 | * @zroot: new index root position is returned here | |
752 | * | |
753 | * This function prepares the list of indexing nodes to commit and lays out | |
754 | * their positions on flash. If there is not enough free space it uses the | |
755 | * in-gap commit method. Returns zero in case of success and a negative error | |
756 | * code in case of failure. | |
757 | */ | |
758 | int ubifs_tnc_start_commit(struct ubifs_info *c, struct ubifs_zbranch *zroot) | |
759 | { | |
760 | int err = 0, cnt; | |
761 | ||
762 | mutex_lock(&c->tnc_mutex); | |
763 | err = dbg_check_tnc(c, 1); | |
764 | if (err) | |
765 | goto out; | |
766 | cnt = get_znodes_to_commit(c); | |
767 | if (cnt != 0) { | |
768 | int no_space = 0; | |
769 | ||
770 | err = alloc_idx_lebs(c, cnt); | |
771 | if (err == -ENOSPC) | |
772 | no_space = 1; | |
773 | else if (err) | |
774 | goto out_free; | |
775 | err = layout_commit(c, no_space, cnt); | |
776 | if (err) | |
777 | goto out_free; | |
6eb61d58 | 778 | ubifs_assert(c, atomic_long_read(&c->dirty_zn_cnt) == 0); |
1e51764a AB |
779 | err = free_unused_idx_lebs(c); |
780 | if (err) | |
781 | goto out; | |
782 | } | |
783 | destroy_old_idx(c); | |
784 | memcpy(zroot, &c->zroot, sizeof(struct ubifs_zbranch)); | |
785 | ||
786 | err = ubifs_save_dirty_idx_lnums(c); | |
787 | if (err) | |
788 | goto out; | |
789 | ||
790 | spin_lock(&c->space_lock); | |
791 | /* | |
792 | * Although we have not finished committing yet, update size of the | |
b137545c | 793 | * committed index ('c->bi.old_idx_sz') and zero out the index growth |
1e51764a AB |
794 | * budget. It is OK to do this now, because we've reserved all the |
795 | * space which is needed to commit the index, and it is save for the | |
796 | * budgeting subsystem to assume the index is already committed, | |
797 | * even though it is not. | |
798 | */ | |
6eb61d58 | 799 | ubifs_assert(c, c->bi.min_idx_lebs == ubifs_calc_min_idx_lebs(c)); |
b137545c AB |
800 | c->bi.old_idx_sz = c->calc_idx_sz; |
801 | c->bi.uncommitted_idx = 0; | |
802 | c->bi.min_idx_lebs = ubifs_calc_min_idx_lebs(c); | |
1e51764a AB |
803 | spin_unlock(&c->space_lock); |
804 | mutex_unlock(&c->tnc_mutex); | |
805 | ||
806 | dbg_cmt("number of index LEBs %d", c->lst.idx_lebs); | |
807 | dbg_cmt("size of index %llu", c->calc_idx_sz); | |
808 | return err; | |
809 | ||
810 | out_free: | |
811 | free_idx_lebs(c); | |
812 | out: | |
813 | mutex_unlock(&c->tnc_mutex); | |
814 | return err; | |
815 | } | |
816 | ||
817 | /** | |
818 | * write_index - write index nodes. | |
819 | * @c: UBIFS file-system description object | |
820 | * | |
821 | * This function writes the index nodes whose positions were laid out in the | |
822 | * layout_in_empty_space function. | |
823 | */ | |
824 | static int write_index(struct ubifs_info *c) | |
825 | { | |
826 | struct ubifs_idx_node *idx; | |
827 | struct ubifs_znode *znode, *cnext; | |
828 | int i, lnum, offs, len, next_len, buf_len, buf_offs, used; | |
1f42596e | 829 | int avail, wlen, err, lnum_pos = 0, blen, nxt_offs; |
1e51764a AB |
830 | |
831 | cnext = c->enext; | |
832 | if (!cnext) | |
833 | return 0; | |
834 | ||
835 | /* | |
836 | * Always write index nodes to the index head so that index nodes and | |
837 | * other types of nodes are never mixed in the same erase block. | |
838 | */ | |
839 | lnum = c->ihead_lnum; | |
840 | buf_offs = c->ihead_offs; | |
841 | ||
842 | /* Allocate commit buffer */ | |
843 | buf_len = ALIGN(c->max_idx_node_sz, c->min_io_size); | |
844 | used = 0; | |
845 | avail = buf_len; | |
846 | ||
847 | /* Ensure there is enough room for first write */ | |
848 | next_len = ubifs_idx_node_sz(c, cnext->child_cnt); | |
849 | if (buf_offs + next_len > c->leb_size) { | |
850 | err = ubifs_update_one_lp(c, lnum, LPROPS_NC, 0, 0, | |
851 | LPROPS_TAKEN); | |
852 | if (err) | |
853 | return err; | |
854 | lnum = -1; | |
855 | } | |
856 | ||
857 | while (1) { | |
16a26b20 SH |
858 | u8 hash[UBIFS_HASH_ARR_SZ]; |
859 | ||
1e51764a AB |
860 | cond_resched(); |
861 | ||
862 | znode = cnext; | |
863 | idx = c->cbuf + used; | |
864 | ||
865 | /* Make index node */ | |
866 | idx->ch.node_type = UBIFS_IDX_NODE; | |
867 | idx->child_cnt = cpu_to_le16(znode->child_cnt); | |
868 | idx->level = cpu_to_le16(znode->level); | |
869 | for (i = 0; i < znode->child_cnt; i++) { | |
870 | struct ubifs_branch *br = ubifs_idx_branch(c, idx, i); | |
871 | struct ubifs_zbranch *zbr = &znode->zbranch[i]; | |
872 | ||
873 | key_write_idx(c, &zbr->key, &br->key); | |
874 | br->lnum = cpu_to_le32(zbr->lnum); | |
875 | br->offs = cpu_to_le32(zbr->offs); | |
876 | br->len = cpu_to_le32(zbr->len); | |
16a26b20 | 877 | ubifs_copy_hash(c, zbr->hash, ubifs_branch_hash(c, br)); |
1e51764a | 878 | if (!zbr->lnum || !zbr->len) { |
235c362b | 879 | ubifs_err(c, "bad ref in znode"); |
edf6be24 | 880 | ubifs_dump_znode(c, znode); |
1e51764a | 881 | if (zbr->znode) |
edf6be24 | 882 | ubifs_dump_znode(c, zbr->znode); |
df71b091 RW |
883 | |
884 | return -EINVAL; | |
1e51764a AB |
885 | } |
886 | } | |
887 | len = ubifs_idx_node_sz(c, znode->child_cnt); | |
888 | ubifs_prepare_node(c, idx, len, 0); | |
16a26b20 SH |
889 | ubifs_node_calc_hash(c, idx, hash); |
890 | ||
891 | mutex_lock(&c->tnc_mutex); | |
892 | ||
893 | if (znode->cparent) | |
894 | ubifs_copy_hash(c, hash, | |
895 | znode->cparent->zbranch[znode->ciip].hash); | |
896 | ||
897 | if (znode->parent) { | |
898 | if (!ubifs_zn_obsolete(znode)) | |
899 | ubifs_copy_hash(c, hash, | |
900 | znode->parent->zbranch[znode->iip].hash); | |
901 | } else { | |
902 | ubifs_copy_hash(c, hash, c->zroot.hash); | |
903 | } | |
904 | ||
905 | mutex_unlock(&c->tnc_mutex); | |
1e51764a AB |
906 | |
907 | /* Determine the index node position */ | |
908 | if (lnum == -1) { | |
909 | lnum = c->ilebs[lnum_pos++]; | |
910 | buf_offs = 0; | |
911 | used = 0; | |
912 | avail = buf_len; | |
913 | } | |
914 | offs = buf_offs + used; | |
915 | ||
1e51764a AB |
916 | if (lnum != znode->lnum || offs != znode->offs || |
917 | len != znode->len) { | |
235c362b | 918 | ubifs_err(c, "inconsistent znode posn"); |
1e51764a AB |
919 | return -EINVAL; |
920 | } | |
1e51764a AB |
921 | |
922 | /* Grab some stuff from znode while we still can */ | |
923 | cnext = znode->cnext; | |
924 | ||
6eb61d58 RW |
925 | ubifs_assert(c, ubifs_zn_dirty(znode)); |
926 | ubifs_assert(c, ubifs_zn_cow(znode)); | |
1e51764a AB |
927 | |
928 | /* | |
929 | * It is important that other threads should see %DIRTY_ZNODE | |
930 | * flag cleared before %COW_ZNODE. Specifically, it matters in | |
931 | * the 'dirty_cow_znode()' function. This is the reason for the | |
932 | * first barrier. Also, we want the bit changes to be seen to | |
07c32de4 | 933 | * other threads ASAP, to avoid unnecessary copying, which is |
1e51764a AB |
934 | * the reason for the second barrier. |
935 | */ | |
936 | clear_bit(DIRTY_ZNODE, &znode->flags); | |
4e857c58 | 937 | smp_mb__before_atomic(); |
1e51764a | 938 | clear_bit(COW_ZNODE, &znode->flags); |
4e857c58 | 939 | smp_mb__after_atomic(); |
1e51764a | 940 | |
06b282a4 AB |
941 | /* |
942 | * We have marked the znode as clean but have not updated the | |
943 | * @c->clean_zn_cnt counter. If this znode becomes dirty again | |
944 | * before 'free_obsolete_znodes()' is called, then | |
945 | * @c->clean_zn_cnt will be decremented before it gets | |
946 | * incremented (resulting in 2 decrements for the same znode). | |
947 | * This means that @c->clean_zn_cnt may become negative for a | |
948 | * while. | |
949 | * | |
950 | * Q: why we cannot increment @c->clean_zn_cnt? | |
951 | * A: because we do not have the @c->tnc_mutex locked, and the | |
952 | * following code would be racy and buggy: | |
953 | * | |
954 | * if (!ubifs_zn_obsolete(znode)) { | |
955 | * atomic_long_inc(&c->clean_zn_cnt); | |
956 | * atomic_long_inc(&ubifs_clean_zn_cnt); | |
957 | * } | |
958 | * | |
959 | * Thus, we just delay the @c->clean_zn_cnt update until we | |
960 | * have the mutex locked. | |
961 | */ | |
962 | ||
1e51764a AB |
963 | /* Do not access znode from this point on */ |
964 | ||
965 | /* Update buffer positions */ | |
966 | wlen = used + len; | |
967 | used += ALIGN(len, 8); | |
968 | avail -= ALIGN(len, 8); | |
969 | ||
970 | /* | |
971 | * Calculate the next index node length to see if there is | |
972 | * enough room for it | |
973 | */ | |
974 | if (cnext == c->cnext) | |
975 | next_len = 0; | |
976 | else | |
977 | next_len = ubifs_idx_node_sz(c, cnext->child_cnt); | |
978 | ||
1f42596e AB |
979 | nxt_offs = buf_offs + used + next_len; |
980 | if (next_len && nxt_offs <= c->leb_size) { | |
981 | if (avail > 0) | |
1e51764a | 982 | continue; |
1f42596e AB |
983 | else |
984 | blen = buf_len; | |
1e51764a | 985 | } else { |
1f42596e AB |
986 | wlen = ALIGN(wlen, 8); |
987 | blen = ALIGN(wlen, c->min_io_size); | |
988 | ubifs_pad(c, c->cbuf + wlen, blen - wlen); | |
989 | } | |
990 | ||
991 | /* The buffer is full or there are no more znodes to do */ | |
b36a261e | 992 | err = ubifs_leb_write(c, lnum, c->cbuf, buf_offs, blen); |
1f42596e AB |
993 | if (err) |
994 | return err; | |
995 | buf_offs += blen; | |
996 | if (next_len) { | |
997 | if (nxt_offs > c->leb_size) { | |
998 | err = ubifs_update_one_lp(c, lnum, LPROPS_NC, 0, | |
999 | 0, LPROPS_TAKEN); | |
1000 | if (err) | |
1001 | return err; | |
1002 | lnum = -1; | |
1e51764a | 1003 | } |
1f42596e AB |
1004 | used -= blen; |
1005 | if (used < 0) | |
1006 | used = 0; | |
1007 | avail = buf_len - used; | |
1008 | memmove(c->cbuf, c->cbuf + blen, used); | |
1009 | continue; | |
1e51764a AB |
1010 | } |
1011 | break; | |
1012 | } | |
1013 | ||
17c2f9f8 AB |
1014 | if (lnum != c->dbg->new_ihead_lnum || |
1015 | buf_offs != c->dbg->new_ihead_offs) { | |
235c362b | 1016 | ubifs_err(c, "inconsistent ihead"); |
1e51764a AB |
1017 | return -EINVAL; |
1018 | } | |
1e51764a AB |
1019 | |
1020 | c->ihead_lnum = lnum; | |
1021 | c->ihead_offs = buf_offs; | |
1022 | ||
1023 | return 0; | |
1024 | } | |
1025 | ||
1026 | /** | |
1027 | * free_obsolete_znodes - free obsolete znodes. | |
1028 | * @c: UBIFS file-system description object | |
1029 | * | |
1030 | * At the end of commit end, obsolete znodes are freed. | |
1031 | */ | |
1032 | static void free_obsolete_znodes(struct ubifs_info *c) | |
1033 | { | |
1034 | struct ubifs_znode *znode, *cnext; | |
1035 | ||
1036 | cnext = c->cnext; | |
1037 | do { | |
1038 | znode = cnext; | |
1039 | cnext = znode->cnext; | |
f42eed7c | 1040 | if (ubifs_zn_obsolete(znode)) |
1e51764a AB |
1041 | kfree(znode); |
1042 | else { | |
1043 | znode->cnext = NULL; | |
1044 | atomic_long_inc(&c->clean_zn_cnt); | |
1045 | atomic_long_inc(&ubifs_clean_zn_cnt); | |
1046 | } | |
1047 | } while (cnext != c->cnext); | |
1048 | } | |
1049 | ||
1050 | /** | |
1051 | * return_gap_lebs - return LEBs used by the in-gap commit method. | |
1052 | * @c: UBIFS file-system description object | |
1053 | * | |
1054 | * This function clears the "taken" flag for the LEBs which were used by the | |
1055 | * "commit in-the-gaps" method. | |
1056 | */ | |
1057 | static int return_gap_lebs(struct ubifs_info *c) | |
1058 | { | |
1059 | int *p, err; | |
1060 | ||
1061 | if (!c->gap_lebs) | |
1062 | return 0; | |
1063 | ||
1064 | dbg_cmt(""); | |
1065 | for (p = c->gap_lebs; *p != -1; p++) { | |
1066 | err = ubifs_change_one_lp(c, *p, LPROPS_NC, LPROPS_NC, 0, | |
1067 | LPROPS_TAKEN, 0); | |
1068 | if (err) | |
1069 | return err; | |
1070 | } | |
1071 | ||
1072 | kfree(c->gap_lebs); | |
1073 | c->gap_lebs = NULL; | |
1074 | return 0; | |
1075 | } | |
1076 | ||
1077 | /** | |
1078 | * ubifs_tnc_end_commit - update the TNC for commit end. | |
1079 | * @c: UBIFS file-system description object | |
1080 | * | |
1081 | * Write the dirty znodes. | |
1082 | */ | |
1083 | int ubifs_tnc_end_commit(struct ubifs_info *c) | |
1084 | { | |
1085 | int err; | |
1086 | ||
1087 | if (!c->cnext) | |
1088 | return 0; | |
1089 | ||
1090 | err = return_gap_lebs(c); | |
1091 | if (err) | |
1092 | return err; | |
1093 | ||
1094 | err = write_index(c); | |
1095 | if (err) | |
1096 | return err; | |
1097 | ||
1098 | mutex_lock(&c->tnc_mutex); | |
1099 | ||
1100 | dbg_cmt("TNC height is %d", c->zroot.znode->level + 1); | |
1101 | ||
1102 | free_obsolete_znodes(c); | |
1103 | ||
1104 | c->cnext = NULL; | |
1105 | kfree(c->ilebs); | |
1106 | c->ilebs = NULL; | |
1107 | ||
1108 | mutex_unlock(&c->tnc_mutex); | |
1109 | ||
1110 | return 0; | |
1111 | } |