dm snapshot: fix metadata corruption
[linux/fpc-iii.git] / fs / jffs2 / nodemgmt.c
blob03310721712f7885aa043c1c2f88421d0a80649b
1 /*
2 * JFFS2 -- Journalling Flash File System, Version 2.
4 * Copyright © 2001-2007 Red Hat, Inc.
6 * Created by David Woodhouse <dwmw2@infradead.org>
8 * For licensing information, see the file 'LICENCE' in this directory.
12 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
14 #include <linux/kernel.h>
15 #include <linux/mtd/mtd.h>
16 #include <linux/compiler.h>
17 #include <linux/sched.h> /* For cond_resched() */
18 #include "nodelist.h"
19 #include "debug.h"
22 * Check whether the user is allowed to write.
24 static int jffs2_rp_can_write(struct jffs2_sb_info *c)
26 uint32_t avail;
27 struct jffs2_mount_opts *opts = &c->mount_opts;
29 avail = c->dirty_size + c->free_size + c->unchecked_size +
30 c->erasing_size - c->resv_blocks_write * c->sector_size
31 - c->nospc_dirty_size;
33 if (avail < 2 * opts->rp_size)
34 jffs2_dbg(1, "rpsize %u, dirty_size %u, free_size %u, "
35 "erasing_size %u, unchecked_size %u, "
36 "nr_erasing_blocks %u, avail %u, resrv %u\n",
37 opts->rp_size, c->dirty_size, c->free_size,
38 c->erasing_size, c->unchecked_size,
39 c->nr_erasing_blocks, avail, c->nospc_dirty_size);
41 if (avail > opts->rp_size)
42 return 1;
44 /* Always allow root */
45 if (capable(CAP_SYS_RESOURCE))
46 return 1;
48 jffs2_dbg(1, "forbid writing\n");
49 return 0;
52 /**
53 * jffs2_reserve_space - request physical space to write nodes to flash
54 * @c: superblock info
55 * @minsize: Minimum acceptable size of allocation
56 * @len: Returned value of allocation length
57 * @prio: Allocation type - ALLOC_{NORMAL,DELETION}
59 * Requests a block of physical space on the flash. Returns zero for success
60 * and puts 'len' into the appropriate place, or returns -ENOSPC or other
61 * error if appropriate. Doesn't return len since that's
63 * If it returns zero, jffs2_reserve_space() also downs the per-filesystem
64 * allocation semaphore, to prevent more than one allocation from being
65 * active at any time. The semaphore is later released by jffs2_commit_allocation()
67 * jffs2_reserve_space() may trigger garbage collection in order to make room
68 * for the requested allocation.
71 static int jffs2_do_reserve_space(struct jffs2_sb_info *c, uint32_t minsize,
72 uint32_t *len, uint32_t sumsize);
74 int jffs2_reserve_space(struct jffs2_sb_info *c, uint32_t minsize,
75 uint32_t *len, int prio, uint32_t sumsize)
77 int ret = -EAGAIN;
78 int blocksneeded = c->resv_blocks_write;
79 /* align it */
80 minsize = PAD(minsize);
82 jffs2_dbg(1, "%s(): Requested 0x%x bytes\n", __func__, minsize);
83 mutex_lock(&c->alloc_sem);
85 jffs2_dbg(1, "%s(): alloc sem got\n", __func__);
87 spin_lock(&c->erase_completion_lock);
90 * Check if the free space is greater then size of the reserved pool.
91 * If not, only allow root to proceed with writing.
93 if (prio != ALLOC_DELETION && !jffs2_rp_can_write(c)) {
94 ret = -ENOSPC;
95 goto out;
98 /* this needs a little more thought (true <tglx> :)) */
99 while(ret == -EAGAIN) {
100 while(c->nr_free_blocks + c->nr_erasing_blocks < blocksneeded) {
101 uint32_t dirty, avail;
103 /* calculate real dirty size
104 * dirty_size contains blocks on erase_pending_list
105 * those blocks are counted in c->nr_erasing_blocks.
106 * If one block is actually erased, it is not longer counted as dirty_space
107 * but it is counted in c->nr_erasing_blocks, so we add it and subtract it
108 * with c->nr_erasing_blocks * c->sector_size again.
109 * Blocks on erasable_list are counted as dirty_size, but not in c->nr_erasing_blocks
110 * This helps us to force gc and pick eventually a clean block to spread the load.
111 * We add unchecked_size here, as we hopefully will find some space to use.
112 * This will affect the sum only once, as gc first finishes checking
113 * of nodes.
115 dirty = c->dirty_size + c->erasing_size - c->nr_erasing_blocks * c->sector_size + c->unchecked_size;
116 if (dirty < c->nospc_dirty_size) {
117 if (prio == ALLOC_DELETION && c->nr_free_blocks + c->nr_erasing_blocks >= c->resv_blocks_deletion) {
118 jffs2_dbg(1, "%s(): Low on dirty space to GC, but it's a deletion. Allowing...\n",
119 __func__);
120 break;
122 jffs2_dbg(1, "dirty size 0x%08x + unchecked_size 0x%08x < nospc_dirty_size 0x%08x, returning -ENOSPC\n",
123 dirty, c->unchecked_size,
124 c->sector_size);
126 spin_unlock(&c->erase_completion_lock);
127 mutex_unlock(&c->alloc_sem);
128 return -ENOSPC;
131 /* Calc possibly available space. Possibly available means that we
132 * don't know, if unchecked size contains obsoleted nodes, which could give us some
133 * more usable space. This will affect the sum only once, as gc first finishes checking
134 * of nodes.
135 + Return -ENOSPC, if the maximum possibly available space is less or equal than
136 * blocksneeded * sector_size.
137 * This blocks endless gc looping on a filesystem, which is nearly full, even if
138 * the check above passes.
140 avail = c->free_size + c->dirty_size + c->erasing_size + c->unchecked_size;
141 if ( (avail / c->sector_size) <= blocksneeded) {
142 if (prio == ALLOC_DELETION && c->nr_free_blocks + c->nr_erasing_blocks >= c->resv_blocks_deletion) {
143 jffs2_dbg(1, "%s(): Low on possibly available space, but it's a deletion. Allowing...\n",
144 __func__);
145 break;
148 jffs2_dbg(1, "max. available size 0x%08x < blocksneeded * sector_size 0x%08x, returning -ENOSPC\n",
149 avail, blocksneeded * c->sector_size);
150 spin_unlock(&c->erase_completion_lock);
151 mutex_unlock(&c->alloc_sem);
152 return -ENOSPC;
155 mutex_unlock(&c->alloc_sem);
157 jffs2_dbg(1, "Triggering GC pass. nr_free_blocks %d, nr_erasing_blocks %d, free_size 0x%08x, dirty_size 0x%08x, wasted_size 0x%08x, used_size 0x%08x, erasing_size 0x%08x, bad_size 0x%08x (total 0x%08x of 0x%08x)\n",
158 c->nr_free_blocks, c->nr_erasing_blocks,
159 c->free_size, c->dirty_size, c->wasted_size,
160 c->used_size, c->erasing_size, c->bad_size,
161 c->free_size + c->dirty_size +
162 c->wasted_size + c->used_size +
163 c->erasing_size + c->bad_size,
164 c->flash_size);
165 spin_unlock(&c->erase_completion_lock);
167 ret = jffs2_garbage_collect_pass(c);
169 if (ret == -EAGAIN) {
170 spin_lock(&c->erase_completion_lock);
171 if (c->nr_erasing_blocks &&
172 list_empty(&c->erase_pending_list) &&
173 list_empty(&c->erase_complete_list)) {
174 DECLARE_WAITQUEUE(wait, current);
175 set_current_state(TASK_UNINTERRUPTIBLE);
176 add_wait_queue(&c->erase_wait, &wait);
177 jffs2_dbg(1, "%s waiting for erase to complete\n",
178 __func__);
179 spin_unlock(&c->erase_completion_lock);
181 schedule();
182 } else
183 spin_unlock(&c->erase_completion_lock);
184 } else if (ret)
185 return ret;
187 cond_resched();
189 if (signal_pending(current))
190 return -EINTR;
192 mutex_lock(&c->alloc_sem);
193 spin_lock(&c->erase_completion_lock);
196 ret = jffs2_do_reserve_space(c, minsize, len, sumsize);
197 if (ret) {
198 jffs2_dbg(1, "%s(): ret is %d\n", __func__, ret);
202 out:
203 spin_unlock(&c->erase_completion_lock);
204 if (!ret)
205 ret = jffs2_prealloc_raw_node_refs(c, c->nextblock, 1);
206 if (ret)
207 mutex_unlock(&c->alloc_sem);
208 return ret;
211 int jffs2_reserve_space_gc(struct jffs2_sb_info *c, uint32_t minsize,
212 uint32_t *len, uint32_t sumsize)
214 int ret = -EAGAIN;
215 minsize = PAD(minsize);
217 jffs2_dbg(1, "%s(): Requested 0x%x bytes\n", __func__, minsize);
219 spin_lock(&c->erase_completion_lock);
220 while(ret == -EAGAIN) {
221 ret = jffs2_do_reserve_space(c, minsize, len, sumsize);
222 if (ret) {
223 jffs2_dbg(1, "%s(): looping, ret is %d\n",
224 __func__, ret);
227 spin_unlock(&c->erase_completion_lock);
228 if (!ret)
229 ret = jffs2_prealloc_raw_node_refs(c, c->nextblock, 1);
231 return ret;
235 /* Classify nextblock (clean, dirty of verydirty) and force to select an other one */
237 static void jffs2_close_nextblock(struct jffs2_sb_info *c, struct jffs2_eraseblock *jeb)
240 if (c->nextblock == NULL) {
241 jffs2_dbg(1, "%s(): Erase block at 0x%08x has already been placed in a list\n",
242 __func__, jeb->offset);
243 return;
245 /* Check, if we have a dirty block now, or if it was dirty already */
246 if (ISDIRTY (jeb->wasted_size + jeb->dirty_size)) {
247 c->dirty_size += jeb->wasted_size;
248 c->wasted_size -= jeb->wasted_size;
249 jeb->dirty_size += jeb->wasted_size;
250 jeb->wasted_size = 0;
251 if (VERYDIRTY(c, jeb->dirty_size)) {
252 jffs2_dbg(1, "Adding full erase block at 0x%08x to very_dirty_list (free 0x%08x, dirty 0x%08x, used 0x%08x\n",
253 jeb->offset, jeb->free_size, jeb->dirty_size,
254 jeb->used_size);
255 list_add_tail(&jeb->list, &c->very_dirty_list);
256 } else {
257 jffs2_dbg(1, "Adding full erase block at 0x%08x to dirty_list (free 0x%08x, dirty 0x%08x, used 0x%08x\n",
258 jeb->offset, jeb->free_size, jeb->dirty_size,
259 jeb->used_size);
260 list_add_tail(&jeb->list, &c->dirty_list);
262 } else {
263 jffs2_dbg(1, "Adding full erase block at 0x%08x to clean_list (free 0x%08x, dirty 0x%08x, used 0x%08x\n",
264 jeb->offset, jeb->free_size, jeb->dirty_size,
265 jeb->used_size);
266 list_add_tail(&jeb->list, &c->clean_list);
268 c->nextblock = NULL;
272 /* Select a new jeb for nextblock */
274 static int jffs2_find_nextblock(struct jffs2_sb_info *c)
276 struct list_head *next;
278 /* Take the next block off the 'free' list */
280 if (list_empty(&c->free_list)) {
282 if (!c->nr_erasing_blocks &&
283 !list_empty(&c->erasable_list)) {
284 struct jffs2_eraseblock *ejeb;
286 ejeb = list_entry(c->erasable_list.next, struct jffs2_eraseblock, list);
287 list_move_tail(&ejeb->list, &c->erase_pending_list);
288 c->nr_erasing_blocks++;
289 jffs2_garbage_collect_trigger(c);
290 jffs2_dbg(1, "%s(): Triggering erase of erasable block at 0x%08x\n",
291 __func__, ejeb->offset);
294 if (!c->nr_erasing_blocks &&
295 !list_empty(&c->erasable_pending_wbuf_list)) {
296 jffs2_dbg(1, "%s(): Flushing write buffer\n",
297 __func__);
298 /* c->nextblock is NULL, no update to c->nextblock allowed */
299 spin_unlock(&c->erase_completion_lock);
300 jffs2_flush_wbuf_pad(c);
301 spin_lock(&c->erase_completion_lock);
302 /* Have another go. It'll be on the erasable_list now */
303 return -EAGAIN;
306 if (!c->nr_erasing_blocks) {
307 /* Ouch. We're in GC, or we wouldn't have got here.
308 And there's no space left. At all. */
309 pr_crit("Argh. No free space left for GC. nr_erasing_blocks is %d. nr_free_blocks is %d. (erasableempty: %s, erasingempty: %s, erasependingempty: %s)\n",
310 c->nr_erasing_blocks, c->nr_free_blocks,
311 list_empty(&c->erasable_list) ? "yes" : "no",
312 list_empty(&c->erasing_list) ? "yes" : "no",
313 list_empty(&c->erase_pending_list) ? "yes" : "no");
314 return -ENOSPC;
317 spin_unlock(&c->erase_completion_lock);
318 /* Don't wait for it; just erase one right now */
319 jffs2_erase_pending_blocks(c, 1);
320 spin_lock(&c->erase_completion_lock);
322 /* An erase may have failed, decreasing the
323 amount of free space available. So we must
324 restart from the beginning */
325 return -EAGAIN;
328 next = c->free_list.next;
329 list_del(next);
330 c->nextblock = list_entry(next, struct jffs2_eraseblock, list);
331 c->nr_free_blocks--;
333 jffs2_sum_reset_collected(c->summary); /* reset collected summary */
335 #ifdef CONFIG_JFFS2_FS_WRITEBUFFER
336 /* adjust write buffer offset, else we get a non contiguous write bug */
337 if (!(c->wbuf_ofs % c->sector_size) && !c->wbuf_len)
338 c->wbuf_ofs = 0xffffffff;
339 #endif
341 jffs2_dbg(1, "%s(): new nextblock = 0x%08x\n",
342 __func__, c->nextblock->offset);
344 return 0;
347 /* Called with alloc sem _and_ erase_completion_lock */
348 static int jffs2_do_reserve_space(struct jffs2_sb_info *c, uint32_t minsize,
349 uint32_t *len, uint32_t sumsize)
351 struct jffs2_eraseblock *jeb = c->nextblock;
352 uint32_t reserved_size; /* for summary information at the end of the jeb */
353 int ret;
355 restart:
356 reserved_size = 0;
358 if (jffs2_sum_active() && (sumsize != JFFS2_SUMMARY_NOSUM_SIZE)) {
359 /* NOSUM_SIZE means not to generate summary */
361 if (jeb) {
362 reserved_size = PAD(sumsize + c->summary->sum_size + JFFS2_SUMMARY_FRAME_SIZE);
363 dbg_summary("minsize=%d , jeb->free=%d ,"
364 "summary->size=%d , sumsize=%d\n",
365 minsize, jeb->free_size,
366 c->summary->sum_size, sumsize);
369 /* Is there enough space for writing out the current node, or we have to
370 write out summary information now, close this jeb and select new nextblock? */
371 if (jeb && (PAD(minsize) + PAD(c->summary->sum_size + sumsize +
372 JFFS2_SUMMARY_FRAME_SIZE) > jeb->free_size)) {
374 /* Has summary been disabled for this jeb? */
375 if (jffs2_sum_is_disabled(c->summary)) {
376 sumsize = JFFS2_SUMMARY_NOSUM_SIZE;
377 goto restart;
380 /* Writing out the collected summary information */
381 dbg_summary("generating summary for 0x%08x.\n", jeb->offset);
382 ret = jffs2_sum_write_sumnode(c);
384 if (ret)
385 return ret;
387 if (jffs2_sum_is_disabled(c->summary)) {
388 /* jffs2_write_sumnode() couldn't write out the summary information
389 diabling summary for this jeb and free the collected information
391 sumsize = JFFS2_SUMMARY_NOSUM_SIZE;
392 goto restart;
395 jffs2_close_nextblock(c, jeb);
396 jeb = NULL;
397 /* keep always valid value in reserved_size */
398 reserved_size = PAD(sumsize + c->summary->sum_size + JFFS2_SUMMARY_FRAME_SIZE);
400 } else {
401 if (jeb && minsize > jeb->free_size) {
402 uint32_t waste;
404 /* Skip the end of this block and file it as having some dirty space */
405 /* If there's a pending write to it, flush now */
407 if (jffs2_wbuf_dirty(c)) {
408 spin_unlock(&c->erase_completion_lock);
409 jffs2_dbg(1, "%s(): Flushing write buffer\n",
410 __func__);
411 jffs2_flush_wbuf_pad(c);
412 spin_lock(&c->erase_completion_lock);
413 jeb = c->nextblock;
414 goto restart;
417 spin_unlock(&c->erase_completion_lock);
419 ret = jffs2_prealloc_raw_node_refs(c, jeb, 1);
421 /* Just lock it again and continue. Nothing much can change because
422 we hold c->alloc_sem anyway. In fact, it's not entirely clear why
423 we hold c->erase_completion_lock in the majority of this function...
424 but that's a question for another (more caffeine-rich) day. */
425 spin_lock(&c->erase_completion_lock);
427 if (ret)
428 return ret;
430 waste = jeb->free_size;
431 jffs2_link_node_ref(c, jeb,
432 (jeb->offset + c->sector_size - waste) | REF_OBSOLETE,
433 waste, NULL);
434 /* FIXME: that made it count as dirty. Convert to wasted */
435 jeb->dirty_size -= waste;
436 c->dirty_size -= waste;
437 jeb->wasted_size += waste;
438 c->wasted_size += waste;
440 jffs2_close_nextblock(c, jeb);
441 jeb = NULL;
445 if (!jeb) {
447 ret = jffs2_find_nextblock(c);
448 if (ret)
449 return ret;
451 jeb = c->nextblock;
453 if (jeb->free_size != c->sector_size - c->cleanmarker_size) {
454 pr_warn("Eep. Block 0x%08x taken from free_list had free_size of 0x%08x!!\n",
455 jeb->offset, jeb->free_size);
456 goto restart;
459 /* OK, jeb (==c->nextblock) is now pointing at a block which definitely has
460 enough space */
461 *len = jeb->free_size - reserved_size;
463 if (c->cleanmarker_size && jeb->used_size == c->cleanmarker_size &&
464 !jeb->first_node->next_in_ino) {
465 /* Only node in it beforehand was a CLEANMARKER node (we think).
466 So mark it obsolete now that there's going to be another node
467 in the block. This will reduce used_size to zero but We've
468 already set c->nextblock so that jffs2_mark_node_obsolete()
469 won't try to refile it to the dirty_list.
471 spin_unlock(&c->erase_completion_lock);
472 jffs2_mark_node_obsolete(c, jeb->first_node);
473 spin_lock(&c->erase_completion_lock);
476 jffs2_dbg(1, "%s(): Giving 0x%x bytes at 0x%x\n",
477 __func__,
478 *len, jeb->offset + (c->sector_size - jeb->free_size));
479 return 0;
483 * jffs2_add_physical_node_ref - add a physical node reference to the list
484 * @c: superblock info
485 * @new: new node reference to add
486 * @len: length of this physical node
488 * Should only be used to report nodes for which space has been allocated
489 * by jffs2_reserve_space.
491 * Must be called with the alloc_sem held.
494 struct jffs2_raw_node_ref *jffs2_add_physical_node_ref(struct jffs2_sb_info *c,
495 uint32_t ofs, uint32_t len,
496 struct jffs2_inode_cache *ic)
498 struct jffs2_eraseblock *jeb;
499 struct jffs2_raw_node_ref *new;
501 jeb = &c->blocks[ofs / c->sector_size];
503 jffs2_dbg(1, "%s(): Node at 0x%x(%d), size 0x%x\n",
504 __func__, ofs & ~3, ofs & 3, len);
505 #if 1
506 /* Allow non-obsolete nodes only to be added at the end of c->nextblock,
507 if c->nextblock is set. Note that wbuf.c will file obsolete nodes
508 even after refiling c->nextblock */
509 if ((c->nextblock || ((ofs & 3) != REF_OBSOLETE))
510 && (jeb != c->nextblock || (ofs & ~3) != jeb->offset + (c->sector_size - jeb->free_size))) {
511 pr_warn("argh. node added in wrong place at 0x%08x(%d)\n",
512 ofs & ~3, ofs & 3);
513 if (c->nextblock)
514 pr_warn("nextblock 0x%08x", c->nextblock->offset);
515 else
516 pr_warn("No nextblock");
517 pr_cont(", expected at %08x\n",
518 jeb->offset + (c->sector_size - jeb->free_size));
519 return ERR_PTR(-EINVAL);
521 #endif
522 spin_lock(&c->erase_completion_lock);
524 new = jffs2_link_node_ref(c, jeb, ofs, len, ic);
526 if (!jeb->free_size && !jeb->dirty_size && !ISDIRTY(jeb->wasted_size)) {
527 /* If it lives on the dirty_list, jffs2_reserve_space will put it there */
528 jffs2_dbg(1, "Adding full erase block at 0x%08x to clean_list (free 0x%08x, dirty 0x%08x, used 0x%08x\n",
529 jeb->offset, jeb->free_size, jeb->dirty_size,
530 jeb->used_size);
531 if (jffs2_wbuf_dirty(c)) {
532 /* Flush the last write in the block if it's outstanding */
533 spin_unlock(&c->erase_completion_lock);
534 jffs2_flush_wbuf_pad(c);
535 spin_lock(&c->erase_completion_lock);
538 list_add_tail(&jeb->list, &c->clean_list);
539 c->nextblock = NULL;
541 jffs2_dbg_acct_sanity_check_nolock(c,jeb);
542 jffs2_dbg_acct_paranoia_check_nolock(c, jeb);
544 spin_unlock(&c->erase_completion_lock);
546 return new;
550 void jffs2_complete_reservation(struct jffs2_sb_info *c)
552 jffs2_dbg(1, "jffs2_complete_reservation()\n");
553 spin_lock(&c->erase_completion_lock);
554 jffs2_garbage_collect_trigger(c);
555 spin_unlock(&c->erase_completion_lock);
556 mutex_unlock(&c->alloc_sem);
559 static inline int on_list(struct list_head *obj, struct list_head *head)
561 struct list_head *this;
563 list_for_each(this, head) {
564 if (this == obj) {
565 jffs2_dbg(1, "%p is on list at %p\n", obj, head);
566 return 1;
570 return 0;
573 void jffs2_mark_node_obsolete(struct jffs2_sb_info *c, struct jffs2_raw_node_ref *ref)
575 struct jffs2_eraseblock *jeb;
576 int blocknr;
577 struct jffs2_unknown_node n;
578 int ret, addedsize;
579 size_t retlen;
580 uint32_t freed_len;
582 if(unlikely(!ref)) {
583 pr_notice("EEEEEK. jffs2_mark_node_obsolete called with NULL node\n");
584 return;
586 if (ref_obsolete(ref)) {
587 jffs2_dbg(1, "%s(): called with already obsolete node at 0x%08x\n",
588 __func__, ref_offset(ref));
589 return;
591 blocknr = ref->flash_offset / c->sector_size;
592 if (blocknr >= c->nr_blocks) {
593 pr_notice("raw node at 0x%08x is off the end of device!\n",
594 ref->flash_offset);
595 BUG();
597 jeb = &c->blocks[blocknr];
599 if (jffs2_can_mark_obsolete(c) && !jffs2_is_readonly(c) &&
600 !(c->flags & (JFFS2_SB_FLAG_SCANNING | JFFS2_SB_FLAG_BUILDING))) {
601 /* Hm. This may confuse static lock analysis. If any of the above
602 three conditions is false, we're going to return from this
603 function without actually obliterating any nodes or freeing
604 any jffs2_raw_node_refs. So we don't need to stop erases from
605 happening, or protect against people holding an obsolete
606 jffs2_raw_node_ref without the erase_completion_lock. */
607 mutex_lock(&c->erase_free_sem);
610 spin_lock(&c->erase_completion_lock);
612 freed_len = ref_totlen(c, jeb, ref);
614 if (ref_flags(ref) == REF_UNCHECKED) {
615 D1(if (unlikely(jeb->unchecked_size < freed_len)) {
616 pr_notice("raw unchecked node of size 0x%08x freed from erase block %d at 0x%08x, but unchecked_size was already 0x%08x\n",
617 freed_len, blocknr,
618 ref->flash_offset, jeb->used_size);
619 BUG();
621 jffs2_dbg(1, "Obsoleting previously unchecked node at 0x%08x of len %x\n",
622 ref_offset(ref), freed_len);
623 jeb->unchecked_size -= freed_len;
624 c->unchecked_size -= freed_len;
625 } else {
626 D1(if (unlikely(jeb->used_size < freed_len)) {
627 pr_notice("raw node of size 0x%08x freed from erase block %d at 0x%08x, but used_size was already 0x%08x\n",
628 freed_len, blocknr,
629 ref->flash_offset, jeb->used_size);
630 BUG();
632 jffs2_dbg(1, "Obsoleting node at 0x%08x of len %#x: ",
633 ref_offset(ref), freed_len);
634 jeb->used_size -= freed_len;
635 c->used_size -= freed_len;
638 // Take care, that wasted size is taken into concern
639 if ((jeb->dirty_size || ISDIRTY(jeb->wasted_size + freed_len)) && jeb != c->nextblock) {
640 jffs2_dbg(1, "Dirtying\n");
641 addedsize = freed_len;
642 jeb->dirty_size += freed_len;
643 c->dirty_size += freed_len;
645 /* Convert wasted space to dirty, if not a bad block */
646 if (jeb->wasted_size) {
647 if (on_list(&jeb->list, &c->bad_used_list)) {
648 jffs2_dbg(1, "Leaving block at %08x on the bad_used_list\n",
649 jeb->offset);
650 addedsize = 0; /* To fool the refiling code later */
651 } else {
652 jffs2_dbg(1, "Converting %d bytes of wasted space to dirty in block at %08x\n",
653 jeb->wasted_size, jeb->offset);
654 addedsize += jeb->wasted_size;
655 jeb->dirty_size += jeb->wasted_size;
656 c->dirty_size += jeb->wasted_size;
657 c->wasted_size -= jeb->wasted_size;
658 jeb->wasted_size = 0;
661 } else {
662 jffs2_dbg(1, "Wasting\n");
663 addedsize = 0;
664 jeb->wasted_size += freed_len;
665 c->wasted_size += freed_len;
667 ref->flash_offset = ref_offset(ref) | REF_OBSOLETE;
669 jffs2_dbg_acct_sanity_check_nolock(c, jeb);
670 jffs2_dbg_acct_paranoia_check_nolock(c, jeb);
672 if (c->flags & JFFS2_SB_FLAG_SCANNING) {
673 /* Flash scanning is in progress. Don't muck about with the block
674 lists because they're not ready yet, and don't actually
675 obliterate nodes that look obsolete. If they weren't
676 marked obsolete on the flash at the time they _became_
677 obsolete, there was probably a reason for that. */
678 spin_unlock(&c->erase_completion_lock);
679 /* We didn't lock the erase_free_sem */
680 return;
683 if (jeb == c->nextblock) {
684 jffs2_dbg(2, "Not moving nextblock 0x%08x to dirty/erase_pending list\n",
685 jeb->offset);
686 } else if (!jeb->used_size && !jeb->unchecked_size) {
687 if (jeb == c->gcblock) {
688 jffs2_dbg(1, "gcblock at 0x%08x completely dirtied. Clearing gcblock...\n",
689 jeb->offset);
690 c->gcblock = NULL;
691 } else {
692 jffs2_dbg(1, "Eraseblock at 0x%08x completely dirtied. Removing from (dirty?) list...\n",
693 jeb->offset);
694 list_del(&jeb->list);
696 if (jffs2_wbuf_dirty(c)) {
697 jffs2_dbg(1, "...and adding to erasable_pending_wbuf_list\n");
698 list_add_tail(&jeb->list, &c->erasable_pending_wbuf_list);
699 } else {
700 if (jiffies & 127) {
701 /* Most of the time, we just erase it immediately. Otherwise we
702 spend ages scanning it on mount, etc. */
703 jffs2_dbg(1, "...and adding to erase_pending_list\n");
704 list_add_tail(&jeb->list, &c->erase_pending_list);
705 c->nr_erasing_blocks++;
706 jffs2_garbage_collect_trigger(c);
707 } else {
708 /* Sometimes, however, we leave it elsewhere so it doesn't get
709 immediately reused, and we spread the load a bit. */
710 jffs2_dbg(1, "...and adding to erasable_list\n");
711 list_add_tail(&jeb->list, &c->erasable_list);
714 jffs2_dbg(1, "Done OK\n");
715 } else if (jeb == c->gcblock) {
716 jffs2_dbg(2, "Not moving gcblock 0x%08x to dirty_list\n",
717 jeb->offset);
718 } else if (ISDIRTY(jeb->dirty_size) && !ISDIRTY(jeb->dirty_size - addedsize)) {
719 jffs2_dbg(1, "Eraseblock at 0x%08x is freshly dirtied. Removing from clean list...\n",
720 jeb->offset);
721 list_del(&jeb->list);
722 jffs2_dbg(1, "...and adding to dirty_list\n");
723 list_add_tail(&jeb->list, &c->dirty_list);
724 } else if (VERYDIRTY(c, jeb->dirty_size) &&
725 !VERYDIRTY(c, jeb->dirty_size - addedsize)) {
726 jffs2_dbg(1, "Eraseblock at 0x%08x is now very dirty. Removing from dirty list...\n",
727 jeb->offset);
728 list_del(&jeb->list);
729 jffs2_dbg(1, "...and adding to very_dirty_list\n");
730 list_add_tail(&jeb->list, &c->very_dirty_list);
731 } else {
732 jffs2_dbg(1, "Eraseblock at 0x%08x not moved anywhere. (free 0x%08x, dirty 0x%08x, used 0x%08x)\n",
733 jeb->offset, jeb->free_size, jeb->dirty_size,
734 jeb->used_size);
737 spin_unlock(&c->erase_completion_lock);
739 if (!jffs2_can_mark_obsolete(c) || jffs2_is_readonly(c) ||
740 (c->flags & JFFS2_SB_FLAG_BUILDING)) {
741 /* We didn't lock the erase_free_sem */
742 return;
745 /* The erase_free_sem is locked, and has been since before we marked the node obsolete
746 and potentially put its eraseblock onto the erase_pending_list. Thus, we know that
747 the block hasn't _already_ been erased, and that 'ref' itself hasn't been freed yet
748 by jffs2_free_jeb_node_refs() in erase.c. Which is nice. */
750 jffs2_dbg(1, "obliterating obsoleted node at 0x%08x\n",
751 ref_offset(ref));
752 ret = jffs2_flash_read(c, ref_offset(ref), sizeof(n), &retlen, (char *)&n);
753 if (ret) {
754 pr_warn("Read error reading from obsoleted node at 0x%08x: %d\n",
755 ref_offset(ref), ret);
756 goto out_erase_sem;
758 if (retlen != sizeof(n)) {
759 pr_warn("Short read from obsoleted node at 0x%08x: %zd\n",
760 ref_offset(ref), retlen);
761 goto out_erase_sem;
763 if (PAD(je32_to_cpu(n.totlen)) != PAD(freed_len)) {
764 pr_warn("Node totlen on flash (0x%08x) != totlen from node ref (0x%08x)\n",
765 je32_to_cpu(n.totlen), freed_len);
766 goto out_erase_sem;
768 if (!(je16_to_cpu(n.nodetype) & JFFS2_NODE_ACCURATE)) {
769 jffs2_dbg(1, "Node at 0x%08x was already marked obsolete (nodetype 0x%04x)\n",
770 ref_offset(ref), je16_to_cpu(n.nodetype));
771 goto out_erase_sem;
773 /* XXX FIXME: This is ugly now */
774 n.nodetype = cpu_to_je16(je16_to_cpu(n.nodetype) & ~JFFS2_NODE_ACCURATE);
775 ret = jffs2_flash_write(c, ref_offset(ref), sizeof(n), &retlen, (char *)&n);
776 if (ret) {
777 pr_warn("Write error in obliterating obsoleted node at 0x%08x: %d\n",
778 ref_offset(ref), ret);
779 goto out_erase_sem;
781 if (retlen != sizeof(n)) {
782 pr_warn("Short write in obliterating obsoleted node at 0x%08x: %zd\n",
783 ref_offset(ref), retlen);
784 goto out_erase_sem;
787 /* Nodes which have been marked obsolete no longer need to be
788 associated with any inode. Remove them from the per-inode list.
790 Note we can't do this for NAND at the moment because we need
791 obsolete dirent nodes to stay on the lists, because of the
792 horridness in jffs2_garbage_collect_deletion_dirent(). Also
793 because we delete the inocache, and on NAND we need that to
794 stay around until all the nodes are actually erased, in order
795 to stop us from giving the same inode number to another newly
796 created inode. */
797 if (ref->next_in_ino) {
798 struct jffs2_inode_cache *ic;
799 struct jffs2_raw_node_ref **p;
801 spin_lock(&c->erase_completion_lock);
803 ic = jffs2_raw_ref_to_ic(ref);
804 for (p = &ic->nodes; (*p) != ref; p = &((*p)->next_in_ino))
807 *p = ref->next_in_ino;
808 ref->next_in_ino = NULL;
810 switch (ic->class) {
811 #ifdef CONFIG_JFFS2_FS_XATTR
812 case RAWNODE_CLASS_XATTR_DATUM:
813 jffs2_release_xattr_datum(c, (struct jffs2_xattr_datum *)ic);
814 break;
815 case RAWNODE_CLASS_XATTR_REF:
816 jffs2_release_xattr_ref(c, (struct jffs2_xattr_ref *)ic);
817 break;
818 #endif
819 default:
820 if (ic->nodes == (void *)ic && ic->pino_nlink == 0)
821 jffs2_del_ino_cache(c, ic);
822 break;
824 spin_unlock(&c->erase_completion_lock);
827 out_erase_sem:
828 mutex_unlock(&c->erase_free_sem);
831 int jffs2_thread_should_wake(struct jffs2_sb_info *c)
833 int ret = 0;
834 uint32_t dirty;
835 int nr_very_dirty = 0;
836 struct jffs2_eraseblock *jeb;
838 if (!list_empty(&c->erase_complete_list) ||
839 !list_empty(&c->erase_pending_list))
840 return 1;
842 if (c->unchecked_size) {
843 jffs2_dbg(1, "jffs2_thread_should_wake(): unchecked_size %d, checked_ino #%d\n",
844 c->unchecked_size, c->checked_ino);
845 return 1;
848 /* dirty_size contains blocks on erase_pending_list
849 * those blocks are counted in c->nr_erasing_blocks.
850 * If one block is actually erased, it is not longer counted as dirty_space
851 * but it is counted in c->nr_erasing_blocks, so we add it and subtract it
852 * with c->nr_erasing_blocks * c->sector_size again.
853 * Blocks on erasable_list are counted as dirty_size, but not in c->nr_erasing_blocks
854 * This helps us to force gc and pick eventually a clean block to spread the load.
856 dirty = c->dirty_size + c->erasing_size - c->nr_erasing_blocks * c->sector_size;
858 if (c->nr_free_blocks + c->nr_erasing_blocks < c->resv_blocks_gctrigger &&
859 (dirty > c->nospc_dirty_size))
860 ret = 1;
862 list_for_each_entry(jeb, &c->very_dirty_list, list) {
863 nr_very_dirty++;
864 if (nr_very_dirty == c->vdirty_blocks_gctrigger) {
865 ret = 1;
866 /* In debug mode, actually go through and count them all */
867 D1(continue);
868 break;
872 jffs2_dbg(1, "%s(): nr_free_blocks %d, nr_erasing_blocks %d, dirty_size 0x%x, vdirty_blocks %d: %s\n",
873 __func__, c->nr_free_blocks, c->nr_erasing_blocks,
874 c->dirty_size, nr_very_dirty, ret ? "yes" : "no");
876 return ret;