xref: /openbmc/linux/fs/jffs2/gc.c (revision d96fb997)
/*
 * JFFS2 -- Journalling Flash File System, Version 2.
 *
 * Copyright (C) 2001-2003 Red Hat, Inc.
 *
 * Created by David Woodhouse <dwmw2@infradead.org>
 *
 * For licensing information, see the file 'LICENCE' in this directory.
 *
 * $Id: gc.c,v 1.155 2005/11/07 11:14:39 gleixner Exp $
 *
 */
131da177e4SLinus Torvalds 
141da177e4SLinus Torvalds #include <linux/kernel.h>
151da177e4SLinus Torvalds #include <linux/mtd/mtd.h>
161da177e4SLinus Torvalds #include <linux/slab.h>
171da177e4SLinus Torvalds #include <linux/pagemap.h>
181da177e4SLinus Torvalds #include <linux/crc32.h>
191da177e4SLinus Torvalds #include <linux/compiler.h>
201da177e4SLinus Torvalds #include <linux/stat.h>
211da177e4SLinus Torvalds #include "nodelist.h"
221da177e4SLinus Torvalds #include "compr.h"
231da177e4SLinus Torvalds 
241da177e4SLinus Torvalds static int jffs2_garbage_collect_pristine(struct jffs2_sb_info *c,
251da177e4SLinus Torvalds 					  struct jffs2_inode_cache *ic,
261da177e4SLinus Torvalds 					  struct jffs2_raw_node_ref *raw);
271da177e4SLinus Torvalds static int jffs2_garbage_collect_metadata(struct jffs2_sb_info *c, struct jffs2_eraseblock *jeb,
281da177e4SLinus Torvalds 					struct jffs2_inode_info *f, struct jffs2_full_dnode *fd);
291da177e4SLinus Torvalds static int jffs2_garbage_collect_dirent(struct jffs2_sb_info *c, struct jffs2_eraseblock *jeb,
301da177e4SLinus Torvalds 					struct jffs2_inode_info *f, struct jffs2_full_dirent *fd);
311da177e4SLinus Torvalds static int jffs2_garbage_collect_deletion_dirent(struct jffs2_sb_info *c, struct jffs2_eraseblock *jeb,
321da177e4SLinus Torvalds 					struct jffs2_inode_info *f, struct jffs2_full_dirent *fd);
331da177e4SLinus Torvalds static int jffs2_garbage_collect_hole(struct jffs2_sb_info *c, struct jffs2_eraseblock *jeb,
341da177e4SLinus Torvalds 				      struct jffs2_inode_info *f, struct jffs2_full_dnode *fn,
351da177e4SLinus Torvalds 				      uint32_t start, uint32_t end);
361da177e4SLinus Torvalds static int jffs2_garbage_collect_dnode(struct jffs2_sb_info *c, struct jffs2_eraseblock *jeb,
371da177e4SLinus Torvalds 				       struct jffs2_inode_info *f, struct jffs2_full_dnode *fn,
381da177e4SLinus Torvalds 				       uint32_t start, uint32_t end);
391da177e4SLinus Torvalds static int jffs2_garbage_collect_live(struct jffs2_sb_info *c,  struct jffs2_eraseblock *jeb,
401da177e4SLinus Torvalds 			       struct jffs2_raw_node_ref *raw, struct jffs2_inode_info *f);
411da177e4SLinus Torvalds 
421da177e4SLinus Torvalds /* Called with erase_completion_lock held */
431da177e4SLinus Torvalds static struct jffs2_eraseblock *jffs2_find_gc_block(struct jffs2_sb_info *c)
441da177e4SLinus Torvalds {
451da177e4SLinus Torvalds 	struct jffs2_eraseblock *ret;
461da177e4SLinus Torvalds 	struct list_head *nextlist = NULL;
471da177e4SLinus Torvalds 	int n = jiffies % 128;
481da177e4SLinus Torvalds 
491da177e4SLinus Torvalds 	/* Pick an eraseblock to garbage collect next. This is where we'll
501da177e4SLinus Torvalds 	   put the clever wear-levelling algorithms. Eventually.  */
511da177e4SLinus Torvalds 	/* We possibly want to favour the dirtier blocks more when the
521da177e4SLinus Torvalds 	   number of free blocks is low. */
53a42163d7SArtem B. Bityuckiy again:
541da177e4SLinus Torvalds 	if (!list_empty(&c->bad_used_list) && c->nr_free_blocks > c->resv_blocks_gcbad) {
551da177e4SLinus Torvalds 		D1(printk(KERN_DEBUG "Picking block from bad_used_list to GC next\n"));
561da177e4SLinus Torvalds 		nextlist = &c->bad_used_list;
571da177e4SLinus Torvalds 	} else if (n < 50 && !list_empty(&c->erasable_list)) {
581da177e4SLinus Torvalds 		/* Note that most of them will have gone directly to be erased.
591da177e4SLinus Torvalds 		   So don't favour the erasable_list _too_ much. */
601da177e4SLinus Torvalds 		D1(printk(KERN_DEBUG "Picking block from erasable_list to GC next\n"));
611da177e4SLinus Torvalds 		nextlist = &c->erasable_list;
621da177e4SLinus Torvalds 	} else if (n < 110 && !list_empty(&c->very_dirty_list)) {
631da177e4SLinus Torvalds 		/* Most of the time, pick one off the very_dirty list */
641da177e4SLinus Torvalds 		D1(printk(KERN_DEBUG "Picking block from very_dirty_list to GC next\n"));
651da177e4SLinus Torvalds 		nextlist = &c->very_dirty_list;
661da177e4SLinus Torvalds 	} else if (n < 126 && !list_empty(&c->dirty_list)) {
671da177e4SLinus Torvalds 		D1(printk(KERN_DEBUG "Picking block from dirty_list to GC next\n"));
681da177e4SLinus Torvalds 		nextlist = &c->dirty_list;
691da177e4SLinus Torvalds 	} else if (!list_empty(&c->clean_list)) {
701da177e4SLinus Torvalds 		D1(printk(KERN_DEBUG "Picking block from clean_list to GC next\n"));
711da177e4SLinus Torvalds 		nextlist = &c->clean_list;
721da177e4SLinus Torvalds 	} else if (!list_empty(&c->dirty_list)) {
731da177e4SLinus Torvalds 		D1(printk(KERN_DEBUG "Picking block from dirty_list to GC next (clean_list was empty)\n"));
741da177e4SLinus Torvalds 
751da177e4SLinus Torvalds 		nextlist = &c->dirty_list;
761da177e4SLinus Torvalds 	} else if (!list_empty(&c->very_dirty_list)) {
771da177e4SLinus Torvalds 		D1(printk(KERN_DEBUG "Picking block from very_dirty_list to GC next (clean_list and dirty_list were empty)\n"));
781da177e4SLinus Torvalds 		nextlist = &c->very_dirty_list;
791da177e4SLinus Torvalds 	} else if (!list_empty(&c->erasable_list)) {
801da177e4SLinus Torvalds 		D1(printk(KERN_DEBUG "Picking block from erasable_list to GC next (clean_list and {very_,}dirty_list were empty)\n"));
811da177e4SLinus Torvalds 
821da177e4SLinus Torvalds 		nextlist = &c->erasable_list;
83a42163d7SArtem B. Bityuckiy 	} else if (!list_empty(&c->erasable_pending_wbuf_list)) {
84a42163d7SArtem B. Bityuckiy 		/* There are blocks are wating for the wbuf sync */
85a42163d7SArtem B. Bityuckiy 		D1(printk(KERN_DEBUG "Synching wbuf in order to reuse erasable_pending_wbuf_list blocks\n"));
863cceb9f6SArtem B. Bityuckiy 		spin_unlock(&c->erase_completion_lock);
87a42163d7SArtem B. Bityuckiy 		jffs2_flush_wbuf_pad(c);
883cceb9f6SArtem B. Bityuckiy 		spin_lock(&c->erase_completion_lock);
89a42163d7SArtem B. Bityuckiy 		goto again;
901da177e4SLinus Torvalds 	} else {
911da177e4SLinus Torvalds 		/* Eep. All were empty */
921da177e4SLinus Torvalds 		D1(printk(KERN_NOTICE "jffs2: No clean, dirty _or_ erasable blocks to GC from! Where are they all?\n"));
931da177e4SLinus Torvalds 		return NULL;
941da177e4SLinus Torvalds 	}
951da177e4SLinus Torvalds 
961da177e4SLinus Torvalds 	ret = list_entry(nextlist->next, struct jffs2_eraseblock, list);
971da177e4SLinus Torvalds 	list_del(&ret->list);
981da177e4SLinus Torvalds 	c->gcblock = ret;
991da177e4SLinus Torvalds 	ret->gc_node = ret->first_node;
1001da177e4SLinus Torvalds 	if (!ret->gc_node) {
1011da177e4SLinus Torvalds 		printk(KERN_WARNING "Eep. ret->gc_node for block at 0x%08x is NULL\n", ret->offset);
1021da177e4SLinus Torvalds 		BUG();
1031da177e4SLinus Torvalds 	}
1041da177e4SLinus Torvalds 
1051da177e4SLinus Torvalds 	/* Have we accidentally picked a clean block with wasted space ? */
1061da177e4SLinus Torvalds 	if (ret->wasted_size) {
1071da177e4SLinus Torvalds 		D1(printk(KERN_DEBUG "Converting wasted_size %08x to dirty_size\n", ret->wasted_size));
1081da177e4SLinus Torvalds 		ret->dirty_size += ret->wasted_size;
1091da177e4SLinus Torvalds 		c->wasted_size -= ret->wasted_size;
1101da177e4SLinus Torvalds 		c->dirty_size += ret->wasted_size;
1111da177e4SLinus Torvalds 		ret->wasted_size = 0;
1121da177e4SLinus Torvalds 	}
1131da177e4SLinus Torvalds 
1141da177e4SLinus Torvalds 	return ret;
1151da177e4SLinus Torvalds }
1161da177e4SLinus Torvalds 
1171da177e4SLinus Torvalds /* jffs2_garbage_collect_pass
1181da177e4SLinus Torvalds  * Make a single attempt to progress GC. Move one node, and possibly
1191da177e4SLinus Torvalds  * start erasing one eraseblock.
1201da177e4SLinus Torvalds  */
1211da177e4SLinus Torvalds int jffs2_garbage_collect_pass(struct jffs2_sb_info *c)
1221da177e4SLinus Torvalds {
1231da177e4SLinus Torvalds 	struct jffs2_inode_info *f;
1241da177e4SLinus Torvalds 	struct jffs2_inode_cache *ic;
1251da177e4SLinus Torvalds 	struct jffs2_eraseblock *jeb;
1261da177e4SLinus Torvalds 	struct jffs2_raw_node_ref *raw;
1271da177e4SLinus Torvalds 	int ret = 0, inum, nlink;
1281da177e4SLinus Torvalds 
1291da177e4SLinus Torvalds 	if (down_interruptible(&c->alloc_sem))
1301da177e4SLinus Torvalds 		return -EINTR;
1311da177e4SLinus Torvalds 
1321da177e4SLinus Torvalds 	for (;;) {
1331da177e4SLinus Torvalds 		spin_lock(&c->erase_completion_lock);
1341da177e4SLinus Torvalds 		if (!c->unchecked_size)
1351da177e4SLinus Torvalds 			break;
1361da177e4SLinus Torvalds 
1371da177e4SLinus Torvalds 		/* We can't start doing GC yet. We haven't finished checking
1381da177e4SLinus Torvalds 		   the node CRCs etc. Do it now. */
1391da177e4SLinus Torvalds 
1401da177e4SLinus Torvalds 		/* checked_ino is protected by the alloc_sem */
1411da177e4SLinus Torvalds 		if (c->checked_ino > c->highest_ino) {
1421da177e4SLinus Torvalds 			printk(KERN_CRIT "Checked all inodes but still 0x%x bytes of unchecked space?\n",
1431da177e4SLinus Torvalds 			       c->unchecked_size);
144e0c8e42fSArtem B. Bityutskiy 			jffs2_dbg_dump_block_lists_nolock(c);
1451da177e4SLinus Torvalds 			spin_unlock(&c->erase_completion_lock);
1461da177e4SLinus Torvalds 			BUG();
1471da177e4SLinus Torvalds 		}
1481da177e4SLinus Torvalds 
1491da177e4SLinus Torvalds 		spin_unlock(&c->erase_completion_lock);
1501da177e4SLinus Torvalds 
1511da177e4SLinus Torvalds 		spin_lock(&c->inocache_lock);
1521da177e4SLinus Torvalds 
1531da177e4SLinus Torvalds 		ic = jffs2_get_ino_cache(c, c->checked_ino++);
1541da177e4SLinus Torvalds 
1551da177e4SLinus Torvalds 		if (!ic) {
1561da177e4SLinus Torvalds 			spin_unlock(&c->inocache_lock);
1571da177e4SLinus Torvalds 			continue;
1581da177e4SLinus Torvalds 		}
1591da177e4SLinus Torvalds 
1601da177e4SLinus Torvalds 		if (!ic->nlink) {
1611da177e4SLinus Torvalds 			D1(printk(KERN_DEBUG "Skipping check of ino #%d with nlink zero\n",
1621da177e4SLinus Torvalds 				  ic->ino));
1631da177e4SLinus Torvalds 			spin_unlock(&c->inocache_lock);
1641da177e4SLinus Torvalds 			continue;
1651da177e4SLinus Torvalds 		}
1661da177e4SLinus Torvalds 		switch(ic->state) {
1671da177e4SLinus Torvalds 		case INO_STATE_CHECKEDABSENT:
1681da177e4SLinus Torvalds 		case INO_STATE_PRESENT:
1691da177e4SLinus Torvalds 			D1(printk(KERN_DEBUG "Skipping ino #%u already checked\n", ic->ino));
1701da177e4SLinus Torvalds 			spin_unlock(&c->inocache_lock);
1711da177e4SLinus Torvalds 			continue;
1721da177e4SLinus Torvalds 
1731da177e4SLinus Torvalds 		case INO_STATE_GC:
1741da177e4SLinus Torvalds 		case INO_STATE_CHECKING:
1751da177e4SLinus Torvalds 			printk(KERN_WARNING "Inode #%u is in state %d during CRC check phase!\n", ic->ino, ic->state);
1761da177e4SLinus Torvalds 			spin_unlock(&c->inocache_lock);
1771da177e4SLinus Torvalds 			BUG();
1781da177e4SLinus Torvalds 
1791da177e4SLinus Torvalds 		case INO_STATE_READING:
1801da177e4SLinus Torvalds 			/* We need to wait for it to finish, lest we move on
1811da177e4SLinus Torvalds 			   and trigger the BUG() above while we haven't yet
1821da177e4SLinus Torvalds 			   finished checking all its nodes */
1831da177e4SLinus Torvalds 			D1(printk(KERN_DEBUG "Waiting for ino #%u to finish reading\n", ic->ino));
184d96fb997SDavid Woodhouse 			/* We need to come back again for the _same_ inode. We've
185d96fb997SDavid Woodhouse 			 made no progress in this case, but that should be OK */
186d96fb997SDavid Woodhouse 			c->checked_ino--;
187d96fb997SDavid Woodhouse 
1881da177e4SLinus Torvalds 			up(&c->alloc_sem);
1891da177e4SLinus Torvalds 			sleep_on_spinunlock(&c->inocache_wq, &c->inocache_lock);
1901da177e4SLinus Torvalds 			return 0;
1911da177e4SLinus Torvalds 
1921da177e4SLinus Torvalds 		default:
1931da177e4SLinus Torvalds 			BUG();
1941da177e4SLinus Torvalds 
1951da177e4SLinus Torvalds 		case INO_STATE_UNCHECKED:
1961da177e4SLinus Torvalds 			;
1971da177e4SLinus Torvalds 		}
1981da177e4SLinus Torvalds 		ic->state = INO_STATE_CHECKING;
1991da177e4SLinus Torvalds 		spin_unlock(&c->inocache_lock);
2001da177e4SLinus Torvalds 
2011da177e4SLinus Torvalds 		D1(printk(KERN_DEBUG "jffs2_garbage_collect_pass() triggering inode scan of ino#%u\n", ic->ino));
2021da177e4SLinus Torvalds 
2031da177e4SLinus Torvalds 		ret = jffs2_do_crccheck_inode(c, ic);
2041da177e4SLinus Torvalds 		if (ret)
2051da177e4SLinus Torvalds 			printk(KERN_WARNING "Returned error for crccheck of ino #%u. Expect badness...\n", ic->ino);
2061da177e4SLinus Torvalds 
2071da177e4SLinus Torvalds 		jffs2_set_inocache_state(c, ic, INO_STATE_CHECKEDABSENT);
2081da177e4SLinus Torvalds 		up(&c->alloc_sem);
2091da177e4SLinus Torvalds 		return ret;
2101da177e4SLinus Torvalds 	}
2111da177e4SLinus Torvalds 
2121da177e4SLinus Torvalds 	/* First, work out which block we're garbage-collecting */
2131da177e4SLinus Torvalds 	jeb = c->gcblock;
2141da177e4SLinus Torvalds 
2151da177e4SLinus Torvalds 	if (!jeb)
2161da177e4SLinus Torvalds 		jeb = jffs2_find_gc_block(c);
2171da177e4SLinus Torvalds 
2181da177e4SLinus Torvalds 	if (!jeb) {
2191da177e4SLinus Torvalds 		D1 (printk(KERN_NOTICE "jffs2: Couldn't find erase block to garbage collect!\n"));
2201da177e4SLinus Torvalds 		spin_unlock(&c->erase_completion_lock);
2211da177e4SLinus Torvalds 		up(&c->alloc_sem);
2221da177e4SLinus Torvalds 		return -EIO;
2231da177e4SLinus Torvalds 	}
2241da177e4SLinus Torvalds 
2251da177e4SLinus Torvalds 	D1(printk(KERN_DEBUG "GC from block %08x, used_size %08x, dirty_size %08x, free_size %08x\n", jeb->offset, jeb->used_size, jeb->dirty_size, jeb->free_size));
2261da177e4SLinus Torvalds 	D1(if (c->nextblock)
2271da177e4SLinus Torvalds 	   printk(KERN_DEBUG "Nextblock at  %08x, used_size %08x, dirty_size %08x, wasted_size %08x, free_size %08x\n", c->nextblock->offset, c->nextblock->used_size, c->nextblock->dirty_size, c->nextblock->wasted_size, c->nextblock->free_size));
2281da177e4SLinus Torvalds 
2291da177e4SLinus Torvalds 	if (!jeb->used_size) {
2301da177e4SLinus Torvalds 		up(&c->alloc_sem);
2311da177e4SLinus Torvalds 		goto eraseit;
2321da177e4SLinus Torvalds 	}
2331da177e4SLinus Torvalds 
2341da177e4SLinus Torvalds 	raw = jeb->gc_node;
2351da177e4SLinus Torvalds 
2361da177e4SLinus Torvalds 	while(ref_obsolete(raw)) {
2371da177e4SLinus Torvalds 		D1(printk(KERN_DEBUG "Node at 0x%08x is obsolete... skipping\n", ref_offset(raw)));
2381da177e4SLinus Torvalds 		raw = raw->next_phys;
2391da177e4SLinus Torvalds 		if (unlikely(!raw)) {
2401da177e4SLinus Torvalds 			printk(KERN_WARNING "eep. End of raw list while still supposedly nodes to GC\n");
2411da177e4SLinus Torvalds 			printk(KERN_WARNING "erase block at 0x%08x. free_size 0x%08x, dirty_size 0x%08x, used_size 0x%08x\n",
2421da177e4SLinus Torvalds 			       jeb->offset, jeb->free_size, jeb->dirty_size, jeb->used_size);
2431da177e4SLinus Torvalds 			jeb->gc_node = raw;
2441da177e4SLinus Torvalds 			spin_unlock(&c->erase_completion_lock);
2451da177e4SLinus Torvalds 			up(&c->alloc_sem);
2461da177e4SLinus Torvalds 			BUG();
2471da177e4SLinus Torvalds 		}
2481da177e4SLinus Torvalds 	}
2491da177e4SLinus Torvalds 	jeb->gc_node = raw;
2501da177e4SLinus Torvalds 
2511da177e4SLinus Torvalds 	D1(printk(KERN_DEBUG "Going to garbage collect node at 0x%08x\n", ref_offset(raw)));
2521da177e4SLinus Torvalds 
2531da177e4SLinus Torvalds 	if (!raw->next_in_ino) {
2541da177e4SLinus Torvalds 		/* Inode-less node. Clean marker, snapshot or something like that */
2551da177e4SLinus Torvalds 		/* FIXME: If it's something that needs to be copied, including something
2561da177e4SLinus Torvalds 		   we don't grok that has JFFS2_NODETYPE_RWCOMPAT_COPY, we should do so */
2571da177e4SLinus Torvalds 		spin_unlock(&c->erase_completion_lock);
2581da177e4SLinus Torvalds 		jffs2_mark_node_obsolete(c, raw);
2591da177e4SLinus Torvalds 		up(&c->alloc_sem);
2601da177e4SLinus Torvalds 		goto eraseit_lock;
2611da177e4SLinus Torvalds 	}
2621da177e4SLinus Torvalds 
2631da177e4SLinus Torvalds 	ic = jffs2_raw_ref_to_ic(raw);
2641da177e4SLinus Torvalds 
2651da177e4SLinus Torvalds 	/* We need to hold the inocache. Either the erase_completion_lock or
2661da177e4SLinus Torvalds 	   the inocache_lock are sufficient; we trade down since the inocache_lock
2671da177e4SLinus Torvalds 	   causes less contention. */
2681da177e4SLinus Torvalds 	spin_lock(&c->inocache_lock);
2691da177e4SLinus Torvalds 
2701da177e4SLinus Torvalds 	spin_unlock(&c->erase_completion_lock);
2711da177e4SLinus Torvalds 
2721da177e4SLinus Torvalds 	D1(printk(KERN_DEBUG "jffs2_garbage_collect_pass collecting from block @0x%08x. Node @0x%08x(%d), ino #%u\n", jeb->offset, ref_offset(raw), ref_flags(raw), ic->ino));
2731da177e4SLinus Torvalds 
2741da177e4SLinus Torvalds 	/* Three possibilities:
2751da177e4SLinus Torvalds 	   1. Inode is already in-core. We must iget it and do proper
2761da177e4SLinus Torvalds 	      updating to its fragtree, etc.
2771da177e4SLinus Torvalds 	   2. Inode is not in-core, node is REF_PRISTINE. We lock the
2781da177e4SLinus Torvalds 	      inocache to prevent a read_inode(), copy the node intact.
2791da177e4SLinus Torvalds 	   3. Inode is not in-core, node is not pristine. We must iget()
2801da177e4SLinus Torvalds 	      and take the slow path.
2811da177e4SLinus Torvalds 	*/
2821da177e4SLinus Torvalds 
2831da177e4SLinus Torvalds 	switch(ic->state) {
2841da177e4SLinus Torvalds 	case INO_STATE_CHECKEDABSENT:
2851da177e4SLinus Torvalds 		/* It's been checked, but it's not currently in-core.
2861da177e4SLinus Torvalds 		   We can just copy any pristine nodes, but have
2871da177e4SLinus Torvalds 		   to prevent anyone else from doing read_inode() while
2881da177e4SLinus Torvalds 		   we're at it, so we set the state accordingly */
2891da177e4SLinus Torvalds 		if (ref_flags(raw) == REF_PRISTINE)
2901da177e4SLinus Torvalds 			ic->state = INO_STATE_GC;
2911da177e4SLinus Torvalds 		else {
2921da177e4SLinus Torvalds 			D1(printk(KERN_DEBUG "Ino #%u is absent but node not REF_PRISTINE. Reading.\n",
2931da177e4SLinus Torvalds 				  ic->ino));
2941da177e4SLinus Torvalds 		}
2951da177e4SLinus Torvalds 		break;
2961da177e4SLinus Torvalds 
2971da177e4SLinus Torvalds 	case INO_STATE_PRESENT:
2981da177e4SLinus Torvalds 		/* It's in-core. GC must iget() it. */
2991da177e4SLinus Torvalds 		break;
3001da177e4SLinus Torvalds 
3011da177e4SLinus Torvalds 	case INO_STATE_UNCHECKED:
3021da177e4SLinus Torvalds 	case INO_STATE_CHECKING:
3031da177e4SLinus Torvalds 	case INO_STATE_GC:
3041da177e4SLinus Torvalds 		/* Should never happen. We should have finished checking
3051da177e4SLinus Torvalds 		   by the time we actually start doing any GC, and since
3061da177e4SLinus Torvalds 		   we're holding the alloc_sem, no other garbage collection
3071da177e4SLinus Torvalds 		   can happen.
3081da177e4SLinus Torvalds 		*/
3091da177e4SLinus Torvalds 		printk(KERN_CRIT "Inode #%u already in state %d in jffs2_garbage_collect_pass()!\n",
3101da177e4SLinus Torvalds 		       ic->ino, ic->state);
3111da177e4SLinus Torvalds 		up(&c->alloc_sem);
3121da177e4SLinus Torvalds 		spin_unlock(&c->inocache_lock);
3131da177e4SLinus Torvalds 		BUG();
3141da177e4SLinus Torvalds 
3151da177e4SLinus Torvalds 	case INO_STATE_READING:
3161da177e4SLinus Torvalds 		/* Someone's currently trying to read it. We must wait for
3171da177e4SLinus Torvalds 		   them to finish and then go through the full iget() route
3181da177e4SLinus Torvalds 		   to do the GC. However, sometimes read_inode() needs to get
3191da177e4SLinus Torvalds 		   the alloc_sem() (for marking nodes invalid) so we must
3201da177e4SLinus Torvalds 		   drop the alloc_sem before sleeping. */
3211da177e4SLinus Torvalds 
3221da177e4SLinus Torvalds 		up(&c->alloc_sem);
3231da177e4SLinus Torvalds 		D1(printk(KERN_DEBUG "jffs2_garbage_collect_pass() waiting for ino #%u in state %d\n",
3241da177e4SLinus Torvalds 			  ic->ino, ic->state));
3251da177e4SLinus Torvalds 		sleep_on_spinunlock(&c->inocache_wq, &c->inocache_lock);
3261da177e4SLinus Torvalds 		/* And because we dropped the alloc_sem we must start again from the
3271da177e4SLinus Torvalds 		   beginning. Ponder chance of livelock here -- we're returning success
3281da177e4SLinus Torvalds 		   without actually making any progress.
3291da177e4SLinus Torvalds 
3301da177e4SLinus Torvalds 		   Q: What are the chances that the inode is back in INO_STATE_READING
3311da177e4SLinus Torvalds 		   again by the time we next enter this function? And that this happens
3321da177e4SLinus Torvalds 		   enough times to cause a real delay?
3331da177e4SLinus Torvalds 
3341da177e4SLinus Torvalds 		   A: Small enough that I don't care :)
3351da177e4SLinus Torvalds 		*/
3361da177e4SLinus Torvalds 		return 0;
3371da177e4SLinus Torvalds 	}
3381da177e4SLinus Torvalds 
3391da177e4SLinus Torvalds 	/* OK. Now if the inode is in state INO_STATE_GC, we are going to copy the
3401da177e4SLinus Torvalds 	   node intact, and we don't have to muck about with the fragtree etc.
3411da177e4SLinus Torvalds 	   because we know it's not in-core. If it _was_ in-core, we go through
3421da177e4SLinus Torvalds 	   all the iget() crap anyway */
3431da177e4SLinus Torvalds 
3441da177e4SLinus Torvalds 	if (ic->state == INO_STATE_GC) {
3451da177e4SLinus Torvalds 		spin_unlock(&c->inocache_lock);
3461da177e4SLinus Torvalds 
3471da177e4SLinus Torvalds 		ret = jffs2_garbage_collect_pristine(c, ic, raw);
3481da177e4SLinus Torvalds 
3491da177e4SLinus Torvalds 		spin_lock(&c->inocache_lock);
3501da177e4SLinus Torvalds 		ic->state = INO_STATE_CHECKEDABSENT;
3511da177e4SLinus Torvalds 		wake_up(&c->inocache_wq);
3521da177e4SLinus Torvalds 
3531da177e4SLinus Torvalds 		if (ret != -EBADFD) {
3541da177e4SLinus Torvalds 			spin_unlock(&c->inocache_lock);
3551da177e4SLinus Torvalds 			goto release_sem;
3561da177e4SLinus Torvalds 		}
3571da177e4SLinus Torvalds 
3581da177e4SLinus Torvalds 		/* Fall through if it wanted us to, with inocache_lock held */
3591da177e4SLinus Torvalds 	}
3601da177e4SLinus Torvalds 
3611da177e4SLinus Torvalds 	/* Prevent the fairly unlikely race where the gcblock is
3621da177e4SLinus Torvalds 	   entirely obsoleted by the final close of a file which had
3631da177e4SLinus Torvalds 	   the only valid nodes in the block, followed by erasure,
3641da177e4SLinus Torvalds 	   followed by freeing of the ic because the erased block(s)
3651da177e4SLinus Torvalds 	   held _all_ the nodes of that inode.... never been seen but
3661da177e4SLinus Torvalds 	   it's vaguely possible. */
3671da177e4SLinus Torvalds 
3681da177e4SLinus Torvalds 	inum = ic->ino;
3691da177e4SLinus Torvalds 	nlink = ic->nlink;
3701da177e4SLinus Torvalds 	spin_unlock(&c->inocache_lock);
3711da177e4SLinus Torvalds 
3721da177e4SLinus Torvalds 	f = jffs2_gc_fetch_inode(c, inum, nlink);
3731da177e4SLinus Torvalds 	if (IS_ERR(f)) {
3741da177e4SLinus Torvalds 		ret = PTR_ERR(f);
3751da177e4SLinus Torvalds 		goto release_sem;
3761da177e4SLinus Torvalds 	}
3771da177e4SLinus Torvalds 	if (!f) {
3781da177e4SLinus Torvalds 		ret = 0;
3791da177e4SLinus Torvalds 		goto release_sem;
3801da177e4SLinus Torvalds 	}
3811da177e4SLinus Torvalds 
3821da177e4SLinus Torvalds 	ret = jffs2_garbage_collect_live(c, jeb, raw, f);
3831da177e4SLinus Torvalds 
3841da177e4SLinus Torvalds 	jffs2_gc_release_inode(c, f);
3851da177e4SLinus Torvalds 
3861da177e4SLinus Torvalds  release_sem:
3871da177e4SLinus Torvalds 	up(&c->alloc_sem);
3881da177e4SLinus Torvalds 
3891da177e4SLinus Torvalds  eraseit_lock:
3901da177e4SLinus Torvalds 	/* If we've finished this block, start it erasing */
3911da177e4SLinus Torvalds 	spin_lock(&c->erase_completion_lock);
3921da177e4SLinus Torvalds 
3931da177e4SLinus Torvalds  eraseit:
3941da177e4SLinus Torvalds 	if (c->gcblock && !c->gcblock->used_size) {
3951da177e4SLinus Torvalds 		D1(printk(KERN_DEBUG "Block at 0x%08x completely obsoleted by GC. Moving to erase_pending_list\n", c->gcblock->offset));
3961da177e4SLinus Torvalds 		/* We're GC'ing an empty block? */
3971da177e4SLinus Torvalds 		list_add_tail(&c->gcblock->list, &c->erase_pending_list);
3981da177e4SLinus Torvalds 		c->gcblock = NULL;
3991da177e4SLinus Torvalds 		c->nr_erasing_blocks++;
4001da177e4SLinus Torvalds 		jffs2_erase_pending_trigger(c);
4011da177e4SLinus Torvalds 	}
4021da177e4SLinus Torvalds 	spin_unlock(&c->erase_completion_lock);
4031da177e4SLinus Torvalds 
4041da177e4SLinus Torvalds 	return ret;
4051da177e4SLinus Torvalds }
4061da177e4SLinus Torvalds 
4071da177e4SLinus Torvalds static int jffs2_garbage_collect_live(struct jffs2_sb_info *c,  struct jffs2_eraseblock *jeb,
4081da177e4SLinus Torvalds 				      struct jffs2_raw_node_ref *raw, struct jffs2_inode_info *f)
4091da177e4SLinus Torvalds {
4101da177e4SLinus Torvalds 	struct jffs2_node_frag *frag;
4111da177e4SLinus Torvalds 	struct jffs2_full_dnode *fn = NULL;
4121da177e4SLinus Torvalds 	struct jffs2_full_dirent *fd;
4131da177e4SLinus Torvalds 	uint32_t start = 0, end = 0, nrfrags = 0;
4141da177e4SLinus Torvalds 	int ret = 0;
4151da177e4SLinus Torvalds 
4161da177e4SLinus Torvalds 	down(&f->sem);
4171da177e4SLinus Torvalds 
4181da177e4SLinus Torvalds 	/* Now we have the lock for this inode. Check that it's still the one at the head
4191da177e4SLinus Torvalds 	   of the list. */
4201da177e4SLinus Torvalds 
4211da177e4SLinus Torvalds 	spin_lock(&c->erase_completion_lock);
4221da177e4SLinus Torvalds 
4231da177e4SLinus Torvalds 	if (c->gcblock != jeb) {
4241da177e4SLinus Torvalds 		spin_unlock(&c->erase_completion_lock);
4251da177e4SLinus Torvalds 		D1(printk(KERN_DEBUG "GC block is no longer gcblock. Restart\n"));
4261da177e4SLinus Torvalds 		goto upnout;
4271da177e4SLinus Torvalds 	}
4281da177e4SLinus Torvalds 	if (ref_obsolete(raw)) {
4291da177e4SLinus Torvalds 		spin_unlock(&c->erase_completion_lock);
4301da177e4SLinus Torvalds 		D1(printk(KERN_DEBUG "node to be GC'd was obsoleted in the meantime.\n"));
4311da177e4SLinus Torvalds 		/* They'll call again */
4321da177e4SLinus Torvalds 		goto upnout;
4331da177e4SLinus Torvalds 	}
4341da177e4SLinus Torvalds 	spin_unlock(&c->erase_completion_lock);
4351da177e4SLinus Torvalds 
4361da177e4SLinus Torvalds 	/* OK. Looks safe. And nobody can get us now because we have the semaphore. Move the block */
4371da177e4SLinus Torvalds 	if (f->metadata && f->metadata->raw == raw) {
4381da177e4SLinus Torvalds 		fn = f->metadata;
4391da177e4SLinus Torvalds 		ret = jffs2_garbage_collect_metadata(c, jeb, f, fn);
4401da177e4SLinus Torvalds 		goto upnout;
4411da177e4SLinus Torvalds 	}
4421da177e4SLinus Torvalds 
4431da177e4SLinus Torvalds 	/* FIXME. Read node and do lookup? */
4441da177e4SLinus Torvalds 	for (frag = frag_first(&f->fragtree); frag; frag = frag_next(frag)) {
4451da177e4SLinus Torvalds 		if (frag->node && frag->node->raw == raw) {
4461da177e4SLinus Torvalds 			fn = frag->node;
4471da177e4SLinus Torvalds 			end = frag->ofs + frag->size;
4481da177e4SLinus Torvalds 			if (!nrfrags++)
4491da177e4SLinus Torvalds 				start = frag->ofs;
4501da177e4SLinus Torvalds 			if (nrfrags == frag->node->frags)
4511da177e4SLinus Torvalds 				break; /* We've found them all */
4521da177e4SLinus Torvalds 		}
4531da177e4SLinus Torvalds 	}
4541da177e4SLinus Torvalds 	if (fn) {
4551da177e4SLinus Torvalds 		if (ref_flags(raw) == REF_PRISTINE) {
4561da177e4SLinus Torvalds 			ret = jffs2_garbage_collect_pristine(c, f->inocache, raw);
4571da177e4SLinus Torvalds 			if (!ret) {
4581da177e4SLinus Torvalds 				/* Urgh. Return it sensibly. */
4591da177e4SLinus Torvalds 				frag->node->raw = f->inocache->nodes;
4601da177e4SLinus Torvalds 			}
4611da177e4SLinus Torvalds 			if (ret != -EBADFD)
4621da177e4SLinus Torvalds 				goto upnout;
4631da177e4SLinus Torvalds 		}
4641da177e4SLinus Torvalds 		/* We found a datanode. Do the GC */
4651da177e4SLinus Torvalds 		if((start >> PAGE_CACHE_SHIFT) < ((end-1) >> PAGE_CACHE_SHIFT)) {
4661da177e4SLinus Torvalds 			/* It crosses a page boundary. Therefore, it must be a hole. */
4671da177e4SLinus Torvalds 			ret = jffs2_garbage_collect_hole(c, jeb, f, fn, start, end);
4681da177e4SLinus Torvalds 		} else {
4691da177e4SLinus Torvalds 			/* It could still be a hole. But we GC the page this way anyway */
4701da177e4SLinus Torvalds 			ret = jffs2_garbage_collect_dnode(c, jeb, f, fn, start, end);
4711da177e4SLinus Torvalds 		}
4721da177e4SLinus Torvalds 		goto upnout;
4731da177e4SLinus Torvalds 	}
4741da177e4SLinus Torvalds 
4751da177e4SLinus Torvalds 	/* Wasn't a dnode. Try dirent */
4761da177e4SLinus Torvalds 	for (fd = f->dents; fd; fd=fd->next) {
4771da177e4SLinus Torvalds 		if (fd->raw == raw)
4781da177e4SLinus Torvalds 			break;
4791da177e4SLinus Torvalds 	}
4801da177e4SLinus Torvalds 
4811da177e4SLinus Torvalds 	if (fd && fd->ino) {
4821da177e4SLinus Torvalds 		ret = jffs2_garbage_collect_dirent(c, jeb, f, fd);
4831da177e4SLinus Torvalds 	} else if (fd) {
4841da177e4SLinus Torvalds 		ret = jffs2_garbage_collect_deletion_dirent(c, jeb, f, fd);
4851da177e4SLinus Torvalds 	} else {
4861da177e4SLinus Torvalds 		printk(KERN_WARNING "Raw node at 0x%08x wasn't in node lists for ino #%u\n",
4871da177e4SLinus Torvalds 		       ref_offset(raw), f->inocache->ino);
4881da177e4SLinus Torvalds 		if (ref_obsolete(raw)) {
4891da177e4SLinus Torvalds 			printk(KERN_WARNING "But it's obsolete so we don't mind too much\n");
4901da177e4SLinus Torvalds 		} else {
491e0c8e42fSArtem B. Bityutskiy 			jffs2_dbg_dump_node(c, ref_offset(raw));
492e0c8e42fSArtem B. Bityutskiy 			BUG();
4931da177e4SLinus Torvalds 		}
4941da177e4SLinus Torvalds 	}
4951da177e4SLinus Torvalds  upnout:
4961da177e4SLinus Torvalds 	up(&f->sem);
4971da177e4SLinus Torvalds 
4981da177e4SLinus Torvalds 	return ret;
4991da177e4SLinus Torvalds }
5001da177e4SLinus Torvalds 
5011da177e4SLinus Torvalds static int jffs2_garbage_collect_pristine(struct jffs2_sb_info *c,
5021da177e4SLinus Torvalds 					  struct jffs2_inode_cache *ic,
5031da177e4SLinus Torvalds 					  struct jffs2_raw_node_ref *raw)
5041da177e4SLinus Torvalds {
5051da177e4SLinus Torvalds 	union jffs2_node_union *node;
5061da177e4SLinus Torvalds 	struct jffs2_raw_node_ref *nraw;
5071da177e4SLinus Torvalds 	size_t retlen;
5081da177e4SLinus Torvalds 	int ret;
5091da177e4SLinus Torvalds 	uint32_t phys_ofs, alloclen;
5101da177e4SLinus Torvalds 	uint32_t crc, rawlen;
5111da177e4SLinus Torvalds 	int retried = 0;
5121da177e4SLinus Torvalds 
5131da177e4SLinus Torvalds 	D1(printk(KERN_DEBUG "Going to GC REF_PRISTINE node at 0x%08x\n", ref_offset(raw)));
5141da177e4SLinus Torvalds 
5151da177e4SLinus Torvalds 	rawlen = ref_totlen(c, c->gcblock, raw);
5161da177e4SLinus Torvalds 
5171da177e4SLinus Torvalds 	/* Ask for a small amount of space (or the totlen if smaller) because we
5181da177e4SLinus Torvalds 	   don't want to force wastage of the end of a block if splitting would
5191da177e4SLinus Torvalds 	   work. */
520e631ddbaSFerenc Havasi 	ret = jffs2_reserve_space_gc(c, min_t(uint32_t, sizeof(struct jffs2_raw_inode) +
521e631ddbaSFerenc Havasi 				JFFS2_MIN_DATA_LEN, rawlen), &phys_ofs, &alloclen, rawlen);
522e631ddbaSFerenc Havasi 				/* this is not the exact summary size of it,
523e631ddbaSFerenc Havasi 					it is only an upper estimation */
524e631ddbaSFerenc Havasi 
5251da177e4SLinus Torvalds 	if (ret)
5261da177e4SLinus Torvalds 		return ret;
5271da177e4SLinus Torvalds 
5281da177e4SLinus Torvalds 	if (alloclen < rawlen) {
5291da177e4SLinus Torvalds 		/* Doesn't fit untouched. We'll go the old route and split it */
5301da177e4SLinus Torvalds 		return -EBADFD;
5311da177e4SLinus Torvalds 	}
5321da177e4SLinus Torvalds 
5331da177e4SLinus Torvalds 	node = kmalloc(rawlen, GFP_KERNEL);
5341da177e4SLinus Torvalds 	if (!node)
5351da177e4SLinus Torvalds                return -ENOMEM;
5361da177e4SLinus Torvalds 
5371da177e4SLinus Torvalds 	ret = jffs2_flash_read(c, ref_offset(raw), rawlen, &retlen, (char *)node);
5381da177e4SLinus Torvalds 	if (!ret && retlen != rawlen)
5391da177e4SLinus Torvalds 		ret = -EIO;
5401da177e4SLinus Torvalds 	if (ret)
5411da177e4SLinus Torvalds 		goto out_node;
5421da177e4SLinus Torvalds 
5431da177e4SLinus Torvalds 	crc = crc32(0, node, sizeof(struct jffs2_unknown_node)-4);
5441da177e4SLinus Torvalds 	if (je32_to_cpu(node->u.hdr_crc) != crc) {
5451da177e4SLinus Torvalds 		printk(KERN_WARNING "Header CRC failed on REF_PRISTINE node at 0x%08x: Read 0x%08x, calculated 0x%08x\n",
5461da177e4SLinus Torvalds 		       ref_offset(raw), je32_to_cpu(node->u.hdr_crc), crc);
5471da177e4SLinus Torvalds 		goto bail;
5481da177e4SLinus Torvalds 	}
5491da177e4SLinus Torvalds 
5501da177e4SLinus Torvalds 	switch(je16_to_cpu(node->u.nodetype)) {
5511da177e4SLinus Torvalds 	case JFFS2_NODETYPE_INODE:
5521da177e4SLinus Torvalds 		crc = crc32(0, node, sizeof(node->i)-8);
5531da177e4SLinus Torvalds 		if (je32_to_cpu(node->i.node_crc) != crc) {
5541da177e4SLinus Torvalds 			printk(KERN_WARNING "Node CRC failed on REF_PRISTINE data node at 0x%08x: Read 0x%08x, calculated 0x%08x\n",
5551da177e4SLinus Torvalds 			       ref_offset(raw), je32_to_cpu(node->i.node_crc), crc);
5561da177e4SLinus Torvalds 			goto bail;
5571da177e4SLinus Torvalds 		}
5581da177e4SLinus Torvalds 
5591da177e4SLinus Torvalds 		if (je32_to_cpu(node->i.dsize)) {
5601da177e4SLinus Torvalds 			crc = crc32(0, node->i.data, je32_to_cpu(node->i.csize));
5611da177e4SLinus Torvalds 			if (je32_to_cpu(node->i.data_crc) != crc) {
5621da177e4SLinus Torvalds 				printk(KERN_WARNING "Data CRC failed on REF_PRISTINE data node at 0x%08x: Read 0x%08x, calculated 0x%08x\n",
5631da177e4SLinus Torvalds 				       ref_offset(raw), je32_to_cpu(node->i.data_crc), crc);
5641da177e4SLinus Torvalds 				goto bail;
5651da177e4SLinus Torvalds 			}
5661da177e4SLinus Torvalds 		}
5671da177e4SLinus Torvalds 		break;
5681da177e4SLinus Torvalds 
5691da177e4SLinus Torvalds 	case JFFS2_NODETYPE_DIRENT:
5701da177e4SLinus Torvalds 		crc = crc32(0, node, sizeof(node->d)-8);
5711da177e4SLinus Torvalds 		if (je32_to_cpu(node->d.node_crc) != crc) {
5721da177e4SLinus Torvalds 			printk(KERN_WARNING "Node CRC failed on REF_PRISTINE dirent node at 0x%08x: Read 0x%08x, calculated 0x%08x\n",
5731da177e4SLinus Torvalds 			       ref_offset(raw), je32_to_cpu(node->d.node_crc), crc);
5741da177e4SLinus Torvalds 			goto bail;
5751da177e4SLinus Torvalds 		}
5761da177e4SLinus Torvalds 
5771da177e4SLinus Torvalds 		if (node->d.nsize) {
5781da177e4SLinus Torvalds 			crc = crc32(0, node->d.name, node->d.nsize);
5791da177e4SLinus Torvalds 			if (je32_to_cpu(node->d.name_crc) != crc) {
5801da177e4SLinus Torvalds 				printk(KERN_WARNING "Name CRC failed on REF_PRISTINE dirent ode at 0x%08x: Read 0x%08x, calculated 0x%08x\n",
5811da177e4SLinus Torvalds 				       ref_offset(raw), je32_to_cpu(node->d.name_crc), crc);
5821da177e4SLinus Torvalds 				goto bail;
5831da177e4SLinus Torvalds 			}
5841da177e4SLinus Torvalds 		}
5851da177e4SLinus Torvalds 		break;
5861da177e4SLinus Torvalds 	default:
5871da177e4SLinus Torvalds 		printk(KERN_WARNING "Unknown node type for REF_PRISTINE node at 0x%08x: 0x%04x\n",
5881da177e4SLinus Torvalds 		       ref_offset(raw), je16_to_cpu(node->u.nodetype));
5891da177e4SLinus Torvalds 		goto bail;
5901da177e4SLinus Torvalds 	}
5911da177e4SLinus Torvalds 
5921da177e4SLinus Torvalds 	nraw = jffs2_alloc_raw_node_ref();
5931da177e4SLinus Torvalds 	if (!nraw) {
5941da177e4SLinus Torvalds 		ret = -ENOMEM;
5951da177e4SLinus Torvalds 		goto out_node;
5961da177e4SLinus Torvalds 	}
5971da177e4SLinus Torvalds 
5981da177e4SLinus Torvalds 	/* OK, all the CRCs are good; this node can just be copied as-is. */
5991da177e4SLinus Torvalds  retry:
6001da177e4SLinus Torvalds 	nraw->flash_offset = phys_ofs;
6011da177e4SLinus Torvalds 	nraw->__totlen = rawlen;
6021da177e4SLinus Torvalds 	nraw->next_phys = NULL;
6031da177e4SLinus Torvalds 
6041da177e4SLinus Torvalds 	ret = jffs2_flash_write(c, phys_ofs, rawlen, &retlen, (char *)node);
6051da177e4SLinus Torvalds 
6061da177e4SLinus Torvalds 	if (ret || (retlen != rawlen)) {
6071da177e4SLinus Torvalds 		printk(KERN_NOTICE "Write of %d bytes at 0x%08x failed. returned %d, retlen %zd\n",
6081da177e4SLinus Torvalds                        rawlen, phys_ofs, ret, retlen);
6091da177e4SLinus Torvalds 		if (retlen) {
6101da177e4SLinus Torvalds                         /* Doesn't belong to any inode */
6111da177e4SLinus Torvalds 			nraw->next_in_ino = NULL;
6121da177e4SLinus Torvalds 
6131da177e4SLinus Torvalds 			nraw->flash_offset |= REF_OBSOLETE;
6141da177e4SLinus Torvalds 			jffs2_add_physical_node_ref(c, nraw);
6151da177e4SLinus Torvalds 			jffs2_mark_node_obsolete(c, nraw);
6161da177e4SLinus Torvalds 		} else {
6171da177e4SLinus Torvalds 			printk(KERN_NOTICE "Not marking the space at 0x%08x as dirty because the flash driver returned retlen zero\n", nraw->flash_offset);
6181da177e4SLinus Torvalds                         jffs2_free_raw_node_ref(nraw);
6191da177e4SLinus Torvalds 		}
6201da177e4SLinus Torvalds 		if (!retried && (nraw = jffs2_alloc_raw_node_ref())) {
6211da177e4SLinus Torvalds 			/* Try to reallocate space and retry */
6221da177e4SLinus Torvalds 			uint32_t dummy;
6231da177e4SLinus Torvalds 			struct jffs2_eraseblock *jeb = &c->blocks[phys_ofs / c->sector_size];
6241da177e4SLinus Torvalds 
6251da177e4SLinus Torvalds 			retried = 1;
6261da177e4SLinus Torvalds 
6271da177e4SLinus Torvalds 			D1(printk(KERN_DEBUG "Retrying failed write of REF_PRISTINE node.\n"));
6281da177e4SLinus Torvalds 
629730554d9SArtem B. Bityutskiy 			jffs2_dbg_acct_sanity_check(c,jeb);
630730554d9SArtem B. Bityutskiy 			jffs2_dbg_acct_paranoia_check(c, jeb);
6311da177e4SLinus Torvalds 
632e631ddbaSFerenc Havasi 			ret = jffs2_reserve_space_gc(c, rawlen, &phys_ofs, &dummy, rawlen);
633e631ddbaSFerenc Havasi 						/* this is not the exact summary size of it,
634e631ddbaSFerenc Havasi 							it is only an upper estimation */
6351da177e4SLinus Torvalds 
6361da177e4SLinus Torvalds 			if (!ret) {
6371da177e4SLinus Torvalds 				D1(printk(KERN_DEBUG "Allocated space at 0x%08x to retry failed write.\n", phys_ofs));
6381da177e4SLinus Torvalds 
639730554d9SArtem B. Bityutskiy 				jffs2_dbg_acct_sanity_check(c,jeb);
640730554d9SArtem B. Bityutskiy 				jffs2_dbg_acct_paranoia_check(c, jeb);
6411da177e4SLinus Torvalds 
6421da177e4SLinus Torvalds 				goto retry;
6431da177e4SLinus Torvalds 			}
6441da177e4SLinus Torvalds 			D1(printk(KERN_DEBUG "Failed to allocate space to retry failed write: %d!\n", ret));
6451da177e4SLinus Torvalds 			jffs2_free_raw_node_ref(nraw);
6461da177e4SLinus Torvalds 		}
6471da177e4SLinus Torvalds 
6481da177e4SLinus Torvalds 		jffs2_free_raw_node_ref(nraw);
6491da177e4SLinus Torvalds 		if (!ret)
6501da177e4SLinus Torvalds 			ret = -EIO;
6511da177e4SLinus Torvalds 		goto out_node;
6521da177e4SLinus Torvalds 	}
6531da177e4SLinus Torvalds 	nraw->flash_offset |= REF_PRISTINE;
6541da177e4SLinus Torvalds 	jffs2_add_physical_node_ref(c, nraw);
6551da177e4SLinus Torvalds 
6561da177e4SLinus Torvalds 	/* Link into per-inode list. This is safe because of the ic
6571da177e4SLinus Torvalds 	   state being INO_STATE_GC. Note that if we're doing this
6581da177e4SLinus Torvalds 	   for an inode which is in-core, the 'nraw' pointer is then
6591da177e4SLinus Torvalds 	   going to be fetched from ic->nodes by our caller. */
6601da177e4SLinus Torvalds 	spin_lock(&c->erase_completion_lock);
6611da177e4SLinus Torvalds         nraw->next_in_ino = ic->nodes;
6621da177e4SLinus Torvalds         ic->nodes = nraw;
6631da177e4SLinus Torvalds 	spin_unlock(&c->erase_completion_lock);
6641da177e4SLinus Torvalds 
6651da177e4SLinus Torvalds 	jffs2_mark_node_obsolete(c, raw);
6661da177e4SLinus Torvalds 	D1(printk(KERN_DEBUG "WHEEE! GC REF_PRISTINE node at 0x%08x succeeded\n", ref_offset(raw)));
6671da177e4SLinus Torvalds 
6681da177e4SLinus Torvalds  out_node:
6691da177e4SLinus Torvalds 	kfree(node);
6701da177e4SLinus Torvalds 	return ret;
6711da177e4SLinus Torvalds  bail:
6721da177e4SLinus Torvalds 	ret = -EBADFD;
6731da177e4SLinus Torvalds 	goto out_node;
6741da177e4SLinus Torvalds }
6751da177e4SLinus Torvalds 
6761da177e4SLinus Torvalds static int jffs2_garbage_collect_metadata(struct jffs2_sb_info *c, struct jffs2_eraseblock *jeb,
6771da177e4SLinus Torvalds 					struct jffs2_inode_info *f, struct jffs2_full_dnode *fn)
6781da177e4SLinus Torvalds {
6791da177e4SLinus Torvalds 	struct jffs2_full_dnode *new_fn;
6801da177e4SLinus Torvalds 	struct jffs2_raw_inode ri;
6818557fd51SArtem B. Bityuckiy 	struct jffs2_node_frag *last_frag;
6821da177e4SLinus Torvalds 	jint16_t dev;
6831da177e4SLinus Torvalds 	char *mdata = NULL, mdatalen = 0;
6848557fd51SArtem B. Bityuckiy 	uint32_t alloclen, phys_ofs, ilen;
6851da177e4SLinus Torvalds 	int ret;
6861da177e4SLinus Torvalds 
6871da177e4SLinus Torvalds 	if (S_ISBLK(JFFS2_F_I_MODE(f)) ||
6881da177e4SLinus Torvalds 	    S_ISCHR(JFFS2_F_I_MODE(f)) ) {
6891da177e4SLinus Torvalds 		/* For these, we don't actually need to read the old node */
6901da177e4SLinus Torvalds 		/* FIXME: for minor or major > 255. */
6911da177e4SLinus Torvalds 		dev = cpu_to_je16(((JFFS2_F_I_RDEV_MAJ(f) << 8) |
6921da177e4SLinus Torvalds 			JFFS2_F_I_RDEV_MIN(f)));
6931da177e4SLinus Torvalds 		mdata = (char *)&dev;
6941da177e4SLinus Torvalds 		mdatalen = sizeof(dev);
6951da177e4SLinus Torvalds 		D1(printk(KERN_DEBUG "jffs2_garbage_collect_metadata(): Writing %d bytes of kdev_t\n", mdatalen));
6961da177e4SLinus Torvalds 	} else if (S_ISLNK(JFFS2_F_I_MODE(f))) {
6971da177e4SLinus Torvalds 		mdatalen = fn->size;
6981da177e4SLinus Torvalds 		mdata = kmalloc(fn->size, GFP_KERNEL);
6991da177e4SLinus Torvalds 		if (!mdata) {
7001da177e4SLinus Torvalds 			printk(KERN_WARNING "kmalloc of mdata failed in jffs2_garbage_collect_metadata()\n");
7011da177e4SLinus Torvalds 			return -ENOMEM;
7021da177e4SLinus Torvalds 		}
7031da177e4SLinus Torvalds 		ret = jffs2_read_dnode(c, f, fn, mdata, 0, mdatalen);
7041da177e4SLinus Torvalds 		if (ret) {
7051da177e4SLinus Torvalds 			printk(KERN_WARNING "read of old metadata failed in jffs2_garbage_collect_metadata(): %d\n", ret);
7061da177e4SLinus Torvalds 			kfree(mdata);
7071da177e4SLinus Torvalds 			return ret;
7081da177e4SLinus Torvalds 		}
7091da177e4SLinus Torvalds 		D1(printk(KERN_DEBUG "jffs2_garbage_collect_metadata(): Writing %d bites of symlink target\n", mdatalen));
7101da177e4SLinus Torvalds 
7111da177e4SLinus Torvalds 	}
7121da177e4SLinus Torvalds 
713e631ddbaSFerenc Havasi 	ret = jffs2_reserve_space_gc(c, sizeof(ri) + mdatalen, &phys_ofs, &alloclen,
714e631ddbaSFerenc Havasi 				JFFS2_SUMMARY_INODE_SIZE);
7151da177e4SLinus Torvalds 	if (ret) {
7161da177e4SLinus Torvalds 		printk(KERN_WARNING "jffs2_reserve_space_gc of %zd bytes for garbage_collect_metadata failed: %d\n",
7171da177e4SLinus Torvalds 		       sizeof(ri)+ mdatalen, ret);
7181da177e4SLinus Torvalds 		goto out;
7191da177e4SLinus Torvalds 	}
7201da177e4SLinus Torvalds 
7218557fd51SArtem B. Bityuckiy 	last_frag = frag_last(&f->fragtree);
7228557fd51SArtem B. Bityuckiy 	if (last_frag)
7238557fd51SArtem B. Bityuckiy 		/* Fetch the inode length from the fragtree rather then
7248557fd51SArtem B. Bityuckiy 		 * from i_size since i_size may have not been updated yet */
7258557fd51SArtem B. Bityuckiy 		ilen = last_frag->ofs + last_frag->size;
7268557fd51SArtem B. Bityuckiy 	else
7278557fd51SArtem B. Bityuckiy 		ilen = JFFS2_F_I_SIZE(f);
7288557fd51SArtem B. Bityuckiy 
7291da177e4SLinus Torvalds 	memset(&ri, 0, sizeof(ri));
7301da177e4SLinus Torvalds 	ri.magic = cpu_to_je16(JFFS2_MAGIC_BITMASK);
7311da177e4SLinus Torvalds 	ri.nodetype = cpu_to_je16(JFFS2_NODETYPE_INODE);
7321da177e4SLinus Torvalds 	ri.totlen = cpu_to_je32(sizeof(ri) + mdatalen);
7331da177e4SLinus Torvalds 	ri.hdr_crc = cpu_to_je32(crc32(0, &ri, sizeof(struct jffs2_unknown_node)-4));
7341da177e4SLinus Torvalds 
7351da177e4SLinus Torvalds 	ri.ino = cpu_to_je32(f->inocache->ino);
7361da177e4SLinus Torvalds 	ri.version = cpu_to_je32(++f->highest_version);
7371da177e4SLinus Torvalds 	ri.mode = cpu_to_jemode(JFFS2_F_I_MODE(f));
7381da177e4SLinus Torvalds 	ri.uid = cpu_to_je16(JFFS2_F_I_UID(f));
7391da177e4SLinus Torvalds 	ri.gid = cpu_to_je16(JFFS2_F_I_GID(f));
7408557fd51SArtem B. Bityuckiy 	ri.isize = cpu_to_je32(ilen);
7411da177e4SLinus Torvalds 	ri.atime = cpu_to_je32(JFFS2_F_I_ATIME(f));
7421da177e4SLinus Torvalds 	ri.ctime = cpu_to_je32(JFFS2_F_I_CTIME(f));
7431da177e4SLinus Torvalds 	ri.mtime = cpu_to_je32(JFFS2_F_I_MTIME(f));
7441da177e4SLinus Torvalds 	ri.offset = cpu_to_je32(0);
7451da177e4SLinus Torvalds 	ri.csize = cpu_to_je32(mdatalen);
7461da177e4SLinus Torvalds 	ri.dsize = cpu_to_je32(mdatalen);
7471da177e4SLinus Torvalds 	ri.compr = JFFS2_COMPR_NONE;
7481da177e4SLinus Torvalds 	ri.node_crc = cpu_to_je32(crc32(0, &ri, sizeof(ri)-8));
7491da177e4SLinus Torvalds 	ri.data_crc = cpu_to_je32(crc32(0, mdata, mdatalen));
7501da177e4SLinus Torvalds 
7511da177e4SLinus Torvalds 	new_fn = jffs2_write_dnode(c, f, &ri, mdata, mdatalen, phys_ofs, ALLOC_GC);
7521da177e4SLinus Torvalds 
7531da177e4SLinus Torvalds 	if (IS_ERR(new_fn)) {
7541da177e4SLinus Torvalds 		printk(KERN_WARNING "Error writing new dnode: %ld\n", PTR_ERR(new_fn));
7551da177e4SLinus Torvalds 		ret = PTR_ERR(new_fn);
7561da177e4SLinus Torvalds 		goto out;
7571da177e4SLinus Torvalds 	}
7581da177e4SLinus Torvalds 	jffs2_mark_node_obsolete(c, fn->raw);
7591da177e4SLinus Torvalds 	jffs2_free_full_dnode(fn);
7601da177e4SLinus Torvalds 	f->metadata = new_fn;
7611da177e4SLinus Torvalds  out:
7621da177e4SLinus Torvalds 	if (S_ISLNK(JFFS2_F_I_MODE(f)))
7631da177e4SLinus Torvalds 		kfree(mdata);
7641da177e4SLinus Torvalds 	return ret;
7651da177e4SLinus Torvalds }
7661da177e4SLinus Torvalds 
7671da177e4SLinus Torvalds static int jffs2_garbage_collect_dirent(struct jffs2_sb_info *c, struct jffs2_eraseblock *jeb,
7681da177e4SLinus Torvalds 					struct jffs2_inode_info *f, struct jffs2_full_dirent *fd)
7691da177e4SLinus Torvalds {
7701da177e4SLinus Torvalds 	struct jffs2_full_dirent *new_fd;
7711da177e4SLinus Torvalds 	struct jffs2_raw_dirent rd;
7721da177e4SLinus Torvalds 	uint32_t alloclen, phys_ofs;
7731da177e4SLinus Torvalds 	int ret;
7741da177e4SLinus Torvalds 
7751da177e4SLinus Torvalds 	rd.magic = cpu_to_je16(JFFS2_MAGIC_BITMASK);
7761da177e4SLinus Torvalds 	rd.nodetype = cpu_to_je16(JFFS2_NODETYPE_DIRENT);
7771da177e4SLinus Torvalds 	rd.nsize = strlen(fd->name);
7781da177e4SLinus Torvalds 	rd.totlen = cpu_to_je32(sizeof(rd) + rd.nsize);
7791da177e4SLinus Torvalds 	rd.hdr_crc = cpu_to_je32(crc32(0, &rd, sizeof(struct jffs2_unknown_node)-4));
7801da177e4SLinus Torvalds 
7811da177e4SLinus Torvalds 	rd.pino = cpu_to_je32(f->inocache->ino);
7821da177e4SLinus Torvalds 	rd.version = cpu_to_je32(++f->highest_version);
7831da177e4SLinus Torvalds 	rd.ino = cpu_to_je32(fd->ino);
7843a69e0cdSArtem B. Bityutskiy 	/* If the times on this inode were set by explicit utime() they can be different,
7853a69e0cdSArtem B. Bityutskiy 	   so refrain from splatting them. */
7863a69e0cdSArtem B. Bityutskiy 	if (JFFS2_F_I_MTIME(f) == JFFS2_F_I_CTIME(f))
7873a69e0cdSArtem B. Bityutskiy 		rd.mctime = cpu_to_je32(JFFS2_F_I_MTIME(f));
7883a69e0cdSArtem B. Bityutskiy 	else
7893a69e0cdSArtem B. Bityutskiy 		rd.mctime = cpu_to_je32(0);
7901da177e4SLinus Torvalds 	rd.type = fd->type;
7911da177e4SLinus Torvalds 	rd.node_crc = cpu_to_je32(crc32(0, &rd, sizeof(rd)-8));
7921da177e4SLinus Torvalds 	rd.name_crc = cpu_to_je32(crc32(0, fd->name, rd.nsize));
7931da177e4SLinus Torvalds 
794e631ddbaSFerenc Havasi 	ret = jffs2_reserve_space_gc(c, sizeof(rd)+rd.nsize, &phys_ofs, &alloclen,
795e631ddbaSFerenc Havasi 				JFFS2_SUMMARY_DIRENT_SIZE(rd.nsize));
7961da177e4SLinus Torvalds 	if (ret) {
7971da177e4SLinus Torvalds 		printk(KERN_WARNING "jffs2_reserve_space_gc of %zd bytes for garbage_collect_dirent failed: %d\n",
7981da177e4SLinus Torvalds 		       sizeof(rd)+rd.nsize, ret);
7991da177e4SLinus Torvalds 		return ret;
8001da177e4SLinus Torvalds 	}
8011da177e4SLinus Torvalds 	new_fd = jffs2_write_dirent(c, f, &rd, fd->name, rd.nsize, phys_ofs, ALLOC_GC);
8021da177e4SLinus Torvalds 
8031da177e4SLinus Torvalds 	if (IS_ERR(new_fd)) {
8041da177e4SLinus Torvalds 		printk(KERN_WARNING "jffs2_write_dirent in garbage_collect_dirent failed: %ld\n", PTR_ERR(new_fd));
8051da177e4SLinus Torvalds 		return PTR_ERR(new_fd);
8061da177e4SLinus Torvalds 	}
8071da177e4SLinus Torvalds 	jffs2_add_fd_to_list(c, new_fd, &f->dents);
8081da177e4SLinus Torvalds 	return 0;
8091da177e4SLinus Torvalds }
8101da177e4SLinus Torvalds 
8111da177e4SLinus Torvalds static int jffs2_garbage_collect_deletion_dirent(struct jffs2_sb_info *c, struct jffs2_eraseblock *jeb,
8121da177e4SLinus Torvalds 					struct jffs2_inode_info *f, struct jffs2_full_dirent *fd)
8131da177e4SLinus Torvalds {
8141da177e4SLinus Torvalds 	struct jffs2_full_dirent **fdp = &f->dents;
8151da177e4SLinus Torvalds 	int found = 0;
8161da177e4SLinus Torvalds 
8171da177e4SLinus Torvalds 	/* On a medium where we can't actually mark nodes obsolete
8181da177e4SLinus Torvalds 	   pernamently, such as NAND flash, we need to work out
8191da177e4SLinus Torvalds 	   whether this deletion dirent is still needed to actively
8201da177e4SLinus Torvalds 	   delete a 'real' dirent with the same name that's still
8211da177e4SLinus Torvalds 	   somewhere else on the flash. */
8221da177e4SLinus Torvalds 	if (!jffs2_can_mark_obsolete(c)) {
8231da177e4SLinus Torvalds 		struct jffs2_raw_dirent *rd;
8241da177e4SLinus Torvalds 		struct jffs2_raw_node_ref *raw;
8251da177e4SLinus Torvalds 		int ret;
8261da177e4SLinus Torvalds 		size_t retlen;
8271da177e4SLinus Torvalds 		int name_len = strlen(fd->name);
8281da177e4SLinus Torvalds 		uint32_t name_crc = crc32(0, fd->name, name_len);
8291da177e4SLinus Torvalds 		uint32_t rawlen = ref_totlen(c, jeb, fd->raw);
8301da177e4SLinus Torvalds 
8311da177e4SLinus Torvalds 		rd = kmalloc(rawlen, GFP_KERNEL);
8321da177e4SLinus Torvalds 		if (!rd)
8331da177e4SLinus Torvalds 			return -ENOMEM;
8341da177e4SLinus Torvalds 
8351da177e4SLinus Torvalds 		/* Prevent the erase code from nicking the obsolete node refs while
8361da177e4SLinus Torvalds 		   we're looking at them. I really don't like this extra lock but
8371da177e4SLinus Torvalds 		   can't see any alternative. Suggestions on a postcard to... */
8381da177e4SLinus Torvalds 		down(&c->erase_free_sem);
8391da177e4SLinus Torvalds 
8401da177e4SLinus Torvalds 		for (raw = f->inocache->nodes; raw != (void *)f->inocache; raw = raw->next_in_ino) {
8411da177e4SLinus Torvalds 
8421da177e4SLinus Torvalds 			/* We only care about obsolete ones */
8431da177e4SLinus Torvalds 			if (!(ref_obsolete(raw)))
8441da177e4SLinus Torvalds 				continue;
8451da177e4SLinus Torvalds 
8461da177e4SLinus Torvalds 			/* Any dirent with the same name is going to have the same length... */
8471da177e4SLinus Torvalds 			if (ref_totlen(c, NULL, raw) != rawlen)
8481da177e4SLinus Torvalds 				continue;
8491da177e4SLinus Torvalds 
8501da177e4SLinus Torvalds 			/* Doesn't matter if there's one in the same erase block. We're going to
8511da177e4SLinus Torvalds 			   delete it too at the same time. */
8523be36675SAndrew Victor 			if (SECTOR_ADDR(raw->flash_offset) == SECTOR_ADDR(fd->raw->flash_offset))
8531da177e4SLinus Torvalds 				continue;
8541da177e4SLinus Torvalds 
8551da177e4SLinus Torvalds 			D1(printk(KERN_DEBUG "Check potential deletion dirent at %08x\n", ref_offset(raw)));
8561da177e4SLinus Torvalds 
8571da177e4SLinus Torvalds 			/* This is an obsolete node belonging to the same directory, and it's of the right
8581da177e4SLinus Torvalds 			   length. We need to take a closer look...*/
8591da177e4SLinus Torvalds 			ret = jffs2_flash_read(c, ref_offset(raw), rawlen, &retlen, (char *)rd);
8601da177e4SLinus Torvalds 			if (ret) {
8611da177e4SLinus Torvalds 				printk(KERN_WARNING "jffs2_g_c_deletion_dirent(): Read error (%d) reading obsolete node at %08x\n", ret, ref_offset(raw));
8621da177e4SLinus Torvalds 				/* If we can't read it, we don't need to continue to obsolete it. Continue */
8631da177e4SLinus Torvalds 				continue;
8641da177e4SLinus Torvalds 			}
8651da177e4SLinus Torvalds 			if (retlen != rawlen) {
8661da177e4SLinus Torvalds 				printk(KERN_WARNING "jffs2_g_c_deletion_dirent(): Short read (%zd not %u) reading header from obsolete node at %08x\n",
8671da177e4SLinus Torvalds 				       retlen, rawlen, ref_offset(raw));
8681da177e4SLinus Torvalds 				continue;
8691da177e4SLinus Torvalds 			}
8701da177e4SLinus Torvalds 
8711da177e4SLinus Torvalds 			if (je16_to_cpu(rd->nodetype) != JFFS2_NODETYPE_DIRENT)
8721da177e4SLinus Torvalds 				continue;
8731da177e4SLinus Torvalds 
8741da177e4SLinus Torvalds 			/* If the name CRC doesn't match, skip */
8751da177e4SLinus Torvalds 			if (je32_to_cpu(rd->name_crc) != name_crc)
8761da177e4SLinus Torvalds 				continue;
8771da177e4SLinus Torvalds 
8781da177e4SLinus Torvalds 			/* If the name length doesn't match, or it's another deletion dirent, skip */
8791da177e4SLinus Torvalds 			if (rd->nsize != name_len || !je32_to_cpu(rd->ino))
8801da177e4SLinus Torvalds 				continue;
8811da177e4SLinus Torvalds 
8821da177e4SLinus Torvalds 			/* OK, check the actual name now */
8831da177e4SLinus Torvalds 			if (memcmp(rd->name, fd->name, name_len))
8841da177e4SLinus Torvalds 				continue;
8851da177e4SLinus Torvalds 
8861da177e4SLinus Torvalds 			/* OK. The name really does match. There really is still an older node on
8871da177e4SLinus Torvalds 			   the flash which our deletion dirent obsoletes. So we have to write out
8881da177e4SLinus Torvalds 			   a new deletion dirent to replace it */
8891da177e4SLinus Torvalds 			up(&c->erase_free_sem);
8901da177e4SLinus Torvalds 
8911da177e4SLinus Torvalds 			D1(printk(KERN_DEBUG "Deletion dirent at %08x still obsoletes real dirent \"%s\" at %08x for ino #%u\n",
8921da177e4SLinus Torvalds 				  ref_offset(fd->raw), fd->name, ref_offset(raw), je32_to_cpu(rd->ino)));
8931da177e4SLinus Torvalds 			kfree(rd);
8941da177e4SLinus Torvalds 
8951da177e4SLinus Torvalds 			return jffs2_garbage_collect_dirent(c, jeb, f, fd);
8961da177e4SLinus Torvalds 		}
8971da177e4SLinus Torvalds 
8981da177e4SLinus Torvalds 		up(&c->erase_free_sem);
8991da177e4SLinus Torvalds 		kfree(rd);
9001da177e4SLinus Torvalds 	}
9011da177e4SLinus Torvalds 
9023a69e0cdSArtem B. Bityutskiy 	/* FIXME: If we're deleting a dirent which contains the current mtime and ctime,
9033a69e0cdSArtem B. Bityutskiy 	   we should update the metadata node with those times accordingly */
9043a69e0cdSArtem B. Bityutskiy 
9051da177e4SLinus Torvalds 	/* No need for it any more. Just mark it obsolete and remove it from the list */
9061da177e4SLinus Torvalds 	while (*fdp) {
9071da177e4SLinus Torvalds 		if ((*fdp) == fd) {
9081da177e4SLinus Torvalds 			found = 1;
9091da177e4SLinus Torvalds 			*fdp = fd->next;
9101da177e4SLinus Torvalds 			break;
9111da177e4SLinus Torvalds 		}
9121da177e4SLinus Torvalds 		fdp = &(*fdp)->next;
9131da177e4SLinus Torvalds 	}
9141da177e4SLinus Torvalds 	if (!found) {
9151da177e4SLinus Torvalds 		printk(KERN_WARNING "Deletion dirent \"%s\" not found in list for ino #%u\n", fd->name, f->inocache->ino);
9161da177e4SLinus Torvalds 	}
9171da177e4SLinus Torvalds 	jffs2_mark_node_obsolete(c, fd->raw);
9181da177e4SLinus Torvalds 	jffs2_free_full_dirent(fd);
9191da177e4SLinus Torvalds 	return 0;
9201da177e4SLinus Torvalds }
9211da177e4SLinus Torvalds 
9221da177e4SLinus Torvalds static int jffs2_garbage_collect_hole(struct jffs2_sb_info *c, struct jffs2_eraseblock *jeb,
9231da177e4SLinus Torvalds 				      struct jffs2_inode_info *f, struct jffs2_full_dnode *fn,
9241da177e4SLinus Torvalds 				      uint32_t start, uint32_t end)
9251da177e4SLinus Torvalds {
9261da177e4SLinus Torvalds 	struct jffs2_raw_inode ri;
9271da177e4SLinus Torvalds 	struct jffs2_node_frag *frag;
9281da177e4SLinus Torvalds 	struct jffs2_full_dnode *new_fn;
9298557fd51SArtem B. Bityuckiy 	uint32_t alloclen, phys_ofs, ilen;
9301da177e4SLinus Torvalds 	int ret;
9311da177e4SLinus Torvalds 
9321da177e4SLinus Torvalds 	D1(printk(KERN_DEBUG "Writing replacement hole node for ino #%u from offset 0x%x to 0x%x\n",
9331da177e4SLinus Torvalds 		  f->inocache->ino, start, end));
9341da177e4SLinus Torvalds 
9351da177e4SLinus Torvalds 	memset(&ri, 0, sizeof(ri));
9361da177e4SLinus Torvalds 
9371da177e4SLinus Torvalds 	if(fn->frags > 1) {
9381da177e4SLinus Torvalds 		size_t readlen;
9391da177e4SLinus Torvalds 		uint32_t crc;
9401da177e4SLinus Torvalds 		/* It's partially obsoleted by a later write. So we have to
9411da177e4SLinus Torvalds 		   write it out again with the _same_ version as before */
9421da177e4SLinus Torvalds 		ret = jffs2_flash_read(c, ref_offset(fn->raw), sizeof(ri), &readlen, (char *)&ri);
9431da177e4SLinus Torvalds 		if (readlen != sizeof(ri) || ret) {
9441da177e4SLinus Torvalds 			printk(KERN_WARNING "Node read failed in jffs2_garbage_collect_hole. Ret %d, retlen %zd. Data will be lost by writing new hole node\n", ret, readlen);
9451da177e4SLinus Torvalds 			goto fill;
9461da177e4SLinus Torvalds 		}
9471da177e4SLinus Torvalds 		if (je16_to_cpu(ri.nodetype) != JFFS2_NODETYPE_INODE) {
9481da177e4SLinus Torvalds 			printk(KERN_WARNING "jffs2_garbage_collect_hole: Node at 0x%08x had node type 0x%04x instead of JFFS2_NODETYPE_INODE(0x%04x)\n",
9491da177e4SLinus Torvalds 			       ref_offset(fn->raw),
9501da177e4SLinus Torvalds 			       je16_to_cpu(ri.nodetype), JFFS2_NODETYPE_INODE);
9511da177e4SLinus Torvalds 			return -EIO;
9521da177e4SLinus Torvalds 		}
9531da177e4SLinus Torvalds 		if (je32_to_cpu(ri.totlen) != sizeof(ri)) {
9541da177e4SLinus Torvalds 			printk(KERN_WARNING "jffs2_garbage_collect_hole: Node at 0x%08x had totlen 0x%x instead of expected 0x%zx\n",
9551da177e4SLinus Torvalds 			       ref_offset(fn->raw),
9561da177e4SLinus Torvalds 			       je32_to_cpu(ri.totlen), sizeof(ri));
9571da177e4SLinus Torvalds 			return -EIO;
9581da177e4SLinus Torvalds 		}
9591da177e4SLinus Torvalds 		crc = crc32(0, &ri, sizeof(ri)-8);
9601da177e4SLinus Torvalds 		if (crc != je32_to_cpu(ri.node_crc)) {
9611da177e4SLinus Torvalds 			printk(KERN_WARNING "jffs2_garbage_collect_hole: Node at 0x%08x had CRC 0x%08x which doesn't match calculated CRC 0x%08x\n",
9621da177e4SLinus Torvalds 			       ref_offset(fn->raw),
9631da177e4SLinus Torvalds 			       je32_to_cpu(ri.node_crc), crc);
9641da177e4SLinus Torvalds 			/* FIXME: We could possibly deal with this by writing new holes for each frag */
9651da177e4SLinus Torvalds 			printk(KERN_WARNING "Data in the range 0x%08x to 0x%08x of inode #%u will be lost\n",
9661da177e4SLinus Torvalds 			       start, end, f->inocache->ino);
9671da177e4SLinus Torvalds 			goto fill;
9681da177e4SLinus Torvalds 		}
9691da177e4SLinus Torvalds 		if (ri.compr != JFFS2_COMPR_ZERO) {
9701da177e4SLinus Torvalds 			printk(KERN_WARNING "jffs2_garbage_collect_hole: Node 0x%08x wasn't a hole node!\n", ref_offset(fn->raw));
9711da177e4SLinus Torvalds 			printk(KERN_WARNING "Data in the range 0x%08x to 0x%08x of inode #%u will be lost\n",
9721da177e4SLinus Torvalds 			       start, end, f->inocache->ino);
9731da177e4SLinus Torvalds 			goto fill;
9741da177e4SLinus Torvalds 		}
9751da177e4SLinus Torvalds 	} else {
9761da177e4SLinus Torvalds 	fill:
9771da177e4SLinus Torvalds 		ri.magic = cpu_to_je16(JFFS2_MAGIC_BITMASK);
9781da177e4SLinus Torvalds 		ri.nodetype = cpu_to_je16(JFFS2_NODETYPE_INODE);
9791da177e4SLinus Torvalds 		ri.totlen = cpu_to_je32(sizeof(ri));
9801da177e4SLinus Torvalds 		ri.hdr_crc = cpu_to_je32(crc32(0, &ri, sizeof(struct jffs2_unknown_node)-4));
9811da177e4SLinus Torvalds 
9821da177e4SLinus Torvalds 		ri.ino = cpu_to_je32(f->inocache->ino);
9831da177e4SLinus Torvalds 		ri.version = cpu_to_je32(++f->highest_version);
9841da177e4SLinus Torvalds 		ri.offset = cpu_to_je32(start);
9851da177e4SLinus Torvalds 		ri.dsize = cpu_to_je32(end - start);
9861da177e4SLinus Torvalds 		ri.csize = cpu_to_je32(0);
9871da177e4SLinus Torvalds 		ri.compr = JFFS2_COMPR_ZERO;
9881da177e4SLinus Torvalds 	}
9898557fd51SArtem B. Bityuckiy 
9908557fd51SArtem B. Bityuckiy 	frag = frag_last(&f->fragtree);
9918557fd51SArtem B. Bityuckiy 	if (frag)
9928557fd51SArtem B. Bityuckiy 		/* Fetch the inode length from the fragtree rather then
9938557fd51SArtem B. Bityuckiy 		 * from i_size since i_size may have not been updated yet */
9948557fd51SArtem B. Bityuckiy 		ilen = frag->ofs + frag->size;
9958557fd51SArtem B. Bityuckiy 	else
9968557fd51SArtem B. Bityuckiy 		ilen = JFFS2_F_I_SIZE(f);
9978557fd51SArtem B. Bityuckiy 
9981da177e4SLinus Torvalds 	ri.mode = cpu_to_jemode(JFFS2_F_I_MODE(f));
9991da177e4SLinus Torvalds 	ri.uid = cpu_to_je16(JFFS2_F_I_UID(f));
10001da177e4SLinus Torvalds 	ri.gid = cpu_to_je16(JFFS2_F_I_GID(f));
10018557fd51SArtem B. Bityuckiy 	ri.isize = cpu_to_je32(ilen);
10021da177e4SLinus Torvalds 	ri.atime = cpu_to_je32(JFFS2_F_I_ATIME(f));
10031da177e4SLinus Torvalds 	ri.ctime = cpu_to_je32(JFFS2_F_I_CTIME(f));
10041da177e4SLinus Torvalds 	ri.mtime = cpu_to_je32(JFFS2_F_I_MTIME(f));
10051da177e4SLinus Torvalds 	ri.data_crc = cpu_to_je32(0);
10061da177e4SLinus Torvalds 	ri.node_crc = cpu_to_je32(crc32(0, &ri, sizeof(ri)-8));
10071da177e4SLinus Torvalds 
1008e631ddbaSFerenc Havasi 	ret = jffs2_reserve_space_gc(c, sizeof(ri), &phys_ofs, &alloclen,
1009e631ddbaSFerenc Havasi 				JFFS2_SUMMARY_INODE_SIZE);
10101da177e4SLinus Torvalds 	if (ret) {
10111da177e4SLinus Torvalds 		printk(KERN_WARNING "jffs2_reserve_space_gc of %zd bytes for garbage_collect_hole failed: %d\n",
10121da177e4SLinus Torvalds 		       sizeof(ri), ret);
10131da177e4SLinus Torvalds 		return ret;
10141da177e4SLinus Torvalds 	}
10151da177e4SLinus Torvalds 	new_fn = jffs2_write_dnode(c, f, &ri, NULL, 0, phys_ofs, ALLOC_GC);
10161da177e4SLinus Torvalds 
10171da177e4SLinus Torvalds 	if (IS_ERR(new_fn)) {
10181da177e4SLinus Torvalds 		printk(KERN_WARNING "Error writing new hole node: %ld\n", PTR_ERR(new_fn));
10191da177e4SLinus Torvalds 		return PTR_ERR(new_fn);
10201da177e4SLinus Torvalds 	}
10211da177e4SLinus Torvalds 	if (je32_to_cpu(ri.version) == f->highest_version) {
10221da177e4SLinus Torvalds 		jffs2_add_full_dnode_to_inode(c, f, new_fn);
10231da177e4SLinus Torvalds 		if (f->metadata) {
10241da177e4SLinus Torvalds 			jffs2_mark_node_obsolete(c, f->metadata->raw);
10251da177e4SLinus Torvalds 			jffs2_free_full_dnode(f->metadata);
10261da177e4SLinus Torvalds 			f->metadata = NULL;
10271da177e4SLinus Torvalds 		}
10281da177e4SLinus Torvalds 		return 0;
10291da177e4SLinus Torvalds 	}
10301da177e4SLinus Torvalds 
10311da177e4SLinus Torvalds 	/*
10321da177e4SLinus Torvalds 	 * We should only get here in the case where the node we are
10331da177e4SLinus Torvalds 	 * replacing had more than one frag, so we kept the same version
10341da177e4SLinus Torvalds 	 * number as before. (Except in case of error -- see 'goto fill;'
10351da177e4SLinus Torvalds 	 * above.)
10361da177e4SLinus Torvalds 	 */
10371da177e4SLinus Torvalds 	D1(if(unlikely(fn->frags <= 1)) {
10381da177e4SLinus Torvalds 		printk(KERN_WARNING "jffs2_garbage_collect_hole: Replacing fn with %d frag(s) but new ver %d != highest_version %d of ino #%d\n",
10391da177e4SLinus Torvalds 		       fn->frags, je32_to_cpu(ri.version), f->highest_version,
10401da177e4SLinus Torvalds 		       je32_to_cpu(ri.ino));
10411da177e4SLinus Torvalds 	});
10421da177e4SLinus Torvalds 
10431da177e4SLinus Torvalds 	/* This is a partially-overlapped hole node. Mark it REF_NORMAL not REF_PRISTINE */
10441da177e4SLinus Torvalds 	mark_ref_normal(new_fn->raw);
10451da177e4SLinus Torvalds 
10461da177e4SLinus Torvalds 	for (frag = jffs2_lookup_node_frag(&f->fragtree, fn->ofs);
10471da177e4SLinus Torvalds 	     frag; frag = frag_next(frag)) {
10481da177e4SLinus Torvalds 		if (frag->ofs > fn->size + fn->ofs)
10491da177e4SLinus Torvalds 			break;
10501da177e4SLinus Torvalds 		if (frag->node == fn) {
10511da177e4SLinus Torvalds 			frag->node = new_fn;
10521da177e4SLinus Torvalds 			new_fn->frags++;
10531da177e4SLinus Torvalds 			fn->frags--;
10541da177e4SLinus Torvalds 		}
10551da177e4SLinus Torvalds 	}
10561da177e4SLinus Torvalds 	if (fn->frags) {
10571da177e4SLinus Torvalds 		printk(KERN_WARNING "jffs2_garbage_collect_hole: Old node still has frags!\n");
10581da177e4SLinus Torvalds 		BUG();
10591da177e4SLinus Torvalds 	}
10601da177e4SLinus Torvalds 	if (!new_fn->frags) {
10611da177e4SLinus Torvalds 		printk(KERN_WARNING "jffs2_garbage_collect_hole: New node has no frags!\n");
10621da177e4SLinus Torvalds 		BUG();
10631da177e4SLinus Torvalds 	}
10641da177e4SLinus Torvalds 
10651da177e4SLinus Torvalds 	jffs2_mark_node_obsolete(c, fn->raw);
10661da177e4SLinus Torvalds 	jffs2_free_full_dnode(fn);
10671da177e4SLinus Torvalds 
10681da177e4SLinus Torvalds 	return 0;
10691da177e4SLinus Torvalds }
10701da177e4SLinus Torvalds 
/*
 * Rewrite the data of inode 'f' in the byte range [start, end) as one or
 * more newly written data nodes.
 *
 * c:     filesystem state; its block counters, gcblock pointer, eraseblock
 *        array and sector size are read below.
 * jeb:   not referenced in this body; the 'jeb' locals declared inside the
 *        two merge loops shadow it.
 * f:     in-core inode; its fragtree is walked, its highest_version is
 *        incremented for every node written, and f->metadata (if set) is
 *        obsoleted and freed after a node has been added.
 * fn:    not referenced in this body.
 * start: first file offset to rewrite.
 * end:   treated as exclusive (end-1 is looked up as the last byte, and
 *        end - offset is used as a length).
 *
 * When c->nr_free_blocks + c->nr_erasing_blocks exceeds
 * c->resv_blocks_gcmerge, [start, end) is first widened, without leaving the
 * page that contains 'start', to take in neighbouring frags. The page is
 * then fetched and written out in a loop that runs until 'offset' reaches
 * the caller's original 'end'.
 *
 * Returns the error encoded in the pointer from jffs2_gc_fetch_page() if the
 * fetch fails; otherwise the last value assigned to 'ret' (initially 0).
 */
10711da177e4SLinus Torvalds static int jffs2_garbage_collect_dnode(struct jffs2_sb_info *c, struct jffs2_eraseblock *jeb,
10721da177e4SLinus Torvalds 				       struct jffs2_inode_info *f, struct jffs2_full_dnode *fn,
10731da177e4SLinus Torvalds 				       uint32_t start, uint32_t end)
10741da177e4SLinus Torvalds {
10751da177e4SLinus Torvalds 	struct jffs2_full_dnode *new_fn;
10761da177e4SLinus Torvalds 	struct jffs2_raw_inode ri;
10771da177e4SLinus Torvalds 	uint32_t alloclen, phys_ofs, offset, orig_end, orig_start;
10781da177e4SLinus Torvalds 	int ret = 0;
10791da177e4SLinus Torvalds 	unsigned char *comprbuf = NULL, *writebuf;
10801da177e4SLinus Torvalds 	unsigned long pg;
10811da177e4SLinus Torvalds 	unsigned char *pg_ptr;
10821da177e4SLinus Torvalds 
	/* Zero the raw inode header so any field not assigned below is 0. */
10831da177e4SLinus Torvalds 	memset(&ri, 0, sizeof(ri));
10841da177e4SLinus Torvalds 
10851da177e4SLinus Torvalds 	D1(printk(KERN_DEBUG "Writing replacement dnode for ino #%u from offset 0x%x to 0x%x\n",
10861da177e4SLinus Torvalds 		  f->inocache->ino, start, end));
10871da177e4SLinus Torvalds 
	/* Keep the caller's range: the write loop is bounded by orig_end, and
	   the BUG_ONs after merging check that the range only ever grew. */
10881da177e4SLinus Torvalds 	orig_end = end;
10891da177e4SLinus Torvalds 	orig_start = start;
10901da177e4SLinus Torvalds 
10911da177e4SLinus Torvalds 	if (c->nr_free_blocks + c->nr_erasing_blocks > c->resv_blocks_gcmerge) {
10921da177e4SLinus Torvalds 		/* Attempt to do some merging. But only expand to cover logically
10931da177e4SLinus Torvalds 		   adjacent frags if the block containing them is already considered
10941da177e4SLinus Torvalds 		   to be dirty. Otherwise we end up with GC just going round in
10951da177e4SLinus Torvalds 		   circles dirtying the nodes it already wrote out, especially
10961da177e4SLinus Torvalds 		   on NAND where we have small eraseblocks and hence a much higher
10971da177e4SLinus Torvalds 		   chance of nodes having to be split to cross boundaries. */
10981da177e4SLinus Torvalds 
10991da177e4SLinus Torvalds 		struct jffs2_node_frag *frag;
11001da177e4SLinus Torvalds 		uint32_t min, max;
11011da177e4SLinus Torvalds 
		/* [min, max) is the page-sized, page-aligned window containing
		   'start'; merging never extends beyond it. */
11021da177e4SLinus Torvalds 		min = start & ~(PAGE_CACHE_SIZE-1);
11031da177e4SLinus Torvalds 		max = min + PAGE_CACHE_SIZE;
11041da177e4SLinus Torvalds 
11051da177e4SLinus Torvalds 		frag = jffs2_lookup_node_frag(&f->fragtree, start);
11061da177e4SLinus Torvalds 
11071da177e4SLinus Torvalds 		/* BUG_ON(!frag) but that'll happen anyway... */
11081da177e4SLinus Torvalds 
		/* 'start' is required to coincide with the start of a frag. */
11091da177e4SLinus Torvalds 		BUG_ON(frag->ofs != start);
11101da177e4SLinus Torvalds 
11111da177e4SLinus Torvalds 		/* First grow down... */
		/* Step backwards over preceding frags for as long as they begin
		   at or after the start of the page. */
11121da177e4SLinus Torvalds 		while((frag = frag_prev(frag)) && frag->ofs >= min) {
11131da177e4SLinus Torvalds 
11141da177e4SLinus Torvalds 			/* If the previous frag doesn't even reach the beginning, there's
11151da177e4SLinus Torvalds 			   excessive fragmentation. Just merge. */
11161da177e4SLinus Torvalds 			if (frag->ofs > min) {
11171da177e4SLinus Torvalds 				D1(printk(KERN_DEBUG "Expanding down to cover partial frag (0x%x-0x%x)\n",
11181da177e4SLinus Torvalds 					  frag->ofs, frag->ofs+frag->size));
11191da177e4SLinus Torvalds 				start = frag->ofs;
11201da177e4SLinus Torvalds 				continue;
11211da177e4SLinus Torvalds 			}
11221da177e4SLinus Torvalds 			/* OK. This frag holds the first byte of the page. */
11231da177e4SLinus Torvalds 			if (!frag->node || !frag->node->raw) {
11241da177e4SLinus Torvalds 				D1(printk(KERN_DEBUG "First frag in page is hole (0x%x-0x%x). Not expanding down.\n",
11251da177e4SLinus Torvalds 					  frag->ofs, frag->ofs+frag->size));
11261da177e4SLinus Torvalds 				break;
11271da177e4SLinus Torvalds 			} else {
11281da177e4SLinus Torvalds 
11291da177e4SLinus Torvalds 				/* OK, it's a frag which extends to the beginning of the page. Does it live
11301da177e4SLinus Torvalds 				   in a block which is still considered clean? If so, don't obsolete it.
11311da177e4SLinus Torvalds 				   If not, cover it anyway. */
11321da177e4SLinus Torvalds 
11331da177e4SLinus Torvalds 				struct jffs2_raw_node_ref *raw = frag->node->raw;
				/* NOTE(review): this local shadows the 'jeb' parameter. */
11341da177e4SLinus Torvalds 				struct jffs2_eraseblock *jeb;
11351da177e4SLinus Torvalds 
				/* Eraseblock holding this frag's node, indexed by
				   flash offset divided by sector size. */
11361da177e4SLinus Torvalds 				jeb = &c->blocks[raw->flash_offset / c->sector_size];
11371da177e4SLinus Torvalds 
				/* A frag in the block currently being collected is
				   always merged. */
11381da177e4SLinus Torvalds 				if (jeb == c->gcblock) {
11391da177e4SLinus Torvalds 					D1(printk(KERN_DEBUG "Expanding down to cover frag (0x%x-0x%x) in gcblock at %08x\n",
11401da177e4SLinus Torvalds 						  frag->ofs, frag->ofs+frag->size, ref_offset(raw)));
11411da177e4SLinus Torvalds 					start = frag->ofs;
11421da177e4SLinus Torvalds 					break;
11431da177e4SLinus Torvalds 				}
11441da177e4SLinus Torvalds 				if (!ISDIRTY(jeb->dirty_size + jeb->wasted_size)) {
11451da177e4SLinus Torvalds 					D1(printk(KERN_DEBUG "Not expanding down to cover frag (0x%x-0x%x) in clean block %08x\n",
11461da177e4SLinus Torvalds 						  frag->ofs, frag->ofs+frag->size, jeb->offset));
11471da177e4SLinus Torvalds 					break;
11481da177e4SLinus Torvalds 				}
11491da177e4SLinus Torvalds 
11501da177e4SLinus Torvalds 				D1(printk(KERN_DEBUG "Expanding down to cover frag (0x%x-0x%x) in dirty block %08x\n",
11511da177e4SLinus Torvalds 						  frag->ofs, frag->ofs+frag->size, jeb->offset));
11521da177e4SLinus Torvalds 				start = frag->ofs;
11531da177e4SLinus Torvalds 				break;
11541da177e4SLinus Torvalds 			}
11551da177e4SLinus Torvalds 		}
11561da177e4SLinus Torvalds 
11571da177e4SLinus Torvalds 		/* ... then up */
11581da177e4SLinus Torvalds 
11591da177e4SLinus Torvalds 		/* Find last frag which is actually part of the node we're to GC. */
11601da177e4SLinus Torvalds 		frag = jffs2_lookup_node_frag(&f->fragtree, end-1);
11611da177e4SLinus Torvalds 
		/* Step forwards over following frags for as long as they end at
		   or before the end of the page. */
11621da177e4SLinus Torvalds 		while((frag = frag_next(frag)) && frag->ofs+frag->size <= max) {
11631da177e4SLinus Torvalds 
11641da177e4SLinus Torvalds 			/* If the next frag doesn't even reach the end of the page, there's lots
11651da177e4SLinus Torvalds 			   of fragmentation. Just merge. */
11661da177e4SLinus Torvalds 			if (frag->ofs+frag->size < max) {
11671da177e4SLinus Torvalds 				D1(printk(KERN_DEBUG "Expanding up to cover partial frag (0x%x-0x%x)\n",
11681da177e4SLinus Torvalds 					  frag->ofs, frag->ofs+frag->size));
11691da177e4SLinus Torvalds 				end = frag->ofs + frag->size;
11701da177e4SLinus Torvalds 				continue;
11711da177e4SLinus Torvalds 			}
11721da177e4SLinus Torvalds 
11731da177e4SLinus Torvalds 			if (!frag->node || !frag->node->raw) {
11741da177e4SLinus Torvalds 				D1(printk(KERN_DEBUG "Last frag in page is hole (0x%x-0x%x). Not expanding up.\n",
11751da177e4SLinus Torvalds 					  frag->ofs, frag->ofs+frag->size));
11761da177e4SLinus Torvalds 				break;
11771da177e4SLinus Torvalds 			} else {
11781da177e4SLinus Torvalds 
11791da177e4SLinus Torvalds 				/* OK, it's a frag which extends to the end of the page. Does it live
11801da177e4SLinus Torvalds 				   in a block which is still considered clean? If so, don't obsolete it.
11811da177e4SLinus Torvalds 				   If not, cover it anyway. */
11821da177e4SLinus Torvalds 
11831da177e4SLinus Torvalds 				struct jffs2_raw_node_ref *raw = frag->node->raw;
				/* NOTE(review): this local shadows the 'jeb' parameter. */
11841da177e4SLinus Torvalds 				struct jffs2_eraseblock *jeb;
11851da177e4SLinus Torvalds 
11861da177e4SLinus Torvalds 				jeb = &c->blocks[raw->flash_offset / c->sector_size];
11871da177e4SLinus Torvalds 
11881da177e4SLinus Torvalds 				if (jeb == c->gcblock) {
11891da177e4SLinus Torvalds 					D1(printk(KERN_DEBUG "Expanding up to cover frag (0x%x-0x%x) in gcblock at %08x\n",
11901da177e4SLinus Torvalds 						  frag->ofs, frag->ofs+frag->size, ref_offset(raw)));
11911da177e4SLinus Torvalds 					end = frag->ofs + frag->size;
11921da177e4SLinus Torvalds 					break;
11931da177e4SLinus Torvalds 				}
11941da177e4SLinus Torvalds 				if (!ISDIRTY(jeb->dirty_size + jeb->wasted_size)) {
11951da177e4SLinus Torvalds 					D1(printk(KERN_DEBUG "Not expanding up to cover frag (0x%x-0x%x) in clean block %08x\n",
11961da177e4SLinus Torvalds 						  frag->ofs, frag->ofs+frag->size, jeb->offset));
11971da177e4SLinus Torvalds 					break;
11981da177e4SLinus Torvalds 				}
11991da177e4SLinus Torvalds 
12001da177e4SLinus Torvalds 				D1(printk(KERN_DEBUG "Expanding up to cover frag (0x%x-0x%x) in dirty block %08x\n",
12011da177e4SLinus Torvalds 						  frag->ofs, frag->ofs+frag->size, jeb->offset));
12021da177e4SLinus Torvalds 				end = frag->ofs + frag->size;
12031da177e4SLinus Torvalds 				break;
12041da177e4SLinus Torvalds 			}
12051da177e4SLinus Torvalds 		}
12061da177e4SLinus Torvalds 		D1(printk(KERN_DEBUG "Expanded dnode to write from (0x%x-0x%x) to (0x%x-0x%x)\n",
12071da177e4SLinus Torvalds 			  orig_start, orig_end, start, end));
12081da177e4SLinus Torvalds 
		/* Sanity checks: with D1 enabled, the widened range must not run
		   past the last frag in the tree; in all builds, merging must
		   never have shrunk the caller's range. */
12098557fd51SArtem B. Bityuckiy 		D1(BUG_ON(end > frag_last(&f->fragtree)->ofs + frag_last(&f->fragtree)->size));
12101da177e4SLinus Torvalds 		BUG_ON(end < orig_end);
12111da177e4SLinus Torvalds 		BUG_ON(start > orig_start);
12121da177e4SLinus Torvalds 	}
12131da177e4SLinus Torvalds 
12141da177e4SLinus Torvalds 	/* First, use readpage() to read the appropriate page into the page cache */
12151da177e4SLinus Torvalds 	/* Q: What happens if we actually try to GC the _same_ page for which commit_write()
12161da177e4SLinus Torvalds 	 *    triggered garbage collection in the first place?
12171da177e4SLinus Torvalds 	 * A: I _think_ it's OK. read_cache_page shouldn't deadlock, we'll write out the
12181da177e4SLinus Torvalds 	 *    page OK. We'll actually write it out again in commit_write, which is a little
12191da177e4SLinus Torvalds 	 *    suboptimal, but at least we're correct.
12201da177e4SLinus Torvalds 	 */
12211da177e4SLinus Torvalds 	pg_ptr = jffs2_gc_fetch_page(c, f, start, &pg);
12221da177e4SLinus Torvalds 
	/* Nothing has been acquired yet on this path, so return directly
	   without calling jffs2_gc_release_page(). */
12231da177e4SLinus Torvalds 	if (IS_ERR(pg_ptr)) {
12241da177e4SLinus Torvalds 		printk(KERN_WARNING "read_cache_page() returned error: %ld\n", PTR_ERR(pg_ptr));
12251da177e4SLinus Torvalds 		return PTR_ERR(pg_ptr);
12261da177e4SLinus Torvalds 	}
12271da177e4SLinus Torvalds 
	/* Write from the (possibly lowered) 'start'. The loop condition uses
	   orig_end, not 'end': each pass may write data up to 'end', but the
	   loop stops as soon as the caller's original range is covered. */
12281da177e4SLinus Torvalds 	offset = start;
12291da177e4SLinus Torvalds 	while(offset < orig_end) {
12301da177e4SLinus Torvalds 		uint32_t datalen;
12311da177e4SLinus Torvalds 		uint32_t cdatalen;
12321da177e4SLinus Torvalds 		uint16_t comprtype = JFFS2_COMPR_NONE;
12331da177e4SLinus Torvalds 
		/* Ask for room for a header plus JFFS2_MIN_DATA_LEN bytes;
		   the size actually granted comes back in alloclen. */
1234e631ddbaSFerenc Havasi 		ret = jffs2_reserve_space_gc(c, sizeof(ri) + JFFS2_MIN_DATA_LEN, &phys_ofs,
1235e631ddbaSFerenc Havasi 					&alloclen, JFFS2_SUMMARY_INODE_SIZE);
12361da177e4SLinus Torvalds 
12371da177e4SLinus Torvalds 		if (ret) {
12381da177e4SLinus Torvalds 			printk(KERN_WARNING "jffs2_reserve_space_gc of %zd bytes for garbage_collect_dnode failed: %d\n",
12391da177e4SLinus Torvalds 			       sizeof(ri)+ JFFS2_MIN_DATA_LEN, ret);
12401da177e4SLinus Torvalds 			break;
12411da177e4SLinus Torvalds 		}
		/* cdatalen: output budget, capped by the reserved space left
		   after the header and by the bytes remaining up to 'end'.
		   datalen: all bytes remaining up to 'end'. Both are passed
		   by address to jffs2_compress() and re-read afterwards, so
		   it presumably rewrites them with the amounts actually
		   consumed and produced -- TODO confirm against compr.c. */
12421da177e4SLinus Torvalds 		cdatalen = min_t(uint32_t, alloclen - sizeof(ri), end - offset);
12431da177e4SLinus Torvalds 		datalen = end - offset;
12441da177e4SLinus Torvalds 
		/* Source data: the fetched page, at offset's position within
		   the page. */
12451da177e4SLinus Torvalds 		writebuf = pg_ptr + (offset & (PAGE_CACHE_SIZE -1));
12461da177e4SLinus Torvalds 
12471da177e4SLinus Torvalds 		comprtype = jffs2_compress(c, f, writebuf, &comprbuf, &datalen, &cdatalen);
12481da177e4SLinus Torvalds 
		/* Fill in the node header. hdr_crc covers the leading
		   sizeof(struct jffs2_unknown_node) - 4 bytes of ri. */
12491da177e4SLinus Torvalds 		ri.magic = cpu_to_je16(JFFS2_MAGIC_BITMASK);
12501da177e4SLinus Torvalds 		ri.nodetype = cpu_to_je16(JFFS2_NODETYPE_INODE);
12511da177e4SLinus Torvalds 		ri.totlen = cpu_to_je32(sizeof(ri) + cdatalen);
12521da177e4SLinus Torvalds 		ri.hdr_crc = cpu_to_je32(crc32(0, &ri, sizeof(struct jffs2_unknown_node)-4));
12531da177e4SLinus Torvalds 
		/* Every node written takes a fresh, higher version number. */
12541da177e4SLinus Torvalds 		ri.ino = cpu_to_je32(f->inocache->ino);
12551da177e4SLinus Torvalds 		ri.version = cpu_to_je32(++f->highest_version);
12561da177e4SLinus Torvalds 		ri.mode = cpu_to_jemode(JFFS2_F_I_MODE(f));
12571da177e4SLinus Torvalds 		ri.uid = cpu_to_je16(JFFS2_F_I_UID(f));
12581da177e4SLinus Torvalds 		ri.gid = cpu_to_je16(JFFS2_F_I_GID(f));
12591da177e4SLinus Torvalds 		ri.isize = cpu_to_je32(JFFS2_F_I_SIZE(f));
12601da177e4SLinus Torvalds 		ri.atime = cpu_to_je32(JFFS2_F_I_ATIME(f));
12611da177e4SLinus Torvalds 		ri.ctime = cpu_to_je32(JFFS2_F_I_CTIME(f));
12621da177e4SLinus Torvalds 		ri.mtime = cpu_to_je32(JFFS2_F_I_MTIME(f));
12631da177e4SLinus Torvalds 		ri.offset = cpu_to_je32(offset);
12641da177e4SLinus Torvalds 		ri.csize = cpu_to_je32(cdatalen);
12651da177e4SLinus Torvalds 		ri.dsize = cpu_to_je32(datalen);
		/* comprtype is split: low byte into compr, next byte into
		   usercompr. */
12661da177e4SLinus Torvalds 		ri.compr = comprtype & 0xff;
12671da177e4SLinus Torvalds 		ri.usercompr = (comprtype >> 8) & 0xff;
		/* node_crc covers ri minus its final 8 bytes (presumably the
		   two CRC fields themselves -- confirm against the struct
		   layout); data_crc covers the cdatalen bytes at comprbuf. */
12681da177e4SLinus Torvalds 		ri.node_crc = cpu_to_je32(crc32(0, &ri, sizeof(ri)-8));
12691da177e4SLinus Torvalds 		ri.data_crc = cpu_to_je32(crc32(0, comprbuf, cdatalen));
12701da177e4SLinus Torvalds 
12711da177e4SLinus Torvalds 		new_fn = jffs2_write_dnode(c, f, &ri, comprbuf, cdatalen, phys_ofs, ALLOC_GC);
12721da177e4SLinus Torvalds 
		/* The compression buffer is released before the result of the
		   write is inspected, so it is freed on both the success and
		   the error path. writebuf is passed as well, presumably so
		   the helper can tell whether comprbuf is a separate
		   allocation -- TODO confirm. */
12731da177e4SLinus Torvalds 		jffs2_free_comprbuf(comprbuf, writebuf);
12741da177e4SLinus Torvalds 
12751da177e4SLinus Torvalds 		if (IS_ERR(new_fn)) {
12761da177e4SLinus Torvalds 			printk(KERN_WARNING "Error writing new dnode: %ld\n", PTR_ERR(new_fn));
12771da177e4SLinus Torvalds 			ret = PTR_ERR(new_fn);
12781da177e4SLinus Torvalds 			break;
12791da177e4SLinus Torvalds 		}
		/* NOTE(review): this return value is not checked here. If the
		   loop runs again it is overwritten by the next
		   jffs2_reserve_space_gc() call, so a failure reaches the
		   caller only when it happens on the final pass -- confirm
		   that this is intended. */
12801da177e4SLinus Torvalds 		ret = jffs2_add_full_dnode_to_inode(c, f, new_fn);
		/* Advance by the number of uncompressed bytes in this node. */
12811da177e4SLinus Torvalds 		offset += datalen;
		/* If the inode still has a separate metadata node, mark it
		   obsolete and drop it once a new node has been added. */
12821da177e4SLinus Torvalds 		if (f->metadata) {
12831da177e4SLinus Torvalds 			jffs2_mark_node_obsolete(c, f->metadata->raw);
12841da177e4SLinus Torvalds 			jffs2_free_full_dnode(f->metadata);
12851da177e4SLinus Torvalds 			f->metadata = NULL;
12861da177e4SLinus Torvalds 		}
12871da177e4SLinus Torvalds 	}
12881da177e4SLinus Torvalds 
	/* Reached on normal completion and after any 'break' above. */
12891da177e4SLinus Torvalds 	jffs2_gc_release_page(c, pg_ptr, &pg);
12901da177e4SLinus Torvalds 	return ret;
12911da177e4SLinus Torvalds }
1292