staging:iio:events: Use kfifo for event queue
[linux-2.6/btrfs-unstable.git] / fs / jffs2 / readinode.c
blob3093ac4fb24c2966c39b4987040dc9b5a3c33855
/*
 * JFFS2 -- Journalling Flash File System, Version 2.
 *
 * Copyright © 2001-2007 Red Hat, Inc.
 *
 * Created by David Woodhouse <dwmw2@infradead.org>
 *
 * For licensing information, see the file 'LICENCE' in this directory.
 *
 */
12 #include <linux/kernel.h>
13 #include <linux/sched.h>
14 #include <linux/slab.h>
15 #include <linux/fs.h>
16 #include <linux/crc32.h>
17 #include <linux/pagemap.h>
18 #include <linux/mtd/mtd.h>
19 #include <linux/compiler.h>
20 #include "nodelist.h"
23 * Check the data CRC of the node.
25 * Returns: 0 if the data CRC is correct;
26 * 1 - if incorrect;
27 * error code if an error occurred.
29 static int check_node_data(struct jffs2_sb_info *c, struct jffs2_tmp_dnode_info *tn)
31 struct jffs2_raw_node_ref *ref = tn->fn->raw;
32 int err = 0, pointed = 0;
33 struct jffs2_eraseblock *jeb;
34 unsigned char *buffer;
35 uint32_t crc, ofs, len;
36 size_t retlen;
38 BUG_ON(tn->csize == 0);
40 /* Calculate how many bytes were already checked */
41 ofs = ref_offset(ref) + sizeof(struct jffs2_raw_inode);
42 len = tn->csize;
44 if (jffs2_is_writebuffered(c)) {
45 int adj = ofs % c->wbuf_pagesize;
46 if (likely(adj))
47 adj = c->wbuf_pagesize - adj;
49 if (adj >= tn->csize) {
50 dbg_readinode("no need to check node at %#08x, data length %u, data starts at %#08x - it has already been checked.\n",
51 ref_offset(ref), tn->csize, ofs);
52 goto adj_acc;
55 ofs += adj;
56 len -= adj;
59 dbg_readinode("check node at %#08x, data length %u, partial CRC %#08x, correct CRC %#08x, data starts at %#08x, start checking from %#08x - %u bytes.\n",
60 ref_offset(ref), tn->csize, tn->partial_crc, tn->data_crc, ofs - len, ofs, len);
62 #ifndef __ECOS
63 /* TODO: instead, incapsulate point() stuff to jffs2_flash_read(),
64 * adding and jffs2_flash_read_end() interface. */
65 err = mtd_point(c->mtd, ofs, len, &retlen, (void **)&buffer, NULL);
66 if (!err && retlen < len) {
67 JFFS2_WARNING("MTD point returned len too short: %zu instead of %u.\n", retlen, tn->csize);
68 mtd_unpoint(c->mtd, ofs, retlen);
69 } else if (err) {
70 if (err != -EOPNOTSUPP)
71 JFFS2_WARNING("MTD point failed: error code %d.\n", err);
72 } else
73 pointed = 1; /* succefully pointed to device */
74 #endif
76 if (!pointed) {
77 buffer = kmalloc(len, GFP_KERNEL);
78 if (unlikely(!buffer))
79 return -ENOMEM;
81 /* TODO: this is very frequent pattern, make it a separate
82 * routine */
83 err = jffs2_flash_read(c, ofs, len, &retlen, buffer);
84 if (err) {
85 JFFS2_ERROR("can not read %d bytes from 0x%08x, error code: %d.\n", len, ofs, err);
86 goto free_out;
89 if (retlen != len) {
90 JFFS2_ERROR("short read at %#08x: %zd instead of %d.\n", ofs, retlen, len);
91 err = -EIO;
92 goto free_out;
96 /* Continue calculating CRC */
97 crc = crc32(tn->partial_crc, buffer, len);
98 if(!pointed)
99 kfree(buffer);
100 #ifndef __ECOS
101 else
102 mtd_unpoint(c->mtd, ofs, len);
103 #endif
105 if (crc != tn->data_crc) {
106 JFFS2_NOTICE("wrong data CRC in data node at 0x%08x: read %#08x, calculated %#08x.\n",
107 ref_offset(ref), tn->data_crc, crc);
108 return 1;
111 adj_acc:
112 jeb = &c->blocks[ref->flash_offset / c->sector_size];
113 len = ref_totlen(c, jeb, ref);
114 /* If it should be REF_NORMAL, it'll get marked as such when
115 we build the fragtree, shortly. No need to worry about GC
116 moving it while it's marked REF_PRISTINE -- GC won't happen
117 till we've finished checking every inode anyway. */
118 ref->flash_offset |= REF_PRISTINE;
120 * Mark the node as having been checked and fix the
121 * accounting accordingly.
123 spin_lock(&c->erase_completion_lock);
124 jeb->used_size += len;
125 jeb->unchecked_size -= len;
126 c->used_size += len;
127 c->unchecked_size -= len;
128 jffs2_dbg_acct_paranoia_check_nolock(c, jeb);
129 spin_unlock(&c->erase_completion_lock);
131 return 0;
133 free_out:
134 if(!pointed)
135 kfree(buffer);
136 #ifndef __ECOS
137 else
138 mtd_unpoint(c->mtd, ofs, len);
139 #endif
140 return err;
144 * Helper function for jffs2_add_older_frag_to_fragtree().
146 * Checks the node if we are in the checking stage.
148 static int check_tn_node(struct jffs2_sb_info *c, struct jffs2_tmp_dnode_info *tn)
150 int ret;
152 BUG_ON(ref_obsolete(tn->fn->raw));
154 /* We only check the data CRC of unchecked nodes */
155 if (ref_flags(tn->fn->raw) != REF_UNCHECKED)
156 return 0;
158 dbg_readinode("check node %#04x-%#04x, phys offs %#08x\n",
159 tn->fn->ofs, tn->fn->ofs + tn->fn->size, ref_offset(tn->fn->raw));
161 ret = check_node_data(c, tn);
162 if (unlikely(ret < 0)) {
163 JFFS2_ERROR("check_node_data() returned error: %d.\n",
164 ret);
165 } else if (unlikely(ret > 0)) {
166 dbg_readinode("CRC error, mark it obsolete.\n");
167 jffs2_mark_node_obsolete(c, tn->fn->raw);
170 return ret;
173 static struct jffs2_tmp_dnode_info *jffs2_lookup_tn(struct rb_root *tn_root, uint32_t offset)
175 struct rb_node *next;
176 struct jffs2_tmp_dnode_info *tn = NULL;
178 dbg_readinode("root %p, offset %d\n", tn_root, offset);
180 next = tn_root->rb_node;
182 while (next) {
183 tn = rb_entry(next, struct jffs2_tmp_dnode_info, rb);
185 if (tn->fn->ofs < offset)
186 next = tn->rb.rb_right;
187 else if (tn->fn->ofs >= offset)
188 next = tn->rb.rb_left;
189 else
190 break;
193 return tn;
197 static void jffs2_kill_tn(struct jffs2_sb_info *c, struct jffs2_tmp_dnode_info *tn)
199 jffs2_mark_node_obsolete(c, tn->fn->raw);
200 jffs2_free_full_dnode(tn->fn);
201 jffs2_free_tmp_dnode_info(tn);
204 * This function is used when we read an inode. Data nodes arrive in
205 * arbitrary order -- they may be older or newer than the nodes which
206 * are already in the tree. Where overlaps occur, the older node can
207 * be discarded as long as the newer passes the CRC check. We don't
208 * bother to keep track of holes in this rbtree, and neither do we deal
209 * with frags -- we can have multiple entries starting at the same
210 * offset, and the one with the smallest length will come first in the
211 * ordering.
213 * Returns 0 if the node was handled (including marking it obsolete)
214 * < 0 an if error occurred
216 static int jffs2_add_tn_to_tree(struct jffs2_sb_info *c,
217 struct jffs2_readinode_info *rii,
218 struct jffs2_tmp_dnode_info *tn)
220 uint32_t fn_end = tn->fn->ofs + tn->fn->size;
221 struct jffs2_tmp_dnode_info *this, *ptn;
223 dbg_readinode("insert fragment %#04x-%#04x, ver %u at %08x\n", tn->fn->ofs, fn_end, tn->version, ref_offset(tn->fn->raw));
225 /* If a node has zero dsize, we only have to keep if it if it might be the
226 node with highest version -- i.e. the one which will end up as f->metadata.
227 Note that such nodes won't be REF_UNCHECKED since there are no data to
228 check anyway. */
229 if (!tn->fn->size) {
230 if (rii->mdata_tn) {
231 if (rii->mdata_tn->version < tn->version) {
232 /* We had a candidate mdata node already */
233 dbg_readinode("kill old mdata with ver %d\n", rii->mdata_tn->version);
234 jffs2_kill_tn(c, rii->mdata_tn);
235 } else {
236 dbg_readinode("kill new mdata with ver %d (older than existing %d\n",
237 tn->version, rii->mdata_tn->version);
238 jffs2_kill_tn(c, tn);
239 return 0;
242 rii->mdata_tn = tn;
243 dbg_readinode("keep new mdata with ver %d\n", tn->version);
244 return 0;
247 /* Find the earliest node which _may_ be relevant to this one */
248 this = jffs2_lookup_tn(&rii->tn_root, tn->fn->ofs);
249 if (this) {
250 /* If the node is coincident with another at a lower address,
251 back up until the other node is found. It may be relevant */
252 while (this->overlapped) {
253 ptn = tn_prev(this);
254 if (!ptn) {
256 * We killed a node which set the overlapped
257 * flags during the scan. Fix it up.
259 this->overlapped = 0;
260 break;
262 this = ptn;
264 dbg_readinode("'this' found %#04x-%#04x (%s)\n", this->fn->ofs, this->fn->ofs + this->fn->size, this->fn ? "data" : "hole");
267 while (this) {
268 if (this->fn->ofs > fn_end)
269 break;
270 dbg_readinode("Ponder this ver %d, 0x%x-0x%x\n",
271 this->version, this->fn->ofs, this->fn->size);
273 if (this->version == tn->version) {
274 /* Version number collision means REF_PRISTINE GC. Accept either of them
275 as long as the CRC is correct. Check the one we have already... */
276 if (!check_tn_node(c, this)) {
277 /* The one we already had was OK. Keep it and throw away the new one */
278 dbg_readinode("Like old node. Throw away new\n");
279 jffs2_kill_tn(c, tn);
280 return 0;
281 } else {
282 /* Who cares if the new one is good; keep it for now anyway. */
283 dbg_readinode("Like new node. Throw away old\n");
284 rb_replace_node(&this->rb, &tn->rb, &rii->tn_root);
285 jffs2_kill_tn(c, this);
286 /* Same overlapping from in front and behind */
287 return 0;
290 if (this->version < tn->version &&
291 this->fn->ofs >= tn->fn->ofs &&
292 this->fn->ofs + this->fn->size <= fn_end) {
293 /* New node entirely overlaps 'this' */
294 if (check_tn_node(c, tn)) {
295 dbg_readinode("new node bad CRC\n");
296 jffs2_kill_tn(c, tn);
297 return 0;
299 /* ... and is good. Kill 'this' and any subsequent nodes which are also overlapped */
300 while (this && this->fn->ofs + this->fn->size <= fn_end) {
301 struct jffs2_tmp_dnode_info *next = tn_next(this);
302 if (this->version < tn->version) {
303 tn_erase(this, &rii->tn_root);
304 dbg_readinode("Kill overlapped ver %d, 0x%x-0x%x\n",
305 this->version, this->fn->ofs,
306 this->fn->ofs+this->fn->size);
307 jffs2_kill_tn(c, this);
309 this = next;
311 dbg_readinode("Done killing overlapped nodes\n");
312 continue;
314 if (this->version > tn->version &&
315 this->fn->ofs <= tn->fn->ofs &&
316 this->fn->ofs+this->fn->size >= fn_end) {
317 /* New node entirely overlapped by 'this' */
318 if (!check_tn_node(c, this)) {
319 dbg_readinode("Good CRC on old node. Kill new\n");
320 jffs2_kill_tn(c, tn);
321 return 0;
323 /* ... but 'this' was bad. Replace it... */
324 dbg_readinode("Bad CRC on old overlapping node. Kill it\n");
325 tn_erase(this, &rii->tn_root);
326 jffs2_kill_tn(c, this);
327 break;
330 this = tn_next(this);
333 /* We neither completely obsoleted nor were completely
334 obsoleted by an earlier node. Insert into the tree */
336 struct rb_node *parent;
337 struct rb_node **link = &rii->tn_root.rb_node;
338 struct jffs2_tmp_dnode_info *insert_point = NULL;
340 while (*link) {
341 parent = *link;
342 insert_point = rb_entry(parent, struct jffs2_tmp_dnode_info, rb);
343 if (tn->fn->ofs > insert_point->fn->ofs)
344 link = &insert_point->rb.rb_right;
345 else if (tn->fn->ofs < insert_point->fn->ofs ||
346 tn->fn->size < insert_point->fn->size)
347 link = &insert_point->rb.rb_left;
348 else
349 link = &insert_point->rb.rb_right;
351 rb_link_node(&tn->rb, &insert_point->rb, link);
352 rb_insert_color(&tn->rb, &rii->tn_root);
355 /* If there's anything behind that overlaps us, note it */
356 this = tn_prev(tn);
357 if (this) {
358 while (1) {
359 if (this->fn->ofs + this->fn->size > tn->fn->ofs) {
360 dbg_readinode("Node is overlapped by %p (v %d, 0x%x-0x%x)\n",
361 this, this->version, this->fn->ofs,
362 this->fn->ofs+this->fn->size);
363 tn->overlapped = 1;
364 break;
366 if (!this->overlapped)
367 break;
369 ptn = tn_prev(this);
370 if (!ptn) {
372 * We killed a node which set the overlapped
373 * flags during the scan. Fix it up.
375 this->overlapped = 0;
376 break;
378 this = ptn;
382 /* If the new node overlaps anything ahead, note it */
383 this = tn_next(tn);
384 while (this && this->fn->ofs < fn_end) {
385 this->overlapped = 1;
386 dbg_readinode("Node ver %d, 0x%x-0x%x is overlapped\n",
387 this->version, this->fn->ofs,
388 this->fn->ofs+this->fn->size);
389 this = tn_next(this);
391 return 0;
394 /* Trivial function to remove the last node in the tree. Which by definition
395 has no right-hand -- so can be removed just by making its only child (if
396 any) take its place under its parent. */
397 static void eat_last(struct rb_root *root, struct rb_node *node)
399 struct rb_node *parent = rb_parent(node);
400 struct rb_node **link;
402 /* LAST! */
403 BUG_ON(node->rb_right);
405 if (!parent)
406 link = &root->rb_node;
407 else if (node == parent->rb_left)
408 link = &parent->rb_left;
409 else
410 link = &parent->rb_right;
412 *link = node->rb_left;
413 /* Colour doesn't matter now. Only the parent pointer. */
414 if (node->rb_left)
415 node->rb_left->rb_parent_color = node->rb_parent_color;
418 /* We put this in reverse order, so we can just use eat_last */
419 static void ver_insert(struct rb_root *ver_root, struct jffs2_tmp_dnode_info *tn)
421 struct rb_node **link = &ver_root->rb_node;
422 struct rb_node *parent = NULL;
423 struct jffs2_tmp_dnode_info *this_tn;
425 while (*link) {
426 parent = *link;
427 this_tn = rb_entry(parent, struct jffs2_tmp_dnode_info, rb);
429 if (tn->version > this_tn->version)
430 link = &parent->rb_left;
431 else
432 link = &parent->rb_right;
434 dbg_readinode("Link new node at %p (root is %p)\n", link, ver_root);
435 rb_link_node(&tn->rb, parent, link);
436 rb_insert_color(&tn->rb, ver_root);
439 /* Build final, normal fragtree from tn tree. It doesn't matter which order
440 we add nodes to the real fragtree, as long as they don't overlap. And
441 having thrown away the majority of overlapped nodes as we went, there
442 really shouldn't be many sets of nodes which do overlap. If we start at
443 the end, we can use the overlap markers -- we can just eat nodes which
444 aren't overlapped, and when we encounter nodes which _do_ overlap we
445 sort them all into a temporary tree in version order before replaying them. */
446 static int jffs2_build_inode_fragtree(struct jffs2_sb_info *c,
447 struct jffs2_inode_info *f,
448 struct jffs2_readinode_info *rii)
450 struct jffs2_tmp_dnode_info *pen, *last, *this;
451 struct rb_root ver_root = RB_ROOT;
452 uint32_t high_ver = 0;
454 if (rii->mdata_tn) {
455 dbg_readinode("potential mdata is ver %d at %p\n", rii->mdata_tn->version, rii->mdata_tn);
456 high_ver = rii->mdata_tn->version;
457 rii->latest_ref = rii->mdata_tn->fn->raw;
459 #ifdef JFFS2_DBG_READINODE_MESSAGES
460 this = tn_last(&rii->tn_root);
461 while (this) {
462 dbg_readinode("tn %p ver %d range 0x%x-0x%x ov %d\n", this, this->version, this->fn->ofs,
463 this->fn->ofs+this->fn->size, this->overlapped);
464 this = tn_prev(this);
466 #endif
467 pen = tn_last(&rii->tn_root);
468 while ((last = pen)) {
469 pen = tn_prev(last);
471 eat_last(&rii->tn_root, &last->rb);
472 ver_insert(&ver_root, last);
474 if (unlikely(last->overlapped)) {
475 if (pen)
476 continue;
478 * We killed a node which set the overlapped
479 * flags during the scan. Fix it up.
481 last->overlapped = 0;
484 /* Now we have a bunch of nodes in reverse version
485 order, in the tree at ver_root. Most of the time,
486 there'll actually be only one node in the 'tree',
487 in fact. */
488 this = tn_last(&ver_root);
490 while (this) {
491 struct jffs2_tmp_dnode_info *vers_next;
492 int ret;
493 vers_next = tn_prev(this);
494 eat_last(&ver_root, &this->rb);
495 if (check_tn_node(c, this)) {
496 dbg_readinode("node ver %d, 0x%x-0x%x failed CRC\n",
497 this->version, this->fn->ofs,
498 this->fn->ofs+this->fn->size);
499 jffs2_kill_tn(c, this);
500 } else {
501 if (this->version > high_ver) {
502 /* Note that this is different from the other
503 highest_version, because this one is only
504 counting _valid_ nodes which could give the
505 latest inode metadata */
506 high_ver = this->version;
507 rii->latest_ref = this->fn->raw;
509 dbg_readinode("Add %p (v %d, 0x%x-0x%x, ov %d) to fragtree\n",
510 this, this->version, this->fn->ofs,
511 this->fn->ofs+this->fn->size, this->overlapped);
513 ret = jffs2_add_full_dnode_to_inode(c, f, this->fn);
514 if (ret) {
515 /* Free the nodes in vers_root; let the caller
516 deal with the rest */
517 JFFS2_ERROR("Add node to tree failed %d\n", ret);
518 while (1) {
519 vers_next = tn_prev(this);
520 if (check_tn_node(c, this))
521 jffs2_mark_node_obsolete(c, this->fn->raw);
522 jffs2_free_full_dnode(this->fn);
523 jffs2_free_tmp_dnode_info(this);
524 this = vers_next;
525 if (!this)
526 break;
527 eat_last(&ver_root, &vers_next->rb);
529 return ret;
531 jffs2_free_tmp_dnode_info(this);
533 this = vers_next;
536 return 0;
539 static void jffs2_free_tmp_dnode_info_list(struct rb_root *list)
541 struct rb_node *this;
542 struct jffs2_tmp_dnode_info *tn;
544 this = list->rb_node;
546 /* Now at bottom of tree */
547 while (this) {
548 if (this->rb_left)
549 this = this->rb_left;
550 else if (this->rb_right)
551 this = this->rb_right;
552 else {
553 tn = rb_entry(this, struct jffs2_tmp_dnode_info, rb);
554 jffs2_free_full_dnode(tn->fn);
555 jffs2_free_tmp_dnode_info(tn);
557 this = rb_parent(this);
558 if (!this)
559 break;
561 if (this->rb_left == &tn->rb)
562 this->rb_left = NULL;
563 else if (this->rb_right == &tn->rb)
564 this->rb_right = NULL;
565 else BUG();
568 *list = RB_ROOT;
571 static void jffs2_free_full_dirent_list(struct jffs2_full_dirent *fd)
573 struct jffs2_full_dirent *next;
575 while (fd) {
576 next = fd->next;
577 jffs2_free_full_dirent(fd);
578 fd = next;
582 /* Returns first valid node after 'ref'. May return 'ref' */
583 static struct jffs2_raw_node_ref *jffs2_first_valid_node(struct jffs2_raw_node_ref *ref)
585 while (ref && ref->next_in_ino) {
586 if (!ref_obsolete(ref))
587 return ref;
588 dbg_noderef("node at 0x%08x is obsoleted. Ignoring.\n", ref_offset(ref));
589 ref = ref->next_in_ino;
591 return NULL;
595 * Helper function for jffs2_get_inode_nodes().
596 * It is called every time an directory entry node is found.
598 * Returns: 0 on success;
599 * negative error code on failure.
601 static inline int read_direntry(struct jffs2_sb_info *c, struct jffs2_raw_node_ref *ref,
602 struct jffs2_raw_dirent *rd, size_t read,
603 struct jffs2_readinode_info *rii)
605 struct jffs2_full_dirent *fd;
606 uint32_t crc;
608 /* Obsoleted. This cannot happen, surely? dwmw2 20020308 */
609 BUG_ON(ref_obsolete(ref));
611 crc = crc32(0, rd, sizeof(*rd) - 8);
612 if (unlikely(crc != je32_to_cpu(rd->node_crc))) {
613 JFFS2_NOTICE("header CRC failed on dirent node at %#08x: read %#08x, calculated %#08x\n",
614 ref_offset(ref), je32_to_cpu(rd->node_crc), crc);
615 jffs2_mark_node_obsolete(c, ref);
616 return 0;
619 /* If we've never checked the CRCs on this node, check them now */
620 if (ref_flags(ref) == REF_UNCHECKED) {
621 struct jffs2_eraseblock *jeb;
622 int len;
624 /* Sanity check */
625 if (unlikely(PAD((rd->nsize + sizeof(*rd))) != PAD(je32_to_cpu(rd->totlen)))) {
626 JFFS2_ERROR("illegal nsize in node at %#08x: nsize %#02x, totlen %#04x\n",
627 ref_offset(ref), rd->nsize, je32_to_cpu(rd->totlen));
628 jffs2_mark_node_obsolete(c, ref);
629 return 0;
632 jeb = &c->blocks[ref->flash_offset / c->sector_size];
633 len = ref_totlen(c, jeb, ref);
635 spin_lock(&c->erase_completion_lock);
636 jeb->used_size += len;
637 jeb->unchecked_size -= len;
638 c->used_size += len;
639 c->unchecked_size -= len;
640 ref->flash_offset = ref_offset(ref) | dirent_node_state(rd);
641 spin_unlock(&c->erase_completion_lock);
644 fd = jffs2_alloc_full_dirent(rd->nsize + 1);
645 if (unlikely(!fd))
646 return -ENOMEM;
648 fd->raw = ref;
649 fd->version = je32_to_cpu(rd->version);
650 fd->ino = je32_to_cpu(rd->ino);
651 fd->type = rd->type;
653 if (fd->version > rii->highest_version)
654 rii->highest_version = fd->version;
656 /* Pick out the mctime of the latest dirent */
657 if(fd->version > rii->mctime_ver && je32_to_cpu(rd->mctime)) {
658 rii->mctime_ver = fd->version;
659 rii->latest_mctime = je32_to_cpu(rd->mctime);
663 * Copy as much of the name as possible from the raw
664 * dirent we've already read from the flash.
666 if (read > sizeof(*rd))
667 memcpy(&fd->name[0], &rd->name[0],
668 min_t(uint32_t, rd->nsize, (read - sizeof(*rd)) ));
670 /* Do we need to copy any more of the name directly from the flash? */
671 if (rd->nsize + sizeof(*rd) > read) {
672 /* FIXME: point() */
673 int err;
674 int already = read - sizeof(*rd);
676 err = jffs2_flash_read(c, (ref_offset(ref)) + read,
677 rd->nsize - already, &read, &fd->name[already]);
678 if (unlikely(read != rd->nsize - already) && likely(!err))
679 return -EIO;
681 if (unlikely(err)) {
682 JFFS2_ERROR("read remainder of name: error %d\n", err);
683 jffs2_free_full_dirent(fd);
684 return -EIO;
688 fd->nhash = full_name_hash(fd->name, rd->nsize);
689 fd->next = NULL;
690 fd->name[rd->nsize] = '\0';
693 * Wheee. We now have a complete jffs2_full_dirent structure, with
694 * the name in it and everything. Link it into the list
696 jffs2_add_fd_to_list(c, fd, &rii->fds);
698 return 0;
702 * Helper function for jffs2_get_inode_nodes().
703 * It is called every time an inode node is found.
705 * Returns: 0 on success (possibly after marking a bad node obsolete);
706 * negative error code on failure.
708 static inline int read_dnode(struct jffs2_sb_info *c, struct jffs2_raw_node_ref *ref,
709 struct jffs2_raw_inode *rd, int rdlen,
710 struct jffs2_readinode_info *rii)
712 struct jffs2_tmp_dnode_info *tn;
713 uint32_t len, csize;
714 int ret = 0;
715 uint32_t crc;
717 /* Obsoleted. This cannot happen, surely? dwmw2 20020308 */
718 BUG_ON(ref_obsolete(ref));
720 crc = crc32(0, rd, sizeof(*rd) - 8);
721 if (unlikely(crc != je32_to_cpu(rd->node_crc))) {
722 JFFS2_NOTICE("node CRC failed on dnode at %#08x: read %#08x, calculated %#08x\n",
723 ref_offset(ref), je32_to_cpu(rd->node_crc), crc);
724 jffs2_mark_node_obsolete(c, ref);
725 return 0;
728 tn = jffs2_alloc_tmp_dnode_info();
729 if (!tn) {
730 JFFS2_ERROR("failed to allocate tn (%zu bytes).\n", sizeof(*tn));
731 return -ENOMEM;
734 tn->partial_crc = 0;
735 csize = je32_to_cpu(rd->csize);
737 /* If we've never checked the CRCs on this node, check them now */
738 if (ref_flags(ref) == REF_UNCHECKED) {
740 /* Sanity checks */
741 if (unlikely(je32_to_cpu(rd->offset) > je32_to_cpu(rd->isize)) ||
742 unlikely(PAD(je32_to_cpu(rd->csize) + sizeof(*rd)) != PAD(je32_to_cpu(rd->totlen)))) {
743 JFFS2_WARNING("inode node header CRC is corrupted at %#08x\n", ref_offset(ref));
744 jffs2_dbg_dump_node(c, ref_offset(ref));
745 jffs2_mark_node_obsolete(c, ref);
746 goto free_out;
749 if (jffs2_is_writebuffered(c) && csize != 0) {
750 /* At this point we are supposed to check the data CRC
751 * of our unchecked node. But thus far, we do not
752 * know whether the node is valid or obsolete. To
753 * figure this out, we need to walk all the nodes of
754 * the inode and build the inode fragtree. We don't
755 * want to spend time checking data of nodes which may
756 * later be found to be obsolete. So we put off the full
757 * data CRC checking until we have read all the inode
758 * nodes and have started building the fragtree.
760 * The fragtree is being built starting with nodes
761 * having the highest version number, so we'll be able
762 * to detect whether a node is valid (i.e., it is not
763 * overlapped by a node with higher version) or not.
764 * And we'll be able to check only those nodes, which
765 * are not obsolete.
767 * Of course, this optimization only makes sense in case
768 * of NAND flashes (or other flashes with
769 * !jffs2_can_mark_obsolete()), since on NOR flashes
770 * nodes are marked obsolete physically.
772 * Since NAND flashes (or other flashes with
773 * jffs2_is_writebuffered(c)) are anyway read by
774 * fractions of c->wbuf_pagesize, and we have just read
775 * the node header, it is likely that the starting part
776 * of the node data is also read when we read the
777 * header. So we don't mind to check the CRC of the
778 * starting part of the data of the node now, and check
779 * the second part later (in jffs2_check_node_data()).
780 * Of course, we will not need to re-read and re-check
781 * the NAND page which we have just read. This is why we
782 * read the whole NAND page at jffs2_get_inode_nodes(),
783 * while we needed only the node header.
785 unsigned char *buf;
787 /* 'buf' will point to the start of data */
788 buf = (unsigned char *)rd + sizeof(*rd);
789 /* len will be the read data length */
790 len = min_t(uint32_t, rdlen - sizeof(*rd), csize);
791 tn->partial_crc = crc32(0, buf, len);
793 dbg_readinode("Calculates CRC (%#08x) for %d bytes, csize %d\n", tn->partial_crc, len, csize);
795 /* If we actually calculated the whole data CRC
796 * and it is wrong, drop the node. */
797 if (len >= csize && unlikely(tn->partial_crc != je32_to_cpu(rd->data_crc))) {
798 JFFS2_NOTICE("wrong data CRC in data node at 0x%08x: read %#08x, calculated %#08x.\n",
799 ref_offset(ref), tn->partial_crc, je32_to_cpu(rd->data_crc));
800 jffs2_mark_node_obsolete(c, ref);
801 goto free_out;
804 } else if (csize == 0) {
806 * We checked the header CRC. If the node has no data, adjust
807 * the space accounting now. For other nodes this will be done
808 * later either when the node is marked obsolete or when its
809 * data is checked.
811 struct jffs2_eraseblock *jeb;
813 dbg_readinode("the node has no data.\n");
814 jeb = &c->blocks[ref->flash_offset / c->sector_size];
815 len = ref_totlen(c, jeb, ref);
817 spin_lock(&c->erase_completion_lock);
818 jeb->used_size += len;
819 jeb->unchecked_size -= len;
820 c->used_size += len;
821 c->unchecked_size -= len;
822 ref->flash_offset = ref_offset(ref) | REF_NORMAL;
823 spin_unlock(&c->erase_completion_lock);
827 tn->fn = jffs2_alloc_full_dnode();
828 if (!tn->fn) {
829 JFFS2_ERROR("alloc fn failed\n");
830 ret = -ENOMEM;
831 goto free_out;
834 tn->version = je32_to_cpu(rd->version);
835 tn->fn->ofs = je32_to_cpu(rd->offset);
836 tn->data_crc = je32_to_cpu(rd->data_crc);
837 tn->csize = csize;
838 tn->fn->raw = ref;
839 tn->overlapped = 0;
841 if (tn->version > rii->highest_version)
842 rii->highest_version = tn->version;
844 /* There was a bug where we wrote hole nodes out with
845 csize/dsize swapped. Deal with it */
846 if (rd->compr == JFFS2_COMPR_ZERO && !je32_to_cpu(rd->dsize) && csize)
847 tn->fn->size = csize;
848 else // normal case...
849 tn->fn->size = je32_to_cpu(rd->dsize);
851 dbg_readinode2("dnode @%08x: ver %u, offset %#04x, dsize %#04x, csize %#04x\n",
852 ref_offset(ref), je32_to_cpu(rd->version),
853 je32_to_cpu(rd->offset), je32_to_cpu(rd->dsize), csize);
855 ret = jffs2_add_tn_to_tree(c, rii, tn);
857 if (ret) {
858 jffs2_free_full_dnode(tn->fn);
859 free_out:
860 jffs2_free_tmp_dnode_info(tn);
861 return ret;
863 #ifdef JFFS2_DBG_READINODE2_MESSAGES
864 dbg_readinode2("After adding ver %d:\n", je32_to_cpu(rd->version));
865 tn = tn_first(&rii->tn_root);
866 while (tn) {
867 dbg_readinode2("%p: v %d r 0x%x-0x%x ov %d\n",
868 tn, tn->version, tn->fn->ofs,
869 tn->fn->ofs+tn->fn->size, tn->overlapped);
870 tn = tn_next(tn);
872 #endif
873 return 0;
877 * Helper function for jffs2_get_inode_nodes().
878 * It is called every time an unknown node is found.
880 * Returns: 0 on success;
881 * negative error code on failure.
883 static inline int read_unknown(struct jffs2_sb_info *c, struct jffs2_raw_node_ref *ref, struct jffs2_unknown_node *un)
885 /* We don't mark unknown nodes as REF_UNCHECKED */
886 if (ref_flags(ref) == REF_UNCHECKED) {
887 JFFS2_ERROR("REF_UNCHECKED but unknown node at %#08x\n",
888 ref_offset(ref));
889 JFFS2_ERROR("Node is {%04x,%04x,%08x,%08x}. Please report this error.\n",
890 je16_to_cpu(un->magic), je16_to_cpu(un->nodetype),
891 je32_to_cpu(un->totlen), je32_to_cpu(un->hdr_crc));
892 jffs2_mark_node_obsolete(c, ref);
893 return 0;
896 un->nodetype = cpu_to_je16(JFFS2_NODE_ACCURATE | je16_to_cpu(un->nodetype));
898 switch(je16_to_cpu(un->nodetype) & JFFS2_COMPAT_MASK) {
900 case JFFS2_FEATURE_INCOMPAT:
901 JFFS2_ERROR("unknown INCOMPAT nodetype %#04X at %#08x\n",
902 je16_to_cpu(un->nodetype), ref_offset(ref));
903 /* EEP */
904 BUG();
905 break;
907 case JFFS2_FEATURE_ROCOMPAT:
908 JFFS2_ERROR("unknown ROCOMPAT nodetype %#04X at %#08x\n",
909 je16_to_cpu(un->nodetype), ref_offset(ref));
910 BUG_ON(!(c->flags & JFFS2_SB_FLAG_RO));
911 break;
913 case JFFS2_FEATURE_RWCOMPAT_COPY:
914 JFFS2_NOTICE("unknown RWCOMPAT_COPY nodetype %#04X at %#08x\n",
915 je16_to_cpu(un->nodetype), ref_offset(ref));
916 break;
918 case JFFS2_FEATURE_RWCOMPAT_DELETE:
919 JFFS2_NOTICE("unknown RWCOMPAT_DELETE nodetype %#04X at %#08x\n",
920 je16_to_cpu(un->nodetype), ref_offset(ref));
921 jffs2_mark_node_obsolete(c, ref);
922 return 0;
925 return 0;
929 * Helper function for jffs2_get_inode_nodes().
930 * The function detects whether more data should be read and reads it if yes.
932 * Returns: 0 on success;
933 * negative error code on failure.
935 static int read_more(struct jffs2_sb_info *c, struct jffs2_raw_node_ref *ref,
936 int needed_len, int *rdlen, unsigned char *buf)
938 int err, to_read = needed_len - *rdlen;
939 size_t retlen;
940 uint32_t offs;
942 if (jffs2_is_writebuffered(c)) {
943 int rem = to_read % c->wbuf_pagesize;
945 if (rem)
946 to_read += c->wbuf_pagesize - rem;
949 /* We need to read more data */
950 offs = ref_offset(ref) + *rdlen;
952 dbg_readinode("read more %d bytes\n", to_read);
954 err = jffs2_flash_read(c, offs, to_read, &retlen, buf + *rdlen);
955 if (err) {
956 JFFS2_ERROR("can not read %d bytes from 0x%08x, "
957 "error code: %d.\n", to_read, offs, err);
958 return err;
961 if (retlen < to_read) {
962 JFFS2_ERROR("short read at %#08x: %zu instead of %d.\n",
963 offs, retlen, to_read);
964 return -EIO;
967 *rdlen += to_read;
968 return 0;
971 /* Get tmp_dnode_info and full_dirent for all non-obsolete nodes associated
972 with this ino. Perform a preliminary ordering on data nodes, throwing away
973 those which are completely obsoleted by newer ones. The naïve approach we
974 use to take of just returning them _all_ in version order will cause us to
975 run out of memory in certain degenerate cases. */
976 static int jffs2_get_inode_nodes(struct jffs2_sb_info *c, struct jffs2_inode_info *f,
977 struct jffs2_readinode_info *rii)
979 struct jffs2_raw_node_ref *ref, *valid_ref;
980 unsigned char *buf = NULL;
981 union jffs2_node_union *node;
982 size_t retlen;
983 int len, err;
985 rii->mctime_ver = 0;
987 dbg_readinode("ino #%u\n", f->inocache->ino);
989 /* FIXME: in case of NOR and available ->point() this
990 * needs to be fixed. */
991 len = sizeof(union jffs2_node_union) + c->wbuf_pagesize;
992 buf = kmalloc(len, GFP_KERNEL);
993 if (!buf)
994 return -ENOMEM;
996 spin_lock(&c->erase_completion_lock);
997 valid_ref = jffs2_first_valid_node(f->inocache->nodes);
998 if (!valid_ref && f->inocache->ino != 1)
999 JFFS2_WARNING("Eep. No valid nodes for ino #%u.\n", f->inocache->ino);
1000 while (valid_ref) {
1001 /* We can hold a pointer to a non-obsolete node without the spinlock,
1002 but _obsolete_ nodes may disappear at any time, if the block
1003 they're in gets erased. So if we mark 'ref' obsolete while we're
1004 not holding the lock, it can go away immediately. For that reason,
1005 we find the next valid node first, before processing 'ref'.
1007 ref = valid_ref;
1008 valid_ref = jffs2_first_valid_node(ref->next_in_ino);
1009 spin_unlock(&c->erase_completion_lock);
1011 cond_resched();
1014 * At this point we don't know the type of the node we're going
1015 * to read, so we do not know the size of its header. In order
1016 * to minimize the amount of flash IO we assume the header is
1017 * of size = JFFS2_MIN_NODE_HEADER.
1019 len = JFFS2_MIN_NODE_HEADER;
1020 if (jffs2_is_writebuffered(c)) {
1021 int end, rem;
1024 * We are about to read JFFS2_MIN_NODE_HEADER bytes,
1025 * but this flash has some minimal I/O unit. It is
1026 * possible that we'll need to read more soon, so read
1027 * up to the next min. I/O unit, in order not to
1028 * re-read the same min. I/O unit twice.
1030 end = ref_offset(ref) + len;
1031 rem = end % c->wbuf_pagesize;
1032 if (rem)
1033 end += c->wbuf_pagesize - rem;
1034 len = end - ref_offset(ref);
1037 dbg_readinode("read %d bytes at %#08x(%d).\n", len, ref_offset(ref), ref_flags(ref));
1039 /* FIXME: point() */
1040 err = jffs2_flash_read(c, ref_offset(ref), len, &retlen, buf);
1041 if (err) {
1042 JFFS2_ERROR("can not read %d bytes from 0x%08x, error code: %d.\n", len, ref_offset(ref), err);
1043 goto free_out;
1046 if (retlen < len) {
1047 JFFS2_ERROR("short read at %#08x: %zu instead of %d.\n", ref_offset(ref), retlen, len);
1048 err = -EIO;
1049 goto free_out;
1052 node = (union jffs2_node_union *)buf;
1054 /* No need to mask in the valid bit; it shouldn't be invalid */
1055 if (je32_to_cpu(node->u.hdr_crc) != crc32(0, node, sizeof(node->u)-4)) {
1056 JFFS2_NOTICE("Node header CRC failed at %#08x. {%04x,%04x,%08x,%08x}\n",
1057 ref_offset(ref), je16_to_cpu(node->u.magic),
1058 je16_to_cpu(node->u.nodetype),
1059 je32_to_cpu(node->u.totlen),
1060 je32_to_cpu(node->u.hdr_crc));
1061 jffs2_dbg_dump_node(c, ref_offset(ref));
1062 jffs2_mark_node_obsolete(c, ref);
1063 goto cont;
1065 if (je16_to_cpu(node->u.magic) != JFFS2_MAGIC_BITMASK) {
1066 /* Not a JFFS2 node, whinge and move on */
1067 JFFS2_NOTICE("Wrong magic bitmask 0x%04x in node header at %#08x.\n",
1068 je16_to_cpu(node->u.magic), ref_offset(ref));
1069 jffs2_mark_node_obsolete(c, ref);
1070 goto cont;
1073 switch (je16_to_cpu(node->u.nodetype)) {
1075 case JFFS2_NODETYPE_DIRENT:
1077 if (JFFS2_MIN_NODE_HEADER < sizeof(struct jffs2_raw_dirent) &&
1078 len < sizeof(struct jffs2_raw_dirent)) {
1079 err = read_more(c, ref, sizeof(struct jffs2_raw_dirent), &len, buf);
1080 if (unlikely(err))
1081 goto free_out;
1084 err = read_direntry(c, ref, &node->d, retlen, rii);
1085 if (unlikely(err))
1086 goto free_out;
1088 break;
1090 case JFFS2_NODETYPE_INODE:
1092 if (JFFS2_MIN_NODE_HEADER < sizeof(struct jffs2_raw_inode) &&
1093 len < sizeof(struct jffs2_raw_inode)) {
1094 err = read_more(c, ref, sizeof(struct jffs2_raw_inode), &len, buf);
1095 if (unlikely(err))
1096 goto free_out;
1099 err = read_dnode(c, ref, &node->i, len, rii);
1100 if (unlikely(err))
1101 goto free_out;
1103 break;
1105 default:
1106 if (JFFS2_MIN_NODE_HEADER < sizeof(struct jffs2_unknown_node) &&
1107 len < sizeof(struct jffs2_unknown_node)) {
1108 err = read_more(c, ref, sizeof(struct jffs2_unknown_node), &len, buf);
1109 if (unlikely(err))
1110 goto free_out;
1113 err = read_unknown(c, ref, &node->u);
1114 if (unlikely(err))
1115 goto free_out;
1118 cont:
1119 spin_lock(&c->erase_completion_lock);
1122 spin_unlock(&c->erase_completion_lock);
1123 kfree(buf);
1125 f->highest_version = rii->highest_version;
1127 dbg_readinode("nodes of inode #%u were read, the highest version is %u, latest_mctime %u, mctime_ver %u.\n",
1128 f->inocache->ino, rii->highest_version, rii->latest_mctime,
1129 rii->mctime_ver);
1130 return 0;
1132 free_out:
1133 jffs2_free_tmp_dnode_info_list(&rii->tn_root);
1134 jffs2_free_full_dirent_list(rii->fds);
1135 rii->fds = NULL;
1136 kfree(buf);
1137 return err;
1140 static int jffs2_do_read_inode_internal(struct jffs2_sb_info *c,
1141 struct jffs2_inode_info *f,
1142 struct jffs2_raw_inode *latest_node)
1144 struct jffs2_readinode_info rii;
1145 uint32_t crc, new_size;
1146 size_t retlen;
1147 int ret;
1149 dbg_readinode("ino #%u pino/nlink is %d\n", f->inocache->ino,
1150 f->inocache->pino_nlink);
1152 memset(&rii, 0, sizeof(rii));
1154 /* Grab all nodes relevant to this ino */
1155 ret = jffs2_get_inode_nodes(c, f, &rii);
1157 if (ret) {
1158 JFFS2_ERROR("cannot read nodes for ino %u, returned error is %d\n", f->inocache->ino, ret);
1159 if (f->inocache->state == INO_STATE_READING)
1160 jffs2_set_inocache_state(c, f->inocache, INO_STATE_CHECKEDABSENT);
1161 return ret;
1164 ret = jffs2_build_inode_fragtree(c, f, &rii);
1165 if (ret) {
1166 JFFS2_ERROR("Failed to build final fragtree for inode #%u: error %d\n",
1167 f->inocache->ino, ret);
1168 if (f->inocache->state == INO_STATE_READING)
1169 jffs2_set_inocache_state(c, f->inocache, INO_STATE_CHECKEDABSENT);
1170 jffs2_free_tmp_dnode_info_list(&rii.tn_root);
1171 /* FIXME: We could at least crc-check them all */
1172 if (rii.mdata_tn) {
1173 jffs2_free_full_dnode(rii.mdata_tn->fn);
1174 jffs2_free_tmp_dnode_info(rii.mdata_tn);
1175 rii.mdata_tn = NULL;
1177 return ret;
1180 if (rii.mdata_tn) {
1181 if (rii.mdata_tn->fn->raw == rii.latest_ref) {
1182 f->metadata = rii.mdata_tn->fn;
1183 jffs2_free_tmp_dnode_info(rii.mdata_tn);
1184 } else {
1185 jffs2_kill_tn(c, rii.mdata_tn);
1187 rii.mdata_tn = NULL;
1190 f->dents = rii.fds;
1192 jffs2_dbg_fragtree_paranoia_check_nolock(f);
1194 if (unlikely(!rii.latest_ref)) {
1195 /* No data nodes for this inode. */
1196 if (f->inocache->ino != 1) {
1197 JFFS2_WARNING("no data nodes found for ino #%u\n", f->inocache->ino);
1198 if (!rii.fds) {
1199 if (f->inocache->state == INO_STATE_READING)
1200 jffs2_set_inocache_state(c, f->inocache, INO_STATE_CHECKEDABSENT);
1201 return -EIO;
1203 JFFS2_NOTICE("but it has children so we fake some modes for it\n");
1205 latest_node->mode = cpu_to_jemode(S_IFDIR|S_IRUGO|S_IWUSR|S_IXUGO);
1206 latest_node->version = cpu_to_je32(0);
1207 latest_node->atime = latest_node->ctime = latest_node->mtime = cpu_to_je32(0);
1208 latest_node->isize = cpu_to_je32(0);
1209 latest_node->gid = cpu_to_je16(0);
1210 latest_node->uid = cpu_to_je16(0);
1211 if (f->inocache->state == INO_STATE_READING)
1212 jffs2_set_inocache_state(c, f->inocache, INO_STATE_PRESENT);
1213 return 0;
1216 ret = jffs2_flash_read(c, ref_offset(rii.latest_ref), sizeof(*latest_node), &retlen, (void *)latest_node);
1217 if (ret || retlen != sizeof(*latest_node)) {
1218 JFFS2_ERROR("failed to read from flash: error %d, %zd of %zd bytes read\n",
1219 ret, retlen, sizeof(*latest_node));
1220 /* FIXME: If this fails, there seems to be a memory leak. Find it. */
1221 mutex_unlock(&f->sem);
1222 jffs2_do_clear_inode(c, f);
1223 return ret?ret:-EIO;
1226 crc = crc32(0, latest_node, sizeof(*latest_node)-8);
1227 if (crc != je32_to_cpu(latest_node->node_crc)) {
1228 JFFS2_ERROR("CRC failed for read_inode of inode %u at physical location 0x%x\n",
1229 f->inocache->ino, ref_offset(rii.latest_ref));
1230 mutex_unlock(&f->sem);
1231 jffs2_do_clear_inode(c, f);
1232 return -EIO;
1235 switch(jemode_to_cpu(latest_node->mode) & S_IFMT) {
1236 case S_IFDIR:
1237 if (rii.mctime_ver > je32_to_cpu(latest_node->version)) {
1238 /* The times in the latest_node are actually older than
1239 mctime in the latest dirent. Cheat. */
1240 latest_node->ctime = latest_node->mtime = cpu_to_je32(rii.latest_mctime);
1242 break;
1245 case S_IFREG:
1246 /* If it was a regular file, truncate it to the latest node's isize */
1247 new_size = jffs2_truncate_fragtree(c, &f->fragtree, je32_to_cpu(latest_node->isize));
1248 if (new_size != je32_to_cpu(latest_node->isize)) {
1249 JFFS2_WARNING("Truncating ino #%u to %d bytes failed because it only had %d bytes to start with!\n",
1250 f->inocache->ino, je32_to_cpu(latest_node->isize), new_size);
1251 latest_node->isize = cpu_to_je32(new_size);
1253 break;
1255 case S_IFLNK:
1256 /* Hack to work around broken isize in old symlink code.
1257 Remove this when dwmw2 comes to his senses and stops
1258 symlinks from being an entirely gratuitous special
1259 case. */
1260 if (!je32_to_cpu(latest_node->isize))
1261 latest_node->isize = latest_node->dsize;
1263 if (f->inocache->state != INO_STATE_CHECKING) {
1264 /* Symlink's inode data is the target path. Read it and
1265 * keep in RAM to facilitate quick follow symlink
1266 * operation. */
1267 f->target = kmalloc(je32_to_cpu(latest_node->csize) + 1, GFP_KERNEL);
1268 if (!f->target) {
1269 JFFS2_ERROR("can't allocate %d bytes of memory for the symlink target path cache\n", je32_to_cpu(latest_node->csize));
1270 mutex_unlock(&f->sem);
1271 jffs2_do_clear_inode(c, f);
1272 return -ENOMEM;
1275 ret = jffs2_flash_read(c, ref_offset(rii.latest_ref) + sizeof(*latest_node),
1276 je32_to_cpu(latest_node->csize), &retlen, (char *)f->target);
1278 if (ret || retlen != je32_to_cpu(latest_node->csize)) {
1279 if (retlen != je32_to_cpu(latest_node->csize))
1280 ret = -EIO;
1281 kfree(f->target);
1282 f->target = NULL;
1283 mutex_unlock(&f->sem);
1284 jffs2_do_clear_inode(c, f);
1285 return ret;
1288 f->target[je32_to_cpu(latest_node->csize)] = '\0';
1289 dbg_readinode("symlink's target '%s' cached\n", f->target);
1292 /* fall through... */
1294 case S_IFBLK:
1295 case S_IFCHR:
1296 /* Certain inode types should have only one data node, and it's
1297 kept as the metadata node */
1298 if (f->metadata) {
1299 JFFS2_ERROR("Argh. Special inode #%u with mode 0%o had metadata node\n",
1300 f->inocache->ino, jemode_to_cpu(latest_node->mode));
1301 mutex_unlock(&f->sem);
1302 jffs2_do_clear_inode(c, f);
1303 return -EIO;
1305 if (!frag_first(&f->fragtree)) {
1306 JFFS2_ERROR("Argh. Special inode #%u with mode 0%o has no fragments\n",
1307 f->inocache->ino, jemode_to_cpu(latest_node->mode));
1308 mutex_unlock(&f->sem);
1309 jffs2_do_clear_inode(c, f);
1310 return -EIO;
1312 /* ASSERT: f->fraglist != NULL */
1313 if (frag_next(frag_first(&f->fragtree))) {
1314 JFFS2_ERROR("Argh. Special inode #%u with mode 0x%x had more than one node\n",
1315 f->inocache->ino, jemode_to_cpu(latest_node->mode));
1316 /* FIXME: Deal with it - check crc32, check for duplicate node, check times and discard the older one */
1317 mutex_unlock(&f->sem);
1318 jffs2_do_clear_inode(c, f);
1319 return -EIO;
1321 /* OK. We're happy */
1322 f->metadata = frag_first(&f->fragtree)->node;
1323 jffs2_free_node_frag(frag_first(&f->fragtree));
1324 f->fragtree = RB_ROOT;
1325 break;
1327 if (f->inocache->state == INO_STATE_READING)
1328 jffs2_set_inocache_state(c, f->inocache, INO_STATE_PRESENT);
1330 return 0;
1333 /* Scan the list of all nodes present for this ino, build map of versions, etc. */
1334 int jffs2_do_read_inode(struct jffs2_sb_info *c, struct jffs2_inode_info *f,
1335 uint32_t ino, struct jffs2_raw_inode *latest_node)
1337 dbg_readinode("read inode #%u\n", ino);
1339 retry_inocache:
1340 spin_lock(&c->inocache_lock);
1341 f->inocache = jffs2_get_ino_cache(c, ino);
1343 if (f->inocache) {
1344 /* Check its state. We may need to wait before we can use it */
1345 switch(f->inocache->state) {
1346 case INO_STATE_UNCHECKED:
1347 case INO_STATE_CHECKEDABSENT:
1348 f->inocache->state = INO_STATE_READING;
1349 break;
1351 case INO_STATE_CHECKING:
1352 case INO_STATE_GC:
1353 /* If it's in either of these states, we need
1354 to wait for whoever's got it to finish and
1355 put it back. */
1356 dbg_readinode("waiting for ino #%u in state %d\n", ino, f->inocache->state);
1357 sleep_on_spinunlock(&c->inocache_wq, &c->inocache_lock);
1358 goto retry_inocache;
1360 case INO_STATE_READING:
1361 case INO_STATE_PRESENT:
1362 /* Eep. This should never happen. It can
1363 happen if Linux calls read_inode() again
1364 before clear_inode() has finished though. */
1365 JFFS2_ERROR("Eep. Trying to read_inode #%u when it's already in state %d!\n", ino, f->inocache->state);
1366 /* Fail. That's probably better than allowing it to succeed */
1367 f->inocache = NULL;
1368 break;
1370 default:
1371 BUG();
1374 spin_unlock(&c->inocache_lock);
1376 if (!f->inocache && ino == 1) {
1377 /* Special case - no root inode on medium */
1378 f->inocache = jffs2_alloc_inode_cache();
1379 if (!f->inocache) {
1380 JFFS2_ERROR("cannot allocate inocache for root inode\n");
1381 return -ENOMEM;
1383 dbg_readinode("creating inocache for root inode\n");
1384 memset(f->inocache, 0, sizeof(struct jffs2_inode_cache));
1385 f->inocache->ino = f->inocache->pino_nlink = 1;
1386 f->inocache->nodes = (struct jffs2_raw_node_ref *)f->inocache;
1387 f->inocache->state = INO_STATE_READING;
1388 jffs2_add_ino_cache(c, f->inocache);
1390 if (!f->inocache) {
1391 JFFS2_ERROR("requestied to read an nonexistent ino %u\n", ino);
1392 return -ENOENT;
1395 return jffs2_do_read_inode_internal(c, f, latest_node);
1398 int jffs2_do_crccheck_inode(struct jffs2_sb_info *c, struct jffs2_inode_cache *ic)
1400 struct jffs2_raw_inode n;
1401 struct jffs2_inode_info *f = kzalloc(sizeof(*f), GFP_KERNEL);
1402 int ret;
1404 if (!f)
1405 return -ENOMEM;
1407 mutex_init(&f->sem);
1408 mutex_lock(&f->sem);
1409 f->inocache = ic;
1411 ret = jffs2_do_read_inode_internal(c, f, &n);
1412 if (!ret) {
1413 mutex_unlock(&f->sem);
1414 jffs2_do_clear_inode(c, f);
1416 kfree (f);
1417 return ret;
1420 void jffs2_do_clear_inode(struct jffs2_sb_info *c, struct jffs2_inode_info *f)
1422 struct jffs2_full_dirent *fd, *fds;
1423 int deleted;
1425 jffs2_xattr_delete_inode(c, f->inocache);
1426 mutex_lock(&f->sem);
1427 deleted = f->inocache && !f->inocache->pino_nlink;
1429 if (f->inocache && f->inocache->state != INO_STATE_CHECKING)
1430 jffs2_set_inocache_state(c, f->inocache, INO_STATE_CLEARING);
1432 if (f->metadata) {
1433 if (deleted)
1434 jffs2_mark_node_obsolete(c, f->metadata->raw);
1435 jffs2_free_full_dnode(f->metadata);
1438 jffs2_kill_fragtree(&f->fragtree, deleted?c:NULL);
1440 if (f->target) {
1441 kfree(f->target);
1442 f->target = NULL;
1445 fds = f->dents;
1446 while(fds) {
1447 fd = fds;
1448 fds = fd->next;
1449 jffs2_free_full_dirent(fd);
1452 if (f->inocache && f->inocache->state != INO_STATE_CHECKING) {
1453 jffs2_set_inocache_state(c, f->inocache, INO_STATE_CHECKEDABSENT);
1454 if (f->inocache->nodes == (void *)f->inocache)
1455 jffs2_del_ino_cache(c, f->inocache);
1458 mutex_unlock(&f->sem);