2 * Copyright (C) 2005, 2006
3 * Avishay Traeger (avishay@gmail.com)
4 * Copyright (C) 2008, 2009
5 * Boaz Harrosh <bharrosh@panasas.com>
7 * Copyrights for code taken from ext2:
8 * Copyright (C) 1992, 1993, 1994, 1995
9 * Remy Card (card@masi.ibp.fr)
10 * Laboratoire MASI - Institut Blaise Pascal
11 * Universite Pierre et Marie Curie (Paris VI)
13 * linux/fs/minix/inode.c
14 * Copyright (C) 1991, 1992 Linus Torvalds
16 * This file is part of exofs.
18 * exofs is free software; you can redistribute it and/or modify
19 * it under the terms of the GNU General Public License as published by
20 * the Free Software Foundation. Since it is based on ext2, and the only
21 * valid version of GPL for the Linux kernel is version 2, the only valid
22 * version of GPL for exofs is version 2.
24 * exofs is distributed in the hope that it will be useful,
25 * but WITHOUT ANY WARRANTY; without even the implied warranty of
26 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
27 * GNU General Public License for more details.
29 * You should have received a copy of the GNU General Public License
30 * along with exofs; if not, write to the Free Software
31 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
36 static inline unsigned exofs_chunk_size(struct inode
*inode
)
38 return inode
->i_sb
->s_blocksize
;
41 static inline void exofs_put_page(struct page
*page
)
44 page_cache_release(page
);
47 /* Accesses dir's inode->i_size must be called under inode lock */
48 static inline unsigned long dir_pages(struct inode
*inode
)
50 return (inode
->i_size
+ PAGE_CACHE_SIZE
- 1) >> PAGE_CACHE_SHIFT
;
53 static unsigned exofs_last_byte(struct inode
*inode
, unsigned long page_nr
)
55 loff_t last_byte
= inode
->i_size
;
57 last_byte
-= page_nr
<< PAGE_CACHE_SHIFT
;
58 if (last_byte
> PAGE_CACHE_SIZE
)
59 last_byte
= PAGE_CACHE_SIZE
;
63 static int exofs_commit_chunk(struct page
*page
, loff_t pos
, unsigned len
)
65 struct address_space
*mapping
= page
->mapping
;
66 struct inode
*dir
= mapping
->host
;
71 if (!PageUptodate(page
))
72 SetPageUptodate(page
);
74 if (pos
+len
> dir
->i_size
) {
75 i_size_write(dir
, pos
+len
);
76 mark_inode_dirty(dir
);
81 err
= write_one_page(page
, 1);
88 static void exofs_check_page(struct page
*page
)
90 struct inode
*dir
= page
->mapping
->host
;
91 unsigned chunk_size
= exofs_chunk_size(dir
);
92 char *kaddr
= page_address(page
);
93 unsigned offs
, rec_len
;
94 unsigned limit
= PAGE_CACHE_SIZE
;
95 struct exofs_dir_entry
*p
;
98 /* if the page is the last one in the directory */
99 if ((dir
->i_size
>> PAGE_CACHE_SHIFT
) == page
->index
) {
100 limit
= dir
->i_size
& ~PAGE_CACHE_MASK
;
101 if (limit
& (chunk_size
- 1))
106 for (offs
= 0; offs
<= limit
- EXOFS_DIR_REC_LEN(1); offs
+= rec_len
) {
107 p
= (struct exofs_dir_entry
*)(kaddr
+ offs
);
108 rec_len
= le16_to_cpu(p
->rec_len
);
110 if (rec_len
< EXOFS_DIR_REC_LEN(1))
114 if (rec_len
< EXOFS_DIR_REC_LEN(p
->name_len
))
116 if (((offs
+ rec_len
- 1) ^ offs
) & ~(chunk_size
-1))
122 SetPageChecked(page
);
126 EXOFS_ERR("ERROR [exofs_check_page]: "
127 "size of directory #%lu is not a multiple of chunk size",
132 error
= "rec_len is smaller than minimal";
135 error
= "unaligned directory entry";
138 error
= "rec_len is too small for name_len";
141 error
= "directory entry across blocks";
145 "ERROR [exofs_check_page]: bad entry in directory #%lu: %s - "
146 "offset=%lu, inode=%llu, rec_len=%d, name_len=%d",
147 dir
->i_ino
, error
, (page
->index
<<PAGE_CACHE_SHIFT
)+offs
,
148 _LLU(le64_to_cpu(p
->inode_no
)),
149 rec_len
, p
->name_len
);
152 p
= (struct exofs_dir_entry
*)(kaddr
+ offs
);
153 EXOFS_ERR("ERROR [exofs_check_page]: "
154 "entry in directory #%lu spans the page boundary"
155 "offset=%lu, inode=%llu",
156 dir
->i_ino
, (page
->index
<<PAGE_CACHE_SHIFT
)+offs
,
157 _LLU(le64_to_cpu(p
->inode_no
)));
159 SetPageChecked(page
);
163 static struct page
*exofs_get_page(struct inode
*dir
, unsigned long n
)
165 struct address_space
*mapping
= dir
->i_mapping
;
166 struct page
*page
= read_mapping_page(mapping
, n
, NULL
);
170 if (!PageChecked(page
))
171 exofs_check_page(page
);
178 exofs_put_page(page
);
179 return ERR_PTR(-EIO
);
182 static inline int exofs_match(int len
, const unsigned char *name
,
183 struct exofs_dir_entry
*de
)
185 if (len
!= de
->name_len
)
189 return !memcmp(name
, de
->name
, len
);
193 struct exofs_dir_entry
*exofs_next_entry(struct exofs_dir_entry
*p
)
195 return (struct exofs_dir_entry
*)((char *)p
+ le16_to_cpu(p
->rec_len
));
198 static inline unsigned
199 exofs_validate_entry(char *base
, unsigned offset
, unsigned mask
)
201 struct exofs_dir_entry
*de
= (struct exofs_dir_entry
*)(base
+ offset
);
202 struct exofs_dir_entry
*p
=
203 (struct exofs_dir_entry
*)(base
+ (offset
&mask
));
204 while ((char *)p
< (char *)de
) {
207 p
= exofs_next_entry(p
);
209 return (char *)p
- base
;
212 static unsigned char exofs_filetype_table
[EXOFS_FT_MAX
] = {
213 [EXOFS_FT_UNKNOWN
] = DT_UNKNOWN
,
214 [EXOFS_FT_REG_FILE
] = DT_REG
,
215 [EXOFS_FT_DIR
] = DT_DIR
,
216 [EXOFS_FT_CHRDEV
] = DT_CHR
,
217 [EXOFS_FT_BLKDEV
] = DT_BLK
,
218 [EXOFS_FT_FIFO
] = DT_FIFO
,
219 [EXOFS_FT_SOCK
] = DT_SOCK
,
220 [EXOFS_FT_SYMLINK
] = DT_LNK
,
224 static unsigned char exofs_type_by_mode
[S_IFMT
>> S_SHIFT
] = {
225 [S_IFREG
>> S_SHIFT
] = EXOFS_FT_REG_FILE
,
226 [S_IFDIR
>> S_SHIFT
] = EXOFS_FT_DIR
,
227 [S_IFCHR
>> S_SHIFT
] = EXOFS_FT_CHRDEV
,
228 [S_IFBLK
>> S_SHIFT
] = EXOFS_FT_BLKDEV
,
229 [S_IFIFO
>> S_SHIFT
] = EXOFS_FT_FIFO
,
230 [S_IFSOCK
>> S_SHIFT
] = EXOFS_FT_SOCK
,
231 [S_IFLNK
>> S_SHIFT
] = EXOFS_FT_SYMLINK
,
235 void exofs_set_de_type(struct exofs_dir_entry
*de
, struct inode
*inode
)
237 mode_t mode
= inode
->i_mode
;
238 de
->file_type
= exofs_type_by_mode
[(mode
& S_IFMT
) >> S_SHIFT
];
242 exofs_readdir(struct file
*filp
, void *dirent
, filldir_t filldir
)
244 loff_t pos
= filp
->f_pos
;
245 struct inode
*inode
= filp
->f_path
.dentry
->d_inode
;
246 unsigned int offset
= pos
& ~PAGE_CACHE_MASK
;
247 unsigned long n
= pos
>> PAGE_CACHE_SHIFT
;
248 unsigned long npages
= dir_pages(inode
);
249 unsigned chunk_mask
= ~(exofs_chunk_size(inode
)-1);
250 unsigned char *types
= NULL
;
251 int need_revalidate
= (filp
->f_version
!= inode
->i_version
);
253 if (pos
> inode
->i_size
- EXOFS_DIR_REC_LEN(1))
256 types
= exofs_filetype_table
;
258 for ( ; n
< npages
; n
++, offset
= 0) {
260 struct exofs_dir_entry
*de
;
261 struct page
*page
= exofs_get_page(inode
, n
);
267 filp
->f_pos
+= PAGE_CACHE_SIZE
- offset
;
268 return PTR_ERR(page
);
270 kaddr
= page_address(page
);
271 if (unlikely(need_revalidate
)) {
273 offset
= exofs_validate_entry(kaddr
, offset
,
275 filp
->f_pos
= (n
<<PAGE_CACHE_SHIFT
) + offset
;
277 filp
->f_version
= inode
->i_version
;
280 de
= (struct exofs_dir_entry
*)(kaddr
+ offset
);
281 limit
= kaddr
+ exofs_last_byte(inode
, n
) -
282 EXOFS_DIR_REC_LEN(1);
283 for (; (char *)de
<= limit
; de
= exofs_next_entry(de
)) {
284 if (de
->rec_len
== 0) {
286 "zero-length directory entry");
287 exofs_put_page(page
);
292 unsigned char d_type
= DT_UNKNOWN
;
294 if (types
&& de
->file_type
< EXOFS_FT_MAX
)
295 d_type
= types
[de
->file_type
];
297 offset
= (char *)de
- kaddr
;
298 over
= filldir(dirent
, de
->name
, de
->name_len
,
299 (n
<<PAGE_CACHE_SHIFT
) | offset
,
300 le64_to_cpu(de
->inode_no
),
303 exofs_put_page(page
);
307 filp
->f_pos
+= le16_to_cpu(de
->rec_len
);
309 exofs_put_page(page
);
315 struct exofs_dir_entry
*exofs_find_entry(struct inode
*dir
,
316 struct dentry
*dentry
, struct page
**res_page
)
318 const unsigned char *name
= dentry
->d_name
.name
;
319 int namelen
= dentry
->d_name
.len
;
320 unsigned reclen
= EXOFS_DIR_REC_LEN(namelen
);
321 unsigned long start
, n
;
322 unsigned long npages
= dir_pages(dir
);
323 struct page
*page
= NULL
;
324 struct exofs_i_info
*oi
= exofs_i(dir
);
325 struct exofs_dir_entry
*de
;
332 start
= oi
->i_dir_start_lookup
;
338 page
= exofs_get_page(dir
, n
);
340 kaddr
= page_address(page
);
341 de
= (struct exofs_dir_entry
*) kaddr
;
342 kaddr
+= exofs_last_byte(dir
, n
) - reclen
;
343 while ((char *) de
<= kaddr
) {
344 if (de
->rec_len
== 0) {
346 "ERROR: exofs_find_entry: "
347 "zero-length directory entry");
348 exofs_put_page(page
);
351 if (exofs_match(namelen
, name
, de
))
353 de
= exofs_next_entry(de
);
355 exofs_put_page(page
);
359 } while (n
!= start
);
365 oi
->i_dir_start_lookup
= n
;
369 struct exofs_dir_entry
*exofs_dotdot(struct inode
*dir
, struct page
**p
)
371 struct page
*page
= exofs_get_page(dir
, 0);
372 struct exofs_dir_entry
*de
= NULL
;
375 de
= exofs_next_entry(
376 (struct exofs_dir_entry
*)page_address(page
));
382 ino_t
exofs_parent_ino(struct dentry
*child
)
385 struct exofs_dir_entry
*de
;
388 de
= exofs_dotdot(child
->d_inode
, &page
);
392 ino
= le64_to_cpu(de
->inode_no
);
393 exofs_put_page(page
);
397 ino_t
exofs_inode_by_name(struct inode
*dir
, struct dentry
*dentry
)
400 struct exofs_dir_entry
*de
;
403 de
= exofs_find_entry(dir
, dentry
, &page
);
405 res
= le64_to_cpu(de
->inode_no
);
406 exofs_put_page(page
);
411 int exofs_set_link(struct inode
*dir
, struct exofs_dir_entry
*de
,
412 struct page
*page
, struct inode
*inode
)
414 loff_t pos
= page_offset(page
) +
415 (char *) de
- (char *) page_address(page
);
416 unsigned len
= le16_to_cpu(de
->rec_len
);
420 err
= exofs_write_begin(NULL
, page
->mapping
, pos
, len
,
421 AOP_FLAG_UNINTERRUPTIBLE
, &page
, NULL
);
423 EXOFS_ERR("exofs_set_link: exofs_write_begin FAILED => %d\n",
426 de
->inode_no
= cpu_to_le64(inode
->i_ino
);
427 exofs_set_de_type(de
, inode
);
429 err
= exofs_commit_chunk(page
, pos
, len
);
430 exofs_put_page(page
);
431 dir
->i_mtime
= dir
->i_ctime
= CURRENT_TIME
;
432 mark_inode_dirty(dir
);
436 int exofs_add_link(struct dentry
*dentry
, struct inode
*inode
)
438 struct inode
*dir
= dentry
->d_parent
->d_inode
;
439 const unsigned char *name
= dentry
->d_name
.name
;
440 int namelen
= dentry
->d_name
.len
;
441 unsigned chunk_size
= exofs_chunk_size(dir
);
442 unsigned reclen
= EXOFS_DIR_REC_LEN(namelen
);
443 unsigned short rec_len
, name_len
;
444 struct page
*page
= NULL
;
445 struct exofs_sb_info
*sbi
= inode
->i_sb
->s_fs_info
;
446 struct exofs_dir_entry
*de
;
447 unsigned long npages
= dir_pages(dir
);
453 for (n
= 0; n
<= npages
; n
++) {
456 page
= exofs_get_page(dir
, n
);
461 kaddr
= page_address(page
);
462 dir_end
= kaddr
+ exofs_last_byte(dir
, n
);
463 de
= (struct exofs_dir_entry
*)kaddr
;
464 kaddr
+= PAGE_CACHE_SIZE
- reclen
;
465 while ((char *)de
<= kaddr
) {
466 if ((char *)de
== dir_end
) {
468 rec_len
= chunk_size
;
469 de
->rec_len
= cpu_to_le16(chunk_size
);
473 if (de
->rec_len
== 0) {
474 EXOFS_ERR("ERROR: exofs_add_link: "
475 "zero-length directory entry");
480 if (exofs_match(namelen
, name
, de
))
482 name_len
= EXOFS_DIR_REC_LEN(de
->name_len
);
483 rec_len
= le16_to_cpu(de
->rec_len
);
484 if (!de
->inode_no
&& rec_len
>= reclen
)
486 if (rec_len
>= name_len
+ reclen
)
488 de
= (struct exofs_dir_entry
*) ((char *) de
+ rec_len
);
491 exofs_put_page(page
);
494 EXOFS_ERR("exofs_add_link: BAD dentry=%p or inode=%p", dentry
, inode
);
498 pos
= page_offset(page
) +
499 (char *)de
- (char *)page_address(page
);
500 err
= exofs_write_begin(NULL
, page
->mapping
, pos
, rec_len
, 0,
505 struct exofs_dir_entry
*de1
=
506 (struct exofs_dir_entry
*)((char *)de
+ name_len
);
507 de1
->rec_len
= cpu_to_le16(rec_len
- name_len
);
508 de
->rec_len
= cpu_to_le16(name_len
);
511 de
->name_len
= namelen
;
512 memcpy(de
->name
, name
, namelen
);
513 de
->inode_no
= cpu_to_le64(inode
->i_ino
);
514 exofs_set_de_type(de
, inode
);
515 err
= exofs_commit_chunk(page
, pos
, rec_len
);
516 dir
->i_mtime
= dir
->i_ctime
= CURRENT_TIME
;
517 mark_inode_dirty(dir
);
521 exofs_put_page(page
);
529 int exofs_delete_entry(struct exofs_dir_entry
*dir
, struct page
*page
)
531 struct address_space
*mapping
= page
->mapping
;
532 struct inode
*inode
= mapping
->host
;
533 struct exofs_sb_info
*sbi
= inode
->i_sb
->s_fs_info
;
534 char *kaddr
= page_address(page
);
535 unsigned from
= ((char *)dir
- kaddr
) & ~(exofs_chunk_size(inode
)-1);
536 unsigned to
= ((char *)dir
- kaddr
) + le16_to_cpu(dir
->rec_len
);
538 struct exofs_dir_entry
*pde
= NULL
;
539 struct exofs_dir_entry
*de
= (struct exofs_dir_entry
*) (kaddr
+ from
);
543 if (de
->rec_len
== 0) {
544 EXOFS_ERR("ERROR: exofs_delete_entry:"
545 "zero-length directory entry");
550 de
= exofs_next_entry(de
);
553 from
= (char *)pde
- (char *)page_address(page
);
554 pos
= page_offset(page
) + from
;
556 err
= exofs_write_begin(NULL
, page
->mapping
, pos
, to
- from
, 0,
559 EXOFS_ERR("exofs_delete_entry: exofs_write_begin FAILED => %d\n",
562 pde
->rec_len
= cpu_to_le16(to
- from
);
565 err
= exofs_commit_chunk(page
, pos
, to
- from
);
566 inode
->i_ctime
= inode
->i_mtime
= CURRENT_TIME
;
567 mark_inode_dirty(inode
);
570 exofs_put_page(page
);
574 /* kept aligned on 4 bytes */
575 #define THIS_DIR ".\0\0"
576 #define PARENT_DIR "..\0"
578 int exofs_make_empty(struct inode
*inode
, struct inode
*parent
)
580 struct address_space
*mapping
= inode
->i_mapping
;
581 struct page
*page
= grab_cache_page(mapping
, 0);
582 unsigned chunk_size
= exofs_chunk_size(inode
);
583 struct exofs_dir_entry
*de
;
590 err
= exofs_write_begin(NULL
, page
->mapping
, 0, chunk_size
, 0,
597 kaddr
= kmap_atomic(page
, KM_USER0
);
598 de
= (struct exofs_dir_entry
*)kaddr
;
600 de
->rec_len
= cpu_to_le16(EXOFS_DIR_REC_LEN(1));
601 memcpy(de
->name
, THIS_DIR
, sizeof(THIS_DIR
));
602 de
->inode_no
= cpu_to_le64(inode
->i_ino
);
603 exofs_set_de_type(de
, inode
);
605 de
= (struct exofs_dir_entry
*)(kaddr
+ EXOFS_DIR_REC_LEN(1));
607 de
->rec_len
= cpu_to_le16(chunk_size
- EXOFS_DIR_REC_LEN(1));
608 de
->inode_no
= cpu_to_le64(parent
->i_ino
);
609 memcpy(de
->name
, PARENT_DIR
, sizeof(PARENT_DIR
));
610 exofs_set_de_type(de
, inode
);
611 kunmap_atomic(kaddr
, KM_USER0
);
612 err
= exofs_commit_chunk(page
, 0, chunk_size
);
614 page_cache_release(page
);
618 int exofs_empty_dir(struct inode
*inode
)
620 struct page
*page
= NULL
;
621 unsigned long i
, npages
= dir_pages(inode
);
623 for (i
= 0; i
< npages
; i
++) {
625 struct exofs_dir_entry
*de
;
626 page
= exofs_get_page(inode
, i
);
631 kaddr
= page_address(page
);
632 de
= (struct exofs_dir_entry
*)kaddr
;
633 kaddr
+= exofs_last_byte(inode
, i
) - EXOFS_DIR_REC_LEN(1);
635 while ((char *)de
<= kaddr
) {
636 if (de
->rec_len
== 0) {
637 EXOFS_ERR("ERROR: exofs_empty_dir: "
638 "zero-length directory entry"
639 "kaddr=%p, de=%p\n", kaddr
, de
);
642 if (de
->inode_no
!= 0) {
643 /* check for . and .. */
644 if (de
->name
[0] != '.')
646 if (de
->name_len
> 2)
648 if (de
->name_len
< 2) {
649 if (le64_to_cpu(de
->inode_no
) !=
652 } else if (de
->name
[1] != '.')
655 de
= exofs_next_entry(de
);
657 exofs_put_page(page
);
662 exofs_put_page(page
);
666 const struct file_operations exofs_dir_operations
= {
667 .llseek
= generic_file_llseek
,
668 .read
= generic_read_dir
,
669 .readdir
= exofs_readdir
,