1 /* $NetBSD: ext2fs_vfsops.c,v 1.151 2009/10/19 18:41:17 bouyer Exp $ */
4 * Copyright (c) 1989, 1991, 1993, 1994
5 * The Regents of the University of California. All rights reserved.
7 * Redistribution and use in source and binary forms, with or without
8 * modification, are permitted provided that the following conditions
10 * 1. Redistributions of source code must retain the above copyright
11 * notice, this list of conditions and the following disclaimer.
12 * 2. Redistributions in binary form must reproduce the above copyright
13 * notice, this list of conditions and the following disclaimer in the
14 * documentation and/or other materials provided with the distribution.
15 * 3. Neither the name of the University nor the names of its contributors
16 * may be used to endorse or promote products derived from this software
17 * without specific prior written permission.
19 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
20 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
21 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
22 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
23 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
24 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
25 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
26 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
27 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
28 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
31 * @(#)ffs_vfsops.c 8.14 (Berkeley) 11/28/94
32 * Modified for ext2fs by Manuel Bouyer.
36 * Copyright (c) 1997 Manuel Bouyer.
38 * Redistribution and use in source and binary forms, with or without
39 * modification, are permitted provided that the following conditions
41 * 1. Redistributions of source code must retain the above copyright
42 * notice, this list of conditions and the following disclaimer.
43 * 2. Redistributions in binary form must reproduce the above copyright
44 * notice, this list of conditions and the following disclaimer in the
45 * documentation and/or other materials provided with the distribution.
47 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
48 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
49 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
50 * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
51 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
52 * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
53 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
54 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
55 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
56 * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
58 * @(#)ffs_vfsops.c 8.14 (Berkeley) 11/28/94
59 * Modified for ext2fs by Manuel Bouyer.
62 #include <sys/cdefs.h>
63 __KERNEL_RCSID(0, "$NetBSD: ext2fs_vfsops.c,v 1.151 2009/10/19 18:41:17 bouyer Exp $");
65 #if defined(_KERNEL_OPT)
66 #include "opt_compat_netbsd.h"
69 #include <sys/param.h>
70 #include <sys/systm.h>
71 #include <sys/sysctl.h>
72 #include <sys/namei.h>
74 #include <sys/kernel.h>
75 #include <sys/vnode.h>
76 #include <sys/socket.h>
77 #include <sys/mount.h>
79 #include <sys/device.h>
82 #include <sys/disklabel.h>
83 #include <sys/ioctl.h>
84 #include <sys/errno.h>
85 #include <sys/malloc.h>
89 #include <sys/kauth.h>
90 #include <sys/module.h>
92 #include <miscfs/genfs/genfs.h>
93 #include <miscfs/specfs/specdev.h>
95 #include <ufs/ufs/quota.h>
96 #include <ufs/ufs/ufsmount.h>
97 #include <ufs/ufs/inode.h>
98 #include <ufs/ufs/dir.h>
99 #include <ufs/ufs/ufs_extern.h>
101 #include <ufs/ext2fs/ext2fs.h>
102 #include <ufs/ext2fs/ext2fs_dir.h>
103 #include <ufs/ext2fs/ext2fs_extern.h>
105 MODULE(MODULE_CLASS_VFS
, ext2fs
, "ffs");
107 int ext2fs_sbupdate(struct ufsmount
*, int);
108 static int ext2fs_checksb(struct ext2fs
*, int);
110 static struct sysctllog
*ext2fs_sysctl_log
;
112 extern const struct vnodeopv_desc ext2fs_vnodeop_opv_desc
;
113 extern const struct vnodeopv_desc ext2fs_specop_opv_desc
;
114 extern const struct vnodeopv_desc ext2fs_fifoop_opv_desc
;
116 const struct vnodeopv_desc
* const ext2fs_vnodeopv_descs
[] = {
117 &ext2fs_vnodeop_opv_desc
,
118 &ext2fs_specop_opv_desc
,
119 &ext2fs_fifoop_opv_desc
,
123 struct vfsops ext2fs_vfsops
= {
125 sizeof (struct ufs_args
),
140 (int (*)(struct mount
*, struct vnode
*, struct timespec
*)) eopnotsupp
,
142 (void *)eopnotsupp
, /* vfs_suspendctl */
143 genfs_renamelock_enter
,
144 genfs_renamelock_exit
,
146 ext2fs_vnodeopv_descs
,
151 static const struct genfs_ops ext2fs_genfsops
= {
152 .gop_size
= genfs_size
,
153 .gop_alloc
= ext2fs_gop_alloc
,
154 .gop_write
= genfs_gop_write
,
155 .gop_markupdate
= ufs_gop_markupdate
,
158 static const struct ufs_ops ext2fs_ufsops
= {
159 .uo_itimes
= ext2fs_itimes
,
160 .uo_update
= ext2fs_update
,
161 .uo_vfree
= ext2fs_vfree
,
162 .uo_unmark_vnode
= (void (*)(vnode_t
*))nullop
,
165 /* Fill in the inode uid/gid from ext2 halves. */
167 ext2fs_set_inode_guid(struct inode
*ip
)
170 ip
->i_gid
= ip
->i_e2fs_gid
;
171 ip
->i_uid
= ip
->i_e2fs_uid
;
172 if (ip
->i_e2fs
->e2fs
.e2fs_rev
> E2FS_REV0
) {
173 ip
->i_gid
|= ip
->i_e2fs_gid_high
<< 16;
174 ip
->i_uid
|= ip
->i_e2fs_uid_high
<< 16;
179 ext2fs_modcmd(modcmd_t cmd
, void *arg
)
184 case MODULE_CMD_INIT
:
185 error
= vfs_attach(&ext2fs_vfsops
);
188 sysctl_createv(&ext2fs_sysctl_log
, 0, NULL
, NULL
,
190 CTLTYPE_NODE
, "vfs", NULL
,
193 sysctl_createv(&ext2fs_sysctl_log
, 0, NULL
, NULL
,
195 CTLTYPE_NODE
, "ext2fs",
196 SYSCTL_DESCR("Linux EXT2FS file system"),
198 CTL_VFS
, 17, CTL_EOL
);
200 * XXX the "17" above could be dynamic, thereby eliminating
201 * one more instance of the "number to vfs" mapping problem,
202 * but "17" is the order as taken from sys/mount.h
205 case MODULE_CMD_FINI
:
206 error
= vfs_detach(&ext2fs_vfsops
);
209 sysctl_teardown(&ext2fs_sysctl_log
);
220 * XXX Same structure as FFS inodes? Should we share a common pool?
222 struct pool ext2fs_inode_pool
;
223 struct pool ext2fs_dinode_pool
;
225 extern u_long ext2gennumber
;
231 pool_init(&ext2fs_inode_pool
, sizeof(struct inode
), 0, 0, 0,
232 "ext2fsinopl", &pool_allocator_nointr
, IPL_NONE
);
233 pool_init(&ext2fs_dinode_pool
, sizeof(struct ext2fs_dinode
), 0, 0, 0,
234 "ext2dinopl", &pool_allocator_nointr
, IPL_NONE
);
249 pool_destroy(&ext2fs_inode_pool
);
250 pool_destroy(&ext2fs_dinode_pool
);
254 * Called by main() when ext2fs is going to be mounted as root.
256 * Name is updated by mount(8) after booting.
258 #define ROOTNAME "root_device"
261 ext2fs_mountroot(void)
263 extern struct vnode
*rootvp
;
266 struct ufsmount
*ump
;
269 if (device_class(root_device
) != DV_DISK
)
272 if ((error
= vfs_rootmountalloc(MOUNT_EXT2FS
, "root_device", &mp
))) {
277 if ((error
= ext2fs_mountfs(rootvp
, mp
)) != 0) {
278 vfs_unbusy(mp
, false, NULL
);
282 mutex_enter(&mountlist_lock
);
283 CIRCLEQ_INSERT_TAIL(&mountlist
, mp
, mnt_list
);
284 mutex_exit(&mountlist_lock
);
287 memset(fs
->e2fs_fsmnt
, 0, sizeof(fs
->e2fs_fsmnt
));
288 (void) copystr(mp
->mnt_stat
.f_mntonname
, fs
->e2fs_fsmnt
,
289 sizeof(fs
->e2fs_fsmnt
) - 1, 0);
290 if (fs
->e2fs
.e2fs_rev
> E2FS_REV0
) {
291 memset(fs
->e2fs
.e2fs_fsmnt
, 0, sizeof(fs
->e2fs
.e2fs_fsmnt
));
292 (void) copystr(mp
->mnt_stat
.f_mntonname
, fs
->e2fs
.e2fs_fsmnt
,
293 sizeof(fs
->e2fs
.e2fs_fsmnt
) - 1, 0);
295 (void)ext2fs_statvfs(mp
, &mp
->mnt_stat
);
296 vfs_unbusy(mp
, false, NULL
);
297 setrootfstime((time_t)fs
->e2fs
.e2fs_wtime
);
307 ext2fs_mount(struct mount
*mp
, const char *path
, void *data
, size_t *data_len
)
309 struct lwp
*l
= curlwp
;
311 struct ufs_args
*args
= data
;
312 struct ufsmount
*ump
= NULL
;
315 int error
= 0, flags
, update
;
318 if (*data_len
< sizeof *args
)
321 if (mp
->mnt_flag
& MNT_GETARGS
) {
325 memset(args
, 0, sizeof *args
);
327 *data_len
= sizeof *args
;
331 update
= mp
->mnt_flag
& MNT_UPDATE
;
333 /* Check arguments */
334 if (args
->fspec
!= NULL
) {
336 * Look up the name and verify that it's sane.
338 error
= namei_simple_user(args
->fspec
,
339 NSM_FOLLOW_NOEMULROOT
, &devvp
);
345 * Be sure this is a valid block device
347 if (devvp
->v_type
!= VBLK
)
349 else if (bdevsw_lookup(devvp
->v_rdev
) == NULL
)
353 * Be sure we're still naming the same device
354 * used for our initial mount
357 if (devvp
!= ump
->um_devvp
) {
358 if (devvp
->v_rdev
!= ump
->um_devvp
->v_rdev
)
362 devvp
= ump
->um_devvp
;
369 /* New mounts must have a filename for the device */
373 devvp
= ump
->um_devvp
;
379 * If mount by non-root, then verify that user has necessary
380 * permissions on the device.
382 * Permission to update a mount is checked higher, so here we presume
383 * updating the mount is okay (for example, as far as securelevel goes)
384 * which leaves us with the normal check.
389 (mp
->mnt_iflag
& IMNT_WANTRDWR
) != 0 :
390 (mp
->mnt_flag
& MNT_RDONLY
) == 0)
391 accessmode
|= VWRITE
;
392 vn_lock(devvp
, LK_EXCLUSIVE
| LK_RETRY
);
393 error
= genfs_can_mount(devvp
, accessmode
, l
->l_cred
);
394 VOP_UNLOCK(devvp
, 0);
405 if (mp
->mnt_flag
& MNT_RDONLY
)
408 xflags
= FREAD
|FWRITE
;
409 error
= VOP_OPEN(devvp
, xflags
, FSCRED
);
412 error
= ext2fs_mountfs(devvp
, mp
);
414 vn_lock(devvp
, LK_EXCLUSIVE
| LK_RETRY
);
415 (void)VOP_CLOSE(devvp
, xflags
, NOCRED
);
416 VOP_UNLOCK(devvp
, 0);
428 * The initial mount got a reference on this
429 * device, so drop the one obtained via
436 if (fs
->e2fs_ronly
== 0 && (mp
->mnt_flag
& MNT_RDONLY
)) {
438 * Changing from r/w to r/o
441 if (mp
->mnt_flag
& MNT_FORCE
)
443 error
= ext2fs_flushfiles(mp
, flags
);
445 ext2fs_cgupdate(ump
, MNT_WAIT
) == 0 &&
446 (fs
->e2fs
.e2fs_state
& E2FS_ERRORS
) == 0) {
447 fs
->e2fs
.e2fs_state
= E2FS_ISCLEAN
;
448 (void) ext2fs_sbupdate(ump
, MNT_WAIT
);
455 if (mp
->mnt_flag
& MNT_RELOAD
) {
456 error
= ext2fs_reload(mp
, l
->l_cred
, l
);
461 if (fs
->e2fs_ronly
&& (mp
->mnt_iflag
& IMNT_WANTRDWR
)) {
463 * Changing from read-only to read/write
466 if (fs
->e2fs
.e2fs_state
== E2FS_ISCLEAN
)
467 fs
->e2fs
.e2fs_state
= 0;
469 fs
->e2fs
.e2fs_state
= E2FS_ERRORS
;
472 if (args
->fspec
== NULL
)
476 error
= set_statvfs_info(path
, UIO_USERSPACE
, args
->fspec
,
477 UIO_USERSPACE
, mp
->mnt_op
->vfs_name
, mp
, l
);
478 (void) copystr(mp
->mnt_stat
.f_mntonname
, fs
->e2fs_fsmnt
,
479 sizeof(fs
->e2fs_fsmnt
) - 1, &size
);
480 memset(fs
->e2fs_fsmnt
+ size
, 0, sizeof(fs
->e2fs_fsmnt
) - size
);
481 if (fs
->e2fs
.e2fs_rev
> E2FS_REV0
) {
482 (void) copystr(mp
->mnt_stat
.f_mntonname
, fs
->e2fs
.e2fs_fsmnt
,
483 sizeof(fs
->e2fs
.e2fs_fsmnt
) - 1, &size
);
484 memset(fs
->e2fs
.e2fs_fsmnt
, 0,
485 sizeof(fs
->e2fs
.e2fs_fsmnt
) - size
);
487 if (fs
->e2fs_fmod
!= 0) { /* XXX */
489 if (fs
->e2fs
.e2fs_state
== 0)
490 fs
->e2fs
.e2fs_wtime
= time_second
;
492 printf("%s: file system not clean; please fsck(8)\n",
493 mp
->mnt_stat
.f_mntfromname
);
494 (void) ext2fs_cgupdate(ump
, MNT_WAIT
);
504 * Reload all incore data for a filesystem (used after running fsck on
505 * the root filesystem and finding things to fix). The filesystem must
506 * be mounted read-only.
508 * Things to do to update the mount:
509 * 1) invalidate all cached meta-data.
510 * 2) re-read superblock from disk.
511 * 3) re-read summary information from disk.
512 * 4) invalidate all inactive vnodes.
513 * 5) invalidate all cached file data.
514 * 6) re-read inode data for all active vnodes.
517 ext2fs_reload(struct mount
*mp
, kauth_cred_t cred
, struct lwp
*l
)
519 struct vnode
*vp
, *mvp
, *devvp
;
523 struct ext2fs
*newfs
;
524 struct partinfo dpart
;
527 struct ufsmount
*ump
;
529 if ((mp
->mnt_flag
& MNT_RDONLY
) == 0)
534 * Step 1: invalidate all cached meta-data.
536 devvp
= ump
->um_devvp
;
537 vn_lock(devvp
, LK_EXCLUSIVE
| LK_RETRY
);
538 error
= vinvalbuf(devvp
, 0, cred
, l
, 0, 0);
539 VOP_UNLOCK(devvp
, 0);
541 panic("ext2fs_reload: dirty1");
543 * Step 2: re-read superblock from disk.
545 if (VOP_IOCTL(devvp
, DIOCGPART
, &dpart
, FREAD
, NOCRED
) != 0)
548 size
= dpart
.disklab
->d_secsize
;
549 error
= bread(devvp
, (daddr_t
)(SBOFF
/ size
), SBSIZE
, NOCRED
, 0, &bp
);
554 newfs
= (struct ext2fs
*)bp
->b_data
;
555 error
= ext2fs_checksb(newfs
, (mp
->mnt_flag
& MNT_RDONLY
) != 0);
563 * copy in new superblock, and compute in-memory values
565 e2fs_sbload(newfs
, &fs
->e2fs
);
567 howmany(fs
->e2fs
.e2fs_bcount
- fs
->e2fs
.e2fs_first_dblock
,
569 /* XXX assume hw bsize = 512 */
570 fs
->e2fs_fsbtodb
= fs
->e2fs
.e2fs_log_bsize
+ 1;
571 fs
->e2fs_bsize
= MINBSIZE
<< fs
->e2fs
.e2fs_log_bsize
;
572 fs
->e2fs_bshift
= LOG_MINBSIZE
+ fs
->e2fs
.e2fs_log_bsize
;
573 fs
->e2fs_qbmask
= fs
->e2fs_bsize
- 1;
574 fs
->e2fs_bmask
= ~fs
->e2fs_qbmask
;
576 howmany(fs
->e2fs_ncg
, fs
->e2fs_bsize
/ sizeof(struct ext2_gd
));
577 fs
->e2fs_ipb
= fs
->e2fs_bsize
/ EXT2_DINODE_SIZE(fs
);
578 fs
->e2fs_itpg
= fs
->e2fs
.e2fs_ipg
/ fs
->e2fs_ipb
;
582 * Step 3: re-read summary information from disk.
585 for (i
= 0; i
< fs
->e2fs_ngdb
; i
++) {
586 error
= bread(devvp
,
587 fsbtodb(fs
, fs
->e2fs
.e2fs_first_dblock
+
588 1 /* superblock */ + i
),
589 fs
->e2fs_bsize
, NOCRED
, 0, &bp
);
594 e2fs_cgload((struct ext2_gd
*)bp
->b_data
,
595 &fs
->e2fs_gd
[i
* fs
->e2fs_bsize
/ sizeof(struct ext2_gd
)],
600 /* Allocate a marker vnode. */
601 if ((mvp
= vnalloc(mp
)) == NULL
)
604 * NOTE: not using the TAILQ_FOREACH here since in this loop vgone()
605 * and vclean() can be called indirectly
607 mutex_enter(&mntvnode_lock
);
609 for (vp
= TAILQ_FIRST(&mp
->mnt_vnodelist
); vp
; vp
= vunmark(mvp
)) {
611 if (vp
->v_mount
!= mp
|| vismarker(vp
))
614 * Step 4: invalidate all inactive vnodes.
616 if (vrecycle(vp
, &mntvnode_lock
, l
)) {
617 mutex_enter(&mntvnode_lock
);
622 * Step 5: invalidate all cached file data.
624 mutex_enter(&vp
->v_interlock
);
625 mutex_exit(&mntvnode_lock
);
626 if (vget(vp
, LK_EXCLUSIVE
| LK_INTERLOCK
)) {
627 mutex_enter(&mntvnode_lock
);
631 if (vinvalbuf(vp
, 0, cred
, l
, 0, 0))
632 panic("ext2fs_reload: dirty2");
634 * Step 6: re-read inode data for all active vnodes.
637 error
= bread(devvp
, fsbtodb(fs
, ino_to_fsba(fs
, ip
->i_number
)),
638 (int)fs
->e2fs_bsize
, NOCRED
, 0, &bp
);
641 mutex_enter(&mntvnode_lock
);
645 cp
= (char *)bp
->b_data
+
646 (ino_to_fsbo(fs
, ip
->i_number
) * EXT2_DINODE_SIZE(fs
));
647 e2fs_iload((struct ext2fs_dinode
*)cp
, ip
->i_din
.e2fs_din
);
648 ext2fs_set_inode_guid(ip
);
651 mutex_enter(&mntvnode_lock
);
653 mutex_exit(&mntvnode_lock
);
659 * Common code for mount and mountroot
662 ext2fs_mountfs(struct vnode
*devvp
, struct mount
*mp
)
664 struct lwp
*l
= curlwp
;
665 struct ufsmount
*ump
;
668 struct m_ext2fs
*m_fs
;
670 struct partinfo dpart
;
671 int error
, i
, size
, ronly
;
676 p
= l
? l
->l_proc
: NULL
;
677 cred
= l
? l
->l_cred
: NOCRED
;
679 /* Flush out any old buffers remaining from a previous use. */
680 vn_lock(devvp
, LK_EXCLUSIVE
| LK_RETRY
);
681 error
= vinvalbuf(devvp
, V_SAVE
, cred
, l
, 0, 0);
682 VOP_UNLOCK(devvp
, 0);
686 ronly
= (mp
->mnt_flag
& MNT_RDONLY
) != 0;
687 if (VOP_IOCTL(devvp
, DIOCGPART
, &dpart
, FREAD
, cred
) != 0)
690 size
= dpart
.disklab
->d_secsize
;
696 printf("ext2 sb size: %d\n", sizeof(struct ext2fs
));
698 error
= bread(devvp
, (SBOFF
/ size
), SBSIZE
, cred
, 0, &bp
);
701 fs
= (struct ext2fs
*)bp
->b_data
;
702 error
= ext2fs_checksb(fs
, ronly
);
705 ump
= malloc(sizeof(*ump
), M_UFSMNT
, M_WAITOK
);
706 memset(ump
, 0, sizeof(*ump
));
707 ump
->um_fstype
= UFS1
;
708 ump
->um_ops
= &ext2fs_ufsops
;
709 ump
->um_e2fs
= malloc(sizeof(struct m_ext2fs
), M_UFSMNT
, M_WAITOK
);
710 memset(ump
->um_e2fs
, 0, sizeof(struct m_ext2fs
));
711 e2fs_sbload((struct ext2fs
*)bp
->b_data
, &ump
->um_e2fs
->e2fs
);
715 m_fs
->e2fs_ronly
= ronly
;
718 printf("ext2 ino size %d\n", EXT2_DINODE_SIZE(m_fs
));
721 if (m_fs
->e2fs
.e2fs_state
== E2FS_ISCLEAN
)
722 m_fs
->e2fs
.e2fs_state
= 0;
724 m_fs
->e2fs
.e2fs_state
= E2FS_ERRORS
;
728 /* compute dynamic sb infos */
730 howmany(m_fs
->e2fs
.e2fs_bcount
- m_fs
->e2fs
.e2fs_first_dblock
,
731 m_fs
->e2fs
.e2fs_bpg
);
732 /* XXX assume hw bsize = 512 */
733 m_fs
->e2fs_fsbtodb
= m_fs
->e2fs
.e2fs_log_bsize
+ 1;
734 m_fs
->e2fs_bsize
= MINBSIZE
<< m_fs
->e2fs
.e2fs_log_bsize
;
735 m_fs
->e2fs_bshift
= LOG_MINBSIZE
+ m_fs
->e2fs
.e2fs_log_bsize
;
736 m_fs
->e2fs_qbmask
= m_fs
->e2fs_bsize
- 1;
737 m_fs
->e2fs_bmask
= ~m_fs
->e2fs_qbmask
;
739 howmany(m_fs
->e2fs_ncg
, m_fs
->e2fs_bsize
/ sizeof(struct ext2_gd
));
740 m_fs
->e2fs_ipb
= m_fs
->e2fs_bsize
/ EXT2_DINODE_SIZE(m_fs
);
741 m_fs
->e2fs_itpg
= m_fs
->e2fs
.e2fs_ipg
/ m_fs
->e2fs_ipb
;
743 m_fs
->e2fs_gd
= malloc(m_fs
->e2fs_ngdb
* m_fs
->e2fs_bsize
,
745 for (i
= 0; i
< m_fs
->e2fs_ngdb
; i
++) {
746 error
= bread(devvp
,
747 fsbtodb(m_fs
, m_fs
->e2fs
.e2fs_first_dblock
+
748 1 /* superblock */ + i
),
749 m_fs
->e2fs_bsize
, NOCRED
, 0, &bp
);
751 free(m_fs
->e2fs_gd
, M_UFSMNT
);
754 e2fs_cgload((struct ext2_gd
*)bp
->b_data
,
756 i
* m_fs
->e2fs_bsize
/ sizeof(struct ext2_gd
)],
763 mp
->mnt_stat
.f_fsidx
.__fsid_val
[0] = (long)dev
;
764 mp
->mnt_stat
.f_fsidx
.__fsid_val
[1] = makefstype(MOUNT_EXT2FS
);
765 mp
->mnt_stat
.f_fsid
= mp
->mnt_stat
.f_fsidx
.__fsid_val
[0];
766 mp
->mnt_stat
.f_namemax
= EXT2FS_MAXNAMLEN
;
767 mp
->mnt_flag
|= MNT_LOCAL
;
768 mp
->mnt_dev_bshift
= DEV_BSHIFT
; /* XXX */
769 mp
->mnt_fs_bshift
= m_fs
->e2fs_bshift
;
770 mp
->mnt_iflag
|= IMNT_DTYPE
;
774 ump
->um_devvp
= devvp
;
775 ump
->um_nindir
= NINDIR(m_fs
);
776 ump
->um_lognindir
= ffs(NINDIR(m_fs
)) - 1;
777 ump
->um_bptrtodb
= m_fs
->e2fs_fsbtodb
;
778 ump
->um_seqinc
= 1; /* no frags */
779 ump
->um_maxsymlinklen
= EXT2_MAXSYMLINKLEN
;
780 ump
->um_dirblksiz
= m_fs
->e2fs_bsize
;
781 ump
->um_maxfilesize
= ((uint64_t)0x80000000 * m_fs
->e2fs_bsize
- 1);
782 devvp
->v_specmountpoint
= mp
;
789 free(ump
->um_e2fs
, M_UFSMNT
);
797 * unmount system call
800 ext2fs_unmount(struct mount
*mp
, int mntflags
)
802 struct ufsmount
*ump
;
807 if (mntflags
& MNT_FORCE
)
809 if ((error
= ext2fs_flushfiles(mp
, flags
)) != 0)
813 if (fs
->e2fs_ronly
== 0 &&
814 ext2fs_cgupdate(ump
, MNT_WAIT
) == 0 &&
815 (fs
->e2fs
.e2fs_state
& E2FS_ERRORS
) == 0) {
816 fs
->e2fs
.e2fs_state
= E2FS_ISCLEAN
;
817 (void) ext2fs_sbupdate(ump
, MNT_WAIT
);
819 if (ump
->um_devvp
->v_type
!= VBAD
)
820 ump
->um_devvp
->v_specmountpoint
= NULL
;
821 vn_lock(ump
->um_devvp
, LK_EXCLUSIVE
| LK_RETRY
);
822 error
= VOP_CLOSE(ump
->um_devvp
, fs
->e2fs_ronly
? FREAD
: FREAD
|FWRITE
,
825 free(fs
->e2fs_gd
, M_UFSMNT
);
829 mp
->mnt_flag
&= ~MNT_LOCAL
;
834 * Flush out all the files in a filesystem.
837 ext2fs_flushfiles(struct mount
*mp
, int flags
)
843 flags
&= ~FORCECLOSE
;
844 error
= vflush(mp
, NULLVP
, flags
);
849 * Get file system statistics.
852 ext2fs_statvfs(struct mount
*mp
, struct statvfs
*sbp
)
854 struct ufsmount
*ump
;
856 uint32_t overhead
, overhead_per_group
, ngdb
;
861 if (fs
->e2fs
.e2fs_magic
!= E2FS_MAGIC
)
862 panic("ext2fs_statvfs");
865 * Compute the overhead (FS structures)
868 1 /* block bitmap */ +
869 1 /* inode bitmap */ +
871 overhead
= fs
->e2fs
.e2fs_first_dblock
+
872 fs
->e2fs_ncg
* overhead_per_group
;
873 if (fs
->e2fs
.e2fs_rev
> E2FS_REV0
&&
874 fs
->e2fs
.e2fs_features_rocompat
& EXT2F_ROCOMPAT_SPARSESUPER
) {
875 for (i
= 0, ngroups
= 0; i
< fs
->e2fs_ncg
; i
++) {
880 ngroups
= fs
->e2fs_ncg
;
882 ngdb
= fs
->e2fs_ngdb
;
883 if (fs
->e2fs
.e2fs_rev
> E2FS_REV0
&&
884 fs
->e2fs
.e2fs_features_compat
& EXT2F_COMPAT_RESIZE
)
885 ngdb
+= fs
->e2fs
.e2fs_reserved_ngdb
;
886 overhead
+= ngroups
* (1 /* superblock */ + ngdb
);
888 sbp
->f_bsize
= fs
->e2fs_bsize
;
889 sbp
->f_frsize
= MINBSIZE
<< fs
->e2fs
.e2fs_fsize
;
890 sbp
->f_iosize
= fs
->e2fs_bsize
;
891 sbp
->f_blocks
= fs
->e2fs
.e2fs_bcount
- overhead
;
892 sbp
->f_bfree
= fs
->e2fs
.e2fs_fbcount
;
893 sbp
->f_bresvd
= fs
->e2fs
.e2fs_rbcount
;
894 if (sbp
->f_bfree
> sbp
->f_bresvd
)
895 sbp
->f_bavail
= sbp
->f_bfree
- sbp
->f_bresvd
;
898 sbp
->f_files
= fs
->e2fs
.e2fs_icount
;
899 sbp
->f_ffree
= fs
->e2fs
.e2fs_ficount
;
900 sbp
->f_favail
= fs
->e2fs
.e2fs_ficount
;
902 copy_statvfs_info(sbp
, mp
);
907 * Go through the disk queues to initiate sandbagged IO;
908 * go through the inodes to write those that have been modified;
909 * initiate the writing of the super block if it has been modified.
911 * Note: we are always called with the filesystem marked `MPBUSY'.
914 ext2fs_sync(struct mount
*mp
, int waitfor
, kauth_cred_t cred
)
916 struct vnode
*vp
, *mvp
;
918 struct ufsmount
*ump
= VFSTOUFS(mp
);
920 int error
, allerror
= 0;
923 if (fs
->e2fs_fmod
!= 0 && fs
->e2fs_ronly
!= 0) { /* XXX */
924 printf("fs = %s\n", fs
->e2fs_fsmnt
);
925 panic("update: rofs mod");
928 /* Allocate a marker vnode. */
929 if ((mvp
= vnalloc(mp
)) == NULL
)
933 * Write back each (modified) inode.
935 mutex_enter(&mntvnode_lock
);
938 * NOTE: not using the TAILQ_FOREACH here since in this loop vgone()
939 * and vclean() can be called indirectly
941 for (vp
= TAILQ_FIRST(&mp
->mnt_vnodelist
); vp
; vp
= vunmark(mvp
)) {
943 if (vp
->v_mount
!= mp
|| vismarker(vp
))
945 mutex_enter(&vp
->v_interlock
);
947 if (ip
== NULL
|| (vp
->v_iflag
& (VI_XLOCK
|VI_CLEAN
)) != 0 ||
948 vp
->v_type
== VNON
||
950 (IN_CHANGE
| IN_UPDATE
| IN_MODIFIED
)) == 0 &&
951 LIST_EMPTY(&vp
->v_dirtyblkhd
) &&
952 UVM_OBJ_IS_CLEAN(&vp
->v_uobj
)))
954 mutex_exit(&vp
->v_interlock
);
957 mutex_exit(&mntvnode_lock
);
958 error
= vget(vp
, LK_EXCLUSIVE
| LK_NOWAIT
| LK_INTERLOCK
);
960 mutex_enter(&mntvnode_lock
);
961 if (error
== ENOENT
) {
962 mutex_enter(&mntvnode_lock
);
968 if (vp
->v_type
== VREG
&& waitfor
== MNT_LAZY
)
969 error
= ext2fs_update(vp
, NULL
, NULL
, 0);
971 error
= VOP_FSYNC(vp
, cred
,
972 waitfor
== MNT_WAIT
? FSYNC_WAIT
: 0, 0, 0);
976 mutex_enter(&mntvnode_lock
);
978 mutex_exit(&mntvnode_lock
);
981 * Force stale file system control information to be flushed.
983 if (waitfor
!= MNT_LAZY
) {
984 vn_lock(ump
->um_devvp
, LK_EXCLUSIVE
| LK_RETRY
);
985 if ((error
= VOP_FSYNC(ump
->um_devvp
, cred
,
986 waitfor
== MNT_WAIT
? FSYNC_WAIT
: 0, 0, 0)) != 0)
988 VOP_UNLOCK(ump
->um_devvp
, 0);
991 * Write back modified superblock.
993 if (fs
->e2fs_fmod
!= 0) {
995 fs
->e2fs
.e2fs_wtime
= time_second
;
996 if ((error
= ext2fs_cgupdate(ump
, waitfor
)))
1003 * Look up a EXT2FS dinode number to find its incore vnode, otherwise read it
1004 * in from disk. If it is in core, wait for the lock bit to clear, then
1005 * return the inode locked. Detection and handling of mount points must be
1006 * done by the calling routine.
1009 ext2fs_vget(struct mount
*mp
, ino_t ino
, struct vnode
**vpp
)
1011 struct m_ext2fs
*fs
;
1013 struct ufsmount
*ump
;
1023 if ((*vpp
= ufs_ihashget(dev
, ino
, LK_EXCLUSIVE
)) != NULL
)
1026 /* Allocate a new vnode/inode. */
1027 if ((error
= getnewvnode(VT_EXT2FS
, mp
, ext2fs_vnodeop_p
, &vp
)) != 0) {
1031 ip
= pool_get(&ext2fs_inode_pool
, PR_WAITOK
);
1033 mutex_enter(&ufs_hashlock
);
1034 if ((*vpp
= ufs_ihashget(dev
, ino
, 0)) != NULL
) {
1035 mutex_exit(&ufs_hashlock
);
1037 pool_put(&ext2fs_inode_pool
, ip
);
1041 vp
->v_vflag
|= VV_LOCKSWORK
;
1043 memset(ip
, 0, sizeof(struct inode
));
1047 ip
->i_e2fs
= fs
= ump
->um_e2fs
;
1050 ip
->i_e2fs_last_lblk
= 0;
1051 ip
->i_e2fs_last_blk
= 0;
1052 genfs_node_init(vp
, &ext2fs_genfsops
);
1055 * Put it onto its hash chain and lock it so that other requests for
1056 * this inode will block if they arrive while we are sleeping waiting
1057 * for old data structures to be purged or for the contents of the
1058 * disk portion of this inode to be read.
1062 mutex_exit(&ufs_hashlock
);
1064 /* Read in the disk contents for the inode, copy into the inode. */
1065 error
= bread(ump
->um_devvp
, fsbtodb(fs
, ino_to_fsba(fs
, ino
)),
1066 (int)fs
->e2fs_bsize
, NOCRED
, 0, &bp
);
1070 * The inode does not contain anything useful, so it would
1071 * be misleading to leave it on its hash chain. With mode
1072 * still zero, it will be unlinked and returned to the free
1081 cp
= (char *)bp
->b_data
+ (ino_to_fsbo(fs
, ino
) * EXT2_DINODE_SIZE(fs
));
1082 ip
->i_din
.e2fs_din
= pool_get(&ext2fs_dinode_pool
, PR_WAITOK
);
1083 e2fs_iload((struct ext2fs_dinode
*)cp
, ip
->i_din
.e2fs_din
);
1084 ext2fs_set_inode_guid(ip
);
1087 /* If the inode was deleted, reset all fields */
1088 if (ip
->i_e2fs_dtime
!= 0) {
1089 ip
->i_e2fs_mode
= ip
->i_e2fs_nblock
= 0;
1090 (void)ext2fs_setsize(ip
, 0);
1091 memset(ip
->i_e2fs_blocks
, 0, sizeof(ip
->i_e2fs_blocks
));
1095 * Initialize the vnode from the inode, check for aliases.
1098 error
= ext2fs_vinit(mp
, ext2fs_specop_p
, ext2fs_fifoop_p
, &vp
);
1105 * Finish inode initialization now that aliasing has been resolved.
1108 ip
->i_devvp
= ump
->um_devvp
;
1112 * Set up a generation number for this inode if it does not
1113 * already have one. This should only happen on old filesystems.
1116 if (ip
->i_e2fs_gen
== 0) {
1117 if (++ext2gennumber
< (u_long
)time_second
)
1118 ext2gennumber
= time_second
;
1119 ip
->i_e2fs_gen
= ext2gennumber
;
1120 if ((vp
->v_mount
->mnt_flag
& MNT_RDONLY
) == 0)
1121 ip
->i_flag
|= IN_MODIFIED
;
1123 uvm_vnp_setsize(vp
, ext2fs_size(ip
));
1129 * File handle to vnode
1131 * Have to be really careful about stale file handles:
1132 * - check that the inode number is valid
1133 * - call ext2fs_vget() to get the locked inode
1134 * - check for an unallocated inode (i_mode == 0)
1137 ext2fs_fhtovp(struct mount
*mp
, struct fid
*fhp
, struct vnode
**vpp
)
1143 struct m_ext2fs
*fs
;
1145 if (fhp
->fid_len
!= sizeof(struct ufid
))
1148 memcpy(&ufh
, fhp
, sizeof(struct ufid
));
1149 fs
= VFSTOUFS(mp
)->um_e2fs
;
1150 if ((ufh
.ufid_ino
< EXT2_FIRSTINO
&& ufh
.ufid_ino
!= EXT2_ROOTINO
) ||
1151 ufh
.ufid_ino
>= fs
->e2fs_ncg
* fs
->e2fs
.e2fs_ipg
)
1154 if ((error
= VFS_VGET(mp
, ufh
.ufid_ino
, &nvp
)) != 0) {
1159 if (ip
->i_e2fs_mode
== 0 || ip
->i_e2fs_dtime
!= 0 ||
1160 ip
->i_e2fs_gen
!= ufh
.ufid_gen
) {
1170 * Vnode pointer to File handle
1174 ext2fs_vptofh(struct vnode
*vp
, struct fid
*fhp
, size_t *fh_size
)
1179 if (*fh_size
< sizeof(struct ufid
)) {
1180 *fh_size
= sizeof(struct ufid
);
1183 *fh_size
= sizeof(struct ufid
);
1186 memset(&ufh
, 0, sizeof(ufh
));
1187 ufh
.ufid_len
= sizeof(struct ufid
);
1188 ufh
.ufid_ino
= ip
->i_number
;
1189 ufh
.ufid_gen
= ip
->i_e2fs_gen
;
1190 memcpy(fhp
, &ufh
, sizeof(ufh
));
1195 * Write a superblock and associated information back to disk.
1198 ext2fs_sbupdate(struct ufsmount
*mp
, int waitfor
)
1200 struct m_ext2fs
*fs
= mp
->um_e2fs
;
1204 bp
= getblk(mp
->um_devvp
, SBLOCK
, SBSIZE
, 0, 0);
1205 e2fs_sbsave(&fs
->e2fs
, (struct ext2fs
*)bp
->b_data
);
1206 if (waitfor
== MNT_WAIT
)
1214 ext2fs_cgupdate(struct ufsmount
*mp
, int waitfor
)
1216 struct m_ext2fs
*fs
= mp
->um_e2fs
;
1218 int i
, error
= 0, allerror
= 0;
1220 allerror
= ext2fs_sbupdate(mp
, waitfor
);
1221 for (i
= 0; i
< fs
->e2fs_ngdb
; i
++) {
1222 bp
= getblk(mp
->um_devvp
, fsbtodb(fs
,
1223 fs
->e2fs
.e2fs_first_dblock
+
1224 1 /* superblock */ + i
), fs
->e2fs_bsize
, 0, 0);
1225 e2fs_cgsave(&fs
->e2fs_gd
[
1226 i
* fs
->e2fs_bsize
/ sizeof(struct ext2_gd
)],
1227 (struct ext2_gd
*)bp
->b_data
, fs
->e2fs_bsize
);
1228 if (waitfor
== MNT_WAIT
)
1234 if (!allerror
&& error
)
1240 ext2fs_checksb(struct ext2fs
*fs
, int ronly
)
1243 if (fs2h16(fs
->e2fs_magic
) != E2FS_MAGIC
) {
1244 return (EINVAL
); /* XXX needs translation */
1246 if (fs2h32(fs
->e2fs_rev
) > E2FS_REV1
) {
1248 printf("Ext2 fs: unsupported revision number: %x\n",
1249 fs2h32(fs
->e2fs_rev
));
1251 return (EINVAL
); /* XXX needs translation */
1253 if (fs2h32(fs
->e2fs_log_bsize
) > 2) { /* block size = 1024|2048|4096 */
1255 printf("Ext2 fs: bad block size: %d "
1256 "(expected <= 2 for ext2 fs)\n",
1257 fs2h32(fs
->e2fs_log_bsize
));
1259 return (EINVAL
); /* XXX needs translation */
1261 if (fs2h32(fs
->e2fs_rev
) > E2FS_REV0
) {
1262 if (fs2h32(fs
->e2fs_first_ino
) != EXT2_FIRSTINO
) {
1263 printf("Ext2 fs: unsupported first inode position\n");
1264 return (EINVAL
); /* XXX needs translation */
1266 if (fs2h32(fs
->e2fs_features_incompat
) &
1267 ~EXT2F_INCOMPAT_SUPP
) {
1268 printf("Ext2 fs: unsupported optional feature\n");
1269 return (EINVAL
); /* XXX needs translation */
1271 if (!ronly
&& fs2h32(fs
->e2fs_features_rocompat
) &
1272 ~EXT2F_ROCOMPAT_SUPP
) {
1273 return (EROFS
); /* XXX needs translation */