2 * Copyright (C) International Business Machines Corp., 2000-2004
4 * This program is free software; you can redistribute it and/or modify
5 * it under the terms of the GNU General Public License as published by
6 * the Free Software Foundation; either version 2 of the License, or
7 * (at your option) any later version.
9 * This program is distributed in the hope that it will be useful,
10 * but WITHOUT ANY WARRANTY; without even the implied warranty of
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See
12 * the GNU General Public License for more details.
14 * You should have received a copy of the GNU General Public License
15 * along with this program; if not, write to the Free Software
16 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
20 #include <linux/buffer_head.h>
21 #include <linux/quotaops.h>
22 #include "jfs_incore.h"
23 #include "jfs_filsys.h"
24 #include "jfs_metapage.h"
25 #include "jfs_dinode.h"
28 #include "jfs_superblock.h"
29 #include "jfs_txnmgr.h"
30 #include "jfs_debug.h"
32 #define BITSPERPAGE (PSIZE << 3)
34 #define MEGABYTE (1 << L2MEGABYTE)
35 #define MEGABYTE32 (MEGABYTE << 5)
37 /* convert block number to bmap file page number */
38 #define BLKTODMAPN(b)\
39 (((b) >> 13) + ((b) >> 23) + ((b) >> 33) + 3 + 1)
44 * function: extend file system;
46 * |-------------------------------|----------|----------|
47 * file system space fsck inline log
51 * new LVSize: in LV blocks (required)
52 * new LogSize: in LV blocks (optional)
53 * new FSSize: in LV blocks (optional)
56 * 1. set new LogSize as specified or default from new LVSize;
57 * 2. compute new FSCKSize from new LVSize;
58 * 3. set new FSSize as MIN(FSSize, LVSize-(LogSize+FSCKSize)) where
59 * assert(new FSSize >= old FSSize),
60 * i.e., file system must not be shrinked;
62 int jfs_extendfs(struct super_block
*sb
, s64 newLVSize
, int newLogSize
)
65 struct jfs_sb_info
*sbi
= JFS_SBI(sb
);
66 struct inode
*ipbmap
= sbi
->ipbmap
;
67 struct inode
*ipbmap2
;
68 struct inode
*ipimap
= sbi
->ipimap
;
69 struct jfs_log
*log
= sbi
->log
;
70 struct bmap
*bmp
= sbi
->bmap
;
71 s64 newLogAddress
, newFSCKAddress
;
73 s64 newMapSize
= 0, mapSize
;
74 s64 XAddress
, XSize
, nblocks
, xoff
, xaddr
, t64
;
78 int newNpages
= 0, nPages
, newPage
, xlen
, t32
;
80 int log_formatted
= 0;
81 struct inode
*iplist
[1];
82 struct jfs_superblock
*j_sb
, *j_sb2
;
84 struct buffer_head
*bh
, *bh2
;
86 /* If the volume hasn't grown, get out now */
88 if (sbi
->mntflag
& JFS_INLINELOG
)
89 oldLVSize
= addressPXD(&sbi
->logpxd
) + lengthPXD(&sbi
->logpxd
);
91 oldLVSize
= addressPXD(&sbi
->fsckpxd
) +
92 lengthPXD(&sbi
->fsckpxd
);
94 if (oldLVSize
>= newLVSize
) {
96 "jfs_extendfs: volume hasn't grown, returning\n");
100 VolumeSize
= sb
->s_bdev
->bd_inode
->i_size
>> sb
->s_blocksize_bits
;
103 if (newLVSize
> VolumeSize
) {
104 printk(KERN_WARNING
"jfs_extendfs: invalid size\n");
109 /* check the device */
110 bh
= sb_bread(sb
, newLVSize
- 1);
112 printk(KERN_WARNING
"jfs_extendfs: invalid size\n");
119 /* Can't extend write-protected drive */
121 if (isReadOnly(ipbmap
)) {
122 printk(KERN_WARNING
"jfs_extendfs: read-only file system\n");
128 * reconfigure LV spaces
129 * ---------------------
131 * validate new size, or, if not specified, determine new size
135 * reconfigure inline log space:
137 if ((sbi
->mntflag
& JFS_INLINELOG
)) {
138 if (newLogSize
== 0) {
140 * no size specified: default to 1/256 of aggregate
141 * size; rounded up to a megabyte boundary;
143 newLogSize
= newLVSize
>> 8;
144 t32
= (1 << (20 - sbi
->l2bsize
)) - 1;
145 newLogSize
= (newLogSize
+ t32
) & ~t32
;
147 min(newLogSize
, MEGABYTE32
>> sbi
->l2bsize
);
150 * convert the newLogSize to fs blocks.
152 * Since this is given in megabytes, it will always be
153 * an even number of pages.
155 newLogSize
= (newLogSize
* MEGABYTE
) >> sbi
->l2bsize
;
161 newLogAddress
= newLVSize
- newLogSize
;
164 * reconfigure fsck work space:
166 * configure it to the end of the logical volume regardless of
167 * whether file system extends to the end of the aggregate;
168 * Need enough 4k pages to cover:
169 * - 1 bit per block in aggregate rounded up to BPERDMAP boundary
170 * - 1 extra page to handle control page and intermediate level pages
171 * - 50 extra pages for the chkdsk service log
173 t64
= ((newLVSize
- newLogSize
+ BPERDMAP
- 1) >> L2BPERDMAP
)
175 t32
= ((t64
+ (BITSPERPAGE
- 1)) / BITSPERPAGE
) + 1 + 50;
176 newFSCKSize
= t32
<< sbi
->l2nbperpage
;
177 newFSCKAddress
= newLogAddress
- newFSCKSize
;
180 * compute new file system space;
182 newFSSize
= newLVSize
- newLogSize
- newFSCKSize
;
184 /* file system cannot be shrinked */
185 if (newFSSize
< bmp
->db_mapsize
) {
191 * If we're expanding enough that the inline log does not overlap
192 * the old one, we can format the new log before we quiesce the
195 if ((sbi
->mntflag
& JFS_INLINELOG
) && (newLogAddress
> oldLVSize
)) {
196 if ((rc
= lmLogFormat(log
, newLogAddress
, newLogSize
)))
201 * quiesce file system
203 * (prepare to move the inline log and to prevent map update)
205 * block any new transactions and wait for completion of
206 * all wip transactions and flush modified pages s.t.
207 * on-disk file system is in consistent state and
208 * log is not required for recovery.
212 if (sbi
->mntflag
& JFS_INLINELOG
) {
214 * deactivate old inline log
219 * mark on-disk super block for fs in transition;
221 * update on-disk superblock for the new space configuration
222 * of inline log space and fsck work space descriptors:
223 * N.B. FS descriptor is NOT updated;
226 * logredo(): if FM_EXTENDFS, return to fsck() for cleanup;
227 * fsck(): if FM_EXTENDFS, reformat inline log and fsck
228 * workspace from superblock inline log descriptor and fsck
229 * workspace descriptor;
232 /* read in superblock */
233 if ((rc
= readSuper(sb
, &bh
)))
235 j_sb
= (struct jfs_superblock
*)bh
->b_data
;
237 /* mark extendfs() in progress */
238 j_sb
->s_state
|= cpu_to_le32(FM_EXTENDFS
);
239 j_sb
->s_xsize
= cpu_to_le64(newFSSize
);
240 PXDaddress(&j_sb
->s_xfsckpxd
, newFSCKAddress
);
241 PXDlength(&j_sb
->s_xfsckpxd
, newFSCKSize
);
242 PXDaddress(&j_sb
->s_xlogpxd
, newLogAddress
);
243 PXDlength(&j_sb
->s_xlogpxd
, newLogSize
);
245 /* synchronously update superblock */
246 mark_buffer_dirty(bh
);
247 sync_dirty_buffer(bh
);
251 * format new inline log synchronously;
253 * crash recovery: if log move in progress,
254 * reformat log and exit success;
257 if ((rc
= lmLogFormat(log
, newLogAddress
, newLogSize
)))
263 log
->base
= newLogAddress
;
264 log
->size
= newLogSize
>> (L2LOGPSIZE
- sb
->s_blocksize_bits
);
265 if ((rc
= lmLogInit(log
)))
270 * extend block allocation map
271 * ---------------------------
273 * extendfs() for new extension, retry after crash recovery;
275 * note: both logredo() and fsck() rebuild map from
276 * the bitmap and configuration parameter from superblock
277 * (disregarding all other control information in the map);
280 * s_size: aggregate size in physical blocks;
283 * compute the new block allocation map configuration
286 * di_size: map file size in byte;
287 * di_nblocks: number of blocks allocated for map file;
288 * di_mapsize: number of blocks in aggregate (covered by map);
290 * db_mapsize: number of blocks in aggregate (covered by map);
292 newMapSize
= newFSSize
;
293 /* number of data pages of new bmap file:
294 * roundup new size to full dmap page boundary and
295 * add 1 extra dmap page for next extendfs()
297 t64
= (newMapSize
- 1) + BPERDMAP
;
298 newNpages
= BLKTODMAPN(t64
) + 1;
301 * extend map from current map (WITHOUT growing mapfile)
303 * map new extension with unmapped part of the last partial
304 * dmap page, if applicable, and extra page(s) allocated
305 * at end of bmap by mkfs() or previous extendfs();
308 /* compute number of blocks requested to extend */
309 mapSize
= bmp
->db_mapsize
;
310 XAddress
= mapSize
; /* eXtension Address */
311 XSize
= newMapSize
- mapSize
; /* eXtension Size */
312 old_agsize
= bmp
->db_agsize
; /* We need to know if this changes */
314 /* compute number of blocks that can be extended by current mapfile */
315 t64
= dbMapFileSizeToMapSize(ipbmap
);
317 printk(KERN_ERR
"jfs_extendfs: mapSize (0x%Lx) > t64 (0x%Lx)\n",
318 (long long) mapSize
, (long long) t64
);
322 nblocks
= min(t64
- mapSize
, XSize
);
325 * update map pages for new extension:
327 * update/init dmap and bubble up the control hierarchy
328 * incrementally fold up dmaps into upper levels;
329 * update bmap control page;
331 if ((rc
= dbExtendFS(ipbmap
, XAddress
, nblocks
)))
334 * the map now has extended to cover additional nblocks:
335 * dn_mapsize = oldMapsize + nblocks;
337 /* ipbmap->i_mapsize += nblocks; */
341 * grow map file to cover remaining extension
342 * and/or one extra dmap page for next extendfs();
344 * allocate new map pages and its backing blocks, and
345 * update map file xtree
347 /* compute number of data pages of current bmap file */
348 nPages
= ipbmap
->i_size
>> L2PSIZE
;
350 /* need to grow map file ? */
351 if (nPages
== newNpages
)
355 * grow bmap file for the new map pages required:
357 * allocate growth at the start of newly extended region;
358 * bmap file only grows sequentially, i.e., both data pages
359 * and possibly xtree index pages may grow in append mode,
360 * s.t. logredo() can reconstruct pre-extension state
361 * by washing away bmap file of pages outside s_size boundary;
364 * journal map file growth as if a regular file growth:
365 * (note: bmap is created with di_mode = IFJOURNAL|IFREG);
367 * journaling of bmap file growth is not required since
368 * logredo() do/can not use log records of bmap file growth
369 * but it provides careful write semantics, pmap update, etc.;
371 /* synchronous write of data pages: bmap data pages are
372 * cached in meta-data cache, and not written out
375 filemap_fdatawait(ipbmap
->i_mapping
);
376 filemap_fdatawrite(ipbmap
->i_mapping
);
377 filemap_fdatawait(ipbmap
->i_mapping
);
378 diWriteSpecial(ipbmap
, 0);
380 newPage
= nPages
; /* first new page number */
381 xoff
= newPage
<< sbi
->l2nbperpage
;
382 xlen
= (newNpages
- nPages
) << sbi
->l2nbperpage
;
383 xlen
= min(xlen
, (int) nblocks
) & ~(sbi
->nbperpage
- 1);
386 tid
= txBegin(sb
, COMMIT_FORCE
);
388 if ((rc
= xtAppend(tid
, ipbmap
, 0, xoff
, nblocks
, &xlen
, &xaddr
, 0))) {
392 /* update bmap file size */
393 ipbmap
->i_size
+= xlen
<< sbi
->l2bsize
;
394 inode_add_bytes(ipbmap
, xlen
<< sbi
->l2bsize
);
397 rc
= txCommit(tid
, 1, &iplist
[0], COMMIT_FORCE
);
405 * map file has been grown now to cover extension to further out;
406 * di_size = new map file size;
408 * if huge extension, the previous extension based on previous
409 * map file size may not have been sufficient to cover whole extension
410 * (it could have been used up for new map pages),
411 * but the newly grown map file now covers lot bigger new free space
412 * available for further extension of map;
414 /* any more blocks to extend ? */
420 dbFinalizeBmap(ipbmap
);
423 * update inode allocation map
424 * ---------------------------
426 * move iag lists from old to new iag;
427 * agstart field is not updated for logredo() to reconstruct
428 * iag lists if system crash occurs.
429 * (computation of ag number from agstart based on agsize
430 * will correctly identify the new ag);
432 /* if new AG size the same as old AG size, done! */
433 if (bmp
->db_agsize
!= old_agsize
) {
434 if ((rc
= diExtendFS(ipimap
, ipbmap
)))
438 if ((rc
= diSync(ipimap
)))
446 * extension is committed when on-disk super block is
447 * updated with new descriptors: logredo will recover
448 * crash before it to pre-extension state;
451 /* sync log to skip log replay of bmap file growth transaction; */
452 /* lmLogSync(log, 1); */
455 * synchronous write bmap global control page;
456 * for crash before completion of write
457 * logredo() will recover to pre-extendfs state;
458 * for crash after completion of write,
459 * logredo() will recover post-extendfs state;
461 if ((rc
= dbSync(ipbmap
)))
465 * copy primary bmap inode to secondary bmap inode
468 ipbmap2
= diReadSpecial(sb
, BMAP_I
, 1);
469 if (ipbmap2
== NULL
) {
470 printk(KERN_ERR
"jfs_extendfs: diReadSpecial(bmap) failed\n");
473 memcpy(&JFS_IP(ipbmap2
)->i_xtroot
, &JFS_IP(ipbmap
)->i_xtroot
, 288);
474 ipbmap2
->i_size
= ipbmap
->i_size
;
475 ipbmap2
->i_blocks
= ipbmap
->i_blocks
;
477 diWriteSpecial(ipbmap2
, 1);
478 diFreeSpecial(ipbmap2
);
483 if ((rc
= readSuper(sb
, &bh
)))
485 j_sb
= (struct jfs_superblock
*)bh
->b_data
;
487 /* mark extendfs() completion */
488 j_sb
->s_state
&= cpu_to_le32(~FM_EXTENDFS
);
489 j_sb
->s_size
= cpu_to_le64(bmp
->db_mapsize
<<
490 le16_to_cpu(j_sb
->s_l2bfactor
));
491 j_sb
->s_agsize
= cpu_to_le32(bmp
->db_agsize
);
493 /* update inline log space descriptor */
494 if (sbi
->mntflag
& JFS_INLINELOG
) {
495 PXDaddress(&(j_sb
->s_logpxd
), newLogAddress
);
496 PXDlength(&(j_sb
->s_logpxd
), newLogSize
);
499 /* record log's mount serial number */
500 j_sb
->s_logserial
= cpu_to_le32(log
->serial
);
502 /* update fsck work space descriptor */
503 PXDaddress(&(j_sb
->s_fsckpxd
), newFSCKAddress
);
504 PXDlength(&(j_sb
->s_fsckpxd
), newFSCKSize
);
506 /* sb->s_fsckloglen remains the same */
508 /* Update secondary superblock */
509 bh2
= sb_bread(sb
, SUPER2_OFF
>> sb
->s_blocksize_bits
);
511 j_sb2
= (struct jfs_superblock
*)bh2
->b_data
;
512 memcpy(j_sb2
, j_sb
, sizeof (struct jfs_superblock
));
514 mark_buffer_dirty(bh
);
515 sync_dirty_buffer(bh2
);
519 /* write primary superblock */
520 mark_buffer_dirty(bh
);
521 sync_dirty_buffer(bh
);
527 jfs_error(sb
, "jfs_extendfs");
531 * resume file system transactions