Root/fs/jfs/resize.c

/*
 * Copyright (C) International Business Machines Corp., 2000-2004
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See
 * the GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
 */
18
19#include <linux/fs.h>
20#include <linux/buffer_head.h>
21#include <linux/quotaops.h>
22#include "jfs_incore.h"
23#include "jfs_filsys.h"
24#include "jfs_metapage.h"
25#include "jfs_dinode.h"
26#include "jfs_imap.h"
27#include "jfs_dmap.h"
28#include "jfs_superblock.h"
29#include "jfs_txnmgr.h"
30#include "jfs_debug.h"
31
/* number of bits held by one page of PSIZE bytes */
#define BITSPERPAGE	(PSIZE << 3)
/* log2 of one megabyte, and one megabyte in bytes */
#define L2MEGABYTE	20
#define MEGABYTE	(1 << L2MEGABYTE)
/* 32 megabytes in bytes: upper bound applied to the default inline log size */
#define MEGABYTE32	(MEGABYTE << 5)

/*
 * convert block number to bmap file page number
 *
 * b must be a 64-bit quantity: the expression shifts it right by 33.
 * NOTE(review): the "+ 3 + 1" term presumably mirrors BLKTODMAP() in
 * jfs_dmap.h (L2/L1/L0 control pages plus the map control page) --
 * confirm against that header.
 */
#define BLKTODMAPN(b)\
	(((b) >> 13) + ((b) >> 23) + ((b) >> 33) + 3 + 1)
40
41/*
42 * jfs_extendfs()
43 *
44 * function: extend file system;
45 *
46 * |-------------------------------|----------|----------|
47 * file system space fsck inline log
48 * workspace space
49 *
50 * input:
51 * new LVSize: in LV blocks (required)
52 * new LogSize: in LV blocks (optional)
53 * new FSSize: in LV blocks (optional)
54 *
55 * new configuration:
56 * 1. set new LogSize as specified or default from new LVSize;
57 * 2. compute new FSCKSize from new LVSize;
58 * 3. set new FSSize as MIN(FSSize, LVSize-(LogSize+FSCKSize)) where
59 * assert(new FSSize >= old FSSize),
60 * i.e., file system must not be shrunk;
61 */
62int jfs_extendfs(struct super_block *sb, s64 newLVSize, int newLogSize)
63{
64    int rc = 0;
65    struct jfs_sb_info *sbi = JFS_SBI(sb);
66    struct inode *ipbmap = sbi->ipbmap;
67    struct inode *ipbmap2;
68    struct inode *ipimap = sbi->ipimap;
69    struct jfs_log *log = sbi->log;
70    struct bmap *bmp = sbi->bmap;
71    s64 newLogAddress, newFSCKAddress;
72    int newFSCKSize;
73    s64 newMapSize = 0, mapSize;
74    s64 XAddress, XSize, nblocks, xoff, xaddr, t64;
75    s64 oldLVSize;
76    s64 newFSSize;
77    s64 VolumeSize;
78    int newNpages = 0, nPages, newPage, xlen, t32;
79    int tid;
80    int log_formatted = 0;
81    struct inode *iplist[1];
82    struct jfs_superblock *j_sb, *j_sb2;
83    s64 old_agsize;
84    int agsizechanged = 0;
85    struct buffer_head *bh, *bh2;
86
87    /* If the volume hasn't grown, get out now */
88
89    if (sbi->mntflag & JFS_INLINELOG)
90        oldLVSize = addressPXD(&sbi->logpxd) + lengthPXD(&sbi->logpxd);
91    else
92        oldLVSize = addressPXD(&sbi->fsckpxd) +
93            lengthPXD(&sbi->fsckpxd);
94
95    if (oldLVSize >= newLVSize) {
96        printk(KERN_WARNING
97               "jfs_extendfs: volume hasn't grown, returning\n");
98        goto out;
99    }
100
101    VolumeSize = sb->s_bdev->bd_inode->i_size >> sb->s_blocksize_bits;
102
103    if (VolumeSize) {
104        if (newLVSize > VolumeSize) {
105            printk(KERN_WARNING "jfs_extendfs: invalid size\n");
106            rc = -EINVAL;
107            goto out;
108        }
109    } else {
110        /* check the device */
111        bh = sb_bread(sb, newLVSize - 1);
112        if (!bh) {
113            printk(KERN_WARNING "jfs_extendfs: invalid size\n");
114            rc = -EINVAL;
115            goto out;
116        }
117        bforget(bh);
118    }
119
120    /* Can't extend write-protected drive */
121
122    if (isReadOnly(ipbmap)) {
123        printk(KERN_WARNING "jfs_extendfs: read-only file system\n");
124        rc = -EROFS;
125        goto out;
126    }
127
128    /*
129     * reconfigure LV spaces
130     * ---------------------
131     *
132     * validate new size, or, if not specified, determine new size
133     */
134
135    /*
136     * reconfigure inline log space:
137     */
138    if ((sbi->mntflag & JFS_INLINELOG)) {
139        if (newLogSize == 0) {
140            /*
141             * no size specified: default to 1/256 of aggregate
142             * size; rounded up to a megabyte boundary;
143             */
144            newLogSize = newLVSize >> 8;
145            t32 = (1 << (20 - sbi->l2bsize)) - 1;
146            newLogSize = (newLogSize + t32) & ~t32;
147            newLogSize =
148                min(newLogSize, MEGABYTE32 >> sbi->l2bsize);
149        } else {
150            /*
151             * convert the newLogSize to fs blocks.
152             *
153             * Since this is given in megabytes, it will always be
154             * an even number of pages.
155             */
156            newLogSize = (newLogSize * MEGABYTE) >> sbi->l2bsize;
157        }
158
159    } else
160        newLogSize = 0;
161
162    newLogAddress = newLVSize - newLogSize;
163
164    /*
165     * reconfigure fsck work space:
166     *
167     * configure it to the end of the logical volume regardless of
168     * whether file system extends to the end of the aggregate;
169     * Need enough 4k pages to cover:
170     * - 1 bit per block in aggregate rounded up to BPERDMAP boundary
171     * - 1 extra page to handle control page and intermediate level pages
172     * - 50 extra pages for the chkdsk service log
173     */
174    t64 = ((newLVSize - newLogSize + BPERDMAP - 1) >> L2BPERDMAP)
175        << L2BPERDMAP;
176    t32 = DIV_ROUND_UP(t64, BITSPERPAGE) + 1 + 50;
177    newFSCKSize = t32 << sbi->l2nbperpage;
178    newFSCKAddress = newLogAddress - newFSCKSize;
179
180    /*
181     * compute new file system space;
182     */
183    newFSSize = newLVSize - newLogSize - newFSCKSize;
184
185    /* file system cannot be shrunk */
186    if (newFSSize < bmp->db_mapsize) {
187        rc = -EINVAL;
188        goto out;
189    }
190
191    /*
192     * If we're expanding enough that the inline log does not overlap
193     * the old one, we can format the new log before we quiesce the
194     * filesystem.
195     */
196    if ((sbi->mntflag & JFS_INLINELOG) && (newLogAddress > oldLVSize)) {
197        if ((rc = lmLogFormat(log, newLogAddress, newLogSize)))
198            goto out;
199        log_formatted = 1;
200    }
201    /*
202     * quiesce file system
203     *
204     * (prepare to move the inline log and to prevent map update)
205     *
206     * block any new transactions and wait for completion of
207     * all wip transactions and flush modified pages s.t.
208     * on-disk file system is in consistent state and
209     * log is not required for recovery.
210     */
211    txQuiesce(sb);
212
213    /* Reset size of direct inode */
214    sbi->direct_inode->i_size = sb->s_bdev->bd_inode->i_size;
215
216    if (sbi->mntflag & JFS_INLINELOG) {
217        /*
218         * deactivate old inline log
219         */
220        lmLogShutdown(log);
221
222        /*
223         * mark on-disk super block for fs in transition;
224         *
225         * update on-disk superblock for the new space configuration
226         * of inline log space and fsck work space descriptors:
227         * N.B. FS descriptor is NOT updated;
228         *
229         * crash recovery:
230         * logredo(): if FM_EXTENDFS, return to fsck() for cleanup;
231         * fsck(): if FM_EXTENDFS, reformat inline log and fsck
232         * workspace from superblock inline log descriptor and fsck
233         * workspace descriptor;
234         */
235
236        /* read in superblock */
237        if ((rc = readSuper(sb, &bh)))
238            goto error_out;
239        j_sb = (struct jfs_superblock *)bh->b_data;
240
241        /* mark extendfs() in progress */
242        j_sb->s_state |= cpu_to_le32(FM_EXTENDFS);
243        j_sb->s_xsize = cpu_to_le64(newFSSize);
244        PXDaddress(&j_sb->s_xfsckpxd, newFSCKAddress);
245        PXDlength(&j_sb->s_xfsckpxd, newFSCKSize);
246        PXDaddress(&j_sb->s_xlogpxd, newLogAddress);
247        PXDlength(&j_sb->s_xlogpxd, newLogSize);
248
249        /* synchronously update superblock */
250        mark_buffer_dirty(bh);
251        sync_dirty_buffer(bh);
252        brelse(bh);
253
254        /*
255         * format new inline log synchronously;
256         *
257         * crash recovery: if log move in progress,
258         * reformat log and exit success;
259         */
260        if (!log_formatted)
261            if ((rc = lmLogFormat(log, newLogAddress, newLogSize)))
262                goto error_out;
263
264        /*
265         * activate new log
266         */
267        log->base = newLogAddress;
268        log->size = newLogSize >> (L2LOGPSIZE - sb->s_blocksize_bits);
269        if ((rc = lmLogInit(log)))
270            goto error_out;
271    }
272
273    /*
274     * extend block allocation map
275     * ---------------------------
276     *
277     * extendfs() for new extension, retry after crash recovery;
278     *
279     * note: both logredo() and fsck() rebuild map from
280     * the bitmap and configuration parameter from superblock
281     * (disregarding all other control information in the map);
282     *
283     * superblock:
284     * s_size: aggregate size in physical blocks;
285     */
286    /*
287     * compute the new block allocation map configuration
288     *
289     * map dinode:
290     * di_size: map file size in byte;
291     * di_nblocks: number of blocks allocated for map file;
292     * di_mapsize: number of blocks in aggregate (covered by map);
293     * map control page:
294     * db_mapsize: number of blocks in aggregate (covered by map);
295     */
296    newMapSize = newFSSize;
297    /* number of data pages of new bmap file:
298     * roundup new size to full dmap page boundary and
299     * add 1 extra dmap page for next extendfs()
300     */
301    t64 = (newMapSize - 1) + BPERDMAP;
302    newNpages = BLKTODMAPN(t64) + 1;
303
304    /*
305     * extend map from current map (WITHOUT growing mapfile)
306     *
307     * map new extension with unmapped part of the last partial
308     * dmap page, if applicable, and extra page(s) allocated
309     * at end of bmap by mkfs() or previous extendfs();
310     */
311      extendBmap:
312    /* compute number of blocks requested to extend */
313    mapSize = bmp->db_mapsize;
314    XAddress = mapSize; /* eXtension Address */
315    XSize = newMapSize - mapSize; /* eXtension Size */
316    old_agsize = bmp->db_agsize; /* We need to know if this changes */
317
318    /* compute number of blocks that can be extended by current mapfile */
319    t64 = dbMapFileSizeToMapSize(ipbmap);
320    if (mapSize > t64) {
321        printk(KERN_ERR "jfs_extendfs: mapSize (0x%Lx) > t64 (0x%Lx)\n",
322               (long long) mapSize, (long long) t64);
323        rc = -EIO;
324        goto error_out;
325    }
326    nblocks = min(t64 - mapSize, XSize);
327
328    /*
329     * update map pages for new extension:
330     *
331     * update/init dmap and bubble up the control hierarchy
332     * incrementally fold up dmaps into upper levels;
333     * update bmap control page;
334     */
335    if ((rc = dbExtendFS(ipbmap, XAddress, nblocks)))
336        goto error_out;
337
338    agsizechanged |= (bmp->db_agsize != old_agsize);
339
340    /*
341     * the map now has extended to cover additional nblocks:
342     * dn_mapsize = oldMapsize + nblocks;
343     */
344    /* ipbmap->i_mapsize += nblocks; */
345    XSize -= nblocks;
346
347    /*
348     * grow map file to cover remaining extension
349     * and/or one extra dmap page for next extendfs();
350     *
351     * allocate new map pages and its backing blocks, and
352     * update map file xtree
353     */
354    /* compute number of data pages of current bmap file */
355    nPages = ipbmap->i_size >> L2PSIZE;
356
357    /* need to grow map file ? */
358    if (nPages == newNpages)
359        goto finalizeBmap;
360
361    /*
362     * grow bmap file for the new map pages required:
363     *
364     * allocate growth at the start of newly extended region;
365     * bmap file only grows sequentially, i.e., both data pages
366     * and possibly xtree index pages may grow in append mode,
367     * s.t. logredo() can reconstruct pre-extension state
368     * by washing away bmap file of pages outside s_size boundary;
369     */
370    /*
371     * journal map file growth as if a regular file growth:
372     * (note: bmap is created with di_mode = IFJOURNAL|IFREG);
373     *
374     * journaling of bmap file growth is not required since
375     * logredo() do/can not use log records of bmap file growth
376     * but it provides careful write semantics, pmap update, etc.;
377     */
378    /* synchronous write of data pages: bmap data pages are
379     * cached in meta-data cache, and not written out
380     * by txCommit();
381     */
382    filemap_fdatawait(ipbmap->i_mapping);
383    filemap_write_and_wait(ipbmap->i_mapping);
384    diWriteSpecial(ipbmap, 0);
385
386    newPage = nPages; /* first new page number */
387    xoff = newPage << sbi->l2nbperpage;
388    xlen = (newNpages - nPages) << sbi->l2nbperpage;
389    xlen = min(xlen, (int) nblocks) & ~(sbi->nbperpage - 1);
390    xaddr = XAddress;
391
392    tid = txBegin(sb, COMMIT_FORCE);
393
394    if ((rc = xtAppend(tid, ipbmap, 0, xoff, nblocks, &xlen, &xaddr, 0))) {
395        txEnd(tid);
396        goto error_out;
397    }
398    /* update bmap file size */
399    ipbmap->i_size += xlen << sbi->l2bsize;
400    inode_add_bytes(ipbmap, xlen << sbi->l2bsize);
401
402    iplist[0] = ipbmap;
403    rc = txCommit(tid, 1, &iplist[0], COMMIT_FORCE);
404
405    txEnd(tid);
406
407    if (rc)
408        goto error_out;
409
410    /*
411     * map file has been grown now to cover extension to further out;
412     * di_size = new map file size;
413     *
414     * if huge extension, the previous extension based on previous
415     * map file size may not have been sufficient to cover whole extension
416     * (it could have been used up for new map pages),
417     * but the newly grown map file now covers lot bigger new free space
418     * available for further extension of map;
419     */
420    /* any more blocks to extend ? */
421    if (XSize)
422        goto extendBmap;
423
424      finalizeBmap:
425    /* finalize bmap */
426    dbFinalizeBmap(ipbmap);
427
428    /*
429     * update inode allocation map
430     * ---------------------------
431     *
432     * move iag lists from old to new iag;
433     * agstart field is not updated for logredo() to reconstruct
434     * iag lists if system crash occurs.
435     * (computation of ag number from agstart based on agsize
436     * will correctly identify the new ag);
437     */
438    /* if new AG size the same as old AG size, done! */
439    if (agsizechanged) {
440        if ((rc = diExtendFS(ipimap, ipbmap)))
441            goto error_out;
442
443        /* finalize imap */
444        if ((rc = diSync(ipimap)))
445            goto error_out;
446    }
447
448    /*
449     * finalize
450     * --------
451     *
452     * extension is committed when on-disk super block is
453     * updated with new descriptors: logredo will recover
454     * crash before it to pre-extension state;
455     */
456
457    /* sync log to skip log replay of bmap file growth transaction; */
458    /* lmLogSync(log, 1); */
459
460    /*
461     * synchronous write bmap global control page;
462     * for crash before completion of write
463     * logredo() will recover to pre-extendfs state;
464     * for crash after completion of write,
465     * logredo() will recover post-extendfs state;
466     */
467    if ((rc = dbSync(ipbmap)))
468        goto error_out;
469
470    /*
471     * copy primary bmap inode to secondary bmap inode
472     */
473
474    ipbmap2 = diReadSpecial(sb, BMAP_I, 1);
475    if (ipbmap2 == NULL) {
476        printk(KERN_ERR "jfs_extendfs: diReadSpecial(bmap) failed\n");
477        goto error_out;
478    }
479    memcpy(&JFS_IP(ipbmap2)->i_xtroot, &JFS_IP(ipbmap)->i_xtroot, 288);
480    ipbmap2->i_size = ipbmap->i_size;
481    ipbmap2->i_blocks = ipbmap->i_blocks;
482
483    diWriteSpecial(ipbmap2, 1);
484    diFreeSpecial(ipbmap2);
485
486    /*
487     * update superblock
488     */
489    if ((rc = readSuper(sb, &bh)))
490        goto error_out;
491    j_sb = (struct jfs_superblock *)bh->b_data;
492
493    /* mark extendfs() completion */
494    j_sb->s_state &= cpu_to_le32(~FM_EXTENDFS);
495    j_sb->s_size = cpu_to_le64(bmp->db_mapsize <<
496                   le16_to_cpu(j_sb->s_l2bfactor));
497    j_sb->s_agsize = cpu_to_le32(bmp->db_agsize);
498
499    /* update inline log space descriptor */
500    if (sbi->mntflag & JFS_INLINELOG) {
501        PXDaddress(&(j_sb->s_logpxd), newLogAddress);
502        PXDlength(&(j_sb->s_logpxd), newLogSize);
503    }
504
505    /* record log's mount serial number */
506    j_sb->s_logserial = cpu_to_le32(log->serial);
507
508    /* update fsck work space descriptor */
509    PXDaddress(&(j_sb->s_fsckpxd), newFSCKAddress);
510    PXDlength(&(j_sb->s_fsckpxd), newFSCKSize);
511    j_sb->s_fscklog = 1;
512    /* sb->s_fsckloglen remains the same */
513
514    /* Update secondary superblock */
515    bh2 = sb_bread(sb, SUPER2_OFF >> sb->s_blocksize_bits);
516    if (bh2) {
517        j_sb2 = (struct jfs_superblock *)bh2->b_data;
518        memcpy(j_sb2, j_sb, sizeof (struct jfs_superblock));
519
520        mark_buffer_dirty(bh);
521        sync_dirty_buffer(bh2);
522        brelse(bh2);
523    }
524
525    /* write primary superblock */
526    mark_buffer_dirty(bh);
527    sync_dirty_buffer(bh);
528    brelse(bh);
529
530    goto resume;
531
532      error_out:
533    jfs_error(sb, "jfs_extendfs");
534
535      resume:
536    /*
537     * resume file system transactions
538     */
539    txResume(sb);
540
541      out:
542    return rc;
543}
544

Archive Download this file



interactive