/*
 *   Copyright (C) International Business Machines Corp., 2000-2004
 *
 *   This program is free software;  you can redistribute it and/or modify
 *   it under the terms of the GNU General Public License as published by
 *   the Free Software Foundation; either version 2 of the License, or
 *   (at your option) any later version.
 *
 *   This program is distributed in the hope that it will be useful,
 *   but WITHOUT ANY WARRANTY;  without even the implied warranty of
 *   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See
 *   the GNU General Public License for more details.
 *
 *   You should have received a copy of the GNU General Public License
 *   along with this program;  if not, write to the Free Software
 *   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
 */
18
19#include <linux/fs.h>
20#include <linux/buffer_head.h>
21#include <linux/quotaops.h>
22#include "jfs_incore.h"
23#include "jfs_filsys.h"
24#include "jfs_metapage.h"
25#include "jfs_dinode.h"
26#include "jfs_imap.h"
27#include "jfs_dmap.h"
28#include "jfs_superblock.h"
29#include "jfs_txnmgr.h"
30#include "jfs_debug.h"
31
/* number of bits in one page of PSIZE bytes */
#define BITSPERPAGE	(PSIZE << 3)
/* log2 of one megabyte, and the byte counts for 1 MB and 32 MB */
#define L2MEGABYTE	20
#define MEGABYTE	(1 << L2MEGABYTE)
#define MEGABYTE32	(MEGABYTE << 5)

/*
 * convert block number to bmap file page number
 *
 * The argument is widened to 64 bits before shifting: a shift by 33
 * on a 32-bit operand would be undefined behaviour.  Results for 64-bit
 * arguments are unchanged.
 *
 * NOTE(review): the shifts by 13/23/33 presumably count dmap pages and
 * the two upper levels of dmap control pages, and "+ 3 + 1" the leading
 * control pages of the map file -- confirm against jfs_dmap.h.
 */
#define BLKTODMAPN(b)\
	((((long long)(b)) >> 13) + (((long long)(b)) >> 23) + \
	 (((long long)(b)) >> 33) + 3 + 1)
Linus Torvalds1da177e2005-04-16 15:20:36 -070040
41/*
Dave Kleikampf720e3b2007-06-06 15:28:35 -050042 * jfs_extendfs()
Linus Torvalds1da177e2005-04-16 15:20:36 -070043 *
44 * function: extend file system;
45 *
46 * |-------------------------------|----------|----------|
47 * file system space fsck inline log
48 * workspace space
49 *
50 * input:
Dave Kleikampf720e3b2007-06-06 15:28:35 -050051 * new LVSize: in LV blocks (required)
52 * new LogSize: in LV blocks (optional)
53 * new FSSize: in LV blocks (optional)
Linus Torvalds1da177e2005-04-16 15:20:36 -070054 *
55 * new configuration:
56 * 1. set new LogSize as specified or default from new LVSize;
57 * 2. compute new FSCKSize from new LVSize;
58 * 3. set new FSSize as MIN(FSSize, LVSize-(LogSize+FSCKSize)) where
59 * assert(new FSSize >= old FSSize),
Lucas De Marchi25985ed2011-03-30 22:57:33 -030060 * i.e., file system must not be shrunk;
Linus Torvalds1da177e2005-04-16 15:20:36 -070061 */
62int jfs_extendfs(struct super_block *sb, s64 newLVSize, int newLogSize)
63{
64 int rc = 0;
65 struct jfs_sb_info *sbi = JFS_SBI(sb);
66 struct inode *ipbmap = sbi->ipbmap;
67 struct inode *ipbmap2;
68 struct inode *ipimap = sbi->ipimap;
69 struct jfs_log *log = sbi->log;
70 struct bmap *bmp = sbi->bmap;
71 s64 newLogAddress, newFSCKAddress;
72 int newFSCKSize;
73 s64 newMapSize = 0, mapSize;
74 s64 XAddress, XSize, nblocks, xoff, xaddr, t64;
75 s64 oldLVSize;
76 s64 newFSSize;
77 s64 VolumeSize;
78 int newNpages = 0, nPages, newPage, xlen, t32;
79 int tid;
80 int log_formatted = 0;
81 struct inode *iplist[1];
82 struct jfs_superblock *j_sb, *j_sb2;
Dave Kleikamp206b6312011-06-20 10:30:04 -050083 s64 old_agsize;
Bill Pemberton2b0b3952010-04-16 08:01:20 -050084 int agsizechanged = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -070085 struct buffer_head *bh, *bh2;
86
87 /* If the volume hasn't grown, get out now */
88
89 if (sbi->mntflag & JFS_INLINELOG)
90 oldLVSize = addressPXD(&sbi->logpxd) + lengthPXD(&sbi->logpxd);
91 else
92 oldLVSize = addressPXD(&sbi->fsckpxd) +
93 lengthPXD(&sbi->fsckpxd);
94
95 if (oldLVSize >= newLVSize) {
96 printk(KERN_WARNING
97 "jfs_extendfs: volume hasn't grown, returning\n");
98 goto out;
99 }
100
Fabian Frederick684666e2017-01-23 18:50:23 +0100101 VolumeSize = i_size_read(sb->s_bdev->bd_inode) >> sb->s_blocksize_bits;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700102
103 if (VolumeSize) {
104 if (newLVSize > VolumeSize) {
105 printk(KERN_WARNING "jfs_extendfs: invalid size\n");
106 rc = -EINVAL;
107 goto out;
108 }
109 } else {
110 /* check the device */
111 bh = sb_bread(sb, newLVSize - 1);
112 if (!bh) {
113 printk(KERN_WARNING "jfs_extendfs: invalid size\n");
114 rc = -EINVAL;
115 goto out;
116 }
117 bforget(bh);
118 }
119
120 /* Can't extend write-protected drive */
121
122 if (isReadOnly(ipbmap)) {
123 printk(KERN_WARNING "jfs_extendfs: read-only file system\n");
124 rc = -EROFS;
125 goto out;
126 }
127
128 /*
Dave Kleikampf720e3b2007-06-06 15:28:35 -0500129 * reconfigure LV spaces
130 * ---------------------
Linus Torvalds1da177e2005-04-16 15:20:36 -0700131 *
132 * validate new size, or, if not specified, determine new size
133 */
134
135 /*
136 * reconfigure inline log space:
137 */
138 if ((sbi->mntflag & JFS_INLINELOG)) {
139 if (newLogSize == 0) {
140 /*
141 * no size specified: default to 1/256 of aggregate
142 * size; rounded up to a megabyte boundary;
143 */
144 newLogSize = newLVSize >> 8;
145 t32 = (1 << (20 - sbi->l2bsize)) - 1;
146 newLogSize = (newLogSize + t32) & ~t32;
147 newLogSize =
148 min(newLogSize, MEGABYTE32 >> sbi->l2bsize);
149 } else {
150 /*
151 * convert the newLogSize to fs blocks.
152 *
153 * Since this is given in megabytes, it will always be
154 * an even number of pages.
155 */
156 newLogSize = (newLogSize * MEGABYTE) >> sbi->l2bsize;
157 }
158
159 } else
160 newLogSize = 0;
161
162 newLogAddress = newLVSize - newLogSize;
163
164 /*
165 * reconfigure fsck work space:
166 *
167 * configure it to the end of the logical volume regardless of
168 * whether file system extends to the end of the aggregate;
169 * Need enough 4k pages to cover:
170 * - 1 bit per block in aggregate rounded up to BPERDMAP boundary
171 * - 1 extra page to handle control page and intermediate level pages
172 * - 50 extra pages for the chkdsk service log
173 */
174 t64 = ((newLVSize - newLogSize + BPERDMAP - 1) >> L2BPERDMAP)
175 << L2BPERDMAP;
Shaun Zincka7fe0ba2007-08-31 12:57:28 -0500176 t32 = DIV_ROUND_UP(t64, BITSPERPAGE) + 1 + 50;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700177 newFSCKSize = t32 << sbi->l2nbperpage;
178 newFSCKAddress = newLogAddress - newFSCKSize;
179
180 /*
181 * compute new file system space;
182 */
183 newFSSize = newLVSize - newLogSize - newFSCKSize;
184
Lucas De Marchi25985ed2011-03-30 22:57:33 -0300185 /* file system cannot be shrunk */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700186 if (newFSSize < bmp->db_mapsize) {
187 rc = -EINVAL;
188 goto out;
189 }
190
191 /*
192 * If we're expanding enough that the inline log does not overlap
193 * the old one, we can format the new log before we quiesce the
194 * filesystem.
195 */
196 if ((sbi->mntflag & JFS_INLINELOG) && (newLogAddress > oldLVSize)) {
197 if ((rc = lmLogFormat(log, newLogAddress, newLogSize)))
198 goto out;
199 log_formatted = 1;
200 }
201 /*
Dave Kleikampf720e3b2007-06-06 15:28:35 -0500202 * quiesce file system
Linus Torvalds1da177e2005-04-16 15:20:36 -0700203 *
204 * (prepare to move the inline log and to prevent map update)
205 *
206 * block any new transactions and wait for completion of
207 * all wip transactions and flush modified pages s.t.
208 * on-disk file system is in consistent state and
209 * log is not required for recovery.
210 */
211 txQuiesce(sb);
212
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600213 /* Reset size of direct inode */
Fabian Frederick684666e2017-01-23 18:50:23 +0100214 sbi->direct_inode->i_size = i_size_read(sb->s_bdev->bd_inode);
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600215
Linus Torvalds1da177e2005-04-16 15:20:36 -0700216 if (sbi->mntflag & JFS_INLINELOG) {
217 /*
218 * deactivate old inline log
219 */
220 lmLogShutdown(log);
221
222 /*
223 * mark on-disk super block for fs in transition;
224 *
225 * update on-disk superblock for the new space configuration
226 * of inline log space and fsck work space descriptors:
227 * N.B. FS descriptor is NOT updated;
228 *
229 * crash recovery:
230 * logredo(): if FM_EXTENDFS, return to fsck() for cleanup;
231 * fsck(): if FM_EXTENDFS, reformat inline log and fsck
232 * workspace from superblock inline log descriptor and fsck
233 * workspace descriptor;
234 */
235
236 /* read in superblock */
237 if ((rc = readSuper(sb, &bh)))
238 goto error_out;
239 j_sb = (struct jfs_superblock *)bh->b_data;
240
241 /* mark extendfs() in progress */
242 j_sb->s_state |= cpu_to_le32(FM_EXTENDFS);
243 j_sb->s_xsize = cpu_to_le64(newFSSize);
244 PXDaddress(&j_sb->s_xfsckpxd, newFSCKAddress);
245 PXDlength(&j_sb->s_xfsckpxd, newFSCKSize);
246 PXDaddress(&j_sb->s_xlogpxd, newLogAddress);
247 PXDlength(&j_sb->s_xlogpxd, newLogSize);
248
249 /* synchronously update superblock */
250 mark_buffer_dirty(bh);
251 sync_dirty_buffer(bh);
252 brelse(bh);
253
254 /*
255 * format new inline log synchronously;
256 *
257 * crash recovery: if log move in progress,
258 * reformat log and exit success;
259 */
260 if (!log_formatted)
261 if ((rc = lmLogFormat(log, newLogAddress, newLogSize)))
262 goto error_out;
263
264 /*
265 * activate new log
266 */
267 log->base = newLogAddress;
268 log->size = newLogSize >> (L2LOGPSIZE - sb->s_blocksize_bits);
269 if ((rc = lmLogInit(log)))
270 goto error_out;
271 }
272
273 /*
Dave Kleikampf720e3b2007-06-06 15:28:35 -0500274 * extend block allocation map
275 * ---------------------------
Linus Torvalds1da177e2005-04-16 15:20:36 -0700276 *
277 * extendfs() for new extension, retry after crash recovery;
278 *
279 * note: both logredo() and fsck() rebuild map from
280 * the bitmap and configuration parameter from superblock
281 * (disregarding all other control information in the map);
282 *
283 * superblock:
284 * s_size: aggregate size in physical blocks;
285 */
286 /*
Dave Kleikampf720e3b2007-06-06 15:28:35 -0500287 * compute the new block allocation map configuration
Linus Torvalds1da177e2005-04-16 15:20:36 -0700288 *
289 * map dinode:
290 * di_size: map file size in byte;
291 * di_nblocks: number of blocks allocated for map file;
292 * di_mapsize: number of blocks in aggregate (covered by map);
293 * map control page:
294 * db_mapsize: number of blocks in aggregate (covered by map);
295 */
296 newMapSize = newFSSize;
297 /* number of data pages of new bmap file:
298 * roundup new size to full dmap page boundary and
299 * add 1 extra dmap page for next extendfs()
300 */
301 t64 = (newMapSize - 1) + BPERDMAP;
302 newNpages = BLKTODMAPN(t64) + 1;
303
304 /*
Dave Kleikampf720e3b2007-06-06 15:28:35 -0500305 * extend map from current map (WITHOUT growing mapfile)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700306 *
307 * map new extension with unmapped part of the last partial
308 * dmap page, if applicable, and extra page(s) allocated
309 * at end of bmap by mkfs() or previous extendfs();
310 */
311 extendBmap:
312 /* compute number of blocks requested to extend */
313 mapSize = bmp->db_mapsize;
314 XAddress = mapSize; /* eXtension Address */
315 XSize = newMapSize - mapSize; /* eXtension Size */
316 old_agsize = bmp->db_agsize; /* We need to know if this changes */
317
318 /* compute number of blocks that can be extended by current mapfile */
319 t64 = dbMapFileSizeToMapSize(ipbmap);
320 if (mapSize > t64) {
321 printk(KERN_ERR "jfs_extendfs: mapSize (0x%Lx) > t64 (0x%Lx)\n",
322 (long long) mapSize, (long long) t64);
323 rc = -EIO;
324 goto error_out;
325 }
326 nblocks = min(t64 - mapSize, XSize);
327
328 /*
329 * update map pages for new extension:
330 *
331 * update/init dmap and bubble up the control hierarchy
332 * incrementally fold up dmaps into upper levels;
333 * update bmap control page;
334 */
335 if ((rc = dbExtendFS(ipbmap, XAddress, nblocks)))
336 goto error_out;
Bill Pemberton2b0b3952010-04-16 08:01:20 -0500337
338 agsizechanged |= (bmp->db_agsize != old_agsize);
339
Linus Torvalds1da177e2005-04-16 15:20:36 -0700340 /*
341 * the map now has extended to cover additional nblocks:
342 * dn_mapsize = oldMapsize + nblocks;
343 */
344 /* ipbmap->i_mapsize += nblocks; */
345 XSize -= nblocks;
346
347 /*
Dave Kleikampf720e3b2007-06-06 15:28:35 -0500348 * grow map file to cover remaining extension
349 * and/or one extra dmap page for next extendfs();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700350 *
351 * allocate new map pages and its backing blocks, and
352 * update map file xtree
353 */
354 /* compute number of data pages of current bmap file */
355 nPages = ipbmap->i_size >> L2PSIZE;
356
357 /* need to grow map file ? */
358 if (nPages == newNpages)
359 goto finalizeBmap;
360
361 /*
362 * grow bmap file for the new map pages required:
363 *
364 * allocate growth at the start of newly extended region;
365 * bmap file only grows sequentially, i.e., both data pages
366 * and possibly xtree index pages may grow in append mode,
367 * s.t. logredo() can reconstruct pre-extension state
368 * by washing away bmap file of pages outside s_size boundary;
369 */
370 /*
371 * journal map file growth as if a regular file growth:
372 * (note: bmap is created with di_mode = IFJOURNAL|IFREG);
373 *
374 * journaling of bmap file growth is not required since
375 * logredo() do/can not use log records of bmap file growth
376 * but it provides careful write semantics, pmap update, etc.;
377 */
378 /* synchronous write of data pages: bmap data pages are
379 * cached in meta-data cache, and not written out
380 * by txCommit();
381 */
Quorum Laval7cfcd8b2016-08-26 15:40:40 +0100382 rc = filemap_fdatawait(ipbmap->i_mapping);
383 if (rc)
384 goto error_out;
385
386 rc = filemap_write_and_wait(ipbmap->i_mapping);
387 if (rc)
388 goto error_out;
389
Linus Torvalds1da177e2005-04-16 15:20:36 -0700390 diWriteSpecial(ipbmap, 0);
391
392 newPage = nPages; /* first new page number */
393 xoff = newPage << sbi->l2nbperpage;
394 xlen = (newNpages - nPages) << sbi->l2nbperpage;
395 xlen = min(xlen, (int) nblocks) & ~(sbi->nbperpage - 1);
396 xaddr = XAddress;
397
398 tid = txBegin(sb, COMMIT_FORCE);
399
400 if ((rc = xtAppend(tid, ipbmap, 0, xoff, nblocks, &xlen, &xaddr, 0))) {
401 txEnd(tid);
402 goto error_out;
403 }
404 /* update bmap file size */
405 ipbmap->i_size += xlen << sbi->l2bsize;
406 inode_add_bytes(ipbmap, xlen << sbi->l2bsize);
407
408 iplist[0] = ipbmap;
409 rc = txCommit(tid, 1, &iplist[0], COMMIT_FORCE);
410
411 txEnd(tid);
412
413 if (rc)
414 goto error_out;
415
416 /*
417 * map file has been grown now to cover extension to further out;
418 * di_size = new map file size;
419 *
420 * if huge extension, the previous extension based on previous
421 * map file size may not have been sufficient to cover whole extension
422 * (it could have been used up for new map pages),
423 * but the newly grown map file now covers lot bigger new free space
424 * available for further extension of map;
425 */
426 /* any more blocks to extend ? */
427 if (XSize)
428 goto extendBmap;
429
430 finalizeBmap:
431 /* finalize bmap */
432 dbFinalizeBmap(ipbmap);
433
434 /*
Dave Kleikampf720e3b2007-06-06 15:28:35 -0500435 * update inode allocation map
436 * ---------------------------
Linus Torvalds1da177e2005-04-16 15:20:36 -0700437 *
438 * move iag lists from old to new iag;
439 * agstart field is not updated for logredo() to reconstruct
440 * iag lists if system crash occurs.
441 * (computation of ag number from agstart based on agsize
442 * will correctly identify the new ag);
443 */
444 /* if new AG size the same as old AG size, done! */
Bill Pemberton2b0b3952010-04-16 08:01:20 -0500445 if (agsizechanged) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700446 if ((rc = diExtendFS(ipimap, ipbmap)))
447 goto error_out;
448
449 /* finalize imap */
450 if ((rc = diSync(ipimap)))
451 goto error_out;
452 }
453
454 /*
Dave Kleikampf720e3b2007-06-06 15:28:35 -0500455 * finalize
456 * --------
Linus Torvalds1da177e2005-04-16 15:20:36 -0700457 *
458 * extension is committed when on-disk super block is
459 * updated with new descriptors: logredo will recover
460 * crash before it to pre-extension state;
461 */
462
463 /* sync log to skip log replay of bmap file growth transaction; */
464 /* lmLogSync(log, 1); */
465
466 /*
467 * synchronous write bmap global control page;
468 * for crash before completion of write
469 * logredo() will recover to pre-extendfs state;
470 * for crash after completion of write,
471 * logredo() will recover post-extendfs state;
472 */
473 if ((rc = dbSync(ipbmap)))
474 goto error_out;
475
476 /*
477 * copy primary bmap inode to secondary bmap inode
478 */
479
480 ipbmap2 = diReadSpecial(sb, BMAP_I, 1);
481 if (ipbmap2 == NULL) {
482 printk(KERN_ERR "jfs_extendfs: diReadSpecial(bmap) failed\n");
483 goto error_out;
484 }
485 memcpy(&JFS_IP(ipbmap2)->i_xtroot, &JFS_IP(ipbmap)->i_xtroot, 288);
486 ipbmap2->i_size = ipbmap->i_size;
487 ipbmap2->i_blocks = ipbmap->i_blocks;
488
489 diWriteSpecial(ipbmap2, 1);
490 diFreeSpecial(ipbmap2);
491
492 /*
Dave Kleikampf720e3b2007-06-06 15:28:35 -0500493 * update superblock
Linus Torvalds1da177e2005-04-16 15:20:36 -0700494 */
495 if ((rc = readSuper(sb, &bh)))
496 goto error_out;
497 j_sb = (struct jfs_superblock *)bh->b_data;
498
499 /* mark extendfs() completion */
500 j_sb->s_state &= cpu_to_le32(~FM_EXTENDFS);
501 j_sb->s_size = cpu_to_le64(bmp->db_mapsize <<
502 le16_to_cpu(j_sb->s_l2bfactor));
503 j_sb->s_agsize = cpu_to_le32(bmp->db_agsize);
504
505 /* update inline log space descriptor */
506 if (sbi->mntflag & JFS_INLINELOG) {
507 PXDaddress(&(j_sb->s_logpxd), newLogAddress);
508 PXDlength(&(j_sb->s_logpxd), newLogSize);
509 }
510
511 /* record log's mount serial number */
512 j_sb->s_logserial = cpu_to_le32(log->serial);
513
514 /* update fsck work space descriptor */
515 PXDaddress(&(j_sb->s_fsckpxd), newFSCKAddress);
516 PXDlength(&(j_sb->s_fsckpxd), newFSCKSize);
517 j_sb->s_fscklog = 1;
518 /* sb->s_fsckloglen remains the same */
519
520 /* Update secondary superblock */
521 bh2 = sb_bread(sb, SUPER2_OFF >> sb->s_blocksize_bits);
522 if (bh2) {
523 j_sb2 = (struct jfs_superblock *)bh2->b_data;
524 memcpy(j_sb2, j_sb, sizeof (struct jfs_superblock));
525
526 mark_buffer_dirty(bh);
527 sync_dirty_buffer(bh2);
528 brelse(bh2);
529 }
530
531 /* write primary superblock */
532 mark_buffer_dirty(bh);
533 sync_dirty_buffer(bh);
534 brelse(bh);
535
536 goto resume;
537
538 error_out:
Joe Percheseb8630d2013-06-04 16:39:15 -0700539 jfs_error(sb, "\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -0700540
541 resume:
542 /*
Dave Kleikampf720e3b2007-06-06 15:28:35 -0500543 * resume file system transactions
Linus Torvalds1da177e2005-04-16 15:20:36 -0700544 */
545 txResume(sb);
546
547 out:
548 return rc;
549}