blob: 8b9a72ae5efa7aa9c63ffffb7b7345a25c3f2c76 [file] [log] [blame]
Thomas Gleixner1a59d1b82019-05-27 08:55:05 +02001// SPDX-License-Identifier: GPL-2.0-or-later
Linus Torvalds1da177e2005-04-16 15:20:36 -07002/*
3 * Copyright (C) International Business Machines Corp., 2000-2004
Linus Torvalds1da177e2005-04-16 15:20:36 -07004*/
5
6#include <linux/fs.h>
7#include <linux/buffer_head.h>
8#include <linux/quotaops.h>
Christoph Hellwig621c1f42020-06-20 09:16:44 +02009#include <linux/blkdev.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070010#include "jfs_incore.h"
11#include "jfs_filsys.h"
12#include "jfs_metapage.h"
13#include "jfs_dinode.h"
14#include "jfs_imap.h"
15#include "jfs_dmap.h"
16#include "jfs_superblock.h"
17#include "jfs_txnmgr.h"
18#include "jfs_debug.h"
19
Dave Kleikampf720e3b2007-06-06 15:28:35 -050020#define BITSPERPAGE (PSIZE << 3)
21#define L2MEGABYTE 20
22#define MEGABYTE (1 << L2MEGABYTE)
23#define MEGABYTE32 (MEGABYTE << 5)
Linus Torvalds1da177e2005-04-16 15:20:36 -070024
25/* convert block number to bmap file page number */
26#define BLKTODMAPN(b)\
Dave Kleikampf720e3b2007-06-06 15:28:35 -050027 (((b) >> 13) + ((b) >> 23) + ((b) >> 33) + 3 + 1)
Linus Torvalds1da177e2005-04-16 15:20:36 -070028
29/*
Dave Kleikampf720e3b2007-06-06 15:28:35 -050030 * jfs_extendfs()
Linus Torvalds1da177e2005-04-16 15:20:36 -070031 *
32 * function: extend file system;
33 *
34 * |-------------------------------|----------|----------|
35 * file system space fsck inline log
36 * workspace space
37 *
38 * input:
Dave Kleikampf720e3b2007-06-06 15:28:35 -050039 * new LVSize: in LV blocks (required)
40 * new LogSize: in LV blocks (optional)
41 * new FSSize: in LV blocks (optional)
Linus Torvalds1da177e2005-04-16 15:20:36 -070042 *
43 * new configuration:
44 * 1. set new LogSize as specified or default from new LVSize;
45 * 2. compute new FSCKSize from new LVSize;
46 * 3. set new FSSize as MIN(FSSize, LVSize-(LogSize+FSCKSize)) where
47 * assert(new FSSize >= old FSSize),
Lucas De Marchi25985ed2011-03-30 22:57:33 -030048 * i.e., file system must not be shrunk;
Linus Torvalds1da177e2005-04-16 15:20:36 -070049 */
50int jfs_extendfs(struct super_block *sb, s64 newLVSize, int newLogSize)
51{
52 int rc = 0;
53 struct jfs_sb_info *sbi = JFS_SBI(sb);
54 struct inode *ipbmap = sbi->ipbmap;
55 struct inode *ipbmap2;
56 struct inode *ipimap = sbi->ipimap;
57 struct jfs_log *log = sbi->log;
58 struct bmap *bmp = sbi->bmap;
59 s64 newLogAddress, newFSCKAddress;
60 int newFSCKSize;
61 s64 newMapSize = 0, mapSize;
62 s64 XAddress, XSize, nblocks, xoff, xaddr, t64;
63 s64 oldLVSize;
64 s64 newFSSize;
65 s64 VolumeSize;
66 int newNpages = 0, nPages, newPage, xlen, t32;
67 int tid;
68 int log_formatted = 0;
69 struct inode *iplist[1];
70 struct jfs_superblock *j_sb, *j_sb2;
Dave Kleikamp206b6312011-06-20 10:30:04 -050071 s64 old_agsize;
Bill Pemberton2b0b3952010-04-16 08:01:20 -050072 int agsizechanged = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -070073 struct buffer_head *bh, *bh2;
74
75 /* If the volume hasn't grown, get out now */
76
77 if (sbi->mntflag & JFS_INLINELOG)
78 oldLVSize = addressPXD(&sbi->logpxd) + lengthPXD(&sbi->logpxd);
79 else
80 oldLVSize = addressPXD(&sbi->fsckpxd) +
81 lengthPXD(&sbi->fsckpxd);
82
83 if (oldLVSize >= newLVSize) {
84 printk(KERN_WARNING
85 "jfs_extendfs: volume hasn't grown, returning\n");
86 goto out;
87 }
88
Christoph Hellwigdd0c0bd2021-10-18 12:11:27 +020089 VolumeSize = sb_bdev_nr_blocks(sb);
Linus Torvalds1da177e2005-04-16 15:20:36 -070090 if (VolumeSize) {
91 if (newLVSize > VolumeSize) {
92 printk(KERN_WARNING "jfs_extendfs: invalid size\n");
93 rc = -EINVAL;
94 goto out;
95 }
96 } else {
97 /* check the device */
98 bh = sb_bread(sb, newLVSize - 1);
99 if (!bh) {
100 printk(KERN_WARNING "jfs_extendfs: invalid size\n");
101 rc = -EINVAL;
102 goto out;
103 }
104 bforget(bh);
105 }
106
107 /* Can't extend write-protected drive */
108
109 if (isReadOnly(ipbmap)) {
110 printk(KERN_WARNING "jfs_extendfs: read-only file system\n");
111 rc = -EROFS;
112 goto out;
113 }
114
115 /*
Dave Kleikampf720e3b2007-06-06 15:28:35 -0500116 * reconfigure LV spaces
117 * ---------------------
Linus Torvalds1da177e2005-04-16 15:20:36 -0700118 *
119 * validate new size, or, if not specified, determine new size
120 */
121
122 /*
123 * reconfigure inline log space:
124 */
125 if ((sbi->mntflag & JFS_INLINELOG)) {
126 if (newLogSize == 0) {
127 /*
128 * no size specified: default to 1/256 of aggregate
129 * size; rounded up to a megabyte boundary;
130 */
131 newLogSize = newLVSize >> 8;
132 t32 = (1 << (20 - sbi->l2bsize)) - 1;
133 newLogSize = (newLogSize + t32) & ~t32;
134 newLogSize =
135 min(newLogSize, MEGABYTE32 >> sbi->l2bsize);
136 } else {
137 /*
138 * convert the newLogSize to fs blocks.
139 *
140 * Since this is given in megabytes, it will always be
141 * an even number of pages.
142 */
143 newLogSize = (newLogSize * MEGABYTE) >> sbi->l2bsize;
144 }
145
146 } else
147 newLogSize = 0;
148
149 newLogAddress = newLVSize - newLogSize;
150
151 /*
152 * reconfigure fsck work space:
153 *
154 * configure it to the end of the logical volume regardless of
155 * whether file system extends to the end of the aggregate;
156 * Need enough 4k pages to cover:
157 * - 1 bit per block in aggregate rounded up to BPERDMAP boundary
158 * - 1 extra page to handle control page and intermediate level pages
159 * - 50 extra pages for the chkdsk service log
160 */
161 t64 = ((newLVSize - newLogSize + BPERDMAP - 1) >> L2BPERDMAP)
162 << L2BPERDMAP;
Shaun Zincka7fe0ba2007-08-31 12:57:28 -0500163 t32 = DIV_ROUND_UP(t64, BITSPERPAGE) + 1 + 50;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700164 newFSCKSize = t32 << sbi->l2nbperpage;
165 newFSCKAddress = newLogAddress - newFSCKSize;
166
167 /*
168 * compute new file system space;
169 */
170 newFSSize = newLVSize - newLogSize - newFSCKSize;
171
Lucas De Marchi25985ed2011-03-30 22:57:33 -0300172 /* file system cannot be shrunk */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700173 if (newFSSize < bmp->db_mapsize) {
174 rc = -EINVAL;
175 goto out;
176 }
177
178 /*
179 * If we're expanding enough that the inline log does not overlap
180 * the old one, we can format the new log before we quiesce the
181 * filesystem.
182 */
183 if ((sbi->mntflag & JFS_INLINELOG) && (newLogAddress > oldLVSize)) {
184 if ((rc = lmLogFormat(log, newLogAddress, newLogSize)))
185 goto out;
186 log_formatted = 1;
187 }
188 /*
Dave Kleikampf720e3b2007-06-06 15:28:35 -0500189 * quiesce file system
Linus Torvalds1da177e2005-04-16 15:20:36 -0700190 *
191 * (prepare to move the inline log and to prevent map update)
192 *
193 * block any new transactions and wait for completion of
194 * all wip transactions and flush modified pages s.t.
195 * on-disk file system is in consistent state and
196 * log is not required for recovery.
197 */
198 txQuiesce(sb);
199
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600200 /* Reset size of direct inode */
Christoph Hellwig74e157e2021-10-18 12:11:17 +0200201 sbi->direct_inode->i_size = bdev_nr_bytes(sb->s_bdev);
Dave Kleikamp7fab4792005-05-02 12:25:02 -0600202
Linus Torvalds1da177e2005-04-16 15:20:36 -0700203 if (sbi->mntflag & JFS_INLINELOG) {
204 /*
205 * deactivate old inline log
206 */
207 lmLogShutdown(log);
208
209 /*
210 * mark on-disk super block for fs in transition;
211 *
212 * update on-disk superblock for the new space configuration
213 * of inline log space and fsck work space descriptors:
214 * N.B. FS descriptor is NOT updated;
215 *
216 * crash recovery:
217 * logredo(): if FM_EXTENDFS, return to fsck() for cleanup;
218 * fsck(): if FM_EXTENDFS, reformat inline log and fsck
219 * workspace from superblock inline log descriptor and fsck
220 * workspace descriptor;
221 */
222
223 /* read in superblock */
224 if ((rc = readSuper(sb, &bh)))
225 goto error_out;
226 j_sb = (struct jfs_superblock *)bh->b_data;
227
228 /* mark extendfs() in progress */
229 j_sb->s_state |= cpu_to_le32(FM_EXTENDFS);
230 j_sb->s_xsize = cpu_to_le64(newFSSize);
231 PXDaddress(&j_sb->s_xfsckpxd, newFSCKAddress);
232 PXDlength(&j_sb->s_xfsckpxd, newFSCKSize);
233 PXDaddress(&j_sb->s_xlogpxd, newLogAddress);
234 PXDlength(&j_sb->s_xlogpxd, newLogSize);
235
236 /* synchronously update superblock */
237 mark_buffer_dirty(bh);
238 sync_dirty_buffer(bh);
239 brelse(bh);
240
241 /*
242 * format new inline log synchronously;
243 *
244 * crash recovery: if log move in progress,
245 * reformat log and exit success;
246 */
247 if (!log_formatted)
248 if ((rc = lmLogFormat(log, newLogAddress, newLogSize)))
249 goto error_out;
250
251 /*
252 * activate new log
253 */
254 log->base = newLogAddress;
255 log->size = newLogSize >> (L2LOGPSIZE - sb->s_blocksize_bits);
256 if ((rc = lmLogInit(log)))
257 goto error_out;
258 }
259
260 /*
Dave Kleikampf720e3b2007-06-06 15:28:35 -0500261 * extend block allocation map
262 * ---------------------------
Linus Torvalds1da177e2005-04-16 15:20:36 -0700263 *
264 * extendfs() for new extension, retry after crash recovery;
265 *
266 * note: both logredo() and fsck() rebuild map from
267 * the bitmap and configuration parameter from superblock
268 * (disregarding all other control information in the map);
269 *
270 * superblock:
271 * s_size: aggregate size in physical blocks;
272 */
273 /*
Dave Kleikampf720e3b2007-06-06 15:28:35 -0500274 * compute the new block allocation map configuration
Linus Torvalds1da177e2005-04-16 15:20:36 -0700275 *
276 * map dinode:
277 * di_size: map file size in byte;
278 * di_nblocks: number of blocks allocated for map file;
279 * di_mapsize: number of blocks in aggregate (covered by map);
280 * map control page:
281 * db_mapsize: number of blocks in aggregate (covered by map);
282 */
283 newMapSize = newFSSize;
284 /* number of data pages of new bmap file:
285 * roundup new size to full dmap page boundary and
286 * add 1 extra dmap page for next extendfs()
287 */
288 t64 = (newMapSize - 1) + BPERDMAP;
289 newNpages = BLKTODMAPN(t64) + 1;
290
291 /*
Dave Kleikampf720e3b2007-06-06 15:28:35 -0500292 * extend map from current map (WITHOUT growing mapfile)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700293 *
294 * map new extension with unmapped part of the last partial
295 * dmap page, if applicable, and extra page(s) allocated
296 * at end of bmap by mkfs() or previous extendfs();
297 */
298 extendBmap:
299 /* compute number of blocks requested to extend */
300 mapSize = bmp->db_mapsize;
301 XAddress = mapSize; /* eXtension Address */
302 XSize = newMapSize - mapSize; /* eXtension Size */
303 old_agsize = bmp->db_agsize; /* We need to know if this changes */
304
305 /* compute number of blocks that can be extended by current mapfile */
306 t64 = dbMapFileSizeToMapSize(ipbmap);
307 if (mapSize > t64) {
308 printk(KERN_ERR "jfs_extendfs: mapSize (0x%Lx) > t64 (0x%Lx)\n",
309 (long long) mapSize, (long long) t64);
310 rc = -EIO;
311 goto error_out;
312 }
313 nblocks = min(t64 - mapSize, XSize);
314
315 /*
316 * update map pages for new extension:
317 *
318 * update/init dmap and bubble up the control hierarchy
319 * incrementally fold up dmaps into upper levels;
320 * update bmap control page;
321 */
322 if ((rc = dbExtendFS(ipbmap, XAddress, nblocks)))
323 goto error_out;
Bill Pemberton2b0b3952010-04-16 08:01:20 -0500324
325 agsizechanged |= (bmp->db_agsize != old_agsize);
326
Linus Torvalds1da177e2005-04-16 15:20:36 -0700327 /*
328 * the map now has extended to cover additional nblocks:
329 * dn_mapsize = oldMapsize + nblocks;
330 */
331 /* ipbmap->i_mapsize += nblocks; */
332 XSize -= nblocks;
333
334 /*
Dave Kleikampf720e3b2007-06-06 15:28:35 -0500335 * grow map file to cover remaining extension
336 * and/or one extra dmap page for next extendfs();
Linus Torvalds1da177e2005-04-16 15:20:36 -0700337 *
338 * allocate new map pages and its backing blocks, and
339 * update map file xtree
340 */
341 /* compute number of data pages of current bmap file */
342 nPages = ipbmap->i_size >> L2PSIZE;
343
344 /* need to grow map file ? */
345 if (nPages == newNpages)
346 goto finalizeBmap;
347
348 /*
349 * grow bmap file for the new map pages required:
350 *
351 * allocate growth at the start of newly extended region;
352 * bmap file only grows sequentially, i.e., both data pages
353 * and possibly xtree index pages may grow in append mode,
354 * s.t. logredo() can reconstruct pre-extension state
355 * by washing away bmap file of pages outside s_size boundary;
356 */
357 /*
358 * journal map file growth as if a regular file growth:
359 * (note: bmap is created with di_mode = IFJOURNAL|IFREG);
360 *
361 * journaling of bmap file growth is not required since
362 * logredo() do/can not use log records of bmap file growth
363 * but it provides careful write semantics, pmap update, etc.;
364 */
365 /* synchronous write of data pages: bmap data pages are
366 * cached in meta-data cache, and not written out
367 * by txCommit();
368 */
Quorum Laval7cfcd8b2016-08-26 15:40:40 +0100369 rc = filemap_fdatawait(ipbmap->i_mapping);
370 if (rc)
371 goto error_out;
372
373 rc = filemap_write_and_wait(ipbmap->i_mapping);
374 if (rc)
375 goto error_out;
376
Linus Torvalds1da177e2005-04-16 15:20:36 -0700377 diWriteSpecial(ipbmap, 0);
378
379 newPage = nPages; /* first new page number */
380 xoff = newPage << sbi->l2nbperpage;
381 xlen = (newNpages - nPages) << sbi->l2nbperpage;
382 xlen = min(xlen, (int) nblocks) & ~(sbi->nbperpage - 1);
383 xaddr = XAddress;
384
385 tid = txBegin(sb, COMMIT_FORCE);
386
387 if ((rc = xtAppend(tid, ipbmap, 0, xoff, nblocks, &xlen, &xaddr, 0))) {
388 txEnd(tid);
389 goto error_out;
390 }
391 /* update bmap file size */
392 ipbmap->i_size += xlen << sbi->l2bsize;
393 inode_add_bytes(ipbmap, xlen << sbi->l2bsize);
394
395 iplist[0] = ipbmap;
396 rc = txCommit(tid, 1, &iplist[0], COMMIT_FORCE);
397
398 txEnd(tid);
399
400 if (rc)
401 goto error_out;
402
403 /*
404 * map file has been grown now to cover extension to further out;
405 * di_size = new map file size;
406 *
407 * if huge extension, the previous extension based on previous
408 * map file size may not have been sufficient to cover whole extension
409 * (it could have been used up for new map pages),
410 * but the newly grown map file now covers lot bigger new free space
411 * available for further extension of map;
412 */
413 /* any more blocks to extend ? */
414 if (XSize)
415 goto extendBmap;
416
417 finalizeBmap:
418 /* finalize bmap */
419 dbFinalizeBmap(ipbmap);
420
421 /*
Dave Kleikampf720e3b2007-06-06 15:28:35 -0500422 * update inode allocation map
423 * ---------------------------
Linus Torvalds1da177e2005-04-16 15:20:36 -0700424 *
425 * move iag lists from old to new iag;
426 * agstart field is not updated for logredo() to reconstruct
427 * iag lists if system crash occurs.
428 * (computation of ag number from agstart based on agsize
429 * will correctly identify the new ag);
430 */
431 /* if new AG size the same as old AG size, done! */
Bill Pemberton2b0b3952010-04-16 08:01:20 -0500432 if (agsizechanged) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700433 if ((rc = diExtendFS(ipimap, ipbmap)))
434 goto error_out;
435
436 /* finalize imap */
437 if ((rc = diSync(ipimap)))
438 goto error_out;
439 }
440
441 /*
Dave Kleikampf720e3b2007-06-06 15:28:35 -0500442 * finalize
443 * --------
Linus Torvalds1da177e2005-04-16 15:20:36 -0700444 *
445 * extension is committed when on-disk super block is
446 * updated with new descriptors: logredo will recover
447 * crash before it to pre-extension state;
448 */
449
450 /* sync log to skip log replay of bmap file growth transaction; */
451 /* lmLogSync(log, 1); */
452
453 /*
454 * synchronous write bmap global control page;
455 * for crash before completion of write
456 * logredo() will recover to pre-extendfs state;
457 * for crash after completion of write,
458 * logredo() will recover post-extendfs state;
459 */
460 if ((rc = dbSync(ipbmap)))
461 goto error_out;
462
463 /*
464 * copy primary bmap inode to secondary bmap inode
465 */
466
467 ipbmap2 = diReadSpecial(sb, BMAP_I, 1);
468 if (ipbmap2 == NULL) {
469 printk(KERN_ERR "jfs_extendfs: diReadSpecial(bmap) failed\n");
470 goto error_out;
471 }
472 memcpy(&JFS_IP(ipbmap2)->i_xtroot, &JFS_IP(ipbmap)->i_xtroot, 288);
473 ipbmap2->i_size = ipbmap->i_size;
474 ipbmap2->i_blocks = ipbmap->i_blocks;
475
476 diWriteSpecial(ipbmap2, 1);
477 diFreeSpecial(ipbmap2);
478
479 /*
Dave Kleikampf720e3b2007-06-06 15:28:35 -0500480 * update superblock
Linus Torvalds1da177e2005-04-16 15:20:36 -0700481 */
482 if ((rc = readSuper(sb, &bh)))
483 goto error_out;
484 j_sb = (struct jfs_superblock *)bh->b_data;
485
486 /* mark extendfs() completion */
487 j_sb->s_state &= cpu_to_le32(~FM_EXTENDFS);
488 j_sb->s_size = cpu_to_le64(bmp->db_mapsize <<
489 le16_to_cpu(j_sb->s_l2bfactor));
490 j_sb->s_agsize = cpu_to_le32(bmp->db_agsize);
491
492 /* update inline log space descriptor */
493 if (sbi->mntflag & JFS_INLINELOG) {
494 PXDaddress(&(j_sb->s_logpxd), newLogAddress);
495 PXDlength(&(j_sb->s_logpxd), newLogSize);
496 }
497
498 /* record log's mount serial number */
499 j_sb->s_logserial = cpu_to_le32(log->serial);
500
501 /* update fsck work space descriptor */
502 PXDaddress(&(j_sb->s_fsckpxd), newFSCKAddress);
503 PXDlength(&(j_sb->s_fsckpxd), newFSCKSize);
504 j_sb->s_fscklog = 1;
505 /* sb->s_fsckloglen remains the same */
506
507 /* Update secondary superblock */
508 bh2 = sb_bread(sb, SUPER2_OFF >> sb->s_blocksize_bits);
509 if (bh2) {
510 j_sb2 = (struct jfs_superblock *)bh2->b_data;
511 memcpy(j_sb2, j_sb, sizeof (struct jfs_superblock));
512
513 mark_buffer_dirty(bh);
514 sync_dirty_buffer(bh2);
515 brelse(bh2);
516 }
517
518 /* write primary superblock */
519 mark_buffer_dirty(bh);
520 sync_dirty_buffer(bh);
521 brelse(bh);
522
523 goto resume;
524
525 error_out:
Joe Percheseb8630d2013-06-04 16:39:15 -0700526 jfs_error(sb, "\n");
Linus Torvalds1da177e2005-04-16 15:20:36 -0700527
528 resume:
529 /*
Dave Kleikampf720e3b2007-06-06 15:28:35 -0500530 * resume file system transactions
Linus Torvalds1da177e2005-04-16 15:20:36 -0700531 */
532 txResume(sb);
533
534 out:
535 return rc;
536}