Linux Kernel  3.7.1
 All Data Structures Namespaces Files Functions Variables Typedefs Enumerations Enumerator Macros Groups Pages
resize.c
Go to the documentation of this file.
1 /*
2  * Copyright (C) International Business Machines Corp., 2000-2004
3  *
4  * This program is free software; you can redistribute it and/or modify
5  * it under the terms of the GNU General Public License as published by
6  * the Free Software Foundation; either version 2 of the License, or
7  * (at your option) any later version.
8  *
9  * This program is distributed in the hope that it will be useful,
10  * but WITHOUT ANY WARRANTY; without even the implied warranty of
11  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See
12  * the GNU General Public License for more details.
13  *
14  * You should have received a copy of the GNU General Public License
15  * along with this program; if not, write to the Free Software
16  * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
17 */
18 
19 #include <linux/fs.h>
20 #include <linux/buffer_head.h>
21 #include <linux/quotaops.h>
22 #include "jfs_incore.h"
23 #include "jfs_filsys.h"
24 #include "jfs_metapage.h"
25 #include "jfs_dinode.h"
26 #include "jfs_imap.h"
27 #include "jfs_dmap.h"
28 #include "jfs_superblock.h"
29 #include "jfs_txnmgr.h"
30 #include "jfs_debug.h"
31 
/* number of bits in one page (PSIZE is shifted left by 3, i.e. times 8) */
#define BITSPERPAGE	(PSIZE << 3)
/* log2 of one megabyte */
#define L2MEGABYTE	20
/* one megabyte, in bytes */
#define MEGABYTE	(1 << L2MEGABYTE)
/* thirty-two megabytes, in bytes: upper bound of the default inline log */
#define MEGABYTE32	(MEGABYTE << 5)

/*
 * convert block number to bmap file page number
 *
 * Adds one page per 2^13 blocks, one per 2^23 blocks and one per 2^33
 * blocks, plus a fixed offset of 3 + 1 pages.
 * NOTE(review): presumably these are the dmap pages, the two upper
 * dmap control levels and the leading control pages of the bmap file;
 * confirm against jfs_dmap.h.
 * The argument must be a 64-bit value: it is shifted right by 33.
 */
#define BLKTODMAPN(b)\
	(((b) >> 13) + ((b) >> 23) + ((b) >> 33) + 3 + 1)
40 
41 /*
42  * jfs_extendfs()
43  *
44  * function: extend file system;
45  *
46  * |-------------------------------|----------|----------|
47  * file system space fsck inline log
48  * workspace space
49  *
50  * input:
51  * new LVSize: in LV blocks (required)
52  * new LogSize: in LV blocks (optional)
53  * new FSSize: in LV blocks (optional)
54  *
55  * new configuration:
56  * 1. set new LogSize as specified or default from new LVSize;
57  * 2. compute new FSCKSize from new LVSize;
58  * 3. set new FSSize as MIN(FSSize, LVSize-(LogSize+FSCKSize)) where
59  * assert(new FSSize >= old FSSize),
60  * i.e., file system must not be shrunk;
61  */
62 int jfs_extendfs(struct super_block *sb, s64 newLVSize, int newLogSize)
63 {
64  int rc = 0;
65  struct jfs_sb_info *sbi = JFS_SBI(sb);
66  struct inode *ipbmap = sbi->ipbmap;
67  struct inode *ipbmap2;
68  struct inode *ipimap = sbi->ipimap;
69  struct jfs_log *log = sbi->log;
70  struct bmap *bmp = sbi->bmap;
71  s64 newLogAddress, newFSCKAddress;
72  int newFSCKSize;
73  s64 newMapSize = 0, mapSize;
74  s64 XAddress, XSize, nblocks, xoff, xaddr, t64;
75  s64 oldLVSize;
76  s64 newFSSize;
77  s64 VolumeSize;
78  int newNpages = 0, nPages, newPage, xlen, t32;
79  int tid;
80  int log_formatted = 0;
81  struct inode *iplist[1];
82  struct jfs_superblock *j_sb, *j_sb2;
83  s64 old_agsize;
84  int agsizechanged = 0;
85  struct buffer_head *bh, *bh2;
86 
87  /* If the volume hasn't grown, get out now */
88 
89  if (sbi->mntflag & JFS_INLINELOG)
90  oldLVSize = addressPXD(&sbi->logpxd) + lengthPXD(&sbi->logpxd);
91  else
92  oldLVSize = addressPXD(&sbi->fsckpxd) +
93  lengthPXD(&sbi->fsckpxd);
94 
95  if (oldLVSize >= newLVSize) {
97  "jfs_extendfs: volume hasn't grown, returning\n");
98  goto out;
99  }
100 
101  VolumeSize = sb->s_bdev->bd_inode->i_size >> sb->s_blocksize_bits;
102 
103  if (VolumeSize) {
104  if (newLVSize > VolumeSize) {
105  printk(KERN_WARNING "jfs_extendfs: invalid size\n");
106  rc = -EINVAL;
107  goto out;
108  }
109  } else {
110  /* check the device */
111  bh = sb_bread(sb, newLVSize - 1);
112  if (!bh) {
113  printk(KERN_WARNING "jfs_extendfs: invalid size\n");
114  rc = -EINVAL;
115  goto out;
116  }
117  bforget(bh);
118  }
119 
120  /* Can't extend write-protected drive */
121 
122  if (isReadOnly(ipbmap)) {
123  printk(KERN_WARNING "jfs_extendfs: read-only file system\n");
124  rc = -EROFS;
125  goto out;
126  }
127 
128  /*
129  * reconfigure LV spaces
130  * ---------------------
131  *
132  * validate new size, or, if not specified, determine new size
133  */
134 
135  /*
136  * reconfigure inline log space:
137  */
138  if ((sbi->mntflag & JFS_INLINELOG)) {
139  if (newLogSize == 0) {
140  /*
141  * no size specified: default to 1/256 of aggregate
142  * size; rounded up to a megabyte boundary;
143  */
144  newLogSize = newLVSize >> 8;
145  t32 = (1 << (20 - sbi->l2bsize)) - 1;
146  newLogSize = (newLogSize + t32) & ~t32;
147  newLogSize =
148  min(newLogSize, MEGABYTE32 >> sbi->l2bsize);
149  } else {
150  /*
151  * convert the newLogSize to fs blocks.
152  *
153  * Since this is given in megabytes, it will always be
154  * an even number of pages.
155  */
156  newLogSize = (newLogSize * MEGABYTE) >> sbi->l2bsize;
157  }
158 
159  } else
160  newLogSize = 0;
161 
162  newLogAddress = newLVSize - newLogSize;
163 
164  /*
165  * reconfigure fsck work space:
166  *
167  * configure it to the end of the logical volume regardless of
168  * whether file system extends to the end of the aggregate;
169  * Need enough 4k pages to cover:
170  * - 1 bit per block in aggregate rounded up to BPERDMAP boundary
171  * - 1 extra page to handle control page and intermediate level pages
172  * - 50 extra pages for the chkdsk service log
173  */
174  t64 = ((newLVSize - newLogSize + BPERDMAP - 1) >> L2BPERDMAP)
175  << L2BPERDMAP;
176  t32 = DIV_ROUND_UP(t64, BITSPERPAGE) + 1 + 50;
177  newFSCKSize = t32 << sbi->l2nbperpage;
178  newFSCKAddress = newLogAddress - newFSCKSize;
179 
180  /*
181  * compute new file system space;
182  */
183  newFSSize = newLVSize - newLogSize - newFSCKSize;
184 
185  /* file system cannot be shrunk */
186  if (newFSSize < bmp->db_mapsize) {
187  rc = -EINVAL;
188  goto out;
189  }
190 
191  /*
192  * If we're expanding enough that the inline log does not overlap
193  * the old one, we can format the new log before we quiesce the
194  * filesystem.
195  */
196  if ((sbi->mntflag & JFS_INLINELOG) && (newLogAddress > oldLVSize)) {
197  if ((rc = lmLogFormat(log, newLogAddress, newLogSize)))
198  goto out;
199  log_formatted = 1;
200  }
201  /*
202  * quiesce file system
203  *
204  * (prepare to move the inline log and to prevent map update)
205  *
206  * block any new transactions and wait for completion of
207  * all wip transactions and flush modified pages s.t.
208  * on-disk file system is in consistent state and
209  * log is not required for recovery.
210  */
211  txQuiesce(sb);
212 
213  /* Reset size of direct inode */
214  sbi->direct_inode->i_size = sb->s_bdev->bd_inode->i_size;
215 
216  if (sbi->mntflag & JFS_INLINELOG) {
217  /*
218  * deactivate old inline log
219  */
220  lmLogShutdown(log);
221 
222  /*
223  * mark on-disk super block for fs in transition;
224  *
225  * update on-disk superblock for the new space configuration
226  * of inline log space and fsck work space descriptors:
227  * N.B. FS descriptor is NOT updated;
228  *
229  * crash recovery:
230  * logredo(): if FM_EXTENDFS, return to fsck() for cleanup;
231  * fsck(): if FM_EXTENDFS, reformat inline log and fsck
232  * workspace from superblock inline log descriptor and fsck
233  * workspace descriptor;
234  */
235 
236  /* read in superblock */
237  if ((rc = readSuper(sb, &bh)))
238  goto error_out;
239  j_sb = (struct jfs_superblock *)bh->b_data;
240 
241  /* mark extendfs() in progress */
242  j_sb->s_state |= cpu_to_le32(FM_EXTENDFS);
243  j_sb->s_xsize = cpu_to_le64(newFSSize);
244  PXDaddress(&j_sb->s_xfsckpxd, newFSCKAddress);
245  PXDlength(&j_sb->s_xfsckpxd, newFSCKSize);
246  PXDaddress(&j_sb->s_xlogpxd, newLogAddress);
247  PXDlength(&j_sb->s_xlogpxd, newLogSize);
248 
249  /* synchronously update superblock */
250  mark_buffer_dirty(bh);
251  sync_dirty_buffer(bh);
252  brelse(bh);
253 
254  /*
255  * format new inline log synchronously;
256  *
257  * crash recovery: if log move in progress,
258  * reformat log and exit success;
259  */
260  if (!log_formatted)
261  if ((rc = lmLogFormat(log, newLogAddress, newLogSize)))
262  goto error_out;
263 
264  /*
265  * activate new log
266  */
267  log->base = newLogAddress;
268  log->size = newLogSize >> (L2LOGPSIZE - sb->s_blocksize_bits);
269  if ((rc = lmLogInit(log)))
270  goto error_out;
271  }
272 
273  /*
274  * extend block allocation map
275  * ---------------------------
276  *
277  * extendfs() for new extension, retry after crash recovery;
278  *
279  * note: both logredo() and fsck() rebuild map from
280  * the bitmap and configuration parameter from superblock
281  * (disregarding all other control information in the map);
282  *
283  * superblock:
284  * s_size: aggregate size in physical blocks;
285  */
286  /*
287  * compute the new block allocation map configuration
288  *
289  * map dinode:
290  * di_size: map file size in byte;
291  * di_nblocks: number of blocks allocated for map file;
292  * di_mapsize: number of blocks in aggregate (covered by map);
293  * map control page:
294  * db_mapsize: number of blocks in aggregate (covered by map);
295  */
296  newMapSize = newFSSize;
297  /* number of data pages of new bmap file:
298  * roundup new size to full dmap page boundary and
299  * add 1 extra dmap page for next extendfs()
300  */
301  t64 = (newMapSize - 1) + BPERDMAP;
302  newNpages = BLKTODMAPN(t64) + 1;
303 
304  /*
305  * extend map from current map (WITHOUT growing mapfile)
306  *
307  * map new extension with unmapped part of the last partial
308  * dmap page, if applicable, and extra page(s) allocated
309  * at end of bmap by mkfs() or previous extendfs();
310  */
311  extendBmap:
312  /* compute number of blocks requested to extend */
313  mapSize = bmp->db_mapsize;
314  XAddress = mapSize; /* eXtension Address */
315  XSize = newMapSize - mapSize; /* eXtension Size */
316  old_agsize = bmp->db_agsize; /* We need to know if this changes */
317 
318  /* compute number of blocks that can be extended by current mapfile */
319  t64 = dbMapFileSizeToMapSize(ipbmap);
320  if (mapSize > t64) {
321  printk(KERN_ERR "jfs_extendfs: mapSize (0x%Lx) > t64 (0x%Lx)\n",
322  (long long) mapSize, (long long) t64);
323  rc = -EIO;
324  goto error_out;
325  }
326  nblocks = min(t64 - mapSize, XSize);
327 
328  /*
329  * update map pages for new extension:
330  *
331  * update/init dmap and bubble up the control hierarchy
332  * incrementally fold up dmaps into upper levels;
333  * update bmap control page;
334  */
335  if ((rc = dbExtendFS(ipbmap, XAddress, nblocks)))
336  goto error_out;
337 
338  agsizechanged |= (bmp->db_agsize != old_agsize);
339 
340  /*
341  * the map now has extended to cover additional nblocks:
342  * dn_mapsize = oldMapsize + nblocks;
343  */
344  /* ipbmap->i_mapsize += nblocks; */
345  XSize -= nblocks;
346 
347  /*
348  * grow map file to cover remaining extension
349  * and/or one extra dmap page for next extendfs();
350  *
351  * allocate new map pages and its backing blocks, and
352  * update map file xtree
353  */
354  /* compute number of data pages of current bmap file */
355  nPages = ipbmap->i_size >> L2PSIZE;
356 
357  /* need to grow map file ? */
358  if (nPages == newNpages)
359  goto finalizeBmap;
360 
361  /*
362  * grow bmap file for the new map pages required:
363  *
364  * allocate growth at the start of newly extended region;
365  * bmap file only grows sequentially, i.e., both data pages
366  * and possibly xtree index pages may grow in append mode,
367  * s.t. logredo() can reconstruct pre-extension state
368  * by washing away bmap file of pages outside s_size boundary;
369  */
370  /*
371  * journal map file growth as if a regular file growth:
372  * (note: bmap is created with di_mode = IFJOURNAL|IFREG);
373  *
374  * journaling of bmap file growth is not required since
375  * logredo() do/can not use log records of bmap file growth
376  * but it provides careful write semantics, pmap update, etc.;
377  */
378  /* synchronous write of data pages: bmap data pages are
379  * cached in meta-data cache, and not written out
380  * by txCommit();
381  */
382  filemap_fdatawait(ipbmap->i_mapping);
384  diWriteSpecial(ipbmap, 0);
385 
386  newPage = nPages; /* first new page number */
387  xoff = newPage << sbi->l2nbperpage;
388  xlen = (newNpages - nPages) << sbi->l2nbperpage;
389  xlen = min(xlen, (int) nblocks) & ~(sbi->nbperpage - 1);
390  xaddr = XAddress;
391 
392  tid = txBegin(sb, COMMIT_FORCE);
393 
394  if ((rc = xtAppend(tid, ipbmap, 0, xoff, nblocks, &xlen, &xaddr, 0))) {
395  txEnd(tid);
396  goto error_out;
397  }
398  /* update bmap file size */
399  ipbmap->i_size += xlen << sbi->l2bsize;
400  inode_add_bytes(ipbmap, xlen << sbi->l2bsize);
401 
402  iplist[0] = ipbmap;
403  rc = txCommit(tid, 1, &iplist[0], COMMIT_FORCE);
404 
405  txEnd(tid);
406 
407  if (rc)
408  goto error_out;
409 
410  /*
411  * map file has been grown now to cover extension to further out;
412  * di_size = new map file size;
413  *
414  * if huge extension, the previous extension based on previous
415  * map file size may not have been sufficient to cover whole extension
416  * (it could have been used up for new map pages),
417  * but the newly grown map file now covers lot bigger new free space
418  * available for further extension of map;
419  */
420  /* any more blocks to extend ? */
421  if (XSize)
422  goto extendBmap;
423 
424  finalizeBmap:
425  /* finalize bmap */
426  dbFinalizeBmap(ipbmap);
427 
428  /*
429  * update inode allocation map
430  * ---------------------------
431  *
432  * move iag lists from old to new iag;
433  * agstart field is not updated for logredo() to reconstruct
434  * iag lists if system crash occurs.
435  * (computation of ag number from agstart based on agsize
436  * will correctly identify the new ag);
437  */
438  /* if new AG size the same as old AG size, done! */
439  if (agsizechanged) {
440  if ((rc = diExtendFS(ipimap, ipbmap)))
441  goto error_out;
442 
443  /* finalize imap */
444  if ((rc = diSync(ipimap)))
445  goto error_out;
446  }
447 
448  /*
449  * finalize
450  * --------
451  *
452  * extension is committed when on-disk super block is
453  * updated with new descriptors: logredo will recover
454  * crash before it to pre-extension state;
455  */
456 
457  /* sync log to skip log replay of bmap file growth transaction; */
458  /* lmLogSync(log, 1); */
459 
460  /*
461  * synchronous write bmap global control page;
462  * for crash before completion of write
463  * logredo() will recover to pre-extendfs state;
464  * for crash after completion of write,
465  * logredo() will recover post-extendfs state;
466  */
467  if ((rc = dbSync(ipbmap)))
468  goto error_out;
469 
470  /*
471  * copy primary bmap inode to secondary bmap inode
472  */
473 
474  ipbmap2 = diReadSpecial(sb, BMAP_I, 1);
475  if (ipbmap2 == NULL) {
476  printk(KERN_ERR "jfs_extendfs: diReadSpecial(bmap) failed\n");
477  goto error_out;
478  }
479  memcpy(&JFS_IP(ipbmap2)->i_xtroot, &JFS_IP(ipbmap)->i_xtroot, 288);
480  ipbmap2->i_size = ipbmap->i_size;
481  ipbmap2->i_blocks = ipbmap->i_blocks;
482 
483  diWriteSpecial(ipbmap2, 1);
484  diFreeSpecial(ipbmap2);
485 
486  /*
487  * update superblock
488  */
489  if ((rc = readSuper(sb, &bh)))
490  goto error_out;
491  j_sb = (struct jfs_superblock *)bh->b_data;
492 
493  /* mark extendfs() completion */
494  j_sb->s_state &= cpu_to_le32(~FM_EXTENDFS);
495  j_sb->s_size = cpu_to_le64(bmp->db_mapsize <<
496  le16_to_cpu(j_sb->s_l2bfactor));
497  j_sb->s_agsize = cpu_to_le32(bmp->db_agsize);
498 
499  /* update inline log space descriptor */
500  if (sbi->mntflag & JFS_INLINELOG) {
501  PXDaddress(&(j_sb->s_logpxd), newLogAddress);
502  PXDlength(&(j_sb->s_logpxd), newLogSize);
503  }
504 
505  /* record log's mount serial number */
506  j_sb->s_logserial = cpu_to_le32(log->serial);
507 
508  /* update fsck work space descriptor */
509  PXDaddress(&(j_sb->s_fsckpxd), newFSCKAddress);
510  PXDlength(&(j_sb->s_fsckpxd), newFSCKSize);
511  j_sb->s_fscklog = 1;
512  /* sb->s_fsckloglen remains the same */
513 
514  /* Update secondary superblock */
515  bh2 = sb_bread(sb, SUPER2_OFF >> sb->s_blocksize_bits);
516  if (bh2) {
517  j_sb2 = (struct jfs_superblock *)bh2->b_data;
518  memcpy(j_sb2, j_sb, sizeof (struct jfs_superblock));
519 
520  mark_buffer_dirty(bh);
521  sync_dirty_buffer(bh2);
522  brelse(bh2);
523  }
524 
525  /* write primary superblock */
526  mark_buffer_dirty(bh);
527  sync_dirty_buffer(bh);
528  brelse(bh);
529 
530  goto resume;
531 
532  error_out:
533  jfs_error(sb, "jfs_extendfs");
534 
535  resume:
536  /*
537  * resume file system transactions
538  */
539  txResume(sb);
540 
541  out:
542  return rc;
543 }