Blame - fs/jfs/resize.c - kernel/msm-4.9

blob: c6dc254d325325ba247142e39d75abfb072b7a58 [file] [log] [blame]

Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1	/*
				2	* Copyright (C) International Business Machines Corp., 2000-2004
				3	*
				4	* This program is free software; you can redistribute it and/or modify
				5	* it under the terms of the GNU General Public License as published by
				6	* the Free Software Foundation; either version 2 of the License, or
				7	* (at your option) any later version.
				8	*
				9	* This program is distributed in the hope that it will be useful,
				10	* but WITHOUT ANY WARRANTY; without even the implied warranty of
				11	* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See
				12	* the GNU General Public License for more details.
				13	*
				14	* You should have received a copy of the GNU General Public License
				15	* along with this program; if not, write to the Free Software
				16	* Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
				17	*/
				18
				19	#include <linux/fs.h>
				20	#include <linux/buffer_head.h>
				21	#include <linux/quotaops.h>
				22	#include "jfs_incore.h"
				23	#include "jfs_filsys.h"
				24	#include "jfs_metapage.h"
				25	#include "jfs_dinode.h"
				26	#include "jfs_imap.h"
				27	#include "jfs_dmap.h"
				28	#include "jfs_superblock.h"
				29	#include "jfs_txnmgr.h"
				30	#include "jfs_debug.h"
				31
				32	#define BITSPERPAGE (PSIZE << 3)
				33	#define L2MEGABYTE 20
				34	#define MEGABYTE (1 << L2MEGABYTE)
				35	#define MEGABYTE32 (MEGABYTE << 5)
				36
				37	/* convert block number to bmap file page number */
				38	#define BLKTODMAPN(b)\
				39	(((b) >> 13) + ((b) >> 23) + ((b) >> 33) + 3 + 1)
				40
				41	/*
				42	* jfs_extendfs()
				43	*
				44	* function: extend file system;
				45	*
				46	* \|-------------------------------\|----------\|----------\|
				47	* file system space fsck inline log
				48	* workspace space
				49	*
				50	* input:
				51	* new LVSize: in LV blocks (required)
				52	* new LogSize: in LV blocks (optional)
				53	* new FSSize: in LV blocks (optional)
				54	*
				55	* new configuration:
				56	* 1. set new LogSize as specified or default from new LVSize;
				57	* 2. compute new FSCKSize from new LVSize;
				58	* 3. set new FSSize as MIN(FSSize, LVSize-(LogSize+FSCKSize)) where
				59	* assert(new FSSize >= old FSSize),
				60	* i.e., file system must not be shrinked;
				61	*/
				62	int jfs_extendfs(struct super_block *sb, s64 newLVSize, int newLogSize)
				63	{
				64	int rc = 0;
				65	struct jfs_sb_info *sbi = JFS_SBI(sb);
				66	struct inode *ipbmap = sbi->ipbmap;
				67	struct inode *ipbmap2;
				68	struct inode *ipimap = sbi->ipimap;
				69	struct jfs_log *log = sbi->log;
				70	struct bmap *bmp = sbi->bmap;
				71	s64 newLogAddress, newFSCKAddress;
				72	int newFSCKSize;
				73	s64 newMapSize = 0, mapSize;
				74	s64 XAddress, XSize, nblocks, xoff, xaddr, t64;
				75	s64 oldLVSize;
				76	s64 newFSSize;
				77	s64 VolumeSize;
				78	int newNpages = 0, nPages, newPage, xlen, t32;
				79	int tid;
				80	int log_formatted = 0;
				81	struct inode *iplist[1];
				82	struct jfs_superblock j_sb, j_sb2;
				83	uint old_agsize;
				84	struct buffer_head bh, bh2;
				85
				86	/* If the volume hasn't grown, get out now */
				87
				88	if (sbi->mntflag & JFS_INLINELOG)
				89	oldLVSize = addressPXD(&sbi->logpxd) + lengthPXD(&sbi->logpxd);
				90	else
				91	oldLVSize = addressPXD(&sbi->fsckpxd) +
				92	lengthPXD(&sbi->fsckpxd);
				93
				94	if (oldLVSize >= newLVSize) {
				95	printk(KERN_WARNING
				96	"jfs_extendfs: volume hasn't grown, returning\n");
				97	goto out;
				98	}
				99
				100	VolumeSize = sb->s_bdev->bd_inode->i_size >> sb->s_blocksize_bits;
				101
				102	if (VolumeSize) {
				103	if (newLVSize > VolumeSize) {
				104	printk(KERN_WARNING "jfs_extendfs: invalid size\n");
				105	rc = -EINVAL;
				106	goto out;
				107	}
				108	} else {
				109	/* check the device */
				110	bh = sb_bread(sb, newLVSize - 1);
				111	if (!bh) {
				112	printk(KERN_WARNING "jfs_extendfs: invalid size\n");
				113	rc = -EINVAL;
				114	goto out;
				115	}
				116	bforget(bh);
				117	}
				118
				119	/* Can't extend write-protected drive */
				120
				121	if (isReadOnly(ipbmap)) {
				122	printk(KERN_WARNING "jfs_extendfs: read-only file system\n");
				123	rc = -EROFS;
				124	goto out;
				125	}
				126
				127	/*
				128	* reconfigure LV spaces
				129	* ---------------------
				130	*
				131	* validate new size, or, if not specified, determine new size
				132	*/
				133
				134	/*
				135	* reconfigure inline log space:
				136	*/
				137	if ((sbi->mntflag & JFS_INLINELOG)) {
				138	if (newLogSize == 0) {
				139	/*
				140	* no size specified: default to 1/256 of aggregate
				141	* size; rounded up to a megabyte boundary;
				142	*/
				143	newLogSize = newLVSize >> 8;
				144	t32 = (1 << (20 - sbi->l2bsize)) - 1;
				145	newLogSize = (newLogSize + t32) & ~t32;
				146	newLogSize =
				147	min(newLogSize, MEGABYTE32 >> sbi->l2bsize);
				148	} else {
				149	/*
				150	* convert the newLogSize to fs blocks.
				151	*
				152	* Since this is given in megabytes, it will always be
				153	* an even number of pages.
				154	*/
				155	newLogSize = (newLogSize * MEGABYTE) >> sbi->l2bsize;
				156	}
				157
				158	} else
				159	newLogSize = 0;
				160
				161	newLogAddress = newLVSize - newLogSize;
				162
				163	/*
				164	* reconfigure fsck work space:
				165	*
				166	* configure it to the end of the logical volume regardless of
				167	* whether file system extends to the end of the aggregate;
				168	* Need enough 4k pages to cover:
				169	* - 1 bit per block in aggregate rounded up to BPERDMAP boundary
				170	* - 1 extra page to handle control page and intermediate level pages
				171	* - 50 extra pages for the chkdsk service log
				172	*/
				173	t64 = ((newLVSize - newLogSize + BPERDMAP - 1) >> L2BPERDMAP)
				174	<< L2BPERDMAP;
				175	t32 = ((t64 + (BITSPERPAGE - 1)) / BITSPERPAGE) + 1 + 50;
				176	newFSCKSize = t32 << sbi->l2nbperpage;
				177	newFSCKAddress = newLogAddress - newFSCKSize;
				178
				179	/*
				180	* compute new file system space;
				181	*/
				182	newFSSize = newLVSize - newLogSize - newFSCKSize;
				183
				184	/* file system cannot be shrinked */
				185	if (newFSSize < bmp->db_mapsize) {
				186	rc = -EINVAL;
				187	goto out;
				188	}
				189
				190	/*
				191	* If we're expanding enough that the inline log does not overlap
				192	* the old one, we can format the new log before we quiesce the
				193	* filesystem.
				194	*/
				195	if ((sbi->mntflag & JFS_INLINELOG) && (newLogAddress > oldLVSize)) {
				196	if ((rc = lmLogFormat(log, newLogAddress, newLogSize)))
				197	goto out;
				198	log_formatted = 1;
				199	}
				200	/*
				201	* quiesce file system
				202	*
				203	* (prepare to move the inline log and to prevent map update)
				204	*
				205	* block any new transactions and wait for completion of
				206	* all wip transactions and flush modified pages s.t.
				207	* on-disk file system is in consistent state and
				208	* log is not required for recovery.
				209	*/
				210	txQuiesce(sb);
				211
Dave Kleikamp	7fab479	2005-05-02 12:25:02 -0600	[diff] [blame]	212	/* Reset size of direct inode */
				213	sbi->direct_inode->i_size = sb->s_bdev->bd_inode->i_size;
				214
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	215	if (sbi->mntflag & JFS_INLINELOG) {
				216	/*
				217	* deactivate old inline log
				218	*/
				219	lmLogShutdown(log);
				220
				221	/*
				222	* mark on-disk super block for fs in transition;
				223	*
				224	* update on-disk superblock for the new space configuration
				225	* of inline log space and fsck work space descriptors:
				226	* N.B. FS descriptor is NOT updated;
				227	*
				228	* crash recovery:
				229	* logredo(): if FM_EXTENDFS, return to fsck() for cleanup;
				230	* fsck(): if FM_EXTENDFS, reformat inline log and fsck
				231	* workspace from superblock inline log descriptor and fsck
				232	* workspace descriptor;
				233	*/
				234
				235	/* read in superblock */
				236	if ((rc = readSuper(sb, &bh)))
				237	goto error_out;
				238	j_sb = (struct jfs_superblock *)bh->b_data;
				239
				240	/* mark extendfs() in progress */
				241	j_sb->s_state \|= cpu_to_le32(FM_EXTENDFS);
				242	j_sb->s_xsize = cpu_to_le64(newFSSize);
				243	PXDaddress(&j_sb->s_xfsckpxd, newFSCKAddress);
				244	PXDlength(&j_sb->s_xfsckpxd, newFSCKSize);
				245	PXDaddress(&j_sb->s_xlogpxd, newLogAddress);
				246	PXDlength(&j_sb->s_xlogpxd, newLogSize);
				247
				248	/* synchronously update superblock */
				249	mark_buffer_dirty(bh);
				250	sync_dirty_buffer(bh);
				251	brelse(bh);
				252
				253	/*
				254	* format new inline log synchronously;
				255	*
				256	* crash recovery: if log move in progress,
				257	* reformat log and exit success;
				258	*/
				259	if (!log_formatted)
				260	if ((rc = lmLogFormat(log, newLogAddress, newLogSize)))
				261	goto error_out;
				262
				263	/*
				264	* activate new log
				265	*/
				266	log->base = newLogAddress;
				267	log->size = newLogSize >> (L2LOGPSIZE - sb->s_blocksize_bits);
				268	if ((rc = lmLogInit(log)))
				269	goto error_out;
				270	}
				271
				272	/*
				273	* extend block allocation map
				274	* ---------------------------
				275	*
				276	* extendfs() for new extension, retry after crash recovery;
				277	*
				278	* note: both logredo() and fsck() rebuild map from
				279	* the bitmap and configuration parameter from superblock
				280	* (disregarding all other control information in the map);
				281	*
				282	* superblock:
				283	* s_size: aggregate size in physical blocks;
				284	*/
				285	/*
				286	* compute the new block allocation map configuration
				287	*
				288	* map dinode:
				289	* di_size: map file size in byte;
				290	* di_nblocks: number of blocks allocated for map file;
				291	* di_mapsize: number of blocks in aggregate (covered by map);
				292	* map control page:
				293	* db_mapsize: number of blocks in aggregate (covered by map);
				294	*/
				295	newMapSize = newFSSize;
				296	/* number of data pages of new bmap file:
				297	* roundup new size to full dmap page boundary and
				298	* add 1 extra dmap page for next extendfs()
				299	*/
				300	t64 = (newMapSize - 1) + BPERDMAP;
				301	newNpages = BLKTODMAPN(t64) + 1;
				302
				303	/*
				304	* extend map from current map (WITHOUT growing mapfile)
				305	*
				306	* map new extension with unmapped part of the last partial
				307	* dmap page, if applicable, and extra page(s) allocated
				308	* at end of bmap by mkfs() or previous extendfs();
				309	*/
				310	extendBmap:
				311	/* compute number of blocks requested to extend */
				312	mapSize = bmp->db_mapsize;
				313	XAddress = mapSize; /* eXtension Address */
				314	XSize = newMapSize - mapSize; /* eXtension Size */
				315	old_agsize = bmp->db_agsize; /* We need to know if this changes */
				316
				317	/* compute number of blocks that can be extended by current mapfile */
				318	t64 = dbMapFileSizeToMapSize(ipbmap);
				319	if (mapSize > t64) {
				320	printk(KERN_ERR "jfs_extendfs: mapSize (0x%Lx) > t64 (0x%Lx)\n",
				321	(long long) mapSize, (long long) t64);
				322	rc = -EIO;
				323	goto error_out;
				324	}
				325	nblocks = min(t64 - mapSize, XSize);
				326
				327	/*
				328	* update map pages for new extension:
				329	*
				330	* update/init dmap and bubble up the control hierarchy
				331	* incrementally fold up dmaps into upper levels;
				332	* update bmap control page;
				333	*/
				334	if ((rc = dbExtendFS(ipbmap, XAddress, nblocks)))
				335	goto error_out;
				336	/*
				337	* the map now has extended to cover additional nblocks:
				338	* dn_mapsize = oldMapsize + nblocks;
				339	*/
				340	/* ipbmap->i_mapsize += nblocks; */
				341	XSize -= nblocks;
				342
				343	/*
				344	* grow map file to cover remaining extension
				345	* and/or one extra dmap page for next extendfs();
				346	*
				347	* allocate new map pages and its backing blocks, and
				348	* update map file xtree
				349	*/
				350	/* compute number of data pages of current bmap file */
				351	nPages = ipbmap->i_size >> L2PSIZE;
				352
				353	/* need to grow map file ? */
				354	if (nPages == newNpages)
				355	goto finalizeBmap;
				356
				357	/*
				358	* grow bmap file for the new map pages required:
				359	*
				360	* allocate growth at the start of newly extended region;
				361	* bmap file only grows sequentially, i.e., both data pages
				362	* and possibly xtree index pages may grow in append mode,
				363	* s.t. logredo() can reconstruct pre-extension state
				364	* by washing away bmap file of pages outside s_size boundary;
				365	*/
				366	/*
				367	* journal map file growth as if a regular file growth:
				368	* (note: bmap is created with di_mode = IFJOURNAL\|IFREG);
				369	*
				370	* journaling of bmap file growth is not required since
				371	* logredo() do/can not use log records of bmap file growth
				372	* but it provides careful write semantics, pmap update, etc.;
				373	*/
				374	/* synchronous write of data pages: bmap data pages are
				375	* cached in meta-data cache, and not written out
				376	* by txCommit();
				377	*/
				378	filemap_fdatawait(ipbmap->i_mapping);
				379	filemap_fdatawrite(ipbmap->i_mapping);
				380	filemap_fdatawait(ipbmap->i_mapping);
				381	diWriteSpecial(ipbmap, 0);
				382
				383	newPage = nPages; /* first new page number */
				384	xoff = newPage << sbi->l2nbperpage;
				385	xlen = (newNpages - nPages) << sbi->l2nbperpage;
				386	xlen = min(xlen, (int) nblocks) & ~(sbi->nbperpage - 1);
				387	xaddr = XAddress;
				388
				389	tid = txBegin(sb, COMMIT_FORCE);
				390
				391	if ((rc = xtAppend(tid, ipbmap, 0, xoff, nblocks, &xlen, &xaddr, 0))) {
				392	txEnd(tid);
				393	goto error_out;
				394	}
				395	/* update bmap file size */
				396	ipbmap->i_size += xlen << sbi->l2bsize;
				397	inode_add_bytes(ipbmap, xlen << sbi->l2bsize);
				398
				399	iplist[0] = ipbmap;
				400	rc = txCommit(tid, 1, &iplist[0], COMMIT_FORCE);
				401
				402	txEnd(tid);
				403
				404	if (rc)
				405	goto error_out;
				406
				407	/*
				408	* map file has been grown now to cover extension to further out;
				409	* di_size = new map file size;
				410	*
				411	* if huge extension, the previous extension based on previous
				412	* map file size may not have been sufficient to cover whole extension
				413	* (it could have been used up for new map pages),
				414	* but the newly grown map file now covers lot bigger new free space
				415	* available for further extension of map;
				416	*/
				417	/* any more blocks to extend ? */
				418	if (XSize)
				419	goto extendBmap;
				420
				421	finalizeBmap:
				422	/* finalize bmap */
				423	dbFinalizeBmap(ipbmap);
				424
				425	/*
				426	* update inode allocation map
				427	* ---------------------------
				428	*
				429	* move iag lists from old to new iag;
				430	* agstart field is not updated for logredo() to reconstruct
				431	* iag lists if system crash occurs.
				432	* (computation of ag number from agstart based on agsize
				433	* will correctly identify the new ag);
				434	*/
				435	/* if new AG size the same as old AG size, done! */
				436	if (bmp->db_agsize != old_agsize) {
				437	if ((rc = diExtendFS(ipimap, ipbmap)))
				438	goto error_out;
				439
				440	/* finalize imap */
				441	if ((rc = diSync(ipimap)))
				442	goto error_out;
				443	}
				444
				445	/*
				446	* finalize
				447	* --------
				448	*
				449	* extension is committed when on-disk super block is
				450	* updated with new descriptors: logredo will recover
				451	* crash before it to pre-extension state;
				452	*/
				453
				454	/* sync log to skip log replay of bmap file growth transaction; */
				455	/* lmLogSync(log, 1); */
				456
				457	/*
				458	* synchronous write bmap global control page;
				459	* for crash before completion of write
				460	* logredo() will recover to pre-extendfs state;
				461	* for crash after completion of write,
				462	* logredo() will recover post-extendfs state;
				463	*/
				464	if ((rc = dbSync(ipbmap)))
				465	goto error_out;
				466
				467	/*
				468	* copy primary bmap inode to secondary bmap inode
				469	*/
				470
				471	ipbmap2 = diReadSpecial(sb, BMAP_I, 1);
				472	if (ipbmap2 == NULL) {
				473	printk(KERN_ERR "jfs_extendfs: diReadSpecial(bmap) failed\n");
				474	goto error_out;
				475	}
				476	memcpy(&JFS_IP(ipbmap2)->i_xtroot, &JFS_IP(ipbmap)->i_xtroot, 288);
				477	ipbmap2->i_size = ipbmap->i_size;
				478	ipbmap2->i_blocks = ipbmap->i_blocks;
				479
				480	diWriteSpecial(ipbmap2, 1);
				481	diFreeSpecial(ipbmap2);
				482
				483	/*
				484	* update superblock
				485	*/
				486	if ((rc = readSuper(sb, &bh)))
				487	goto error_out;
				488	j_sb = (struct jfs_superblock *)bh->b_data;
				489
				490	/* mark extendfs() completion */
				491	j_sb->s_state &= cpu_to_le32(~FM_EXTENDFS);
				492	j_sb->s_size = cpu_to_le64(bmp->db_mapsize <<
				493	le16_to_cpu(j_sb->s_l2bfactor));
				494	j_sb->s_agsize = cpu_to_le32(bmp->db_agsize);
				495
				496	/* update inline log space descriptor */
				497	if (sbi->mntflag & JFS_INLINELOG) {
				498	PXDaddress(&(j_sb->s_logpxd), newLogAddress);
				499	PXDlength(&(j_sb->s_logpxd), newLogSize);
				500	}
				501
				502	/* record log's mount serial number */
				503	j_sb->s_logserial = cpu_to_le32(log->serial);
				504
				505	/* update fsck work space descriptor */
				506	PXDaddress(&(j_sb->s_fsckpxd), newFSCKAddress);
				507	PXDlength(&(j_sb->s_fsckpxd), newFSCKSize);
				508	j_sb->s_fscklog = 1;
				509	/* sb->s_fsckloglen remains the same */
				510
				511	/* Update secondary superblock */
				512	bh2 = sb_bread(sb, SUPER2_OFF >> sb->s_blocksize_bits);
				513	if (bh2) {
				514	j_sb2 = (struct jfs_superblock *)bh2->b_data;
				515	memcpy(j_sb2, j_sb, sizeof (struct jfs_superblock));
				516
				517	mark_buffer_dirty(bh);
				518	sync_dirty_buffer(bh2);
				519	brelse(bh2);
				520	}
				521
				522	/* write primary superblock */
				523	mark_buffer_dirty(bh);
				524	sync_dirty_buffer(bh);
				525	brelse(bh);
				526
				527	goto resume;
				528
				529	error_out:
				530	jfs_error(sb, "jfs_extendfs");
				531
				532	resume:
				533	/*
				534	* resume file system transactions
				535	*/
				536	txResume(sb);
				537
				538	out:
				539	return rc;
				540	}