xref: /linux/fs/ext4/super.c (revision 06705bff9114531a997a7d0c2520bea0f2927410)
1ac27a0ecSDave Kleikamp /*
2617ba13bSMingming Cao  *  linux/fs/ext4/super.c
3ac27a0ecSDave Kleikamp  *
4ac27a0ecSDave Kleikamp  * Copyright (C) 1992, 1993, 1994, 1995
5ac27a0ecSDave Kleikamp  * Remy Card (card@masi.ibp.fr)
6ac27a0ecSDave Kleikamp  * Laboratoire MASI - Institut Blaise Pascal
7ac27a0ecSDave Kleikamp  * Universite Pierre et Marie Curie (Paris VI)
8ac27a0ecSDave Kleikamp  *
9ac27a0ecSDave Kleikamp  *  from
10ac27a0ecSDave Kleikamp  *
11ac27a0ecSDave Kleikamp  *  linux/fs/minix/inode.c
12ac27a0ecSDave Kleikamp  *
13ac27a0ecSDave Kleikamp  *  Copyright (C) 1991, 1992  Linus Torvalds
14ac27a0ecSDave Kleikamp  *
15ac27a0ecSDave Kleikamp  *  Big-endian to little-endian byte-swapping/bitmaps by
16ac27a0ecSDave Kleikamp  *        David S. Miller (davem@caip.rutgers.edu), 1995
17ac27a0ecSDave Kleikamp  */
18ac27a0ecSDave Kleikamp 
19ac27a0ecSDave Kleikamp #include <linux/module.h>
20ac27a0ecSDave Kleikamp #include <linux/string.h>
21ac27a0ecSDave Kleikamp #include <linux/fs.h>
22ac27a0ecSDave Kleikamp #include <linux/time.h>
23dab291afSMingming Cao #include <linux/jbd2.h>
24ac27a0ecSDave Kleikamp #include <linux/slab.h>
25ac27a0ecSDave Kleikamp #include <linux/init.h>
26ac27a0ecSDave Kleikamp #include <linux/blkdev.h>
27ac27a0ecSDave Kleikamp #include <linux/parser.h>
28ac27a0ecSDave Kleikamp #include <linux/smp_lock.h>
29ac27a0ecSDave Kleikamp #include <linux/buffer_head.h>
30a5694255SChristoph Hellwig #include <linux/exportfs.h>
31ac27a0ecSDave Kleikamp #include <linux/vfs.h>
32ac27a0ecSDave Kleikamp #include <linux/random.h>
33ac27a0ecSDave Kleikamp #include <linux/mount.h>
34ac27a0ecSDave Kleikamp #include <linux/namei.h>
35ac27a0ecSDave Kleikamp #include <linux/quotaops.h>
36ac27a0ecSDave Kleikamp #include <linux/seq_file.h>
379f6200bbSTheodore Ts'o #include <linux/proc_fs.h>
383197ebdbSTheodore Ts'o #include <linux/ctype.h>
39ede86cc4STheodore Ts'o #include <linux/marker.h>
401330593eSVignesh Babu #include <linux/log2.h>
41717d50e4SAndreas Dilger #include <linux/crc16.h>
42ac27a0ecSDave Kleikamp #include <asm/uaccess.h>
43ac27a0ecSDave Kleikamp 
443dcf5451SChristoph Hellwig #include "ext4.h"
453dcf5451SChristoph Hellwig #include "ext4_jbd2.h"
46ac27a0ecSDave Kleikamp #include "xattr.h"
47ac27a0ecSDave Kleikamp #include "acl.h"
48ac27a0ecSDave Kleikamp #include "namei.h"
49717d50e4SAndreas Dilger #include "group.h"
50ac27a0ecSDave Kleikamp 
/*
 * Parent proc entry; ext4_put_super() removes the per-superblock entry
 * (named after sb->s_id) from underneath it.
 */
struct proc_dir_entry *ext4_proc_root;
/* NOTE(review): presumably the kset that owns the per-superblock kobjects. */
static struct kset *ext4_kset;

/* Journal handling. */
static int ext4_load_journal(struct super_block *, struct ext4_super_block *,
			     unsigned long journal_devnum);
static int ext4_commit_super(struct super_block *sb,
			      struct ext4_super_block *es, int sync);
static void ext4_mark_recovery_complete(struct super_block *sb,
					struct ext4_super_block *es);
static void ext4_clear_journal_err(struct super_block *sb,
				   struct ext4_super_block *es);

/* Superblock-level operations and error decoding. */
static int ext4_sync_fs(struct super_block *sb, int wait);
static const char *ext4_decode_error(struct super_block *sb, int errno,
				     char nbuf[16]);
static int ext4_remount(struct super_block *sb, int *flags, char *data);
static int ext4_statfs(struct dentry *dentry, struct kstatfs *buf);
static int ext4_unfreeze(struct super_block *sb);
static void ext4_write_super(struct super_block *sb);
static int ext4_freeze(struct super_block *sb);
70ac27a0ecSDave Kleikamp 
71bd81d8eeSLaurent Vivier 
728fadc143SAlexandre Ratchov ext4_fsblk_t ext4_block_bitmap(struct super_block *sb,
738fadc143SAlexandre Ratchov 			       struct ext4_group_desc *bg)
74bd81d8eeSLaurent Vivier {
753a14589cSAneesh Kumar K.V 	return le32_to_cpu(bg->bg_block_bitmap_lo) |
768fadc143SAlexandre Ratchov 		(EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT ?
778fadc143SAlexandre Ratchov 		(ext4_fsblk_t)le32_to_cpu(bg->bg_block_bitmap_hi) << 32 : 0);
78bd81d8eeSLaurent Vivier }
79bd81d8eeSLaurent Vivier 
808fadc143SAlexandre Ratchov ext4_fsblk_t ext4_inode_bitmap(struct super_block *sb,
818fadc143SAlexandre Ratchov 			       struct ext4_group_desc *bg)
82bd81d8eeSLaurent Vivier {
835272f837SAneesh Kumar K.V 	return le32_to_cpu(bg->bg_inode_bitmap_lo) |
848fadc143SAlexandre Ratchov 		(EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT ?
858fadc143SAlexandre Ratchov 		(ext4_fsblk_t)le32_to_cpu(bg->bg_inode_bitmap_hi) << 32 : 0);
86bd81d8eeSLaurent Vivier }
87bd81d8eeSLaurent Vivier 
888fadc143SAlexandre Ratchov ext4_fsblk_t ext4_inode_table(struct super_block *sb,
898fadc143SAlexandre Ratchov 			      struct ext4_group_desc *bg)
90bd81d8eeSLaurent Vivier {
915272f837SAneesh Kumar K.V 	return le32_to_cpu(bg->bg_inode_table_lo) |
928fadc143SAlexandre Ratchov 		(EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT ?
938fadc143SAlexandre Ratchov 		(ext4_fsblk_t)le32_to_cpu(bg->bg_inode_table_hi) << 32 : 0);
94bd81d8eeSLaurent Vivier }
95bd81d8eeSLaurent Vivier 
96560671a0SAneesh Kumar K.V __u32 ext4_free_blks_count(struct super_block *sb,
97560671a0SAneesh Kumar K.V 			      struct ext4_group_desc *bg)
98560671a0SAneesh Kumar K.V {
99560671a0SAneesh Kumar K.V 	return le16_to_cpu(bg->bg_free_blocks_count_lo) |
100560671a0SAneesh Kumar K.V 		(EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT ?
101560671a0SAneesh Kumar K.V 		(__u32)le16_to_cpu(bg->bg_free_blocks_count_hi) << 16 : 0);
102560671a0SAneesh Kumar K.V }
103560671a0SAneesh Kumar K.V 
104560671a0SAneesh Kumar K.V __u32 ext4_free_inodes_count(struct super_block *sb,
105560671a0SAneesh Kumar K.V 			      struct ext4_group_desc *bg)
106560671a0SAneesh Kumar K.V {
107560671a0SAneesh Kumar K.V 	return le16_to_cpu(bg->bg_free_inodes_count_lo) |
108560671a0SAneesh Kumar K.V 		(EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT ?
109560671a0SAneesh Kumar K.V 		(__u32)le16_to_cpu(bg->bg_free_inodes_count_hi) << 16 : 0);
110560671a0SAneesh Kumar K.V }
111560671a0SAneesh Kumar K.V 
112560671a0SAneesh Kumar K.V __u32 ext4_used_dirs_count(struct super_block *sb,
113560671a0SAneesh Kumar K.V 			      struct ext4_group_desc *bg)
114560671a0SAneesh Kumar K.V {
115560671a0SAneesh Kumar K.V 	return le16_to_cpu(bg->bg_used_dirs_count_lo) |
116560671a0SAneesh Kumar K.V 		(EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT ?
117560671a0SAneesh Kumar K.V 		(__u32)le16_to_cpu(bg->bg_used_dirs_count_hi) << 16 : 0);
118560671a0SAneesh Kumar K.V }
119560671a0SAneesh Kumar K.V 
120560671a0SAneesh Kumar K.V __u32 ext4_itable_unused_count(struct super_block *sb,
121560671a0SAneesh Kumar K.V 			      struct ext4_group_desc *bg)
122560671a0SAneesh Kumar K.V {
123560671a0SAneesh Kumar K.V 	return le16_to_cpu(bg->bg_itable_unused_lo) |
124560671a0SAneesh Kumar K.V 		(EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT ?
125560671a0SAneesh Kumar K.V 		(__u32)le16_to_cpu(bg->bg_itable_unused_hi) << 16 : 0);
126560671a0SAneesh Kumar K.V }
127560671a0SAneesh Kumar K.V 
1288fadc143SAlexandre Ratchov void ext4_block_bitmap_set(struct super_block *sb,
1298fadc143SAlexandre Ratchov 			   struct ext4_group_desc *bg, ext4_fsblk_t blk)
130bd81d8eeSLaurent Vivier {
1313a14589cSAneesh Kumar K.V 	bg->bg_block_bitmap_lo = cpu_to_le32((u32)blk);
1328fadc143SAlexandre Ratchov 	if (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT)
1338fadc143SAlexandre Ratchov 		bg->bg_block_bitmap_hi = cpu_to_le32(blk >> 32);
134bd81d8eeSLaurent Vivier }
135bd81d8eeSLaurent Vivier 
1368fadc143SAlexandre Ratchov void ext4_inode_bitmap_set(struct super_block *sb,
1378fadc143SAlexandre Ratchov 			   struct ext4_group_desc *bg, ext4_fsblk_t blk)
138bd81d8eeSLaurent Vivier {
1395272f837SAneesh Kumar K.V 	bg->bg_inode_bitmap_lo  = cpu_to_le32((u32)blk);
1408fadc143SAlexandre Ratchov 	if (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT)
1418fadc143SAlexandre Ratchov 		bg->bg_inode_bitmap_hi = cpu_to_le32(blk >> 32);
142bd81d8eeSLaurent Vivier }
143bd81d8eeSLaurent Vivier 
1448fadc143SAlexandre Ratchov void ext4_inode_table_set(struct super_block *sb,
1458fadc143SAlexandre Ratchov 			  struct ext4_group_desc *bg, ext4_fsblk_t blk)
146bd81d8eeSLaurent Vivier {
1475272f837SAneesh Kumar K.V 	bg->bg_inode_table_lo = cpu_to_le32((u32)blk);
1488fadc143SAlexandre Ratchov 	if (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT)
1498fadc143SAlexandre Ratchov 		bg->bg_inode_table_hi = cpu_to_le32(blk >> 32);
150bd81d8eeSLaurent Vivier }
151bd81d8eeSLaurent Vivier 
152560671a0SAneesh Kumar K.V void ext4_free_blks_set(struct super_block *sb,
153560671a0SAneesh Kumar K.V 			  struct ext4_group_desc *bg, __u32 count)
154560671a0SAneesh Kumar K.V {
155560671a0SAneesh Kumar K.V 	bg->bg_free_blocks_count_lo = cpu_to_le16((__u16)count);
156560671a0SAneesh Kumar K.V 	if (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT)
157560671a0SAneesh Kumar K.V 		bg->bg_free_blocks_count_hi = cpu_to_le16(count >> 16);
158560671a0SAneesh Kumar K.V }
159560671a0SAneesh Kumar K.V 
160560671a0SAneesh Kumar K.V void ext4_free_inodes_set(struct super_block *sb,
161560671a0SAneesh Kumar K.V 			  struct ext4_group_desc *bg, __u32 count)
162560671a0SAneesh Kumar K.V {
163560671a0SAneesh Kumar K.V 	bg->bg_free_inodes_count_lo = cpu_to_le16((__u16)count);
164560671a0SAneesh Kumar K.V 	if (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT)
165560671a0SAneesh Kumar K.V 		bg->bg_free_inodes_count_hi = cpu_to_le16(count >> 16);
166560671a0SAneesh Kumar K.V }
167560671a0SAneesh Kumar K.V 
168560671a0SAneesh Kumar K.V void ext4_used_dirs_set(struct super_block *sb,
169560671a0SAneesh Kumar K.V 			  struct ext4_group_desc *bg, __u32 count)
170560671a0SAneesh Kumar K.V {
171560671a0SAneesh Kumar K.V 	bg->bg_used_dirs_count_lo = cpu_to_le16((__u16)count);
172560671a0SAneesh Kumar K.V 	if (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT)
173560671a0SAneesh Kumar K.V 		bg->bg_used_dirs_count_hi = cpu_to_le16(count >> 16);
174560671a0SAneesh Kumar K.V }
175560671a0SAneesh Kumar K.V 
176560671a0SAneesh Kumar K.V void ext4_itable_unused_set(struct super_block *sb,
177560671a0SAneesh Kumar K.V 			  struct ext4_group_desc *bg, __u32 count)
178560671a0SAneesh Kumar K.V {
179560671a0SAneesh Kumar K.V 	bg->bg_itable_unused_lo = cpu_to_le16((__u16)count);
180560671a0SAneesh Kumar K.V 	if (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT)
181560671a0SAneesh Kumar K.V 		bg->bg_itable_unused_hi = cpu_to_le16(count >> 16);
182560671a0SAneesh Kumar K.V }
183560671a0SAneesh Kumar K.V 
184ac27a0ecSDave Kleikamp /*
185dab291afSMingming Cao  * Wrappers for jbd2_journal_start/end.
186ac27a0ecSDave Kleikamp  *
187ac27a0ecSDave Kleikamp  * The only special thing we need to do here is to make sure that all
188ac27a0ecSDave Kleikamp  * journal_end calls result in the superblock being marked dirty, so
189ac27a0ecSDave Kleikamp  * that sync() will call the filesystem's write_super callback if
190ac27a0ecSDave Kleikamp  * appropriate.
191ac27a0ecSDave Kleikamp  */
192617ba13bSMingming Cao handle_t *ext4_journal_start_sb(struct super_block *sb, int nblocks)
193ac27a0ecSDave Kleikamp {
194ac27a0ecSDave Kleikamp 	journal_t *journal;
195ac27a0ecSDave Kleikamp 
196ac27a0ecSDave Kleikamp 	if (sb->s_flags & MS_RDONLY)
197ac27a0ecSDave Kleikamp 		return ERR_PTR(-EROFS);
198ac27a0ecSDave Kleikamp 
199ac27a0ecSDave Kleikamp 	/* Special case here: if the journal has aborted behind our
200ac27a0ecSDave Kleikamp 	 * backs (eg. EIO in the commit thread), then we still need to
201ac27a0ecSDave Kleikamp 	 * take the FS itself readonly cleanly. */
202617ba13bSMingming Cao 	journal = EXT4_SB(sb)->s_journal;
2030390131bSFrank Mayhar 	if (journal) {
204ac27a0ecSDave Kleikamp 		if (is_journal_aborted(journal)) {
20546e665e9SHarvey Harrison 			ext4_abort(sb, __func__,
206ac27a0ecSDave Kleikamp 				   "Detected aborted journal");
207ac27a0ecSDave Kleikamp 			return ERR_PTR(-EROFS);
208ac27a0ecSDave Kleikamp 		}
209dab291afSMingming Cao 		return jbd2_journal_start(journal, nblocks);
210ac27a0ecSDave Kleikamp 	}
2110390131bSFrank Mayhar 	/*
2120390131bSFrank Mayhar 	 * We're not journaling, return the appropriate indication.
2130390131bSFrank Mayhar 	 */
2140390131bSFrank Mayhar 	current->journal_info = EXT4_NOJOURNAL_HANDLE;
2150390131bSFrank Mayhar 	return current->journal_info;
2160390131bSFrank Mayhar }
217ac27a0ecSDave Kleikamp 
218ac27a0ecSDave Kleikamp /*
219ac27a0ecSDave Kleikamp  * The only special thing we need to do here is to make sure that all
220dab291afSMingming Cao  * jbd2_journal_stop calls result in the superblock being marked dirty, so
221ac27a0ecSDave Kleikamp  * that sync() will call the filesystem's write_super callback if
222ac27a0ecSDave Kleikamp  * appropriate.
223ac27a0ecSDave Kleikamp  */
224617ba13bSMingming Cao int __ext4_journal_stop(const char *where, handle_t *handle)
225ac27a0ecSDave Kleikamp {
226ac27a0ecSDave Kleikamp 	struct super_block *sb;
227ac27a0ecSDave Kleikamp 	int err;
228ac27a0ecSDave Kleikamp 	int rc;
229ac27a0ecSDave Kleikamp 
2300390131bSFrank Mayhar 	if (!ext4_handle_valid(handle)) {
2310390131bSFrank Mayhar 		/*
2320390131bSFrank Mayhar 		 * Do this here since we don't call jbd2_journal_stop() in
2330390131bSFrank Mayhar 		 * no-journal mode.
2340390131bSFrank Mayhar 		 */
2350390131bSFrank Mayhar 		current->journal_info = NULL;
2360390131bSFrank Mayhar 		return 0;
2370390131bSFrank Mayhar 	}
238ac27a0ecSDave Kleikamp 	sb = handle->h_transaction->t_journal->j_private;
239ac27a0ecSDave Kleikamp 	err = handle->h_err;
240dab291afSMingming Cao 	rc = jbd2_journal_stop(handle);
241ac27a0ecSDave Kleikamp 
242ac27a0ecSDave Kleikamp 	if (!err)
243ac27a0ecSDave Kleikamp 		err = rc;
244ac27a0ecSDave Kleikamp 	if (err)
245617ba13bSMingming Cao 		__ext4_std_error(sb, where, err);
246ac27a0ecSDave Kleikamp 	return err;
247ac27a0ecSDave Kleikamp }
248ac27a0ecSDave Kleikamp 
249617ba13bSMingming Cao void ext4_journal_abort_handle(const char *caller, const char *err_fn,
250ac27a0ecSDave Kleikamp 		struct buffer_head *bh, handle_t *handle, int err)
251ac27a0ecSDave Kleikamp {
252ac27a0ecSDave Kleikamp 	char nbuf[16];
253617ba13bSMingming Cao 	const char *errstr = ext4_decode_error(NULL, err, nbuf);
254ac27a0ecSDave Kleikamp 
2550390131bSFrank Mayhar 	BUG_ON(!ext4_handle_valid(handle));
2560390131bSFrank Mayhar 
257ac27a0ecSDave Kleikamp 	if (bh)
258ac27a0ecSDave Kleikamp 		BUFFER_TRACE(bh, "abort");
259ac27a0ecSDave Kleikamp 
260ac27a0ecSDave Kleikamp 	if (!handle->h_err)
261ac27a0ecSDave Kleikamp 		handle->h_err = err;
262ac27a0ecSDave Kleikamp 
263ac27a0ecSDave Kleikamp 	if (is_handle_aborted(handle))
264ac27a0ecSDave Kleikamp 		return;
265ac27a0ecSDave Kleikamp 
266ac27a0ecSDave Kleikamp 	printk(KERN_ERR "%s: aborting transaction: %s in %s\n",
267ac27a0ecSDave Kleikamp 	       caller, errstr, err_fn);
268ac27a0ecSDave Kleikamp 
269dab291afSMingming Cao 	jbd2_journal_abort_handle(handle);
270ac27a0ecSDave Kleikamp }
271ac27a0ecSDave Kleikamp 
272ac27a0ecSDave Kleikamp /* Deal with the reporting of failure conditions on a filesystem such as
273ac27a0ecSDave Kleikamp  * inconsistencies detected or read IO failures.
274ac27a0ecSDave Kleikamp  *
275ac27a0ecSDave Kleikamp  * On ext2, we can store the error state of the filesystem in the
276617ba13bSMingming Cao  * superblock.  That is not possible on ext4, because we may have other
277ac27a0ecSDave Kleikamp  * write ordering constraints on the superblock which prevent us from
278ac27a0ecSDave Kleikamp  * writing it out straight away; and given that the journal is about to
279ac27a0ecSDave Kleikamp  * be aborted, we can't rely on the current, or future, transactions to
280ac27a0ecSDave Kleikamp  * write out the superblock safely.
281ac27a0ecSDave Kleikamp  *
282dab291afSMingming Cao  * We'll just use the jbd2_journal_abort() error code to record an error in
283ac27a0ecSDave Kleikamp  * the journal instead.  On recovery, the journal will compain about
284ac27a0ecSDave Kleikamp  * that error until we've noted it down and cleared it.
285ac27a0ecSDave Kleikamp  */
286ac27a0ecSDave Kleikamp 
287617ba13bSMingming Cao static void ext4_handle_error(struct super_block *sb)
288ac27a0ecSDave Kleikamp {
289617ba13bSMingming Cao 	struct ext4_super_block *es = EXT4_SB(sb)->s_es;
290ac27a0ecSDave Kleikamp 
291617ba13bSMingming Cao 	EXT4_SB(sb)->s_mount_state |= EXT4_ERROR_FS;
292617ba13bSMingming Cao 	es->s_state |= cpu_to_le16(EXT4_ERROR_FS);
293ac27a0ecSDave Kleikamp 
294ac27a0ecSDave Kleikamp 	if (sb->s_flags & MS_RDONLY)
295ac27a0ecSDave Kleikamp 		return;
296ac27a0ecSDave Kleikamp 
297ac27a0ecSDave Kleikamp 	if (!test_opt(sb, ERRORS_CONT)) {
298617ba13bSMingming Cao 		journal_t *journal = EXT4_SB(sb)->s_journal;
299ac27a0ecSDave Kleikamp 
300617ba13bSMingming Cao 		EXT4_SB(sb)->s_mount_opt |= EXT4_MOUNT_ABORT;
301ac27a0ecSDave Kleikamp 		if (journal)
302dab291afSMingming Cao 			jbd2_journal_abort(journal, -EIO);
303ac27a0ecSDave Kleikamp 	}
304ac27a0ecSDave Kleikamp 	if (test_opt(sb, ERRORS_RO)) {
305ac27a0ecSDave Kleikamp 		printk(KERN_CRIT "Remounting filesystem read-only\n");
306ac27a0ecSDave Kleikamp 		sb->s_flags |= MS_RDONLY;
307ac27a0ecSDave Kleikamp 	}
308617ba13bSMingming Cao 	ext4_commit_super(sb, es, 1);
309ac27a0ecSDave Kleikamp 	if (test_opt(sb, ERRORS_PANIC))
310617ba13bSMingming Cao 		panic("EXT4-fs (device %s): panic forced after error\n",
311ac27a0ecSDave Kleikamp 			sb->s_id);
312ac27a0ecSDave Kleikamp }
313ac27a0ecSDave Kleikamp 
314617ba13bSMingming Cao void ext4_error(struct super_block *sb, const char *function,
315ac27a0ecSDave Kleikamp 		const char *fmt, ...)
316ac27a0ecSDave Kleikamp {
317ac27a0ecSDave Kleikamp 	va_list args;
318ac27a0ecSDave Kleikamp 
319ac27a0ecSDave Kleikamp 	va_start(args, fmt);
320617ba13bSMingming Cao 	printk(KERN_CRIT "EXT4-fs error (device %s): %s: ", sb->s_id, function);
321ac27a0ecSDave Kleikamp 	vprintk(fmt, args);
322ac27a0ecSDave Kleikamp 	printk("\n");
323ac27a0ecSDave Kleikamp 	va_end(args);
324ac27a0ecSDave Kleikamp 
325617ba13bSMingming Cao 	ext4_handle_error(sb);
326ac27a0ecSDave Kleikamp }
327ac27a0ecSDave Kleikamp 
328617ba13bSMingming Cao static const char *ext4_decode_error(struct super_block *sb, int errno,
329ac27a0ecSDave Kleikamp 				     char nbuf[16])
330ac27a0ecSDave Kleikamp {
331ac27a0ecSDave Kleikamp 	char *errstr = NULL;
332ac27a0ecSDave Kleikamp 
333ac27a0ecSDave Kleikamp 	switch (errno) {
334ac27a0ecSDave Kleikamp 	case -EIO:
335ac27a0ecSDave Kleikamp 		errstr = "IO failure";
336ac27a0ecSDave Kleikamp 		break;
337ac27a0ecSDave Kleikamp 	case -ENOMEM:
338ac27a0ecSDave Kleikamp 		errstr = "Out of memory";
339ac27a0ecSDave Kleikamp 		break;
340ac27a0ecSDave Kleikamp 	case -EROFS:
341dab291afSMingming Cao 		if (!sb || EXT4_SB(sb)->s_journal->j_flags & JBD2_ABORT)
342ac27a0ecSDave Kleikamp 			errstr = "Journal has aborted";
343ac27a0ecSDave Kleikamp 		else
344ac27a0ecSDave Kleikamp 			errstr = "Readonly filesystem";
345ac27a0ecSDave Kleikamp 		break;
346ac27a0ecSDave Kleikamp 	default:
347ac27a0ecSDave Kleikamp 		/* If the caller passed in an extra buffer for unknown
348ac27a0ecSDave Kleikamp 		 * errors, textualise them now.  Else we just return
349ac27a0ecSDave Kleikamp 		 * NULL. */
350ac27a0ecSDave Kleikamp 		if (nbuf) {
351ac27a0ecSDave Kleikamp 			/* Check for truncated error codes... */
352ac27a0ecSDave Kleikamp 			if (snprintf(nbuf, 16, "error %d", -errno) >= 0)
353ac27a0ecSDave Kleikamp 				errstr = nbuf;
354ac27a0ecSDave Kleikamp 		}
355ac27a0ecSDave Kleikamp 		break;
356ac27a0ecSDave Kleikamp 	}
357ac27a0ecSDave Kleikamp 
358ac27a0ecSDave Kleikamp 	return errstr;
359ac27a0ecSDave Kleikamp }
360ac27a0ecSDave Kleikamp 
361617ba13bSMingming Cao /* __ext4_std_error decodes expected errors from journaling functions
362ac27a0ecSDave Kleikamp  * automatically and invokes the appropriate error response.  */
363ac27a0ecSDave Kleikamp 
3642b2d6d01STheodore Ts'o void __ext4_std_error(struct super_block *sb, const char *function, int errno)
365ac27a0ecSDave Kleikamp {
366ac27a0ecSDave Kleikamp 	char nbuf[16];
367ac27a0ecSDave Kleikamp 	const char *errstr;
368ac27a0ecSDave Kleikamp 
369ac27a0ecSDave Kleikamp 	/* Special case: if the error is EROFS, and we're not already
370ac27a0ecSDave Kleikamp 	 * inside a transaction, then there's really no point in logging
371ac27a0ecSDave Kleikamp 	 * an error. */
372ac27a0ecSDave Kleikamp 	if (errno == -EROFS && journal_current_handle() == NULL &&
373ac27a0ecSDave Kleikamp 	    (sb->s_flags & MS_RDONLY))
374ac27a0ecSDave Kleikamp 		return;
375ac27a0ecSDave Kleikamp 
376617ba13bSMingming Cao 	errstr = ext4_decode_error(sb, errno, nbuf);
377617ba13bSMingming Cao 	printk(KERN_CRIT "EXT4-fs error (device %s) in %s: %s\n",
378ac27a0ecSDave Kleikamp 	       sb->s_id, function, errstr);
379ac27a0ecSDave Kleikamp 
380617ba13bSMingming Cao 	ext4_handle_error(sb);
381ac27a0ecSDave Kleikamp }
382ac27a0ecSDave Kleikamp 
383ac27a0ecSDave Kleikamp /*
384617ba13bSMingming Cao  * ext4_abort is a much stronger failure handler than ext4_error.  The
385ac27a0ecSDave Kleikamp  * abort function may be used to deal with unrecoverable failures such
386ac27a0ecSDave Kleikamp  * as journal IO errors or ENOMEM at a critical moment in log management.
387ac27a0ecSDave Kleikamp  *
388ac27a0ecSDave Kleikamp  * We unconditionally force the filesystem into an ABORT|READONLY state,
389ac27a0ecSDave Kleikamp  * unless the error response on the fs has been set to panic in which
390ac27a0ecSDave Kleikamp  * case we take the easy way out and panic immediately.
391ac27a0ecSDave Kleikamp  */
392ac27a0ecSDave Kleikamp 
393617ba13bSMingming Cao void ext4_abort(struct super_block *sb, const char *function,
394ac27a0ecSDave Kleikamp 		const char *fmt, ...)
395ac27a0ecSDave Kleikamp {
396ac27a0ecSDave Kleikamp 	va_list args;
397ac27a0ecSDave Kleikamp 
398617ba13bSMingming Cao 	printk(KERN_CRIT "ext4_abort called.\n");
399ac27a0ecSDave Kleikamp 
400ac27a0ecSDave Kleikamp 	va_start(args, fmt);
401617ba13bSMingming Cao 	printk(KERN_CRIT "EXT4-fs error (device %s): %s: ", sb->s_id, function);
402ac27a0ecSDave Kleikamp 	vprintk(fmt, args);
403ac27a0ecSDave Kleikamp 	printk("\n");
404ac27a0ecSDave Kleikamp 	va_end(args);
405ac27a0ecSDave Kleikamp 
406ac27a0ecSDave Kleikamp 	if (test_opt(sb, ERRORS_PANIC))
407617ba13bSMingming Cao 		panic("EXT4-fs panic from previous error\n");
408ac27a0ecSDave Kleikamp 
409ac27a0ecSDave Kleikamp 	if (sb->s_flags & MS_RDONLY)
410ac27a0ecSDave Kleikamp 		return;
411ac27a0ecSDave Kleikamp 
412ac27a0ecSDave Kleikamp 	printk(KERN_CRIT "Remounting filesystem read-only\n");
413617ba13bSMingming Cao 	EXT4_SB(sb)->s_mount_state |= EXT4_ERROR_FS;
414ac27a0ecSDave Kleikamp 	sb->s_flags |= MS_RDONLY;
415617ba13bSMingming Cao 	EXT4_SB(sb)->s_mount_opt |= EXT4_MOUNT_ABORT;
416ef2cabf7SHidehiro Kawai 	if (EXT4_SB(sb)->s_journal)
417dab291afSMingming Cao 		jbd2_journal_abort(EXT4_SB(sb)->s_journal, -EIO);
418ac27a0ecSDave Kleikamp }
419ac27a0ecSDave Kleikamp 
420617ba13bSMingming Cao void ext4_warning(struct super_block *sb, const char *function,
421ac27a0ecSDave Kleikamp 		  const char *fmt, ...)
422ac27a0ecSDave Kleikamp {
423ac27a0ecSDave Kleikamp 	va_list args;
424ac27a0ecSDave Kleikamp 
425ac27a0ecSDave Kleikamp 	va_start(args, fmt);
426617ba13bSMingming Cao 	printk(KERN_WARNING "EXT4-fs warning (device %s): %s: ",
427ac27a0ecSDave Kleikamp 	       sb->s_id, function);
428ac27a0ecSDave Kleikamp 	vprintk(fmt, args);
429ac27a0ecSDave Kleikamp 	printk("\n");
430ac27a0ecSDave Kleikamp 	va_end(args);
431ac27a0ecSDave Kleikamp }
432ac27a0ecSDave Kleikamp 
4335d1b1b3fSAneesh Kumar K.V void ext4_grp_locked_error(struct super_block *sb, ext4_group_t grp,
4345d1b1b3fSAneesh Kumar K.V 				const char *function, const char *fmt, ...)
4355d1b1b3fSAneesh Kumar K.V __releases(bitlock)
4365d1b1b3fSAneesh Kumar K.V __acquires(bitlock)
4375d1b1b3fSAneesh Kumar K.V {
4385d1b1b3fSAneesh Kumar K.V 	va_list args;
4395d1b1b3fSAneesh Kumar K.V 	struct ext4_super_block *es = EXT4_SB(sb)->s_es;
4405d1b1b3fSAneesh Kumar K.V 
4415d1b1b3fSAneesh Kumar K.V 	va_start(args, fmt);
4425d1b1b3fSAneesh Kumar K.V 	printk(KERN_CRIT "EXT4-fs error (device %s): %s: ", sb->s_id, function);
4435d1b1b3fSAneesh Kumar K.V 	vprintk(fmt, args);
4445d1b1b3fSAneesh Kumar K.V 	printk("\n");
4455d1b1b3fSAneesh Kumar K.V 	va_end(args);
4465d1b1b3fSAneesh Kumar K.V 
4475d1b1b3fSAneesh Kumar K.V 	if (test_opt(sb, ERRORS_CONT)) {
4485d1b1b3fSAneesh Kumar K.V 		EXT4_SB(sb)->s_mount_state |= EXT4_ERROR_FS;
4495d1b1b3fSAneesh Kumar K.V 		es->s_state |= cpu_to_le16(EXT4_ERROR_FS);
4505d1b1b3fSAneesh Kumar K.V 		ext4_commit_super(sb, es, 0);
4515d1b1b3fSAneesh Kumar K.V 		return;
4525d1b1b3fSAneesh Kumar K.V 	}
4535d1b1b3fSAneesh Kumar K.V 	ext4_unlock_group(sb, grp);
4545d1b1b3fSAneesh Kumar K.V 	ext4_handle_error(sb);
4555d1b1b3fSAneesh Kumar K.V 	/*
4565d1b1b3fSAneesh Kumar K.V 	 * We only get here in the ERRORS_RO case; relocking the group
4575d1b1b3fSAneesh Kumar K.V 	 * may be dangerous, but nothing bad will happen since the
4585d1b1b3fSAneesh Kumar K.V 	 * filesystem will have already been marked read/only and the
4595d1b1b3fSAneesh Kumar K.V 	 * journal has been aborted.  We return 1 as a hint to callers
4605d1b1b3fSAneesh Kumar K.V 	 * who might what to use the return value from
4615d1b1b3fSAneesh Kumar K.V 	 * ext4_grp_locked_error() to distinguish beween the
4625d1b1b3fSAneesh Kumar K.V 	 * ERRORS_CONT and ERRORS_RO case, and perhaps return more
4635d1b1b3fSAneesh Kumar K.V 	 * aggressively from the ext4 function in question, with a
4645d1b1b3fSAneesh Kumar K.V 	 * more appropriate error code.
4655d1b1b3fSAneesh Kumar K.V 	 */
4665d1b1b3fSAneesh Kumar K.V 	ext4_lock_group(sb, grp);
4675d1b1b3fSAneesh Kumar K.V 	return;
4685d1b1b3fSAneesh Kumar K.V }
4695d1b1b3fSAneesh Kumar K.V 
4705d1b1b3fSAneesh Kumar K.V 
471617ba13bSMingming Cao void ext4_update_dynamic_rev(struct super_block *sb)
472ac27a0ecSDave Kleikamp {
473617ba13bSMingming Cao 	struct ext4_super_block *es = EXT4_SB(sb)->s_es;
474ac27a0ecSDave Kleikamp 
475617ba13bSMingming Cao 	if (le32_to_cpu(es->s_rev_level) > EXT4_GOOD_OLD_REV)
476ac27a0ecSDave Kleikamp 		return;
477ac27a0ecSDave Kleikamp 
47846e665e9SHarvey Harrison 	ext4_warning(sb, __func__,
479ac27a0ecSDave Kleikamp 		     "updating to rev %d because of new feature flag, "
480ac27a0ecSDave Kleikamp 		     "running e2fsck is recommended",
481617ba13bSMingming Cao 		     EXT4_DYNAMIC_REV);
482ac27a0ecSDave Kleikamp 
483617ba13bSMingming Cao 	es->s_first_ino = cpu_to_le32(EXT4_GOOD_OLD_FIRST_INO);
484617ba13bSMingming Cao 	es->s_inode_size = cpu_to_le16(EXT4_GOOD_OLD_INODE_SIZE);
485617ba13bSMingming Cao 	es->s_rev_level = cpu_to_le32(EXT4_DYNAMIC_REV);
486ac27a0ecSDave Kleikamp 	/* leave es->s_feature_*compat flags alone */
487ac27a0ecSDave Kleikamp 	/* es->s_uuid will be set by e2fsck if empty */
488ac27a0ecSDave Kleikamp 
489ac27a0ecSDave Kleikamp 	/*
490ac27a0ecSDave Kleikamp 	 * The rest of the superblock fields should be zero, and if not it
491ac27a0ecSDave Kleikamp 	 * means they are likely already in use, so leave them alone.  We
492ac27a0ecSDave Kleikamp 	 * can leave it up to e2fsck to clean up any inconsistencies there.
493ac27a0ecSDave Kleikamp 	 */
494ac27a0ecSDave Kleikamp }
495ac27a0ecSDave Kleikamp 
496ac27a0ecSDave Kleikamp /*
497ac27a0ecSDave Kleikamp  * Open the external journal device
498ac27a0ecSDave Kleikamp  */
499617ba13bSMingming Cao static struct block_device *ext4_blkdev_get(dev_t dev)
500ac27a0ecSDave Kleikamp {
501ac27a0ecSDave Kleikamp 	struct block_device *bdev;
502ac27a0ecSDave Kleikamp 	char b[BDEVNAME_SIZE];
503ac27a0ecSDave Kleikamp 
504ac27a0ecSDave Kleikamp 	bdev = open_by_devnum(dev, FMODE_READ|FMODE_WRITE);
505ac27a0ecSDave Kleikamp 	if (IS_ERR(bdev))
506ac27a0ecSDave Kleikamp 		goto fail;
507ac27a0ecSDave Kleikamp 	return bdev;
508ac27a0ecSDave Kleikamp 
509ac27a0ecSDave Kleikamp fail:
510abda1418STheodore Ts'o 	printk(KERN_ERR "EXT4-fs: failed to open journal device %s: %ld\n",
511ac27a0ecSDave Kleikamp 			__bdevname(dev, b), PTR_ERR(bdev));
512ac27a0ecSDave Kleikamp 	return NULL;
513ac27a0ecSDave Kleikamp }
514ac27a0ecSDave Kleikamp 
515ac27a0ecSDave Kleikamp /*
516ac27a0ecSDave Kleikamp  * Release the journal device
517ac27a0ecSDave Kleikamp  */
518617ba13bSMingming Cao static int ext4_blkdev_put(struct block_device *bdev)
519ac27a0ecSDave Kleikamp {
520ac27a0ecSDave Kleikamp 	bd_release(bdev);
5219a1c3542SAl Viro 	return blkdev_put(bdev, FMODE_READ|FMODE_WRITE);
522ac27a0ecSDave Kleikamp }
523ac27a0ecSDave Kleikamp 
524617ba13bSMingming Cao static int ext4_blkdev_remove(struct ext4_sb_info *sbi)
525ac27a0ecSDave Kleikamp {
526ac27a0ecSDave Kleikamp 	struct block_device *bdev;
527ac27a0ecSDave Kleikamp 	int ret = -ENODEV;
528ac27a0ecSDave Kleikamp 
529ac27a0ecSDave Kleikamp 	bdev = sbi->journal_bdev;
530ac27a0ecSDave Kleikamp 	if (bdev) {
531617ba13bSMingming Cao 		ret = ext4_blkdev_put(bdev);
532ac27a0ecSDave Kleikamp 		sbi->journal_bdev = NULL;
533ac27a0ecSDave Kleikamp 	}
534ac27a0ecSDave Kleikamp 	return ret;
535ac27a0ecSDave Kleikamp }
536ac27a0ecSDave Kleikamp 
537ac27a0ecSDave Kleikamp static inline struct inode *orphan_list_entry(struct list_head *l)
538ac27a0ecSDave Kleikamp {
539617ba13bSMingming Cao 	return &list_entry(l, struct ext4_inode_info, i_orphan)->vfs_inode;
540ac27a0ecSDave Kleikamp }
541ac27a0ecSDave Kleikamp 
542617ba13bSMingming Cao static void dump_orphan_list(struct super_block *sb, struct ext4_sb_info *sbi)
543ac27a0ecSDave Kleikamp {
544ac27a0ecSDave Kleikamp 	struct list_head *l;
545ac27a0ecSDave Kleikamp 
546ac27a0ecSDave Kleikamp 	printk(KERN_ERR "sb orphan head is %d\n",
547ac27a0ecSDave Kleikamp 	       le32_to_cpu(sbi->s_es->s_last_orphan));
548ac27a0ecSDave Kleikamp 
549ac27a0ecSDave Kleikamp 	printk(KERN_ERR "sb_info orphan list:\n");
550ac27a0ecSDave Kleikamp 	list_for_each(l, &sbi->s_orphan) {
551ac27a0ecSDave Kleikamp 		struct inode *inode = orphan_list_entry(l);
552ac27a0ecSDave Kleikamp 		printk(KERN_ERR "  "
553ac27a0ecSDave Kleikamp 		       "inode %s:%lu at %p: mode %o, nlink %d, next %d\n",
554ac27a0ecSDave Kleikamp 		       inode->i_sb->s_id, inode->i_ino, inode,
555ac27a0ecSDave Kleikamp 		       inode->i_mode, inode->i_nlink,
556ac27a0ecSDave Kleikamp 		       NEXT_ORPHAN(inode));
557ac27a0ecSDave Kleikamp 	}
558ac27a0ecSDave Kleikamp }
559ac27a0ecSDave Kleikamp 
560617ba13bSMingming Cao static void ext4_put_super(struct super_block *sb)
561ac27a0ecSDave Kleikamp {
562617ba13bSMingming Cao 	struct ext4_sb_info *sbi = EXT4_SB(sb);
563617ba13bSMingming Cao 	struct ext4_super_block *es = sbi->s_es;
564ef2cabf7SHidehiro Kawai 	int i, err;
565ac27a0ecSDave Kleikamp 
566c9de560dSAlex Tomas 	ext4_mb_release(sb);
567a86c6181SAlex Tomas 	ext4_ext_release(sb);
568617ba13bSMingming Cao 	ext4_xattr_put_super(sb);
5690390131bSFrank Mayhar 	if (sbi->s_journal) {
570ef2cabf7SHidehiro Kawai 		err = jbd2_journal_destroy(sbi->s_journal);
57147b4a50bSJan Kara 		sbi->s_journal = NULL;
572ef2cabf7SHidehiro Kawai 		if (err < 0)
5730390131bSFrank Mayhar 			ext4_abort(sb, __func__,
5740390131bSFrank Mayhar 				   "Couldn't clean up the journal");
5750390131bSFrank Mayhar 	}
576ac27a0ecSDave Kleikamp 	if (!(sb->s_flags & MS_RDONLY)) {
577617ba13bSMingming Cao 		EXT4_CLEAR_INCOMPAT_FEATURE(sb, EXT4_FEATURE_INCOMPAT_RECOVER);
578ac27a0ecSDave Kleikamp 		es->s_state = cpu_to_le16(sbi->s_mount_state);
579617ba13bSMingming Cao 		ext4_commit_super(sb, es, 1);
580ac27a0ecSDave Kleikamp 	}
581240799cdSTheodore Ts'o 	if (sbi->s_proc) {
5829f6200bbSTheodore Ts'o 		remove_proc_entry(sb->s_id, ext4_proc_root);
583240799cdSTheodore Ts'o 	}
5843197ebdbSTheodore Ts'o 	kobject_del(&sbi->s_kobj);
585ac27a0ecSDave Kleikamp 
586ac27a0ecSDave Kleikamp 	for (i = 0; i < sbi->s_gdb_count; i++)
587ac27a0ecSDave Kleikamp 		brelse(sbi->s_group_desc[i]);
588ac27a0ecSDave Kleikamp 	kfree(sbi->s_group_desc);
589772cb7c8SJose R. Santos 	kfree(sbi->s_flex_groups);
590ac27a0ecSDave Kleikamp 	percpu_counter_destroy(&sbi->s_freeblocks_counter);
591ac27a0ecSDave Kleikamp 	percpu_counter_destroy(&sbi->s_freeinodes_counter);
592ac27a0ecSDave Kleikamp 	percpu_counter_destroy(&sbi->s_dirs_counter);
5936bc6e63fSAneesh Kumar K.V 	percpu_counter_destroy(&sbi->s_dirtyblocks_counter);
594ac27a0ecSDave Kleikamp 	brelse(sbi->s_sbh);
595ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
596ac27a0ecSDave Kleikamp 	for (i = 0; i < MAXQUOTAS; i++)
597ac27a0ecSDave Kleikamp 		kfree(sbi->s_qf_names[i]);
598ac27a0ecSDave Kleikamp #endif
599ac27a0ecSDave Kleikamp 
600ac27a0ecSDave Kleikamp 	/* Debugging code just in case the in-memory inode orphan list
601ac27a0ecSDave Kleikamp 	 * isn't empty.  The on-disk one can be non-empty if we've
602ac27a0ecSDave Kleikamp 	 * detected an error and taken the fs readonly, but the
603ac27a0ecSDave Kleikamp 	 * in-memory list had better be clean by this point. */
604ac27a0ecSDave Kleikamp 	if (!list_empty(&sbi->s_orphan))
605ac27a0ecSDave Kleikamp 		dump_orphan_list(sb, sbi);
606ac27a0ecSDave Kleikamp 	J_ASSERT(list_empty(&sbi->s_orphan));
607ac27a0ecSDave Kleikamp 
608f98393a6SPeter Zijlstra 	invalidate_bdev(sb->s_bdev);
609ac27a0ecSDave Kleikamp 	if (sbi->journal_bdev && sbi->journal_bdev != sb->s_bdev) {
610ac27a0ecSDave Kleikamp 		/*
611ac27a0ecSDave Kleikamp 		 * Invalidate the journal device's buffers.  We don't want them
612ac27a0ecSDave Kleikamp 		 * floating about in memory - the physical journal device may
613ac27a0ecSDave Kleikamp 		 * hotswapped, and it breaks the `ro-after' testing code.
614ac27a0ecSDave Kleikamp 		 */
615ac27a0ecSDave Kleikamp 		sync_blockdev(sbi->journal_bdev);
616f98393a6SPeter Zijlstra 		invalidate_bdev(sbi->journal_bdev);
617617ba13bSMingming Cao 		ext4_blkdev_remove(sbi);
618ac27a0ecSDave Kleikamp 	}
619ac27a0ecSDave Kleikamp 	sb->s_fs_info = NULL;
6203197ebdbSTheodore Ts'o 	/*
6213197ebdbSTheodore Ts'o 	 * Now that we are completely done shutting down the
6223197ebdbSTheodore Ts'o 	 * superblock, we need to actually destroy the kobject.
6233197ebdbSTheodore Ts'o 	 */
6243197ebdbSTheodore Ts'o 	unlock_kernel();
6253197ebdbSTheodore Ts'o 	unlock_super(sb);
6263197ebdbSTheodore Ts'o 	kobject_put(&sbi->s_kobj);
6273197ebdbSTheodore Ts'o 	wait_for_completion(&sbi->s_kobj_unregister);
6283197ebdbSTheodore Ts'o 	lock_super(sb);
6293197ebdbSTheodore Ts'o 	lock_kernel();
630705895b6SPekka Enberg 	kfree(sbi->s_blockgroup_lock);
631ac27a0ecSDave Kleikamp 	kfree(sbi);
632ac27a0ecSDave Kleikamp 	return;
633ac27a0ecSDave Kleikamp }
634ac27a0ecSDave Kleikamp 
635e18b890bSChristoph Lameter static struct kmem_cache *ext4_inode_cachep;
636ac27a0ecSDave Kleikamp 
637ac27a0ecSDave Kleikamp /*
638ac27a0ecSDave Kleikamp  * Called inside transaction, so use GFP_NOFS
639ac27a0ecSDave Kleikamp  */
640617ba13bSMingming Cao static struct inode *ext4_alloc_inode(struct super_block *sb)
641ac27a0ecSDave Kleikamp {
642617ba13bSMingming Cao 	struct ext4_inode_info *ei;
643ac27a0ecSDave Kleikamp 
644e6b4f8daSChristoph Lameter 	ei = kmem_cache_alloc(ext4_inode_cachep, GFP_NOFS);
645ac27a0ecSDave Kleikamp 	if (!ei)
646ac27a0ecSDave Kleikamp 		return NULL;
64703010a33STheodore Ts'o #ifdef CONFIG_EXT4_FS_POSIX_ACL
648617ba13bSMingming Cao 	ei->i_acl = EXT4_ACL_NOT_CACHED;
649617ba13bSMingming Cao 	ei->i_default_acl = EXT4_ACL_NOT_CACHED;
650ac27a0ecSDave Kleikamp #endif
651ac27a0ecSDave Kleikamp 	ei->vfs_inode.i_version = 1;
65291246c00SAneesh Kumar K.V 	ei->vfs_inode.i_data.writeback_index = 0;
653a86c6181SAlex Tomas 	memset(&ei->i_cached_extent, 0, sizeof(struct ext4_ext_cache));
654c9de560dSAlex Tomas 	INIT_LIST_HEAD(&ei->i_prealloc_list);
655c9de560dSAlex Tomas 	spin_lock_init(&ei->i_prealloc_lock);
6560390131bSFrank Mayhar 	/*
6570390131bSFrank Mayhar 	 * Note:  We can be called before EXT4_SB(sb)->s_journal is set,
6580390131bSFrank Mayhar 	 * therefore it can be null here.  Don't check it, just initialize
6590390131bSFrank Mayhar 	 * jinode.
6600390131bSFrank Mayhar 	 */
661678aaf48SJan Kara 	jbd2_journal_init_jbd_inode(&ei->jinode, &ei->vfs_inode);
662d2a17637SMingming Cao 	ei->i_reserved_data_blocks = 0;
663d2a17637SMingming Cao 	ei->i_reserved_meta_blocks = 0;
664d2a17637SMingming Cao 	ei->i_allocated_meta_blocks = 0;
665d2a17637SMingming Cao 	ei->i_delalloc_reserved_flag = 0;
666d2a17637SMingming Cao 	spin_lock_init(&(ei->i_block_reservation_lock));
667ac27a0ecSDave Kleikamp 	return &ei->vfs_inode;
668ac27a0ecSDave Kleikamp }
669ac27a0ecSDave Kleikamp 
670617ba13bSMingming Cao static void ext4_destroy_inode(struct inode *inode)
671ac27a0ecSDave Kleikamp {
6729f7dd93dSVasily Averin 	if (!list_empty(&(EXT4_I(inode)->i_orphan))) {
6739f7dd93dSVasily Averin 		printk("EXT4 Inode %p: orphan list check failed!\n",
6749f7dd93dSVasily Averin 			EXT4_I(inode));
6759f7dd93dSVasily Averin 		print_hex_dump(KERN_INFO, "", DUMP_PREFIX_ADDRESS, 16, 4,
6769f7dd93dSVasily Averin 				EXT4_I(inode), sizeof(struct ext4_inode_info),
6779f7dd93dSVasily Averin 				true);
6789f7dd93dSVasily Averin 		dump_stack();
6799f7dd93dSVasily Averin 	}
680617ba13bSMingming Cao 	kmem_cache_free(ext4_inode_cachep, EXT4_I(inode));
681ac27a0ecSDave Kleikamp }
682ac27a0ecSDave Kleikamp 
68351cc5068SAlexey Dobriyan static void init_once(void *foo)
684ac27a0ecSDave Kleikamp {
685617ba13bSMingming Cao 	struct ext4_inode_info *ei = (struct ext4_inode_info *) foo;
686ac27a0ecSDave Kleikamp 
687ac27a0ecSDave Kleikamp 	INIT_LIST_HEAD(&ei->i_orphan);
68803010a33STheodore Ts'o #ifdef CONFIG_EXT4_FS_XATTR
689ac27a0ecSDave Kleikamp 	init_rwsem(&ei->xattr_sem);
690ac27a0ecSDave Kleikamp #endif
6910e855ac8SAneesh Kumar K.V 	init_rwsem(&ei->i_data_sem);
692ac27a0ecSDave Kleikamp 	inode_init_once(&ei->vfs_inode);
693ac27a0ecSDave Kleikamp }
694ac27a0ecSDave Kleikamp 
695ac27a0ecSDave Kleikamp static int init_inodecache(void)
696ac27a0ecSDave Kleikamp {
697617ba13bSMingming Cao 	ext4_inode_cachep = kmem_cache_create("ext4_inode_cache",
698617ba13bSMingming Cao 					     sizeof(struct ext4_inode_info),
699ac27a0ecSDave Kleikamp 					     0, (SLAB_RECLAIM_ACCOUNT|
700ac27a0ecSDave Kleikamp 						SLAB_MEM_SPREAD),
70120c2df83SPaul Mundt 					     init_once);
702617ba13bSMingming Cao 	if (ext4_inode_cachep == NULL)
703ac27a0ecSDave Kleikamp 		return -ENOMEM;
704ac27a0ecSDave Kleikamp 	return 0;
705ac27a0ecSDave Kleikamp }
706ac27a0ecSDave Kleikamp 
707ac27a0ecSDave Kleikamp static void destroy_inodecache(void)
708ac27a0ecSDave Kleikamp {
709617ba13bSMingming Cao 	kmem_cache_destroy(ext4_inode_cachep);
710ac27a0ecSDave Kleikamp }
711ac27a0ecSDave Kleikamp 
712617ba13bSMingming Cao static void ext4_clear_inode(struct inode *inode)
713ac27a0ecSDave Kleikamp {
71403010a33STheodore Ts'o #ifdef CONFIG_EXT4_FS_POSIX_ACL
715617ba13bSMingming Cao 	if (EXT4_I(inode)->i_acl &&
716617ba13bSMingming Cao 			EXT4_I(inode)->i_acl != EXT4_ACL_NOT_CACHED) {
717617ba13bSMingming Cao 		posix_acl_release(EXT4_I(inode)->i_acl);
718617ba13bSMingming Cao 		EXT4_I(inode)->i_acl = EXT4_ACL_NOT_CACHED;
719ac27a0ecSDave Kleikamp 	}
720617ba13bSMingming Cao 	if (EXT4_I(inode)->i_default_acl &&
721617ba13bSMingming Cao 			EXT4_I(inode)->i_default_acl != EXT4_ACL_NOT_CACHED) {
722617ba13bSMingming Cao 		posix_acl_release(EXT4_I(inode)->i_default_acl);
723617ba13bSMingming Cao 		EXT4_I(inode)->i_default_acl = EXT4_ACL_NOT_CACHED;
724ac27a0ecSDave Kleikamp 	}
725ac27a0ecSDave Kleikamp #endif
726c2ea3fdeSTheodore Ts'o 	ext4_discard_preallocations(inode);
7270390131bSFrank Mayhar 	if (EXT4_JOURNAL(inode))
728678aaf48SJan Kara 		jbd2_journal_release_jbd_inode(EXT4_SB(inode->i_sb)->s_journal,
729678aaf48SJan Kara 				       &EXT4_I(inode)->jinode);
730ac27a0ecSDave Kleikamp }
731ac27a0ecSDave Kleikamp 
/*
 * Append the quota-related mount options of @sb to @seq: the journaled
 * quota format, the journaled quota file names, and the usrquota /
 * grpquota flags.  Emits nothing when CONFIG_QUOTA is not defined.
 */
static inline void ext4_show_quota_options(struct seq_file *seq,
					   struct super_block *sb)
{
#if defined(CONFIG_QUOTA)
	struct ext4_sb_info *sbi = EXT4_SB(sb);
	const char *fmt_name;

	if (sbi->s_jquota_fmt) {
		/* Any format other than QFMT_VFS_OLD is reported as vfsv0. */
		if (sbi->s_jquota_fmt == QFMT_VFS_OLD)
			fmt_name = "vfsold";
		else
			fmt_name = "vfsv0";
		seq_printf(seq, ",jqfmt=%s", fmt_name);
	}

	if (sbi->s_qf_names[USRQUOTA])
		seq_printf(seq, ",usrjquota=%s", sbi->s_qf_names[USRQUOTA]);
	if (sbi->s_qf_names[GRPQUOTA])
		seq_printf(seq, ",grpjquota=%s", sbi->s_qf_names[GRPQUOTA]);

	if (sbi->s_mount_opt & EXT4_MOUNT_USRQUOTA)
		seq_puts(seq, ",usrquota");
	if (sbi->s_mount_opt & EXT4_MOUNT_GRPQUOTA)
		seq_puts(seq, ",grpquota");
#endif
}
755ac27a0ecSDave Kleikamp 
756d9c9bef1SMiklos Szeredi /*
757d9c9bef1SMiklos Szeredi  * Show an option if
758d9c9bef1SMiklos Szeredi  *  - it's set to a non-default value OR
759d9c9bef1SMiklos Szeredi  *  - if the per-sb default is different from the global default
760d9c9bef1SMiklos Szeredi  */
761617ba13bSMingming Cao static int ext4_show_options(struct seq_file *seq, struct vfsmount *vfs)
762ac27a0ecSDave Kleikamp {
763aa22df2cSAneesh Kumar K.V 	int def_errors;
764aa22df2cSAneesh Kumar K.V 	unsigned long def_mount_opts;
765ac27a0ecSDave Kleikamp 	struct super_block *sb = vfs->mnt_sb;
766d9c9bef1SMiklos Szeredi 	struct ext4_sb_info *sbi = EXT4_SB(sb);
767d9c9bef1SMiklos Szeredi 	struct ext4_super_block *es = sbi->s_es;
768d9c9bef1SMiklos Szeredi 
769d9c9bef1SMiklos Szeredi 	def_mount_opts = le32_to_cpu(es->s_default_mount_opts);
770aa22df2cSAneesh Kumar K.V 	def_errors     = le16_to_cpu(es->s_errors);
771d9c9bef1SMiklos Szeredi 
772d9c9bef1SMiklos Szeredi 	if (sbi->s_sb_block != 1)
773d9c9bef1SMiklos Szeredi 		seq_printf(seq, ",sb=%llu", sbi->s_sb_block);
774d9c9bef1SMiklos Szeredi 	if (test_opt(sb, MINIX_DF))
775d9c9bef1SMiklos Szeredi 		seq_puts(seq, ",minixdf");
776aa22df2cSAneesh Kumar K.V 	if (test_opt(sb, GRPID) && !(def_mount_opts & EXT4_DEFM_BSDGROUPS))
777d9c9bef1SMiklos Szeredi 		seq_puts(seq, ",grpid");
778d9c9bef1SMiklos Szeredi 	if (!test_opt(sb, GRPID) && (def_mount_opts & EXT4_DEFM_BSDGROUPS))
779d9c9bef1SMiklos Szeredi 		seq_puts(seq, ",nogrpid");
780d9c9bef1SMiklos Szeredi 	if (sbi->s_resuid != EXT4_DEF_RESUID ||
781d9c9bef1SMiklos Szeredi 	    le16_to_cpu(es->s_def_resuid) != EXT4_DEF_RESUID) {
782d9c9bef1SMiklos Szeredi 		seq_printf(seq, ",resuid=%u", sbi->s_resuid);
783d9c9bef1SMiklos Szeredi 	}
784d9c9bef1SMiklos Szeredi 	if (sbi->s_resgid != EXT4_DEF_RESGID ||
785d9c9bef1SMiklos Szeredi 	    le16_to_cpu(es->s_def_resgid) != EXT4_DEF_RESGID) {
786d9c9bef1SMiklos Szeredi 		seq_printf(seq, ",resgid=%u", sbi->s_resgid);
787d9c9bef1SMiklos Szeredi 	}
788bb4f397aSAneesh Kumar K.V 	if (test_opt(sb, ERRORS_RO)) {
789d9c9bef1SMiklos Szeredi 		if (def_errors == EXT4_ERRORS_PANIC ||
790bb4f397aSAneesh Kumar K.V 		    def_errors == EXT4_ERRORS_CONTINUE) {
791d9c9bef1SMiklos Szeredi 			seq_puts(seq, ",errors=remount-ro");
792bb4f397aSAneesh Kumar K.V 		}
793bb4f397aSAneesh Kumar K.V 	}
794aa22df2cSAneesh Kumar K.V 	if (test_opt(sb, ERRORS_CONT) && def_errors != EXT4_ERRORS_CONTINUE)
795bb4f397aSAneesh Kumar K.V 		seq_puts(seq, ",errors=continue");
796aa22df2cSAneesh Kumar K.V 	if (test_opt(sb, ERRORS_PANIC) && def_errors != EXT4_ERRORS_PANIC)
797d9c9bef1SMiklos Szeredi 		seq_puts(seq, ",errors=panic");
798aa22df2cSAneesh Kumar K.V 	if (test_opt(sb, NO_UID32) && !(def_mount_opts & EXT4_DEFM_UID16))
799d9c9bef1SMiklos Szeredi 		seq_puts(seq, ",nouid32");
800aa22df2cSAneesh Kumar K.V 	if (test_opt(sb, DEBUG) && !(def_mount_opts & EXT4_DEFM_DEBUG))
801d9c9bef1SMiklos Szeredi 		seq_puts(seq, ",debug");
802d9c9bef1SMiklos Szeredi 	if (test_opt(sb, OLDALLOC))
803d9c9bef1SMiklos Szeredi 		seq_puts(seq, ",oldalloc");
80403010a33STheodore Ts'o #ifdef CONFIG_EXT4_FS_XATTR
805aa22df2cSAneesh Kumar K.V 	if (test_opt(sb, XATTR_USER) &&
806aa22df2cSAneesh Kumar K.V 		!(def_mount_opts & EXT4_DEFM_XATTR_USER))
807d9c9bef1SMiklos Szeredi 		seq_puts(seq, ",user_xattr");
808d9c9bef1SMiklos Szeredi 	if (!test_opt(sb, XATTR_USER) &&
809d9c9bef1SMiklos Szeredi 	    (def_mount_opts & EXT4_DEFM_XATTR_USER)) {
810d9c9bef1SMiklos Szeredi 		seq_puts(seq, ",nouser_xattr");
811d9c9bef1SMiklos Szeredi 	}
812d9c9bef1SMiklos Szeredi #endif
81303010a33STheodore Ts'o #ifdef CONFIG_EXT4_FS_POSIX_ACL
814aa22df2cSAneesh Kumar K.V 	if (test_opt(sb, POSIX_ACL) && !(def_mount_opts & EXT4_DEFM_ACL))
815d9c9bef1SMiklos Szeredi 		seq_puts(seq, ",acl");
816d9c9bef1SMiklos Szeredi 	if (!test_opt(sb, POSIX_ACL) && (def_mount_opts & EXT4_DEFM_ACL))
817d9c9bef1SMiklos Szeredi 		seq_puts(seq, ",noacl");
818d9c9bef1SMiklos Szeredi #endif
81930773840STheodore Ts'o 	if (sbi->s_commit_interval != JBD2_DEFAULT_MAX_COMMIT_AGE*HZ) {
820d9c9bef1SMiklos Szeredi 		seq_printf(seq, ",commit=%u",
821d9c9bef1SMiklos Szeredi 			   (unsigned) (sbi->s_commit_interval / HZ));
822d9c9bef1SMiklos Szeredi 	}
82330773840STheodore Ts'o 	if (sbi->s_min_batch_time != EXT4_DEF_MIN_BATCH_TIME) {
82430773840STheodore Ts'o 		seq_printf(seq, ",min_batch_time=%u",
82530773840STheodore Ts'o 			   (unsigned) sbi->s_min_batch_time);
82630773840STheodore Ts'o 	}
82730773840STheodore Ts'o 	if (sbi->s_max_batch_time != EXT4_DEF_MAX_BATCH_TIME) {
82830773840STheodore Ts'o 		seq_printf(seq, ",max_batch_time=%u",
82930773840STheodore Ts'o 			   (unsigned) sbi->s_min_batch_time);
83030773840STheodore Ts'o 	}
83130773840STheodore Ts'o 
832571640caSEric Sandeen 	/*
833571640caSEric Sandeen 	 * We're changing the default of barrier mount option, so
834571640caSEric Sandeen 	 * let's always display its mount state so it's clear what its
835571640caSEric Sandeen 	 * status is.
836571640caSEric Sandeen 	 */
837571640caSEric Sandeen 	seq_puts(seq, ",barrier=");
838571640caSEric Sandeen 	seq_puts(seq, test_opt(sb, BARRIER) ? "1" : "0");
839cd0b6a39STheodore Ts'o 	if (test_opt(sb, JOURNAL_ASYNC_COMMIT))
840cd0b6a39STheodore Ts'o 		seq_puts(seq, ",journal_async_commit");
841d9c9bef1SMiklos Szeredi 	if (test_opt(sb, NOBH))
842d9c9bef1SMiklos Szeredi 		seq_puts(seq, ",nobh");
84325ec56b5SJean Noel Cordenner 	if (test_opt(sb, I_VERSION))
84425ec56b5SJean Noel Cordenner 		seq_puts(seq, ",i_version");
845dd919b98SAneesh Kumar K.V 	if (!test_opt(sb, DELALLOC))
846dd919b98SAneesh Kumar K.V 		seq_puts(seq, ",nodelalloc");
847dd919b98SAneesh Kumar K.V 
848ac27a0ecSDave Kleikamp 
849cb45bbe4SMiklos Szeredi 	if (sbi->s_stripe)
850cb45bbe4SMiklos Szeredi 		seq_printf(seq, ",stripe=%lu", sbi->s_stripe);
851aa22df2cSAneesh Kumar K.V 	/*
852aa22df2cSAneesh Kumar K.V 	 * journal mode get enabled in different ways
853aa22df2cSAneesh Kumar K.V 	 * So just print the value even if we didn't specify it
854aa22df2cSAneesh Kumar K.V 	 */
855617ba13bSMingming Cao 	if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_JOURNAL_DATA)
856ac27a0ecSDave Kleikamp 		seq_puts(seq, ",data=journal");
857617ba13bSMingming Cao 	else if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_ORDERED_DATA)
858ac27a0ecSDave Kleikamp 		seq_puts(seq, ",data=ordered");
859617ba13bSMingming Cao 	else if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_WRITEBACK_DATA)
860ac27a0ecSDave Kleikamp 		seq_puts(seq, ",data=writeback");
861ac27a0ecSDave Kleikamp 
862240799cdSTheodore Ts'o 	if (sbi->s_inode_readahead_blks != EXT4_DEF_INODE_READAHEAD_BLKS)
863240799cdSTheodore Ts'o 		seq_printf(seq, ",inode_readahead_blks=%u",
864240799cdSTheodore Ts'o 			   sbi->s_inode_readahead_blks);
865240799cdSTheodore Ts'o 
8665bf5683aSHidehiro Kawai 	if (test_opt(sb, DATA_ERR_ABORT))
8675bf5683aSHidehiro Kawai 		seq_puts(seq, ",data_err=abort");
8685bf5683aSHidehiro Kawai 
869afd4672dSTheodore Ts'o 	if (test_opt(sb, NO_AUTO_DA_ALLOC))
870*06705bffSTheodore Ts'o 		seq_puts(seq, ",noauto_da_alloc");
871afd4672dSTheodore Ts'o 
872617ba13bSMingming Cao 	ext4_show_quota_options(seq, sb);
873ac27a0ecSDave Kleikamp 	return 0;
874ac27a0ecSDave Kleikamp }
875ac27a0ecSDave Kleikamp 
876ac27a0ecSDave Kleikamp 
8771b961ac0SChristoph Hellwig static struct inode *ext4_nfs_get_inode(struct super_block *sb,
8781b961ac0SChristoph Hellwig 		u64 ino, u32 generation)
879ac27a0ecSDave Kleikamp {
880ac27a0ecSDave Kleikamp 	struct inode *inode;
881ac27a0ecSDave Kleikamp 
882617ba13bSMingming Cao 	if (ino < EXT4_FIRST_INO(sb) && ino != EXT4_ROOT_INO)
883ac27a0ecSDave Kleikamp 		return ERR_PTR(-ESTALE);
884617ba13bSMingming Cao 	if (ino > le32_to_cpu(EXT4_SB(sb)->s_es->s_inodes_count))
885ac27a0ecSDave Kleikamp 		return ERR_PTR(-ESTALE);
886ac27a0ecSDave Kleikamp 
887ac27a0ecSDave Kleikamp 	/* iget isn't really right if the inode is currently unallocated!!
888ac27a0ecSDave Kleikamp 	 *
889617ba13bSMingming Cao 	 * ext4_read_inode will return a bad_inode if the inode had been
890ac27a0ecSDave Kleikamp 	 * deleted, so we should be safe.
891ac27a0ecSDave Kleikamp 	 *
892ac27a0ecSDave Kleikamp 	 * Currently we don't know the generation for parent directory, so
893ac27a0ecSDave Kleikamp 	 * a generation of 0 means "accept any"
894ac27a0ecSDave Kleikamp 	 */
8951d1fe1eeSDavid Howells 	inode = ext4_iget(sb, ino);
8961d1fe1eeSDavid Howells 	if (IS_ERR(inode))
8971d1fe1eeSDavid Howells 		return ERR_CAST(inode);
8981d1fe1eeSDavid Howells 	if (generation && inode->i_generation != generation) {
899ac27a0ecSDave Kleikamp 		iput(inode);
900ac27a0ecSDave Kleikamp 		return ERR_PTR(-ESTALE);
901ac27a0ecSDave Kleikamp 	}
9021b961ac0SChristoph Hellwig 
9031b961ac0SChristoph Hellwig 	return inode;
904ac27a0ecSDave Kleikamp }
9051b961ac0SChristoph Hellwig 
9061b961ac0SChristoph Hellwig static struct dentry *ext4_fh_to_dentry(struct super_block *sb, struct fid *fid,
9071b961ac0SChristoph Hellwig 		int fh_len, int fh_type)
9081b961ac0SChristoph Hellwig {
9091b961ac0SChristoph Hellwig 	return generic_fh_to_dentry(sb, fid, fh_len, fh_type,
9101b961ac0SChristoph Hellwig 				    ext4_nfs_get_inode);
9111b961ac0SChristoph Hellwig }
9121b961ac0SChristoph Hellwig 
9131b961ac0SChristoph Hellwig static struct dentry *ext4_fh_to_parent(struct super_block *sb, struct fid *fid,
9141b961ac0SChristoph Hellwig 		int fh_len, int fh_type)
9151b961ac0SChristoph Hellwig {
9161b961ac0SChristoph Hellwig 	return generic_fh_to_parent(sb, fid, fh_len, fh_type,
9171b961ac0SChristoph Hellwig 				    ext4_nfs_get_inode);
918ac27a0ecSDave Kleikamp }
919ac27a0ecSDave Kleikamp 
920c39a7f84SToshiyuki Okajima /*
921c39a7f84SToshiyuki Okajima  * Try to release metadata pages (indirect blocks, directories) which are
922c39a7f84SToshiyuki Okajima  * mapped via the block device.  Since these pages could have journal heads
923c39a7f84SToshiyuki Okajima  * which would prevent try_to_free_buffers() from freeing them, we must use
924c39a7f84SToshiyuki Okajima  * jbd2 layer's try_to_free_buffers() function to release them.
925c39a7f84SToshiyuki Okajima  */
926c39a7f84SToshiyuki Okajima static int bdev_try_to_free_page(struct super_block *sb, struct page *page, gfp_t wait)
927c39a7f84SToshiyuki Okajima {
928c39a7f84SToshiyuki Okajima 	journal_t *journal = EXT4_SB(sb)->s_journal;
929c39a7f84SToshiyuki Okajima 
930c39a7f84SToshiyuki Okajima 	WARN_ON(PageChecked(page));
931c39a7f84SToshiyuki Okajima 	if (!page_has_buffers(page))
932c39a7f84SToshiyuki Okajima 		return 0;
933c39a7f84SToshiyuki Okajima 	if (journal)
934c39a7f84SToshiyuki Okajima 		return jbd2_journal_try_to_free_buffers(journal, page,
935c39a7f84SToshiyuki Okajima 							wait & ~__GFP_WAIT);
936c39a7f84SToshiyuki Okajima 	return try_to_free_buffers(page);
937c39a7f84SToshiyuki Okajima }
938c39a7f84SToshiyuki Okajima 
939ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
/* Human-readable name of quota type @t: "user" for USRQUOTA, else "group". */
#define QTYPE2NAME(t) ((t) == USRQUOTA ? "user" : "group")
/*
 * Select the identifier <on>USRJQUOTA or <on>GRPJQUOTA according to quota
 * type @t, where @on is an identifier prefix.  The prefix must be pasted
 * bare: ## joins the tokens directly next to it, so "(on)##X" would try
 * to paste ")" onto X, which is not a valid preprocessing token.
 */
#define QTYPE2MOPT(on, t) ((t) == USRQUOTA ? (on##USRJQUOTA) : (on##GRPJQUOTA))
942ac27a0ecSDave Kleikamp 
943617ba13bSMingming Cao static int ext4_write_dquot(struct dquot *dquot);
944617ba13bSMingming Cao static int ext4_acquire_dquot(struct dquot *dquot);
945617ba13bSMingming Cao static int ext4_release_dquot(struct dquot *dquot);
946617ba13bSMingming Cao static int ext4_mark_dquot_dirty(struct dquot *dquot);
947617ba13bSMingming Cao static int ext4_write_info(struct super_block *sb, int type);
9486f28e087SJan Kara static int ext4_quota_on(struct super_block *sb, int type, int format_id,
9496f28e087SJan Kara 				char *path, int remount);
950617ba13bSMingming Cao static int ext4_quota_on_mount(struct super_block *sb, int type);
951617ba13bSMingming Cao static ssize_t ext4_quota_read(struct super_block *sb, int type, char *data,
952ac27a0ecSDave Kleikamp 			       size_t len, loff_t off);
953617ba13bSMingming Cao static ssize_t ext4_quota_write(struct super_block *sb, int type,
954ac27a0ecSDave Kleikamp 				const char *data, size_t len, loff_t off);
955ac27a0ecSDave Kleikamp 
956617ba13bSMingming Cao static struct dquot_operations ext4_quota_operations = {
957edf72453SJan Kara 	.initialize	= dquot_initialize,
958edf72453SJan Kara 	.drop		= dquot_drop,
959ac27a0ecSDave Kleikamp 	.alloc_space	= dquot_alloc_space,
96060e58e0fSMingming Cao 	.reserve_space	= dquot_reserve_space,
96160e58e0fSMingming Cao 	.claim_space	= dquot_claim_space,
96260e58e0fSMingming Cao 	.release_rsv	= dquot_release_reserved_space,
96360e58e0fSMingming Cao 	.get_reserved_space = ext4_get_reserved_space,
964ac27a0ecSDave Kleikamp 	.alloc_inode	= dquot_alloc_inode,
965ac27a0ecSDave Kleikamp 	.free_space	= dquot_free_space,
966ac27a0ecSDave Kleikamp 	.free_inode	= dquot_free_inode,
967ac27a0ecSDave Kleikamp 	.transfer	= dquot_transfer,
968617ba13bSMingming Cao 	.write_dquot	= ext4_write_dquot,
969617ba13bSMingming Cao 	.acquire_dquot	= ext4_acquire_dquot,
970617ba13bSMingming Cao 	.release_dquot	= ext4_release_dquot,
971617ba13bSMingming Cao 	.mark_dirty	= ext4_mark_dquot_dirty,
972a5b5ee32SJan Kara 	.write_info	= ext4_write_info,
973a5b5ee32SJan Kara 	.alloc_dquot	= dquot_alloc,
974a5b5ee32SJan Kara 	.destroy_dquot	= dquot_destroy,
975ac27a0ecSDave Kleikamp };
976ac27a0ecSDave Kleikamp 
977617ba13bSMingming Cao static struct quotactl_ops ext4_qctl_operations = {
978617ba13bSMingming Cao 	.quota_on	= ext4_quota_on,
979ac27a0ecSDave Kleikamp 	.quota_off	= vfs_quota_off,
980ac27a0ecSDave Kleikamp 	.quota_sync	= vfs_quota_sync,
981ac27a0ecSDave Kleikamp 	.get_info	= vfs_get_dqinfo,
982ac27a0ecSDave Kleikamp 	.set_info	= vfs_set_dqinfo,
983ac27a0ecSDave Kleikamp 	.get_dqblk	= vfs_get_dqblk,
984ac27a0ecSDave Kleikamp 	.set_dqblk	= vfs_set_dqblk
985ac27a0ecSDave Kleikamp };
986ac27a0ecSDave Kleikamp #endif
987ac27a0ecSDave Kleikamp 
988ee9b6d61SJosef 'Jeff' Sipek static const struct super_operations ext4_sops = {
989617ba13bSMingming Cao 	.alloc_inode	= ext4_alloc_inode,
990617ba13bSMingming Cao 	.destroy_inode	= ext4_destroy_inode,
991617ba13bSMingming Cao 	.write_inode	= ext4_write_inode,
992617ba13bSMingming Cao 	.dirty_inode	= ext4_dirty_inode,
993617ba13bSMingming Cao 	.delete_inode	= ext4_delete_inode,
994617ba13bSMingming Cao 	.put_super	= ext4_put_super,
995617ba13bSMingming Cao 	.write_super	= ext4_write_super,
996617ba13bSMingming Cao 	.sync_fs	= ext4_sync_fs,
997c4be0c1dSTakashi Sato 	.freeze_fs	= ext4_freeze,
998c4be0c1dSTakashi Sato 	.unfreeze_fs	= ext4_unfreeze,
999617ba13bSMingming Cao 	.statfs		= ext4_statfs,
1000617ba13bSMingming Cao 	.remount_fs	= ext4_remount,
1001617ba13bSMingming Cao 	.clear_inode	= ext4_clear_inode,
1002617ba13bSMingming Cao 	.show_options	= ext4_show_options,
1003ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
1004617ba13bSMingming Cao 	.quota_read	= ext4_quota_read,
1005617ba13bSMingming Cao 	.quota_write	= ext4_quota_write,
1006ac27a0ecSDave Kleikamp #endif
1007c39a7f84SToshiyuki Okajima 	.bdev_try_to_free_page = bdev_try_to_free_page,
1008ac27a0ecSDave Kleikamp };
1009ac27a0ecSDave Kleikamp 
101039655164SChristoph Hellwig static const struct export_operations ext4_export_ops = {
10111b961ac0SChristoph Hellwig 	.fh_to_dentry = ext4_fh_to_dentry,
10121b961ac0SChristoph Hellwig 	.fh_to_parent = ext4_fh_to_parent,
1013617ba13bSMingming Cao 	.get_parent = ext4_get_parent,
1014ac27a0ecSDave Kleikamp };
1015ac27a0ecSDave Kleikamp 
/*
 * Mount option identifiers, paired with their textual patterns in the
 * tokens[] table.  Enumerator order (and therefore each value) is kept
 * unchanged.
 */
enum {
	Opt_bsd_df,
	Opt_minix_df,
	Opt_grpid,
	Opt_nogrpid,
	Opt_resgid,
	Opt_resuid,
	Opt_sb,
	Opt_err_cont,
	Opt_err_panic,
	Opt_err_ro,
	Opt_nouid32,
	Opt_debug,
	Opt_oldalloc,
	Opt_orlov,
	Opt_user_xattr,
	Opt_nouser_xattr,
	Opt_acl,
	Opt_noacl,
	Opt_auto_da_alloc,
	Opt_noauto_da_alloc,
	Opt_noload,
	Opt_nobh,
	Opt_bh,
	Opt_commit,
	Opt_min_batch_time,
	Opt_max_batch_time,
	Opt_journal_update,
	Opt_journal_dev,
	Opt_journal_checksum,
	Opt_journal_async_commit,
	Opt_abort,
	Opt_data_journal,
	Opt_data_ordered,
	Opt_data_writeback,
	Opt_data_err_abort,
	Opt_data_err_ignore,
	Opt_usrjquota,
	Opt_grpjquota,
	Opt_offusrjquota,
	Opt_offgrpjquota,
	Opt_jqfmt_vfsold,
	Opt_jqfmt_vfsv0,
	Opt_quota,
	Opt_noquota,
	Opt_ignore,
	Opt_barrier,
	Opt_nobarrier,
	Opt_err,
	Opt_resize,
	Opt_usrquota,
	Opt_grpquota,
	Opt_i_version,
	Opt_stripe,
	Opt_delalloc,
	Opt_nodelalloc,
	Opt_inode_readahead_blks,
	Opt_journal_ioprio
};
1034ac27a0ecSDave Kleikamp 
1035a447c093SSteven Whitehouse static const match_table_t tokens = {
1036ac27a0ecSDave Kleikamp 	{Opt_bsd_df, "bsddf"},
1037ac27a0ecSDave Kleikamp 	{Opt_minix_df, "minixdf"},
1038ac27a0ecSDave Kleikamp 	{Opt_grpid, "grpid"},
1039ac27a0ecSDave Kleikamp 	{Opt_grpid, "bsdgroups"},
1040ac27a0ecSDave Kleikamp 	{Opt_nogrpid, "nogrpid"},
1041ac27a0ecSDave Kleikamp 	{Opt_nogrpid, "sysvgroups"},
1042ac27a0ecSDave Kleikamp 	{Opt_resgid, "resgid=%u"},
1043ac27a0ecSDave Kleikamp 	{Opt_resuid, "resuid=%u"},
1044ac27a0ecSDave Kleikamp 	{Opt_sb, "sb=%u"},
1045ac27a0ecSDave Kleikamp 	{Opt_err_cont, "errors=continue"},
1046ac27a0ecSDave Kleikamp 	{Opt_err_panic, "errors=panic"},
1047ac27a0ecSDave Kleikamp 	{Opt_err_ro, "errors=remount-ro"},
1048ac27a0ecSDave Kleikamp 	{Opt_nouid32, "nouid32"},
1049ac27a0ecSDave Kleikamp 	{Opt_debug, "debug"},
1050ac27a0ecSDave Kleikamp 	{Opt_oldalloc, "oldalloc"},
1051ac27a0ecSDave Kleikamp 	{Opt_orlov, "orlov"},
1052ac27a0ecSDave Kleikamp 	{Opt_user_xattr, "user_xattr"},
1053ac27a0ecSDave Kleikamp 	{Opt_nouser_xattr, "nouser_xattr"},
1054ac27a0ecSDave Kleikamp 	{Opt_acl, "acl"},
1055ac27a0ecSDave Kleikamp 	{Opt_noacl, "noacl"},
1056ac27a0ecSDave Kleikamp 	{Opt_noload, "noload"},
1057ac27a0ecSDave Kleikamp 	{Opt_nobh, "nobh"},
1058ac27a0ecSDave Kleikamp 	{Opt_bh, "bh"},
1059ac27a0ecSDave Kleikamp 	{Opt_commit, "commit=%u"},
106030773840STheodore Ts'o 	{Opt_min_batch_time, "min_batch_time=%u"},
106130773840STheodore Ts'o 	{Opt_max_batch_time, "max_batch_time=%u"},
1062ac27a0ecSDave Kleikamp 	{Opt_journal_update, "journal=update"},
1063ac27a0ecSDave Kleikamp 	{Opt_journal_dev, "journal_dev=%u"},
1064818d276cSGirish Shilamkar 	{Opt_journal_checksum, "journal_checksum"},
1065818d276cSGirish Shilamkar 	{Opt_journal_async_commit, "journal_async_commit"},
1066ac27a0ecSDave Kleikamp 	{Opt_abort, "abort"},
1067ac27a0ecSDave Kleikamp 	{Opt_data_journal, "data=journal"},
1068ac27a0ecSDave Kleikamp 	{Opt_data_ordered, "data=ordered"},
1069ac27a0ecSDave Kleikamp 	{Opt_data_writeback, "data=writeback"},
10705bf5683aSHidehiro Kawai 	{Opt_data_err_abort, "data_err=abort"},
10715bf5683aSHidehiro Kawai 	{Opt_data_err_ignore, "data_err=ignore"},
1072ac27a0ecSDave Kleikamp 	{Opt_offusrjquota, "usrjquota="},
1073ac27a0ecSDave Kleikamp 	{Opt_usrjquota, "usrjquota=%s"},
1074ac27a0ecSDave Kleikamp 	{Opt_offgrpjquota, "grpjquota="},
1075ac27a0ecSDave Kleikamp 	{Opt_grpjquota, "grpjquota=%s"},
1076ac27a0ecSDave Kleikamp 	{Opt_jqfmt_vfsold, "jqfmt=vfsold"},
1077ac27a0ecSDave Kleikamp 	{Opt_jqfmt_vfsv0, "jqfmt=vfsv0"},
1078ac27a0ecSDave Kleikamp 	{Opt_grpquota, "grpquota"},
1079ac27a0ecSDave Kleikamp 	{Opt_noquota, "noquota"},
1080ac27a0ecSDave Kleikamp 	{Opt_quota, "quota"},
1081ac27a0ecSDave Kleikamp 	{Opt_usrquota, "usrquota"},
1082ac27a0ecSDave Kleikamp 	{Opt_barrier, "barrier=%u"},
1083*06705bffSTheodore Ts'o 	{Opt_barrier, "barrier"},
1084*06705bffSTheodore Ts'o 	{Opt_nobarrier, "nobarrier"},
108525ec56b5SJean Noel Cordenner 	{Opt_i_version, "i_version"},
1086c9de560dSAlex Tomas 	{Opt_stripe, "stripe=%u"},
1087ac27a0ecSDave Kleikamp 	{Opt_resize, "resize"},
108864769240SAlex Tomas 	{Opt_delalloc, "delalloc"},
1089dd919b98SAneesh Kumar K.V 	{Opt_nodelalloc, "nodelalloc"},
1090240799cdSTheodore Ts'o 	{Opt_inode_readahead_blks, "inode_readahead_blks=%u"},
1091b3881f74STheodore Ts'o 	{Opt_journal_ioprio, "journal_ioprio=%u"},
1092afd4672dSTheodore Ts'o 	{Opt_auto_da_alloc, "auto_da_alloc=%u"},
1093*06705bffSTheodore Ts'o 	{Opt_auto_da_alloc, "auto_da_alloc"},
1094*06705bffSTheodore Ts'o 	{Opt_noauto_da_alloc, "noauto_da_alloc"},
1095f3f12faaSJosef Bacik 	{Opt_err, NULL},
1096ac27a0ecSDave Kleikamp };
1097ac27a0ecSDave Kleikamp 
1098617ba13bSMingming Cao static ext4_fsblk_t get_sb_block(void **data)
1099ac27a0ecSDave Kleikamp {
1100617ba13bSMingming Cao 	ext4_fsblk_t	sb_block;
1101ac27a0ecSDave Kleikamp 	char		*options = (char *) *data;
1102ac27a0ecSDave Kleikamp 
1103ac27a0ecSDave Kleikamp 	if (!options || strncmp(options, "sb=", 3) != 0)
1104ac27a0ecSDave Kleikamp 		return 1;	/* Default location */
1105ac27a0ecSDave Kleikamp 	options += 3;
1106617ba13bSMingming Cao 	/*todo: use simple_strtoll with >32bit ext4 */
1107ac27a0ecSDave Kleikamp 	sb_block = simple_strtoul(options, &options, 0);
1108ac27a0ecSDave Kleikamp 	if (*options && *options != ',') {
11094776004fSTheodore Ts'o 		printk(KERN_ERR "EXT4-fs: Invalid sb specification: %s\n",
1110ac27a0ecSDave Kleikamp 		       (char *) *data);
1111ac27a0ecSDave Kleikamp 		return 1;
1112ac27a0ecSDave Kleikamp 	}
1113ac27a0ecSDave Kleikamp 	if (*options == ',')
1114ac27a0ecSDave Kleikamp 		options++;
1115ac27a0ecSDave Kleikamp 	*data = (void *) options;
1116ac27a0ecSDave Kleikamp 	return sb_block;
1117ac27a0ecSDave Kleikamp }
1118ac27a0ecSDave Kleikamp 
/* Default journal I/O priority value: best-effort class (IOPRIO_CLASS_BE), level 3. */
#define DEFAULT_JOURNAL_IOPRIO	(IOPRIO_PRIO_VALUE(IOPRIO_CLASS_BE, 3))
1120b3881f74STheodore Ts'o 
1121ac27a0ecSDave Kleikamp static int parse_options(char *options, struct super_block *sb,
1122c3191067STheodore Ts'o 			 unsigned long *journal_devnum,
1123b3881f74STheodore Ts'o 			 unsigned int *journal_ioprio,
1124617ba13bSMingming Cao 			 ext4_fsblk_t *n_blocks_count, int is_remount)
1125ac27a0ecSDave Kleikamp {
1126617ba13bSMingming Cao 	struct ext4_sb_info *sbi = EXT4_SB(sb);
1127ac27a0ecSDave Kleikamp 	char *p;
1128ac27a0ecSDave Kleikamp 	substring_t args[MAX_OPT_ARGS];
1129ac27a0ecSDave Kleikamp 	int data_opt = 0;
1130ac27a0ecSDave Kleikamp 	int option;
1131ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
1132dfc5d03fSJan Kara 	int qtype, qfmt;
1133ac27a0ecSDave Kleikamp 	char *qname;
1134ac27a0ecSDave Kleikamp #endif
1135ac27a0ecSDave Kleikamp 
1136ac27a0ecSDave Kleikamp 	if (!options)
1137ac27a0ecSDave Kleikamp 		return 1;
1138ac27a0ecSDave Kleikamp 
1139ac27a0ecSDave Kleikamp 	while ((p = strsep(&options, ",")) != NULL) {
1140ac27a0ecSDave Kleikamp 		int token;
1141ac27a0ecSDave Kleikamp 		if (!*p)
1142ac27a0ecSDave Kleikamp 			continue;
1143ac27a0ecSDave Kleikamp 
1144ac27a0ecSDave Kleikamp 		token = match_token(p, tokens, args);
1145ac27a0ecSDave Kleikamp 		switch (token) {
1146ac27a0ecSDave Kleikamp 		case Opt_bsd_df:
1147ac27a0ecSDave Kleikamp 			clear_opt(sbi->s_mount_opt, MINIX_DF);
1148ac27a0ecSDave Kleikamp 			break;
1149ac27a0ecSDave Kleikamp 		case Opt_minix_df:
1150ac27a0ecSDave Kleikamp 			set_opt(sbi->s_mount_opt, MINIX_DF);
1151ac27a0ecSDave Kleikamp 			break;
1152ac27a0ecSDave Kleikamp 		case Opt_grpid:
1153ac27a0ecSDave Kleikamp 			set_opt(sbi->s_mount_opt, GRPID);
1154ac27a0ecSDave Kleikamp 			break;
1155ac27a0ecSDave Kleikamp 		case Opt_nogrpid:
1156ac27a0ecSDave Kleikamp 			clear_opt(sbi->s_mount_opt, GRPID);
1157ac27a0ecSDave Kleikamp 			break;
1158ac27a0ecSDave Kleikamp 		case Opt_resuid:
1159ac27a0ecSDave Kleikamp 			if (match_int(&args[0], &option))
1160ac27a0ecSDave Kleikamp 				return 0;
1161ac27a0ecSDave Kleikamp 			sbi->s_resuid = option;
1162ac27a0ecSDave Kleikamp 			break;
1163ac27a0ecSDave Kleikamp 		case Opt_resgid:
1164ac27a0ecSDave Kleikamp 			if (match_int(&args[0], &option))
1165ac27a0ecSDave Kleikamp 				return 0;
1166ac27a0ecSDave Kleikamp 			sbi->s_resgid = option;
1167ac27a0ecSDave Kleikamp 			break;
1168ac27a0ecSDave Kleikamp 		case Opt_sb:
1169ac27a0ecSDave Kleikamp 			/* handled by get_sb_block() instead of here */
1170ac27a0ecSDave Kleikamp 			/* *sb_block = match_int(&args[0]); */
1171ac27a0ecSDave Kleikamp 			break;
1172ac27a0ecSDave Kleikamp 		case Opt_err_panic:
1173ac27a0ecSDave Kleikamp 			clear_opt(sbi->s_mount_opt, ERRORS_CONT);
1174ac27a0ecSDave Kleikamp 			clear_opt(sbi->s_mount_opt, ERRORS_RO);
1175ac27a0ecSDave Kleikamp 			set_opt(sbi->s_mount_opt, ERRORS_PANIC);
1176ac27a0ecSDave Kleikamp 			break;
1177ac27a0ecSDave Kleikamp 		case Opt_err_ro:
1178ac27a0ecSDave Kleikamp 			clear_opt(sbi->s_mount_opt, ERRORS_CONT);
1179ac27a0ecSDave Kleikamp 			clear_opt(sbi->s_mount_opt, ERRORS_PANIC);
1180ac27a0ecSDave Kleikamp 			set_opt(sbi->s_mount_opt, ERRORS_RO);
1181ac27a0ecSDave Kleikamp 			break;
1182ac27a0ecSDave Kleikamp 		case Opt_err_cont:
1183ac27a0ecSDave Kleikamp 			clear_opt(sbi->s_mount_opt, ERRORS_RO);
1184ac27a0ecSDave Kleikamp 			clear_opt(sbi->s_mount_opt, ERRORS_PANIC);
1185ac27a0ecSDave Kleikamp 			set_opt(sbi->s_mount_opt, ERRORS_CONT);
1186ac27a0ecSDave Kleikamp 			break;
1187ac27a0ecSDave Kleikamp 		case Opt_nouid32:
1188ac27a0ecSDave Kleikamp 			set_opt(sbi->s_mount_opt, NO_UID32);
1189ac27a0ecSDave Kleikamp 			break;
1190ac27a0ecSDave Kleikamp 		case Opt_debug:
1191ac27a0ecSDave Kleikamp 			set_opt(sbi->s_mount_opt, DEBUG);
1192ac27a0ecSDave Kleikamp 			break;
1193ac27a0ecSDave Kleikamp 		case Opt_oldalloc:
1194ac27a0ecSDave Kleikamp 			set_opt(sbi->s_mount_opt, OLDALLOC);
1195ac27a0ecSDave Kleikamp 			break;
1196ac27a0ecSDave Kleikamp 		case Opt_orlov:
1197ac27a0ecSDave Kleikamp 			clear_opt(sbi->s_mount_opt, OLDALLOC);
1198ac27a0ecSDave Kleikamp 			break;
119903010a33STheodore Ts'o #ifdef CONFIG_EXT4_FS_XATTR
1200ac27a0ecSDave Kleikamp 		case Opt_user_xattr:
1201ac27a0ecSDave Kleikamp 			set_opt(sbi->s_mount_opt, XATTR_USER);
1202ac27a0ecSDave Kleikamp 			break;
1203ac27a0ecSDave Kleikamp 		case Opt_nouser_xattr:
1204ac27a0ecSDave Kleikamp 			clear_opt(sbi->s_mount_opt, XATTR_USER);
1205ac27a0ecSDave Kleikamp 			break;
1206ac27a0ecSDave Kleikamp #else
1207ac27a0ecSDave Kleikamp 		case Opt_user_xattr:
1208ac27a0ecSDave Kleikamp 		case Opt_nouser_xattr:
12094776004fSTheodore Ts'o 			printk(KERN_ERR "EXT4 (no)user_xattr options "
12104776004fSTheodore Ts'o 			       "not supported\n");
1211ac27a0ecSDave Kleikamp 			break;
1212ac27a0ecSDave Kleikamp #endif
121303010a33STheodore Ts'o #ifdef CONFIG_EXT4_FS_POSIX_ACL
1214ac27a0ecSDave Kleikamp 		case Opt_acl:
1215ac27a0ecSDave Kleikamp 			set_opt(sbi->s_mount_opt, POSIX_ACL);
1216ac27a0ecSDave Kleikamp 			break;
1217ac27a0ecSDave Kleikamp 		case Opt_noacl:
1218ac27a0ecSDave Kleikamp 			clear_opt(sbi->s_mount_opt, POSIX_ACL);
1219ac27a0ecSDave Kleikamp 			break;
1220ac27a0ecSDave Kleikamp #else
1221ac27a0ecSDave Kleikamp 		case Opt_acl:
1222ac27a0ecSDave Kleikamp 		case Opt_noacl:
12234776004fSTheodore Ts'o 			printk(KERN_ERR "EXT4 (no)acl options "
12244776004fSTheodore Ts'o 			       "not supported\n");
1225ac27a0ecSDave Kleikamp 			break;
1226ac27a0ecSDave Kleikamp #endif
1227ac27a0ecSDave Kleikamp 		case Opt_journal_update:
1228ac27a0ecSDave Kleikamp 			/* @@@ FIXME */
1229ac27a0ecSDave Kleikamp 			/* Eventually we will want to be able to create
1230ac27a0ecSDave Kleikamp 			   a journal file here.  For now, only allow the
1231ac27a0ecSDave Kleikamp 			   user to specify an existing inode to be the
1232ac27a0ecSDave Kleikamp 			   journal file. */
1233ac27a0ecSDave Kleikamp 			if (is_remount) {
1234617ba13bSMingming Cao 				printk(KERN_ERR "EXT4-fs: cannot specify "
1235ac27a0ecSDave Kleikamp 				       "journal on remount\n");
1236ac27a0ecSDave Kleikamp 				return 0;
1237ac27a0ecSDave Kleikamp 			}
1238ac27a0ecSDave Kleikamp 			set_opt(sbi->s_mount_opt, UPDATE_JOURNAL);
1239ac27a0ecSDave Kleikamp 			break;
1240ac27a0ecSDave Kleikamp 		case Opt_journal_dev:
1241ac27a0ecSDave Kleikamp 			if (is_remount) {
1242617ba13bSMingming Cao 				printk(KERN_ERR "EXT4-fs: cannot specify "
1243ac27a0ecSDave Kleikamp 				       "journal on remount\n");
1244ac27a0ecSDave Kleikamp 				return 0;
1245ac27a0ecSDave Kleikamp 			}
1246ac27a0ecSDave Kleikamp 			if (match_int(&args[0], &option))
1247ac27a0ecSDave Kleikamp 				return 0;
1248ac27a0ecSDave Kleikamp 			*journal_devnum = option;
1249ac27a0ecSDave Kleikamp 			break;
1250818d276cSGirish Shilamkar 		case Opt_journal_checksum:
1251818d276cSGirish Shilamkar 			set_opt(sbi->s_mount_opt, JOURNAL_CHECKSUM);
1252818d276cSGirish Shilamkar 			break;
1253818d276cSGirish Shilamkar 		case Opt_journal_async_commit:
1254818d276cSGirish Shilamkar 			set_opt(sbi->s_mount_opt, JOURNAL_ASYNC_COMMIT);
1255818d276cSGirish Shilamkar 			set_opt(sbi->s_mount_opt, JOURNAL_CHECKSUM);
1256818d276cSGirish Shilamkar 			break;
1257ac27a0ecSDave Kleikamp 		case Opt_noload:
1258ac27a0ecSDave Kleikamp 			set_opt(sbi->s_mount_opt, NOLOAD);
1259ac27a0ecSDave Kleikamp 			break;
1260ac27a0ecSDave Kleikamp 		case Opt_commit:
1261ac27a0ecSDave Kleikamp 			if (match_int(&args[0], &option))
1262ac27a0ecSDave Kleikamp 				return 0;
1263ac27a0ecSDave Kleikamp 			if (option < 0)
1264ac27a0ecSDave Kleikamp 				return 0;
1265ac27a0ecSDave Kleikamp 			if (option == 0)
1266cd02ff0bSMingming Cao 				option = JBD2_DEFAULT_MAX_COMMIT_AGE;
1267ac27a0ecSDave Kleikamp 			sbi->s_commit_interval = HZ * option;
1268ac27a0ecSDave Kleikamp 			break;
126930773840STheodore Ts'o 		case Opt_max_batch_time:
127030773840STheodore Ts'o 			if (match_int(&args[0], &option))
127130773840STheodore Ts'o 				return 0;
127230773840STheodore Ts'o 			if (option < 0)
127330773840STheodore Ts'o 				return 0;
127430773840STheodore Ts'o 			if (option == 0)
127530773840STheodore Ts'o 				option = EXT4_DEF_MAX_BATCH_TIME;
127630773840STheodore Ts'o 			sbi->s_max_batch_time = option;
127730773840STheodore Ts'o 			break;
127830773840STheodore Ts'o 		case Opt_min_batch_time:
127930773840STheodore Ts'o 			if (match_int(&args[0], &option))
128030773840STheodore Ts'o 				return 0;
128130773840STheodore Ts'o 			if (option < 0)
128230773840STheodore Ts'o 				return 0;
128330773840STheodore Ts'o 			sbi->s_min_batch_time = option;
128430773840STheodore Ts'o 			break;
1285ac27a0ecSDave Kleikamp 		case Opt_data_journal:
1286617ba13bSMingming Cao 			data_opt = EXT4_MOUNT_JOURNAL_DATA;
1287ac27a0ecSDave Kleikamp 			goto datacheck;
1288ac27a0ecSDave Kleikamp 		case Opt_data_ordered:
1289617ba13bSMingming Cao 			data_opt = EXT4_MOUNT_ORDERED_DATA;
1290ac27a0ecSDave Kleikamp 			goto datacheck;
1291ac27a0ecSDave Kleikamp 		case Opt_data_writeback:
1292617ba13bSMingming Cao 			data_opt = EXT4_MOUNT_WRITEBACK_DATA;
1293ac27a0ecSDave Kleikamp 		datacheck:
1294ac27a0ecSDave Kleikamp 			if (is_remount) {
1295617ba13bSMingming Cao 				if ((sbi->s_mount_opt & EXT4_MOUNT_DATA_FLAGS)
1296ac27a0ecSDave Kleikamp 						!= data_opt) {
1297ac27a0ecSDave Kleikamp 					printk(KERN_ERR
1298617ba13bSMingming Cao 						"EXT4-fs: cannot change data "
1299ac27a0ecSDave Kleikamp 						"mode on remount\n");
1300ac27a0ecSDave Kleikamp 					return 0;
1301ac27a0ecSDave Kleikamp 				}
1302ac27a0ecSDave Kleikamp 			} else {
1303617ba13bSMingming Cao 				sbi->s_mount_opt &= ~EXT4_MOUNT_DATA_FLAGS;
1304ac27a0ecSDave Kleikamp 				sbi->s_mount_opt |= data_opt;
1305ac27a0ecSDave Kleikamp 			}
1306ac27a0ecSDave Kleikamp 			break;
13075bf5683aSHidehiro Kawai 		case Opt_data_err_abort:
13085bf5683aSHidehiro Kawai 			set_opt(sbi->s_mount_opt, DATA_ERR_ABORT);
13095bf5683aSHidehiro Kawai 			break;
13105bf5683aSHidehiro Kawai 		case Opt_data_err_ignore:
13115bf5683aSHidehiro Kawai 			clear_opt(sbi->s_mount_opt, DATA_ERR_ABORT);
13125bf5683aSHidehiro Kawai 			break;
1313ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
1314ac27a0ecSDave Kleikamp 		case Opt_usrjquota:
1315ac27a0ecSDave Kleikamp 			qtype = USRQUOTA;
1316ac27a0ecSDave Kleikamp 			goto set_qf_name;
1317ac27a0ecSDave Kleikamp 		case Opt_grpjquota:
1318ac27a0ecSDave Kleikamp 			qtype = GRPQUOTA;
1319ac27a0ecSDave Kleikamp set_qf_name:
132017bd13b3SJan Kara 			if (sb_any_quota_loaded(sb) &&
1321dfc5d03fSJan Kara 			    !sbi->s_qf_names[qtype]) {
1322ac27a0ecSDave Kleikamp 				printk(KERN_ERR
13232c8be6b2SJan Kara 				       "EXT4-fs: Cannot change journaled "
1324ac27a0ecSDave Kleikamp 				       "quota options when quota turned on.\n");
1325ac27a0ecSDave Kleikamp 				return 0;
1326ac27a0ecSDave Kleikamp 			}
1327ac27a0ecSDave Kleikamp 			qname = match_strdup(&args[0]);
1328ac27a0ecSDave Kleikamp 			if (!qname) {
1329ac27a0ecSDave Kleikamp 				printk(KERN_ERR
1330617ba13bSMingming Cao 					"EXT4-fs: not enough memory for "
1331ac27a0ecSDave Kleikamp 					"storing quotafile name.\n");
1332ac27a0ecSDave Kleikamp 				return 0;
1333ac27a0ecSDave Kleikamp 			}
1334ac27a0ecSDave Kleikamp 			if (sbi->s_qf_names[qtype] &&
1335ac27a0ecSDave Kleikamp 			    strcmp(sbi->s_qf_names[qtype], qname)) {
1336ac27a0ecSDave Kleikamp 				printk(KERN_ERR
1337617ba13bSMingming Cao 					"EXT4-fs: %s quota file already "
1338ac27a0ecSDave Kleikamp 					"specified.\n", QTYPE2NAME(qtype));
1339ac27a0ecSDave Kleikamp 				kfree(qname);
1340ac27a0ecSDave Kleikamp 				return 0;
1341ac27a0ecSDave Kleikamp 			}
1342ac27a0ecSDave Kleikamp 			sbi->s_qf_names[qtype] = qname;
1343ac27a0ecSDave Kleikamp 			if (strchr(sbi->s_qf_names[qtype], '/')) {
1344ac27a0ecSDave Kleikamp 				printk(KERN_ERR
1345617ba13bSMingming Cao 					"EXT4-fs: quotafile must be on "
1346ac27a0ecSDave Kleikamp 					"filesystem root.\n");
1347ac27a0ecSDave Kleikamp 				kfree(sbi->s_qf_names[qtype]);
1348ac27a0ecSDave Kleikamp 				sbi->s_qf_names[qtype] = NULL;
1349ac27a0ecSDave Kleikamp 				return 0;
1350ac27a0ecSDave Kleikamp 			}
1351ac27a0ecSDave Kleikamp 			set_opt(sbi->s_mount_opt, QUOTA);
1352ac27a0ecSDave Kleikamp 			break;
1353ac27a0ecSDave Kleikamp 		case Opt_offusrjquota:
1354ac27a0ecSDave Kleikamp 			qtype = USRQUOTA;
1355ac27a0ecSDave Kleikamp 			goto clear_qf_name;
1356ac27a0ecSDave Kleikamp 		case Opt_offgrpjquota:
1357ac27a0ecSDave Kleikamp 			qtype = GRPQUOTA;
1358ac27a0ecSDave Kleikamp clear_qf_name:
135917bd13b3SJan Kara 			if (sb_any_quota_loaded(sb) &&
1360dfc5d03fSJan Kara 			    sbi->s_qf_names[qtype]) {
1361617ba13bSMingming Cao 				printk(KERN_ERR "EXT4-fs: Cannot change "
13622c8be6b2SJan Kara 					"journaled quota options when "
1363ac27a0ecSDave Kleikamp 					"quota turned on.\n");
1364ac27a0ecSDave Kleikamp 				return 0;
1365ac27a0ecSDave Kleikamp 			}
1366ac27a0ecSDave Kleikamp 			/*
1367ac27a0ecSDave Kleikamp 			 * The space will be released later when all options
1368ac27a0ecSDave Kleikamp 			 * are confirmed to be correct
1369ac27a0ecSDave Kleikamp 			 */
1370ac27a0ecSDave Kleikamp 			sbi->s_qf_names[qtype] = NULL;
1371ac27a0ecSDave Kleikamp 			break;
1372ac27a0ecSDave Kleikamp 		case Opt_jqfmt_vfsold:
1373dfc5d03fSJan Kara 			qfmt = QFMT_VFS_OLD;
1374dfc5d03fSJan Kara 			goto set_qf_format;
1375ac27a0ecSDave Kleikamp 		case Opt_jqfmt_vfsv0:
1376dfc5d03fSJan Kara 			qfmt = QFMT_VFS_V0;
1377dfc5d03fSJan Kara set_qf_format:
137817bd13b3SJan Kara 			if (sb_any_quota_loaded(sb) &&
1379dfc5d03fSJan Kara 			    sbi->s_jquota_fmt != qfmt) {
1380dfc5d03fSJan Kara 				printk(KERN_ERR "EXT4-fs: Cannot change "
1381dfc5d03fSJan Kara 					"journaled quota options when "
1382dfc5d03fSJan Kara 					"quota turned on.\n");
1383dfc5d03fSJan Kara 				return 0;
1384dfc5d03fSJan Kara 			}
1385dfc5d03fSJan Kara 			sbi->s_jquota_fmt = qfmt;
1386ac27a0ecSDave Kleikamp 			break;
1387ac27a0ecSDave Kleikamp 		case Opt_quota:
1388ac27a0ecSDave Kleikamp 		case Opt_usrquota:
1389ac27a0ecSDave Kleikamp 			set_opt(sbi->s_mount_opt, QUOTA);
1390ac27a0ecSDave Kleikamp 			set_opt(sbi->s_mount_opt, USRQUOTA);
1391ac27a0ecSDave Kleikamp 			break;
1392ac27a0ecSDave Kleikamp 		case Opt_grpquota:
1393ac27a0ecSDave Kleikamp 			set_opt(sbi->s_mount_opt, QUOTA);
1394ac27a0ecSDave Kleikamp 			set_opt(sbi->s_mount_opt, GRPQUOTA);
1395ac27a0ecSDave Kleikamp 			break;
1396ac27a0ecSDave Kleikamp 		case Opt_noquota:
139717bd13b3SJan Kara 			if (sb_any_quota_loaded(sb)) {
1398617ba13bSMingming Cao 				printk(KERN_ERR "EXT4-fs: Cannot change quota "
1399ac27a0ecSDave Kleikamp 					"options when quota turned on.\n");
1400ac27a0ecSDave Kleikamp 				return 0;
1401ac27a0ecSDave Kleikamp 			}
1402ac27a0ecSDave Kleikamp 			clear_opt(sbi->s_mount_opt, QUOTA);
1403ac27a0ecSDave Kleikamp 			clear_opt(sbi->s_mount_opt, USRQUOTA);
1404ac27a0ecSDave Kleikamp 			clear_opt(sbi->s_mount_opt, GRPQUOTA);
1405ac27a0ecSDave Kleikamp 			break;
1406ac27a0ecSDave Kleikamp #else
1407ac27a0ecSDave Kleikamp 		case Opt_quota:
1408ac27a0ecSDave Kleikamp 		case Opt_usrquota:
1409ac27a0ecSDave Kleikamp 		case Opt_grpquota:
1410cd59e7b9SJan Kara 			printk(KERN_ERR
1411cd59e7b9SJan Kara 				"EXT4-fs: quota options not supported.\n");
1412cd59e7b9SJan Kara 			break;
1413ac27a0ecSDave Kleikamp 		case Opt_usrjquota:
1414ac27a0ecSDave Kleikamp 		case Opt_grpjquota:
1415ac27a0ecSDave Kleikamp 		case Opt_offusrjquota:
1416ac27a0ecSDave Kleikamp 		case Opt_offgrpjquota:
1417ac27a0ecSDave Kleikamp 		case Opt_jqfmt_vfsold:
1418ac27a0ecSDave Kleikamp 		case Opt_jqfmt_vfsv0:
1419ac27a0ecSDave Kleikamp 			printk(KERN_ERR
1420cd59e7b9SJan Kara 				"EXT4-fs: journaled quota options not "
1421ac27a0ecSDave Kleikamp 				"supported.\n");
1422ac27a0ecSDave Kleikamp 			break;
1423ac27a0ecSDave Kleikamp 		case Opt_noquota:
1424ac27a0ecSDave Kleikamp 			break;
1425ac27a0ecSDave Kleikamp #endif
1426ac27a0ecSDave Kleikamp 		case Opt_abort:
1427ac27a0ecSDave Kleikamp 			set_opt(sbi->s_mount_opt, ABORT);
1428ac27a0ecSDave Kleikamp 			break;
1429*06705bffSTheodore Ts'o 		case Opt_nobarrier:
1430*06705bffSTheodore Ts'o 			clear_opt(sbi->s_mount_opt, BARRIER);
1431*06705bffSTheodore Ts'o 			break;
1432ac27a0ecSDave Kleikamp 		case Opt_barrier:
1433*06705bffSTheodore Ts'o 			if (match_int(&args[0], &option)) {
1434*06705bffSTheodore Ts'o 				set_opt(sbi->s_mount_opt, BARRIER);
1435*06705bffSTheodore Ts'o 				break;
1436*06705bffSTheodore Ts'o 			}
1437ac27a0ecSDave Kleikamp 			if (option)
1438ac27a0ecSDave Kleikamp 				set_opt(sbi->s_mount_opt, BARRIER);
1439ac27a0ecSDave Kleikamp 			else
1440ac27a0ecSDave Kleikamp 				clear_opt(sbi->s_mount_opt, BARRIER);
1441ac27a0ecSDave Kleikamp 			break;
1442ac27a0ecSDave Kleikamp 		case Opt_ignore:
1443ac27a0ecSDave Kleikamp 			break;
1444ac27a0ecSDave Kleikamp 		case Opt_resize:
1445ac27a0ecSDave Kleikamp 			if (!is_remount) {
1446617ba13bSMingming Cao 				printk("EXT4-fs: resize option only available "
1447ac27a0ecSDave Kleikamp 					"for remount\n");
1448ac27a0ecSDave Kleikamp 				return 0;
1449ac27a0ecSDave Kleikamp 			}
1450ac27a0ecSDave Kleikamp 			if (match_int(&args[0], &option) != 0)
1451ac27a0ecSDave Kleikamp 				return 0;
1452ac27a0ecSDave Kleikamp 			*n_blocks_count = option;
1453ac27a0ecSDave Kleikamp 			break;
1454ac27a0ecSDave Kleikamp 		case Opt_nobh:
1455ac27a0ecSDave Kleikamp 			set_opt(sbi->s_mount_opt, NOBH);
1456ac27a0ecSDave Kleikamp 			break;
1457ac27a0ecSDave Kleikamp 		case Opt_bh:
1458ac27a0ecSDave Kleikamp 			clear_opt(sbi->s_mount_opt, NOBH);
1459ac27a0ecSDave Kleikamp 			break;
146025ec56b5SJean Noel Cordenner 		case Opt_i_version:
146125ec56b5SJean Noel Cordenner 			set_opt(sbi->s_mount_opt, I_VERSION);
146225ec56b5SJean Noel Cordenner 			sb->s_flags |= MS_I_VERSION;
146325ec56b5SJean Noel Cordenner 			break;
1464dd919b98SAneesh Kumar K.V 		case Opt_nodelalloc:
1465dd919b98SAneesh Kumar K.V 			clear_opt(sbi->s_mount_opt, DELALLOC);
1466dd919b98SAneesh Kumar K.V 			break;
1467c9de560dSAlex Tomas 		case Opt_stripe:
1468c9de560dSAlex Tomas 			if (match_int(&args[0], &option))
1469c9de560dSAlex Tomas 				return 0;
1470c9de560dSAlex Tomas 			if (option < 0)
1471c9de560dSAlex Tomas 				return 0;
1472c9de560dSAlex Tomas 			sbi->s_stripe = option;
1473c9de560dSAlex Tomas 			break;
147464769240SAlex Tomas 		case Opt_delalloc:
147564769240SAlex Tomas 			set_opt(sbi->s_mount_opt, DELALLOC);
147664769240SAlex Tomas 			break;
1477240799cdSTheodore Ts'o 		case Opt_inode_readahead_blks:
1478240799cdSTheodore Ts'o 			if (match_int(&args[0], &option))
1479240799cdSTheodore Ts'o 				return 0;
1480240799cdSTheodore Ts'o 			if (option < 0 || option > (1 << 30))
1481240799cdSTheodore Ts'o 				return 0;
14823197ebdbSTheodore Ts'o 			if (option & (option - 1)) {
14833197ebdbSTheodore Ts'o 				printk(KERN_ERR "EXT4-fs: inode_readahead_blks"
14843197ebdbSTheodore Ts'o 				       " must be a power of 2\n");
14853197ebdbSTheodore Ts'o 				return 0;
14863197ebdbSTheodore Ts'o 			}
1487240799cdSTheodore Ts'o 			sbi->s_inode_readahead_blks = option;
1488240799cdSTheodore Ts'o 			break;
1489b3881f74STheodore Ts'o 		case Opt_journal_ioprio:
1490b3881f74STheodore Ts'o 			if (match_int(&args[0], &option))
1491b3881f74STheodore Ts'o 				return 0;
1492b3881f74STheodore Ts'o 			if (option < 0 || option > 7)
1493b3881f74STheodore Ts'o 				break;
1494b3881f74STheodore Ts'o 			*journal_ioprio = IOPRIO_PRIO_VALUE(IOPRIO_CLASS_BE,
1495b3881f74STheodore Ts'o 							    option);
1496b3881f74STheodore Ts'o 			break;
1497*06705bffSTheodore Ts'o 		case Opt_noauto_da_alloc:
1498*06705bffSTheodore Ts'o 			set_opt(sbi->s_mount_opt,NO_AUTO_DA_ALLOC);
1499*06705bffSTheodore Ts'o 			break;
1500afd4672dSTheodore Ts'o 		case Opt_auto_da_alloc:
1501*06705bffSTheodore Ts'o 			if (match_int(&args[0], &option)) {
1502*06705bffSTheodore Ts'o 				clear_opt(sbi->s_mount_opt, NO_AUTO_DA_ALLOC);
1503*06705bffSTheodore Ts'o 				break;
1504*06705bffSTheodore Ts'o 			}
1505afd4672dSTheodore Ts'o 			if (option)
1506afd4672dSTheodore Ts'o 				clear_opt(sbi->s_mount_opt, NO_AUTO_DA_ALLOC);
1507afd4672dSTheodore Ts'o 			else
1508afd4672dSTheodore Ts'o 				set_opt(sbi->s_mount_opt,NO_AUTO_DA_ALLOC);
1509afd4672dSTheodore Ts'o 			break;
1510ac27a0ecSDave Kleikamp 		default:
1511ac27a0ecSDave Kleikamp 			printk(KERN_ERR
1512617ba13bSMingming Cao 			       "EXT4-fs: Unrecognized mount option \"%s\" "
1513ac27a0ecSDave Kleikamp 			       "or missing value\n", p);
1514ac27a0ecSDave Kleikamp 			return 0;
1515ac27a0ecSDave Kleikamp 		}
1516ac27a0ecSDave Kleikamp 	}
1517ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
1518ac27a0ecSDave Kleikamp 	if (sbi->s_qf_names[USRQUOTA] || sbi->s_qf_names[GRPQUOTA]) {
1519617ba13bSMingming Cao 		if ((sbi->s_mount_opt & EXT4_MOUNT_USRQUOTA) &&
1520ac27a0ecSDave Kleikamp 		     sbi->s_qf_names[USRQUOTA])
1521ac27a0ecSDave Kleikamp 			clear_opt(sbi->s_mount_opt, USRQUOTA);
1522ac27a0ecSDave Kleikamp 
1523617ba13bSMingming Cao 		if ((sbi->s_mount_opt & EXT4_MOUNT_GRPQUOTA) &&
1524ac27a0ecSDave Kleikamp 		     sbi->s_qf_names[GRPQUOTA])
1525ac27a0ecSDave Kleikamp 			clear_opt(sbi->s_mount_opt, GRPQUOTA);
1526ac27a0ecSDave Kleikamp 
1527ac27a0ecSDave Kleikamp 		if ((sbi->s_qf_names[USRQUOTA] &&
1528617ba13bSMingming Cao 				(sbi->s_mount_opt & EXT4_MOUNT_GRPQUOTA)) ||
1529ac27a0ecSDave Kleikamp 		    (sbi->s_qf_names[GRPQUOTA] &&
1530617ba13bSMingming Cao 				(sbi->s_mount_opt & EXT4_MOUNT_USRQUOTA))) {
1531617ba13bSMingming Cao 			printk(KERN_ERR "EXT4-fs: old and new quota "
1532ac27a0ecSDave Kleikamp 					"format mixing.\n");
1533ac27a0ecSDave Kleikamp 			return 0;
1534ac27a0ecSDave Kleikamp 		}
1535ac27a0ecSDave Kleikamp 
1536ac27a0ecSDave Kleikamp 		if (!sbi->s_jquota_fmt) {
15372c8be6b2SJan Kara 			printk(KERN_ERR "EXT4-fs: journaled quota format "
1538ac27a0ecSDave Kleikamp 					"not specified.\n");
1539ac27a0ecSDave Kleikamp 			return 0;
1540ac27a0ecSDave Kleikamp 		}
1541ac27a0ecSDave Kleikamp 	} else {
1542ac27a0ecSDave Kleikamp 		if (sbi->s_jquota_fmt) {
15432c8be6b2SJan Kara 			printk(KERN_ERR "EXT4-fs: journaled quota format "
15442c8be6b2SJan Kara 					"specified with no journaling "
1545ac27a0ecSDave Kleikamp 					"enabled.\n");
1546ac27a0ecSDave Kleikamp 			return 0;
1547ac27a0ecSDave Kleikamp 		}
1548ac27a0ecSDave Kleikamp 	}
1549ac27a0ecSDave Kleikamp #endif
1550ac27a0ecSDave Kleikamp 	return 1;
1551ac27a0ecSDave Kleikamp }
1552ac27a0ecSDave Kleikamp 
1553617ba13bSMingming Cao static int ext4_setup_super(struct super_block *sb, struct ext4_super_block *es,
1554ac27a0ecSDave Kleikamp 			    int read_only)
1555ac27a0ecSDave Kleikamp {
1556617ba13bSMingming Cao 	struct ext4_sb_info *sbi = EXT4_SB(sb);
1557ac27a0ecSDave Kleikamp 	int res = 0;
1558ac27a0ecSDave Kleikamp 
1559617ba13bSMingming Cao 	if (le32_to_cpu(es->s_rev_level) > EXT4_MAX_SUPP_REV) {
1560617ba13bSMingming Cao 		printk(KERN_ERR "EXT4-fs warning: revision level too high, "
1561ac27a0ecSDave Kleikamp 		       "forcing read-only mode\n");
1562ac27a0ecSDave Kleikamp 		res = MS_RDONLY;
1563ac27a0ecSDave Kleikamp 	}
1564ac27a0ecSDave Kleikamp 	if (read_only)
1565ac27a0ecSDave Kleikamp 		return res;
1566617ba13bSMingming Cao 	if (!(sbi->s_mount_state & EXT4_VALID_FS))
1567617ba13bSMingming Cao 		printk(KERN_WARNING "EXT4-fs warning: mounting unchecked fs, "
1568ac27a0ecSDave Kleikamp 		       "running e2fsck is recommended\n");
1569617ba13bSMingming Cao 	else if ((sbi->s_mount_state & EXT4_ERROR_FS))
1570ac27a0ecSDave Kleikamp 		printk(KERN_WARNING
1571617ba13bSMingming Cao 		       "EXT4-fs warning: mounting fs with errors, "
1572ac27a0ecSDave Kleikamp 		       "running e2fsck is recommended\n");
1573ac27a0ecSDave Kleikamp 	else if ((__s16) le16_to_cpu(es->s_max_mnt_count) >= 0 &&
1574ac27a0ecSDave Kleikamp 		 le16_to_cpu(es->s_mnt_count) >=
1575ac27a0ecSDave Kleikamp 		 (unsigned short) (__s16) le16_to_cpu(es->s_max_mnt_count))
1576ac27a0ecSDave Kleikamp 		printk(KERN_WARNING
1577617ba13bSMingming Cao 		       "EXT4-fs warning: maximal mount count reached, "
1578ac27a0ecSDave Kleikamp 		       "running e2fsck is recommended\n");
1579ac27a0ecSDave Kleikamp 	else if (le32_to_cpu(es->s_checkinterval) &&
1580ac27a0ecSDave Kleikamp 		(le32_to_cpu(es->s_lastcheck) +
1581ac27a0ecSDave Kleikamp 			le32_to_cpu(es->s_checkinterval) <= get_seconds()))
1582ac27a0ecSDave Kleikamp 		printk(KERN_WARNING
1583617ba13bSMingming Cao 		       "EXT4-fs warning: checktime reached, "
1584ac27a0ecSDave Kleikamp 		       "running e2fsck is recommended\n");
15850390131bSFrank Mayhar 	if (!sbi->s_journal)
1586216c34b2SMarcin Slusarz 		es->s_state &= cpu_to_le16(~EXT4_VALID_FS);
1587ac27a0ecSDave Kleikamp 	if (!(__s16) le16_to_cpu(es->s_max_mnt_count))
1588617ba13bSMingming Cao 		es->s_max_mnt_count = cpu_to_le16(EXT4_DFL_MAX_MNT_COUNT);
1589e8546d06SMarcin Slusarz 	le16_add_cpu(&es->s_mnt_count, 1);
1590ac27a0ecSDave Kleikamp 	es->s_mtime = cpu_to_le32(get_seconds());
1591617ba13bSMingming Cao 	ext4_update_dynamic_rev(sb);
15920390131bSFrank Mayhar 	if (sbi->s_journal)
1593617ba13bSMingming Cao 		EXT4_SET_INCOMPAT_FEATURE(sb, EXT4_FEATURE_INCOMPAT_RECOVER);
1594ac27a0ecSDave Kleikamp 
1595617ba13bSMingming Cao 	ext4_commit_super(sb, es, 1);
1596ac27a0ecSDave Kleikamp 	if (test_opt(sb, DEBUG))
1597a9df9a49STheodore Ts'o 		printk(KERN_INFO "[EXT4 FS bs=%lu, gc=%u, "
1598ac27a0ecSDave Kleikamp 				"bpg=%lu, ipg=%lu, mo=%04lx]\n",
1599ac27a0ecSDave Kleikamp 			sb->s_blocksize,
1600ac27a0ecSDave Kleikamp 			sbi->s_groups_count,
1601617ba13bSMingming Cao 			EXT4_BLOCKS_PER_GROUP(sb),
1602617ba13bSMingming Cao 			EXT4_INODES_PER_GROUP(sb),
1603ac27a0ecSDave Kleikamp 			sbi->s_mount_opt);
1604ac27a0ecSDave Kleikamp 
16050390131bSFrank Mayhar 	if (EXT4_SB(sb)->s_journal) {
160605496769STheodore Ts'o 		printk(KERN_INFO "EXT4 FS on %s, %s journal on %s\n",
160705496769STheodore Ts'o 		       sb->s_id, EXT4_SB(sb)->s_journal->j_inode ? "internal" :
160805496769STheodore Ts'o 		       "external", EXT4_SB(sb)->s_journal->j_devname);
16090390131bSFrank Mayhar 	} else {
16100390131bSFrank Mayhar 		printk(KERN_INFO "EXT4 FS on %s, no journal\n", sb->s_id);
16110390131bSFrank Mayhar 	}
1612ac27a0ecSDave Kleikamp 	return res;
1613ac27a0ecSDave Kleikamp }
1614ac27a0ecSDave Kleikamp 
1615772cb7c8SJose R. Santos static int ext4_fill_flex_info(struct super_block *sb)
1616772cb7c8SJose R. Santos {
1617772cb7c8SJose R. Santos 	struct ext4_sb_info *sbi = EXT4_SB(sb);
1618772cb7c8SJose R. Santos 	struct ext4_group_desc *gdp = NULL;
1619772cb7c8SJose R. Santos 	struct buffer_head *bh;
1620772cb7c8SJose R. Santos 	ext4_group_t flex_group_count;
1621772cb7c8SJose R. Santos 	ext4_group_t flex_group;
1622772cb7c8SJose R. Santos 	int groups_per_flex = 0;
1623772cb7c8SJose R. Santos 	int i;
1624772cb7c8SJose R. Santos 
1625772cb7c8SJose R. Santos 	if (!sbi->s_es->s_log_groups_per_flex) {
1626772cb7c8SJose R. Santos 		sbi->s_log_groups_per_flex = 0;
1627772cb7c8SJose R. Santos 		return 1;
1628772cb7c8SJose R. Santos 	}
1629772cb7c8SJose R. Santos 
1630772cb7c8SJose R. Santos 	sbi->s_log_groups_per_flex = sbi->s_es->s_log_groups_per_flex;
1631772cb7c8SJose R. Santos 	groups_per_flex = 1 << sbi->s_log_groups_per_flex;
1632772cb7c8SJose R. Santos 
1633c62a11fdSFrederic Bohe 	/* We allocate both existing and potentially added groups */
1634c62a11fdSFrederic Bohe 	flex_group_count = ((sbi->s_groups_count + groups_per_flex - 1) +
1635d94e99a6SAneesh Kumar K.V 			((le16_to_cpu(sbi->s_es->s_reserved_gdt_blocks) + 1) <<
1636d94e99a6SAneesh Kumar K.V 			      EXT4_DESC_PER_BLOCK_BITS(sb))) / groups_per_flex;
1637ec05e868SLi Zefan 	sbi->s_flex_groups = kzalloc(flex_group_count *
1638772cb7c8SJose R. Santos 				     sizeof(struct flex_groups), GFP_KERNEL);
1639772cb7c8SJose R. Santos 	if (sbi->s_flex_groups == NULL) {
1640ec05e868SLi Zefan 		printk(KERN_ERR "EXT4-fs: not enough memory for "
1641a9df9a49STheodore Ts'o 				"%u flex groups\n", flex_group_count);
1642772cb7c8SJose R. Santos 		goto failed;
1643772cb7c8SJose R. Santos 	}
1644772cb7c8SJose R. Santos 
1645772cb7c8SJose R. Santos 	for (i = 0; i < sbi->s_groups_count; i++) {
1646772cb7c8SJose R. Santos 		gdp = ext4_get_group_desc(sb, i, &bh);
1647772cb7c8SJose R. Santos 
1648772cb7c8SJose R. Santos 		flex_group = ext4_flex_group(sbi, i);
16499f24e420STheodore Ts'o 		atomic_set(&sbi->s_flex_groups[flex_group].free_inodes,
16509f24e420STheodore Ts'o 			   ext4_free_inodes_count(sb, gdp));
16519f24e420STheodore Ts'o 		atomic_set(&sbi->s_flex_groups[flex_group].free_blocks,
16529f24e420STheodore Ts'o 			   ext4_free_blks_count(sb, gdp));
16537d39db14STheodore Ts'o 		atomic_set(&sbi->s_flex_groups[flex_group].used_dirs,
16547d39db14STheodore Ts'o 			   ext4_used_dirs_count(sb, gdp));
1655772cb7c8SJose R. Santos 	}
1656772cb7c8SJose R. Santos 
1657772cb7c8SJose R. Santos 	return 1;
1658772cb7c8SJose R. Santos failed:
1659772cb7c8SJose R. Santos 	return 0;
1660772cb7c8SJose R. Santos }
1661772cb7c8SJose R. Santos 
1662717d50e4SAndreas Dilger __le16 ext4_group_desc_csum(struct ext4_sb_info *sbi, __u32 block_group,
1663717d50e4SAndreas Dilger 			    struct ext4_group_desc *gdp)
1664717d50e4SAndreas Dilger {
1665717d50e4SAndreas Dilger 	__u16 crc = 0;
1666717d50e4SAndreas Dilger 
1667717d50e4SAndreas Dilger 	if (sbi->s_es->s_feature_ro_compat &
1668717d50e4SAndreas Dilger 	    cpu_to_le32(EXT4_FEATURE_RO_COMPAT_GDT_CSUM)) {
1669717d50e4SAndreas Dilger 		int offset = offsetof(struct ext4_group_desc, bg_checksum);
1670717d50e4SAndreas Dilger 		__le32 le_group = cpu_to_le32(block_group);
1671717d50e4SAndreas Dilger 
1672717d50e4SAndreas Dilger 		crc = crc16(~0, sbi->s_es->s_uuid, sizeof(sbi->s_es->s_uuid));
1673717d50e4SAndreas Dilger 		crc = crc16(crc, (__u8 *)&le_group, sizeof(le_group));
1674717d50e4SAndreas Dilger 		crc = crc16(crc, (__u8 *)gdp, offset);
1675717d50e4SAndreas Dilger 		offset += sizeof(gdp->bg_checksum); /* skip checksum */
1676717d50e4SAndreas Dilger 		/* for checksum of struct ext4_group_desc do the rest...*/
1677717d50e4SAndreas Dilger 		if ((sbi->s_es->s_feature_incompat &
1678717d50e4SAndreas Dilger 		     cpu_to_le32(EXT4_FEATURE_INCOMPAT_64BIT)) &&
1679717d50e4SAndreas Dilger 		    offset < le16_to_cpu(sbi->s_es->s_desc_size))
1680717d50e4SAndreas Dilger 			crc = crc16(crc, (__u8 *)gdp + offset,
1681717d50e4SAndreas Dilger 				    le16_to_cpu(sbi->s_es->s_desc_size) -
1682717d50e4SAndreas Dilger 					offset);
1683717d50e4SAndreas Dilger 	}
1684717d50e4SAndreas Dilger 
1685717d50e4SAndreas Dilger 	return cpu_to_le16(crc);
1686717d50e4SAndreas Dilger }
1687717d50e4SAndreas Dilger 
1688717d50e4SAndreas Dilger int ext4_group_desc_csum_verify(struct ext4_sb_info *sbi, __u32 block_group,
1689717d50e4SAndreas Dilger 				struct ext4_group_desc *gdp)
1690717d50e4SAndreas Dilger {
1691717d50e4SAndreas Dilger 	if ((sbi->s_es->s_feature_ro_compat &
1692717d50e4SAndreas Dilger 	     cpu_to_le32(EXT4_FEATURE_RO_COMPAT_GDT_CSUM)) &&
1693717d50e4SAndreas Dilger 	    (gdp->bg_checksum != ext4_group_desc_csum(sbi, block_group, gdp)))
1694717d50e4SAndreas Dilger 		return 0;
1695717d50e4SAndreas Dilger 
1696717d50e4SAndreas Dilger 	return 1;
1697717d50e4SAndreas Dilger }
1698717d50e4SAndreas Dilger 
1699ac27a0ecSDave Kleikamp /* Called at mount-time, super-block is locked */
1700617ba13bSMingming Cao static int ext4_check_descriptors(struct super_block *sb)
1701ac27a0ecSDave Kleikamp {
1702617ba13bSMingming Cao 	struct ext4_sb_info *sbi = EXT4_SB(sb);
1703617ba13bSMingming Cao 	ext4_fsblk_t first_block = le32_to_cpu(sbi->s_es->s_first_data_block);
1704617ba13bSMingming Cao 	ext4_fsblk_t last_block;
1705bd81d8eeSLaurent Vivier 	ext4_fsblk_t block_bitmap;
1706bd81d8eeSLaurent Vivier 	ext4_fsblk_t inode_bitmap;
1707bd81d8eeSLaurent Vivier 	ext4_fsblk_t inode_table;
1708ce421581SJose R. Santos 	int flexbg_flag = 0;
1709fd2d4291SAvantika Mathur 	ext4_group_t i;
1710ac27a0ecSDave Kleikamp 
1711ce421581SJose R. Santos 	if (EXT4_HAS_INCOMPAT_FEATURE(sb, EXT4_FEATURE_INCOMPAT_FLEX_BG))
1712ce421581SJose R. Santos 		flexbg_flag = 1;
1713ce421581SJose R. Santos 
1714617ba13bSMingming Cao 	ext4_debug("Checking group descriptors");
1715ac27a0ecSDave Kleikamp 
1716197cd65aSAkinobu Mita 	for (i = 0; i < sbi->s_groups_count; i++) {
1717197cd65aSAkinobu Mita 		struct ext4_group_desc *gdp = ext4_get_group_desc(sb, i, NULL);
1718197cd65aSAkinobu Mita 
1719ce421581SJose R. Santos 		if (i == sbi->s_groups_count - 1 || flexbg_flag)
1720bd81d8eeSLaurent Vivier 			last_block = ext4_blocks_count(sbi->s_es) - 1;
1721ac27a0ecSDave Kleikamp 		else
1722ac27a0ecSDave Kleikamp 			last_block = first_block +
1723617ba13bSMingming Cao 				(EXT4_BLOCKS_PER_GROUP(sb) - 1);
1724ac27a0ecSDave Kleikamp 
17258fadc143SAlexandre Ratchov 		block_bitmap = ext4_block_bitmap(sb, gdp);
17262b2d6d01STheodore Ts'o 		if (block_bitmap < first_block || block_bitmap > last_block) {
1727c19204b0SJosef Bacik 			printk(KERN_ERR "EXT4-fs: ext4_check_descriptors: "
1728a9df9a49STheodore Ts'o 			       "Block bitmap for group %u not in group "
17295128273aSEric Sesterhenn 			       "(block %llu)!\n", i, block_bitmap);
1730ac27a0ecSDave Kleikamp 			return 0;
1731ac27a0ecSDave Kleikamp 		}
17328fadc143SAlexandre Ratchov 		inode_bitmap = ext4_inode_bitmap(sb, gdp);
17332b2d6d01STheodore Ts'o 		if (inode_bitmap < first_block || inode_bitmap > last_block) {
1734c19204b0SJosef Bacik 			printk(KERN_ERR "EXT4-fs: ext4_check_descriptors: "
1735a9df9a49STheodore Ts'o 			       "Inode bitmap for group %u not in group "
17365128273aSEric Sesterhenn 			       "(block %llu)!\n", i, inode_bitmap);
1737ac27a0ecSDave Kleikamp 			return 0;
1738ac27a0ecSDave Kleikamp 		}
17398fadc143SAlexandre Ratchov 		inode_table = ext4_inode_table(sb, gdp);
1740bd81d8eeSLaurent Vivier 		if (inode_table < first_block ||
17412b2d6d01STheodore Ts'o 		    inode_table + sbi->s_itb_per_group - 1 > last_block) {
1742c19204b0SJosef Bacik 			printk(KERN_ERR "EXT4-fs: ext4_check_descriptors: "
1743a9df9a49STheodore Ts'o 			       "Inode table for group %u not in group "
17445128273aSEric Sesterhenn 			       "(block %llu)!\n", i, inode_table);
1745ac27a0ecSDave Kleikamp 			return 0;
1746ac27a0ecSDave Kleikamp 		}
1747b5f10eedSEric Sandeen 		spin_lock(sb_bgl_lock(sbi, i));
1748717d50e4SAndreas Dilger 		if (!ext4_group_desc_csum_verify(sbi, i, gdp)) {
1749c19204b0SJosef Bacik 			printk(KERN_ERR "EXT4-fs: ext4_check_descriptors: "
1750a9df9a49STheodore Ts'o 			       "Checksum for group %u failed (%u!=%u)\n",
1751fd2d4291SAvantika Mathur 			       i, le16_to_cpu(ext4_group_desc_csum(sbi, i,
1752fd2d4291SAvantika Mathur 			       gdp)), le16_to_cpu(gdp->bg_checksum));
17537ee1ec4cSLi Zefan 			if (!(sb->s_flags & MS_RDONLY)) {
17547ee1ec4cSLi Zefan 				spin_unlock(sb_bgl_lock(sbi, i));
1755717d50e4SAndreas Dilger 				return 0;
1756717d50e4SAndreas Dilger 			}
17577ee1ec4cSLi Zefan 		}
1758b5f10eedSEric Sandeen 		spin_unlock(sb_bgl_lock(sbi, i));
1759ce421581SJose R. Santos 		if (!flexbg_flag)
1760617ba13bSMingming Cao 			first_block += EXT4_BLOCKS_PER_GROUP(sb);
1761ac27a0ecSDave Kleikamp 	}
1762ac27a0ecSDave Kleikamp 
1763bd81d8eeSLaurent Vivier 	ext4_free_blocks_count_set(sbi->s_es, ext4_count_free_blocks(sb));
1764617ba13bSMingming Cao 	sbi->s_es->s_free_inodes_count = cpu_to_le32(ext4_count_free_inodes(sb));
1765ac27a0ecSDave Kleikamp 	return 1;
1766ac27a0ecSDave Kleikamp }
1767ac27a0ecSDave Kleikamp 
1768617ba13bSMingming Cao /* ext4_orphan_cleanup() walks a singly-linked list of inodes (starting at
1769ac27a0ecSDave Kleikamp  * the superblock) which were deleted from all directories, but held open by
1770ac27a0ecSDave Kleikamp  * a process at the time of a crash.  We walk the list and try to delete these
1771ac27a0ecSDave Kleikamp  * inodes at recovery time (only with a read-write filesystem).
1772ac27a0ecSDave Kleikamp  *
1773ac27a0ecSDave Kleikamp  * In order to keep the orphan inode chain consistent during traversal (in
1774ac27a0ecSDave Kleikamp  * case of crash during recovery), we link each inode into the superblock
1775ac27a0ecSDave Kleikamp  * orphan list_head and handle it the same way as an inode deletion during
1776ac27a0ecSDave Kleikamp  * normal operation (which journals the operations for us).
1777ac27a0ecSDave Kleikamp  *
1778ac27a0ecSDave Kleikamp  * We only do an iget() and an iput() on each inode, which is very safe if we
1779ac27a0ecSDave Kleikamp  * accidentally point at an in-use or already deleted inode.  The worst that
1780ac27a0ecSDave Kleikamp  * can happen in this case is that we get a "bit already cleared" message from
1781617ba13bSMingming Cao  * ext4_free_inode().  The only reason we would point at a wrong inode is if
1782ac27a0ecSDave Kleikamp  * e2fsck was run on this filesystem, and it must have already done the orphan
1783ac27a0ecSDave Kleikamp  * inode cleanup for us, so we can safely abort without any further action.
1784ac27a0ecSDave Kleikamp  */
1785617ba13bSMingming Cao static void ext4_orphan_cleanup(struct super_block *sb,
1786617ba13bSMingming Cao 				struct ext4_super_block *es)
1787ac27a0ecSDave Kleikamp {
1788ac27a0ecSDave Kleikamp 	unsigned int s_flags = sb->s_flags;
1789ac27a0ecSDave Kleikamp 	int nr_orphans = 0, nr_truncates = 0;
1790ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
1791ac27a0ecSDave Kleikamp 	int i;
1792ac27a0ecSDave Kleikamp #endif
1793ac27a0ecSDave Kleikamp 	if (!es->s_last_orphan) {
1794ac27a0ecSDave Kleikamp 		jbd_debug(4, "no orphan inodes to clean up\n");
1795ac27a0ecSDave Kleikamp 		return;
1796ac27a0ecSDave Kleikamp 	}
1797ac27a0ecSDave Kleikamp 
1798a8f48a95SEric Sandeen 	if (bdev_read_only(sb->s_bdev)) {
1799a8f48a95SEric Sandeen 		printk(KERN_ERR "EXT4-fs: write access "
1800a8f48a95SEric Sandeen 			"unavailable, skipping orphan cleanup.\n");
1801a8f48a95SEric Sandeen 		return;
1802a8f48a95SEric Sandeen 	}
1803a8f48a95SEric Sandeen 
1804617ba13bSMingming Cao 	if (EXT4_SB(sb)->s_mount_state & EXT4_ERROR_FS) {
1805ac27a0ecSDave Kleikamp 		if (es->s_last_orphan)
1806ac27a0ecSDave Kleikamp 			jbd_debug(1, "Errors on filesystem, "
1807ac27a0ecSDave Kleikamp 				  "clearing orphan list.\n");
1808ac27a0ecSDave Kleikamp 		es->s_last_orphan = 0;
1809ac27a0ecSDave Kleikamp 		jbd_debug(1, "Skipping orphan recovery on fs with errors.\n");
1810ac27a0ecSDave Kleikamp 		return;
1811ac27a0ecSDave Kleikamp 	}
1812ac27a0ecSDave Kleikamp 
1813ac27a0ecSDave Kleikamp 	if (s_flags & MS_RDONLY) {
1814617ba13bSMingming Cao 		printk(KERN_INFO "EXT4-fs: %s: orphan cleanup on readonly fs\n",
1815ac27a0ecSDave Kleikamp 		       sb->s_id);
1816ac27a0ecSDave Kleikamp 		sb->s_flags &= ~MS_RDONLY;
1817ac27a0ecSDave Kleikamp 	}
1818ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
1819ac27a0ecSDave Kleikamp 	/* Needed for iput() to work correctly and not trash data */
1820ac27a0ecSDave Kleikamp 	sb->s_flags |= MS_ACTIVE;
1821ac27a0ecSDave Kleikamp 	/* Turn on quotas so that they are updated correctly */
1822ac27a0ecSDave Kleikamp 	for (i = 0; i < MAXQUOTAS; i++) {
1823617ba13bSMingming Cao 		if (EXT4_SB(sb)->s_qf_names[i]) {
1824617ba13bSMingming Cao 			int ret = ext4_quota_on_mount(sb, i);
1825ac27a0ecSDave Kleikamp 			if (ret < 0)
1826ac27a0ecSDave Kleikamp 				printk(KERN_ERR
18272c8be6b2SJan Kara 					"EXT4-fs: Cannot turn on journaled "
1828ac27a0ecSDave Kleikamp 					"quota: error %d\n", ret);
1829ac27a0ecSDave Kleikamp 		}
1830ac27a0ecSDave Kleikamp 	}
1831ac27a0ecSDave Kleikamp #endif
1832ac27a0ecSDave Kleikamp 
1833ac27a0ecSDave Kleikamp 	while (es->s_last_orphan) {
1834ac27a0ecSDave Kleikamp 		struct inode *inode;
1835ac27a0ecSDave Kleikamp 
183697bd42b9SJosef Bacik 		inode = ext4_orphan_get(sb, le32_to_cpu(es->s_last_orphan));
183797bd42b9SJosef Bacik 		if (IS_ERR(inode)) {
1838ac27a0ecSDave Kleikamp 			es->s_last_orphan = 0;
1839ac27a0ecSDave Kleikamp 			break;
1840ac27a0ecSDave Kleikamp 		}
1841ac27a0ecSDave Kleikamp 
1842617ba13bSMingming Cao 		list_add(&EXT4_I(inode)->i_orphan, &EXT4_SB(sb)->s_orphan);
1843a269eb18SJan Kara 		vfs_dq_init(inode);
1844ac27a0ecSDave Kleikamp 		if (inode->i_nlink) {
1845ac27a0ecSDave Kleikamp 			printk(KERN_DEBUG
1846e5f8eab8STheodore Ts'o 				"%s: truncating inode %lu to %lld bytes\n",
184746e665e9SHarvey Harrison 				__func__, inode->i_ino, inode->i_size);
1848e5f8eab8STheodore Ts'o 			jbd_debug(2, "truncating inode %lu to %lld bytes\n",
1849ac27a0ecSDave Kleikamp 				  inode->i_ino, inode->i_size);
1850617ba13bSMingming Cao 			ext4_truncate(inode);
1851ac27a0ecSDave Kleikamp 			nr_truncates++;
1852ac27a0ecSDave Kleikamp 		} else {
1853ac27a0ecSDave Kleikamp 			printk(KERN_DEBUG
1854ac27a0ecSDave Kleikamp 				"%s: deleting unreferenced inode %lu\n",
185546e665e9SHarvey Harrison 				__func__, inode->i_ino);
1856ac27a0ecSDave Kleikamp 			jbd_debug(2, "deleting unreferenced inode %lu\n",
1857ac27a0ecSDave Kleikamp 				  inode->i_ino);
1858ac27a0ecSDave Kleikamp 			nr_orphans++;
1859ac27a0ecSDave Kleikamp 		}
1860ac27a0ecSDave Kleikamp 		iput(inode);  /* The delete magic happens here! */
1861ac27a0ecSDave Kleikamp 	}
1862ac27a0ecSDave Kleikamp 
1863ac27a0ecSDave Kleikamp #define PLURAL(x) (x), ((x) == 1) ? "" : "s"
1864ac27a0ecSDave Kleikamp 
1865ac27a0ecSDave Kleikamp 	if (nr_orphans)
1866617ba13bSMingming Cao 		printk(KERN_INFO "EXT4-fs: %s: %d orphan inode%s deleted\n",
1867ac27a0ecSDave Kleikamp 		       sb->s_id, PLURAL(nr_orphans));
1868ac27a0ecSDave Kleikamp 	if (nr_truncates)
1869617ba13bSMingming Cao 		printk(KERN_INFO "EXT4-fs: %s: %d truncate%s cleaned up\n",
1870ac27a0ecSDave Kleikamp 		       sb->s_id, PLURAL(nr_truncates));
1871ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
1872ac27a0ecSDave Kleikamp 	/* Turn quotas off */
1873ac27a0ecSDave Kleikamp 	for (i = 0; i < MAXQUOTAS; i++) {
1874ac27a0ecSDave Kleikamp 		if (sb_dqopt(sb)->files[i])
18756f28e087SJan Kara 			vfs_quota_off(sb, i, 0);
1876ac27a0ecSDave Kleikamp 	}
1877ac27a0ecSDave Kleikamp #endif
1878ac27a0ecSDave Kleikamp 	sb->s_flags = s_flags; /* Restore MS_RDONLY status */
1879ac27a0ecSDave Kleikamp }
1880cd2291a4SEric Sandeen /*
1881cd2291a4SEric Sandeen  * Maximal extent format file size.
1882cd2291a4SEric Sandeen  * Resulting logical blkno at s_maxbytes must fit in our on-disk
1883cd2291a4SEric Sandeen  * extent format containers, within a sector_t, and within i_blocks
1884cd2291a4SEric Sandeen  * in the vfs.  ext4 inode has 48 bits of i_block in fsblock units,
1885cd2291a4SEric Sandeen  * so that won't be a limiting factor.
1886cd2291a4SEric Sandeen  *
1887cd2291a4SEric Sandeen  * Note, this does *not* consider any metadata overhead for vfs i_blocks.
1888cd2291a4SEric Sandeen  */
1889f287a1a5STheodore Ts'o static loff_t ext4_max_size(int blkbits, int has_huge_files)
1890cd2291a4SEric Sandeen {
1891cd2291a4SEric Sandeen 	loff_t res;
1892cd2291a4SEric Sandeen 	loff_t upper_limit = MAX_LFS_FILESIZE;
1893cd2291a4SEric Sandeen 
1894cd2291a4SEric Sandeen 	/* small i_blocks in vfs inode? */
1895f287a1a5STheodore Ts'o 	if (!has_huge_files || sizeof(blkcnt_t) < sizeof(u64)) {
1896cd2291a4SEric Sandeen 		/*
1897b3a6ffe1SJens Axboe 		 * CONFIG_LBD is not enabled implies the inode
1898cd2291a4SEric Sandeen 		 * i_block represent total blocks in 512 bytes
1899cd2291a4SEric Sandeen 		 * 32 == size of vfs inode i_blocks * 8
1900cd2291a4SEric Sandeen 		 */
1901cd2291a4SEric Sandeen 		upper_limit = (1LL << 32) - 1;
1902cd2291a4SEric Sandeen 
1903cd2291a4SEric Sandeen 		/* total blocks in file system block size */
1904cd2291a4SEric Sandeen 		upper_limit >>= (blkbits - 9);
1905cd2291a4SEric Sandeen 		upper_limit <<= blkbits;
1906cd2291a4SEric Sandeen 	}
1907cd2291a4SEric Sandeen 
1908cd2291a4SEric Sandeen 	/* 32-bit extent-start container, ee_block */
1909cd2291a4SEric Sandeen 	res = 1LL << 32;
1910cd2291a4SEric Sandeen 	res <<= blkbits;
1911cd2291a4SEric Sandeen 	res -= 1;
1912cd2291a4SEric Sandeen 
1913cd2291a4SEric Sandeen 	/* Sanity check against vm- & vfs- imposed limits */
1914cd2291a4SEric Sandeen 	if (res > upper_limit)
1915cd2291a4SEric Sandeen 		res = upper_limit;
1916cd2291a4SEric Sandeen 
1917cd2291a4SEric Sandeen 	return res;
1918cd2291a4SEric Sandeen }
1919ac27a0ecSDave Kleikamp 
1920ac27a0ecSDave Kleikamp /*
1921cd2291a4SEric Sandeen  * Maximal bitmap file size.  There is a direct, and {,double-,triple-}indirect
19220fc1b451SAneesh Kumar K.V  * block limit, and also a limit of (2^48 - 1) 512-byte sectors in i_blocks.
19230fc1b451SAneesh Kumar K.V  * We need to be 1 filesystem block less than the 2^48 sector limit.
1924ac27a0ecSDave Kleikamp  */
1925f287a1a5STheodore Ts'o static loff_t ext4_max_bitmap_size(int bits, int has_huge_files)
1926ac27a0ecSDave Kleikamp {
1927617ba13bSMingming Cao 	loff_t res = EXT4_NDIR_BLOCKS;
19280fc1b451SAneesh Kumar K.V 	int meta_blocks;
19290fc1b451SAneesh Kumar K.V 	loff_t upper_limit;
19300fc1b451SAneesh Kumar K.V 	/* This is calculated to be the largest file size for a
1931cd2291a4SEric Sandeen 	 * dense, bitmapped file such that the total number of
1932ac27a0ecSDave Kleikamp 	 * sectors in the file, including data and all indirect blocks,
19330fc1b451SAneesh Kumar K.V 	 * does not exceed 2^48 -1
19340fc1b451SAneesh Kumar K.V 	 * __u32 i_blocks_lo and _u16 i_blocks_high representing the
19350fc1b451SAneesh Kumar K.V 	 * total number of  512 bytes blocks of the file
19360fc1b451SAneesh Kumar K.V 	 */
19370fc1b451SAneesh Kumar K.V 
1938f287a1a5STheodore Ts'o 	if (!has_huge_files || sizeof(blkcnt_t) < sizeof(u64)) {
19390fc1b451SAneesh Kumar K.V 		/*
1940b3a6ffe1SJens Axboe 		 * !has_huge_files or CONFIG_LBD is not enabled
1941f287a1a5STheodore Ts'o 		 * implies the inode i_block represent total blocks in
1942f287a1a5STheodore Ts'o 		 * 512 bytes 32 == size of vfs inode i_blocks * 8
19430fc1b451SAneesh Kumar K.V 		 */
19440fc1b451SAneesh Kumar K.V 		upper_limit = (1LL << 32) - 1;
19450fc1b451SAneesh Kumar K.V 
19460fc1b451SAneesh Kumar K.V 		/* total blocks in file system block size */
19470fc1b451SAneesh Kumar K.V 		upper_limit >>= (bits - 9);
19480fc1b451SAneesh Kumar K.V 
19490fc1b451SAneesh Kumar K.V 	} else {
19508180a562SAneesh Kumar K.V 		/*
19518180a562SAneesh Kumar K.V 		 * We use 48 bit ext4_inode i_blocks
19528180a562SAneesh Kumar K.V 		 * With EXT4_HUGE_FILE_FL set the i_blocks
19538180a562SAneesh Kumar K.V 		 * represent total number of blocks in
19548180a562SAneesh Kumar K.V 		 * file system block size
19558180a562SAneesh Kumar K.V 		 */
19560fc1b451SAneesh Kumar K.V 		upper_limit = (1LL << 48) - 1;
19570fc1b451SAneesh Kumar K.V 
19580fc1b451SAneesh Kumar K.V 	}
19590fc1b451SAneesh Kumar K.V 
19600fc1b451SAneesh Kumar K.V 	/* indirect blocks */
19610fc1b451SAneesh Kumar K.V 	meta_blocks = 1;
19620fc1b451SAneesh Kumar K.V 	/* double indirect blocks */
19630fc1b451SAneesh Kumar K.V 	meta_blocks += 1 + (1LL << (bits-2));
19640fc1b451SAneesh Kumar K.V 	/* tripple indirect blocks */
19650fc1b451SAneesh Kumar K.V 	meta_blocks += 1 + (1LL << (bits-2)) + (1LL << (2*(bits-2)));
19660fc1b451SAneesh Kumar K.V 
19670fc1b451SAneesh Kumar K.V 	upper_limit -= meta_blocks;
19680fc1b451SAneesh Kumar K.V 	upper_limit <<= bits;
1969ac27a0ecSDave Kleikamp 
1970ac27a0ecSDave Kleikamp 	res += 1LL << (bits-2);
1971ac27a0ecSDave Kleikamp 	res += 1LL << (2*(bits-2));
1972ac27a0ecSDave Kleikamp 	res += 1LL << (3*(bits-2));
1973ac27a0ecSDave Kleikamp 	res <<= bits;
1974ac27a0ecSDave Kleikamp 	if (res > upper_limit)
1975ac27a0ecSDave Kleikamp 		res = upper_limit;
19760fc1b451SAneesh Kumar K.V 
19770fc1b451SAneesh Kumar K.V 	if (res > MAX_LFS_FILESIZE)
19780fc1b451SAneesh Kumar K.V 		res = MAX_LFS_FILESIZE;
19790fc1b451SAneesh Kumar K.V 
1980ac27a0ecSDave Kleikamp 	return res;
1981ac27a0ecSDave Kleikamp }
1982ac27a0ecSDave Kleikamp 
1983617ba13bSMingming Cao static ext4_fsblk_t descriptor_loc(struct super_block *sb,
198470bbb3e0SAndrew Morton 				ext4_fsblk_t logical_sb_block, int nr)
1985ac27a0ecSDave Kleikamp {
1986617ba13bSMingming Cao 	struct ext4_sb_info *sbi = EXT4_SB(sb);
1987fd2d4291SAvantika Mathur 	ext4_group_t bg, first_meta_bg;
1988ac27a0ecSDave Kleikamp 	int has_super = 0;
1989ac27a0ecSDave Kleikamp 
1990ac27a0ecSDave Kleikamp 	first_meta_bg = le32_to_cpu(sbi->s_es->s_first_meta_bg);
1991ac27a0ecSDave Kleikamp 
1992617ba13bSMingming Cao 	if (!EXT4_HAS_INCOMPAT_FEATURE(sb, EXT4_FEATURE_INCOMPAT_META_BG) ||
1993ac27a0ecSDave Kleikamp 	    nr < first_meta_bg)
199470bbb3e0SAndrew Morton 		return logical_sb_block + nr + 1;
1995ac27a0ecSDave Kleikamp 	bg = sbi->s_desc_per_block * nr;
1996617ba13bSMingming Cao 	if (ext4_bg_has_super(sb, bg))
1997ac27a0ecSDave Kleikamp 		has_super = 1;
1998617ba13bSMingming Cao 	return (has_super + ext4_group_first_block_no(sb, bg));
1999ac27a0ecSDave Kleikamp }
2000ac27a0ecSDave Kleikamp 
2001c9de560dSAlex Tomas /**
2002c9de560dSAlex Tomas  * ext4_get_stripe_size: Get the stripe size.
2003c9de560dSAlex Tomas  * @sbi: In memory super block info
2004c9de560dSAlex Tomas  *
2005c9de560dSAlex Tomas  * If we have specified it via mount option, then
2006c9de560dSAlex Tomas  * use the mount option value. If the value specified at mount time is
2007c9de560dSAlex Tomas  * greater than the blocks per group use the super block value.
2008c9de560dSAlex Tomas  * If the super block value is greater than blocks per group return 0.
2009c9de560dSAlex Tomas  * Allocator needs it be less than blocks per group.
2010c9de560dSAlex Tomas  *
2011c9de560dSAlex Tomas  */
2012c9de560dSAlex Tomas static unsigned long ext4_get_stripe_size(struct ext4_sb_info *sbi)
2013c9de560dSAlex Tomas {
2014c9de560dSAlex Tomas 	unsigned long stride = le16_to_cpu(sbi->s_es->s_raid_stride);
2015c9de560dSAlex Tomas 	unsigned long stripe_width =
2016c9de560dSAlex Tomas 			le32_to_cpu(sbi->s_es->s_raid_stripe_width);
2017c9de560dSAlex Tomas 
2018c9de560dSAlex Tomas 	if (sbi->s_stripe && sbi->s_stripe <= sbi->s_blocks_per_group)
2019c9de560dSAlex Tomas 		return sbi->s_stripe;
2020c9de560dSAlex Tomas 
2021c9de560dSAlex Tomas 	if (stripe_width <= sbi->s_blocks_per_group)
2022c9de560dSAlex Tomas 		return stripe_width;
2023c9de560dSAlex Tomas 
2024c9de560dSAlex Tomas 	if (stride <= sbi->s_blocks_per_group)
2025c9de560dSAlex Tomas 		return stride;
2026c9de560dSAlex Tomas 
2027c9de560dSAlex Tomas 	return 0;
2028c9de560dSAlex Tomas }
2029ac27a0ecSDave Kleikamp 
20303197ebdbSTheodore Ts'o /* sysfs supprt */
20313197ebdbSTheodore Ts'o 
20323197ebdbSTheodore Ts'o struct ext4_attr {
20333197ebdbSTheodore Ts'o 	struct attribute attr;
20343197ebdbSTheodore Ts'o 	ssize_t (*show)(struct ext4_attr *, struct ext4_sb_info *, char *);
20353197ebdbSTheodore Ts'o 	ssize_t (*store)(struct ext4_attr *, struct ext4_sb_info *,
20363197ebdbSTheodore Ts'o 			 const char *, size_t);
20373197ebdbSTheodore Ts'o 	int offset;
20383197ebdbSTheodore Ts'o };
20393197ebdbSTheodore Ts'o 
20403197ebdbSTheodore Ts'o static int parse_strtoul(const char *buf,
20413197ebdbSTheodore Ts'o 		unsigned long max, unsigned long *value)
20423197ebdbSTheodore Ts'o {
20433197ebdbSTheodore Ts'o 	char *endp;
20443197ebdbSTheodore Ts'o 
20453197ebdbSTheodore Ts'o 	while (*buf && isspace(*buf))
20463197ebdbSTheodore Ts'o 		buf++;
20473197ebdbSTheodore Ts'o 	*value = simple_strtoul(buf, &endp, 0);
20483197ebdbSTheodore Ts'o 	while (*endp && isspace(*endp))
20493197ebdbSTheodore Ts'o 		endp++;
20503197ebdbSTheodore Ts'o 	if (*endp || *value > max)
20513197ebdbSTheodore Ts'o 		return -EINVAL;
20523197ebdbSTheodore Ts'o 
20533197ebdbSTheodore Ts'o 	return 0;
20543197ebdbSTheodore Ts'o }
20553197ebdbSTheodore Ts'o 
20563197ebdbSTheodore Ts'o static ssize_t delayed_allocation_blocks_show(struct ext4_attr *a,
20573197ebdbSTheodore Ts'o 					      struct ext4_sb_info *sbi,
20583197ebdbSTheodore Ts'o 					      char *buf)
20593197ebdbSTheodore Ts'o {
20603197ebdbSTheodore Ts'o 	return snprintf(buf, PAGE_SIZE, "%llu\n",
20613197ebdbSTheodore Ts'o 			(s64) percpu_counter_sum(&sbi->s_dirtyblocks_counter));
20623197ebdbSTheodore Ts'o }
20633197ebdbSTheodore Ts'o 
20643197ebdbSTheodore Ts'o static ssize_t session_write_kbytes_show(struct ext4_attr *a,
20653197ebdbSTheodore Ts'o 					 struct ext4_sb_info *sbi, char *buf)
20663197ebdbSTheodore Ts'o {
20673197ebdbSTheodore Ts'o 	struct super_block *sb = sbi->s_buddy_cache->i_sb;
20683197ebdbSTheodore Ts'o 
20693197ebdbSTheodore Ts'o 	return snprintf(buf, PAGE_SIZE, "%lu\n",
20703197ebdbSTheodore Ts'o 			(part_stat_read(sb->s_bdev->bd_part, sectors[1]) -
20713197ebdbSTheodore Ts'o 			 sbi->s_sectors_written_start) >> 1);
20723197ebdbSTheodore Ts'o }
20733197ebdbSTheodore Ts'o 
20743197ebdbSTheodore Ts'o static ssize_t lifetime_write_kbytes_show(struct ext4_attr *a,
20753197ebdbSTheodore Ts'o 					  struct ext4_sb_info *sbi, char *buf)
20763197ebdbSTheodore Ts'o {
20773197ebdbSTheodore Ts'o 	struct super_block *sb = sbi->s_buddy_cache->i_sb;
20783197ebdbSTheodore Ts'o 
20793197ebdbSTheodore Ts'o 	return snprintf(buf, PAGE_SIZE, "%llu\n",
20803197ebdbSTheodore Ts'o 			sbi->s_kbytes_written +
20813197ebdbSTheodore Ts'o 			((part_stat_read(sb->s_bdev->bd_part, sectors[1]) -
20823197ebdbSTheodore Ts'o 			  EXT4_SB(sb)->s_sectors_written_start) >> 1));
20833197ebdbSTheodore Ts'o }
20843197ebdbSTheodore Ts'o 
20853197ebdbSTheodore Ts'o static ssize_t inode_readahead_blks_store(struct ext4_attr *a,
20863197ebdbSTheodore Ts'o 					  struct ext4_sb_info *sbi,
20873197ebdbSTheodore Ts'o 					  const char *buf, size_t count)
20883197ebdbSTheodore Ts'o {
20893197ebdbSTheodore Ts'o 	unsigned long t;
20903197ebdbSTheodore Ts'o 
20913197ebdbSTheodore Ts'o 	if (parse_strtoul(buf, 0x40000000, &t))
20923197ebdbSTheodore Ts'o 		return -EINVAL;
20933197ebdbSTheodore Ts'o 
20943197ebdbSTheodore Ts'o 	/* inode_readahead_blks must be a power of 2 */
20953197ebdbSTheodore Ts'o 	if (t & (t-1))
20963197ebdbSTheodore Ts'o 		return -EINVAL;
20973197ebdbSTheodore Ts'o 
20983197ebdbSTheodore Ts'o 	sbi->s_inode_readahead_blks = t;
20993197ebdbSTheodore Ts'o 	return count;
21003197ebdbSTheodore Ts'o }
21013197ebdbSTheodore Ts'o 
21023197ebdbSTheodore Ts'o static ssize_t sbi_ui_show(struct ext4_attr *a,
21033197ebdbSTheodore Ts'o 				struct ext4_sb_info *sbi, char *buf)
21043197ebdbSTheodore Ts'o {
21053197ebdbSTheodore Ts'o 	unsigned int *ui = (unsigned int *) (((char *) sbi) + a->offset);
21063197ebdbSTheodore Ts'o 
21073197ebdbSTheodore Ts'o 	return snprintf(buf, PAGE_SIZE, "%u\n", *ui);
21083197ebdbSTheodore Ts'o }
21093197ebdbSTheodore Ts'o 
21103197ebdbSTheodore Ts'o static ssize_t sbi_ui_store(struct ext4_attr *a,
21113197ebdbSTheodore Ts'o 			    struct ext4_sb_info *sbi,
21123197ebdbSTheodore Ts'o 			    const char *buf, size_t count)
21133197ebdbSTheodore Ts'o {
21143197ebdbSTheodore Ts'o 	unsigned int *ui = (unsigned int *) (((char *) sbi) + a->offset);
21153197ebdbSTheodore Ts'o 	unsigned long t;
21163197ebdbSTheodore Ts'o 
21173197ebdbSTheodore Ts'o 	if (parse_strtoul(buf, 0xffffffff, &t))
21183197ebdbSTheodore Ts'o 		return -EINVAL;
21193197ebdbSTheodore Ts'o 	*ui = t;
21203197ebdbSTheodore Ts'o 	return count;
21213197ebdbSTheodore Ts'o }
21223197ebdbSTheodore Ts'o 
21233197ebdbSTheodore Ts'o #define EXT4_ATTR_OFFSET(_name,_mode,_show,_store,_elname) \
21243197ebdbSTheodore Ts'o static struct ext4_attr ext4_attr_##_name = {			\
21253197ebdbSTheodore Ts'o 	.attr = {.name = __stringify(_name), .mode = _mode },	\
21263197ebdbSTheodore Ts'o 	.show	= _show,					\
21273197ebdbSTheodore Ts'o 	.store	= _store,					\
21283197ebdbSTheodore Ts'o 	.offset = offsetof(struct ext4_sb_info, _elname),	\
21293197ebdbSTheodore Ts'o }
21303197ebdbSTheodore Ts'o #define EXT4_ATTR(name, mode, show, store) \
21313197ebdbSTheodore Ts'o static struct ext4_attr ext4_attr_##name = __ATTR(name, mode, show, store)
21323197ebdbSTheodore Ts'o 
21333197ebdbSTheodore Ts'o #define EXT4_RO_ATTR(name) EXT4_ATTR(name, 0444, name##_show, NULL)
21343197ebdbSTheodore Ts'o #define EXT4_RW_ATTR(name) EXT4_ATTR(name, 0644, name##_show, name##_store)
21353197ebdbSTheodore Ts'o #define EXT4_RW_ATTR_SBI_UI(name, elname)	\
21363197ebdbSTheodore Ts'o 	EXT4_ATTR_OFFSET(name, 0644, sbi_ui_show, sbi_ui_store, elname)
21373197ebdbSTheodore Ts'o #define ATTR_LIST(name) &ext4_attr_##name.attr
21383197ebdbSTheodore Ts'o 
21393197ebdbSTheodore Ts'o EXT4_RO_ATTR(delayed_allocation_blocks);
21403197ebdbSTheodore Ts'o EXT4_RO_ATTR(session_write_kbytes);
21413197ebdbSTheodore Ts'o EXT4_RO_ATTR(lifetime_write_kbytes);
21423197ebdbSTheodore Ts'o EXT4_ATTR_OFFSET(inode_readahead_blks, 0644, sbi_ui_show,
21433197ebdbSTheodore Ts'o 		 inode_readahead_blks_store, s_inode_readahead_blks);
21443197ebdbSTheodore Ts'o EXT4_RW_ATTR_SBI_UI(mb_stats, s_mb_stats);
21453197ebdbSTheodore Ts'o EXT4_RW_ATTR_SBI_UI(mb_max_to_scan, s_mb_max_to_scan);
21463197ebdbSTheodore Ts'o EXT4_RW_ATTR_SBI_UI(mb_min_to_scan, s_mb_min_to_scan);
21473197ebdbSTheodore Ts'o EXT4_RW_ATTR_SBI_UI(mb_order2_req, s_mb_order2_reqs);
21483197ebdbSTheodore Ts'o EXT4_RW_ATTR_SBI_UI(mb_stream_req, s_mb_stream_request);
21493197ebdbSTheodore Ts'o EXT4_RW_ATTR_SBI_UI(mb_group_prealloc, s_mb_group_prealloc);
21503197ebdbSTheodore Ts'o 
21513197ebdbSTheodore Ts'o static struct attribute *ext4_attrs[] = {
21523197ebdbSTheodore Ts'o 	ATTR_LIST(delayed_allocation_blocks),
21533197ebdbSTheodore Ts'o 	ATTR_LIST(session_write_kbytes),
21543197ebdbSTheodore Ts'o 	ATTR_LIST(lifetime_write_kbytes),
21553197ebdbSTheodore Ts'o 	ATTR_LIST(inode_readahead_blks),
21563197ebdbSTheodore Ts'o 	ATTR_LIST(mb_stats),
21573197ebdbSTheodore Ts'o 	ATTR_LIST(mb_max_to_scan),
21583197ebdbSTheodore Ts'o 	ATTR_LIST(mb_min_to_scan),
21593197ebdbSTheodore Ts'o 	ATTR_LIST(mb_order2_req),
21603197ebdbSTheodore Ts'o 	ATTR_LIST(mb_stream_req),
21613197ebdbSTheodore Ts'o 	ATTR_LIST(mb_group_prealloc),
21623197ebdbSTheodore Ts'o 	NULL,
21633197ebdbSTheodore Ts'o };
21643197ebdbSTheodore Ts'o 
21653197ebdbSTheodore Ts'o static ssize_t ext4_attr_show(struct kobject *kobj,
21663197ebdbSTheodore Ts'o 			      struct attribute *attr, char *buf)
21673197ebdbSTheodore Ts'o {
21683197ebdbSTheodore Ts'o 	struct ext4_sb_info *sbi = container_of(kobj, struct ext4_sb_info,
21693197ebdbSTheodore Ts'o 						s_kobj);
21703197ebdbSTheodore Ts'o 	struct ext4_attr *a = container_of(attr, struct ext4_attr, attr);
21713197ebdbSTheodore Ts'o 
21723197ebdbSTheodore Ts'o 	return a->show ? a->show(a, sbi, buf) : 0;
21733197ebdbSTheodore Ts'o }
21743197ebdbSTheodore Ts'o 
21753197ebdbSTheodore Ts'o static ssize_t ext4_attr_store(struct kobject *kobj,
21763197ebdbSTheodore Ts'o 			       struct attribute *attr,
21773197ebdbSTheodore Ts'o 			       const char *buf, size_t len)
21783197ebdbSTheodore Ts'o {
21793197ebdbSTheodore Ts'o 	struct ext4_sb_info *sbi = container_of(kobj, struct ext4_sb_info,
21803197ebdbSTheodore Ts'o 						s_kobj);
21813197ebdbSTheodore Ts'o 	struct ext4_attr *a = container_of(attr, struct ext4_attr, attr);
21823197ebdbSTheodore Ts'o 
21833197ebdbSTheodore Ts'o 	return a->store ? a->store(a, sbi, buf, len) : 0;
21843197ebdbSTheodore Ts'o }
21853197ebdbSTheodore Ts'o 
21863197ebdbSTheodore Ts'o static void ext4_sb_release(struct kobject *kobj)
21873197ebdbSTheodore Ts'o {
21883197ebdbSTheodore Ts'o 	struct ext4_sb_info *sbi = container_of(kobj, struct ext4_sb_info,
21893197ebdbSTheodore Ts'o 						s_kobj);
21903197ebdbSTheodore Ts'o 	complete(&sbi->s_kobj_unregister);
21913197ebdbSTheodore Ts'o }
21923197ebdbSTheodore Ts'o 
21933197ebdbSTheodore Ts'o 
21943197ebdbSTheodore Ts'o static struct sysfs_ops ext4_attr_ops = {
21953197ebdbSTheodore Ts'o 	.show	= ext4_attr_show,
21963197ebdbSTheodore Ts'o 	.store	= ext4_attr_store,
21973197ebdbSTheodore Ts'o };
21983197ebdbSTheodore Ts'o 
21993197ebdbSTheodore Ts'o static struct kobj_type ext4_ktype = {
22003197ebdbSTheodore Ts'o 	.default_attrs	= ext4_attrs,
22013197ebdbSTheodore Ts'o 	.sysfs_ops	= &ext4_attr_ops,
22023197ebdbSTheodore Ts'o 	.release	= ext4_sb_release,
22033197ebdbSTheodore Ts'o };
22043197ebdbSTheodore Ts'o 
2205617ba13bSMingming Cao static int ext4_fill_super(struct super_block *sb, void *data, int silent)
22067477827fSAneesh Kumar K.V 				__releases(kernel_lock)
22077477827fSAneesh Kumar K.V 				__acquires(kernel_lock)
22081d03ec98SAneesh Kumar K.V 
2209ac27a0ecSDave Kleikamp {
2210ac27a0ecSDave Kleikamp 	struct buffer_head *bh;
2211617ba13bSMingming Cao 	struct ext4_super_block *es = NULL;
2212617ba13bSMingming Cao 	struct ext4_sb_info *sbi;
2213617ba13bSMingming Cao 	ext4_fsblk_t block;
2214617ba13bSMingming Cao 	ext4_fsblk_t sb_block = get_sb_block(&data);
221570bbb3e0SAndrew Morton 	ext4_fsblk_t logical_sb_block;
2216ac27a0ecSDave Kleikamp 	unsigned long offset = 0;
2217ac27a0ecSDave Kleikamp 	unsigned long journal_devnum = 0;
2218ac27a0ecSDave Kleikamp 	unsigned long def_mount_opts;
2219ac27a0ecSDave Kleikamp 	struct inode *root;
22209f6200bbSTheodore Ts'o 	char *cp;
22210390131bSFrank Mayhar 	const char *descr;
22221d1fe1eeSDavid Howells 	int ret = -EINVAL;
2223ac27a0ecSDave Kleikamp 	int blocksize;
22244ec11028STheodore Ts'o 	unsigned int db_count;
22254ec11028STheodore Ts'o 	unsigned int i;
2226f287a1a5STheodore Ts'o 	int needs_recovery, has_huge_files;
22273a06d778SAneesh Kumar K.V 	int features;
2228bd81d8eeSLaurent Vivier 	__u64 blocks_count;
2229833f4077SPeter Zijlstra 	int err;
2230b3881f74STheodore Ts'o 	unsigned int journal_ioprio = DEFAULT_JOURNAL_IOPRIO;
2231ac27a0ecSDave Kleikamp 
2232ac27a0ecSDave Kleikamp 	sbi = kzalloc(sizeof(*sbi), GFP_KERNEL);
2233ac27a0ecSDave Kleikamp 	if (!sbi)
2234ac27a0ecSDave Kleikamp 		return -ENOMEM;
2235705895b6SPekka Enberg 
2236705895b6SPekka Enberg 	sbi->s_blockgroup_lock =
2237705895b6SPekka Enberg 		kzalloc(sizeof(struct blockgroup_lock), GFP_KERNEL);
2238705895b6SPekka Enberg 	if (!sbi->s_blockgroup_lock) {
2239705895b6SPekka Enberg 		kfree(sbi);
2240705895b6SPekka Enberg 		return -ENOMEM;
2241705895b6SPekka Enberg 	}
2242ac27a0ecSDave Kleikamp 	sb->s_fs_info = sbi;
2243ac27a0ecSDave Kleikamp 	sbi->s_mount_opt = 0;
2244617ba13bSMingming Cao 	sbi->s_resuid = EXT4_DEF_RESUID;
2245617ba13bSMingming Cao 	sbi->s_resgid = EXT4_DEF_RESGID;
2246240799cdSTheodore Ts'o 	sbi->s_inode_readahead_blks = EXT4_DEF_INODE_READAHEAD_BLKS;
2247d9c9bef1SMiklos Szeredi 	sbi->s_sb_block = sb_block;
2248afc32f7eSTheodore Ts'o 	sbi->s_sectors_written_start = part_stat_read(sb->s_bdev->bd_part,
2249afc32f7eSTheodore Ts'o 						      sectors[1]);
2250ac27a0ecSDave Kleikamp 
2251ac27a0ecSDave Kleikamp 	unlock_kernel();
2252ac27a0ecSDave Kleikamp 
22539f6200bbSTheodore Ts'o 	/* Cleanup superblock name */
22549f6200bbSTheodore Ts'o 	for (cp = sb->s_id; (cp = strchr(cp, '/'));)
22559f6200bbSTheodore Ts'o 		*cp = '!';
22569f6200bbSTheodore Ts'o 
2257617ba13bSMingming Cao 	blocksize = sb_min_blocksize(sb, EXT4_MIN_BLOCK_SIZE);
2258ac27a0ecSDave Kleikamp 	if (!blocksize) {
2259617ba13bSMingming Cao 		printk(KERN_ERR "EXT4-fs: unable to set blocksize\n");
2260ac27a0ecSDave Kleikamp 		goto out_fail;
2261ac27a0ecSDave Kleikamp 	}
2262ac27a0ecSDave Kleikamp 
2263ac27a0ecSDave Kleikamp 	/*
2264617ba13bSMingming Cao 	 * The ext4 superblock will not be buffer aligned for other than 1kB
2265ac27a0ecSDave Kleikamp 	 * block sizes.  We need to calculate the offset from buffer start.
2266ac27a0ecSDave Kleikamp 	 */
2267617ba13bSMingming Cao 	if (blocksize != EXT4_MIN_BLOCK_SIZE) {
226870bbb3e0SAndrew Morton 		logical_sb_block = sb_block * EXT4_MIN_BLOCK_SIZE;
226970bbb3e0SAndrew Morton 		offset = do_div(logical_sb_block, blocksize);
2270ac27a0ecSDave Kleikamp 	} else {
227170bbb3e0SAndrew Morton 		logical_sb_block = sb_block;
2272ac27a0ecSDave Kleikamp 	}
2273ac27a0ecSDave Kleikamp 
227470bbb3e0SAndrew Morton 	if (!(bh = sb_bread(sb, logical_sb_block))) {
2275617ba13bSMingming Cao 		printk(KERN_ERR "EXT4-fs: unable to read superblock\n");
2276ac27a0ecSDave Kleikamp 		goto out_fail;
2277ac27a0ecSDave Kleikamp 	}
2278ac27a0ecSDave Kleikamp 	/*
2279ac27a0ecSDave Kleikamp 	 * Note: s_es must be initialized as soon as possible because
2280617ba13bSMingming Cao 	 *       some ext4 macro-instructions depend on its value
2281ac27a0ecSDave Kleikamp 	 */
2282617ba13bSMingming Cao 	es = (struct ext4_super_block *) (((char *)bh->b_data) + offset);
2283ac27a0ecSDave Kleikamp 	sbi->s_es = es;
2284ac27a0ecSDave Kleikamp 	sb->s_magic = le16_to_cpu(es->s_magic);
2285617ba13bSMingming Cao 	if (sb->s_magic != EXT4_SUPER_MAGIC)
2286617ba13bSMingming Cao 		goto cantfind_ext4;
2287afc32f7eSTheodore Ts'o 	sbi->s_kbytes_written = le64_to_cpu(es->s_kbytes_written);
2288ac27a0ecSDave Kleikamp 
2289ac27a0ecSDave Kleikamp 	/* Set defaults before we parse the mount options */
2290ac27a0ecSDave Kleikamp 	def_mount_opts = le32_to_cpu(es->s_default_mount_opts);
2291617ba13bSMingming Cao 	if (def_mount_opts & EXT4_DEFM_DEBUG)
2292ac27a0ecSDave Kleikamp 		set_opt(sbi->s_mount_opt, DEBUG);
2293617ba13bSMingming Cao 	if (def_mount_opts & EXT4_DEFM_BSDGROUPS)
2294ac27a0ecSDave Kleikamp 		set_opt(sbi->s_mount_opt, GRPID);
2295617ba13bSMingming Cao 	if (def_mount_opts & EXT4_DEFM_UID16)
2296ac27a0ecSDave Kleikamp 		set_opt(sbi->s_mount_opt, NO_UID32);
229703010a33STheodore Ts'o #ifdef CONFIG_EXT4_FS_XATTR
2298617ba13bSMingming Cao 	if (def_mount_opts & EXT4_DEFM_XATTR_USER)
2299ac27a0ecSDave Kleikamp 		set_opt(sbi->s_mount_opt, XATTR_USER);
23002e7842b8SHugh Dickins #endif
230103010a33STheodore Ts'o #ifdef CONFIG_EXT4_FS_POSIX_ACL
2302617ba13bSMingming Cao 	if (def_mount_opts & EXT4_DEFM_ACL)
2303ac27a0ecSDave Kleikamp 		set_opt(sbi->s_mount_opt, POSIX_ACL);
23042e7842b8SHugh Dickins #endif
2305617ba13bSMingming Cao 	if ((def_mount_opts & EXT4_DEFM_JMODE) == EXT4_DEFM_JMODE_DATA)
2306617ba13bSMingming Cao 		sbi->s_mount_opt |= EXT4_MOUNT_JOURNAL_DATA;
2307617ba13bSMingming Cao 	else if ((def_mount_opts & EXT4_DEFM_JMODE) == EXT4_DEFM_JMODE_ORDERED)
2308617ba13bSMingming Cao 		sbi->s_mount_opt |= EXT4_MOUNT_ORDERED_DATA;
2309617ba13bSMingming Cao 	else if ((def_mount_opts & EXT4_DEFM_JMODE) == EXT4_DEFM_JMODE_WBACK)
2310617ba13bSMingming Cao 		sbi->s_mount_opt |= EXT4_MOUNT_WRITEBACK_DATA;
2311ac27a0ecSDave Kleikamp 
2312617ba13bSMingming Cao 	if (le16_to_cpu(sbi->s_es->s_errors) == EXT4_ERRORS_PANIC)
2313ac27a0ecSDave Kleikamp 		set_opt(sbi->s_mount_opt, ERRORS_PANIC);
2314bb4f397aSAneesh Kumar K.V 	else if (le16_to_cpu(sbi->s_es->s_errors) == EXT4_ERRORS_CONTINUE)
2315ceea16bfSDmitry Mishin 		set_opt(sbi->s_mount_opt, ERRORS_CONT);
2316bb4f397aSAneesh Kumar K.V 	else
2317bb4f397aSAneesh Kumar K.V 		set_opt(sbi->s_mount_opt, ERRORS_RO);
2318ac27a0ecSDave Kleikamp 
2319ac27a0ecSDave Kleikamp 	sbi->s_resuid = le16_to_cpu(es->s_def_resuid);
2320ac27a0ecSDave Kleikamp 	sbi->s_resgid = le16_to_cpu(es->s_def_resgid);
232130773840STheodore Ts'o 	sbi->s_commit_interval = JBD2_DEFAULT_MAX_COMMIT_AGE * HZ;
232230773840STheodore Ts'o 	sbi->s_min_batch_time = EXT4_DEF_MIN_BATCH_TIME;
232330773840STheodore Ts'o 	sbi->s_max_batch_time = EXT4_DEF_MAX_BATCH_TIME;
2324ac27a0ecSDave Kleikamp 
2325571640caSEric Sandeen 	set_opt(sbi->s_mount_opt, BARRIER);
2326ac27a0ecSDave Kleikamp 
23271e2462f9SMingming Cao 	/*
2328dd919b98SAneesh Kumar K.V 	 * enable delayed allocation by default
2329dd919b98SAneesh Kumar K.V 	 * Use -o nodelalloc to turn it off
2330dd919b98SAneesh Kumar K.V 	 */
2331dd919b98SAneesh Kumar K.V 	set_opt(sbi->s_mount_opt, DELALLOC);
2332dd919b98SAneesh Kumar K.V 
2333dd919b98SAneesh Kumar K.V 
2334b3881f74STheodore Ts'o 	if (!parse_options((char *) data, sb, &journal_devnum,
2335b3881f74STheodore Ts'o 			   &journal_ioprio, NULL, 0))
2336ac27a0ecSDave Kleikamp 		goto failed_mount;
2337ac27a0ecSDave Kleikamp 
2338ac27a0ecSDave Kleikamp 	sb->s_flags = (sb->s_flags & ~MS_POSIXACL) |
2339617ba13bSMingming Cao 		((sbi->s_mount_opt & EXT4_MOUNT_POSIX_ACL) ? MS_POSIXACL : 0);
2340ac27a0ecSDave Kleikamp 
2341617ba13bSMingming Cao 	if (le32_to_cpu(es->s_rev_level) == EXT4_GOOD_OLD_REV &&
2342617ba13bSMingming Cao 	    (EXT4_HAS_COMPAT_FEATURE(sb, ~0U) ||
2343617ba13bSMingming Cao 	     EXT4_HAS_RO_COMPAT_FEATURE(sb, ~0U) ||
2344617ba13bSMingming Cao 	     EXT4_HAS_INCOMPAT_FEATURE(sb, ~0U)))
2345ac27a0ecSDave Kleikamp 		printk(KERN_WARNING
2346617ba13bSMingming Cao 		       "EXT4-fs warning: feature flags set on rev 0 fs, "
2347ac27a0ecSDave Kleikamp 		       "running e2fsck is recommended\n");
2348469108ffSTheodore Tso 
2349469108ffSTheodore Tso 	/*
2350ac27a0ecSDave Kleikamp 	 * Check feature flags regardless of the revision level, since we
2351ac27a0ecSDave Kleikamp 	 * previously didn't change the revision level when setting the flags,
2352ac27a0ecSDave Kleikamp 	 * so there is a chance incompat flags are set on a rev 0 filesystem.
2353ac27a0ecSDave Kleikamp 	 */
2354617ba13bSMingming Cao 	features = EXT4_HAS_INCOMPAT_FEATURE(sb, ~EXT4_FEATURE_INCOMPAT_SUPP);
2355ac27a0ecSDave Kleikamp 	if (features) {
2356617ba13bSMingming Cao 		printk(KERN_ERR "EXT4-fs: %s: couldn't mount because of "
23573a06d778SAneesh Kumar K.V 		       "unsupported optional features (%x).\n", sb->s_id,
23583a06d778SAneesh Kumar K.V 			(le32_to_cpu(EXT4_SB(sb)->s_es->s_feature_incompat) &
23593a06d778SAneesh Kumar K.V 			~EXT4_FEATURE_INCOMPAT_SUPP));
2360ac27a0ecSDave Kleikamp 		goto failed_mount;
2361ac27a0ecSDave Kleikamp 	}
2362617ba13bSMingming Cao 	features = EXT4_HAS_RO_COMPAT_FEATURE(sb, ~EXT4_FEATURE_RO_COMPAT_SUPP);
2363ac27a0ecSDave Kleikamp 	if (!(sb->s_flags & MS_RDONLY) && features) {
2364617ba13bSMingming Cao 		printk(KERN_ERR "EXT4-fs: %s: couldn't mount RDWR because of "
23653a06d778SAneesh Kumar K.V 		       "unsupported optional features (%x).\n", sb->s_id,
23663a06d778SAneesh Kumar K.V 			(le32_to_cpu(EXT4_SB(sb)->s_es->s_feature_ro_compat) &
23673a06d778SAneesh Kumar K.V 			~EXT4_FEATURE_RO_COMPAT_SUPP));
2368ac27a0ecSDave Kleikamp 		goto failed_mount;
2369ac27a0ecSDave Kleikamp 	}
2370f287a1a5STheodore Ts'o 	has_huge_files = EXT4_HAS_RO_COMPAT_FEATURE(sb,
2371f287a1a5STheodore Ts'o 				    EXT4_FEATURE_RO_COMPAT_HUGE_FILE);
2372f287a1a5STheodore Ts'o 	if (has_huge_files) {
23730fc1b451SAneesh Kumar K.V 		/*
23740fc1b451SAneesh Kumar K.V 		 * Large file size enabled file system can only be
2375b3a6ffe1SJens Axboe 		 * mount if kernel is build with CONFIG_LBD
23760fc1b451SAneesh Kumar K.V 		 */
23770fc1b451SAneesh Kumar K.V 		if (sizeof(root->i_blocks) < sizeof(u64) &&
23780fc1b451SAneesh Kumar K.V 				!(sb->s_flags & MS_RDONLY)) {
23790fc1b451SAneesh Kumar K.V 			printk(KERN_ERR "EXT4-fs: %s: Filesystem with huge "
23800fc1b451SAneesh Kumar K.V 					"files cannot be mounted read-write "
2381b3a6ffe1SJens Axboe 					"without CONFIG_LBD.\n", sb->s_id);
23820fc1b451SAneesh Kumar K.V 			goto failed_mount;
23830fc1b451SAneesh Kumar K.V 		}
23840fc1b451SAneesh Kumar K.V 	}
2385ac27a0ecSDave Kleikamp 	blocksize = BLOCK_SIZE << le32_to_cpu(es->s_log_block_size);
2386ac27a0ecSDave Kleikamp 
2387617ba13bSMingming Cao 	if (blocksize < EXT4_MIN_BLOCK_SIZE ||
2388617ba13bSMingming Cao 	    blocksize > EXT4_MAX_BLOCK_SIZE) {
2389ac27a0ecSDave Kleikamp 		printk(KERN_ERR
2390617ba13bSMingming Cao 		       "EXT4-fs: Unsupported filesystem blocksize %d on %s.\n",
2391ac27a0ecSDave Kleikamp 		       blocksize, sb->s_id);
2392ac27a0ecSDave Kleikamp 		goto failed_mount;
2393ac27a0ecSDave Kleikamp 	}
2394ac27a0ecSDave Kleikamp 
2395ac27a0ecSDave Kleikamp 	if (sb->s_blocksize != blocksize) {
2396ce40733cSAneesh Kumar K.V 
2397ce40733cSAneesh Kumar K.V 		/* Validate the filesystem blocksize */
2398ce40733cSAneesh Kumar K.V 		if (!sb_set_blocksize(sb, blocksize)) {
2399ce40733cSAneesh Kumar K.V 			printk(KERN_ERR "EXT4-fs: bad block size %d.\n",
2400ce40733cSAneesh Kumar K.V 					blocksize);
2401ac27a0ecSDave Kleikamp 			goto failed_mount;
2402ac27a0ecSDave Kleikamp 		}
2403ac27a0ecSDave Kleikamp 
2404ac27a0ecSDave Kleikamp 		brelse(bh);
240570bbb3e0SAndrew Morton 		logical_sb_block = sb_block * EXT4_MIN_BLOCK_SIZE;
240670bbb3e0SAndrew Morton 		offset = do_div(logical_sb_block, blocksize);
240770bbb3e0SAndrew Morton 		bh = sb_bread(sb, logical_sb_block);
2408ac27a0ecSDave Kleikamp 		if (!bh) {
2409ac27a0ecSDave Kleikamp 			printk(KERN_ERR
2410617ba13bSMingming Cao 			       "EXT4-fs: Can't read superblock on 2nd try.\n");
2411ac27a0ecSDave Kleikamp 			goto failed_mount;
2412ac27a0ecSDave Kleikamp 		}
2413617ba13bSMingming Cao 		es = (struct ext4_super_block *)(((char *)bh->b_data) + offset);
2414ac27a0ecSDave Kleikamp 		sbi->s_es = es;
2415617ba13bSMingming Cao 		if (es->s_magic != cpu_to_le16(EXT4_SUPER_MAGIC)) {
2416ac27a0ecSDave Kleikamp 			printk(KERN_ERR
2417617ba13bSMingming Cao 			       "EXT4-fs: Magic mismatch, very weird !\n");
2418ac27a0ecSDave Kleikamp 			goto failed_mount;
2419ac27a0ecSDave Kleikamp 		}
2420ac27a0ecSDave Kleikamp 	}
2421ac27a0ecSDave Kleikamp 
2422f287a1a5STheodore Ts'o 	sbi->s_bitmap_maxbytes = ext4_max_bitmap_size(sb->s_blocksize_bits,
2423f287a1a5STheodore Ts'o 						      has_huge_files);
2424f287a1a5STheodore Ts'o 	sb->s_maxbytes = ext4_max_size(sb->s_blocksize_bits, has_huge_files);
2425ac27a0ecSDave Kleikamp 
2426617ba13bSMingming Cao 	if (le32_to_cpu(es->s_rev_level) == EXT4_GOOD_OLD_REV) {
2427617ba13bSMingming Cao 		sbi->s_inode_size = EXT4_GOOD_OLD_INODE_SIZE;
2428617ba13bSMingming Cao 		sbi->s_first_ino = EXT4_GOOD_OLD_FIRST_INO;
2429ac27a0ecSDave Kleikamp 	} else {
2430ac27a0ecSDave Kleikamp 		sbi->s_inode_size = le16_to_cpu(es->s_inode_size);
2431ac27a0ecSDave Kleikamp 		sbi->s_first_ino = le32_to_cpu(es->s_first_ino);
2432617ba13bSMingming Cao 		if ((sbi->s_inode_size < EXT4_GOOD_OLD_INODE_SIZE) ||
24331330593eSVignesh Babu 		    (!is_power_of_2(sbi->s_inode_size)) ||
2434ac27a0ecSDave Kleikamp 		    (sbi->s_inode_size > blocksize)) {
2435ac27a0ecSDave Kleikamp 			printk(KERN_ERR
2436617ba13bSMingming Cao 			       "EXT4-fs: unsupported inode size: %d\n",
2437ac27a0ecSDave Kleikamp 			       sbi->s_inode_size);
2438ac27a0ecSDave Kleikamp 			goto failed_mount;
2439ac27a0ecSDave Kleikamp 		}
2440ef7f3835SKalpak Shah 		if (sbi->s_inode_size > EXT4_GOOD_OLD_INODE_SIZE)
2441ef7f3835SKalpak Shah 			sb->s_time_gran = 1 << (EXT4_EPOCH_BITS - 2);
2442ac27a0ecSDave Kleikamp 	}
24430d1ee42fSAlexandre Ratchov 	sbi->s_desc_size = le16_to_cpu(es->s_desc_size);
24440d1ee42fSAlexandre Ratchov 	if (EXT4_HAS_INCOMPAT_FEATURE(sb, EXT4_FEATURE_INCOMPAT_64BIT)) {
24458fadc143SAlexandre Ratchov 		if (sbi->s_desc_size < EXT4_MIN_DESC_SIZE_64BIT ||
24460d1ee42fSAlexandre Ratchov 		    sbi->s_desc_size > EXT4_MAX_DESC_SIZE ||
2447d8ea6cf8Svignesh babu 		    !is_power_of_2(sbi->s_desc_size)) {
24480d1ee42fSAlexandre Ratchov 			printk(KERN_ERR
24498fadc143SAlexandre Ratchov 			       "EXT4-fs: unsupported descriptor size %lu\n",
24500d1ee42fSAlexandre Ratchov 			       sbi->s_desc_size);
24510d1ee42fSAlexandre Ratchov 			goto failed_mount;
24520d1ee42fSAlexandre Ratchov 		}
24530d1ee42fSAlexandre Ratchov 	} else
24540d1ee42fSAlexandre Ratchov 		sbi->s_desc_size = EXT4_MIN_DESC_SIZE;
2455ac27a0ecSDave Kleikamp 	sbi->s_blocks_per_group = le32_to_cpu(es->s_blocks_per_group);
2456ac27a0ecSDave Kleikamp 	sbi->s_inodes_per_group = le32_to_cpu(es->s_inodes_per_group);
2457b47b6f38SAndries E. Brouwer 	if (EXT4_INODE_SIZE(sb) == 0 || EXT4_INODES_PER_GROUP(sb) == 0)
2458617ba13bSMingming Cao 		goto cantfind_ext4;
2459617ba13bSMingming Cao 	sbi->s_inodes_per_block = blocksize / EXT4_INODE_SIZE(sb);
2460ac27a0ecSDave Kleikamp 	if (sbi->s_inodes_per_block == 0)
2461617ba13bSMingming Cao 		goto cantfind_ext4;
2462ac27a0ecSDave Kleikamp 	sbi->s_itb_per_group = sbi->s_inodes_per_group /
2463ac27a0ecSDave Kleikamp 					sbi->s_inodes_per_block;
24640d1ee42fSAlexandre Ratchov 	sbi->s_desc_per_block = blocksize / EXT4_DESC_SIZE(sb);
2465ac27a0ecSDave Kleikamp 	sbi->s_sbh = bh;
2466ac27a0ecSDave Kleikamp 	sbi->s_mount_state = le16_to_cpu(es->s_state);
2467e57aa839SFengguang Wu 	sbi->s_addr_per_block_bits = ilog2(EXT4_ADDR_PER_BLOCK(sb));
2468e57aa839SFengguang Wu 	sbi->s_desc_per_block_bits = ilog2(EXT4_DESC_PER_BLOCK(sb));
2469ac27a0ecSDave Kleikamp 	for (i = 0; i < 4; i++)
2470ac27a0ecSDave Kleikamp 		sbi->s_hash_seed[i] = le32_to_cpu(es->s_hash_seed[i]);
2471ac27a0ecSDave Kleikamp 	sbi->s_def_hash_version = es->s_def_hash_version;
2472f99b2589STheodore Ts'o 	i = le32_to_cpu(es->s_flags);
2473f99b2589STheodore Ts'o 	if (i & EXT2_FLAGS_UNSIGNED_HASH)
2474f99b2589STheodore Ts'o 		sbi->s_hash_unsigned = 3;
2475f99b2589STheodore Ts'o 	else if ((i & EXT2_FLAGS_SIGNED_HASH) == 0) {
2476f99b2589STheodore Ts'o #ifdef __CHAR_UNSIGNED__
2477f99b2589STheodore Ts'o 		es->s_flags |= cpu_to_le32(EXT2_FLAGS_UNSIGNED_HASH);
2478f99b2589STheodore Ts'o 		sbi->s_hash_unsigned = 3;
2479f99b2589STheodore Ts'o #else
2480f99b2589STheodore Ts'o 		es->s_flags |= cpu_to_le32(EXT2_FLAGS_SIGNED_HASH);
2481f99b2589STheodore Ts'o #endif
2482f99b2589STheodore Ts'o 		sb->s_dirt = 1;
2483f99b2589STheodore Ts'o 	}
2484ac27a0ecSDave Kleikamp 
2485ac27a0ecSDave Kleikamp 	if (sbi->s_blocks_per_group > blocksize * 8) {
2486ac27a0ecSDave Kleikamp 		printk(KERN_ERR
2487617ba13bSMingming Cao 		       "EXT4-fs: #blocks per group too big: %lu\n",
2488ac27a0ecSDave Kleikamp 		       sbi->s_blocks_per_group);
2489ac27a0ecSDave Kleikamp 		goto failed_mount;
2490ac27a0ecSDave Kleikamp 	}
2491ac27a0ecSDave Kleikamp 	if (sbi->s_inodes_per_group > blocksize * 8) {
2492ac27a0ecSDave Kleikamp 		printk(KERN_ERR
2493617ba13bSMingming Cao 		       "EXT4-fs: #inodes per group too big: %lu\n",
2494ac27a0ecSDave Kleikamp 		       sbi->s_inodes_per_group);
2495ac27a0ecSDave Kleikamp 		goto failed_mount;
2496ac27a0ecSDave Kleikamp 	}
2497ac27a0ecSDave Kleikamp 
2498bd81d8eeSLaurent Vivier 	if (ext4_blocks_count(es) >
2499ac27a0ecSDave Kleikamp 		    (sector_t)(~0ULL) >> (sb->s_blocksize_bits - 9)) {
2500617ba13bSMingming Cao 		printk(KERN_ERR "EXT4-fs: filesystem on %s:"
2501ac27a0ecSDave Kleikamp 			" too large to mount safely\n", sb->s_id);
2502ac27a0ecSDave Kleikamp 		if (sizeof(sector_t) < 8)
2503617ba13bSMingming Cao 			printk(KERN_WARNING "EXT4-fs: CONFIG_LBD not "
2504ac27a0ecSDave Kleikamp 					"enabled\n");
2505ac27a0ecSDave Kleikamp 		goto failed_mount;
2506ac27a0ecSDave Kleikamp 	}
2507ac27a0ecSDave Kleikamp 
2508617ba13bSMingming Cao 	if (EXT4_BLOCKS_PER_GROUP(sb) == 0)
2509617ba13bSMingming Cao 		goto cantfind_ext4;
2510e7c95593SEric Sandeen 
25114ec11028STheodore Ts'o         /*
25124ec11028STheodore Ts'o          * It makes no sense for the first data block to be beyond the end
25134ec11028STheodore Ts'o          * of the filesystem.
25144ec11028STheodore Ts'o          */
25154ec11028STheodore Ts'o         if (le32_to_cpu(es->s_first_data_block) >= ext4_blocks_count(es)) {
25164ec11028STheodore Ts'o                 printk(KERN_WARNING "EXT4-fs: bad geometry: first data"
25174ec11028STheodore Ts'o 		       "block %u is beyond end of filesystem (%llu)\n",
2518e7c95593SEric Sandeen 		       le32_to_cpu(es->s_first_data_block),
25194ec11028STheodore Ts'o 		       ext4_blocks_count(es));
2520e7c95593SEric Sandeen 		goto failed_mount;
2521e7c95593SEric Sandeen 	}
2522bd81d8eeSLaurent Vivier 	blocks_count = (ext4_blocks_count(es) -
2523bd81d8eeSLaurent Vivier 			le32_to_cpu(es->s_first_data_block) +
2524bd81d8eeSLaurent Vivier 			EXT4_BLOCKS_PER_GROUP(sb) - 1);
2525bd81d8eeSLaurent Vivier 	do_div(blocks_count, EXT4_BLOCKS_PER_GROUP(sb));
25264ec11028STheodore Ts'o 	if (blocks_count > ((uint64_t)1<<32) - EXT4_DESC_PER_BLOCK(sb)) {
25274ec11028STheodore Ts'o 		printk(KERN_WARNING "EXT4-fs: groups count too large: %u "
25284ec11028STheodore Ts'o 		       "(block count %llu, first data block %u, "
25294ec11028STheodore Ts'o 		       "blocks per group %lu)\n", sbi->s_groups_count,
25304ec11028STheodore Ts'o 		       ext4_blocks_count(es),
25314ec11028STheodore Ts'o 		       le32_to_cpu(es->s_first_data_block),
25324ec11028STheodore Ts'o 		       EXT4_BLOCKS_PER_GROUP(sb));
25334ec11028STheodore Ts'o 		goto failed_mount;
25344ec11028STheodore Ts'o 	}
2535bd81d8eeSLaurent Vivier 	sbi->s_groups_count = blocks_count;
2536617ba13bSMingming Cao 	db_count = (sbi->s_groups_count + EXT4_DESC_PER_BLOCK(sb) - 1) /
2537617ba13bSMingming Cao 		   EXT4_DESC_PER_BLOCK(sb);
2538ac27a0ecSDave Kleikamp 	sbi->s_group_desc = kmalloc(db_count * sizeof(struct buffer_head *),
2539ac27a0ecSDave Kleikamp 				    GFP_KERNEL);
2540ac27a0ecSDave Kleikamp 	if (sbi->s_group_desc == NULL) {
2541617ba13bSMingming Cao 		printk(KERN_ERR "EXT4-fs: not enough memory\n");
2542ac27a0ecSDave Kleikamp 		goto failed_mount;
2543ac27a0ecSDave Kleikamp 	}
2544ac27a0ecSDave Kleikamp 
25453244fcb1SAlexander Beregalov #ifdef CONFIG_PROC_FS
25469f6200bbSTheodore Ts'o 	if (ext4_proc_root)
25479f6200bbSTheodore Ts'o 		sbi->s_proc = proc_mkdir(sb->s_id, ext4_proc_root);
25483244fcb1SAlexander Beregalov #endif
2549240799cdSTheodore Ts'o 
2550705895b6SPekka Enberg 	bgl_lock_init(sbi->s_blockgroup_lock);
2551ac27a0ecSDave Kleikamp 
2552ac27a0ecSDave Kleikamp 	for (i = 0; i < db_count; i++) {
255370bbb3e0SAndrew Morton 		block = descriptor_loc(sb, logical_sb_block, i);
2554ac27a0ecSDave Kleikamp 		sbi->s_group_desc[i] = sb_bread(sb, block);
2555ac27a0ecSDave Kleikamp 		if (!sbi->s_group_desc[i]) {
2556617ba13bSMingming Cao 			printk(KERN_ERR "EXT4-fs: "
2557ac27a0ecSDave Kleikamp 			       "can't read group descriptor %d\n", i);
2558ac27a0ecSDave Kleikamp 			db_count = i;
2559ac27a0ecSDave Kleikamp 			goto failed_mount2;
2560ac27a0ecSDave Kleikamp 		}
2561ac27a0ecSDave Kleikamp 	}
2562617ba13bSMingming Cao 	if (!ext4_check_descriptors(sb)) {
2563617ba13bSMingming Cao 		printk(KERN_ERR "EXT4-fs: group descriptors corrupted!\n");
2564ac27a0ecSDave Kleikamp 		goto failed_mount2;
2565ac27a0ecSDave Kleikamp 	}
2566772cb7c8SJose R. Santos 	if (EXT4_HAS_INCOMPAT_FEATURE(sb, EXT4_FEATURE_INCOMPAT_FLEX_BG))
2567772cb7c8SJose R. Santos 		if (!ext4_fill_flex_info(sb)) {
2568772cb7c8SJose R. Santos 			printk(KERN_ERR
2569772cb7c8SJose R. Santos 			       "EXT4-fs: unable to initialize "
2570772cb7c8SJose R. Santos 			       "flex_bg meta info!\n");
2571772cb7c8SJose R. Santos 			goto failed_mount2;
2572772cb7c8SJose R. Santos 		}
2573772cb7c8SJose R. Santos 
2574ac27a0ecSDave Kleikamp 	sbi->s_gdb_count = db_count;
2575ac27a0ecSDave Kleikamp 	get_random_bytes(&sbi->s_next_generation, sizeof(u32));
2576ac27a0ecSDave Kleikamp 	spin_lock_init(&sbi->s_next_gen_lock);
2577ac27a0ecSDave Kleikamp 
2578833f4077SPeter Zijlstra 	err = percpu_counter_init(&sbi->s_freeblocks_counter,
2579617ba13bSMingming Cao 			ext4_count_free_blocks(sb));
2580833f4077SPeter Zijlstra 	if (!err) {
2581833f4077SPeter Zijlstra 		err = percpu_counter_init(&sbi->s_freeinodes_counter,
2582617ba13bSMingming Cao 				ext4_count_free_inodes(sb));
2583833f4077SPeter Zijlstra 	}
2584833f4077SPeter Zijlstra 	if (!err) {
2585833f4077SPeter Zijlstra 		err = percpu_counter_init(&sbi->s_dirs_counter,
2586617ba13bSMingming Cao 				ext4_count_dirs(sb));
2587833f4077SPeter Zijlstra 	}
25886bc6e63fSAneesh Kumar K.V 	if (!err) {
25896bc6e63fSAneesh Kumar K.V 		err = percpu_counter_init(&sbi->s_dirtyblocks_counter, 0);
25906bc6e63fSAneesh Kumar K.V 	}
2591833f4077SPeter Zijlstra 	if (err) {
2592833f4077SPeter Zijlstra 		printk(KERN_ERR "EXT4-fs: insufficient memory\n");
2593833f4077SPeter Zijlstra 		goto failed_mount3;
2594833f4077SPeter Zijlstra 	}
2595ac27a0ecSDave Kleikamp 
2596c9de560dSAlex Tomas 	sbi->s_stripe = ext4_get_stripe_size(sbi);
2597c9de560dSAlex Tomas 
2598ac27a0ecSDave Kleikamp 	/*
2599ac27a0ecSDave Kleikamp 	 * set up enough so that it can read an inode
2600ac27a0ecSDave Kleikamp 	 */
2601617ba13bSMingming Cao 	sb->s_op = &ext4_sops;
2602617ba13bSMingming Cao 	sb->s_export_op = &ext4_export_ops;
2603617ba13bSMingming Cao 	sb->s_xattr = ext4_xattr_handlers;
2604ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
2605617ba13bSMingming Cao 	sb->s_qcop = &ext4_qctl_operations;
2606617ba13bSMingming Cao 	sb->dq_op = &ext4_quota_operations;
2607ac27a0ecSDave Kleikamp #endif
2608ac27a0ecSDave Kleikamp 	INIT_LIST_HEAD(&sbi->s_orphan); /* unlinked but open files */
2609ac27a0ecSDave Kleikamp 
2610ac27a0ecSDave Kleikamp 	sb->s_root = NULL;
2611ac27a0ecSDave Kleikamp 
2612ac27a0ecSDave Kleikamp 	needs_recovery = (es->s_last_orphan != 0 ||
2613617ba13bSMingming Cao 			  EXT4_HAS_INCOMPAT_FEATURE(sb,
2614617ba13bSMingming Cao 				    EXT4_FEATURE_INCOMPAT_RECOVER));
2615ac27a0ecSDave Kleikamp 
2616ac27a0ecSDave Kleikamp 	/*
2617ac27a0ecSDave Kleikamp 	 * The first inode we look at is the journal inode.  Don't try
2618ac27a0ecSDave Kleikamp 	 * root first: it may be modified in the journal!
2619ac27a0ecSDave Kleikamp 	 */
2620ac27a0ecSDave Kleikamp 	if (!test_opt(sb, NOLOAD) &&
2621617ba13bSMingming Cao 	    EXT4_HAS_COMPAT_FEATURE(sb, EXT4_FEATURE_COMPAT_HAS_JOURNAL)) {
2622617ba13bSMingming Cao 		if (ext4_load_journal(sb, es, journal_devnum))
2623ac27a0ecSDave Kleikamp 			goto failed_mount3;
2624624080edSTheodore Ts'o 		if (!(sb->s_flags & MS_RDONLY) &&
2625624080edSTheodore Ts'o 		    EXT4_SB(sb)->s_journal->j_failed_commit) {
2626624080edSTheodore Ts'o 			printk(KERN_CRIT "EXT4-fs error (device %s): "
2627624080edSTheodore Ts'o 			       "ext4_fill_super: Journal transaction "
2628624080edSTheodore Ts'o 			       "%u is corrupt\n", sb->s_id,
2629624080edSTheodore Ts'o 			       EXT4_SB(sb)->s_journal->j_failed_commit);
2630624080edSTheodore Ts'o 			if (test_opt(sb, ERRORS_RO)) {
2631624080edSTheodore Ts'o 				printk(KERN_CRIT
2632624080edSTheodore Ts'o 				       "Mounting filesystem read-only\n");
2633624080edSTheodore Ts'o 				sb->s_flags |= MS_RDONLY;
2634624080edSTheodore Ts'o 				EXT4_SB(sb)->s_mount_state |= EXT4_ERROR_FS;
2635624080edSTheodore Ts'o 				es->s_state |= cpu_to_le16(EXT4_ERROR_FS);
2636624080edSTheodore Ts'o 			}
2637624080edSTheodore Ts'o 			if (test_opt(sb, ERRORS_PANIC)) {
2638624080edSTheodore Ts'o 				EXT4_SB(sb)->s_mount_state |= EXT4_ERROR_FS;
2639624080edSTheodore Ts'o 				es->s_state |= cpu_to_le16(EXT4_ERROR_FS);
2640624080edSTheodore Ts'o 				ext4_commit_super(sb, es, 1);
2641624080edSTheodore Ts'o 				goto failed_mount4;
2642624080edSTheodore Ts'o 			}
2643624080edSTheodore Ts'o 		}
26440390131bSFrank Mayhar 	} else if (test_opt(sb, NOLOAD) && !(sb->s_flags & MS_RDONLY) &&
26450390131bSFrank Mayhar 	      EXT4_HAS_INCOMPAT_FEATURE(sb, EXT4_FEATURE_INCOMPAT_RECOVER)) {
26460390131bSFrank Mayhar 		printk(KERN_ERR "EXT4-fs: required journal recovery "
26470390131bSFrank Mayhar 		       "suppressed and not mounted read-only\n");
26480390131bSFrank Mayhar 		goto failed_mount4;
2649ac27a0ecSDave Kleikamp 	} else {
26500390131bSFrank Mayhar 		clear_opt(sbi->s_mount_opt, DATA_FLAGS);
26510390131bSFrank Mayhar 		set_opt(sbi->s_mount_opt, WRITEBACK_DATA);
26520390131bSFrank Mayhar 		sbi->s_journal = NULL;
26530390131bSFrank Mayhar 		needs_recovery = 0;
26540390131bSFrank Mayhar 		goto no_journal;
2655ac27a0ecSDave Kleikamp 	}
2656ac27a0ecSDave Kleikamp 
2657eb40a09cSJose R. Santos 	if (ext4_blocks_count(es) > 0xffffffffULL &&
2658eb40a09cSJose R. Santos 	    !jbd2_journal_set_features(EXT4_SB(sb)->s_journal, 0, 0,
2659eb40a09cSJose R. Santos 				       JBD2_FEATURE_INCOMPAT_64BIT)) {
2660abda1418STheodore Ts'o 		printk(KERN_ERR "EXT4-fs: Failed to set 64-bit journal feature\n");
2661eb40a09cSJose R. Santos 		goto failed_mount4;
2662eb40a09cSJose R. Santos 	}
2663eb40a09cSJose R. Santos 
2664818d276cSGirish Shilamkar 	if (test_opt(sb, JOURNAL_ASYNC_COMMIT)) {
2665818d276cSGirish Shilamkar 		jbd2_journal_set_features(sbi->s_journal,
2666818d276cSGirish Shilamkar 				JBD2_FEATURE_COMPAT_CHECKSUM, 0,
2667818d276cSGirish Shilamkar 				JBD2_FEATURE_INCOMPAT_ASYNC_COMMIT);
2668818d276cSGirish Shilamkar 	} else if (test_opt(sb, JOURNAL_CHECKSUM)) {
2669818d276cSGirish Shilamkar 		jbd2_journal_set_features(sbi->s_journal,
2670818d276cSGirish Shilamkar 				JBD2_FEATURE_COMPAT_CHECKSUM, 0, 0);
2671818d276cSGirish Shilamkar 		jbd2_journal_clear_features(sbi->s_journal, 0, 0,
2672818d276cSGirish Shilamkar 				JBD2_FEATURE_INCOMPAT_ASYNC_COMMIT);
2673818d276cSGirish Shilamkar 	} else {
2674818d276cSGirish Shilamkar 		jbd2_journal_clear_features(sbi->s_journal,
2675818d276cSGirish Shilamkar 				JBD2_FEATURE_COMPAT_CHECKSUM, 0,
2676818d276cSGirish Shilamkar 				JBD2_FEATURE_INCOMPAT_ASYNC_COMMIT);
2677818d276cSGirish Shilamkar 	}
2678818d276cSGirish Shilamkar 
2679ac27a0ecSDave Kleikamp 	/* We have now updated the journal if required, so we can
2680ac27a0ecSDave Kleikamp 	 * validate the data journaling mode. */
2681ac27a0ecSDave Kleikamp 	switch (test_opt(sb, DATA_FLAGS)) {
2682ac27a0ecSDave Kleikamp 	case 0:
2683ac27a0ecSDave Kleikamp 		/* No mode set, assume a default based on the journal
268463f57933SAndrew Morton 		 * capabilities: ORDERED_DATA if the journal can
268563f57933SAndrew Morton 		 * cope, else JOURNAL_DATA
268663f57933SAndrew Morton 		 */
2687dab291afSMingming Cao 		if (jbd2_journal_check_available_features
2688dab291afSMingming Cao 		    (sbi->s_journal, 0, 0, JBD2_FEATURE_INCOMPAT_REVOKE))
2689ac27a0ecSDave Kleikamp 			set_opt(sbi->s_mount_opt, ORDERED_DATA);
2690ac27a0ecSDave Kleikamp 		else
2691ac27a0ecSDave Kleikamp 			set_opt(sbi->s_mount_opt, JOURNAL_DATA);
2692ac27a0ecSDave Kleikamp 		break;
2693ac27a0ecSDave Kleikamp 
2694617ba13bSMingming Cao 	case EXT4_MOUNT_ORDERED_DATA:
2695617ba13bSMingming Cao 	case EXT4_MOUNT_WRITEBACK_DATA:
2696dab291afSMingming Cao 		if (!jbd2_journal_check_available_features
2697dab291afSMingming Cao 		    (sbi->s_journal, 0, 0, JBD2_FEATURE_INCOMPAT_REVOKE)) {
2698617ba13bSMingming Cao 			printk(KERN_ERR "EXT4-fs: Journal does not support "
2699ac27a0ecSDave Kleikamp 			       "requested data journaling mode\n");
2700ac27a0ecSDave Kleikamp 			goto failed_mount4;
2701ac27a0ecSDave Kleikamp 		}
2702ac27a0ecSDave Kleikamp 	default:
2703ac27a0ecSDave Kleikamp 		break;
2704ac27a0ecSDave Kleikamp 	}
2705b3881f74STheodore Ts'o 	set_task_ioprio(sbi->s_journal->j_task, journal_ioprio);
2706ac27a0ecSDave Kleikamp 
27070390131bSFrank Mayhar no_journal:
2708ac27a0ecSDave Kleikamp 
2709ac27a0ecSDave Kleikamp 	if (test_opt(sb, NOBH)) {
2710617ba13bSMingming Cao 		if (!(test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_WRITEBACK_DATA)) {
2711617ba13bSMingming Cao 			printk(KERN_WARNING "EXT4-fs: Ignoring nobh option - "
2712ac27a0ecSDave Kleikamp 				"its supported only with writeback mode\n");
2713ac27a0ecSDave Kleikamp 			clear_opt(sbi->s_mount_opt, NOBH);
2714ac27a0ecSDave Kleikamp 		}
2715ac27a0ecSDave Kleikamp 	}
2716ac27a0ecSDave Kleikamp 	/*
2717dab291afSMingming Cao 	 * The jbd2_journal_load will have done any necessary log recovery,
2718ac27a0ecSDave Kleikamp 	 * so we can safely mount the rest of the filesystem now.
2719ac27a0ecSDave Kleikamp 	 */
2720ac27a0ecSDave Kleikamp 
27211d1fe1eeSDavid Howells 	root = ext4_iget(sb, EXT4_ROOT_INO);
27221d1fe1eeSDavid Howells 	if (IS_ERR(root)) {
2723617ba13bSMingming Cao 		printk(KERN_ERR "EXT4-fs: get root inode failed\n");
27241d1fe1eeSDavid Howells 		ret = PTR_ERR(root);
2725ac27a0ecSDave Kleikamp 		goto failed_mount4;
2726ac27a0ecSDave Kleikamp 	}
2727ac27a0ecSDave Kleikamp 	if (!S_ISDIR(root->i_mode) || !root->i_blocks || !root->i_size) {
27281d1fe1eeSDavid Howells 		iput(root);
2729617ba13bSMingming Cao 		printk(KERN_ERR "EXT4-fs: corrupt root inode, run e2fsck\n");
2730ac27a0ecSDave Kleikamp 		goto failed_mount4;
2731ac27a0ecSDave Kleikamp 	}
27321d1fe1eeSDavid Howells 	sb->s_root = d_alloc_root(root);
27331d1fe1eeSDavid Howells 	if (!sb->s_root) {
27341d1fe1eeSDavid Howells 		printk(KERN_ERR "EXT4-fs: get root dentry failed\n");
27351d1fe1eeSDavid Howells 		iput(root);
27361d1fe1eeSDavid Howells 		ret = -ENOMEM;
27371d1fe1eeSDavid Howells 		goto failed_mount4;
27381d1fe1eeSDavid Howells 	}
2739ac27a0ecSDave Kleikamp 
2740617ba13bSMingming Cao 	ext4_setup_super(sb, es, sb->s_flags & MS_RDONLY);
2741ef7f3835SKalpak Shah 
2742ef7f3835SKalpak Shah 	/* determine the minimum size of new large inodes, if present */
2743ef7f3835SKalpak Shah 	if (sbi->s_inode_size > EXT4_GOOD_OLD_INODE_SIZE) {
2744ef7f3835SKalpak Shah 		sbi->s_want_extra_isize = sizeof(struct ext4_inode) -
2745ef7f3835SKalpak Shah 						     EXT4_GOOD_OLD_INODE_SIZE;
2746ef7f3835SKalpak Shah 		if (EXT4_HAS_RO_COMPAT_FEATURE(sb,
2747ef7f3835SKalpak Shah 				       EXT4_FEATURE_RO_COMPAT_EXTRA_ISIZE)) {
2748ef7f3835SKalpak Shah 			if (sbi->s_want_extra_isize <
2749ef7f3835SKalpak Shah 			    le16_to_cpu(es->s_want_extra_isize))
2750ef7f3835SKalpak Shah 				sbi->s_want_extra_isize =
2751ef7f3835SKalpak Shah 					le16_to_cpu(es->s_want_extra_isize);
2752ef7f3835SKalpak Shah 			if (sbi->s_want_extra_isize <
2753ef7f3835SKalpak Shah 			    le16_to_cpu(es->s_min_extra_isize))
2754ef7f3835SKalpak Shah 				sbi->s_want_extra_isize =
2755ef7f3835SKalpak Shah 					le16_to_cpu(es->s_min_extra_isize);
2756ef7f3835SKalpak Shah 		}
2757ef7f3835SKalpak Shah 	}
2758ef7f3835SKalpak Shah 	/* Check if enough inode space is available */
2759ef7f3835SKalpak Shah 	if (EXT4_GOOD_OLD_INODE_SIZE + sbi->s_want_extra_isize >
2760ef7f3835SKalpak Shah 							sbi->s_inode_size) {
2761ef7f3835SKalpak Shah 		sbi->s_want_extra_isize = sizeof(struct ext4_inode) -
2762ef7f3835SKalpak Shah 						       EXT4_GOOD_OLD_INODE_SIZE;
2763ef7f3835SKalpak Shah 		printk(KERN_INFO "EXT4-fs: required extra inode space not"
2764ef7f3835SKalpak Shah 			"available.\n");
2765ef7f3835SKalpak Shah 	}
2766ef7f3835SKalpak Shah 
2767c2774d84SAneesh Kumar K.V 	if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_JOURNAL_DATA) {
2768c2774d84SAneesh Kumar K.V 		printk(KERN_WARNING "EXT4-fs: Ignoring delalloc option - "
2769c2774d84SAneesh Kumar K.V 				"requested data journaling mode\n");
2770c2774d84SAneesh Kumar K.V 		clear_opt(sbi->s_mount_opt, DELALLOC);
2771c2774d84SAneesh Kumar K.V 	} else if (test_opt(sb, DELALLOC))
2772c2774d84SAneesh Kumar K.V 		printk(KERN_INFO "EXT4-fs: delayed allocation enabled\n");
2773c2774d84SAneesh Kumar K.V 
2774c2774d84SAneesh Kumar K.V 	ext4_ext_init(sb);
2775c2774d84SAneesh Kumar K.V 	err = ext4_mb_init(sb, needs_recovery);
2776c2774d84SAneesh Kumar K.V 	if (err) {
2777c2774d84SAneesh Kumar K.V 		printk(KERN_ERR "EXT4-fs: failed to initalize mballoc (%d)\n",
2778c2774d84SAneesh Kumar K.V 		       err);
2779c2774d84SAneesh Kumar K.V 		goto failed_mount4;
2780c2774d84SAneesh Kumar K.V 	}
2781c2774d84SAneesh Kumar K.V 
27823197ebdbSTheodore Ts'o 	sbi->s_kobj.kset = ext4_kset;
27833197ebdbSTheodore Ts'o 	init_completion(&sbi->s_kobj_unregister);
27843197ebdbSTheodore Ts'o 	err = kobject_init_and_add(&sbi->s_kobj, &ext4_ktype, NULL,
27853197ebdbSTheodore Ts'o 				   "%s", sb->s_id);
27863197ebdbSTheodore Ts'o 	if (err) {
27873197ebdbSTheodore Ts'o 		ext4_mb_release(sb);
27883197ebdbSTheodore Ts'o 		ext4_ext_release(sb);
27893197ebdbSTheodore Ts'o 		goto failed_mount4;
27903197ebdbSTheodore Ts'o 	};
27913197ebdbSTheodore Ts'o 
2792ac27a0ecSDave Kleikamp 	/*
2793ac27a0ecSDave Kleikamp 	 * akpm: core read_super() calls in here with the superblock locked.
2794ac27a0ecSDave Kleikamp 	 * That deadlocks, because orphan cleanup needs to lock the superblock
2795ac27a0ecSDave Kleikamp 	 * in numerous places.  Here we just pop the lock - it's relatively
2796ac27a0ecSDave Kleikamp 	 * harmless, because we are now ready to accept write_super() requests,
2797ac27a0ecSDave Kleikamp 	 * and aviro says that's the only reason for hanging onto the
2798ac27a0ecSDave Kleikamp 	 * superblock lock.
2799ac27a0ecSDave Kleikamp 	 */
2800617ba13bSMingming Cao 	EXT4_SB(sb)->s_mount_state |= EXT4_ORPHAN_FS;
2801617ba13bSMingming Cao 	ext4_orphan_cleanup(sb, es);
2802617ba13bSMingming Cao 	EXT4_SB(sb)->s_mount_state &= ~EXT4_ORPHAN_FS;
28030390131bSFrank Mayhar 	if (needs_recovery) {
2804617ba13bSMingming Cao 		printk(KERN_INFO "EXT4-fs: recovery complete.\n");
2805617ba13bSMingming Cao 		ext4_mark_recovery_complete(sb, es);
28060390131bSFrank Mayhar 	}
28070390131bSFrank Mayhar 	if (EXT4_SB(sb)->s_journal) {
28080390131bSFrank Mayhar 		if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_JOURNAL_DATA)
28090390131bSFrank Mayhar 			descr = " journalled data mode";
28100390131bSFrank Mayhar 		else if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_ORDERED_DATA)
28110390131bSFrank Mayhar 			descr = " ordered data mode";
28120390131bSFrank Mayhar 		else
28130390131bSFrank Mayhar 			descr = " writeback data mode";
28140390131bSFrank Mayhar 	} else
28150390131bSFrank Mayhar 		descr = "out journal";
28160390131bSFrank Mayhar 
28170390131bSFrank Mayhar 	printk(KERN_INFO "EXT4-fs: mounted filesystem %s with%s\n",
28180390131bSFrank Mayhar 	       sb->s_id, descr);
2819ac27a0ecSDave Kleikamp 
2820ac27a0ecSDave Kleikamp 	lock_kernel();
2821ac27a0ecSDave Kleikamp 	return 0;
2822ac27a0ecSDave Kleikamp 
2823617ba13bSMingming Cao cantfind_ext4:
2824ac27a0ecSDave Kleikamp 	if (!silent)
2825617ba13bSMingming Cao 		printk(KERN_ERR "VFS: Can't find ext4 filesystem on dev %s.\n",
2826ac27a0ecSDave Kleikamp 		       sb->s_id);
2827ac27a0ecSDave Kleikamp 	goto failed_mount;
2828ac27a0ecSDave Kleikamp 
2829ac27a0ecSDave Kleikamp failed_mount4:
28300390131bSFrank Mayhar 	printk(KERN_ERR "EXT4-fs (device %s): mount failed\n", sb->s_id);
28310390131bSFrank Mayhar 	if (sbi->s_journal) {
2832dab291afSMingming Cao 		jbd2_journal_destroy(sbi->s_journal);
283347b4a50bSJan Kara 		sbi->s_journal = NULL;
28340390131bSFrank Mayhar 	}
2835ac27a0ecSDave Kleikamp failed_mount3:
2836ac27a0ecSDave Kleikamp 	percpu_counter_destroy(&sbi->s_freeblocks_counter);
2837ac27a0ecSDave Kleikamp 	percpu_counter_destroy(&sbi->s_freeinodes_counter);
2838ac27a0ecSDave Kleikamp 	percpu_counter_destroy(&sbi->s_dirs_counter);
28396bc6e63fSAneesh Kumar K.V 	percpu_counter_destroy(&sbi->s_dirtyblocks_counter);
2840ac27a0ecSDave Kleikamp failed_mount2:
2841ac27a0ecSDave Kleikamp 	for (i = 0; i < db_count; i++)
2842ac27a0ecSDave Kleikamp 		brelse(sbi->s_group_desc[i]);
2843ac27a0ecSDave Kleikamp 	kfree(sbi->s_group_desc);
2844ac27a0ecSDave Kleikamp failed_mount:
2845240799cdSTheodore Ts'o 	if (sbi->s_proc) {
28469f6200bbSTheodore Ts'o 		remove_proc_entry(sb->s_id, ext4_proc_root);
2847240799cdSTheodore Ts'o 	}
2848ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
2849ac27a0ecSDave Kleikamp 	for (i = 0; i < MAXQUOTAS; i++)
2850ac27a0ecSDave Kleikamp 		kfree(sbi->s_qf_names[i]);
2851ac27a0ecSDave Kleikamp #endif
2852617ba13bSMingming Cao 	ext4_blkdev_remove(sbi);
2853ac27a0ecSDave Kleikamp 	brelse(bh);
2854ac27a0ecSDave Kleikamp out_fail:
2855ac27a0ecSDave Kleikamp 	sb->s_fs_info = NULL;
2856ac27a0ecSDave Kleikamp 	kfree(sbi);
2857ac27a0ecSDave Kleikamp 	lock_kernel();
28581d1fe1eeSDavid Howells 	return ret;
2859ac27a0ecSDave Kleikamp }
2860ac27a0ecSDave Kleikamp 
2861ac27a0ecSDave Kleikamp /*
2862ac27a0ecSDave Kleikamp  * Setup any per-fs journal parameters now.  We'll do this both on
2863ac27a0ecSDave Kleikamp  * initial mount, once the journal has been initialised but before we've
2864ac27a0ecSDave Kleikamp  * done any recovery; and again on any subsequent remount.
2865ac27a0ecSDave Kleikamp  */
2866617ba13bSMingming Cao static void ext4_init_journal_params(struct super_block *sb, journal_t *journal)
2867ac27a0ecSDave Kleikamp {
2868617ba13bSMingming Cao 	struct ext4_sb_info *sbi = EXT4_SB(sb);
2869ac27a0ecSDave Kleikamp 
2870ac27a0ecSDave Kleikamp 	journal->j_commit_interval = sbi->s_commit_interval;
287130773840STheodore Ts'o 	journal->j_min_batch_time = sbi->s_min_batch_time;
287230773840STheodore Ts'o 	journal->j_max_batch_time = sbi->s_max_batch_time;
2873ac27a0ecSDave Kleikamp 
2874ac27a0ecSDave Kleikamp 	spin_lock(&journal->j_state_lock);
2875ac27a0ecSDave Kleikamp 	if (test_opt(sb, BARRIER))
2876dab291afSMingming Cao 		journal->j_flags |= JBD2_BARRIER;
2877ac27a0ecSDave Kleikamp 	else
2878dab291afSMingming Cao 		journal->j_flags &= ~JBD2_BARRIER;
28795bf5683aSHidehiro Kawai 	if (test_opt(sb, DATA_ERR_ABORT))
28805bf5683aSHidehiro Kawai 		journal->j_flags |= JBD2_ABORT_ON_SYNCDATA_ERR;
28815bf5683aSHidehiro Kawai 	else
28825bf5683aSHidehiro Kawai 		journal->j_flags &= ~JBD2_ABORT_ON_SYNCDATA_ERR;
2883ac27a0ecSDave Kleikamp 	spin_unlock(&journal->j_state_lock);
2884ac27a0ecSDave Kleikamp }
2885ac27a0ecSDave Kleikamp 
2886617ba13bSMingming Cao static journal_t *ext4_get_journal(struct super_block *sb,
2887ac27a0ecSDave Kleikamp 				   unsigned int journal_inum)
2888ac27a0ecSDave Kleikamp {
2889ac27a0ecSDave Kleikamp 	struct inode *journal_inode;
2890ac27a0ecSDave Kleikamp 	journal_t *journal;
2891ac27a0ecSDave Kleikamp 
28920390131bSFrank Mayhar 	BUG_ON(!EXT4_HAS_COMPAT_FEATURE(sb, EXT4_FEATURE_COMPAT_HAS_JOURNAL));
28930390131bSFrank Mayhar 
2894ac27a0ecSDave Kleikamp 	/* First, test for the existence of a valid inode on disk.  Bad
2895ac27a0ecSDave Kleikamp 	 * things happen if we iget() an unused inode, as the subsequent
2896ac27a0ecSDave Kleikamp 	 * iput() will try to delete it. */
2897ac27a0ecSDave Kleikamp 
28981d1fe1eeSDavid Howells 	journal_inode = ext4_iget(sb, journal_inum);
28991d1fe1eeSDavid Howells 	if (IS_ERR(journal_inode)) {
2900617ba13bSMingming Cao 		printk(KERN_ERR "EXT4-fs: no journal found.\n");
2901ac27a0ecSDave Kleikamp 		return NULL;
2902ac27a0ecSDave Kleikamp 	}
2903ac27a0ecSDave Kleikamp 	if (!journal_inode->i_nlink) {
2904ac27a0ecSDave Kleikamp 		make_bad_inode(journal_inode);
2905ac27a0ecSDave Kleikamp 		iput(journal_inode);
2906617ba13bSMingming Cao 		printk(KERN_ERR "EXT4-fs: journal inode is deleted.\n");
2907ac27a0ecSDave Kleikamp 		return NULL;
2908ac27a0ecSDave Kleikamp 	}
2909ac27a0ecSDave Kleikamp 
2910e5f8eab8STheodore Ts'o 	jbd_debug(2, "Journal inode found at %p: %lld bytes\n",
2911ac27a0ecSDave Kleikamp 		  journal_inode, journal_inode->i_size);
29121d1fe1eeSDavid Howells 	if (!S_ISREG(journal_inode->i_mode)) {
2913617ba13bSMingming Cao 		printk(KERN_ERR "EXT4-fs: invalid journal inode.\n");
2914ac27a0ecSDave Kleikamp 		iput(journal_inode);
2915ac27a0ecSDave Kleikamp 		return NULL;
2916ac27a0ecSDave Kleikamp 	}
2917ac27a0ecSDave Kleikamp 
2918dab291afSMingming Cao 	journal = jbd2_journal_init_inode(journal_inode);
2919ac27a0ecSDave Kleikamp 	if (!journal) {
2920617ba13bSMingming Cao 		printk(KERN_ERR "EXT4-fs: Could not load journal inode\n");
2921ac27a0ecSDave Kleikamp 		iput(journal_inode);
2922ac27a0ecSDave Kleikamp 		return NULL;
2923ac27a0ecSDave Kleikamp 	}
2924ac27a0ecSDave Kleikamp 	journal->j_private = sb;
2925617ba13bSMingming Cao 	ext4_init_journal_params(sb, journal);
2926ac27a0ecSDave Kleikamp 	return journal;
2927ac27a0ecSDave Kleikamp }
2928ac27a0ecSDave Kleikamp 
2929617ba13bSMingming Cao static journal_t *ext4_get_dev_journal(struct super_block *sb,
2930ac27a0ecSDave Kleikamp 				       dev_t j_dev)
2931ac27a0ecSDave Kleikamp {
2932ac27a0ecSDave Kleikamp 	struct buffer_head *bh;
2933ac27a0ecSDave Kleikamp 	journal_t *journal;
2934617ba13bSMingming Cao 	ext4_fsblk_t start;
2935617ba13bSMingming Cao 	ext4_fsblk_t len;
2936ac27a0ecSDave Kleikamp 	int hblock, blocksize;
2937617ba13bSMingming Cao 	ext4_fsblk_t sb_block;
2938ac27a0ecSDave Kleikamp 	unsigned long offset;
2939617ba13bSMingming Cao 	struct ext4_super_block *es;
2940ac27a0ecSDave Kleikamp 	struct block_device *bdev;
2941ac27a0ecSDave Kleikamp 
29420390131bSFrank Mayhar 	BUG_ON(!EXT4_HAS_COMPAT_FEATURE(sb, EXT4_FEATURE_COMPAT_HAS_JOURNAL));
29430390131bSFrank Mayhar 
2944617ba13bSMingming Cao 	bdev = ext4_blkdev_get(j_dev);
2945ac27a0ecSDave Kleikamp 	if (bdev == NULL)
2946ac27a0ecSDave Kleikamp 		return NULL;
2947ac27a0ecSDave Kleikamp 
2948ac27a0ecSDave Kleikamp 	if (bd_claim(bdev, sb)) {
2949ac27a0ecSDave Kleikamp 		printk(KERN_ERR
2950abda1418STheodore Ts'o 			"EXT4-fs: failed to claim external journal device.\n");
29519a1c3542SAl Viro 		blkdev_put(bdev, FMODE_READ|FMODE_WRITE);
2952ac27a0ecSDave Kleikamp 		return NULL;
2953ac27a0ecSDave Kleikamp 	}
2954ac27a0ecSDave Kleikamp 
2955ac27a0ecSDave Kleikamp 	blocksize = sb->s_blocksize;
2956ac27a0ecSDave Kleikamp 	hblock = bdev_hardsect_size(bdev);
2957ac27a0ecSDave Kleikamp 	if (blocksize < hblock) {
2958ac27a0ecSDave Kleikamp 		printk(KERN_ERR
2959617ba13bSMingming Cao 			"EXT4-fs: blocksize too small for journal device.\n");
2960ac27a0ecSDave Kleikamp 		goto out_bdev;
2961ac27a0ecSDave Kleikamp 	}
2962ac27a0ecSDave Kleikamp 
2963617ba13bSMingming Cao 	sb_block = EXT4_MIN_BLOCK_SIZE / blocksize;
2964617ba13bSMingming Cao 	offset = EXT4_MIN_BLOCK_SIZE % blocksize;
2965ac27a0ecSDave Kleikamp 	set_blocksize(bdev, blocksize);
2966ac27a0ecSDave Kleikamp 	if (!(bh = __bread(bdev, sb_block, blocksize))) {
2967617ba13bSMingming Cao 		printk(KERN_ERR "EXT4-fs: couldn't read superblock of "
2968ac27a0ecSDave Kleikamp 		       "external journal\n");
2969ac27a0ecSDave Kleikamp 		goto out_bdev;
2970ac27a0ecSDave Kleikamp 	}
2971ac27a0ecSDave Kleikamp 
2972617ba13bSMingming Cao 	es = (struct ext4_super_block *) (((char *)bh->b_data) + offset);
2973617ba13bSMingming Cao 	if ((le16_to_cpu(es->s_magic) != EXT4_SUPER_MAGIC) ||
2974ac27a0ecSDave Kleikamp 	    !(le32_to_cpu(es->s_feature_incompat) &
2975617ba13bSMingming Cao 	      EXT4_FEATURE_INCOMPAT_JOURNAL_DEV)) {
2976617ba13bSMingming Cao 		printk(KERN_ERR "EXT4-fs: external journal has "
2977ac27a0ecSDave Kleikamp 					"bad superblock\n");
2978ac27a0ecSDave Kleikamp 		brelse(bh);
2979ac27a0ecSDave Kleikamp 		goto out_bdev;
2980ac27a0ecSDave Kleikamp 	}
2981ac27a0ecSDave Kleikamp 
2982617ba13bSMingming Cao 	if (memcmp(EXT4_SB(sb)->s_es->s_journal_uuid, es->s_uuid, 16)) {
2983617ba13bSMingming Cao 		printk(KERN_ERR "EXT4-fs: journal UUID does not match\n");
2984ac27a0ecSDave Kleikamp 		brelse(bh);
2985ac27a0ecSDave Kleikamp 		goto out_bdev;
2986ac27a0ecSDave Kleikamp 	}
2987ac27a0ecSDave Kleikamp 
2988bd81d8eeSLaurent Vivier 	len = ext4_blocks_count(es);
2989ac27a0ecSDave Kleikamp 	start = sb_block + 1;
2990ac27a0ecSDave Kleikamp 	brelse(bh);	/* we're done with the superblock */
2991ac27a0ecSDave Kleikamp 
2992dab291afSMingming Cao 	journal = jbd2_journal_init_dev(bdev, sb->s_bdev,
2993ac27a0ecSDave Kleikamp 					start, len, blocksize);
2994ac27a0ecSDave Kleikamp 	if (!journal) {
2995617ba13bSMingming Cao 		printk(KERN_ERR "EXT4-fs: failed to create device journal\n");
2996ac27a0ecSDave Kleikamp 		goto out_bdev;
2997ac27a0ecSDave Kleikamp 	}
2998ac27a0ecSDave Kleikamp 	journal->j_private = sb;
2999ac27a0ecSDave Kleikamp 	ll_rw_block(READ, 1, &journal->j_sb_buffer);
3000ac27a0ecSDave Kleikamp 	wait_on_buffer(journal->j_sb_buffer);
3001ac27a0ecSDave Kleikamp 	if (!buffer_uptodate(journal->j_sb_buffer)) {
3002617ba13bSMingming Cao 		printk(KERN_ERR "EXT4-fs: I/O error on journal device\n");
3003ac27a0ecSDave Kleikamp 		goto out_journal;
3004ac27a0ecSDave Kleikamp 	}
3005ac27a0ecSDave Kleikamp 	if (be32_to_cpu(journal->j_superblock->s_nr_users) != 1) {
3006617ba13bSMingming Cao 		printk(KERN_ERR "EXT4-fs: External journal has more than one "
3007ac27a0ecSDave Kleikamp 					"user (unsupported) - %d\n",
3008ac27a0ecSDave Kleikamp 			be32_to_cpu(journal->j_superblock->s_nr_users));
3009ac27a0ecSDave Kleikamp 		goto out_journal;
3010ac27a0ecSDave Kleikamp 	}
3011617ba13bSMingming Cao 	EXT4_SB(sb)->journal_bdev = bdev;
3012617ba13bSMingming Cao 	ext4_init_journal_params(sb, journal);
3013ac27a0ecSDave Kleikamp 	return journal;
3014ac27a0ecSDave Kleikamp out_journal:
3015dab291afSMingming Cao 	jbd2_journal_destroy(journal);
3016ac27a0ecSDave Kleikamp out_bdev:
3017617ba13bSMingming Cao 	ext4_blkdev_put(bdev);
3018ac27a0ecSDave Kleikamp 	return NULL;
3019ac27a0ecSDave Kleikamp }
3020ac27a0ecSDave Kleikamp 
3021617ba13bSMingming Cao static int ext4_load_journal(struct super_block *sb,
3022617ba13bSMingming Cao 			     struct ext4_super_block *es,
3023ac27a0ecSDave Kleikamp 			     unsigned long journal_devnum)
3024ac27a0ecSDave Kleikamp {
3025ac27a0ecSDave Kleikamp 	journal_t *journal;
3026ac27a0ecSDave Kleikamp 	unsigned int journal_inum = le32_to_cpu(es->s_journal_inum);
3027ac27a0ecSDave Kleikamp 	dev_t journal_dev;
3028ac27a0ecSDave Kleikamp 	int err = 0;
3029ac27a0ecSDave Kleikamp 	int really_read_only;
3030ac27a0ecSDave Kleikamp 
30310390131bSFrank Mayhar 	BUG_ON(!EXT4_HAS_COMPAT_FEATURE(sb, EXT4_FEATURE_COMPAT_HAS_JOURNAL));
30320390131bSFrank Mayhar 
3033ac27a0ecSDave Kleikamp 	if (journal_devnum &&
3034ac27a0ecSDave Kleikamp 	    journal_devnum != le32_to_cpu(es->s_journal_dev)) {
3035617ba13bSMingming Cao 		printk(KERN_INFO "EXT4-fs: external journal device major/minor "
3036ac27a0ecSDave Kleikamp 			"numbers have changed\n");
3037ac27a0ecSDave Kleikamp 		journal_dev = new_decode_dev(journal_devnum);
3038ac27a0ecSDave Kleikamp 	} else
3039ac27a0ecSDave Kleikamp 		journal_dev = new_decode_dev(le32_to_cpu(es->s_journal_dev));
3040ac27a0ecSDave Kleikamp 
3041ac27a0ecSDave Kleikamp 	really_read_only = bdev_read_only(sb->s_bdev);
3042ac27a0ecSDave Kleikamp 
3043ac27a0ecSDave Kleikamp 	/*
3044ac27a0ecSDave Kleikamp 	 * Are we loading a blank journal or performing recovery after a
3045ac27a0ecSDave Kleikamp 	 * crash?  For recovery, we need to check in advance whether we
3046ac27a0ecSDave Kleikamp 	 * can get read-write access to the device.
3047ac27a0ecSDave Kleikamp 	 */
3048ac27a0ecSDave Kleikamp 
3049617ba13bSMingming Cao 	if (EXT4_HAS_INCOMPAT_FEATURE(sb, EXT4_FEATURE_INCOMPAT_RECOVER)) {
3050ac27a0ecSDave Kleikamp 		if (sb->s_flags & MS_RDONLY) {
3051617ba13bSMingming Cao 			printk(KERN_INFO "EXT4-fs: INFO: recovery "
3052ac27a0ecSDave Kleikamp 					"required on readonly filesystem.\n");
3053ac27a0ecSDave Kleikamp 			if (really_read_only) {
3054617ba13bSMingming Cao 				printk(KERN_ERR "EXT4-fs: write access "
3055ac27a0ecSDave Kleikamp 					"unavailable, cannot proceed.\n");
3056ac27a0ecSDave Kleikamp 				return -EROFS;
3057ac27a0ecSDave Kleikamp 			}
3058617ba13bSMingming Cao 			printk(KERN_INFO "EXT4-fs: write access will "
3059ac27a0ecSDave Kleikamp 			       "be enabled during recovery.\n");
3060ac27a0ecSDave Kleikamp 		}
3061ac27a0ecSDave Kleikamp 	}
3062ac27a0ecSDave Kleikamp 
3063ac27a0ecSDave Kleikamp 	if (journal_inum && journal_dev) {
3064617ba13bSMingming Cao 		printk(KERN_ERR "EXT4-fs: filesystem has both journal "
3065ac27a0ecSDave Kleikamp 		       "and inode journals!\n");
3066ac27a0ecSDave Kleikamp 		return -EINVAL;
3067ac27a0ecSDave Kleikamp 	}
3068ac27a0ecSDave Kleikamp 
3069ac27a0ecSDave Kleikamp 	if (journal_inum) {
3070617ba13bSMingming Cao 		if (!(journal = ext4_get_journal(sb, journal_inum)))
3071ac27a0ecSDave Kleikamp 			return -EINVAL;
3072ac27a0ecSDave Kleikamp 	} else {
3073617ba13bSMingming Cao 		if (!(journal = ext4_get_dev_journal(sb, journal_dev)))
3074ac27a0ecSDave Kleikamp 			return -EINVAL;
3075ac27a0ecSDave Kleikamp 	}
3076ac27a0ecSDave Kleikamp 
30774776004fSTheodore Ts'o 	if (journal->j_flags & JBD2_BARRIER)
30784776004fSTheodore Ts'o 		printk(KERN_INFO "EXT4-fs: barriers enabled\n");
30794776004fSTheodore Ts'o 	else
30804776004fSTheodore Ts'o 		printk(KERN_INFO "EXT4-fs: barriers disabled\n");
30814776004fSTheodore Ts'o 
3082ac27a0ecSDave Kleikamp 	if (!really_read_only && test_opt(sb, UPDATE_JOURNAL)) {
3083dab291afSMingming Cao 		err = jbd2_journal_update_format(journal);
3084ac27a0ecSDave Kleikamp 		if (err)  {
3085617ba13bSMingming Cao 			printk(KERN_ERR "EXT4-fs: error updating journal.\n");
3086dab291afSMingming Cao 			jbd2_journal_destroy(journal);
3087ac27a0ecSDave Kleikamp 			return err;
3088ac27a0ecSDave Kleikamp 		}
3089ac27a0ecSDave Kleikamp 	}
3090ac27a0ecSDave Kleikamp 
3091617ba13bSMingming Cao 	if (!EXT4_HAS_INCOMPAT_FEATURE(sb, EXT4_FEATURE_INCOMPAT_RECOVER))
3092dab291afSMingming Cao 		err = jbd2_journal_wipe(journal, !really_read_only);
3093ac27a0ecSDave Kleikamp 	if (!err)
3094dab291afSMingming Cao 		err = jbd2_journal_load(journal);
3095ac27a0ecSDave Kleikamp 
3096ac27a0ecSDave Kleikamp 	if (err) {
3097617ba13bSMingming Cao 		printk(KERN_ERR "EXT4-fs: error loading journal.\n");
3098dab291afSMingming Cao 		jbd2_journal_destroy(journal);
3099ac27a0ecSDave Kleikamp 		return err;
3100ac27a0ecSDave Kleikamp 	}
3101ac27a0ecSDave Kleikamp 
3102617ba13bSMingming Cao 	EXT4_SB(sb)->s_journal = journal;
3103617ba13bSMingming Cao 	ext4_clear_journal_err(sb, es);
3104ac27a0ecSDave Kleikamp 
3105ac27a0ecSDave Kleikamp 	if (journal_devnum &&
3106ac27a0ecSDave Kleikamp 	    journal_devnum != le32_to_cpu(es->s_journal_dev)) {
3107ac27a0ecSDave Kleikamp 		es->s_journal_dev = cpu_to_le32(journal_devnum);
3108ac27a0ecSDave Kleikamp 		sb->s_dirt = 1;
3109ac27a0ecSDave Kleikamp 
3110ac27a0ecSDave Kleikamp 		/* Make sure we flush the recovery flag to disk. */
3111617ba13bSMingming Cao 		ext4_commit_super(sb, es, 1);
3112ac27a0ecSDave Kleikamp 	}
3113ac27a0ecSDave Kleikamp 
3114ac27a0ecSDave Kleikamp 	return 0;
3115ac27a0ecSDave Kleikamp }
3116ac27a0ecSDave Kleikamp 
3117c4be0c1dSTakashi Sato static int ext4_commit_super(struct super_block *sb,
31182b2d6d01STheodore Ts'o 			      struct ext4_super_block *es, int sync)
3119ac27a0ecSDave Kleikamp {
3120617ba13bSMingming Cao 	struct buffer_head *sbh = EXT4_SB(sb)->s_sbh;
3121c4be0c1dSTakashi Sato 	int error = 0;
3122ac27a0ecSDave Kleikamp 
3123ac27a0ecSDave Kleikamp 	if (!sbh)
3124c4be0c1dSTakashi Sato 		return error;
3125914258bfSTheodore Ts'o 	if (buffer_write_io_error(sbh)) {
3126914258bfSTheodore Ts'o 		/*
3127914258bfSTheodore Ts'o 		 * Oh, dear.  A previous attempt to write the
3128914258bfSTheodore Ts'o 		 * superblock failed.  This could happen because the
3129914258bfSTheodore Ts'o 		 * USB device was yanked out.  Or it could happen to
3130914258bfSTheodore Ts'o 		 * be a transient write error and maybe the block will
3131914258bfSTheodore Ts'o 		 * be remapped.  Nothing we can do but to retry the
3132914258bfSTheodore Ts'o 		 * write and hope for the best.
3133914258bfSTheodore Ts'o 		 */
3134abda1418STheodore Ts'o 		printk(KERN_ERR "EXT4-fs: previous I/O error to "
3135914258bfSTheodore Ts'o 		       "superblock detected for %s.\n", sb->s_id);
3136914258bfSTheodore Ts'o 		clear_buffer_write_io_error(sbh);
3137914258bfSTheodore Ts'o 		set_buffer_uptodate(sbh);
3138914258bfSTheodore Ts'o 	}
3139ac27a0ecSDave Kleikamp 	es->s_wtime = cpu_to_le32(get_seconds());
3140afc32f7eSTheodore Ts'o 	es->s_kbytes_written =
3141afc32f7eSTheodore Ts'o 		cpu_to_le64(EXT4_SB(sb)->s_kbytes_written +
3142afc32f7eSTheodore Ts'o 			    ((part_stat_read(sb->s_bdev->bd_part, sectors[1]) -
3143afc32f7eSTheodore Ts'o 			      EXT4_SB(sb)->s_sectors_written_start) >> 1));
31445d1b1b3fSAneesh Kumar K.V 	ext4_free_blocks_count_set(es, percpu_counter_sum_positive(
31455d1b1b3fSAneesh Kumar K.V 					&EXT4_SB(sb)->s_freeblocks_counter));
31465d1b1b3fSAneesh Kumar K.V 	es->s_free_inodes_count = cpu_to_le32(percpu_counter_sum_positive(
31475d1b1b3fSAneesh Kumar K.V 					&EXT4_SB(sb)->s_freeinodes_counter));
31485d1b1b3fSAneesh Kumar K.V 
3149ac27a0ecSDave Kleikamp 	BUFFER_TRACE(sbh, "marking dirty");
3150ac27a0ecSDave Kleikamp 	mark_buffer_dirty(sbh);
3151914258bfSTheodore Ts'o 	if (sync) {
3152c4be0c1dSTakashi Sato 		error = sync_dirty_buffer(sbh);
3153c4be0c1dSTakashi Sato 		if (error)
3154c4be0c1dSTakashi Sato 			return error;
3155c4be0c1dSTakashi Sato 
3156c4be0c1dSTakashi Sato 		error = buffer_write_io_error(sbh);
3157c4be0c1dSTakashi Sato 		if (error) {
3158abda1418STheodore Ts'o 			printk(KERN_ERR "EXT4-fs: I/O error while writing "
3159914258bfSTheodore Ts'o 			       "superblock for %s.\n", sb->s_id);
3160914258bfSTheodore Ts'o 			clear_buffer_write_io_error(sbh);
3161914258bfSTheodore Ts'o 			set_buffer_uptodate(sbh);
3162914258bfSTheodore Ts'o 		}
3163914258bfSTheodore Ts'o 	}
3164c4be0c1dSTakashi Sato 	return error;
3165ac27a0ecSDave Kleikamp }
3166ac27a0ecSDave Kleikamp 
3167ac27a0ecSDave Kleikamp 
3168ac27a0ecSDave Kleikamp /*
3169ac27a0ecSDave Kleikamp  * Have we just finished recovery?  If so, and if we are mounting (or
3170ac27a0ecSDave Kleikamp  * remounting) the filesystem readonly, then we will end up with a
3171ac27a0ecSDave Kleikamp  * consistent fs on disk.  Record that fact.
3172ac27a0ecSDave Kleikamp  */
3173617ba13bSMingming Cao static void ext4_mark_recovery_complete(struct super_block *sb,
3174617ba13bSMingming Cao 					struct ext4_super_block *es)
3175ac27a0ecSDave Kleikamp {
3176617ba13bSMingming Cao 	journal_t *journal = EXT4_SB(sb)->s_journal;
3177ac27a0ecSDave Kleikamp 
31780390131bSFrank Mayhar 	if (!EXT4_HAS_COMPAT_FEATURE(sb, EXT4_FEATURE_COMPAT_HAS_JOURNAL)) {
31790390131bSFrank Mayhar 		BUG_ON(journal != NULL);
31800390131bSFrank Mayhar 		return;
31810390131bSFrank Mayhar 	}
3182dab291afSMingming Cao 	jbd2_journal_lock_updates(journal);
31837ffe1ea8SHidehiro Kawai 	if (jbd2_journal_flush(journal) < 0)
31847ffe1ea8SHidehiro Kawai 		goto out;
31857ffe1ea8SHidehiro Kawai 
318632c37730SJan Kara 	lock_super(sb);
3187617ba13bSMingming Cao 	if (EXT4_HAS_INCOMPAT_FEATURE(sb, EXT4_FEATURE_INCOMPAT_RECOVER) &&
3188ac27a0ecSDave Kleikamp 	    sb->s_flags & MS_RDONLY) {
3189617ba13bSMingming Cao 		EXT4_CLEAR_INCOMPAT_FEATURE(sb, EXT4_FEATURE_INCOMPAT_RECOVER);
3190ac27a0ecSDave Kleikamp 		sb->s_dirt = 0;
3191617ba13bSMingming Cao 		ext4_commit_super(sb, es, 1);
3192ac27a0ecSDave Kleikamp 	}
319332c37730SJan Kara 	unlock_super(sb);
31947ffe1ea8SHidehiro Kawai 
31957ffe1ea8SHidehiro Kawai out:
3196dab291afSMingming Cao 	jbd2_journal_unlock_updates(journal);
3197ac27a0ecSDave Kleikamp }
3198ac27a0ecSDave Kleikamp 
3199ac27a0ecSDave Kleikamp /*
3200ac27a0ecSDave Kleikamp  * If we are mounting (or read-write remounting) a filesystem whose journal
3201ac27a0ecSDave Kleikamp  * has recorded an error from a previous lifetime, move that error to the
3202ac27a0ecSDave Kleikamp  * main filesystem now.
3203ac27a0ecSDave Kleikamp  */
3204617ba13bSMingming Cao static void ext4_clear_journal_err(struct super_block *sb,
3205617ba13bSMingming Cao 				   struct ext4_super_block *es)
3206ac27a0ecSDave Kleikamp {
3207ac27a0ecSDave Kleikamp 	journal_t *journal;
3208ac27a0ecSDave Kleikamp 	int j_errno;
3209ac27a0ecSDave Kleikamp 	const char *errstr;
3210ac27a0ecSDave Kleikamp 
32110390131bSFrank Mayhar 	BUG_ON(!EXT4_HAS_COMPAT_FEATURE(sb, EXT4_FEATURE_COMPAT_HAS_JOURNAL));
32120390131bSFrank Mayhar 
3213617ba13bSMingming Cao 	journal = EXT4_SB(sb)->s_journal;
3214ac27a0ecSDave Kleikamp 
3215ac27a0ecSDave Kleikamp 	/*
3216ac27a0ecSDave Kleikamp 	 * Now check for any error status which may have been recorded in the
3217617ba13bSMingming Cao 	 * journal by a prior ext4_error() or ext4_abort()
3218ac27a0ecSDave Kleikamp 	 */
3219ac27a0ecSDave Kleikamp 
3220dab291afSMingming Cao 	j_errno = jbd2_journal_errno(journal);
3221ac27a0ecSDave Kleikamp 	if (j_errno) {
3222ac27a0ecSDave Kleikamp 		char nbuf[16];
3223ac27a0ecSDave Kleikamp 
3224617ba13bSMingming Cao 		errstr = ext4_decode_error(sb, j_errno, nbuf);
322546e665e9SHarvey Harrison 		ext4_warning(sb, __func__, "Filesystem error recorded "
3226ac27a0ecSDave Kleikamp 			     "from previous mount: %s", errstr);
322746e665e9SHarvey Harrison 		ext4_warning(sb, __func__, "Marking fs in need of "
3228ac27a0ecSDave Kleikamp 			     "filesystem check.");
3229ac27a0ecSDave Kleikamp 
3230617ba13bSMingming Cao 		EXT4_SB(sb)->s_mount_state |= EXT4_ERROR_FS;
3231617ba13bSMingming Cao 		es->s_state |= cpu_to_le16(EXT4_ERROR_FS);
3232617ba13bSMingming Cao 		ext4_commit_super(sb, es, 1);
3233ac27a0ecSDave Kleikamp 
3234dab291afSMingming Cao 		jbd2_journal_clear_err(journal);
3235ac27a0ecSDave Kleikamp 	}
3236ac27a0ecSDave Kleikamp }
3237ac27a0ecSDave Kleikamp 
3238ac27a0ecSDave Kleikamp /*
3239ac27a0ecSDave Kleikamp  * Force the running and committing transactions to commit,
3240ac27a0ecSDave Kleikamp  * and wait on the commit.
3241ac27a0ecSDave Kleikamp  */
3242617ba13bSMingming Cao int ext4_force_commit(struct super_block *sb)
3243ac27a0ecSDave Kleikamp {
3244ac27a0ecSDave Kleikamp 	journal_t *journal;
32450390131bSFrank Mayhar 	int ret = 0;
3246ac27a0ecSDave Kleikamp 
3247ac27a0ecSDave Kleikamp 	if (sb->s_flags & MS_RDONLY)
3248ac27a0ecSDave Kleikamp 		return 0;
3249ac27a0ecSDave Kleikamp 
3250617ba13bSMingming Cao 	journal = EXT4_SB(sb)->s_journal;
32510390131bSFrank Mayhar 	if (journal) {
3252ac27a0ecSDave Kleikamp 		sb->s_dirt = 0;
3253617ba13bSMingming Cao 		ret = ext4_journal_force_commit(journal);
32540390131bSFrank Mayhar 	}
32550390131bSFrank Mayhar 
3256ac27a0ecSDave Kleikamp 	return ret;
3257ac27a0ecSDave Kleikamp }
3258ac27a0ecSDave Kleikamp 
3259ac27a0ecSDave Kleikamp /*
3260617ba13bSMingming Cao  * Ext4 always journals updates to the superblock itself, so we don't
3261ac27a0ecSDave Kleikamp  * have to propagate any other updates to the superblock on disk at this
326214ce0cb4STheodore Ts'o  * point.  (We can probably nuke this function altogether, and remove
326314ce0cb4STheodore Ts'o  * any mention to sb->s_dirt in all of fs/ext4; eventual cleanup...)
3264ac27a0ecSDave Kleikamp  */
3265617ba13bSMingming Cao static void ext4_write_super(struct super_block *sb)
3266ac27a0ecSDave Kleikamp {
32670390131bSFrank Mayhar 	if (EXT4_SB(sb)->s_journal) {
3268ac27a0ecSDave Kleikamp 		if (mutex_trylock(&sb->s_lock) != 0)
3269ac27a0ecSDave Kleikamp 			BUG();
3270ac27a0ecSDave Kleikamp 		sb->s_dirt = 0;
32710390131bSFrank Mayhar 	} else {
32720390131bSFrank Mayhar 		ext4_commit_super(sb, EXT4_SB(sb)->s_es, 1);
32730390131bSFrank Mayhar 	}
3274ac27a0ecSDave Kleikamp }
3275ac27a0ecSDave Kleikamp 
3276617ba13bSMingming Cao static int ext4_sync_fs(struct super_block *sb, int wait)
3277ac27a0ecSDave Kleikamp {
327814ce0cb4STheodore Ts'o 	int ret = 0;
32799eddacf9SJan Kara 	tid_t target;
3280ac27a0ecSDave Kleikamp 
3281ede86cc4STheodore Ts'o 	trace_mark(ext4_sync_fs, "dev %s wait %d", sb->s_id, wait);
3282ac27a0ecSDave Kleikamp 	sb->s_dirt = 0;
32830390131bSFrank Mayhar 	if (EXT4_SB(sb)->s_journal) {
32849eddacf9SJan Kara 		if (jbd2_journal_start_commit(EXT4_SB(sb)->s_journal,
32859eddacf9SJan Kara 					      &target)) {
3286ac27a0ecSDave Kleikamp 			if (wait)
32879eddacf9SJan Kara 				jbd2_log_wait_commit(EXT4_SB(sb)->s_journal,
32889eddacf9SJan Kara 						     target);
32899eddacf9SJan Kara 		}
32900390131bSFrank Mayhar 	} else {
32910390131bSFrank Mayhar 		ext4_commit_super(sb, EXT4_SB(sb)->s_es, wait);
32920390131bSFrank Mayhar 	}
329314ce0cb4STheodore Ts'o 	return ret;
3294ac27a0ecSDave Kleikamp }
3295ac27a0ecSDave Kleikamp 
3296ac27a0ecSDave Kleikamp /*
3297ac27a0ecSDave Kleikamp  * LVM calls this function before a (read-only) snapshot is created.  This
3298ac27a0ecSDave Kleikamp  * gives us a chance to flush the journal completely and mark the fs clean.
3299ac27a0ecSDave Kleikamp  */
3300c4be0c1dSTakashi Sato static int ext4_freeze(struct super_block *sb)
3301ac27a0ecSDave Kleikamp {
3302c4be0c1dSTakashi Sato 	int error = 0;
3303c4be0c1dSTakashi Sato 	journal_t *journal;
3304ac27a0ecSDave Kleikamp 	sb->s_dirt = 0;
3305ac27a0ecSDave Kleikamp 
3306ac27a0ecSDave Kleikamp 	if (!(sb->s_flags & MS_RDONLY)) {
3307c4be0c1dSTakashi Sato 		journal = EXT4_SB(sb)->s_journal;
3308ac27a0ecSDave Kleikamp 
33090390131bSFrank Mayhar 		if (journal) {
3310ac27a0ecSDave Kleikamp 			/* Now we set up the journal barrier. */
3311dab291afSMingming Cao 			jbd2_journal_lock_updates(journal);
33127ffe1ea8SHidehiro Kawai 
33137ffe1ea8SHidehiro Kawai 			/*
33140390131bSFrank Mayhar 			 * We don't want to clear needs_recovery flag when we
33150390131bSFrank Mayhar 			 * failed to flush the journal.
33167ffe1ea8SHidehiro Kawai 			 */
3317c4be0c1dSTakashi Sato 			error = jbd2_journal_flush(journal);
3318c4be0c1dSTakashi Sato 			if (error < 0)
3319c4be0c1dSTakashi Sato 				goto out;
33200390131bSFrank Mayhar 		}
3321ac27a0ecSDave Kleikamp 
3322ac27a0ecSDave Kleikamp 		/* Journal blocked and flushed, clear needs_recovery flag. */
3323617ba13bSMingming Cao 		EXT4_CLEAR_INCOMPAT_FEATURE(sb, EXT4_FEATURE_INCOMPAT_RECOVER);
3324c4be0c1dSTakashi Sato 		error = ext4_commit_super(sb, EXT4_SB(sb)->s_es, 1);
3325c4be0c1dSTakashi Sato 		if (error)
3326c4be0c1dSTakashi Sato 			goto out;
3327ac27a0ecSDave Kleikamp 	}
3328c4be0c1dSTakashi Sato 	return 0;
3329c4be0c1dSTakashi Sato out:
3330c4be0c1dSTakashi Sato 	jbd2_journal_unlock_updates(journal);
3331c4be0c1dSTakashi Sato 	return error;
3332ac27a0ecSDave Kleikamp }
3333ac27a0ecSDave Kleikamp 
3334ac27a0ecSDave Kleikamp /*
3335ac27a0ecSDave Kleikamp  * Called by LVM after the snapshot is done.  We need to reset the RECOVER
3336ac27a0ecSDave Kleikamp  * flag here, even though the filesystem is not technically dirty yet.
3337ac27a0ecSDave Kleikamp  */
3338c4be0c1dSTakashi Sato static int ext4_unfreeze(struct super_block *sb)
3339ac27a0ecSDave Kleikamp {
33400390131bSFrank Mayhar 	if (EXT4_SB(sb)->s_journal && !(sb->s_flags & MS_RDONLY)) {
3341ac27a0ecSDave Kleikamp 		lock_super(sb);
3342ac27a0ecSDave Kleikamp 		/* Reser the needs_recovery flag before the fs is unlocked. */
3343617ba13bSMingming Cao 		EXT4_SET_INCOMPAT_FEATURE(sb, EXT4_FEATURE_INCOMPAT_RECOVER);
3344617ba13bSMingming Cao 		ext4_commit_super(sb, EXT4_SB(sb)->s_es, 1);
3345ac27a0ecSDave Kleikamp 		unlock_super(sb);
3346dab291afSMingming Cao 		jbd2_journal_unlock_updates(EXT4_SB(sb)->s_journal);
3347ac27a0ecSDave Kleikamp 	}
3348c4be0c1dSTakashi Sato 	return 0;
3349ac27a0ecSDave Kleikamp }
3350ac27a0ecSDave Kleikamp 
3351617ba13bSMingming Cao static int ext4_remount(struct super_block *sb, int *flags, char *data)
3352ac27a0ecSDave Kleikamp {
3353617ba13bSMingming Cao 	struct ext4_super_block *es;
3354617ba13bSMingming Cao 	struct ext4_sb_info *sbi = EXT4_SB(sb);
3355617ba13bSMingming Cao 	ext4_fsblk_t n_blocks_count = 0;
3356ac27a0ecSDave Kleikamp 	unsigned long old_sb_flags;
3357617ba13bSMingming Cao 	struct ext4_mount_options old_opts;
33588a266467STheodore Ts'o 	ext4_group_t g;
3359b3881f74STheodore Ts'o 	unsigned int journal_ioprio = DEFAULT_JOURNAL_IOPRIO;
3360ac27a0ecSDave Kleikamp 	int err;
3361ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
3362ac27a0ecSDave Kleikamp 	int i;
3363ac27a0ecSDave Kleikamp #endif
3364ac27a0ecSDave Kleikamp 
3365ac27a0ecSDave Kleikamp 	/* Store the original options */
3366ac27a0ecSDave Kleikamp 	old_sb_flags = sb->s_flags;
3367ac27a0ecSDave Kleikamp 	old_opts.s_mount_opt = sbi->s_mount_opt;
3368ac27a0ecSDave Kleikamp 	old_opts.s_resuid = sbi->s_resuid;
3369ac27a0ecSDave Kleikamp 	old_opts.s_resgid = sbi->s_resgid;
3370ac27a0ecSDave Kleikamp 	old_opts.s_commit_interval = sbi->s_commit_interval;
337130773840STheodore Ts'o 	old_opts.s_min_batch_time = sbi->s_min_batch_time;
337230773840STheodore Ts'o 	old_opts.s_max_batch_time = sbi->s_max_batch_time;
3373ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
3374ac27a0ecSDave Kleikamp 	old_opts.s_jquota_fmt = sbi->s_jquota_fmt;
3375ac27a0ecSDave Kleikamp 	for (i = 0; i < MAXQUOTAS; i++)
3376ac27a0ecSDave Kleikamp 		old_opts.s_qf_names[i] = sbi->s_qf_names[i];
3377ac27a0ecSDave Kleikamp #endif
3378b3881f74STheodore Ts'o 	if (sbi->s_journal && sbi->s_journal->j_task->io_context)
3379b3881f74STheodore Ts'o 		journal_ioprio = sbi->s_journal->j_task->io_context->ioprio;
3380ac27a0ecSDave Kleikamp 
3381ac27a0ecSDave Kleikamp 	/*
3382ac27a0ecSDave Kleikamp 	 * Allow the "check" option to be passed as a remount option.
3383ac27a0ecSDave Kleikamp 	 */
3384b3881f74STheodore Ts'o 	if (!parse_options(data, sb, NULL, &journal_ioprio,
3385b3881f74STheodore Ts'o 			   &n_blocks_count, 1)) {
3386ac27a0ecSDave Kleikamp 		err = -EINVAL;
3387ac27a0ecSDave Kleikamp 		goto restore_opts;
3388ac27a0ecSDave Kleikamp 	}
3389ac27a0ecSDave Kleikamp 
3390617ba13bSMingming Cao 	if (sbi->s_mount_opt & EXT4_MOUNT_ABORT)
339146e665e9SHarvey Harrison 		ext4_abort(sb, __func__, "Abort forced by user");
3392ac27a0ecSDave Kleikamp 
3393ac27a0ecSDave Kleikamp 	sb->s_flags = (sb->s_flags & ~MS_POSIXACL) |
3394617ba13bSMingming Cao 		((sbi->s_mount_opt & EXT4_MOUNT_POSIX_ACL) ? MS_POSIXACL : 0);
3395ac27a0ecSDave Kleikamp 
3396ac27a0ecSDave Kleikamp 	es = sbi->s_es;
3397ac27a0ecSDave Kleikamp 
3398b3881f74STheodore Ts'o 	if (sbi->s_journal) {
3399617ba13bSMingming Cao 		ext4_init_journal_params(sb, sbi->s_journal);
3400b3881f74STheodore Ts'o 		set_task_ioprio(sbi->s_journal->j_task, journal_ioprio);
3401b3881f74STheodore Ts'o 	}
3402ac27a0ecSDave Kleikamp 
3403ac27a0ecSDave Kleikamp 	if ((*flags & MS_RDONLY) != (sb->s_flags & MS_RDONLY) ||
3404bd81d8eeSLaurent Vivier 		n_blocks_count > ext4_blocks_count(es)) {
3405617ba13bSMingming Cao 		if (sbi->s_mount_opt & EXT4_MOUNT_ABORT) {
3406ac27a0ecSDave Kleikamp 			err = -EROFS;
3407ac27a0ecSDave Kleikamp 			goto restore_opts;
3408ac27a0ecSDave Kleikamp 		}
3409ac27a0ecSDave Kleikamp 
3410ac27a0ecSDave Kleikamp 		if (*flags & MS_RDONLY) {
3411ac27a0ecSDave Kleikamp 			/*
3412ac27a0ecSDave Kleikamp 			 * First of all, the unconditional stuff we have to do
3413ac27a0ecSDave Kleikamp 			 * to disable replay of the journal when we next remount
3414ac27a0ecSDave Kleikamp 			 */
3415ac27a0ecSDave Kleikamp 			sb->s_flags |= MS_RDONLY;
3416ac27a0ecSDave Kleikamp 
3417ac27a0ecSDave Kleikamp 			/*
3418ac27a0ecSDave Kleikamp 			 * OK, test if we are remounting a valid rw partition
3419ac27a0ecSDave Kleikamp 			 * readonly, and if so set the rdonly flag and then
3420ac27a0ecSDave Kleikamp 			 * mark the partition as valid again.
3421ac27a0ecSDave Kleikamp 			 */
3422617ba13bSMingming Cao 			if (!(es->s_state & cpu_to_le16(EXT4_VALID_FS)) &&
3423617ba13bSMingming Cao 			    (sbi->s_mount_state & EXT4_VALID_FS))
3424ac27a0ecSDave Kleikamp 				es->s_state = cpu_to_le16(sbi->s_mount_state);
3425ac27a0ecSDave Kleikamp 
342632c37730SJan Kara 			/*
342732c37730SJan Kara 			 * We have to unlock super so that we can wait for
342832c37730SJan Kara 			 * transactions.
342932c37730SJan Kara 			 */
34300390131bSFrank Mayhar 			if (sbi->s_journal) {
343132c37730SJan Kara 				unlock_super(sb);
3432617ba13bSMingming Cao 				ext4_mark_recovery_complete(sb, es);
343332c37730SJan Kara 				lock_super(sb);
34340390131bSFrank Mayhar 			}
3435ac27a0ecSDave Kleikamp 		} else {
34363a06d778SAneesh Kumar K.V 			int ret;
3437617ba13bSMingming Cao 			if ((ret = EXT4_HAS_RO_COMPAT_FEATURE(sb,
3438617ba13bSMingming Cao 					~EXT4_FEATURE_RO_COMPAT_SUPP))) {
3439617ba13bSMingming Cao 				printk(KERN_WARNING "EXT4-fs: %s: couldn't "
3440ac27a0ecSDave Kleikamp 				       "remount RDWR because of unsupported "
34413a06d778SAneesh Kumar K.V 				       "optional features (%x).\n", sb->s_id,
34423a06d778SAneesh Kumar K.V 				(le32_to_cpu(sbi->s_es->s_feature_ro_compat) &
34433a06d778SAneesh Kumar K.V 					~EXT4_FEATURE_RO_COMPAT_SUPP));
3444ac27a0ecSDave Kleikamp 				err = -EROFS;
3445ac27a0ecSDave Kleikamp 				goto restore_opts;
3446ac27a0ecSDave Kleikamp 			}
3447ead6596bSEric Sandeen 
3448ead6596bSEric Sandeen 			/*
34498a266467STheodore Ts'o 			 * Make sure the group descriptor checksums
34508a266467STheodore Ts'o 			 * are sane.  If they aren't, refuse to
34518a266467STheodore Ts'o 			 * remount r/w.
34528a266467STheodore Ts'o 			 */
34538a266467STheodore Ts'o 			for (g = 0; g < sbi->s_groups_count; g++) {
34548a266467STheodore Ts'o 				struct ext4_group_desc *gdp =
34558a266467STheodore Ts'o 					ext4_get_group_desc(sb, g, NULL);
34568a266467STheodore Ts'o 
34578a266467STheodore Ts'o 				if (!ext4_group_desc_csum_verify(sbi, g, gdp)) {
34588a266467STheodore Ts'o 					printk(KERN_ERR
34598a266467STheodore Ts'o 	       "EXT4-fs: ext4_remount: "
3460a9df9a49STheodore Ts'o 		"Checksum for group %u failed (%u!=%u)\n",
34618a266467STheodore Ts'o 		g, le16_to_cpu(ext4_group_desc_csum(sbi, g, gdp)),
34628a266467STheodore Ts'o 					       le16_to_cpu(gdp->bg_checksum));
34638a266467STheodore Ts'o 					err = -EINVAL;
34648a266467STheodore Ts'o 					goto restore_opts;
34658a266467STheodore Ts'o 				}
34668a266467STheodore Ts'o 			}
34678a266467STheodore Ts'o 
34688a266467STheodore Ts'o 			/*
3469ead6596bSEric Sandeen 			 * If we have an unprocessed orphan list hanging
3470ead6596bSEric Sandeen 			 * around from a previously readonly bdev mount,
3471ead6596bSEric Sandeen 			 * require a full umount/remount for now.
3472ead6596bSEric Sandeen 			 */
3473ead6596bSEric Sandeen 			if (es->s_last_orphan) {
3474ead6596bSEric Sandeen 				printk(KERN_WARNING "EXT4-fs: %s: couldn't "
3475ead6596bSEric Sandeen 				       "remount RDWR because of unprocessed "
3476ead6596bSEric Sandeen 				       "orphan inode list.  Please "
3477ead6596bSEric Sandeen 				       "umount/remount instead.\n",
3478ead6596bSEric Sandeen 				       sb->s_id);
3479ead6596bSEric Sandeen 				err = -EINVAL;
3480ead6596bSEric Sandeen 				goto restore_opts;
3481ead6596bSEric Sandeen 			}
3482ead6596bSEric Sandeen 
3483ac27a0ecSDave Kleikamp 			/*
3484ac27a0ecSDave Kleikamp 			 * Mounting a RDONLY partition read-write, so reread
3485ac27a0ecSDave Kleikamp 			 * and store the current valid flag.  (It may have
3486ac27a0ecSDave Kleikamp 			 * been changed by e2fsck since we originally mounted
3487ac27a0ecSDave Kleikamp 			 * the partition.)
3488ac27a0ecSDave Kleikamp 			 */
34890390131bSFrank Mayhar 			if (sbi->s_journal)
3490617ba13bSMingming Cao 				ext4_clear_journal_err(sb, es);
3491ac27a0ecSDave Kleikamp 			sbi->s_mount_state = le16_to_cpu(es->s_state);
3492617ba13bSMingming Cao 			if ((err = ext4_group_extend(sb, es, n_blocks_count)))
3493ac27a0ecSDave Kleikamp 				goto restore_opts;
3494617ba13bSMingming Cao 			if (!ext4_setup_super(sb, es, 0))
3495ac27a0ecSDave Kleikamp 				sb->s_flags &= ~MS_RDONLY;
3496ac27a0ecSDave Kleikamp 		}
3497ac27a0ecSDave Kleikamp 	}
34980390131bSFrank Mayhar 	if (sbi->s_journal == NULL)
34990390131bSFrank Mayhar 		ext4_commit_super(sb, es, 1);
35000390131bSFrank Mayhar 
3501ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
3502ac27a0ecSDave Kleikamp 	/* Release old quota file names */
3503ac27a0ecSDave Kleikamp 	for (i = 0; i < MAXQUOTAS; i++)
3504ac27a0ecSDave Kleikamp 		if (old_opts.s_qf_names[i] &&
3505ac27a0ecSDave Kleikamp 		    old_opts.s_qf_names[i] != sbi->s_qf_names[i])
3506ac27a0ecSDave Kleikamp 			kfree(old_opts.s_qf_names[i]);
3507ac27a0ecSDave Kleikamp #endif
3508ac27a0ecSDave Kleikamp 	return 0;
3509ac27a0ecSDave Kleikamp restore_opts:
3510ac27a0ecSDave Kleikamp 	sb->s_flags = old_sb_flags;
3511ac27a0ecSDave Kleikamp 	sbi->s_mount_opt = old_opts.s_mount_opt;
3512ac27a0ecSDave Kleikamp 	sbi->s_resuid = old_opts.s_resuid;
3513ac27a0ecSDave Kleikamp 	sbi->s_resgid = old_opts.s_resgid;
3514ac27a0ecSDave Kleikamp 	sbi->s_commit_interval = old_opts.s_commit_interval;
351530773840STheodore Ts'o 	sbi->s_min_batch_time = old_opts.s_min_batch_time;
351630773840STheodore Ts'o 	sbi->s_max_batch_time = old_opts.s_max_batch_time;
3517ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
3518ac27a0ecSDave Kleikamp 	sbi->s_jquota_fmt = old_opts.s_jquota_fmt;
3519ac27a0ecSDave Kleikamp 	for (i = 0; i < MAXQUOTAS; i++) {
3520ac27a0ecSDave Kleikamp 		if (sbi->s_qf_names[i] &&
3521ac27a0ecSDave Kleikamp 		    old_opts.s_qf_names[i] != sbi->s_qf_names[i])
3522ac27a0ecSDave Kleikamp 			kfree(sbi->s_qf_names[i]);
3523ac27a0ecSDave Kleikamp 		sbi->s_qf_names[i] = old_opts.s_qf_names[i];
3524ac27a0ecSDave Kleikamp 	}
3525ac27a0ecSDave Kleikamp #endif
3526ac27a0ecSDave Kleikamp 	return err;
3527ac27a0ecSDave Kleikamp }
3528ac27a0ecSDave Kleikamp 
3529617ba13bSMingming Cao static int ext4_statfs(struct dentry *dentry, struct kstatfs *buf)
3530ac27a0ecSDave Kleikamp {
3531ac27a0ecSDave Kleikamp 	struct super_block *sb = dentry->d_sb;
3532617ba13bSMingming Cao 	struct ext4_sb_info *sbi = EXT4_SB(sb);
3533617ba13bSMingming Cao 	struct ext4_super_block *es = sbi->s_es;
3534960cc398SPekka Enberg 	u64 fsid;
3535ac27a0ecSDave Kleikamp 
35365e70030dSBadari Pulavarty 	if (test_opt(sb, MINIX_DF)) {
35375e70030dSBadari Pulavarty 		sbi->s_overhead_last = 0;
35386bc9feffSAneesh Kumar K.V 	} else if (sbi->s_blocks_last != ext4_blocks_count(es)) {
3539fd2d4291SAvantika Mathur 		ext4_group_t ngroups = sbi->s_groups_count, i;
35405e70030dSBadari Pulavarty 		ext4_fsblk_t overhead = 0;
3541ac27a0ecSDave Kleikamp 		smp_rmb();
3542ac27a0ecSDave Kleikamp 
3543ac27a0ecSDave Kleikamp 		/*
35445e70030dSBadari Pulavarty 		 * Compute the overhead (FS structures).  This is constant
35455e70030dSBadari Pulavarty 		 * for a given filesystem unless the number of block groups
35465e70030dSBadari Pulavarty 		 * changes so we cache the previous value until it does.
3547ac27a0ecSDave Kleikamp 		 */
3548ac27a0ecSDave Kleikamp 
3549ac27a0ecSDave Kleikamp 		/*
3550ac27a0ecSDave Kleikamp 		 * All of the blocks before first_data_block are
3551ac27a0ecSDave Kleikamp 		 * overhead
3552ac27a0ecSDave Kleikamp 		 */
3553ac27a0ecSDave Kleikamp 		overhead = le32_to_cpu(es->s_first_data_block);
3554ac27a0ecSDave Kleikamp 
3555ac27a0ecSDave Kleikamp 		/*
3556ac27a0ecSDave Kleikamp 		 * Add the overhead attributed to the superblock and
3557ac27a0ecSDave Kleikamp 		 * block group descriptors.  If the sparse superblocks
3558ac27a0ecSDave Kleikamp 		 * feature is turned on, then not all groups have this.
3559ac27a0ecSDave Kleikamp 		 */
3560ac27a0ecSDave Kleikamp 		for (i = 0; i < ngroups; i++) {
3561617ba13bSMingming Cao 			overhead += ext4_bg_has_super(sb, i) +
3562617ba13bSMingming Cao 				ext4_bg_num_gdb(sb, i);
3563ac27a0ecSDave Kleikamp 			cond_resched();
3564ac27a0ecSDave Kleikamp 		}
3565ac27a0ecSDave Kleikamp 
3566ac27a0ecSDave Kleikamp 		/*
3567ac27a0ecSDave Kleikamp 		 * Every block group has an inode bitmap, a block
3568ac27a0ecSDave Kleikamp 		 * bitmap, and an inode table.
3569ac27a0ecSDave Kleikamp 		 */
35705e70030dSBadari Pulavarty 		overhead += ngroups * (2 + sbi->s_itb_per_group);
35715e70030dSBadari Pulavarty 		sbi->s_overhead_last = overhead;
35725e70030dSBadari Pulavarty 		smp_wmb();
35736bc9feffSAneesh Kumar K.V 		sbi->s_blocks_last = ext4_blocks_count(es);
3574ac27a0ecSDave Kleikamp 	}
3575ac27a0ecSDave Kleikamp 
3576617ba13bSMingming Cao 	buf->f_type = EXT4_SUPER_MAGIC;
3577ac27a0ecSDave Kleikamp 	buf->f_bsize = sb->s_blocksize;
35785e70030dSBadari Pulavarty 	buf->f_blocks = ext4_blocks_count(es) - sbi->s_overhead_last;
35796bc6e63fSAneesh Kumar K.V 	buf->f_bfree = percpu_counter_sum_positive(&sbi->s_freeblocks_counter) -
35806bc6e63fSAneesh Kumar K.V 		       percpu_counter_sum_positive(&sbi->s_dirtyblocks_counter);
3581308ba3ecSAneesh Kumar K.V 	ext4_free_blocks_count_set(es, buf->f_bfree);
3582bd81d8eeSLaurent Vivier 	buf->f_bavail = buf->f_bfree - ext4_r_blocks_count(es);
3583bd81d8eeSLaurent Vivier 	if (buf->f_bfree < ext4_r_blocks_count(es))
3584ac27a0ecSDave Kleikamp 		buf->f_bavail = 0;
3585ac27a0ecSDave Kleikamp 	buf->f_files = le32_to_cpu(es->s_inodes_count);
358652d9f3b4SPeter Zijlstra 	buf->f_ffree = percpu_counter_sum_positive(&sbi->s_freeinodes_counter);
35875e70030dSBadari Pulavarty 	es->s_free_inodes_count = cpu_to_le32(buf->f_ffree);
3588617ba13bSMingming Cao 	buf->f_namelen = EXT4_NAME_LEN;
3589960cc398SPekka Enberg 	fsid = le64_to_cpup((void *)es->s_uuid) ^
3590960cc398SPekka Enberg 	       le64_to_cpup((void *)es->s_uuid + sizeof(u64));
3591960cc398SPekka Enberg 	buf->f_fsid.val[0] = fsid & 0xFFFFFFFFUL;
3592960cc398SPekka Enberg 	buf->f_fsid.val[1] = (fsid >> 32) & 0xFFFFFFFFUL;
3593ac27a0ecSDave Kleikamp 	return 0;
3594ac27a0ecSDave Kleikamp }
3595ac27a0ecSDave Kleikamp 
/* Helper function for writing quotas on sync - we need to start transaction before quota file
 * is locked for write. Otherwise there are possible deadlocks:
 * Process 1                         Process 2
 * ext4_create()                     quota_sync()
 *   jbd2_journal_start()                  write_dquot()
 *   vfs_dq_init()                         down(dqio_mutex)
 *     down(dqio_mutex)                    jbd2_journal_start()
 *
 */
3605ac27a0ecSDave Kleikamp 
3606ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
3607ac27a0ecSDave Kleikamp 
3608ac27a0ecSDave Kleikamp static inline struct inode *dquot_to_inode(struct dquot *dquot)
3609ac27a0ecSDave Kleikamp {
3610ac27a0ecSDave Kleikamp 	return sb_dqopt(dquot->dq_sb)->files[dquot->dq_type];
3611ac27a0ecSDave Kleikamp }
3612ac27a0ecSDave Kleikamp 
3613617ba13bSMingming Cao static int ext4_write_dquot(struct dquot *dquot)
3614ac27a0ecSDave Kleikamp {
3615ac27a0ecSDave Kleikamp 	int ret, err;
3616ac27a0ecSDave Kleikamp 	handle_t *handle;
3617ac27a0ecSDave Kleikamp 	struct inode *inode;
3618ac27a0ecSDave Kleikamp 
3619ac27a0ecSDave Kleikamp 	inode = dquot_to_inode(dquot);
3620617ba13bSMingming Cao 	handle = ext4_journal_start(inode,
3621617ba13bSMingming Cao 					EXT4_QUOTA_TRANS_BLOCKS(dquot->dq_sb));
3622ac27a0ecSDave Kleikamp 	if (IS_ERR(handle))
3623ac27a0ecSDave Kleikamp 		return PTR_ERR(handle);
3624ac27a0ecSDave Kleikamp 	ret = dquot_commit(dquot);
3625617ba13bSMingming Cao 	err = ext4_journal_stop(handle);
3626ac27a0ecSDave Kleikamp 	if (!ret)
3627ac27a0ecSDave Kleikamp 		ret = err;
3628ac27a0ecSDave Kleikamp 	return ret;
3629ac27a0ecSDave Kleikamp }
3630ac27a0ecSDave Kleikamp 
3631617ba13bSMingming Cao static int ext4_acquire_dquot(struct dquot *dquot)
3632ac27a0ecSDave Kleikamp {
3633ac27a0ecSDave Kleikamp 	int ret, err;
3634ac27a0ecSDave Kleikamp 	handle_t *handle;
3635ac27a0ecSDave Kleikamp 
3636617ba13bSMingming Cao 	handle = ext4_journal_start(dquot_to_inode(dquot),
3637617ba13bSMingming Cao 					EXT4_QUOTA_INIT_BLOCKS(dquot->dq_sb));
3638ac27a0ecSDave Kleikamp 	if (IS_ERR(handle))
3639ac27a0ecSDave Kleikamp 		return PTR_ERR(handle);
3640ac27a0ecSDave Kleikamp 	ret = dquot_acquire(dquot);
3641617ba13bSMingming Cao 	err = ext4_journal_stop(handle);
3642ac27a0ecSDave Kleikamp 	if (!ret)
3643ac27a0ecSDave Kleikamp 		ret = err;
3644ac27a0ecSDave Kleikamp 	return ret;
3645ac27a0ecSDave Kleikamp }
3646ac27a0ecSDave Kleikamp 
3647617ba13bSMingming Cao static int ext4_release_dquot(struct dquot *dquot)
3648ac27a0ecSDave Kleikamp {
3649ac27a0ecSDave Kleikamp 	int ret, err;
3650ac27a0ecSDave Kleikamp 	handle_t *handle;
3651ac27a0ecSDave Kleikamp 
3652617ba13bSMingming Cao 	handle = ext4_journal_start(dquot_to_inode(dquot),
3653617ba13bSMingming Cao 					EXT4_QUOTA_DEL_BLOCKS(dquot->dq_sb));
36549c3013e9SJan Kara 	if (IS_ERR(handle)) {
36559c3013e9SJan Kara 		/* Release dquot anyway to avoid endless cycle in dqput() */
36569c3013e9SJan Kara 		dquot_release(dquot);
3657ac27a0ecSDave Kleikamp 		return PTR_ERR(handle);
36589c3013e9SJan Kara 	}
3659ac27a0ecSDave Kleikamp 	ret = dquot_release(dquot);
3660617ba13bSMingming Cao 	err = ext4_journal_stop(handle);
3661ac27a0ecSDave Kleikamp 	if (!ret)
3662ac27a0ecSDave Kleikamp 		ret = err;
3663ac27a0ecSDave Kleikamp 	return ret;
3664ac27a0ecSDave Kleikamp }
3665ac27a0ecSDave Kleikamp 
3666617ba13bSMingming Cao static int ext4_mark_dquot_dirty(struct dquot *dquot)
3667ac27a0ecSDave Kleikamp {
36682c8be6b2SJan Kara 	/* Are we journaling quotas? */
3669617ba13bSMingming Cao 	if (EXT4_SB(dquot->dq_sb)->s_qf_names[USRQUOTA] ||
3670617ba13bSMingming Cao 	    EXT4_SB(dquot->dq_sb)->s_qf_names[GRPQUOTA]) {
3671ac27a0ecSDave Kleikamp 		dquot_mark_dquot_dirty(dquot);
3672617ba13bSMingming Cao 		return ext4_write_dquot(dquot);
3673ac27a0ecSDave Kleikamp 	} else {
3674ac27a0ecSDave Kleikamp 		return dquot_mark_dquot_dirty(dquot);
3675ac27a0ecSDave Kleikamp 	}
3676ac27a0ecSDave Kleikamp }
3677ac27a0ecSDave Kleikamp 
3678617ba13bSMingming Cao static int ext4_write_info(struct super_block *sb, int type)
3679ac27a0ecSDave Kleikamp {
3680ac27a0ecSDave Kleikamp 	int ret, err;
3681ac27a0ecSDave Kleikamp 	handle_t *handle;
3682ac27a0ecSDave Kleikamp 
3683ac27a0ecSDave Kleikamp 	/* Data block + inode block */
3684617ba13bSMingming Cao 	handle = ext4_journal_start(sb->s_root->d_inode, 2);
3685ac27a0ecSDave Kleikamp 	if (IS_ERR(handle))
3686ac27a0ecSDave Kleikamp 		return PTR_ERR(handle);
3687ac27a0ecSDave Kleikamp 	ret = dquot_commit_info(sb, type);
3688617ba13bSMingming Cao 	err = ext4_journal_stop(handle);
3689ac27a0ecSDave Kleikamp 	if (!ret)
3690ac27a0ecSDave Kleikamp 		ret = err;
3691ac27a0ecSDave Kleikamp 	return ret;
3692ac27a0ecSDave Kleikamp }
3693ac27a0ecSDave Kleikamp 
3694ac27a0ecSDave Kleikamp /*
3695ac27a0ecSDave Kleikamp  * Turn on quotas during mount time - we need to find
3696ac27a0ecSDave Kleikamp  * the quota file and such...
3697ac27a0ecSDave Kleikamp  */
3698617ba13bSMingming Cao static int ext4_quota_on_mount(struct super_block *sb, int type)
3699ac27a0ecSDave Kleikamp {
3700617ba13bSMingming Cao 	return vfs_quota_on_mount(sb, EXT4_SB(sb)->s_qf_names[type],
3701617ba13bSMingming Cao 			EXT4_SB(sb)->s_jquota_fmt, type);
3702ac27a0ecSDave Kleikamp }
3703ac27a0ecSDave Kleikamp 
3704ac27a0ecSDave Kleikamp /*
3705ac27a0ecSDave Kleikamp  * Standard function to be called on quota_on
3706ac27a0ecSDave Kleikamp  */
3707617ba13bSMingming Cao static int ext4_quota_on(struct super_block *sb, int type, int format_id,
37088264613dSAl Viro 			 char *name, int remount)
3709ac27a0ecSDave Kleikamp {
3710ac27a0ecSDave Kleikamp 	int err;
37118264613dSAl Viro 	struct path path;
3712ac27a0ecSDave Kleikamp 
3713ac27a0ecSDave Kleikamp 	if (!test_opt(sb, QUOTA))
3714ac27a0ecSDave Kleikamp 		return -EINVAL;
37158264613dSAl Viro 	/* When remounting, no checks are needed and in fact, name is NULL */
37160623543bSJan Kara 	if (remount)
37178264613dSAl Viro 		return vfs_quota_on(sb, type, format_id, name, remount);
37180623543bSJan Kara 
37198264613dSAl Viro 	err = kern_path(name, LOOKUP_FOLLOW, &path);
3720ac27a0ecSDave Kleikamp 	if (err)
3721ac27a0ecSDave Kleikamp 		return err;
37220623543bSJan Kara 
3723ac27a0ecSDave Kleikamp 	/* Quotafile not on the same filesystem? */
37248264613dSAl Viro 	if (path.mnt->mnt_sb != sb) {
37258264613dSAl Viro 		path_put(&path);
3726ac27a0ecSDave Kleikamp 		return -EXDEV;
3727ac27a0ecSDave Kleikamp 	}
37280623543bSJan Kara 	/* Journaling quota? */
37290623543bSJan Kara 	if (EXT4_SB(sb)->s_qf_names[type]) {
37302b2d6d01STheodore Ts'o 		/* Quotafile not in fs root? */
37318264613dSAl Viro 		if (path.dentry->d_parent != sb->s_root)
3732ac27a0ecSDave Kleikamp 			printk(KERN_WARNING
3733617ba13bSMingming Cao 				"EXT4-fs: Quota file not on filesystem root. "
37340623543bSJan Kara 				"Journaled quota will not work.\n");
37350623543bSJan Kara 	}
37360623543bSJan Kara 
37370623543bSJan Kara 	/*
37380623543bSJan Kara 	 * When we journal data on quota file, we have to flush journal to see
37390623543bSJan Kara 	 * all updates to the file when we bypass pagecache...
37400623543bSJan Kara 	 */
37410390131bSFrank Mayhar 	if (EXT4_SB(sb)->s_journal &&
37420390131bSFrank Mayhar 	    ext4_should_journal_data(path.dentry->d_inode)) {
37430623543bSJan Kara 		/*
37440623543bSJan Kara 		 * We don't need to lock updates but journal_flush() could
37450623543bSJan Kara 		 * otherwise be livelocked...
37460623543bSJan Kara 		 */
37470623543bSJan Kara 		jbd2_journal_lock_updates(EXT4_SB(sb)->s_journal);
37487ffe1ea8SHidehiro Kawai 		err = jbd2_journal_flush(EXT4_SB(sb)->s_journal);
37490623543bSJan Kara 		jbd2_journal_unlock_updates(EXT4_SB(sb)->s_journal);
37507ffe1ea8SHidehiro Kawai 		if (err) {
37518264613dSAl Viro 			path_put(&path);
37527ffe1ea8SHidehiro Kawai 			return err;
37537ffe1ea8SHidehiro Kawai 		}
37540623543bSJan Kara 	}
37550623543bSJan Kara 
37568264613dSAl Viro 	err = vfs_quota_on_path(sb, type, format_id, &path);
37578264613dSAl Viro 	path_put(&path);
375877e69dacSAl Viro 	return err;
3759ac27a0ecSDave Kleikamp }
3760ac27a0ecSDave Kleikamp 
3761ac27a0ecSDave Kleikamp /* Read data from quotafile - avoid pagecache and such because we cannot afford
3762ac27a0ecSDave Kleikamp  * acquiring the locks... As quota files are never truncated and quota code
3763ac27a0ecSDave Kleikamp  * itself serializes the operations (and noone else should touch the files)
3764ac27a0ecSDave Kleikamp  * we don't have to be afraid of races */
3765617ba13bSMingming Cao static ssize_t ext4_quota_read(struct super_block *sb, int type, char *data,
3766ac27a0ecSDave Kleikamp 			       size_t len, loff_t off)
3767ac27a0ecSDave Kleikamp {
3768ac27a0ecSDave Kleikamp 	struct inode *inode = sb_dqopt(sb)->files[type];
3769725d26d3SAneesh Kumar K.V 	ext4_lblk_t blk = off >> EXT4_BLOCK_SIZE_BITS(sb);
3770ac27a0ecSDave Kleikamp 	int err = 0;
3771ac27a0ecSDave Kleikamp 	int offset = off & (sb->s_blocksize - 1);
3772ac27a0ecSDave Kleikamp 	int tocopy;
3773ac27a0ecSDave Kleikamp 	size_t toread;
3774ac27a0ecSDave Kleikamp 	struct buffer_head *bh;
3775ac27a0ecSDave Kleikamp 	loff_t i_size = i_size_read(inode);
3776ac27a0ecSDave Kleikamp 
3777ac27a0ecSDave Kleikamp 	if (off > i_size)
3778ac27a0ecSDave Kleikamp 		return 0;
3779ac27a0ecSDave Kleikamp 	if (off+len > i_size)
3780ac27a0ecSDave Kleikamp 		len = i_size-off;
3781ac27a0ecSDave Kleikamp 	toread = len;
3782ac27a0ecSDave Kleikamp 	while (toread > 0) {
3783ac27a0ecSDave Kleikamp 		tocopy = sb->s_blocksize - offset < toread ?
3784ac27a0ecSDave Kleikamp 				sb->s_blocksize - offset : toread;
3785617ba13bSMingming Cao 		bh = ext4_bread(NULL, inode, blk, 0, &err);
3786ac27a0ecSDave Kleikamp 		if (err)
3787ac27a0ecSDave Kleikamp 			return err;
3788ac27a0ecSDave Kleikamp 		if (!bh)	/* A hole? */
3789ac27a0ecSDave Kleikamp 			memset(data, 0, tocopy);
3790ac27a0ecSDave Kleikamp 		else
3791ac27a0ecSDave Kleikamp 			memcpy(data, bh->b_data+offset, tocopy);
3792ac27a0ecSDave Kleikamp 		brelse(bh);
3793ac27a0ecSDave Kleikamp 		offset = 0;
3794ac27a0ecSDave Kleikamp 		toread -= tocopy;
3795ac27a0ecSDave Kleikamp 		data += tocopy;
3796ac27a0ecSDave Kleikamp 		blk++;
3797ac27a0ecSDave Kleikamp 	}
3798ac27a0ecSDave Kleikamp 	return len;
3799ac27a0ecSDave Kleikamp }
3800ac27a0ecSDave Kleikamp 
3801ac27a0ecSDave Kleikamp /* Write to quotafile (we know the transaction is already started and has
3802ac27a0ecSDave Kleikamp  * enough credits) */
3803617ba13bSMingming Cao static ssize_t ext4_quota_write(struct super_block *sb, int type,
3804ac27a0ecSDave Kleikamp 				const char *data, size_t len, loff_t off)
3805ac27a0ecSDave Kleikamp {
3806ac27a0ecSDave Kleikamp 	struct inode *inode = sb_dqopt(sb)->files[type];
3807725d26d3SAneesh Kumar K.V 	ext4_lblk_t blk = off >> EXT4_BLOCK_SIZE_BITS(sb);
3808ac27a0ecSDave Kleikamp 	int err = 0;
3809ac27a0ecSDave Kleikamp 	int offset = off & (sb->s_blocksize - 1);
3810ac27a0ecSDave Kleikamp 	int tocopy;
3811617ba13bSMingming Cao 	int journal_quota = EXT4_SB(sb)->s_qf_names[type] != NULL;
3812ac27a0ecSDave Kleikamp 	size_t towrite = len;
3813ac27a0ecSDave Kleikamp 	struct buffer_head *bh;
3814ac27a0ecSDave Kleikamp 	handle_t *handle = journal_current_handle();
3815ac27a0ecSDave Kleikamp 
38160390131bSFrank Mayhar 	if (EXT4_SB(sb)->s_journal && !handle) {
3817e5f8eab8STheodore Ts'o 		printk(KERN_WARNING "EXT4-fs: Quota write (off=%llu, len=%llu)"
38189c3013e9SJan Kara 			" cancelled because transaction is not started.\n",
38199c3013e9SJan Kara 			(unsigned long long)off, (unsigned long long)len);
38209c3013e9SJan Kara 		return -EIO;
38219c3013e9SJan Kara 	}
3822ac27a0ecSDave Kleikamp 	mutex_lock_nested(&inode->i_mutex, I_MUTEX_QUOTA);
3823ac27a0ecSDave Kleikamp 	while (towrite > 0) {
3824ac27a0ecSDave Kleikamp 		tocopy = sb->s_blocksize - offset < towrite ?
3825ac27a0ecSDave Kleikamp 				sb->s_blocksize - offset : towrite;
3826617ba13bSMingming Cao 		bh = ext4_bread(handle, inode, blk, 1, &err);
3827ac27a0ecSDave Kleikamp 		if (!bh)
3828ac27a0ecSDave Kleikamp 			goto out;
3829ac27a0ecSDave Kleikamp 		if (journal_quota) {
3830617ba13bSMingming Cao 			err = ext4_journal_get_write_access(handle, bh);
3831ac27a0ecSDave Kleikamp 			if (err) {
3832ac27a0ecSDave Kleikamp 				brelse(bh);
3833ac27a0ecSDave Kleikamp 				goto out;
3834ac27a0ecSDave Kleikamp 			}
3835ac27a0ecSDave Kleikamp 		}
3836ac27a0ecSDave Kleikamp 		lock_buffer(bh);
3837ac27a0ecSDave Kleikamp 		memcpy(bh->b_data+offset, data, tocopy);
3838ac27a0ecSDave Kleikamp 		flush_dcache_page(bh->b_page);
3839ac27a0ecSDave Kleikamp 		unlock_buffer(bh);
3840ac27a0ecSDave Kleikamp 		if (journal_quota)
38410390131bSFrank Mayhar 			err = ext4_handle_dirty_metadata(handle, NULL, bh);
3842ac27a0ecSDave Kleikamp 		else {
3843ac27a0ecSDave Kleikamp 			/* Always do at least ordered writes for quotas */
3844678aaf48SJan Kara 			err = ext4_jbd2_file_inode(handle, inode);
3845ac27a0ecSDave Kleikamp 			mark_buffer_dirty(bh);
3846ac27a0ecSDave Kleikamp 		}
3847ac27a0ecSDave Kleikamp 		brelse(bh);
3848ac27a0ecSDave Kleikamp 		if (err)
3849ac27a0ecSDave Kleikamp 			goto out;
3850ac27a0ecSDave Kleikamp 		offset = 0;
3851ac27a0ecSDave Kleikamp 		towrite -= tocopy;
3852ac27a0ecSDave Kleikamp 		data += tocopy;
3853ac27a0ecSDave Kleikamp 		blk++;
3854ac27a0ecSDave Kleikamp 	}
3855ac27a0ecSDave Kleikamp out:
38564d04e4fbSJan Kara 	if (len == towrite) {
38574d04e4fbSJan Kara 		mutex_unlock(&inode->i_mutex);
3858ac27a0ecSDave Kleikamp 		return err;
38594d04e4fbSJan Kara 	}
3860ac27a0ecSDave Kleikamp 	if (inode->i_size < off+len-towrite) {
3861ac27a0ecSDave Kleikamp 		i_size_write(inode, off+len-towrite);
3862617ba13bSMingming Cao 		EXT4_I(inode)->i_disksize = inode->i_size;
3863ac27a0ecSDave Kleikamp 	}
3864ac27a0ecSDave Kleikamp 	inode->i_mtime = inode->i_ctime = CURRENT_TIME;
3865617ba13bSMingming Cao 	ext4_mark_inode_dirty(handle, inode);
3866ac27a0ecSDave Kleikamp 	mutex_unlock(&inode->i_mutex);
3867ac27a0ecSDave Kleikamp 	return len - towrite;
3868ac27a0ecSDave Kleikamp }
3869ac27a0ecSDave Kleikamp 
3870ac27a0ecSDave Kleikamp #endif
3871ac27a0ecSDave Kleikamp 
3872617ba13bSMingming Cao static int ext4_get_sb(struct file_system_type *fs_type,
3873ac27a0ecSDave Kleikamp 	int flags, const char *dev_name, void *data, struct vfsmount *mnt)
3874ac27a0ecSDave Kleikamp {
3875617ba13bSMingming Cao 	return get_sb_bdev(fs_type, flags, dev_name, data, ext4_fill_super, mnt);
3876ac27a0ecSDave Kleikamp }
3877ac27a0ecSDave Kleikamp 
387803010a33STheodore Ts'o static struct file_system_type ext4_fs_type = {
3879ac27a0ecSDave Kleikamp 	.owner		= THIS_MODULE,
388003010a33STheodore Ts'o 	.name		= "ext4",
3881617ba13bSMingming Cao 	.get_sb		= ext4_get_sb,
3882ac27a0ecSDave Kleikamp 	.kill_sb	= kill_block_super,
3883ac27a0ecSDave Kleikamp 	.fs_flags	= FS_REQUIRES_DEV,
3884ac27a0ecSDave Kleikamp };
3885ac27a0ecSDave Kleikamp 
#ifdef CONFIG_EXT4DEV_COMPAT
/*
 * get_sb callback for the legacy "ext4dev" name: logs two deprecation
 * warnings, then mounts exactly like ext4_get_sb().
 */
static int ext4dev_get_sb(struct file_system_type *fs_type,
	int flags, const char *dev_name, void *data, struct vfsmount *mnt)
{
	printk(KERN_WARNING "EXT4-fs: Update your userspace programs "
	       "to mount using ext4\n");
	printk(KERN_WARNING "EXT4-fs: ext4dev backwards compatibility "
	       "will go away by 2.6.31\n");

	return get_sb_bdev(fs_type, flags, dev_name, data,
			   ext4_fill_super, mnt);
}

/* Backwards-compatible filesystem type registered as "ext4dev". */
static struct file_system_type ext4dev_fs_type = {
	.name		= "ext4dev",
	.owner		= THIS_MODULE,
	.fs_flags	= FS_REQUIRES_DEV,
	.get_sb		= ext4dev_get_sb,
	.kill_sb	= kill_block_super,
};
MODULE_ALIAS("ext4dev");
#endif
390603010a33STheodore Ts'o 
3907617ba13bSMingming Cao static int __init init_ext4_fs(void)
3908ac27a0ecSDave Kleikamp {
3909c9de560dSAlex Tomas 	int err;
3910c9de560dSAlex Tomas 
39113197ebdbSTheodore Ts'o 	ext4_kset = kset_create_and_add("ext4", NULL, fs_kobj);
39123197ebdbSTheodore Ts'o 	if (!ext4_kset)
39133197ebdbSTheodore Ts'o 		return -ENOMEM;
39149f6200bbSTheodore Ts'o 	ext4_proc_root = proc_mkdir("fs/ext4", NULL);
3915c9de560dSAlex Tomas 	err = init_ext4_mballoc();
3916ac27a0ecSDave Kleikamp 	if (err)
3917ac27a0ecSDave Kleikamp 		return err;
3918c9de560dSAlex Tomas 
3919c9de560dSAlex Tomas 	err = init_ext4_xattr();
3920c9de560dSAlex Tomas 	if (err)
3921c9de560dSAlex Tomas 		goto out2;
3922ac27a0ecSDave Kleikamp 	err = init_inodecache();
3923ac27a0ecSDave Kleikamp 	if (err)
3924ac27a0ecSDave Kleikamp 		goto out1;
392503010a33STheodore Ts'o 	err = register_filesystem(&ext4_fs_type);
3926ac27a0ecSDave Kleikamp 	if (err)
3927ac27a0ecSDave Kleikamp 		goto out;
392803010a33STheodore Ts'o #ifdef CONFIG_EXT4DEV_COMPAT
392903010a33STheodore Ts'o 	err = register_filesystem(&ext4dev_fs_type);
393003010a33STheodore Ts'o 	if (err) {
393103010a33STheodore Ts'o 		unregister_filesystem(&ext4_fs_type);
393203010a33STheodore Ts'o 		goto out;
393303010a33STheodore Ts'o 	}
393403010a33STheodore Ts'o #endif
3935ac27a0ecSDave Kleikamp 	return 0;
3936ac27a0ecSDave Kleikamp out:
3937ac27a0ecSDave Kleikamp 	destroy_inodecache();
3938ac27a0ecSDave Kleikamp out1:
3939617ba13bSMingming Cao 	exit_ext4_xattr();
3940c9de560dSAlex Tomas out2:
3941c9de560dSAlex Tomas 	exit_ext4_mballoc();
3942ac27a0ecSDave Kleikamp 	return err;
3943ac27a0ecSDave Kleikamp }
3944ac27a0ecSDave Kleikamp 
3945617ba13bSMingming Cao static void __exit exit_ext4_fs(void)
3946ac27a0ecSDave Kleikamp {
394703010a33STheodore Ts'o 	unregister_filesystem(&ext4_fs_type);
394803010a33STheodore Ts'o #ifdef CONFIG_EXT4DEV_COMPAT
3949617ba13bSMingming Cao 	unregister_filesystem(&ext4dev_fs_type);
395003010a33STheodore Ts'o #endif
3951ac27a0ecSDave Kleikamp 	destroy_inodecache();
3952617ba13bSMingming Cao 	exit_ext4_xattr();
3953c9de560dSAlex Tomas 	exit_ext4_mballoc();
39549f6200bbSTheodore Ts'o 	remove_proc_entry("fs/ext4", NULL);
39553197ebdbSTheodore Ts'o 	kset_unregister(ext4_kset);
3956ac27a0ecSDave Kleikamp }
3957ac27a0ecSDave Kleikamp 
3958ac27a0ecSDave Kleikamp MODULE_AUTHOR("Remy Card, Stephen Tweedie, Andrew Morton, Andreas Dilger, Theodore Ts'o and others");
395983982b6fSTheodore Ts'o MODULE_DESCRIPTION("Fourth Extended Filesystem");
3960ac27a0ecSDave Kleikamp MODULE_LICENSE("GPL");
3961617ba13bSMingming Cao module_init(init_ext4_fs)
3962617ba13bSMingming Cao module_exit(exit_ext4_fs)
3963