xref: /linux/fs/ext4/super.c (revision 54902099b1d8b62bea7cfd949aa3acd9eae1c3db)
1f5166768STheodore Ts'o // SPDX-License-Identifier: GPL-2.0
2ac27a0ecSDave Kleikamp /*
3617ba13bSMingming Cao  *  linux/fs/ext4/super.c
4ac27a0ecSDave Kleikamp  *
5ac27a0ecSDave Kleikamp  * Copyright (C) 1992, 1993, 1994, 1995
6ac27a0ecSDave Kleikamp  * Remy Card (card@masi.ibp.fr)
7ac27a0ecSDave Kleikamp  * Laboratoire MASI - Institut Blaise Pascal
8ac27a0ecSDave Kleikamp  * Universite Pierre et Marie Curie (Paris VI)
9ac27a0ecSDave Kleikamp  *
10ac27a0ecSDave Kleikamp  *  from
11ac27a0ecSDave Kleikamp  *
12ac27a0ecSDave Kleikamp  *  linux/fs/minix/inode.c
13ac27a0ecSDave Kleikamp  *
14ac27a0ecSDave Kleikamp  *  Copyright (C) 1991, 1992  Linus Torvalds
15ac27a0ecSDave Kleikamp  *
16ac27a0ecSDave Kleikamp  *  Big-endian to little-endian byte-swapping/bitmaps by
17ac27a0ecSDave Kleikamp  *        David S. Miller (davem@caip.rutgers.edu), 1995
18ac27a0ecSDave Kleikamp  */
19ac27a0ecSDave Kleikamp 
20ac27a0ecSDave Kleikamp #include <linux/module.h>
21ac27a0ecSDave Kleikamp #include <linux/string.h>
22ac27a0ecSDave Kleikamp #include <linux/fs.h>
23ac27a0ecSDave Kleikamp #include <linux/time.h>
24c5ca7c76STheodore Ts'o #include <linux/vmalloc.h>
25ac27a0ecSDave Kleikamp #include <linux/slab.h>
26ac27a0ecSDave Kleikamp #include <linux/init.h>
27ac27a0ecSDave Kleikamp #include <linux/blkdev.h>
2866114cadSTejun Heo #include <linux/backing-dev.h>
29ac27a0ecSDave Kleikamp #include <linux/parser.h>
30ac27a0ecSDave Kleikamp #include <linux/buffer_head.h>
31a5694255SChristoph Hellwig #include <linux/exportfs.h>
32ac27a0ecSDave Kleikamp #include <linux/vfs.h>
33ac27a0ecSDave Kleikamp #include <linux/random.h>
34ac27a0ecSDave Kleikamp #include <linux/mount.h>
35ac27a0ecSDave Kleikamp #include <linux/namei.h>
36ac27a0ecSDave Kleikamp #include <linux/quotaops.h>
37ac27a0ecSDave Kleikamp #include <linux/seq_file.h>
383197ebdbSTheodore Ts'o #include <linux/ctype.h>
391330593eSVignesh Babu #include <linux/log2.h>
40717d50e4SAndreas Dilger #include <linux/crc16.h>
41ef510424SDan Williams #include <linux/dax.h>
427c0f6ba6SLinus Torvalds #include <linux/uaccess.h>
43ee73f9a5SJeff Layton #include <linux/iversion.h>
44c83ad55eSGabriel Krisman Bertazi #include <linux/unicode.h>
45c6a564ffSChristoph Hellwig #include <linux/part_stat.h>
46bfff6873SLukas Czerner #include <linux/kthread.h>
47bfff6873SLukas Czerner #include <linux/freezer.h>
489a089b21SGabriel Krisman Bertazi #include <linux/fsnotify.h>
49e5a185c2SLukas Czerner #include <linux/fs_context.h>
50e5a185c2SLukas Czerner #include <linux/fs_parser.h>
51bfff6873SLukas Czerner 
523dcf5451SChristoph Hellwig #include "ext4.h"
534a092d73STheodore Ts'o #include "ext4_extents.h"	/* Needed for trace points definition */
543dcf5451SChristoph Hellwig #include "ext4_jbd2.h"
55ac27a0ecSDave Kleikamp #include "xattr.h"
56ac27a0ecSDave Kleikamp #include "acl.h"
573661d286STheodore Ts'o #include "mballoc.h"
580c9ec4beSDarrick J. Wong #include "fsmap.h"
59ac27a0ecSDave Kleikamp 
609bffad1eSTheodore Ts'o #define CREATE_TRACE_POINTS
619bffad1eSTheodore Ts'o #include <trace/events/ext4.h>
629bffad1eSTheodore Ts'o 
630b75a840SLukas Czerner static struct ext4_lazy_init *ext4_li_info;
6459ebc7fdSZheng Yongjun static DEFINE_MUTEX(ext4_li_mtx);
65e294a537STheodore Ts'o static struct ratelimit_state ext4_mount_msg_ratelimit;
669f6200bbSTheodore Ts'o 
67617ba13bSMingming Cao static int ext4_load_journal(struct super_block *, struct ext4_super_block *,
68ac27a0ecSDave Kleikamp 			     unsigned long journal_devnum);
692adf6da8STheodore Ts'o static int ext4_show_options(struct seq_file *seq, struct dentry *root);
702d01ddc8SJan Kara static void ext4_update_super(struct super_block *sb);
714392fbc4SJan Kara static int ext4_commit_super(struct super_block *sb);
7211215630SJan Kara static int ext4_mark_recovery_complete(struct super_block *sb,
73617ba13bSMingming Cao 					struct ext4_super_block *es);
7411215630SJan Kara static int ext4_clear_journal_err(struct super_block *sb,
75617ba13bSMingming Cao 				  struct ext4_super_block *es);
76617ba13bSMingming Cao static int ext4_sync_fs(struct super_block *sb, int wait);
77617ba13bSMingming Cao static int ext4_statfs(struct dentry *dentry, struct kstatfs *buf);
78c4be0c1dSTakashi Sato static int ext4_unfreeze(struct super_block *sb);
79c4be0c1dSTakashi Sato static int ext4_freeze(struct super_block *sb);
802035e776STheodore Ts'o static inline int ext2_feature_set_ok(struct super_block *sb);
812035e776STheodore Ts'o static inline int ext3_feature_set_ok(struct super_block *sb);
82bfff6873SLukas Czerner static void ext4_destroy_lazyinit_thread(void);
83bfff6873SLukas Czerner static void ext4_unregister_li_request(struct super_block *sb);
848f1f7453SEric Sandeen static void ext4_clear_request_list(void);
85c6cb7e77SEric Whitney static struct inode *ext4_get_journal_inode(struct super_block *sb,
86c6cb7e77SEric Whitney 					    unsigned int journal_inum);
87da812f61SLukas Czerner static int ext4_validate_options(struct fs_context *fc);
88b6bd2435SLukas Czerner static int ext4_check_opt_consistency(struct fs_context *fc,
89e6e268cbSLukas Czerner 				      struct super_block *sb);
9085456054SEric Biggers static void ext4_apply_options(struct fs_context *fc, struct super_block *sb);
9102f960f8SLukas Czerner static int ext4_parse_param(struct fs_context *fc, struct fs_parameter *param);
92cebe85d5SLukas Czerner static int ext4_get_tree(struct fs_context *fc);
93cebe85d5SLukas Czerner static int ext4_reconfigure(struct fs_context *fc);
94cebe85d5SLukas Czerner static void ext4_fc_free(struct fs_context *fc);
95cebe85d5SLukas Czerner static int ext4_init_fs_context(struct fs_context *fc);
96cebe85d5SLukas Czerner static const struct fs_parameter_spec ext4_param_specs[];
97ac27a0ecSDave Kleikamp 
98e74031fdSJan Kara /*
99e74031fdSJan Kara  * Lock ordering
100e74031fdSJan Kara  *
101e74031fdSJan Kara  * page fault path:
102d4f5258eSJan Kara  * mmap_lock -> sb_start_pagefault -> invalidate_lock (r) -> transaction start
103d4f5258eSJan Kara  *   -> page lock -> i_data_sem (rw)
104e74031fdSJan Kara  *
105e74031fdSJan Kara  * buffered write path:
106c1e8d7c6SMichel Lespinasse  * sb_start_write -> i_mutex -> mmap_lock
107e74031fdSJan Kara  * sb_start_write -> i_mutex -> transaction start -> page lock ->
108e74031fdSJan Kara  *   i_data_sem (rw)
109e74031fdSJan Kara  *
110e74031fdSJan Kara  * truncate:
111d4f5258eSJan Kara  * sb_start_write -> i_mutex -> invalidate_lock (w) -> i_mmap_rwsem (w) ->
112d4f5258eSJan Kara  *   page lock
113d4f5258eSJan Kara  * sb_start_write -> i_mutex -> invalidate_lock (w) -> transaction start ->
1141d39834fSNikolay Borisov  *   i_data_sem (rw)
115e74031fdSJan Kara  *
116e74031fdSJan Kara  * direct IO:
117c1e8d7c6SMichel Lespinasse  * sb_start_write -> i_mutex -> mmap_lock
1181d39834fSNikolay Borisov  * sb_start_write -> i_mutex -> transaction start -> i_data_sem (rw)
119e74031fdSJan Kara  *
120e74031fdSJan Kara  * writepages:
121e74031fdSJan Kara  * transaction start -> page lock(s) -> i_data_sem (rw)
122e74031fdSJan Kara  */
123e74031fdSJan Kara 
12402f960f8SLukas Czerner static const struct fs_context_operations ext4_context_ops = {
12502f960f8SLukas Czerner 	.parse_param	= ext4_parse_param,
126cebe85d5SLukas Czerner 	.get_tree	= ext4_get_tree,
127cebe85d5SLukas Czerner 	.reconfigure	= ext4_reconfigure,
128cebe85d5SLukas Czerner 	.free		= ext4_fc_free,
12902f960f8SLukas Czerner };
13002f960f8SLukas Czerner 
13102f960f8SLukas Czerner 
/*
 * Register an "ext2" filesystem type backed by this driver only when no
 * native ext2 driver is configured (built-in or modular) and
 * CONFIG_EXT4_USE_FOR_EXT2 is enabled.
 */
#if !defined(CONFIG_EXT2_FS) && !defined(CONFIG_EXT2_FS_MODULE) && \
	defined(CONFIG_EXT4_USE_FOR_EXT2)
static struct file_system_type ext2_fs_type = {
	.name			= "ext2",
	.owner			= THIS_MODULE,
	.fs_flags		= FS_REQUIRES_DEV,
	.init_fs_context	= ext4_init_fs_context,
	.parameters		= ext4_param_specs,
	.kill_sb		= kill_block_super,
};
MODULE_ALIAS_FS("ext2");
MODULE_ALIAS("ext2");
/* True when the block device behind @sb is held by ext2_fs_type. */
#define IS_EXT2_SB(sb) ((sb)->s_bdev->bd_holder == &ext2_fs_type)
#else
/* Without the ext2 alias no superblock can be an ext2 one. */
#define IS_EXT2_SB(sb) (0)
#endif
1472035e776STheodore Ts'o 
1482035e776STheodore Ts'o 
149ba69f9abSJan Kara static struct file_system_type ext3_fs_type = {
150ba69f9abSJan Kara 	.owner			= THIS_MODULE,
151ba69f9abSJan Kara 	.name			= "ext3",
152cebe85d5SLukas Czerner 	.init_fs_context	= ext4_init_fs_context,
153cebe85d5SLukas Czerner 	.parameters		= ext4_param_specs,
154ba69f9abSJan Kara 	.kill_sb		= kill_block_super,
155ba69f9abSJan Kara 	.fs_flags		= FS_REQUIRES_DEV,
156ba69f9abSJan Kara };
1577f78e035SEric W. Biederman MODULE_ALIAS_FS("ext3");
158fa7614ddSEric W. Biederman MODULE_ALIAS("ext3");
159ba69f9abSJan Kara #define IS_EXT3_SB(sb) ((sb)->s_bdev->bd_holder == &ext3_fs_type)
160bd81d8eeSLaurent Vivier 
161fa491b14Szhangyi (F) 
16267c0f556SBart Van Assche static inline void __ext4_read_bh(struct buffer_head *bh, blk_opf_t op_flags,
163fa491b14Szhangyi (F) 				  bh_end_io_t *end_io)
164fa491b14Szhangyi (F) {
165fb265c9cSTheodore Ts'o 	/*
166fa491b14Szhangyi (F) 	 * buffer's verified bit is no longer valid after reading from
167fa491b14Szhangyi (F) 	 * disk again due to write out error, clear it to make sure we
168fa491b14Szhangyi (F) 	 * recheck the buffer contents.
169fa491b14Szhangyi (F) 	 */
170fa491b14Szhangyi (F) 	clear_buffer_verified(bh);
171fa491b14Szhangyi (F) 
172fa491b14Szhangyi (F) 	bh->b_end_io = end_io ? end_io : end_buffer_read_sync;
173fa491b14Szhangyi (F) 	get_bh(bh);
1741420c4a5SBart Van Assche 	submit_bh(REQ_OP_READ | op_flags, bh);
175fa491b14Szhangyi (F) }
176fa491b14Szhangyi (F) 
17767c0f556SBart Van Assche void ext4_read_bh_nowait(struct buffer_head *bh, blk_opf_t op_flags,
178fa491b14Szhangyi (F) 			 bh_end_io_t *end_io)
179fa491b14Szhangyi (F) {
180fa491b14Szhangyi (F) 	BUG_ON(!buffer_locked(bh));
181fa491b14Szhangyi (F) 
182fa491b14Szhangyi (F) 	if (ext4_buffer_uptodate(bh)) {
183fa491b14Szhangyi (F) 		unlock_buffer(bh);
184fa491b14Szhangyi (F) 		return;
185fa491b14Szhangyi (F) 	}
186fa491b14Szhangyi (F) 	__ext4_read_bh(bh, op_flags, end_io);
187fa491b14Szhangyi (F) }
188fa491b14Szhangyi (F) 
18967c0f556SBart Van Assche int ext4_read_bh(struct buffer_head *bh, blk_opf_t op_flags, bh_end_io_t *end_io)
190fa491b14Szhangyi (F) {
191fa491b14Szhangyi (F) 	BUG_ON(!buffer_locked(bh));
192fa491b14Szhangyi (F) 
193fa491b14Szhangyi (F) 	if (ext4_buffer_uptodate(bh)) {
194fa491b14Szhangyi (F) 		unlock_buffer(bh);
195fa491b14Szhangyi (F) 		return 0;
196fa491b14Szhangyi (F) 	}
197fa491b14Szhangyi (F) 
198fa491b14Szhangyi (F) 	__ext4_read_bh(bh, op_flags, end_io);
199fa491b14Szhangyi (F) 
200fa491b14Szhangyi (F) 	wait_on_buffer(bh);
201fa491b14Szhangyi (F) 	if (buffer_uptodate(bh))
202fa491b14Szhangyi (F) 		return 0;
203fa491b14Szhangyi (F) 	return -EIO;
204fa491b14Szhangyi (F) }
205fa491b14Szhangyi (F) 
20667c0f556SBart Van Assche int ext4_read_bh_lock(struct buffer_head *bh, blk_opf_t op_flags, bool wait)
207fa491b14Szhangyi (F) {
2080b73284cSZhang Yi 	lock_buffer(bh);
2090b73284cSZhang Yi 	if (!wait) {
210fa491b14Szhangyi (F) 		ext4_read_bh_nowait(bh, op_flags, NULL);
211fa491b14Szhangyi (F) 		return 0;
212fa491b14Szhangyi (F) 	}
2130b73284cSZhang Yi 	return ext4_read_bh(bh, op_flags, NULL);
214fa491b14Szhangyi (F) }
215fa491b14Szhangyi (F) 
216fb265c9cSTheodore Ts'o /*
2178394a6abSzhangyi (F)  * This works like __bread_gfp() except it uses ERR_PTR for error
218fb265c9cSTheodore Ts'o  * returns.  Currently with sb_bread it's impossible to distinguish
219fb265c9cSTheodore Ts'o  * between ENOMEM and EIO situations (since both result in a NULL
220fb265c9cSTheodore Ts'o  * return.
221fb265c9cSTheodore Ts'o  */
2228394a6abSzhangyi (F) static struct buffer_head *__ext4_sb_bread_gfp(struct super_block *sb,
22367c0f556SBart Van Assche 					       sector_t block,
22467c0f556SBart Van Assche 					       blk_opf_t op_flags, gfp_t gfp)
225fb265c9cSTheodore Ts'o {
2262d069c08Szhangyi (F) 	struct buffer_head *bh;
2272d069c08Szhangyi (F) 	int ret;
228fb265c9cSTheodore Ts'o 
2298394a6abSzhangyi (F) 	bh = sb_getblk_gfp(sb, block, gfp);
230fb265c9cSTheodore Ts'o 	if (bh == NULL)
231fb265c9cSTheodore Ts'o 		return ERR_PTR(-ENOMEM);
232cf2834a5STheodore Ts'o 	if (ext4_buffer_uptodate(bh))
233fb265c9cSTheodore Ts'o 		return bh;
2342d069c08Szhangyi (F) 
2352d069c08Szhangyi (F) 	ret = ext4_read_bh_lock(bh, REQ_META | op_flags, true);
2362d069c08Szhangyi (F) 	if (ret) {
237fb265c9cSTheodore Ts'o 		put_bh(bh);
2382d069c08Szhangyi (F) 		return ERR_PTR(ret);
2392d069c08Szhangyi (F) 	}
2402d069c08Szhangyi (F) 	return bh;
241fb265c9cSTheodore Ts'o }
242fb265c9cSTheodore Ts'o 
2438394a6abSzhangyi (F) struct buffer_head *ext4_sb_bread(struct super_block *sb, sector_t block,
24467c0f556SBart Van Assche 				   blk_opf_t op_flags)
2458394a6abSzhangyi (F) {
2468394a6abSzhangyi (F) 	return __ext4_sb_bread_gfp(sb, block, op_flags, __GFP_MOVABLE);
2478394a6abSzhangyi (F) }
2488394a6abSzhangyi (F) 
2498394a6abSzhangyi (F) struct buffer_head *ext4_sb_bread_unmovable(struct super_block *sb,
2508394a6abSzhangyi (F) 					    sector_t block)
2518394a6abSzhangyi (F) {
2528394a6abSzhangyi (F) 	return __ext4_sb_bread_gfp(sb, block, 0, 0);
2538394a6abSzhangyi (F) }
2548394a6abSzhangyi (F) 
2555df1d412Szhangyi (F) void ext4_sb_breadahead_unmovable(struct super_block *sb, sector_t block)
2565df1d412Szhangyi (F) {
2575df1d412Szhangyi (F) 	struct buffer_head *bh = sb_getblk_gfp(sb, block, 0);
2585df1d412Szhangyi (F) 
2595df1d412Szhangyi (F) 	if (likely(bh)) {
2600b73284cSZhang Yi 		if (trylock_buffer(bh))
2610b73284cSZhang Yi 			ext4_read_bh_nowait(bh, REQ_RAHEAD, NULL);
2625df1d412Szhangyi (F) 		brelse(bh);
2635df1d412Szhangyi (F) 	}
264c197855eSStephen Hemminger }
265a9c47317SDarrick J. Wong 
266a9c47317SDarrick J. Wong static int ext4_verify_csum_type(struct super_block *sb,
2679aa5d32bSDmitry Monakhov 				 struct ext4_super_block *es)
268a9c47317SDarrick J. Wong {
269a9c47317SDarrick J. Wong 	if (!ext4_has_feature_metadata_csum(sb))
270a9c47317SDarrick J. Wong 		return 1;
271a9c47317SDarrick J. Wong 
272a9c47317SDarrick J. Wong 	return es->s_checksum_type == EXT4_CRC32C_CHKSUM;
27306db49e6STheodore Ts'o }
274a9c47317SDarrick J. Wong 
275bbc605cdSLukas Czerner __le32 ext4_superblock_csum(struct super_block *sb,
276a9c47317SDarrick J. Wong 			    struct ext4_super_block *es)
277a9c47317SDarrick J. Wong {
278a9c47317SDarrick J. Wong 	struct ext4_sb_info *sbi = EXT4_SB(sb);
279a9c47317SDarrick J. Wong 	int offset = offsetof(struct ext4_super_block, s_checksum);
280a9c47317SDarrick J. Wong 	__u32 csum;
281a9c47317SDarrick J. Wong 
282a9c47317SDarrick J. Wong 	csum = ext4_chksum(sbi, ~0, (char *)es, offset);
283a9c47317SDarrick J. Wong 
284a9c47317SDarrick J. Wong 	return cpu_to_le32(csum);
285a9c47317SDarrick J. Wong }
286a9c47317SDarrick J. Wong 
287a9c47317SDarrick J. Wong static int ext4_superblock_csum_verify(struct super_block *sb,
288a9c47317SDarrick J. Wong 				       struct ext4_super_block *es)
289a9c47317SDarrick J. Wong {
290a9c47317SDarrick J. Wong 	if (!ext4_has_metadata_csum(sb))
291a9c47317SDarrick J. Wong 		return 1;
292a9c47317SDarrick J. Wong 
293a9c47317SDarrick J. Wong 	return es->s_checksum == ext4_superblock_csum(sb, es);
294a9c47317SDarrick J. Wong }
295a9c47317SDarrick J. Wong 
296a9c47317SDarrick J. Wong void ext4_superblock_csum_set(struct super_block *sb)
297a9c47317SDarrick J. Wong {
29806db49e6STheodore Ts'o 	struct ext4_super_block *es = EXT4_SB(sb)->s_es;
29906db49e6STheodore Ts'o 
3009aa5d32bSDmitry Monakhov 	if (!ext4_has_metadata_csum(sb))
301a9c47317SDarrick J. Wong 		return;
302a9c47317SDarrick J. Wong 
303a9c47317SDarrick J. Wong 	es->s_checksum = ext4_superblock_csum(sb, es);
304a9c47317SDarrick J. Wong }
305a9c47317SDarrick J. Wong 
3068fadc143SAlexandre Ratchov ext4_fsblk_t ext4_block_bitmap(struct super_block *sb,
3078fadc143SAlexandre Ratchov 			       struct ext4_group_desc *bg)
308bd81d8eeSLaurent Vivier {
3093a14589cSAneesh Kumar K.V 	return le32_to_cpu(bg->bg_block_bitmap_lo) |
3108fadc143SAlexandre Ratchov 		(EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT ?
3118fadc143SAlexandre Ratchov 		 (ext4_fsblk_t)le32_to_cpu(bg->bg_block_bitmap_hi) << 32 : 0);
312bd81d8eeSLaurent Vivier }
313bd81d8eeSLaurent Vivier 
3148fadc143SAlexandre Ratchov ext4_fsblk_t ext4_inode_bitmap(struct super_block *sb,
3158fadc143SAlexandre Ratchov 			       struct ext4_group_desc *bg)
316bd81d8eeSLaurent Vivier {
3175272f837SAneesh Kumar K.V 	return le32_to_cpu(bg->bg_inode_bitmap_lo) |
3188fadc143SAlexandre Ratchov 		(EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT ?
3198fadc143SAlexandre Ratchov 		 (ext4_fsblk_t)le32_to_cpu(bg->bg_inode_bitmap_hi) << 32 : 0);
320bd81d8eeSLaurent Vivier }
321bd81d8eeSLaurent Vivier 
3228fadc143SAlexandre Ratchov ext4_fsblk_t ext4_inode_table(struct super_block *sb,
3238fadc143SAlexandre Ratchov 			      struct ext4_group_desc *bg)
324bd81d8eeSLaurent Vivier {
3255272f837SAneesh Kumar K.V 	return le32_to_cpu(bg->bg_inode_table_lo) |
3268fadc143SAlexandre Ratchov 		(EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT ?
3278fadc143SAlexandre Ratchov 		 (ext4_fsblk_t)le32_to_cpu(bg->bg_inode_table_hi) << 32 : 0);
328bd81d8eeSLaurent Vivier }
329bd81d8eeSLaurent Vivier 
330021b65bbSTheodore Ts'o __u32 ext4_free_group_clusters(struct super_block *sb,
331560671a0SAneesh Kumar K.V 			       struct ext4_group_desc *bg)
332560671a0SAneesh Kumar K.V {
333560671a0SAneesh Kumar K.V 	return le16_to_cpu(bg->bg_free_blocks_count_lo) |
334560671a0SAneesh Kumar K.V 		(EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT ?
335560671a0SAneesh Kumar K.V 		 (__u32)le16_to_cpu(bg->bg_free_blocks_count_hi) << 16 : 0);
336560671a0SAneesh Kumar K.V }
337560671a0SAneesh Kumar K.V 
338560671a0SAneesh Kumar K.V __u32 ext4_free_inodes_count(struct super_block *sb,
339560671a0SAneesh Kumar K.V 			      struct ext4_group_desc *bg)
340560671a0SAneesh Kumar K.V {
341560671a0SAneesh Kumar K.V 	return le16_to_cpu(bg->bg_free_inodes_count_lo) |
342560671a0SAneesh Kumar K.V 		(EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT ?
343560671a0SAneesh Kumar K.V 		 (__u32)le16_to_cpu(bg->bg_free_inodes_count_hi) << 16 : 0);
344560671a0SAneesh Kumar K.V }
345560671a0SAneesh Kumar K.V 
346560671a0SAneesh Kumar K.V __u32 ext4_used_dirs_count(struct super_block *sb,
347560671a0SAneesh Kumar K.V 			      struct ext4_group_desc *bg)
348560671a0SAneesh Kumar K.V {
349560671a0SAneesh Kumar K.V 	return le16_to_cpu(bg->bg_used_dirs_count_lo) |
350560671a0SAneesh Kumar K.V 		(EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT ?
351560671a0SAneesh Kumar K.V 		 (__u32)le16_to_cpu(bg->bg_used_dirs_count_hi) << 16 : 0);
352560671a0SAneesh Kumar K.V }
353560671a0SAneesh Kumar K.V 
354560671a0SAneesh Kumar K.V __u32 ext4_itable_unused_count(struct super_block *sb,
355560671a0SAneesh Kumar K.V 			      struct ext4_group_desc *bg)
356560671a0SAneesh Kumar K.V {
357560671a0SAneesh Kumar K.V 	return le16_to_cpu(bg->bg_itable_unused_lo) |
358560671a0SAneesh Kumar K.V 		(EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT ?
359560671a0SAneesh Kumar K.V 		 (__u32)le16_to_cpu(bg->bg_itable_unused_hi) << 16 : 0);
360560671a0SAneesh Kumar K.V }
361560671a0SAneesh Kumar K.V 
3628fadc143SAlexandre Ratchov void ext4_block_bitmap_set(struct super_block *sb,
3638fadc143SAlexandre Ratchov 			   struct ext4_group_desc *bg, ext4_fsblk_t blk)
364bd81d8eeSLaurent Vivier {
3653a14589cSAneesh Kumar K.V 	bg->bg_block_bitmap_lo = cpu_to_le32((u32)blk);
3668fadc143SAlexandre Ratchov 	if (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT)
3678fadc143SAlexandre Ratchov 		bg->bg_block_bitmap_hi = cpu_to_le32(blk >> 32);
368bd81d8eeSLaurent Vivier }
369bd81d8eeSLaurent Vivier 
3708fadc143SAlexandre Ratchov void ext4_inode_bitmap_set(struct super_block *sb,
3718fadc143SAlexandre Ratchov 			   struct ext4_group_desc *bg, ext4_fsblk_t blk)
372bd81d8eeSLaurent Vivier {
3735272f837SAneesh Kumar K.V 	bg->bg_inode_bitmap_lo  = cpu_to_le32((u32)blk);
3748fadc143SAlexandre Ratchov 	if (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT)
3758fadc143SAlexandre Ratchov 		bg->bg_inode_bitmap_hi = cpu_to_le32(blk >> 32);
376bd81d8eeSLaurent Vivier }
377bd81d8eeSLaurent Vivier 
3788fadc143SAlexandre Ratchov void ext4_inode_table_set(struct super_block *sb,
3798fadc143SAlexandre Ratchov 			  struct ext4_group_desc *bg, ext4_fsblk_t blk)
380bd81d8eeSLaurent Vivier {
3815272f837SAneesh Kumar K.V 	bg->bg_inode_table_lo = cpu_to_le32((u32)blk);
3828fadc143SAlexandre Ratchov 	if (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT)
3838fadc143SAlexandre Ratchov 		bg->bg_inode_table_hi = cpu_to_le32(blk >> 32);
384bd81d8eeSLaurent Vivier }
385bd81d8eeSLaurent Vivier 
386021b65bbSTheodore Ts'o void ext4_free_group_clusters_set(struct super_block *sb,
387560671a0SAneesh Kumar K.V 				  struct ext4_group_desc *bg, __u32 count)
388560671a0SAneesh Kumar K.V {
389560671a0SAneesh Kumar K.V 	bg->bg_free_blocks_count_lo = cpu_to_le16((__u16)count);
390560671a0SAneesh Kumar K.V 	if (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT)
391560671a0SAneesh Kumar K.V 		bg->bg_free_blocks_count_hi = cpu_to_le16(count >> 16);
392560671a0SAneesh Kumar K.V }
393560671a0SAneesh Kumar K.V 
394560671a0SAneesh Kumar K.V void ext4_free_inodes_set(struct super_block *sb,
395560671a0SAneesh Kumar K.V 			  struct ext4_group_desc *bg, __u32 count)
396560671a0SAneesh Kumar K.V {
397560671a0SAneesh Kumar K.V 	bg->bg_free_inodes_count_lo = cpu_to_le16((__u16)count);
398560671a0SAneesh Kumar K.V 	if (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT)
399560671a0SAneesh Kumar K.V 		bg->bg_free_inodes_count_hi = cpu_to_le16(count >> 16);
400560671a0SAneesh Kumar K.V }
401560671a0SAneesh Kumar K.V 
402560671a0SAneesh Kumar K.V void ext4_used_dirs_set(struct super_block *sb,
403560671a0SAneesh Kumar K.V 			  struct ext4_group_desc *bg, __u32 count)
404560671a0SAneesh Kumar K.V {
405560671a0SAneesh Kumar K.V 	bg->bg_used_dirs_count_lo = cpu_to_le16((__u16)count);
406560671a0SAneesh Kumar K.V 	if (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT)
407560671a0SAneesh Kumar K.V 		bg->bg_used_dirs_count_hi = cpu_to_le16(count >> 16);
408560671a0SAneesh Kumar K.V }
409560671a0SAneesh Kumar K.V 
410560671a0SAneesh Kumar K.V void ext4_itable_unused_set(struct super_block *sb,
411560671a0SAneesh Kumar K.V 			  struct ext4_group_desc *bg, __u32 count)
412560671a0SAneesh Kumar K.V {
413560671a0SAneesh Kumar K.V 	bg->bg_itable_unused_lo = cpu_to_le16((__u16)count);
414560671a0SAneesh Kumar K.V 	if (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT)
415560671a0SAneesh Kumar K.V 		bg->bg_itable_unused_hi = cpu_to_le16(count >> 16);
416560671a0SAneesh Kumar K.V }
417560671a0SAneesh Kumar K.V 
418c92dc856SJan Kara static void __ext4_update_tstamp(__le32 *lo, __u8 *hi, time64_t now)
4196a0678a7SArnd Bergmann {
4206a0678a7SArnd Bergmann 	now = clamp_val(now, 0, (1ull << 40) - 1);
4216a0678a7SArnd Bergmann 
4226a0678a7SArnd Bergmann 	*lo = cpu_to_le32(lower_32_bits(now));
4236a0678a7SArnd Bergmann 	*hi = upper_32_bits(now);
4246a0678a7SArnd Bergmann }
4256a0678a7SArnd Bergmann 
4266a0678a7SArnd Bergmann static time64_t __ext4_get_tstamp(__le32 *lo, __u8 *hi)
4276a0678a7SArnd Bergmann {
4286a0678a7SArnd Bergmann 	return ((time64_t)(*hi) << 32) + le32_to_cpu(*lo);
4296a0678a7SArnd Bergmann }
/*
 * Convenience wrappers: @tstamp names a superblock field, and the
 * matching high byte is the field of the same name with an "_hi" suffix.
 * ext4_update_tstamp() stores the current wall-clock time in seconds.
 */
#define ext4_update_tstamp(es, tstamp)					\
	__ext4_update_tstamp(&(es)->tstamp, &(es)->tstamp ## _hi,	\
			     ktime_get_real_seconds())
#define ext4_get_tstamp(es, tstamp)					\
	__ext4_get_tstamp(&(es)->tstamp, &(es)->tstamp ## _hi)
435d3d1faf6SCurt Wohlgemuth 
436bdfe0cbdSTheodore Ts'o /*
437bdfe0cbdSTheodore Ts'o  * The del_gendisk() function uninitializes the disk-specific data
438bdfe0cbdSTheodore Ts'o  * structures, including the bdi structure, without telling anyone
439bdfe0cbdSTheodore Ts'o  * else.  Once this happens, any attempt to call mark_buffer_dirty()
440bdfe0cbdSTheodore Ts'o  * (for example, by ext4_commit_super), will cause a kernel OOPS.
441bdfe0cbdSTheodore Ts'o  * This is a kludge to prevent these oops until we can put in a proper
442bdfe0cbdSTheodore Ts'o  * hook in del_gendisk() to inform the VFS and file system layers.
443bdfe0cbdSTheodore Ts'o  */
444bdfe0cbdSTheodore Ts'o static int block_device_ejected(struct super_block *sb)
445bdfe0cbdSTheodore Ts'o {
446bdfe0cbdSTheodore Ts'o 	struct inode *bd_inode = sb->s_bdev->bd_inode;
447bdfe0cbdSTheodore Ts'o 	struct backing_dev_info *bdi = inode_to_bdi(bd_inode);
448bdfe0cbdSTheodore Ts'o 
449bdfe0cbdSTheodore Ts'o 	return bdi->dev == NULL;
450bdfe0cbdSTheodore Ts'o }
451bdfe0cbdSTheodore Ts'o 
45218aadd47SBobi Jam static void ext4_journal_commit_callback(journal_t *journal, transaction_t *txn)
45318aadd47SBobi Jam {
45418aadd47SBobi Jam 	struct super_block		*sb = journal->j_private;
45518aadd47SBobi Jam 	struct ext4_sb_info		*sbi = EXT4_SB(sb);
45618aadd47SBobi Jam 	int				error = is_journal_aborted(journal);
4575d3ee208SDmitry Monakhov 	struct ext4_journal_cb_entry	*jce;
45818aadd47SBobi Jam 
4595d3ee208SDmitry Monakhov 	BUG_ON(txn->t_state == T_FINISHED);
460a0154344SDaeho Jeong 
461a0154344SDaeho Jeong 	ext4_process_freed_data(sb, txn->t_tid);
462a0154344SDaeho Jeong 
46318aadd47SBobi Jam 	spin_lock(&sbi->s_md_lock);
4645d3ee208SDmitry Monakhov 	while (!list_empty(&txn->t_private_list)) {
4655d3ee208SDmitry Monakhov 		jce = list_entry(txn->t_private_list.next,
4665d3ee208SDmitry Monakhov 				 struct ext4_journal_cb_entry, jce_list);
46718aadd47SBobi Jam 		list_del_init(&jce->jce_list);
46818aadd47SBobi Jam 		spin_unlock(&sbi->s_md_lock);
46918aadd47SBobi Jam 		jce->jce_func(sb, jce, error);
47018aadd47SBobi Jam 		spin_lock(&sbi->s_md_lock);
47118aadd47SBobi Jam 	}
47218aadd47SBobi Jam 	spin_unlock(&sbi->s_md_lock);
47318aadd47SBobi Jam }
4741c13d5c0STheodore Ts'o 
475afb585a9SMauricio Faria de Oliveira /*
476afb585a9SMauricio Faria de Oliveira  * This writepage callback for write_cache_pages()
477afb585a9SMauricio Faria de Oliveira  * takes care of a few cases after page cleaning.
478afb585a9SMauricio Faria de Oliveira  *
479afb585a9SMauricio Faria de Oliveira  * write_cache_pages() already checks for dirty pages
480afb585a9SMauricio Faria de Oliveira  * and calls clear_page_dirty_for_io(), which we want,
481afb585a9SMauricio Faria de Oliveira  * to write protect the pages.
482afb585a9SMauricio Faria de Oliveira  *
483afb585a9SMauricio Faria de Oliveira  * However, we may have to redirty a page (see below.)
484afb585a9SMauricio Faria de Oliveira  */
485d585bdbeSMatthew Wilcox (Oracle) static int ext4_journalled_writepage_callback(struct folio *folio,
486afb585a9SMauricio Faria de Oliveira 					      struct writeback_control *wbc,
487afb585a9SMauricio Faria de Oliveira 					      void *data)
488afb585a9SMauricio Faria de Oliveira {
489afb585a9SMauricio Faria de Oliveira 	transaction_t *transaction = (transaction_t *) data;
490afb585a9SMauricio Faria de Oliveira 	struct buffer_head *bh, *head;
491afb585a9SMauricio Faria de Oliveira 	struct journal_head *jh;
492afb585a9SMauricio Faria de Oliveira 
493d585bdbeSMatthew Wilcox (Oracle) 	bh = head = folio_buffers(folio);
494afb585a9SMauricio Faria de Oliveira 	do {
495afb585a9SMauricio Faria de Oliveira 		/*
496afb585a9SMauricio Faria de Oliveira 		 * We have to redirty a page in these cases:
497afb585a9SMauricio Faria de Oliveira 		 * 1) If buffer is dirty, it means the page was dirty because it
498afb585a9SMauricio Faria de Oliveira 		 * contains a buffer that needs checkpointing. So the dirty bit
499afb585a9SMauricio Faria de Oliveira 		 * needs to be preserved so that checkpointing writes the buffer
500afb585a9SMauricio Faria de Oliveira 		 * properly.
501afb585a9SMauricio Faria de Oliveira 		 * 2) If buffer is not part of the committing transaction
502afb585a9SMauricio Faria de Oliveira 		 * (we may have just accidentally come across this buffer because
503afb585a9SMauricio Faria de Oliveira 		 * inode range tracking is not exact) or if the currently running
504afb585a9SMauricio Faria de Oliveira 		 * transaction already contains this buffer as well, dirty bit
505afb585a9SMauricio Faria de Oliveira 		 * needs to be preserved so that the buffer gets writeprotected
506afb585a9SMauricio Faria de Oliveira 		 * properly on running transaction's commit.
507afb585a9SMauricio Faria de Oliveira 		 */
508afb585a9SMauricio Faria de Oliveira 		jh = bh2jh(bh);
509afb585a9SMauricio Faria de Oliveira 		if (buffer_dirty(bh) ||
510afb585a9SMauricio Faria de Oliveira 		    (jh && (jh->b_transaction != transaction ||
511afb585a9SMauricio Faria de Oliveira 			    jh->b_next_transaction))) {
512d585bdbeSMatthew Wilcox (Oracle) 			folio_redirty_for_writepage(wbc, folio);
513afb585a9SMauricio Faria de Oliveira 			goto out;
514afb585a9SMauricio Faria de Oliveira 		}
515afb585a9SMauricio Faria de Oliveira 	} while ((bh = bh->b_this_page) != head);
516afb585a9SMauricio Faria de Oliveira 
517afb585a9SMauricio Faria de Oliveira out:
518afb585a9SMauricio Faria de Oliveira 	return AOP_WRITEPAGE_ACTIVATE;
519afb585a9SMauricio Faria de Oliveira }
520afb585a9SMauricio Faria de Oliveira 
521afb585a9SMauricio Faria de Oliveira static int ext4_journalled_submit_inode_data_buffers(struct jbd2_inode *jinode)
522afb585a9SMauricio Faria de Oliveira {
523afb585a9SMauricio Faria de Oliveira 	struct address_space *mapping = jinode->i_vfs_inode->i_mapping;
524afb585a9SMauricio Faria de Oliveira 	struct writeback_control wbc = {
525afb585a9SMauricio Faria de Oliveira 		.sync_mode =  WB_SYNC_ALL,
526afb585a9SMauricio Faria de Oliveira 		.nr_to_write = LONG_MAX,
527afb585a9SMauricio Faria de Oliveira 		.range_start = jinode->i_dirty_start,
528afb585a9SMauricio Faria de Oliveira 		.range_end = jinode->i_dirty_end,
529afb585a9SMauricio Faria de Oliveira         };
530afb585a9SMauricio Faria de Oliveira 
531afb585a9SMauricio Faria de Oliveira 	return write_cache_pages(mapping, &wbc,
532afb585a9SMauricio Faria de Oliveira 				 ext4_journalled_writepage_callback,
533afb585a9SMauricio Faria de Oliveira 				 jinode->i_transaction);
534afb585a9SMauricio Faria de Oliveira }
535afb585a9SMauricio Faria de Oliveira 
536afb585a9SMauricio Faria de Oliveira static int ext4_journal_submit_inode_data_buffers(struct jbd2_inode *jinode)
537afb585a9SMauricio Faria de Oliveira {
538afb585a9SMauricio Faria de Oliveira 	int ret;
539afb585a9SMauricio Faria de Oliveira 
540afb585a9SMauricio Faria de Oliveira 	if (ext4_should_journal_data(jinode->i_vfs_inode))
541afb585a9SMauricio Faria de Oliveira 		ret = ext4_journalled_submit_inode_data_buffers(jinode);
542afb585a9SMauricio Faria de Oliveira 	else
54359205c8dSJan Kara 		ret = ext4_normal_submit_inode_data_buffers(jinode);
544afb585a9SMauricio Faria de Oliveira 	return ret;
545afb585a9SMauricio Faria de Oliveira }
546afb585a9SMauricio Faria de Oliveira 
547afb585a9SMauricio Faria de Oliveira static int ext4_journal_finish_inode_data_buffers(struct jbd2_inode *jinode)
548afb585a9SMauricio Faria de Oliveira {
549afb585a9SMauricio Faria de Oliveira 	int ret = 0;
550afb585a9SMauricio Faria de Oliveira 
551afb585a9SMauricio Faria de Oliveira 	if (!ext4_should_journal_data(jinode->i_vfs_inode))
552afb585a9SMauricio Faria de Oliveira 		ret = jbd2_journal_finish_inode_data_buffers(jinode);
553afb585a9SMauricio Faria de Oliveira 
554afb585a9SMauricio Faria de Oliveira 	return ret;
555afb585a9SMauricio Faria de Oliveira }
556afb585a9SMauricio Faria de Oliveira 
5571dc1097fSJan Kara static bool system_going_down(void)
5581dc1097fSJan Kara {
5591dc1097fSJan Kara 	return system_state == SYSTEM_HALT || system_state == SYSTEM_POWER_OFF
5601dc1097fSJan Kara 		|| system_state == SYSTEM_RESTART;
5611dc1097fSJan Kara }
5621dc1097fSJan Kara 
56302a7780eSJan Kara struct ext4_err_translation {
56402a7780eSJan Kara 	int code;
56502a7780eSJan Kara 	int errno;
56602a7780eSJan Kara };
56702a7780eSJan Kara 
56802a7780eSJan Kara #define EXT4_ERR_TRANSLATE(err) { .code = EXT4_ERR_##err, .errno = err }
56902a7780eSJan Kara 
57002a7780eSJan Kara static struct ext4_err_translation err_translation[] = {
57102a7780eSJan Kara 	EXT4_ERR_TRANSLATE(EIO),
57202a7780eSJan Kara 	EXT4_ERR_TRANSLATE(ENOMEM),
57302a7780eSJan Kara 	EXT4_ERR_TRANSLATE(EFSBADCRC),
57402a7780eSJan Kara 	EXT4_ERR_TRANSLATE(EFSCORRUPTED),
57502a7780eSJan Kara 	EXT4_ERR_TRANSLATE(ENOSPC),
57602a7780eSJan Kara 	EXT4_ERR_TRANSLATE(ENOKEY),
57702a7780eSJan Kara 	EXT4_ERR_TRANSLATE(EROFS),
57802a7780eSJan Kara 	EXT4_ERR_TRANSLATE(EFBIG),
57902a7780eSJan Kara 	EXT4_ERR_TRANSLATE(EEXIST),
58002a7780eSJan Kara 	EXT4_ERR_TRANSLATE(ERANGE),
58102a7780eSJan Kara 	EXT4_ERR_TRANSLATE(EOVERFLOW),
58202a7780eSJan Kara 	EXT4_ERR_TRANSLATE(EBUSY),
58302a7780eSJan Kara 	EXT4_ERR_TRANSLATE(ENOTDIR),
58402a7780eSJan Kara 	EXT4_ERR_TRANSLATE(ENOTEMPTY),
58502a7780eSJan Kara 	EXT4_ERR_TRANSLATE(ESHUTDOWN),
58602a7780eSJan Kara 	EXT4_ERR_TRANSLATE(EFAULT),
58702a7780eSJan Kara };
58802a7780eSJan Kara 
58902a7780eSJan Kara static int ext4_errno_to_code(int errno)
59002a7780eSJan Kara {
59102a7780eSJan Kara 	int i;
59202a7780eSJan Kara 
59302a7780eSJan Kara 	for (i = 0; i < ARRAY_SIZE(err_translation); i++)
59402a7780eSJan Kara 		if (err_translation[i].errno == errno)
59502a7780eSJan Kara 			return err_translation[i].code;
59602a7780eSJan Kara 	return EXT4_ERR_UNKNOWN;
59702a7780eSJan Kara }
59802a7780eSJan Kara 
5992d01ddc8SJan Kara static void save_error_info(struct super_block *sb, int error,
60040676623SJan Kara 			    __u32 ino, __u64 block,
60140676623SJan Kara 			    const char *func, unsigned int line)
60240676623SJan Kara {
603c92dc856SJan Kara 	struct ext4_sb_info *sbi = EXT4_SB(sb);
60440676623SJan Kara 
60502a7780eSJan Kara 	/* We default to EFSCORRUPTED error... */
60602a7780eSJan Kara 	if (error == 0)
60702a7780eSJan Kara 		error = EFSCORRUPTED;
608c92dc856SJan Kara 
609c92dc856SJan Kara 	spin_lock(&sbi->s_error_lock);
610c92dc856SJan Kara 	sbi->s_add_error_count++;
611c92dc856SJan Kara 	sbi->s_last_error_code = error;
612c92dc856SJan Kara 	sbi->s_last_error_line = line;
613c92dc856SJan Kara 	sbi->s_last_error_ino = ino;
614c92dc856SJan Kara 	sbi->s_last_error_block = block;
615c92dc856SJan Kara 	sbi->s_last_error_func = func;
616c92dc856SJan Kara 	sbi->s_last_error_time = ktime_get_real_seconds();
617c92dc856SJan Kara 	if (!sbi->s_first_error_time) {
618c92dc856SJan Kara 		sbi->s_first_error_code = error;
619c92dc856SJan Kara 		sbi->s_first_error_line = line;
620c92dc856SJan Kara 		sbi->s_first_error_ino = ino;
621c92dc856SJan Kara 		sbi->s_first_error_block = block;
622c92dc856SJan Kara 		sbi->s_first_error_func = func;
623c92dc856SJan Kara 		sbi->s_first_error_time = sbi->s_last_error_time;
62440676623SJan Kara 	}
625c92dc856SJan Kara 	spin_unlock(&sbi->s_error_lock);
62640676623SJan Kara }
62740676623SJan Kara 
628ac27a0ecSDave Kleikamp /* Deal with the reporting of failure conditions on a filesystem such as
629ac27a0ecSDave Kleikamp  * inconsistencies detected or read IO failures.
630ac27a0ecSDave Kleikamp  *
631ac27a0ecSDave Kleikamp  * On ext2, we can store the error state of the filesystem in the
632617ba13bSMingming Cao  * superblock.  That is not possible on ext4, because we may have other
633ac27a0ecSDave Kleikamp  * write ordering constraints on the superblock which prevent us from
634ac27a0ecSDave Kleikamp  * writing it out straight away; and given that the journal is about to
635ac27a0ecSDave Kleikamp  * be aborted, we can't rely on the current, or future, transactions to
636ac27a0ecSDave Kleikamp  * write out the superblock safely.
637ac27a0ecSDave Kleikamp  *
638dab291afSMingming Cao  * We'll just use the jbd2_journal_abort() error code to record an error in
639d6b198bcSThadeu Lima de Souza Cascardo  * the journal instead.  On recovery, the journal will complain about
640ac27a0ecSDave Kleikamp  * that error until we've noted it down and cleared it.
641014c9caaSJan Kara  *
642014c9caaSJan Kara  * If force_ro is set, we unconditionally force the filesystem into an
643014c9caaSJan Kara  * ABORT|READONLY state, unless the error response on the fs has been set to
644014c9caaSJan Kara  * panic in which case we take the easy way out and panic immediately. This is
645014c9caaSJan Kara  * used to deal with unrecoverable failures such as journal IO errors or ENOMEM
646014c9caaSJan Kara  * at a critical moment in log management.
647ac27a0ecSDave Kleikamp  */
648e789ca0cSJan Kara static void ext4_handle_error(struct super_block *sb, bool force_ro, int error,
649e789ca0cSJan Kara 			      __u32 ino, __u64 block,
650e789ca0cSJan Kara 			      const char *func, unsigned int line)
651ac27a0ecSDave Kleikamp {
652b08070ecSJan Kara 	journal_t *journal = EXT4_SB(sb)->s_journal;
6532d01ddc8SJan Kara 	bool continue_fs = !force_ro && test_opt(sb, ERRORS_CONT);
654b08070ecSJan Kara 
655e789ca0cSJan Kara 	EXT4_SB(sb)->s_mount_state |= EXT4_ERROR_FS;
656327eaf73STheodore Ts'o 	if (test_opt(sb, WARN_ON_ERROR))
657327eaf73STheodore Ts'o 		WARN_ON_ONCE(1);
658327eaf73STheodore Ts'o 
6592d01ddc8SJan Kara 	if (!continue_fs && !sb_rdonly(sb)) {
6609b5f6c9bSHarshad Shirwadkar 		ext4_set_mount_flag(sb, EXT4_MF_FS_ABORTED);
661ac27a0ecSDave Kleikamp 		if (journal)
662dab291afSMingming Cao 			jbd2_journal_abort(journal, -EIO);
6632d01ddc8SJan Kara 	}
6642d01ddc8SJan Kara 
6652d01ddc8SJan Kara 	if (!bdev_read_only(sb->s_bdev)) {
6662d01ddc8SJan Kara 		save_error_info(sb, error, ino, block, func, line);
6672d01ddc8SJan Kara 		/*
6682d01ddc8SJan Kara 		 * In case the fs should keep running, we need to writeout
6692d01ddc8SJan Kara 		 * superblock through the journal. Due to lock ordering
6702d01ddc8SJan Kara 		 * constraints, it may not be safe to do it right here so we
6712d01ddc8SJan Kara 		 * defer superblock flushing to a workqueue.
6722d01ddc8SJan Kara 		 */
673bb9464e0Syangerkun 		if (continue_fs && journal)
6742d01ddc8SJan Kara 			schedule_work(&EXT4_SB(sb)->s_error_work);
6752d01ddc8SJan Kara 		else
6762d01ddc8SJan Kara 			ext4_commit_super(sb);
6772d01ddc8SJan Kara 	}
6782d01ddc8SJan Kara 
6791dc1097fSJan Kara 	/*
6801dc1097fSJan Kara 	 * We force ERRORS_RO behavior when system is rebooting. Otherwise we
6811dc1097fSJan Kara 	 * could panic during 'reboot -f' as the underlying device got already
6821dc1097fSJan Kara 	 * disabled.
6831dc1097fSJan Kara 	 */
684014c9caaSJan Kara 	if (test_opt(sb, ERRORS_PANIC) && !system_going_down()) {
685617ba13bSMingming Cao 		panic("EXT4-fs (device %s): panic forced after error\n",
686ac27a0ecSDave Kleikamp 			sb->s_id);
687ac27a0ecSDave Kleikamp 	}
688ac2f7ca5SYe Bin 
689ac2f7ca5SYe Bin 	if (sb_rdonly(sb) || continue_fs)
690ac2f7ca5SYe Bin 		return;
691ac2f7ca5SYe Bin 
692014c9caaSJan Kara 	ext4_msg(sb, KERN_CRIT, "Remounting filesystem read-only");
693014c9caaSJan Kara 	/*
694014c9caaSJan Kara 	 * Make sure updated value of ->s_mount_flags will be visible before
695014c9caaSJan Kara 	 * ->s_flags update
696014c9caaSJan Kara 	 */
697014c9caaSJan Kara 	smp_wmb();
698014c9caaSJan Kara 	sb->s_flags |= SB_RDONLY;
6994327ba52SDaeho Jeong }
700ac27a0ecSDave Kleikamp 
701c92dc856SJan Kara static void flush_stashed_error_work(struct work_struct *work)
702c92dc856SJan Kara {
703c92dc856SJan Kara 	struct ext4_sb_info *sbi = container_of(work, struct ext4_sb_info,
704c92dc856SJan Kara 						s_error_work);
7052d01ddc8SJan Kara 	journal_t *journal = sbi->s_journal;
7062d01ddc8SJan Kara 	handle_t *handle;
707c92dc856SJan Kara 
7082d01ddc8SJan Kara 	/*
7092d01ddc8SJan Kara 	 * If the journal is still running, we have to write out superblock
7102d01ddc8SJan Kara 	 * through the journal to avoid collisions of other journalled sb
7112d01ddc8SJan Kara 	 * updates.
7122d01ddc8SJan Kara 	 *
7132d01ddc8SJan Kara 	 * We use directly jbd2 functions here to avoid recursing back into
7142d01ddc8SJan Kara 	 * ext4 error handling code during handling of previous errors.
7152d01ddc8SJan Kara 	 */
7162d01ddc8SJan Kara 	if (!sb_rdonly(sbi->s_sb) && journal) {
717558d6450SYe Bin 		struct buffer_head *sbh = sbi->s_sbh;
7182d01ddc8SJan Kara 		handle = jbd2_journal_start(journal, 1);
7192d01ddc8SJan Kara 		if (IS_ERR(handle))
7202d01ddc8SJan Kara 			goto write_directly;
721558d6450SYe Bin 		if (jbd2_journal_get_write_access(handle, sbh)) {
7222d01ddc8SJan Kara 			jbd2_journal_stop(handle);
7232d01ddc8SJan Kara 			goto write_directly;
7242d01ddc8SJan Kara 		}
7252d01ddc8SJan Kara 		ext4_update_super(sbi->s_sb);
726558d6450SYe Bin 		if (buffer_write_io_error(sbh) || !buffer_uptodate(sbh)) {
727558d6450SYe Bin 			ext4_msg(sbi->s_sb, KERN_ERR, "previous I/O error to "
728558d6450SYe Bin 				 "superblock detected");
729558d6450SYe Bin 			clear_buffer_write_io_error(sbh);
730558d6450SYe Bin 			set_buffer_uptodate(sbh);
731558d6450SYe Bin 		}
732558d6450SYe Bin 
733558d6450SYe Bin 		if (jbd2_journal_dirty_metadata(handle, sbh)) {
7342d01ddc8SJan Kara 			jbd2_journal_stop(handle);
7352d01ddc8SJan Kara 			goto write_directly;
7362d01ddc8SJan Kara 		}
7372d01ddc8SJan Kara 		jbd2_journal_stop(handle);
738d578b994SJonathan Davies 		ext4_notify_error_sysfs(sbi);
7392d01ddc8SJan Kara 		return;
7402d01ddc8SJan Kara 	}
7412d01ddc8SJan Kara write_directly:
7422d01ddc8SJan Kara 	/*
7432d01ddc8SJan Kara 	 * Write through journal failed. Write sb directly to get error info
7442d01ddc8SJan Kara 	 * out and hope for the best.
7452d01ddc8SJan Kara 	 */
7464392fbc4SJan Kara 	ext4_commit_super(sbi->s_sb);
747d578b994SJonathan Davies 	ext4_notify_error_sysfs(sbi);
748ac27a0ecSDave Kleikamp }
749ac27a0ecSDave Kleikamp 
/*
 * Rate-limit gate for error reports: evaluates ___ratelimit() against the
 * superblock's s_err_ratelimit_state, tagged "EXT4-fs error".
 */
#define ext4_error_ratelimit(sb)					\
	___ratelimit(&EXT4_SB(sb)->s_err_ratelimit_state, "EXT4-fs error")
753efbed4dcSTheodore Ts'o 
75412062dddSEric Sandeen void __ext4_error(struct super_block *sb, const char *function,
755014c9caaSJan Kara 		  unsigned int line, bool force_ro, int error, __u64 block,
75654d3adbcSTheodore Ts'o 		  const char *fmt, ...)
757ac27a0ecSDave Kleikamp {
7580ff2ea7dSJoe Perches 	struct va_format vaf;
759ac27a0ecSDave Kleikamp 	va_list args;
760ac27a0ecSDave Kleikamp 
7610db1ff22STheodore Ts'o 	if (unlikely(ext4_forced_shutdown(EXT4_SB(sb))))
7620db1ff22STheodore Ts'o 		return;
7630db1ff22STheodore Ts'o 
764ccf0f32aSTheodore Ts'o 	trace_ext4_error(sb, function, line);
765efbed4dcSTheodore Ts'o 	if (ext4_error_ratelimit(sb)) {
766ac27a0ecSDave Kleikamp 		va_start(args, fmt);
7670ff2ea7dSJoe Perches 		vaf.fmt = fmt;
7680ff2ea7dSJoe Perches 		vaf.va = &args;
769efbed4dcSTheodore Ts'o 		printk(KERN_CRIT
770efbed4dcSTheodore Ts'o 		       "EXT4-fs error (device %s): %s:%d: comm %s: %pV\n",
7710ff2ea7dSJoe Perches 		       sb->s_id, function, line, current->comm, &vaf);
772ac27a0ecSDave Kleikamp 		va_end(args);
773efbed4dcSTheodore Ts'o 	}
7749a089b21SGabriel Krisman Bertazi 	fsnotify_sb_error(sb, NULL, error ? error : EFSCORRUPTED);
7759a089b21SGabriel Krisman Bertazi 
776e789ca0cSJan Kara 	ext4_handle_error(sb, force_ro, error, 0, block, function, line);
777ac27a0ecSDave Kleikamp }
778ac27a0ecSDave Kleikamp 
779e7c96e8eSJoe Perches void __ext4_error_inode(struct inode *inode, const char *function,
78054d3adbcSTheodore Ts'o 			unsigned int line, ext4_fsblk_t block, int error,
781273df556SFrank Mayhar 			const char *fmt, ...)
782273df556SFrank Mayhar {
783273df556SFrank Mayhar 	va_list args;
784f7c21177STheodore Ts'o 	struct va_format vaf;
785273df556SFrank Mayhar 
7860db1ff22STheodore Ts'o 	if (unlikely(ext4_forced_shutdown(EXT4_SB(inode->i_sb))))
7870db1ff22STheodore Ts'o 		return;
7880db1ff22STheodore Ts'o 
789ccf0f32aSTheodore Ts'o 	trace_ext4_error(inode->i_sb, function, line);
790efbed4dcSTheodore Ts'o 	if (ext4_error_ratelimit(inode->i_sb)) {
791273df556SFrank Mayhar 		va_start(args, fmt);
792f7c21177STheodore Ts'o 		vaf.fmt = fmt;
793f7c21177STheodore Ts'o 		vaf.va = &args;
794c398eda0STheodore Ts'o 		if (block)
795d9ee81daSJoe Perches 			printk(KERN_CRIT "EXT4-fs error (device %s): %s:%d: "
796d9ee81daSJoe Perches 			       "inode #%lu: block %llu: comm %s: %pV\n",
797d9ee81daSJoe Perches 			       inode->i_sb->s_id, function, line, inode->i_ino,
798d9ee81daSJoe Perches 			       block, current->comm, &vaf);
799d9ee81daSJoe Perches 		else
800d9ee81daSJoe Perches 			printk(KERN_CRIT "EXT4-fs error (device %s): %s:%d: "
801d9ee81daSJoe Perches 			       "inode #%lu: comm %s: %pV\n",
802d9ee81daSJoe Perches 			       inode->i_sb->s_id, function, line, inode->i_ino,
803d9ee81daSJoe Perches 			       current->comm, &vaf);
804273df556SFrank Mayhar 		va_end(args);
805efbed4dcSTheodore Ts'o 	}
8069a089b21SGabriel Krisman Bertazi 	fsnotify_sb_error(inode->i_sb, inode, error ? error : EFSCORRUPTED);
8079a089b21SGabriel Krisman Bertazi 
808e789ca0cSJan Kara 	ext4_handle_error(inode->i_sb, false, error, inode->i_ino, block,
80954d3adbcSTheodore Ts'o 			  function, line);
810273df556SFrank Mayhar }
811273df556SFrank Mayhar 
812e7c96e8eSJoe Perches void __ext4_error_file(struct file *file, const char *function,
813f7c21177STheodore Ts'o 		       unsigned int line, ext4_fsblk_t block,
814f7c21177STheodore Ts'o 		       const char *fmt, ...)
815273df556SFrank Mayhar {
816273df556SFrank Mayhar 	va_list args;
817f7c21177STheodore Ts'o 	struct va_format vaf;
818496ad9aaSAl Viro 	struct inode *inode = file_inode(file);
819273df556SFrank Mayhar 	char pathname[80], *path;
820273df556SFrank Mayhar 
8210db1ff22STheodore Ts'o 	if (unlikely(ext4_forced_shutdown(EXT4_SB(inode->i_sb))))
8220db1ff22STheodore Ts'o 		return;
8230db1ff22STheodore Ts'o 
824ccf0f32aSTheodore Ts'o 	trace_ext4_error(inode->i_sb, function, line);
825efbed4dcSTheodore Ts'o 	if (ext4_error_ratelimit(inode->i_sb)) {
8269bf39ab2SMiklos Szeredi 		path = file_path(file, pathname, sizeof(pathname));
827f9a62d09SDan Carpenter 		if (IS_ERR(path))
828273df556SFrank Mayhar 			path = "(unknown)";
829f7c21177STheodore Ts'o 		va_start(args, fmt);
830f7c21177STheodore Ts'o 		vaf.fmt = fmt;
831f7c21177STheodore Ts'o 		vaf.va = &args;
832d9ee81daSJoe Perches 		if (block)
833d9ee81daSJoe Perches 			printk(KERN_CRIT
834d9ee81daSJoe Perches 			       "EXT4-fs error (device %s): %s:%d: inode #%lu: "
835d9ee81daSJoe Perches 			       "block %llu: comm %s: path %s: %pV\n",
836d9ee81daSJoe Perches 			       inode->i_sb->s_id, function, line, inode->i_ino,
837d9ee81daSJoe Perches 			       block, current->comm, path, &vaf);
838d9ee81daSJoe Perches 		else
839d9ee81daSJoe Perches 			printk(KERN_CRIT
840d9ee81daSJoe Perches 			       "EXT4-fs error (device %s): %s:%d: inode #%lu: "
841d9ee81daSJoe Perches 			       "comm %s: path %s: %pV\n",
842d9ee81daSJoe Perches 			       inode->i_sb->s_id, function, line, inode->i_ino,
843d9ee81daSJoe Perches 			       current->comm, path, &vaf);
844273df556SFrank Mayhar 		va_end(args);
845efbed4dcSTheodore Ts'o 	}
8469a089b21SGabriel Krisman Bertazi 	fsnotify_sb_error(inode->i_sb, inode, EFSCORRUPTED);
8479a089b21SGabriel Krisman Bertazi 
848e789ca0cSJan Kara 	ext4_handle_error(inode->i_sb, false, EFSCORRUPTED, inode->i_ino, block,
84954d3adbcSTheodore Ts'o 			  function, line);
850273df556SFrank Mayhar }
851273df556SFrank Mayhar 
852722887ddSTheodore Ts'o const char *ext4_decode_error(struct super_block *sb, int errno,
853ac27a0ecSDave Kleikamp 			      char nbuf[16])
854ac27a0ecSDave Kleikamp {
855ac27a0ecSDave Kleikamp 	char *errstr = NULL;
856ac27a0ecSDave Kleikamp 
857ac27a0ecSDave Kleikamp 	switch (errno) {
8586a797d27SDarrick J. Wong 	case -EFSCORRUPTED:
8596a797d27SDarrick J. Wong 		errstr = "Corrupt filesystem";
8606a797d27SDarrick J. Wong 		break;
8616a797d27SDarrick J. Wong 	case -EFSBADCRC:
8626a797d27SDarrick J. Wong 		errstr = "Filesystem failed CRC";
8636a797d27SDarrick J. Wong 		break;
864ac27a0ecSDave Kleikamp 	case -EIO:
865ac27a0ecSDave Kleikamp 		errstr = "IO failure";
866ac27a0ecSDave Kleikamp 		break;
867ac27a0ecSDave Kleikamp 	case -ENOMEM:
868ac27a0ecSDave Kleikamp 		errstr = "Out of memory";
869ac27a0ecSDave Kleikamp 		break;
870ac27a0ecSDave Kleikamp 	case -EROFS:
87178f1ddbbSTheodore Ts'o 		if (!sb || (EXT4_SB(sb)->s_journal &&
87278f1ddbbSTheodore Ts'o 			    EXT4_SB(sb)->s_journal->j_flags & JBD2_ABORT))
873ac27a0ecSDave Kleikamp 			errstr = "Journal has aborted";
874ac27a0ecSDave Kleikamp 		else
875ac27a0ecSDave Kleikamp 			errstr = "Readonly filesystem";
876ac27a0ecSDave Kleikamp 		break;
877ac27a0ecSDave Kleikamp 	default:
878ac27a0ecSDave Kleikamp 		/* If the caller passed in an extra buffer for unknown
879ac27a0ecSDave Kleikamp 		 * errors, textualise them now.  Else we just return
880ac27a0ecSDave Kleikamp 		 * NULL. */
881ac27a0ecSDave Kleikamp 		if (nbuf) {
882ac27a0ecSDave Kleikamp 			/* Check for truncated error codes... */
883ac27a0ecSDave Kleikamp 			if (snprintf(nbuf, 16, "error %d", -errno) >= 0)
884ac27a0ecSDave Kleikamp 				errstr = nbuf;
885ac27a0ecSDave Kleikamp 		}
886ac27a0ecSDave Kleikamp 		break;
887ac27a0ecSDave Kleikamp 	}
888ac27a0ecSDave Kleikamp 
889ac27a0ecSDave Kleikamp 	return errstr;
890ac27a0ecSDave Kleikamp }
891ac27a0ecSDave Kleikamp 
892617ba13bSMingming Cao /* __ext4_std_error decodes expected errors from journaling functions
893ac27a0ecSDave Kleikamp  * automatically and invokes the appropriate error response.  */
894ac27a0ecSDave Kleikamp 
895c398eda0STheodore Ts'o void __ext4_std_error(struct super_block *sb, const char *function,
896c398eda0STheodore Ts'o 		      unsigned int line, int errno)
897ac27a0ecSDave Kleikamp {
898ac27a0ecSDave Kleikamp 	char nbuf[16];
899ac27a0ecSDave Kleikamp 	const char *errstr;
900ac27a0ecSDave Kleikamp 
9010db1ff22STheodore Ts'o 	if (unlikely(ext4_forced_shutdown(EXT4_SB(sb))))
9020db1ff22STheodore Ts'o 		return;
9030db1ff22STheodore Ts'o 
904ac27a0ecSDave Kleikamp 	/* Special case: if the error is EROFS, and we're not already
905ac27a0ecSDave Kleikamp 	 * inside a transaction, then there's really no point in logging
906ac27a0ecSDave Kleikamp 	 * an error. */
907bc98a42cSDavid Howells 	if (errno == -EROFS && journal_current_handle() == NULL && sb_rdonly(sb))
908ac27a0ecSDave Kleikamp 		return;
909ac27a0ecSDave Kleikamp 
910efbed4dcSTheodore Ts'o 	if (ext4_error_ratelimit(sb)) {
911617ba13bSMingming Cao 		errstr = ext4_decode_error(sb, errno, nbuf);
912c398eda0STheodore Ts'o 		printk(KERN_CRIT "EXT4-fs error (device %s) in %s:%d: %s\n",
913c398eda0STheodore Ts'o 		       sb->s_id, function, line, errstr);
914efbed4dcSTheodore Ts'o 	}
9159a089b21SGabriel Krisman Bertazi 	fsnotify_sb_error(sb, NULL, errno ? errno : EFSCORRUPTED);
916ac27a0ecSDave Kleikamp 
917e789ca0cSJan Kara 	ext4_handle_error(sb, false, -errno, 0, 0, function, line);
918ac27a0ecSDave Kleikamp }
919ac27a0ecSDave Kleikamp 
920e7c96e8eSJoe Perches void __ext4_msg(struct super_block *sb,
921e7c96e8eSJoe Perches 		const char *prefix, const char *fmt, ...)
922b31e1552SEric Sandeen {
9230ff2ea7dSJoe Perches 	struct va_format vaf;
924b31e1552SEric Sandeen 	va_list args;
925b31e1552SEric Sandeen 
926da812f61SLukas Czerner 	if (sb) {
9271cf006edSDmitry Monakhov 		atomic_inc(&EXT4_SB(sb)->s_msg_count);
928da812f61SLukas Czerner 		if (!___ratelimit(&(EXT4_SB(sb)->s_msg_ratelimit_state),
929da812f61SLukas Czerner 				  "EXT4-fs"))
930efbed4dcSTheodore Ts'o 			return;
931da812f61SLukas Czerner 	}
932efbed4dcSTheodore Ts'o 
933b31e1552SEric Sandeen 	va_start(args, fmt);
9340ff2ea7dSJoe Perches 	vaf.fmt = fmt;
9350ff2ea7dSJoe Perches 	vaf.va = &args;
936da812f61SLukas Czerner 	if (sb)
9370ff2ea7dSJoe Perches 		printk("%sEXT4-fs (%s): %pV\n", prefix, sb->s_id, &vaf);
938da812f61SLukas Czerner 	else
939da812f61SLukas Czerner 		printk("%sEXT4-fs: %pV\n", prefix, &vaf);
940b31e1552SEric Sandeen 	va_end(args);
941b31e1552SEric Sandeen }
942b31e1552SEric Sandeen 
9431cf006edSDmitry Monakhov static int ext4_warning_ratelimit(struct super_block *sb)
9441cf006edSDmitry Monakhov {
9451cf006edSDmitry Monakhov 	atomic_inc(&EXT4_SB(sb)->s_warning_count);
9461cf006edSDmitry Monakhov 	return ___ratelimit(&(EXT4_SB(sb)->s_warning_ratelimit_state),
9471cf006edSDmitry Monakhov 			    "EXT4-fs warning");
9481cf006edSDmitry Monakhov }
949b03a2f7eSAndreas Dilger 
95012062dddSEric Sandeen void __ext4_warning(struct super_block *sb, const char *function,
951c398eda0STheodore Ts'o 		    unsigned int line, const char *fmt, ...)
952ac27a0ecSDave Kleikamp {
9530ff2ea7dSJoe Perches 	struct va_format vaf;
954ac27a0ecSDave Kleikamp 	va_list args;
955ac27a0ecSDave Kleikamp 
956b03a2f7eSAndreas Dilger 	if (!ext4_warning_ratelimit(sb))
957efbed4dcSTheodore Ts'o 		return;
958efbed4dcSTheodore Ts'o 
959ac27a0ecSDave Kleikamp 	va_start(args, fmt);
9600ff2ea7dSJoe Perches 	vaf.fmt = fmt;
9610ff2ea7dSJoe Perches 	vaf.va = &args;
9620ff2ea7dSJoe Perches 	printk(KERN_WARNING "EXT4-fs warning (device %s): %s:%d: %pV\n",
9630ff2ea7dSJoe Perches 	       sb->s_id, function, line, &vaf);
964ac27a0ecSDave Kleikamp 	va_end(args);
965ac27a0ecSDave Kleikamp }
966ac27a0ecSDave Kleikamp 
967b03a2f7eSAndreas Dilger void __ext4_warning_inode(const struct inode *inode, const char *function,
968b03a2f7eSAndreas Dilger 			  unsigned int line, const char *fmt, ...)
969b03a2f7eSAndreas Dilger {
970b03a2f7eSAndreas Dilger 	struct va_format vaf;
971b03a2f7eSAndreas Dilger 	va_list args;
972b03a2f7eSAndreas Dilger 
973b03a2f7eSAndreas Dilger 	if (!ext4_warning_ratelimit(inode->i_sb))
974b03a2f7eSAndreas Dilger 		return;
975b03a2f7eSAndreas Dilger 
976b03a2f7eSAndreas Dilger 	va_start(args, fmt);
977b03a2f7eSAndreas Dilger 	vaf.fmt = fmt;
978b03a2f7eSAndreas Dilger 	vaf.va = &args;
979b03a2f7eSAndreas Dilger 	printk(KERN_WARNING "EXT4-fs warning (device %s): %s:%d: "
980b03a2f7eSAndreas Dilger 	       "inode #%lu: comm %s: %pV\n", inode->i_sb->s_id,
981b03a2f7eSAndreas Dilger 	       function, line, inode->i_ino, current->comm, &vaf);
982b03a2f7eSAndreas Dilger 	va_end(args);
983b03a2f7eSAndreas Dilger }
984b03a2f7eSAndreas Dilger 
985e29136f8STheodore Ts'o void __ext4_grp_locked_error(const char *function, unsigned int line,
986e29136f8STheodore Ts'o 			     struct super_block *sb, ext4_group_t grp,
987e29136f8STheodore Ts'o 			     unsigned long ino, ext4_fsblk_t block,
988e29136f8STheodore Ts'o 			     const char *fmt, ...)
9895d1b1b3fSAneesh Kumar K.V __releases(bitlock)
9905d1b1b3fSAneesh Kumar K.V __acquires(bitlock)
9915d1b1b3fSAneesh Kumar K.V {
9920ff2ea7dSJoe Perches 	struct va_format vaf;
9935d1b1b3fSAneesh Kumar K.V 	va_list args;
9945d1b1b3fSAneesh Kumar K.V 
9950db1ff22STheodore Ts'o 	if (unlikely(ext4_forced_shutdown(EXT4_SB(sb))))
9960db1ff22STheodore Ts'o 		return;
9970db1ff22STheodore Ts'o 
998ccf0f32aSTheodore Ts'o 	trace_ext4_error(sb, function, line);
999efbed4dcSTheodore Ts'o 	if (ext4_error_ratelimit(sb)) {
10005d1b1b3fSAneesh Kumar K.V 		va_start(args, fmt);
10010ff2ea7dSJoe Perches 		vaf.fmt = fmt;
10020ff2ea7dSJoe Perches 		vaf.va = &args;
100321149d61SRobin Dong 		printk(KERN_CRIT "EXT4-fs error (device %s): %s:%d: group %u, ",
1004e29136f8STheodore Ts'o 		       sb->s_id, function, line, grp);
1005e29136f8STheodore Ts'o 		if (ino)
10060ff2ea7dSJoe Perches 			printk(KERN_CONT "inode %lu: ", ino);
1007e29136f8STheodore Ts'o 		if (block)
1008efbed4dcSTheodore Ts'o 			printk(KERN_CONT "block %llu:",
1009efbed4dcSTheodore Ts'o 			       (unsigned long long) block);
10100ff2ea7dSJoe Perches 		printk(KERN_CONT "%pV\n", &vaf);
10115d1b1b3fSAneesh Kumar K.V 		va_end(args);
1012efbed4dcSTheodore Ts'o 	}
10135d1b1b3fSAneesh Kumar K.V 
1014c92dc856SJan Kara 	if (test_opt(sb, ERRORS_CONT)) {
1015327eaf73STheodore Ts'o 		if (test_opt(sb, WARN_ON_ERROR))
1016327eaf73STheodore Ts'o 			WARN_ON_ONCE(1);
1017e789ca0cSJan Kara 		EXT4_SB(sb)->s_mount_state |= EXT4_ERROR_FS;
10182d01ddc8SJan Kara 		if (!bdev_read_only(sb->s_bdev)) {
10192d01ddc8SJan Kara 			save_error_info(sb, EFSCORRUPTED, ino, block, function,
10202d01ddc8SJan Kara 					line);
1021c92dc856SJan Kara 			schedule_work(&EXT4_SB(sb)->s_error_work);
10222d01ddc8SJan Kara 		}
10235d1b1b3fSAneesh Kumar K.V 		return;
10245d1b1b3fSAneesh Kumar K.V 	}
10255d1b1b3fSAneesh Kumar K.V 	ext4_unlock_group(sb, grp);
1026e789ca0cSJan Kara 	ext4_handle_error(sb, false, EFSCORRUPTED, ino, block, function, line);
10275d1b1b3fSAneesh Kumar K.V 	/*
10285d1b1b3fSAneesh Kumar K.V 	 * We only get here in the ERRORS_RO case; relocking the group
10295d1b1b3fSAneesh Kumar K.V 	 * may be dangerous, but nothing bad will happen since the
10305d1b1b3fSAneesh Kumar K.V 	 * filesystem will have already been marked read/only and the
10315d1b1b3fSAneesh Kumar K.V 	 * journal has been aborted.  We return 1 as a hint to callers
10325d1b1b3fSAneesh Kumar K.V 	 * who might what to use the return value from
103325985edcSLucas De Marchi 	 * ext4_grp_locked_error() to distinguish between the
10345d1b1b3fSAneesh Kumar K.V 	 * ERRORS_CONT and ERRORS_RO case, and perhaps return more
10355d1b1b3fSAneesh Kumar K.V 	 * aggressively from the ext4 function in question, with a
10365d1b1b3fSAneesh Kumar K.V 	 * more appropriate error code.
10375d1b1b3fSAneesh Kumar K.V 	 */
10385d1b1b3fSAneesh Kumar K.V 	ext4_lock_group(sb, grp);
10395d1b1b3fSAneesh Kumar K.V 	return;
10405d1b1b3fSAneesh Kumar K.V }
10415d1b1b3fSAneesh Kumar K.V 
1042db79e6d1SWang Shilong void ext4_mark_group_bitmap_corrupted(struct super_block *sb,
1043db79e6d1SWang Shilong 				     ext4_group_t group,
1044db79e6d1SWang Shilong 				     unsigned int flags)
1045db79e6d1SWang Shilong {
1046db79e6d1SWang Shilong 	struct ext4_sb_info *sbi = EXT4_SB(sb);
1047db79e6d1SWang Shilong 	struct ext4_group_info *grp = ext4_get_group_info(sb, group);
1048db79e6d1SWang Shilong 	struct ext4_group_desc *gdp = ext4_get_group_desc(sb, group, NULL);
10499af0b3d1SWang Shilong 	int ret;
1050db79e6d1SWang Shilong 
10519af0b3d1SWang Shilong 	if (flags & EXT4_GROUP_INFO_BBITMAP_CORRUPT) {
10529af0b3d1SWang Shilong 		ret = ext4_test_and_set_bit(EXT4_GROUP_INFO_BBITMAP_CORRUPT_BIT,
10539af0b3d1SWang Shilong 					    &grp->bb_state);
10549af0b3d1SWang Shilong 		if (!ret)
1055db79e6d1SWang Shilong 			percpu_counter_sub(&sbi->s_freeclusters_counter,
1056db79e6d1SWang Shilong 					   grp->bb_free);
1057db79e6d1SWang Shilong 	}
1058db79e6d1SWang Shilong 
10599af0b3d1SWang Shilong 	if (flags & EXT4_GROUP_INFO_IBITMAP_CORRUPT) {
10609af0b3d1SWang Shilong 		ret = ext4_test_and_set_bit(EXT4_GROUP_INFO_IBITMAP_CORRUPT_BIT,
10619af0b3d1SWang Shilong 					    &grp->bb_state);
10629af0b3d1SWang Shilong 		if (!ret && gdp) {
1063db79e6d1SWang Shilong 			int count;
1064db79e6d1SWang Shilong 
1065db79e6d1SWang Shilong 			count = ext4_free_inodes_count(sb, gdp);
1066db79e6d1SWang Shilong 			percpu_counter_sub(&sbi->s_freeinodes_counter,
1067db79e6d1SWang Shilong 					   count);
1068db79e6d1SWang Shilong 		}
1069db79e6d1SWang Shilong 	}
1070db79e6d1SWang Shilong }
1071db79e6d1SWang Shilong 
1072617ba13bSMingming Cao void ext4_update_dynamic_rev(struct super_block *sb)
1073ac27a0ecSDave Kleikamp {
1074617ba13bSMingming Cao 	struct ext4_super_block *es = EXT4_SB(sb)->s_es;
1075ac27a0ecSDave Kleikamp 
1076617ba13bSMingming Cao 	if (le32_to_cpu(es->s_rev_level) > EXT4_GOOD_OLD_REV)
1077ac27a0ecSDave Kleikamp 		return;
1078ac27a0ecSDave Kleikamp 
107912062dddSEric Sandeen 	ext4_warning(sb,
1080ac27a0ecSDave Kleikamp 		     "updating to rev %d because of new feature flag, "
1081ac27a0ecSDave Kleikamp 		     "running e2fsck is recommended",
1082617ba13bSMingming Cao 		     EXT4_DYNAMIC_REV);
1083ac27a0ecSDave Kleikamp 
1084617ba13bSMingming Cao 	es->s_first_ino = cpu_to_le32(EXT4_GOOD_OLD_FIRST_INO);
1085617ba13bSMingming Cao 	es->s_inode_size = cpu_to_le16(EXT4_GOOD_OLD_INODE_SIZE);
1086617ba13bSMingming Cao 	es->s_rev_level = cpu_to_le32(EXT4_DYNAMIC_REV);
1087ac27a0ecSDave Kleikamp 	/* leave es->s_feature_*compat flags alone */
1088ac27a0ecSDave Kleikamp 	/* es->s_uuid will be set by e2fsck if empty */
1089ac27a0ecSDave Kleikamp 
1090ac27a0ecSDave Kleikamp 	/*
1091ac27a0ecSDave Kleikamp 	 * The rest of the superblock fields should be zero, and if not it
1092ac27a0ecSDave Kleikamp 	 * means they are likely already in use, so leave them alone.  We
1093ac27a0ecSDave Kleikamp 	 * can leave it up to e2fsck to clean up any inconsistencies there.
1094ac27a0ecSDave Kleikamp 	 */
1095ac27a0ecSDave Kleikamp }
1096ac27a0ecSDave Kleikamp 
1097ac27a0ecSDave Kleikamp /*
1098ac27a0ecSDave Kleikamp  * Open the external journal device
1099ac27a0ecSDave Kleikamp  */
1100b31e1552SEric Sandeen static struct block_device *ext4_blkdev_get(dev_t dev, struct super_block *sb)
1101ac27a0ecSDave Kleikamp {
1102ac27a0ecSDave Kleikamp 	struct block_device *bdev;
1103ac27a0ecSDave Kleikamp 
1104d4d77629STejun Heo 	bdev = blkdev_get_by_dev(dev, FMODE_READ|FMODE_WRITE|FMODE_EXCL, sb);
1105ac27a0ecSDave Kleikamp 	if (IS_ERR(bdev))
1106ac27a0ecSDave Kleikamp 		goto fail;
1107ac27a0ecSDave Kleikamp 	return bdev;
1108ac27a0ecSDave Kleikamp 
1109ac27a0ecSDave Kleikamp fail:
1110ea3edd4dSChristoph Hellwig 	ext4_msg(sb, KERN_ERR,
1111ea3edd4dSChristoph Hellwig 		 "failed to open journal device unknown-block(%u,%u) %ld",
1112ea3edd4dSChristoph Hellwig 		 MAJOR(dev), MINOR(dev), PTR_ERR(bdev));
1113ac27a0ecSDave Kleikamp 	return NULL;
1114ac27a0ecSDave Kleikamp }
1115ac27a0ecSDave Kleikamp 
1116ac27a0ecSDave Kleikamp /*
1117ac27a0ecSDave Kleikamp  * Release the journal device
1118ac27a0ecSDave Kleikamp  */
11194385bab1SAl Viro static void ext4_blkdev_put(struct block_device *bdev)
1120ac27a0ecSDave Kleikamp {
11214385bab1SAl Viro 	blkdev_put(bdev, FMODE_READ|FMODE_WRITE|FMODE_EXCL);
1122ac27a0ecSDave Kleikamp }
1123ac27a0ecSDave Kleikamp 
11244385bab1SAl Viro static void ext4_blkdev_remove(struct ext4_sb_info *sbi)
1125ac27a0ecSDave Kleikamp {
1126ac27a0ecSDave Kleikamp 	struct block_device *bdev;
1127ee7ed3aaSChunguang Xu 	bdev = sbi->s_journal_bdev;
1128ac27a0ecSDave Kleikamp 	if (bdev) {
11294385bab1SAl Viro 		ext4_blkdev_put(bdev);
1130ee7ed3aaSChunguang Xu 		sbi->s_journal_bdev = NULL;
1131ac27a0ecSDave Kleikamp 	}
1132ac27a0ecSDave Kleikamp }
1133ac27a0ecSDave Kleikamp 
1134ac27a0ecSDave Kleikamp static inline struct inode *orphan_list_entry(struct list_head *l)
1135ac27a0ecSDave Kleikamp {
1136617ba13bSMingming Cao 	return &list_entry(l, struct ext4_inode_info, i_orphan)->vfs_inode;
1137ac27a0ecSDave Kleikamp }
1138ac27a0ecSDave Kleikamp 
1139617ba13bSMingming Cao static void dump_orphan_list(struct super_block *sb, struct ext4_sb_info *sbi)
1140ac27a0ecSDave Kleikamp {
1141ac27a0ecSDave Kleikamp 	struct list_head *l;
1142ac27a0ecSDave Kleikamp 
1143b31e1552SEric Sandeen 	ext4_msg(sb, KERN_ERR, "sb orphan head is %d",
1144ac27a0ecSDave Kleikamp 		 le32_to_cpu(sbi->s_es->s_last_orphan));
1145ac27a0ecSDave Kleikamp 
1146ac27a0ecSDave Kleikamp 	printk(KERN_ERR "sb_info orphan list:\n");
1147ac27a0ecSDave Kleikamp 	list_for_each(l, &sbi->s_orphan) {
1148ac27a0ecSDave Kleikamp 		struct inode *inode = orphan_list_entry(l);
1149ac27a0ecSDave Kleikamp 		printk(KERN_ERR "  "
1150ac27a0ecSDave Kleikamp 		       "inode %s:%lu at %p: mode %o, nlink %d, next %d\n",
1151ac27a0ecSDave Kleikamp 		       inode->i_sb->s_id, inode->i_ino, inode,
1152ac27a0ecSDave Kleikamp 		       inode->i_mode, inode->i_nlink,
1153ac27a0ecSDave Kleikamp 		       NEXT_ORPHAN(inode));
1154ac27a0ecSDave Kleikamp 	}
1155ac27a0ecSDave Kleikamp }
1156ac27a0ecSDave Kleikamp 
#ifdef CONFIG_QUOTA
static int ext4_quota_off(struct super_block *sb, int type);

/* Turn off every quota type on @sb; used on the unmount path. */
static inline void ext4_quota_off_umount(struct super_block *sb)
{
	int qtype = 0;

	/* Go through our own quota_off so that inode flags etc. get cleared. */
	while (qtype < EXT4_MAXQUOTAS) {
		ext4_quota_off(sb, qtype);
		qtype++;
	}
}

/*
 * Fetch the quota file name for @type.  Helper for the mount/remount
 * code paths, which hold sb->s_umount.
 */
static inline char *get_qf_name(struct super_block *sb,
				struct ext4_sb_info *sbi,
				int type)
{
	char *qf_name;

	qf_name = rcu_dereference_protected(sbi->s_qf_names[type],
					    lockdep_is_held(&sb->s_umount));
	return qf_name;
}
#else
/* Quota support compiled out: nothing to turn off. */
static inline void ext4_quota_off_umount(struct super_block *sb)
{
}
#endif
1185957153fcSJan Kara 
11861f79467cSJason Yan static int ext4_percpu_param_init(struct ext4_sb_info *sbi)
11871f79467cSJason Yan {
11881f79467cSJason Yan 	ext4_fsblk_t block;
11891f79467cSJason Yan 	int err;
11901f79467cSJason Yan 
11911f79467cSJason Yan 	block = ext4_count_free_clusters(sbi->s_sb);
11921f79467cSJason Yan 	ext4_free_blocks_count_set(sbi->s_es, EXT4_C2B(sbi, block));
11931f79467cSJason Yan 	err = percpu_counter_init(&sbi->s_freeclusters_counter, block,
11941f79467cSJason Yan 				  GFP_KERNEL);
11951f79467cSJason Yan 	if (!err) {
11961f79467cSJason Yan 		unsigned long freei = ext4_count_free_inodes(sbi->s_sb);
11971f79467cSJason Yan 		sbi->s_es->s_free_inodes_count = cpu_to_le32(freei);
11981f79467cSJason Yan 		err = percpu_counter_init(&sbi->s_freeinodes_counter, freei,
11991f79467cSJason Yan 					  GFP_KERNEL);
12001f79467cSJason Yan 	}
12011f79467cSJason Yan 	if (!err)
12021f79467cSJason Yan 		err = percpu_counter_init(&sbi->s_dirs_counter,
12031f79467cSJason Yan 					  ext4_count_dirs(sbi->s_sb), GFP_KERNEL);
12041f79467cSJason Yan 	if (!err)
12051f79467cSJason Yan 		err = percpu_counter_init(&sbi->s_dirtyclusters_counter, 0,
12061f79467cSJason Yan 					  GFP_KERNEL);
12071f79467cSJason Yan 	if (!err)
12081f79467cSJason Yan 		err = percpu_counter_init(&sbi->s_sra_exceeded_retry_limit, 0,
12091f79467cSJason Yan 					  GFP_KERNEL);
12101f79467cSJason Yan 	if (!err)
12111f79467cSJason Yan 		err = percpu_init_rwsem(&sbi->s_writepages_rwsem);
12121f79467cSJason Yan 
12131f79467cSJason Yan 	if (err)
12141f79467cSJason Yan 		ext4_msg(sbi->s_sb, KERN_ERR, "insufficient memory");
12151f79467cSJason Yan 
12161f79467cSJason Yan 	return err;
12171f79467cSJason Yan }
12181f79467cSJason Yan 
12191f79467cSJason Yan static void ext4_percpu_param_destroy(struct ext4_sb_info *sbi)
12201f79467cSJason Yan {
12211f79467cSJason Yan 	percpu_counter_destroy(&sbi->s_freeclusters_counter);
12221f79467cSJason Yan 	percpu_counter_destroy(&sbi->s_freeinodes_counter);
12231f79467cSJason Yan 	percpu_counter_destroy(&sbi->s_dirs_counter);
12241f79467cSJason Yan 	percpu_counter_destroy(&sbi->s_dirtyclusters_counter);
12251f79467cSJason Yan 	percpu_counter_destroy(&sbi->s_sra_exceeded_retry_limit);
12261f79467cSJason Yan 	percpu_free_rwsem(&sbi->s_writepages_rwsem);
12271f79467cSJason Yan }
12281f79467cSJason Yan 
12296ef68498SJason Yan static void ext4_group_desc_free(struct ext4_sb_info *sbi)
12306ef68498SJason Yan {
12316ef68498SJason Yan 	struct buffer_head **group_desc;
12326ef68498SJason Yan 	int i;
12336ef68498SJason Yan 
12346ef68498SJason Yan 	rcu_read_lock();
12356ef68498SJason Yan 	group_desc = rcu_dereference(sbi->s_group_desc);
12366ef68498SJason Yan 	for (i = 0; i < sbi->s_gdb_count; i++)
12376ef68498SJason Yan 		brelse(group_desc[i]);
12386ef68498SJason Yan 	kvfree(group_desc);
12396ef68498SJason Yan 	rcu_read_unlock();
12406ef68498SJason Yan }
12416ef68498SJason Yan 
1242dcbf8758SJason Yan static void ext4_flex_groups_free(struct ext4_sb_info *sbi)
1243dcbf8758SJason Yan {
1244dcbf8758SJason Yan 	struct flex_groups **flex_groups;
1245dcbf8758SJason Yan 	int i;
1246dcbf8758SJason Yan 
1247dcbf8758SJason Yan 	rcu_read_lock();
1248dcbf8758SJason Yan 	flex_groups = rcu_dereference(sbi->s_flex_groups);
1249dcbf8758SJason Yan 	if (flex_groups) {
1250dcbf8758SJason Yan 		for (i = 0; i < sbi->s_flex_groups_allocated; i++)
1251dcbf8758SJason Yan 			kvfree(flex_groups[i]);
1252dcbf8758SJason Yan 		kvfree(flex_groups);
1253dcbf8758SJason Yan 	}
1254dcbf8758SJason Yan 	rcu_read_unlock();
1255dcbf8758SJason Yan }
1256dcbf8758SJason Yan 
1257617ba13bSMingming Cao static void ext4_put_super(struct super_block *sb)
1258ac27a0ecSDave Kleikamp {
1259617ba13bSMingming Cao 	struct ext4_sb_info *sbi = EXT4_SB(sb);
1260617ba13bSMingming Cao 	struct ext4_super_block *es = sbi->s_es;
126197abd7d4STheodore Ts'o 	int aborted = 0;
1262ef2cabf7SHidehiro Kawai 	int i, err;
1263ac27a0ecSDave Kleikamp 
1264b98535d0SYe Bin 	/*
1265b98535d0SYe Bin 	 * Unregister sysfs before destroying jbd2 journal.
1266b98535d0SYe Bin 	 * Since we could still access attr_journal_task attribute via sysfs
1267b98535d0SYe Bin 	 * path which could have sbi->s_journal->j_task as NULL
1268b98535d0SYe Bin 	 * Unregister sysfs before flush sbi->s_error_work.
1269b98535d0SYe Bin 	 * Since user may read /proc/fs/ext4/xx/mb_groups during umount, If
1270b98535d0SYe Bin 	 * read metadata verify failed then will queue error work.
1271b98535d0SYe Bin 	 * flush_stashed_error_work will call start_this_handle may trigger
1272b98535d0SYe Bin 	 * BUG_ON.
1273b98535d0SYe Bin 	 */
1274b98535d0SYe Bin 	ext4_unregister_sysfs(sb);
1275b98535d0SYe Bin 
12764808cb5bSZhang Yi 	if (___ratelimit(&ext4_mount_msg_ratelimit, "EXT4-fs unmount"))
1277bb0fbc78SLukas Czerner 		ext4_msg(sb, KERN_INFO, "unmounting filesystem %pU.",
1278bb0fbc78SLukas Czerner 			 &sb->s_uuid);
12794808cb5bSZhang Yi 
1280857ac889SLukas Czerner 	ext4_unregister_li_request(sb);
1281957153fcSJan Kara 	ext4_quota_off_umount(sb);
1282e0ccfd95SChristoph Hellwig 
1283c92dc856SJan Kara 	flush_work(&sbi->s_error_work);
12842e8fa54eSJan Kara 	destroy_workqueue(sbi->rsv_conversion_wq);
128502f310fcSJan Kara 	ext4_release_orphan_info(sb);
12864c0425ffSMingming Cao 
12870390131bSFrank Mayhar 	if (sbi->s_journal) {
128897abd7d4STheodore Ts'o 		aborted = is_journal_aborted(sbi->s_journal);
1289ef2cabf7SHidehiro Kawai 		err = jbd2_journal_destroy(sbi->s_journal);
129047b4a50bSJan Kara 		sbi->s_journal = NULL;
1291878520acSTheodore Ts'o 		if ((err < 0) && !aborted) {
129254d3adbcSTheodore Ts'o 			ext4_abort(sb, -err, "Couldn't clean up the journal");
12930390131bSFrank Mayhar 		}
1294878520acSTheodore Ts'o 	}
1295d4edac31SJosef Bacik 
1296d3922a77SZheng Liu 	ext4_es_unregister_shrinker(sbi);
1297292a089dSSteven Rostedt (Google) 	timer_shutdown_sync(&sbi->s_err_report);
1298d4edac31SJosef Bacik 	ext4_release_system_zone(sb);
1299d4edac31SJosef Bacik 	ext4_mb_release(sb);
1300d4edac31SJosef Bacik 	ext4_ext_release(sb);
1301d4edac31SJosef Bacik 
1302bc98a42cSDavid Howells 	if (!sb_rdonly(sb) && !aborted) {
1303e2b911c5SDarrick J. Wong 		ext4_clear_feature_journal_needs_recovery(sb);
130402f310fcSJan Kara 		ext4_clear_feature_orphan_present(sb);
1305ac27a0ecSDave Kleikamp 		es->s_state = cpu_to_le16(sbi->s_mount_state);
1306ac27a0ecSDave Kleikamp 	}
1307bc98a42cSDavid Howells 	if (!sb_rdonly(sb))
13084392fbc4SJan Kara 		ext4_commit_super(sb);
1309a8e25a83SArtem Bityutskiy 
13106ef68498SJason Yan 	ext4_group_desc_free(sbi);
1311dcbf8758SJason Yan 	ext4_flex_groups_free(sbi);
13121f79467cSJason Yan 	ext4_percpu_param_destroy(sbi);
1313ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
1314a2d4a646SJan Kara 	for (i = 0; i < EXT4_MAXQUOTAS; i++)
131533458eabSTheodore Ts'o 		kfree(get_qf_name(sb, sbi, i));
1316ac27a0ecSDave Kleikamp #endif
1317ac27a0ecSDave Kleikamp 
1318ac27a0ecSDave Kleikamp 	/* Debugging code just in case the in-memory inode orphan list
1319ac27a0ecSDave Kleikamp 	 * isn't empty.  The on-disk one can be non-empty if we've
1320ac27a0ecSDave Kleikamp 	 * detected an error and taken the fs readonly, but the
1321ac27a0ecSDave Kleikamp 	 * in-memory list had better be clean by this point. */
1322ac27a0ecSDave Kleikamp 	if (!list_empty(&sbi->s_orphan))
1323ac27a0ecSDave Kleikamp 		dump_orphan_list(sb, sbi);
1324837c23fbSChunguang Xu 	ASSERT(list_empty(&sbi->s_orphan));
1325ac27a0ecSDave Kleikamp 
132689d96a6fSTheodore Ts'o 	sync_blockdev(sb->s_bdev);
1327f98393a6SPeter Zijlstra 	invalidate_bdev(sb->s_bdev);
1328ee7ed3aaSChunguang Xu 	if (sbi->s_journal_bdev && sbi->s_journal_bdev != sb->s_bdev) {
1329ac27a0ecSDave Kleikamp 		/*
1330ac27a0ecSDave Kleikamp 		 * Invalidate the journal device's buffers.  We don't want them
1331ac27a0ecSDave Kleikamp 		 * floating about in memory - the physical journal device may
1332ac27a0ecSDave Kleikamp 		 * hotswapped, and it breaks the `ro-after' testing code.
1333ac27a0ecSDave Kleikamp 		 */
1334ee7ed3aaSChunguang Xu 		sync_blockdev(sbi->s_journal_bdev);
1335ee7ed3aaSChunguang Xu 		invalidate_bdev(sbi->s_journal_bdev);
1336617ba13bSMingming Cao 		ext4_blkdev_remove(sbi);
1337ac27a0ecSDave Kleikamp 	}
133850c15df6SChengguang Xu 
1339dec214d0STahsin Erdogan 	ext4_xattr_destroy_cache(sbi->s_ea_inode_cache);
1340dec214d0STahsin Erdogan 	sbi->s_ea_inode_cache = NULL;
134150c15df6SChengguang Xu 
134247387409STahsin Erdogan 	ext4_xattr_destroy_cache(sbi->s_ea_block_cache);
134347387409STahsin Erdogan 	sbi->s_ea_block_cache = NULL;
134450c15df6SChengguang Xu 
1345618f0031SPavel Skripkin 	ext4_stop_mmpd(sbi);
1346618f0031SPavel Skripkin 
13479060dd2cSEric Sandeen 	brelse(sbi->s_sbh);
1348ac27a0ecSDave Kleikamp 	sb->s_fs_info = NULL;
13493197ebdbSTheodore Ts'o 	/*
13503197ebdbSTheodore Ts'o 	 * Now that we are completely done shutting down the
13513197ebdbSTheodore Ts'o 	 * superblock, we need to actually destroy the kobject.
13523197ebdbSTheodore Ts'o 	 */
13533197ebdbSTheodore Ts'o 	kobject_put(&sbi->s_kobj);
13543197ebdbSTheodore Ts'o 	wait_for_completion(&sbi->s_kobj_unregister);
13550441984aSDarrick J. Wong 	if (sbi->s_chksum_driver)
13560441984aSDarrick J. Wong 		crypto_free_shash(sbi->s_chksum_driver);
1357705895b6SPekka Enberg 	kfree(sbi->s_blockgroup_lock);
13588012b866SShiyang Ruan 	fs_put_dax(sbi->s_daxdev, NULL);
1359ac4acb1fSEric Biggers 	fscrypt_free_dummy_policy(&sbi->s_dummy_enc_policy);
13605298d4bfSChristoph Hellwig #if IS_ENABLED(CONFIG_UNICODE)
1361f8f4acb6SDaniel Rosenberg 	utf8_unload(sb->s_encoding);
1362c83ad55eSGabriel Krisman Bertazi #endif
1363ac27a0ecSDave Kleikamp 	kfree(sbi);
1364ac27a0ecSDave Kleikamp }
1365ac27a0ecSDave Kleikamp 
/* Slab cache from which struct ext4_inode_info objects are allocated. */
static struct kmem_cache *ext4_inode_cachep;
1367ac27a0ecSDave Kleikamp 
1368ac27a0ecSDave Kleikamp /*
1369ac27a0ecSDave Kleikamp  * Called inside transaction, so use GFP_NOFS
1370ac27a0ecSDave Kleikamp  */
1371617ba13bSMingming Cao static struct inode *ext4_alloc_inode(struct super_block *sb)
1372ac27a0ecSDave Kleikamp {
1373617ba13bSMingming Cao 	struct ext4_inode_info *ei;
1374ac27a0ecSDave Kleikamp 
1375fd60b288SMuchun Song 	ei = alloc_inode_sb(sb, ext4_inode_cachep, GFP_NOFS);
1376ac27a0ecSDave Kleikamp 	if (!ei)
1377ac27a0ecSDave Kleikamp 		return NULL;
13780b8e58a1SAndreas Dilger 
1379ee73f9a5SJeff Layton 	inode_set_iversion(&ei->vfs_inode, 1);
13807ea71af9SYe Bin 	ei->i_flags = 0;
1381202ee5dfSTheodore Ts'o 	spin_lock_init(&ei->i_raw_lock);
138238727786SOjaswin Mujoo 	ei->i_prealloc_node = RB_ROOT;
138327bc446eSbrookxu 	atomic_set(&ei->i_prealloc_active, 0);
138438727786SOjaswin Mujoo 	rwlock_init(&ei->i_prealloc_lock);
13859a26b661SZheng Liu 	ext4_es_init_tree(&ei->i_es_tree);
13869a26b661SZheng Liu 	rwlock_init(&ei->i_es_lock);
1387edaa53caSZheng Liu 	INIT_LIST_HEAD(&ei->i_es_list);
1388eb68d0e2SZheng Liu 	ei->i_es_all_nr = 0;
1389edaa53caSZheng Liu 	ei->i_es_shk_nr = 0;
1390dd475925SJan Kara 	ei->i_es_shrink_lblk = 0;
1391d2a17637SMingming Cao 	ei->i_reserved_data_blocks = 0;
1392d2a17637SMingming Cao 	spin_lock_init(&(ei->i_block_reservation_lock));
13931dc0aa46SEric Whitney 	ext4_init_pending_tree(&ei->i_pending_tree);
1394a9e7f447SDmitry Monakhov #ifdef CONFIG_QUOTA
1395a9e7f447SDmitry Monakhov 	ei->i_reserved_quota = 0;
139696c7e0d9SJan Kara 	memset(&ei->i_dquot, 0, sizeof(ei->i_dquot));
1397a9e7f447SDmitry Monakhov #endif
13988aefcd55STheodore Ts'o 	ei->jinode = NULL;
13992e8fa54eSJan Kara 	INIT_LIST_HEAD(&ei->i_rsv_conversion_list);
1400744692dcSJiaying Zhang 	spin_lock_init(&ei->i_completed_io_lock);
1401b436b9beSJan Kara 	ei->i_sync_tid = 0;
1402b436b9beSJan Kara 	ei->i_datasync_tid = 0;
1403e27f41e1SDmitry Monakhov 	atomic_set(&ei->i_unwritten, 0);
14042e8fa54eSJan Kara 	INIT_WORK(&ei->i_rsv_conversion_work, ext4_end_io_rsv_work);
1405aa75f4d3SHarshad Shirwadkar 	ext4_fc_init_inode(&ei->vfs_inode);
1406aa75f4d3SHarshad Shirwadkar 	mutex_init(&ei->i_fc_lock);
1407ac27a0ecSDave Kleikamp 	return &ei->vfs_inode;
1408ac27a0ecSDave Kleikamp }
1409ac27a0ecSDave Kleikamp 
/*
 * ->drop_inode handler: take the generic decision first and consult
 * fscrypt only when the generic code would keep the inode.  The outcome
 * is traced and returned.
 */
static int ext4_drop_inode(struct inode *inode)
{
	int drop;

	drop = generic_drop_inode(inode);
	if (drop == 0)
		drop = fscrypt_drop_inode(inode);

	trace_ext4_drop_inode(inode, drop);
	return drop;
}
14207ff9c073STheodore Ts'o 
142194053139SAl Viro static void ext4_free_in_core_inode(struct inode *inode)
1422fa0d7e3dSNick Piggin {
14232c58d548SEric Biggers 	fscrypt_free_inode(inode);
1424aa75f4d3SHarshad Shirwadkar 	if (!list_empty(&(EXT4_I(inode)->i_fc_list))) {
1425aa75f4d3SHarshad Shirwadkar 		pr_warn("%s: inode %ld still in fc list",
1426aa75f4d3SHarshad Shirwadkar 			__func__, inode->i_ino);
1427aa75f4d3SHarshad Shirwadkar 	}
1428fa0d7e3dSNick Piggin 	kmem_cache_free(ext4_inode_cachep, EXT4_I(inode));
1429fa0d7e3dSNick Piggin }
1430fa0d7e3dSNick Piggin 
1431617ba13bSMingming Cao static void ext4_destroy_inode(struct inode *inode)
1432ac27a0ecSDave Kleikamp {
14339f7dd93dSVasily Averin 	if (!list_empty(&(EXT4_I(inode)->i_orphan))) {
1434b31e1552SEric Sandeen 		ext4_msg(inode->i_sb, KERN_ERR,
1435b31e1552SEric Sandeen 			 "Inode %lu (%p): orphan list check failed!",
1436b31e1552SEric Sandeen 			 inode->i_ino, EXT4_I(inode));
14379f7dd93dSVasily Averin 		print_hex_dump(KERN_INFO, "", DUMP_PREFIX_ADDRESS, 16, 4,
14389f7dd93dSVasily Averin 				EXT4_I(inode), sizeof(struct ext4_inode_info),
14399f7dd93dSVasily Averin 				true);
14409f7dd93dSVasily Averin 		dump_stack();
14419f7dd93dSVasily Averin 	}
14426fed8395SJeffle Xu 
14436fed8395SJeffle Xu 	if (EXT4_I(inode)->i_reserved_data_blocks)
14446fed8395SJeffle Xu 		ext4_msg(inode->i_sb, KERN_ERR,
14456fed8395SJeffle Xu 			 "Inode %lu (%p): i_reserved_data_blocks (%u) not cleared!",
14466fed8395SJeffle Xu 			 inode->i_ino, EXT4_I(inode),
14476fed8395SJeffle Xu 			 EXT4_I(inode)->i_reserved_data_blocks);
1448ac27a0ecSDave Kleikamp }
1449ac27a0ecSDave Kleikamp 
145051cc5068SAlexey Dobriyan static void init_once(void *foo)
1451ac27a0ecSDave Kleikamp {
1452c30365b9SYu Zhe 	struct ext4_inode_info *ei = foo;
1453ac27a0ecSDave Kleikamp 
1454ac27a0ecSDave Kleikamp 	INIT_LIST_HEAD(&ei->i_orphan);
1455ac27a0ecSDave Kleikamp 	init_rwsem(&ei->xattr_sem);
14560e855ac8SAneesh Kumar K.V 	init_rwsem(&ei->i_data_sem);
1457ac27a0ecSDave Kleikamp 	inode_init_once(&ei->vfs_inode);
1458aa75f4d3SHarshad Shirwadkar 	ext4_fc_init_inode(&ei->vfs_inode);
1459ac27a0ecSDave Kleikamp }
1460ac27a0ecSDave Kleikamp 
1461e67bc2b3SFabian Frederick static int __init init_inodecache(void)
1462ac27a0ecSDave Kleikamp {
1463f8dd7c70SDavid Windsor 	ext4_inode_cachep = kmem_cache_create_usercopy("ext4_inode_cache",
1464f8dd7c70SDavid Windsor 				sizeof(struct ext4_inode_info), 0,
1465f8dd7c70SDavid Windsor 				(SLAB_RECLAIM_ACCOUNT|SLAB_MEM_SPREAD|
1466f8dd7c70SDavid Windsor 					SLAB_ACCOUNT),
1467f8dd7c70SDavid Windsor 				offsetof(struct ext4_inode_info, i_data),
1468f8dd7c70SDavid Windsor 				sizeof_field(struct ext4_inode_info, i_data),
146920c2df83SPaul Mundt 				init_once);
1470617ba13bSMingming Cao 	if (ext4_inode_cachep == NULL)
1471ac27a0ecSDave Kleikamp 		return -ENOMEM;
1472ac27a0ecSDave Kleikamp 	return 0;
1473ac27a0ecSDave Kleikamp }
1474ac27a0ecSDave Kleikamp 
1475ac27a0ecSDave Kleikamp static void destroy_inodecache(void)
1476ac27a0ecSDave Kleikamp {
14778c0a8537SKirill A. Shutemov 	/*
14788c0a8537SKirill A. Shutemov 	 * Make sure all delayed rcu free inodes are flushed before we
14798c0a8537SKirill A. Shutemov 	 * destroy cache.
14808c0a8537SKirill A. Shutemov 	 */
14818c0a8537SKirill A. Shutemov 	rcu_barrier();
1482617ba13bSMingming Cao 	kmem_cache_destroy(ext4_inode_cachep);
1483ac27a0ecSDave Kleikamp }
1484ac27a0ecSDave Kleikamp 
14850930fcc1SAl Viro void ext4_clear_inode(struct inode *inode)
1486ac27a0ecSDave Kleikamp {
1487aa75f4d3SHarshad Shirwadkar 	ext4_fc_del(inode);
14880930fcc1SAl Viro 	invalidate_inode_buffers(inode);
1489dbd5768fSJan Kara 	clear_inode(inode);
149027bc446eSbrookxu 	ext4_discard_preallocations(inode, 0);
149151865fdaSZheng Liu 	ext4_es_remove_extent(inode, 0, EXT_MAX_BLOCKS);
1492f4c2d372SJan Kara 	dquot_drop(inode);
14938aefcd55STheodore Ts'o 	if (EXT4_I(inode)->jinode) {
14948aefcd55STheodore Ts'o 		jbd2_journal_release_jbd_inode(EXT4_JOURNAL(inode),
14958aefcd55STheodore Ts'o 					       EXT4_I(inode)->jinode);
14968aefcd55STheodore Ts'o 		jbd2_free_inode(EXT4_I(inode)->jinode);
14978aefcd55STheodore Ts'o 		EXT4_I(inode)->jinode = NULL;
14988aefcd55STheodore Ts'o 	}
14993d204e24SEric Biggers 	fscrypt_put_encryption_info(inode);
1500c93d8f88SEric Biggers 	fsverity_cleanup_inode(inode);
1501ac27a0ecSDave Kleikamp }
1502ac27a0ecSDave Kleikamp 
15031b961ac0SChristoph Hellwig static struct inode *ext4_nfs_get_inode(struct super_block *sb,
15041b961ac0SChristoph Hellwig 					u64 ino, u32 generation)
1505ac27a0ecSDave Kleikamp {
1506ac27a0ecSDave Kleikamp 	struct inode *inode;
1507ac27a0ecSDave Kleikamp 
15088a363970STheodore Ts'o 	/*
1509ac27a0ecSDave Kleikamp 	 * Currently we don't know the generation for parent directory, so
1510ac27a0ecSDave Kleikamp 	 * a generation of 0 means "accept any"
1511ac27a0ecSDave Kleikamp 	 */
15128a363970STheodore Ts'o 	inode = ext4_iget(sb, ino, EXT4_IGET_HANDLE);
15131d1fe1eeSDavid Howells 	if (IS_ERR(inode))
15141d1fe1eeSDavid Howells 		return ERR_CAST(inode);
15151d1fe1eeSDavid Howells 	if (generation && inode->i_generation != generation) {
1516ac27a0ecSDave Kleikamp 		iput(inode);
1517ac27a0ecSDave Kleikamp 		return ERR_PTR(-ESTALE);
1518ac27a0ecSDave Kleikamp 	}
15191b961ac0SChristoph Hellwig 
15201b961ac0SChristoph Hellwig 	return inode;
1521ac27a0ecSDave Kleikamp }
15221b961ac0SChristoph Hellwig 
15231b961ac0SChristoph Hellwig static struct dentry *ext4_fh_to_dentry(struct super_block *sb, struct fid *fid,
15241b961ac0SChristoph Hellwig 					int fh_len, int fh_type)
15251b961ac0SChristoph Hellwig {
15261b961ac0SChristoph Hellwig 	return generic_fh_to_dentry(sb, fid, fh_len, fh_type,
15271b961ac0SChristoph Hellwig 				    ext4_nfs_get_inode);
15281b961ac0SChristoph Hellwig }
15291b961ac0SChristoph Hellwig 
15301b961ac0SChristoph Hellwig static struct dentry *ext4_fh_to_parent(struct super_block *sb, struct fid *fid,
15311b961ac0SChristoph Hellwig 					int fh_len, int fh_type)
15321b961ac0SChristoph Hellwig {
15331b961ac0SChristoph Hellwig 	return generic_fh_to_parent(sb, fid, fh_len, fh_type,
15341b961ac0SChristoph Hellwig 				    ext4_nfs_get_inode);
1535ac27a0ecSDave Kleikamp }
1536ac27a0ecSDave Kleikamp 
1537fde87268STheodore Ts'o static int ext4_nfs_commit_metadata(struct inode *inode)
1538fde87268STheodore Ts'o {
1539fde87268STheodore Ts'o 	struct writeback_control wbc = {
1540fde87268STheodore Ts'o 		.sync_mode = WB_SYNC_ALL
1541fde87268STheodore Ts'o 	};
1542fde87268STheodore Ts'o 
1543fde87268STheodore Ts'o 	trace_ext4_nfs_commit_metadata(inode);
1544fde87268STheodore Ts'o 	return ext4_write_inode(inode, &wbc);
1545fde87268STheodore Ts'o }
1546fde87268STheodore Ts'o 
1547ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
1548d6006186SEric Biggers static const char * const quotatypes[] = INITQFNAMES;
1549689c958cSLi Xi #define QTYPE2NAME(t) (quotatypes[t])
1550ac27a0ecSDave Kleikamp 
1551617ba13bSMingming Cao static int ext4_write_dquot(struct dquot *dquot);
1552617ba13bSMingming Cao static int ext4_acquire_dquot(struct dquot *dquot);
1553617ba13bSMingming Cao static int ext4_release_dquot(struct dquot *dquot);
1554617ba13bSMingming Cao static int ext4_mark_dquot_dirty(struct dquot *dquot);
1555617ba13bSMingming Cao static int ext4_write_info(struct super_block *sb, int type);
15566f28e087SJan Kara static int ext4_quota_on(struct super_block *sb, int type, int format_id,
15578c54ca9cSAl Viro 			 const struct path *path);
1558617ba13bSMingming Cao static ssize_t ext4_quota_read(struct super_block *sb, int type, char *data,
1559ac27a0ecSDave Kleikamp 			       size_t len, loff_t off);
1560617ba13bSMingming Cao static ssize_t ext4_quota_write(struct super_block *sb, int type,
1561ac27a0ecSDave Kleikamp 				const char *data, size_t len, loff_t off);
15627c319d32SAditya Kali static int ext4_quota_enable(struct super_block *sb, int type, int format_id,
15637c319d32SAditya Kali 			     unsigned int flags);
1564ac27a0ecSDave Kleikamp 
156596c7e0d9SJan Kara static struct dquot **ext4_get_dquots(struct inode *inode)
156696c7e0d9SJan Kara {
156796c7e0d9SJan Kara 	return EXT4_I(inode)->i_dquot;
156896c7e0d9SJan Kara }
156996c7e0d9SJan Kara 
157061e225dcSAlexey Dobriyan static const struct dquot_operations ext4_quota_operations = {
157160e58e0fSMingming Cao 	.get_reserved_space	= ext4_get_reserved_space,
1572617ba13bSMingming Cao 	.write_dquot		= ext4_write_dquot,
1573617ba13bSMingming Cao 	.acquire_dquot		= ext4_acquire_dquot,
1574617ba13bSMingming Cao 	.release_dquot		= ext4_release_dquot,
1575617ba13bSMingming Cao 	.mark_dirty		= ext4_mark_dquot_dirty,
1576a5b5ee32SJan Kara 	.write_info		= ext4_write_info,
1577a5b5ee32SJan Kara 	.alloc_dquot		= dquot_alloc,
1578a5b5ee32SJan Kara 	.destroy_dquot		= dquot_destroy,
1579040cb378SLi Xi 	.get_projid		= ext4_get_projid,
15807a9ca53aSTahsin Erdogan 	.get_inode_usage	= ext4_get_inode_usage,
1581ebc11f7bSChengguang Xu 	.get_next_id		= dquot_get_next_id,
1582ac27a0ecSDave Kleikamp };
1583ac27a0ecSDave Kleikamp 
15840d54b217SAlexey Dobriyan static const struct quotactl_ops ext4_qctl_operations = {
1585617ba13bSMingming Cao 	.quota_on	= ext4_quota_on,
1586ca0e05e4SDmitry Monakhov 	.quota_off	= ext4_quota_off,
1587287a8095SChristoph Hellwig 	.quota_sync	= dquot_quota_sync,
15880a240339SJan Kara 	.get_state	= dquot_get_state,
1589287a8095SChristoph Hellwig 	.set_info	= dquot_set_dqinfo,
1590287a8095SChristoph Hellwig 	.get_dqblk	= dquot_get_dqblk,
15916332b9b5SEric Sandeen 	.set_dqblk	= dquot_set_dqblk,
15926332b9b5SEric Sandeen 	.get_nextdqblk	= dquot_get_next_dqblk,
1593ac27a0ecSDave Kleikamp };
1594ac27a0ecSDave Kleikamp #endif
1595ac27a0ecSDave Kleikamp 
1596ee9b6d61SJosef 'Jeff' Sipek static const struct super_operations ext4_sops = {
1597617ba13bSMingming Cao 	.alloc_inode	= ext4_alloc_inode,
159894053139SAl Viro 	.free_inode	= ext4_free_in_core_inode,
1599617ba13bSMingming Cao 	.destroy_inode	= ext4_destroy_inode,
1600617ba13bSMingming Cao 	.write_inode	= ext4_write_inode,
1601617ba13bSMingming Cao 	.dirty_inode	= ext4_dirty_inode,
16027ff9c073STheodore Ts'o 	.drop_inode	= ext4_drop_inode,
16030930fcc1SAl Viro 	.evict_inode	= ext4_evict_inode,
1604617ba13bSMingming Cao 	.put_super	= ext4_put_super,
1605617ba13bSMingming Cao 	.sync_fs	= ext4_sync_fs,
1606c4be0c1dSTakashi Sato 	.freeze_fs	= ext4_freeze,
1607c4be0c1dSTakashi Sato 	.unfreeze_fs	= ext4_unfreeze,
1608617ba13bSMingming Cao 	.statfs		= ext4_statfs,
1609617ba13bSMingming Cao 	.show_options	= ext4_show_options,
1610ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
1611617ba13bSMingming Cao 	.quota_read	= ext4_quota_read,
1612617ba13bSMingming Cao 	.quota_write	= ext4_quota_write,
161396c7e0d9SJan Kara 	.get_dquots	= ext4_get_dquots,
1614ac27a0ecSDave Kleikamp #endif
1615ac27a0ecSDave Kleikamp };
1616ac27a0ecSDave Kleikamp 
161739655164SChristoph Hellwig static const struct export_operations ext4_export_ops = {
16181b961ac0SChristoph Hellwig 	.fh_to_dentry = ext4_fh_to_dentry,
16191b961ac0SChristoph Hellwig 	.fh_to_parent = ext4_fh_to_parent,
1620617ba13bSMingming Cao 	.get_parent = ext4_get_parent,
1621fde87268STheodore Ts'o 	.commit_metadata = ext4_nfs_commit_metadata,
1622ac27a0ecSDave Kleikamp };
1623ac27a0ecSDave Kleikamp 
/*
 * Mount option identifiers.  The enumerators keep their original order,
 * so every numeric value is unchanged.
 */
enum {
	Opt_bsd_df,
	Opt_minix_df,
	Opt_grpid,
	Opt_nogrpid,
	Opt_resgid,
	Opt_resuid,
	Opt_sb,
	Opt_nouid32,
	Opt_debug,
	Opt_removed,
	Opt_user_xattr,
	Opt_acl,
	Opt_auto_da_alloc,
	Opt_noauto_da_alloc,
	Opt_noload,
	Opt_commit,
	Opt_min_batch_time,
	Opt_max_batch_time,
	Opt_journal_dev,
	Opt_journal_path,
	Opt_journal_checksum,
	Opt_journal_async_commit,
	Opt_abort,
	Opt_data_journal,
	Opt_data_ordered,
	Opt_data_writeback,
	Opt_data_err_abort,
	Opt_data_err_ignore,
	Opt_test_dummy_encryption,
	Opt_inlinecrypt,
	Opt_usrjquota,
	Opt_grpjquota,
	Opt_quota,
	Opt_noquota,
	Opt_barrier,
	Opt_nobarrier,
	Opt_err,
	Opt_usrquota,
	Opt_grpquota,
	Opt_prjquota,
	Opt_dax,
	Opt_dax_always,
	Opt_dax_inode,
	Opt_dax_never,
	Opt_stripe,
	Opt_delalloc,
	Opt_nodelalloc,
	Opt_warn_on_error,
	Opt_nowarn_on_error,
	Opt_mblk_io_submit,
	Opt_debug_want_extra_isize,
	Opt_nomblk_io_submit,
	Opt_block_validity,
	Opt_noblock_validity,
	Opt_inode_readahead_blks,
	Opt_journal_ioprio,
	Opt_dioread_nolock,
	Opt_dioread_lock,
	Opt_discard,
	Opt_nodiscard,
	Opt_init_itable,
	Opt_noinit_itable,
	Opt_max_dir_size_kb,
	Opt_nojournal_checksum,
	Opt_nombcache,
	Opt_no_prefetch_block_bitmaps,
	Opt_mb_optimize_scan,
	Opt_errors,
	Opt_data,
	Opt_data_err,
	Opt_jqfmt,
	Opt_dax_type,
#ifdef CONFIG_EXT4_DEBUG
	Opt_fc_debug_max_replay,
	Opt_fc_debug_force
#endif
};
1652ac27a0ecSDave Kleikamp 
1653e5a185c2SLukas Czerner static const struct constant_table ext4_param_errors[] = {
1654ba2e524dSLukas Czerner 	{"continue",	EXT4_MOUNT_ERRORS_CONT},
1655ba2e524dSLukas Czerner 	{"panic",	EXT4_MOUNT_ERRORS_PANIC},
1656ba2e524dSLukas Czerner 	{"remount-ro",	EXT4_MOUNT_ERRORS_RO},
1657e5a185c2SLukas Czerner 	{}
1658e5a185c2SLukas Czerner };
1659e5a185c2SLukas Czerner 
1660e5a185c2SLukas Czerner static const struct constant_table ext4_param_data[] = {
1661ba2e524dSLukas Czerner 	{"journal",	EXT4_MOUNT_JOURNAL_DATA},
1662ba2e524dSLukas Czerner 	{"ordered",	EXT4_MOUNT_ORDERED_DATA},
1663ba2e524dSLukas Czerner 	{"writeback",	EXT4_MOUNT_WRITEBACK_DATA},
1664e5a185c2SLukas Czerner 	{}
1665e5a185c2SLukas Czerner };
1666e5a185c2SLukas Czerner 
1667e5a185c2SLukas Czerner static const struct constant_table ext4_param_data_err[] = {
1668e5a185c2SLukas Czerner 	{"abort",	Opt_data_err_abort},
1669e5a185c2SLukas Czerner 	{"ignore",	Opt_data_err_ignore},
1670e5a185c2SLukas Czerner 	{}
1671e5a185c2SLukas Czerner };
1672e5a185c2SLukas Czerner 
1673e5a185c2SLukas Czerner static const struct constant_table ext4_param_jqfmt[] = {
1674ba2e524dSLukas Czerner 	{"vfsold",	QFMT_VFS_OLD},
1675ba2e524dSLukas Czerner 	{"vfsv0",	QFMT_VFS_V0},
1676ba2e524dSLukas Czerner 	{"vfsv1",	QFMT_VFS_V1},
1677e5a185c2SLukas Czerner 	{}
1678e5a185c2SLukas Czerner };
1679e5a185c2SLukas Czerner 
1680e5a185c2SLukas Czerner static const struct constant_table ext4_param_dax[] = {
1681e5a185c2SLukas Czerner 	{"always",	Opt_dax_always},
1682e5a185c2SLukas Czerner 	{"inode",	Opt_dax_inode},
1683e5a185c2SLukas Czerner 	{"never",	Opt_dax_never},
1684e5a185c2SLukas Czerner 	{}
1685e5a185c2SLukas Czerner };
1686e5a185c2SLukas Czerner 
/* A string mount parameter whose argument is allowed to be empty. */
#define fsparam_string_empty(NAME, OPT)					\
	__fsparam(fs_param_is_string, NAME, OPT,			\
		  fs_param_can_be_empty, NULL)
1690e5a185c2SLukas Czerner 
1691e5a185c2SLukas Czerner /*
1692e5a185c2SLukas Czerner  * Mount option specification
1693e5a185c2SLukas Czerner  * We don't use fsparam_flag_no because of the way we set the
1694e5a185c2SLukas Czerner  * options and the way we show them in _ext4_show_options(). To
1695e5a185c2SLukas Czerner  * keep the changes to a minimum, let's keep the negative options
1696e5a185c2SLukas Czerner  * separate for now.
1697e5a185c2SLukas Czerner  */
1698e5a185c2SLukas Czerner static const struct fs_parameter_spec ext4_param_specs[] = {
1699e5a185c2SLukas Czerner 	fsparam_flag	("bsddf",		Opt_bsd_df),
1700e5a185c2SLukas Czerner 	fsparam_flag	("minixdf",		Opt_minix_df),
1701e5a185c2SLukas Czerner 	fsparam_flag	("grpid",		Opt_grpid),
1702e5a185c2SLukas Czerner 	fsparam_flag	("bsdgroups",		Opt_grpid),
1703e5a185c2SLukas Czerner 	fsparam_flag	("nogrpid",		Opt_nogrpid),
1704e5a185c2SLukas Czerner 	fsparam_flag	("sysvgroups",		Opt_nogrpid),
1705e5a185c2SLukas Czerner 	fsparam_u32	("resgid",		Opt_resgid),
1706e5a185c2SLukas Czerner 	fsparam_u32	("resuid",		Opt_resuid),
1707e5a185c2SLukas Czerner 	fsparam_u32	("sb",			Opt_sb),
1708e5a185c2SLukas Czerner 	fsparam_enum	("errors",		Opt_errors, ext4_param_errors),
1709e5a185c2SLukas Czerner 	fsparam_flag	("nouid32",		Opt_nouid32),
1710e5a185c2SLukas Czerner 	fsparam_flag	("debug",		Opt_debug),
1711e5a185c2SLukas Czerner 	fsparam_flag	("oldalloc",		Opt_removed),
1712e5a185c2SLukas Czerner 	fsparam_flag	("orlov",		Opt_removed),
1713e5a185c2SLukas Czerner 	fsparam_flag	("user_xattr",		Opt_user_xattr),
1714e5a185c2SLukas Czerner 	fsparam_flag	("acl",			Opt_acl),
1715e5a185c2SLukas Czerner 	fsparam_flag	("norecovery",		Opt_noload),
1716e5a185c2SLukas Czerner 	fsparam_flag	("noload",		Opt_noload),
1717e5a185c2SLukas Czerner 	fsparam_flag	("bh",			Opt_removed),
1718e5a185c2SLukas Czerner 	fsparam_flag	("nobh",		Opt_removed),
1719e5a185c2SLukas Czerner 	fsparam_u32	("commit",		Opt_commit),
1720e5a185c2SLukas Czerner 	fsparam_u32	("min_batch_time",	Opt_min_batch_time),
1721e5a185c2SLukas Czerner 	fsparam_u32	("max_batch_time",	Opt_max_batch_time),
1722e5a185c2SLukas Czerner 	fsparam_u32	("journal_dev",		Opt_journal_dev),
1723e5a185c2SLukas Czerner 	fsparam_bdev	("journal_path",	Opt_journal_path),
1724e5a185c2SLukas Czerner 	fsparam_flag	("journal_checksum",	Opt_journal_checksum),
1725e5a185c2SLukas Czerner 	fsparam_flag	("nojournal_checksum",	Opt_nojournal_checksum),
1726e5a185c2SLukas Czerner 	fsparam_flag	("journal_async_commit",Opt_journal_async_commit),
1727e5a185c2SLukas Czerner 	fsparam_flag	("abort",		Opt_abort),
1728e5a185c2SLukas Czerner 	fsparam_enum	("data",		Opt_data, ext4_param_data),
1729e5a185c2SLukas Czerner 	fsparam_enum	("data_err",		Opt_data_err,
1730e5a185c2SLukas Czerner 						ext4_param_data_err),
1731e5a185c2SLukas Czerner 	fsparam_string_empty
1732e5a185c2SLukas Czerner 			("usrjquota",		Opt_usrjquota),
1733e5a185c2SLukas Czerner 	fsparam_string_empty
1734e5a185c2SLukas Czerner 			("grpjquota",		Opt_grpjquota),
1735e5a185c2SLukas Czerner 	fsparam_enum	("jqfmt",		Opt_jqfmt, ext4_param_jqfmt),
1736e5a185c2SLukas Czerner 	fsparam_flag	("grpquota",		Opt_grpquota),
1737e5a185c2SLukas Czerner 	fsparam_flag	("quota",		Opt_quota),
1738e5a185c2SLukas Czerner 	fsparam_flag	("noquota",		Opt_noquota),
1739e5a185c2SLukas Czerner 	fsparam_flag	("usrquota",		Opt_usrquota),
1740e5a185c2SLukas Czerner 	fsparam_flag	("prjquota",		Opt_prjquota),
1741e5a185c2SLukas Czerner 	fsparam_flag	("barrier",		Opt_barrier),
1742e5a185c2SLukas Czerner 	fsparam_u32	("barrier",		Opt_barrier),
1743e5a185c2SLukas Czerner 	fsparam_flag	("nobarrier",		Opt_nobarrier),
17441ff20307SJeff Layton 	fsparam_flag	("i_version",		Opt_removed),
1745e5a185c2SLukas Czerner 	fsparam_flag	("dax",			Opt_dax),
1746e5a185c2SLukas Czerner 	fsparam_enum	("dax",			Opt_dax_type, ext4_param_dax),
1747e5a185c2SLukas Czerner 	fsparam_u32	("stripe",		Opt_stripe),
1748e5a185c2SLukas Czerner 	fsparam_flag	("delalloc",		Opt_delalloc),
1749e5a185c2SLukas Czerner 	fsparam_flag	("nodelalloc",		Opt_nodelalloc),
1750e5a185c2SLukas Czerner 	fsparam_flag	("warn_on_error",	Opt_warn_on_error),
1751e5a185c2SLukas Czerner 	fsparam_flag	("nowarn_on_error",	Opt_nowarn_on_error),
1752e5a185c2SLukas Czerner 	fsparam_u32	("debug_want_extra_isize",
1753e5a185c2SLukas Czerner 						Opt_debug_want_extra_isize),
1754e5a185c2SLukas Czerner 	fsparam_flag	("mblk_io_submit",	Opt_removed),
1755e5a185c2SLukas Czerner 	fsparam_flag	("nomblk_io_submit",	Opt_removed),
1756e5a185c2SLukas Czerner 	fsparam_flag	("block_validity",	Opt_block_validity),
1757e5a185c2SLukas Czerner 	fsparam_flag	("noblock_validity",	Opt_noblock_validity),
1758e5a185c2SLukas Czerner 	fsparam_u32	("inode_readahead_blks",
1759e5a185c2SLukas Czerner 						Opt_inode_readahead_blks),
1760e5a185c2SLukas Czerner 	fsparam_u32	("journal_ioprio",	Opt_journal_ioprio),
1761e5a185c2SLukas Czerner 	fsparam_u32	("auto_da_alloc",	Opt_auto_da_alloc),
1762e5a185c2SLukas Czerner 	fsparam_flag	("auto_da_alloc",	Opt_auto_da_alloc),
1763e5a185c2SLukas Czerner 	fsparam_flag	("noauto_da_alloc",	Opt_noauto_da_alloc),
1764e5a185c2SLukas Czerner 	fsparam_flag	("dioread_nolock",	Opt_dioread_nolock),
1765e5a185c2SLukas Czerner 	fsparam_flag	("nodioread_nolock",	Opt_dioread_lock),
1766e5a185c2SLukas Czerner 	fsparam_flag	("dioread_lock",	Opt_dioread_lock),
1767e5a185c2SLukas Czerner 	fsparam_flag	("discard",		Opt_discard),
1768e5a185c2SLukas Czerner 	fsparam_flag	("nodiscard",		Opt_nodiscard),
1769e5a185c2SLukas Czerner 	fsparam_u32	("init_itable",		Opt_init_itable),
1770e5a185c2SLukas Czerner 	fsparam_flag	("init_itable",		Opt_init_itable),
1771e5a185c2SLukas Czerner 	fsparam_flag	("noinit_itable",	Opt_noinit_itable),
1772e5a185c2SLukas Czerner #ifdef CONFIG_EXT4_DEBUG
1773e5a185c2SLukas Czerner 	fsparam_flag	("fc_debug_force",	Opt_fc_debug_force),
1774e5a185c2SLukas Czerner 	fsparam_u32	("fc_debug_max_replay",	Opt_fc_debug_max_replay),
1775e5a185c2SLukas Czerner #endif
1776e5a185c2SLukas Czerner 	fsparam_u32	("max_dir_size_kb",	Opt_max_dir_size_kb),
1777e5a185c2SLukas Czerner 	fsparam_flag	("test_dummy_encryption",
1778e5a185c2SLukas Czerner 						Opt_test_dummy_encryption),
1779e5a185c2SLukas Czerner 	fsparam_string	("test_dummy_encryption",
1780e5a185c2SLukas Czerner 						Opt_test_dummy_encryption),
1781e5a185c2SLukas Czerner 	fsparam_flag	("inlinecrypt",		Opt_inlinecrypt),
1782e5a185c2SLukas Czerner 	fsparam_flag	("nombcache",		Opt_nombcache),
1783e5a185c2SLukas Czerner 	fsparam_flag	("no_mbcache",		Opt_nombcache),	/* for backward compatibility */
1784e5a185c2SLukas Czerner 	fsparam_flag	("prefetch_block_bitmaps",
1785e5a185c2SLukas Czerner 						Opt_removed),
1786e5a185c2SLukas Czerner 	fsparam_flag	("no_prefetch_block_bitmaps",
1787e5a185c2SLukas Czerner 						Opt_no_prefetch_block_bitmaps),
1788e5a185c2SLukas Czerner 	fsparam_s32	("mb_optimize_scan",	Opt_mb_optimize_scan),
1789e5a185c2SLukas Czerner 	fsparam_string	("check",		Opt_removed),	/* mount option from ext2/3 */
1790e5a185c2SLukas Czerner 	fsparam_flag	("nocheck",		Opt_removed),	/* mount option from ext2/3 */
1791e5a185c2SLukas Czerner 	fsparam_flag	("reservation",		Opt_removed),	/* mount option from ext2/3 */
1792e5a185c2SLukas Czerner 	fsparam_flag	("noreservation",	Opt_removed),	/* mount option from ext2/3 */
1793e5a185c2SLukas Czerner 	fsparam_u32	("journal",		Opt_removed),	/* mount option from ext2/3 */
1794e5a185c2SLukas Czerner 	{}
1795e5a185c2SLukas Czerner };
1796e5a185c2SLukas Czerner 
/* Default journal I/O priority: best-effort class (IOPRIO_CLASS_BE), level 3. */
#define DEFAULT_JOURNAL_IOPRIO (IOPRIO_PRIO_VALUE(IOPRIO_CLASS_BE, 3))

/*
 * Attribute bits stored in the "flags" member of struct mount_opts.
 *
 * MOPT_NOSUPPORT: ext4_parse_param() logs "<key> option not supported"
 *                 and accepts the option without acting on it.
 * MOPT_EXPLICIT:  ext4_parse_param() additionally records an
 *                 EXT4_MOUNT2_EXPLICIT_* bit for the option.
 * The remaining bits are described by name only here.
 * NOTE(review): MOPT_SET/MOPT_CLEAR presumably say whether the entry's
 * mount_opt bits get set or cleared, MOPT_2 that they belong to the
 * second mount-option word, and MOPT_NO_EXT2/MOPT_NO_EXT3 that the option
 * is refused for those personalities - confirm against the consumer.
 */
#define MOPT_SET	0x0001
#define MOPT_CLEAR	0x0002
#define MOPT_NOSUPPORT	0x0004
#define MOPT_EXPLICIT	0x0008
#define MOPT_NO_EXT2	0x0020
#define MOPT_NO_EXT3	0x0040
#define MOPT_SKIP	0x0080
#define	MOPT_2		0x0100
#define MOPT_EXT4_ONLY	(MOPT_NO_EXT2 | MOPT_NO_EXT3)

/* Without quota support every quota option degrades to "not supported". */
#ifndef CONFIG_QUOTA
#define MOPT_Q		MOPT_NOSUPPORT
#define MOPT_QFMT	MOPT_NOSUPPORT
#else
#define MOPT_Q		0
#define MOPT_QFMT	0x0010
#endif
181526092bf5STheodore Ts'o 
181626092bf5STheodore Ts'o static const struct mount_opts {
181726092bf5STheodore Ts'o 	int	token;
181826092bf5STheodore Ts'o 	int	mount_opt;
181926092bf5STheodore Ts'o 	int	flags;
182026092bf5STheodore Ts'o } ext4_mount_opts[] = {
182126092bf5STheodore Ts'o 	{Opt_minix_df, EXT4_MOUNT_MINIX_DF, MOPT_SET},
182226092bf5STheodore Ts'o 	{Opt_bsd_df, EXT4_MOUNT_MINIX_DF, MOPT_CLEAR},
182326092bf5STheodore Ts'o 	{Opt_grpid, EXT4_MOUNT_GRPID, MOPT_SET},
182426092bf5STheodore Ts'o 	{Opt_nogrpid, EXT4_MOUNT_GRPID, MOPT_CLEAR},
182526092bf5STheodore Ts'o 	{Opt_block_validity, EXT4_MOUNT_BLOCK_VALIDITY, MOPT_SET},
182626092bf5STheodore Ts'o 	{Opt_noblock_validity, EXT4_MOUNT_BLOCK_VALIDITY, MOPT_CLEAR},
18278dc0aa8cSTheodore Ts'o 	{Opt_dioread_nolock, EXT4_MOUNT_DIOREAD_NOLOCK,
18288dc0aa8cSTheodore Ts'o 	 MOPT_EXT4_ONLY | MOPT_SET},
18298dc0aa8cSTheodore Ts'o 	{Opt_dioread_lock, EXT4_MOUNT_DIOREAD_NOLOCK,
18308dc0aa8cSTheodore Ts'o 	 MOPT_EXT4_ONLY | MOPT_CLEAR},
183126092bf5STheodore Ts'o 	{Opt_discard, EXT4_MOUNT_DISCARD, MOPT_SET},
183226092bf5STheodore Ts'o 	{Opt_nodiscard, EXT4_MOUNT_DISCARD, MOPT_CLEAR},
18338dc0aa8cSTheodore Ts'o 	{Opt_delalloc, EXT4_MOUNT_DELALLOC,
18348dc0aa8cSTheodore Ts'o 	 MOPT_EXT4_ONLY | MOPT_SET | MOPT_EXPLICIT},
18358dc0aa8cSTheodore Ts'o 	{Opt_nodelalloc, EXT4_MOUNT_DELALLOC,
183659d9fa5cSTheodore Ts'o 	 MOPT_EXT4_ONLY | MOPT_CLEAR},
1837327eaf73STheodore Ts'o 	{Opt_warn_on_error, EXT4_MOUNT_WARN_ON_ERROR, MOPT_SET},
1838327eaf73STheodore Ts'o 	{Opt_nowarn_on_error, EXT4_MOUNT_WARN_ON_ERROR, MOPT_CLEAR},
1839cb8435dcSEric Biggers 	{Opt_commit, 0, MOPT_NO_EXT2},
1840c6d3d56dSDarrick J. Wong 	{Opt_nojournal_checksum, EXT4_MOUNT_JOURNAL_CHECKSUM,
1841c6d3d56dSDarrick J. Wong 	 MOPT_EXT4_ONLY | MOPT_CLEAR},
18428dc0aa8cSTheodore Ts'o 	{Opt_journal_checksum, EXT4_MOUNT_JOURNAL_CHECKSUM,
18431e381f60SDmitry Monakhov 	 MOPT_EXT4_ONLY | MOPT_SET | MOPT_EXPLICIT},
184426092bf5STheodore Ts'o 	{Opt_journal_async_commit, (EXT4_MOUNT_JOURNAL_ASYNC_COMMIT |
18458dc0aa8cSTheodore Ts'o 				    EXT4_MOUNT_JOURNAL_CHECKSUM),
18461e381f60SDmitry Monakhov 	 MOPT_EXT4_ONLY | MOPT_SET | MOPT_EXPLICIT},
18478dc0aa8cSTheodore Ts'o 	{Opt_noload, EXT4_MOUNT_NOLOAD, MOPT_NO_EXT2 | MOPT_SET},
1848ba2e524dSLukas Czerner 	{Opt_data_err, EXT4_MOUNT_DATA_ERR_ABORT, MOPT_NO_EXT2},
184926092bf5STheodore Ts'o 	{Opt_barrier, EXT4_MOUNT_BARRIER, MOPT_SET},
185026092bf5STheodore Ts'o 	{Opt_nobarrier, EXT4_MOUNT_BARRIER, MOPT_CLEAR},
185126092bf5STheodore Ts'o 	{Opt_noauto_da_alloc, EXT4_MOUNT_NO_AUTO_DA_ALLOC, MOPT_SET},
185226092bf5STheodore Ts'o 	{Opt_auto_da_alloc, EXT4_MOUNT_NO_AUTO_DA_ALLOC, MOPT_CLEAR},
185326092bf5STheodore Ts'o 	{Opt_noinit_itable, EXT4_MOUNT_INIT_INODE_TABLE, MOPT_CLEAR},
1854ba2e524dSLukas Czerner 	{Opt_dax_type, 0, MOPT_EXT4_ONLY},
1855ba2e524dSLukas Czerner 	{Opt_journal_dev, 0, MOPT_NO_EXT2},
1856ba2e524dSLukas Czerner 	{Opt_journal_path, 0, MOPT_NO_EXT2},
1857ba2e524dSLukas Czerner 	{Opt_journal_ioprio, 0, MOPT_NO_EXT2},
1858ba2e524dSLukas Czerner 	{Opt_data, 0, MOPT_NO_EXT2},
185926092bf5STheodore Ts'o 	{Opt_user_xattr, EXT4_MOUNT_XATTR_USER, MOPT_SET},
186026092bf5STheodore Ts'o #ifdef CONFIG_EXT4_FS_POSIX_ACL
186126092bf5STheodore Ts'o 	{Opt_acl, EXT4_MOUNT_POSIX_ACL, MOPT_SET},
186226092bf5STheodore Ts'o #else
186326092bf5STheodore Ts'o 	{Opt_acl, 0, MOPT_NOSUPPORT},
186426092bf5STheodore Ts'o #endif
186526092bf5STheodore Ts'o 	{Opt_nouid32, EXT4_MOUNT_NO_UID32, MOPT_SET},
186626092bf5STheodore Ts'o 	{Opt_debug, EXT4_MOUNT_DEBUG, MOPT_SET},
186726092bf5STheodore Ts'o 	{Opt_quota, EXT4_MOUNT_QUOTA | EXT4_MOUNT_USRQUOTA, MOPT_SET | MOPT_Q},
186826092bf5STheodore Ts'o 	{Opt_usrquota, EXT4_MOUNT_QUOTA | EXT4_MOUNT_USRQUOTA,
186926092bf5STheodore Ts'o 							MOPT_SET | MOPT_Q},
187026092bf5STheodore Ts'o 	{Opt_grpquota, EXT4_MOUNT_QUOTA | EXT4_MOUNT_GRPQUOTA,
187126092bf5STheodore Ts'o 							MOPT_SET | MOPT_Q},
187249da9392SJan Kara 	{Opt_prjquota, EXT4_MOUNT_QUOTA | EXT4_MOUNT_PRJQUOTA,
187349da9392SJan Kara 							MOPT_SET | MOPT_Q},
187426092bf5STheodore Ts'o 	{Opt_noquota, (EXT4_MOUNT_QUOTA | EXT4_MOUNT_USRQUOTA |
187549da9392SJan Kara 		       EXT4_MOUNT_GRPQUOTA | EXT4_MOUNT_PRJQUOTA),
187649da9392SJan Kara 							MOPT_CLEAR | MOPT_Q},
1877ba2e524dSLukas Czerner 	{Opt_usrjquota, 0, MOPT_Q},
1878ba2e524dSLukas Czerner 	{Opt_grpjquota, 0, MOPT_Q},
1879ba2e524dSLukas Czerner 	{Opt_jqfmt, 0, MOPT_QFMT},
1880cdb7ee4cSTahsin Erdogan 	{Opt_nombcache, EXT4_MOUNT_NO_MBCACHE, MOPT_SET},
188121175ca4SHarshad Shirwadkar 	{Opt_no_prefetch_block_bitmaps, EXT4_MOUNT_NO_PREFETCH_BLOCK_BITMAPS,
18823d392b26STheodore Ts'o 	 MOPT_SET},
188399c880deSHarshad Shirwadkar #ifdef CONFIG_EXT4_DEBUG
18840f0672ffSHarshad Shirwadkar 	{Opt_fc_debug_force, EXT4_MOUNT2_JOURNAL_FAST_COMMIT,
18850f0672ffSHarshad Shirwadkar 	 MOPT_SET | MOPT_2 | MOPT_EXT4_ONLY},
18868016e29fSHarshad Shirwadkar #endif
188726092bf5STheodore Ts'o 	{Opt_err, 0, 0}
188826092bf5STheodore Ts'o };
188926092bf5STheodore Ts'o 
18905298d4bfSChristoph Hellwig #if IS_ENABLED(CONFIG_UNICODE)
1891c83ad55eSGabriel Krisman Bertazi static const struct ext4_sb_encodings {
1892c83ad55eSGabriel Krisman Bertazi 	__u16 magic;
1893c83ad55eSGabriel Krisman Bertazi 	char *name;
189449bd03ccSChristoph Hellwig 	unsigned int version;
1895c83ad55eSGabriel Krisman Bertazi } ext4_sb_encoding_map[] = {
189649bd03ccSChristoph Hellwig 	{EXT4_ENC_UTF8_12_1, "utf8", UNICODE_AGE(12, 1, 0)},
1897c83ad55eSGabriel Krisman Bertazi };
1898c83ad55eSGabriel Krisman Bertazi 
1899aa8bf298SChristoph Hellwig static const struct ext4_sb_encodings *
1900aa8bf298SChristoph Hellwig ext4_sb_read_encoding(const struct ext4_super_block *es)
1901c83ad55eSGabriel Krisman Bertazi {
1902c83ad55eSGabriel Krisman Bertazi 	__u16 magic = le16_to_cpu(es->s_encoding);
1903c83ad55eSGabriel Krisman Bertazi 	int i;
1904c83ad55eSGabriel Krisman Bertazi 
1905c83ad55eSGabriel Krisman Bertazi 	for (i = 0; i < ARRAY_SIZE(ext4_sb_encoding_map); i++)
1906c83ad55eSGabriel Krisman Bertazi 		if (magic == ext4_sb_encoding_map[i].magic)
1907aa8bf298SChristoph Hellwig 			return &ext4_sb_encoding_map[i];
1908c83ad55eSGabriel Krisman Bertazi 
1909aa8bf298SChristoph Hellwig 	return NULL;
1910c83ad55eSGabriel Krisman Bertazi }
1911c83ad55eSGabriel Krisman Bertazi #endif
1912c83ad55eSGabriel Krisman Bertazi 
/*
 * Bits for the "spec" member of struct ext4_fs_context.
 *
 * ext4_parse_param() and the quota-name helpers OR the matching bit into
 * ctx->spec whenever they store a value for the corresponding option, so
 * a set bit marks that the option was seen during parsing.  Bit 6 is not
 * assigned.
 */
#define EXT4_SPEC_JQUOTA			(1 <<  0)
#define EXT4_SPEC_JQFMT				(1 <<  1)
#define EXT4_SPEC_DATAJ				(1 <<  2)
#define EXT4_SPEC_SB_BLOCK			(1 <<  3)
#define EXT4_SPEC_JOURNAL_DEV			(1 <<  4)
#define EXT4_SPEC_JOURNAL_IOPRIO		(1 <<  5)
#define EXT4_SPEC_s_want_extra_isize		(1 <<  7)
#define EXT4_SPEC_s_max_batch_time		(1 <<  8)
#define EXT4_SPEC_s_min_batch_time		(1 <<  9)
#define EXT4_SPEC_s_inode_readahead_blks	(1 << 10)
#define EXT4_SPEC_s_li_wait_mult		(1 << 11)
#define EXT4_SPEC_s_max_dir_size_kb		(1 << 12)
#define EXT4_SPEC_s_stripe			(1 << 13)
#define EXT4_SPEC_s_resuid			(1 << 14)
#define EXT4_SPEC_s_resgid			(1 << 15)
#define EXT4_SPEC_s_commit_interval		(1 << 16)
#define EXT4_SPEC_s_fc_debug_max_replay		(1 << 17)
#define EXT4_SPEC_s_sb_block			(1 << 18)
#define EXT4_SPEC_mb_optimize_scan		(1 << 19)
19326e47a3ccSLukas Czerner 
/*
 * Mount-option state collected while parameters are parsed.
 *
 * One instance is allocated zeroed by ext4_init_fs_context(), hung off
 * fs_context->fs_private, filled in by ext4_parse_param() and released by
 * ext4_fc_free().  Each vals_s_X / mask_s_X pair works together: the mask
 * holds every bit an option touched, the vals word holds the value those
 * bits should take.
 */
struct ext4_fs_context {
	/* Journaled quota file names by quota type; kfree()d in ext4_fc_free() */
	char		*s_qf_names[EXT4_MAXQUOTAS];
	/* Filled by the test_dummy_encryption option; freed in ext4_fc_free() */
	struct fscrypt_dummy_policy dummy_enc_policy;
	int		s_jquota_fmt;	/* Format of quota to use */
#ifdef CONFIG_EXT4_DEBUG
	int s_fc_debug_max_replay;
#endif
	/* Bit (1 << qtype) is set once that quota name was noted or cleared */
	unsigned short	qname_spec;
	unsigned long	vals_s_flags;	/* Bits to set in s_flags */
	unsigned long	mask_s_flags;	/* Bits changed in s_flags */
	/* From journal_dev, or new_encode_dev() of the journal_path inode */
	unsigned long	journal_devnum;
	/* "commit" option value multiplied by HZ */
	unsigned long	s_commit_interval;
	unsigned long	s_stripe;
	unsigned int	s_inode_readahead_blks;
	unsigned int	s_want_extra_isize;
	/* EXT4_DEF_LI_WAIT_MULT unless init_itable was given a value */
	unsigned int	s_li_wait_mult;
	unsigned int	s_max_dir_size_kb;
	/* IOPRIO_PRIO_VALUE(IOPRIO_CLASS_BE, n) built from journal_ioprio=n */
	unsigned int	journal_ioprio;
	unsigned int	vals_s_mount_opt;
	unsigned int	mask_s_mount_opt;
	unsigned int	vals_s_mount_opt2;
	unsigned int	mask_s_mount_opt2;
	/* Bit numbers, updated with set_bit() by ctx_set_mount_flag() */
	unsigned long	vals_s_mount_flags;
	unsigned long	mask_s_mount_flags;
	unsigned int	opt_flags;	/* MOPT flags */
	/* EXT4_SPEC_* bits for the options seen so far */
	unsigned int	spec;
	u32		s_max_batch_time;
	u32		s_min_batch_time;
	/* Already validated with uid_valid() / gid_valid() when stored */
	kuid_t		s_resuid;
	kgid_t		s_resgid;
	ext4_fsblk_t	s_sb_block;
};
1965b237e304SHarshad Shirwadkar 
1966cebe85d5SLukas Czerner static void ext4_fc_free(struct fs_context *fc)
1967cebe85d5SLukas Czerner {
1968cebe85d5SLukas Czerner 	struct ext4_fs_context *ctx = fc->fs_private;
1969cebe85d5SLukas Czerner 	int i;
1970cebe85d5SLukas Czerner 
1971cebe85d5SLukas Czerner 	if (!ctx)
1972cebe85d5SLukas Czerner 		return;
1973cebe85d5SLukas Czerner 
1974cebe85d5SLukas Czerner 	for (i = 0; i < EXT4_MAXQUOTAS; i++)
1975cebe85d5SLukas Czerner 		kfree(ctx->s_qf_names[i]);
1976cebe85d5SLukas Czerner 
197785456054SEric Biggers 	fscrypt_free_dummy_policy(&ctx->dummy_enc_policy);
1978cebe85d5SLukas Czerner 	kfree(ctx);
1979cebe85d5SLukas Czerner }
1980cebe85d5SLukas Czerner 
1981cebe85d5SLukas Czerner int ext4_init_fs_context(struct fs_context *fc)
1982cebe85d5SLukas Czerner {
1983da9e4802SDan Carpenter 	struct ext4_fs_context *ctx;
1984cebe85d5SLukas Czerner 
1985cebe85d5SLukas Czerner 	ctx = kzalloc(sizeof(struct ext4_fs_context), GFP_KERNEL);
1986cebe85d5SLukas Czerner 	if (!ctx)
1987cebe85d5SLukas Czerner 		return -ENOMEM;
1988cebe85d5SLukas Czerner 
1989cebe85d5SLukas Czerner 	fc->fs_private = ctx;
1990cebe85d5SLukas Czerner 	fc->ops = &ext4_context_ops;
1991cebe85d5SLukas Czerner 
1992cebe85d5SLukas Czerner 	return 0;
1993cebe85d5SLukas Czerner }
1994cebe85d5SLukas Czerner 
1995e6e268cbSLukas Czerner #ifdef CONFIG_QUOTA
1996e6e268cbSLukas Czerner /*
1997e6e268cbSLukas Czerner  * Note the name of the specified quota file.
1998e6e268cbSLukas Czerner  */
1999e6e268cbSLukas Czerner static int note_qf_name(struct fs_context *fc, int qtype,
2000e6e268cbSLukas Czerner 		       struct fs_parameter *param)
2001e6e268cbSLukas Czerner {
2002e6e268cbSLukas Czerner 	struct ext4_fs_context *ctx = fc->fs_private;
2003e6e268cbSLukas Czerner 	char *qname;
2004e6e268cbSLukas Czerner 
2005e6e268cbSLukas Czerner 	if (param->size < 1) {
2006e6e268cbSLukas Czerner 		ext4_msg(NULL, KERN_ERR, "Missing quota name");
2007e6e268cbSLukas Czerner 		return -EINVAL;
2008e6e268cbSLukas Czerner 	}
2009e6e268cbSLukas Czerner 	if (strchr(param->string, '/')) {
2010e6e268cbSLukas Czerner 		ext4_msg(NULL, KERN_ERR,
2011e6e268cbSLukas Czerner 			 "quotafile must be on filesystem root");
2012e6e268cbSLukas Czerner 		return -EINVAL;
2013e6e268cbSLukas Czerner 	}
2014e6e268cbSLukas Czerner 	if (ctx->s_qf_names[qtype]) {
2015e6e268cbSLukas Czerner 		if (strcmp(ctx->s_qf_names[qtype], param->string) != 0) {
2016e6e268cbSLukas Czerner 			ext4_msg(NULL, KERN_ERR,
2017e6e268cbSLukas Czerner 				 "%s quota file already specified",
2018e6e268cbSLukas Czerner 				 QTYPE2NAME(qtype));
2019e6e268cbSLukas Czerner 			return -EINVAL;
2020e6e268cbSLukas Czerner 		}
2021e6e268cbSLukas Czerner 		return 0;
2022e6e268cbSLukas Czerner 	}
2023e6e268cbSLukas Czerner 
2024e6e268cbSLukas Czerner 	qname = kmemdup_nul(param->string, param->size, GFP_KERNEL);
2025e6e268cbSLukas Czerner 	if (!qname) {
2026e6e268cbSLukas Czerner 		ext4_msg(NULL, KERN_ERR,
2027e6e268cbSLukas Czerner 			 "Not enough memory for storing quotafile name");
2028e6e268cbSLukas Czerner 		return -ENOMEM;
2029e6e268cbSLukas Czerner 	}
2030e6e268cbSLukas Czerner 	ctx->s_qf_names[qtype] = qname;
2031e6e268cbSLukas Czerner 	ctx->qname_spec |= 1 << qtype;
20326e47a3ccSLukas Czerner 	ctx->spec |= EXT4_SPEC_JQUOTA;
2033e6e268cbSLukas Czerner 	return 0;
2034e6e268cbSLukas Czerner }
2035e6e268cbSLukas Czerner 
2036e6e268cbSLukas Czerner /*
2037e6e268cbSLukas Czerner  * Clear the name of the specified quota file.
2038e6e268cbSLukas Czerner  */
2039e6e268cbSLukas Czerner static int unnote_qf_name(struct fs_context *fc, int qtype)
2040e6e268cbSLukas Czerner {
2041e6e268cbSLukas Czerner 	struct ext4_fs_context *ctx = fc->fs_private;
2042e6e268cbSLukas Czerner 
2043e6e268cbSLukas Czerner 	if (ctx->s_qf_names[qtype])
2044e6e268cbSLukas Czerner 		kfree(ctx->s_qf_names[qtype]);
2045e6e268cbSLukas Czerner 
2046e6e268cbSLukas Czerner 	ctx->s_qf_names[qtype] = NULL;
2047e6e268cbSLukas Czerner 	ctx->qname_spec |= 1 << qtype;
20486e47a3ccSLukas Czerner 	ctx->spec |= EXT4_SPEC_JQUOTA;
2049e6e268cbSLukas Czerner 	return 0;
2050e6e268cbSLukas Czerner }
2051e6e268cbSLukas Czerner #endif
2052e6e268cbSLukas Czerner 
205385456054SEric Biggers static int ext4_parse_test_dummy_encryption(const struct fs_parameter *param,
205485456054SEric Biggers 					    struct ext4_fs_context *ctx)
205585456054SEric Biggers {
205685456054SEric Biggers 	int err;
205785456054SEric Biggers 
205885456054SEric Biggers 	if (!IS_ENABLED(CONFIG_FS_ENCRYPTION)) {
205985456054SEric Biggers 		ext4_msg(NULL, KERN_WARNING,
206085456054SEric Biggers 			 "test_dummy_encryption option not supported");
206185456054SEric Biggers 		return -EINVAL;
206285456054SEric Biggers 	}
206385456054SEric Biggers 	err = fscrypt_parse_test_dummy_encryption(param,
206485456054SEric Biggers 						  &ctx->dummy_enc_policy);
206585456054SEric Biggers 	if (err == -EINVAL) {
206685456054SEric Biggers 		ext4_msg(NULL, KERN_WARNING,
206785456054SEric Biggers 			 "Value of option \"%s\" is unrecognized", param->key);
206885456054SEric Biggers 	} else if (err == -EEXIST) {
206985456054SEric Biggers 		ext4_msg(NULL, KERN_WARNING,
207085456054SEric Biggers 			 "Conflicting test_dummy_encryption options");
207185456054SEric Biggers 		return -EINVAL;
207285456054SEric Biggers 	}
207385456054SEric Biggers 	return err;
207485456054SEric Biggers }
207585456054SEric Biggers 
20766e47a3ccSLukas Czerner #define EXT4_SET_CTX(name)						\
20774c246728SLukas Czerner static inline void ctx_set_##name(struct ext4_fs_context *ctx,		\
20784c246728SLukas Czerner 				  unsigned long flag)			\
20796e47a3ccSLukas Czerner {									\
20806e47a3ccSLukas Czerner 	ctx->mask_s_##name |= flag;					\
20816e47a3ccSLukas Czerner 	ctx->vals_s_##name |= flag;					\
2082e3952fccSLukas Czerner }
2083e3952fccSLukas Czerner 
2084e3952fccSLukas Czerner #define EXT4_CLEAR_CTX(name)						\
20854c246728SLukas Czerner static inline void ctx_clear_##name(struct ext4_fs_context *ctx,	\
20864c246728SLukas Czerner 				    unsigned long flag)			\
20876e47a3ccSLukas Czerner {									\
20886e47a3ccSLukas Czerner 	ctx->mask_s_##name |= flag;					\
20896e47a3ccSLukas Czerner 	ctx->vals_s_##name &= ~flag;					\
2090e3952fccSLukas Czerner }
2091e3952fccSLukas Czerner 
2092e3952fccSLukas Czerner #define EXT4_TEST_CTX(name)						\
20934c246728SLukas Czerner static inline unsigned long						\
20944c246728SLukas Czerner ctx_test_##name(struct ext4_fs_context *ctx, unsigned long flag)	\
20956e47a3ccSLukas Czerner {									\
20964c246728SLukas Czerner 	return (ctx->vals_s_##name & flag);				\
2097e3952fccSLukas Czerner }
20986e47a3ccSLukas Czerner 
2099e3952fccSLukas Czerner EXT4_SET_CTX(flags); /* set only */
21006e47a3ccSLukas Czerner EXT4_SET_CTX(mount_opt);
2101e3952fccSLukas Czerner EXT4_CLEAR_CTX(mount_opt);
2102e3952fccSLukas Czerner EXT4_TEST_CTX(mount_opt);
21036e47a3ccSLukas Czerner EXT4_SET_CTX(mount_opt2);
2104e3952fccSLukas Czerner EXT4_CLEAR_CTX(mount_opt2);
2105e3952fccSLukas Czerner EXT4_TEST_CTX(mount_opt2);
2106e3952fccSLukas Czerner 
2107e3952fccSLukas Czerner static inline void ctx_set_mount_flag(struct ext4_fs_context *ctx, int bit)
2108e3952fccSLukas Czerner {
2109e3952fccSLukas Czerner 	set_bit(bit, &ctx->mask_s_mount_flags);
2110e3952fccSLukas Czerner 	set_bit(bit, &ctx->vals_s_mount_flags);
2111e3952fccSLukas Czerner }
21126e47a3ccSLukas Czerner 
211302f960f8SLukas Czerner static int ext4_parse_param(struct fs_context *fc, struct fs_parameter *param)
211426092bf5STheodore Ts'o {
2115461c3af0SLukas Czerner 	struct ext4_fs_context *ctx = fc->fs_private;
2116461c3af0SLukas Czerner 	struct fs_parse_result result;
211726092bf5STheodore Ts'o 	const struct mount_opts *m;
2118461c3af0SLukas Czerner 	int is_remount;
211908cefc7aSEric W. Biederman 	kuid_t uid;
212008cefc7aSEric W. Biederman 	kgid_t gid;
2121461c3af0SLukas Czerner 	int token;
2122461c3af0SLukas Czerner 
2123461c3af0SLukas Czerner 	token = fs_parse(fc, ext4_param_specs, param, &result);
2124461c3af0SLukas Czerner 	if (token < 0)
2125461c3af0SLukas Czerner 		return token;
2126461c3af0SLukas Czerner 	is_remount = fc->purpose == FS_CONTEXT_FOR_RECONFIGURE;
212726092bf5STheodore Ts'o 
2128ba2e524dSLukas Czerner 	for (m = ext4_mount_opts; m->token != Opt_err; m++)
2129ba2e524dSLukas Czerner 		if (token == m->token)
2130ba2e524dSLukas Czerner 			break;
2131ba2e524dSLukas Czerner 
2132ba2e524dSLukas Czerner 	ctx->opt_flags |= m->flags;
2133ba2e524dSLukas Czerner 
2134ba2e524dSLukas Czerner 	if (m->flags & MOPT_EXPLICIT) {
2135ba2e524dSLukas Czerner 		if (m->mount_opt & EXT4_MOUNT_DELALLOC) {
2136ba2e524dSLukas Czerner 			ctx_set_mount_opt2(ctx, EXT4_MOUNT2_EXPLICIT_DELALLOC);
2137ba2e524dSLukas Czerner 		} else if (m->mount_opt & EXT4_MOUNT_JOURNAL_CHECKSUM) {
2138ba2e524dSLukas Czerner 			ctx_set_mount_opt2(ctx,
2139ba2e524dSLukas Czerner 				       EXT4_MOUNT2_EXPLICIT_JOURNAL_CHECKSUM);
2140ba2e524dSLukas Czerner 		} else
2141ba2e524dSLukas Czerner 			return -EINVAL;
2142ba2e524dSLukas Czerner 	}
2143ba2e524dSLukas Czerner 
2144ba2e524dSLukas Czerner 	if (m->flags & MOPT_NOSUPPORT) {
2145ba2e524dSLukas Czerner 		ext4_msg(NULL, KERN_ERR, "%s option not supported",
2146ba2e524dSLukas Czerner 			 param->key);
2147ba2e524dSLukas Czerner 		return 0;
2148ba2e524dSLukas Czerner 	}
2149ba2e524dSLukas Czerner 
2150ba2e524dSLukas Czerner 	switch (token) {
215157f73c2cSTheodore Ts'o #ifdef CONFIG_QUOTA
2152ba2e524dSLukas Czerner 	case Opt_usrjquota:
2153461c3af0SLukas Czerner 		if (!*param->string)
2154e6e268cbSLukas Czerner 			return unnote_qf_name(fc, USRQUOTA);
2155461c3af0SLukas Czerner 		else
2156e6e268cbSLukas Czerner 			return note_qf_name(fc, USRQUOTA, param);
2157ba2e524dSLukas Czerner 	case Opt_grpjquota:
2158461c3af0SLukas Czerner 		if (!*param->string)
2159e6e268cbSLukas Czerner 			return unnote_qf_name(fc, GRPQUOTA);
2160461c3af0SLukas Czerner 		else
2161e6e268cbSLukas Czerner 			return note_qf_name(fc, GRPQUOTA, param);
216257f73c2cSTheodore Ts'o #endif
216326092bf5STheodore Ts'o 	case Opt_sb:
21647edfd85bSLukas Czerner 		if (fc->purpose == FS_CONTEXT_FOR_RECONFIGURE) {
21657edfd85bSLukas Czerner 			ext4_msg(NULL, KERN_WARNING,
21667edfd85bSLukas Czerner 				 "Ignoring %s option on remount", param->key);
21677edfd85bSLukas Czerner 		} else {
21687edfd85bSLukas Czerner 			ctx->s_sb_block = result.uint_32;
21697edfd85bSLukas Czerner 			ctx->spec |= EXT4_SPEC_s_sb_block;
21707edfd85bSLukas Czerner 		}
217102f960f8SLukas Czerner 		return 0;
217226092bf5STheodore Ts'o 	case Opt_removed:
2173da812f61SLukas Czerner 		ext4_msg(NULL, KERN_WARNING, "Ignoring removed %s option",
2174461c3af0SLukas Czerner 			 param->key);
217502f960f8SLukas Czerner 		return 0;
217626092bf5STheodore Ts'o 	case Opt_abort:
2177e3952fccSLukas Czerner 		ctx_set_mount_flag(ctx, EXT4_MF_FS_ABORTED);
217802f960f8SLukas Czerner 		return 0;
21794f74d15fSEric Biggers 	case Opt_inlinecrypt:
21804f74d15fSEric Biggers #ifdef CONFIG_FS_ENCRYPTION_INLINE_CRYPT
21816e47a3ccSLukas Czerner 		ctx_set_flags(ctx, SB_INLINECRYPT);
21824f74d15fSEric Biggers #else
2183da812f61SLukas Czerner 		ext4_msg(NULL, KERN_ERR, "inline encryption not supported");
21844f74d15fSEric Biggers #endif
218502f960f8SLukas Czerner 		return 0;
2186461c3af0SLukas Czerner 	case Opt_errors:
21876e47a3ccSLukas Czerner 		ctx_clear_mount_opt(ctx, EXT4_MOUNT_ERRORS_MASK);
2188ba2e524dSLukas Czerner 		ctx_set_mount_opt(ctx, result.uint_32);
2189ba2e524dSLukas Czerner 		return 0;
2190ba2e524dSLukas Czerner #ifdef CONFIG_QUOTA
2191ba2e524dSLukas Czerner 	case Opt_jqfmt:
2192ba2e524dSLukas Czerner 		ctx->s_jquota_fmt = result.uint_32;
2193ba2e524dSLukas Czerner 		ctx->spec |= EXT4_SPEC_JQFMT;
2194ba2e524dSLukas Czerner 		return 0;
2195ba2e524dSLukas Czerner #endif
2196ba2e524dSLukas Czerner 	case Opt_data:
2197ba2e524dSLukas Czerner 		ctx_clear_mount_opt(ctx, EXT4_MOUNT_DATA_FLAGS);
2198ba2e524dSLukas Czerner 		ctx_set_mount_opt(ctx, result.uint_32);
2199ba2e524dSLukas Czerner 		ctx->spec |= EXT4_SPEC_DATAJ;
2200ba2e524dSLukas Czerner 		return 0;
2201ba2e524dSLukas Czerner 	case Opt_commit:
2202461c3af0SLukas Czerner 		if (result.uint_32 == 0)
2203934b0de1SWang Jianjian 			result.uint_32 = JBD2_DEFAULT_MAX_COMMIT_AGE;
2204461c3af0SLukas Czerner 		else if (result.uint_32 > INT_MAX / HZ) {
2205da812f61SLukas Czerner 			ext4_msg(NULL, KERN_ERR,
22069ba55543Szhangyi (F) 				 "Invalid commit interval %d, "
22079ba55543Szhangyi (F) 				 "must be smaller than %d",
2208461c3af0SLukas Czerner 				 result.uint_32, INT_MAX / HZ);
2209da812f61SLukas Czerner 			return -EINVAL;
22109ba55543Szhangyi (F) 		}
22116e47a3ccSLukas Czerner 		ctx->s_commit_interval = HZ * result.uint_32;
22126e47a3ccSLukas Czerner 		ctx->spec |= EXT4_SPEC_s_commit_interval;
2213ba2e524dSLukas Czerner 		return 0;
2214ba2e524dSLukas Czerner 	case Opt_debug_want_extra_isize:
22156e47a3ccSLukas Czerner 		if ((result.uint_32 & 1) || (result.uint_32 < 4)) {
2216da812f61SLukas Czerner 			ext4_msg(NULL, KERN_ERR,
2217461c3af0SLukas Czerner 				 "Invalid want_extra_isize %d", result.uint_32);
2218da812f61SLukas Czerner 			return -EINVAL;
22199803387cSTheodore Ts'o 		}
22206e47a3ccSLukas Czerner 		ctx->s_want_extra_isize = result.uint_32;
22216e47a3ccSLukas Czerner 		ctx->spec |= EXT4_SPEC_s_want_extra_isize;
2222ba2e524dSLukas Czerner 		return 0;
2223ba2e524dSLukas Czerner 	case Opt_max_batch_time:
22246e47a3ccSLukas Czerner 		ctx->s_max_batch_time = result.uint_32;
22256e47a3ccSLukas Czerner 		ctx->spec |= EXT4_SPEC_s_max_batch_time;
2226ba2e524dSLukas Czerner 		return 0;
2227ba2e524dSLukas Czerner 	case Opt_min_batch_time:
22286e47a3ccSLukas Czerner 		ctx->s_min_batch_time = result.uint_32;
22296e47a3ccSLukas Czerner 		ctx->spec |= EXT4_SPEC_s_min_batch_time;
2230ba2e524dSLukas Czerner 		return 0;
2231ba2e524dSLukas Czerner 	case Opt_inode_readahead_blks:
2232461c3af0SLukas Czerner 		if (result.uint_32 &&
2233461c3af0SLukas Czerner 		    (result.uint_32 > (1 << 30) ||
2234461c3af0SLukas Czerner 		     !is_power_of_2(result.uint_32))) {
2235da812f61SLukas Czerner 			ext4_msg(NULL, KERN_ERR,
2236e33e60eaSJan Kara 				 "EXT4-fs: inode_readahead_blks must be "
2237e33e60eaSJan Kara 				 "0 or a power of 2 smaller than 2^31");
2238da812f61SLukas Czerner 			return -EINVAL;
223926092bf5STheodore Ts'o 		}
22406e47a3ccSLukas Czerner 		ctx->s_inode_readahead_blks = result.uint_32;
22416e47a3ccSLukas Czerner 		ctx->spec |= EXT4_SPEC_s_inode_readahead_blks;
2242ba2e524dSLukas Czerner 		return 0;
2243ba2e524dSLukas Czerner 	case Opt_init_itable:
22446e47a3ccSLukas Czerner 		ctx_set_mount_opt(ctx, EXT4_MOUNT_INIT_INODE_TABLE);
22456e47a3ccSLukas Czerner 		ctx->s_li_wait_mult = EXT4_DEF_LI_WAIT_MULT;
2246461c3af0SLukas Czerner 		if (param->type == fs_value_is_string)
22476e47a3ccSLukas Czerner 			ctx->s_li_wait_mult = result.uint_32;
22486e47a3ccSLukas Czerner 		ctx->spec |= EXT4_SPEC_s_li_wait_mult;
2249ba2e524dSLukas Czerner 		return 0;
2250ba2e524dSLukas Czerner 	case Opt_max_dir_size_kb:
22516e47a3ccSLukas Czerner 		ctx->s_max_dir_size_kb = result.uint_32;
22526e47a3ccSLukas Czerner 		ctx->spec |= EXT4_SPEC_s_max_dir_size_kb;
2253ba2e524dSLukas Czerner 		return 0;
22548016e29fSHarshad Shirwadkar #ifdef CONFIG_EXT4_DEBUG
2255ba2e524dSLukas Czerner 	case Opt_fc_debug_max_replay:
22566e47a3ccSLukas Czerner 		ctx->s_fc_debug_max_replay = result.uint_32;
22576e47a3ccSLukas Czerner 		ctx->spec |= EXT4_SPEC_s_fc_debug_max_replay;
2258ba2e524dSLukas Czerner 		return 0;
22598016e29fSHarshad Shirwadkar #endif
2260ba2e524dSLukas Czerner 	case Opt_stripe:
22616e47a3ccSLukas Czerner 		ctx->s_stripe = result.uint_32;
22626e47a3ccSLukas Czerner 		ctx->spec |= EXT4_SPEC_s_stripe;
2263ba2e524dSLukas Czerner 		return 0;
2264ba2e524dSLukas Czerner 	case Opt_resuid:
2265461c3af0SLukas Czerner 		uid = make_kuid(current_user_ns(), result.uint_32);
22660efb3b23SJan Kara 		if (!uid_valid(uid)) {
2267da812f61SLukas Czerner 			ext4_msg(NULL, KERN_ERR, "Invalid uid value %d",
2268461c3af0SLukas Czerner 				 result.uint_32);
2269da812f61SLukas Czerner 			return -EINVAL;
22700efb3b23SJan Kara 		}
22716e47a3ccSLukas Czerner 		ctx->s_resuid = uid;
22726e47a3ccSLukas Czerner 		ctx->spec |= EXT4_SPEC_s_resuid;
2273ba2e524dSLukas Czerner 		return 0;
2274ba2e524dSLukas Czerner 	case Opt_resgid:
2275461c3af0SLukas Czerner 		gid = make_kgid(current_user_ns(), result.uint_32);
22760efb3b23SJan Kara 		if (!gid_valid(gid)) {
2277da812f61SLukas Czerner 			ext4_msg(NULL, KERN_ERR, "Invalid gid value %d",
2278461c3af0SLukas Czerner 				 result.uint_32);
2279da812f61SLukas Czerner 			return -EINVAL;
22800efb3b23SJan Kara 		}
22816e47a3ccSLukas Czerner 		ctx->s_resgid = gid;
22826e47a3ccSLukas Czerner 		ctx->spec |= EXT4_SPEC_s_resgid;
2283ba2e524dSLukas Czerner 		return 0;
2284ba2e524dSLukas Czerner 	case Opt_journal_dev:
22850efb3b23SJan Kara 		if (is_remount) {
2286da812f61SLukas Czerner 			ext4_msg(NULL, KERN_ERR,
22870efb3b23SJan Kara 				 "Cannot specify journal on remount");
2288da812f61SLukas Czerner 			return -EINVAL;
22890efb3b23SJan Kara 		}
2290461c3af0SLukas Czerner 		ctx->journal_devnum = result.uint_32;
22916e47a3ccSLukas Czerner 		ctx->spec |= EXT4_SPEC_JOURNAL_DEV;
2292ba2e524dSLukas Czerner 		return 0;
2293ba2e524dSLukas Czerner 	case Opt_journal_path:
2294ba2e524dSLukas Czerner 	{
2295ad4eec61SEric Sandeen 		struct inode *journal_inode;
2296ad4eec61SEric Sandeen 		struct path path;
2297ad4eec61SEric Sandeen 		int error;
2298ad4eec61SEric Sandeen 
2299ad4eec61SEric Sandeen 		if (is_remount) {
2300da812f61SLukas Czerner 			ext4_msg(NULL, KERN_ERR,
2301ad4eec61SEric Sandeen 				 "Cannot specify journal on remount");
2302da812f61SLukas Czerner 			return -EINVAL;
2303ad4eec61SEric Sandeen 		}
2304ad4eec61SEric Sandeen 
2305e3ea75eeSLukas Czerner 		error = fs_lookup_param(fc, param, 1, LOOKUP_FOLLOW, &path);
2306ad4eec61SEric Sandeen 		if (error) {
2307da812f61SLukas Czerner 			ext4_msg(NULL, KERN_ERR, "error: could not find "
2308461c3af0SLukas Czerner 				 "journal device path");
2309da812f61SLukas Czerner 			return -EINVAL;
2310ad4eec61SEric Sandeen 		}
2311ad4eec61SEric Sandeen 
23122b0143b5SDavid Howells 		journal_inode = d_inode(path.dentry);
2313461c3af0SLukas Czerner 		ctx->journal_devnum = new_encode_dev(journal_inode->i_rdev);
23146e47a3ccSLukas Czerner 		ctx->spec |= EXT4_SPEC_JOURNAL_DEV;
2315ad4eec61SEric Sandeen 		path_put(&path);
2316ba2e524dSLukas Czerner 		return 0;
2317ba2e524dSLukas Czerner 	}
2318ba2e524dSLukas Czerner 	case Opt_journal_ioprio:
2319461c3af0SLukas Czerner 		if (result.uint_32 > 7) {
2320da812f61SLukas Czerner 			ext4_msg(NULL, KERN_ERR, "Invalid journal IO priority"
23210efb3b23SJan Kara 				 " (must be 0-7)");
2322da812f61SLukas Czerner 			return -EINVAL;
23230efb3b23SJan Kara 		}
2324461c3af0SLukas Czerner 		ctx->journal_ioprio =
2325461c3af0SLukas Czerner 			IOPRIO_PRIO_VALUE(IOPRIO_CLASS_BE, result.uint_32);
23266e47a3ccSLukas Czerner 		ctx->spec |= EXT4_SPEC_JOURNAL_IOPRIO;
2327ba2e524dSLukas Czerner 		return 0;
2328ba2e524dSLukas Czerner 	case Opt_test_dummy_encryption:
232985456054SEric Biggers 		return ext4_parse_test_dummy_encryption(param, ctx);
2330ba2e524dSLukas Czerner 	case Opt_dax:
2331ba2e524dSLukas Czerner 	case Opt_dax_type:
2332ef83b6e8SDan Williams #ifdef CONFIG_FS_DAX
2333ba2e524dSLukas Czerner 	{
2334ba2e524dSLukas Czerner 		int type = (token == Opt_dax) ?
2335ba2e524dSLukas Czerner 			   Opt_dax : result.uint_32;
2336ba2e524dSLukas Czerner 
2337ba2e524dSLukas Czerner 		switch (type) {
23389cb20f94SIra Weiny 		case Opt_dax:
23399cb20f94SIra Weiny 		case Opt_dax_always:
2340ba2e524dSLukas Czerner 			ctx_set_mount_opt(ctx, EXT4_MOUNT_DAX_ALWAYS);
23416e47a3ccSLukas Czerner 			ctx_clear_mount_opt2(ctx, EXT4_MOUNT2_DAX_NEVER);
23429cb20f94SIra Weiny 			break;
23439cb20f94SIra Weiny 		case Opt_dax_never:
2344ba2e524dSLukas Czerner 			ctx_set_mount_opt2(ctx, EXT4_MOUNT2_DAX_NEVER);
23456e47a3ccSLukas Czerner 			ctx_clear_mount_opt(ctx, EXT4_MOUNT_DAX_ALWAYS);
23469cb20f94SIra Weiny 			break;
23479cb20f94SIra Weiny 		case Opt_dax_inode:
23486e47a3ccSLukas Czerner 			ctx_clear_mount_opt(ctx, EXT4_MOUNT_DAX_ALWAYS);
23496e47a3ccSLukas Czerner 			ctx_clear_mount_opt2(ctx, EXT4_MOUNT2_DAX_NEVER);
23509cb20f94SIra Weiny 			/* Strictly for printing options */
2351ba2e524dSLukas Czerner 			ctx_set_mount_opt2(ctx, EXT4_MOUNT2_DAX_INODE);
23529cb20f94SIra Weiny 			break;
23539cb20f94SIra Weiny 		}
2354ba2e524dSLukas Czerner 		return 0;
2355ba2e524dSLukas Czerner 	}
2356ef83b6e8SDan Williams #else
2357da812f61SLukas Czerner 		ext4_msg(NULL, KERN_INFO, "dax option not supported");
2358da812f61SLukas Czerner 		return -EINVAL;
2359923ae0ffSRoss Zwisler #endif
2360ba2e524dSLukas Czerner 	case Opt_data_err:
2361ba2e524dSLukas Czerner 		if (result.uint_32 == Opt_data_err_abort)
23626e47a3ccSLukas Czerner 			ctx_set_mount_opt(ctx, m->mount_opt);
2363ba2e524dSLukas Czerner 		else if (result.uint_32 == Opt_data_err_ignore)
23646e47a3ccSLukas Czerner 			ctx_clear_mount_opt(ctx, m->mount_opt);
2365ba2e524dSLukas Czerner 		return 0;
2366ba2e524dSLukas Czerner 	case Opt_mb_optimize_scan:
236727b38686SOjaswin Mujoo 		if (result.int_32 == 1) {
236827b38686SOjaswin Mujoo 			ctx_set_mount_opt2(ctx, EXT4_MOUNT2_MB_OPTIMIZE_SCAN);
236927b38686SOjaswin Mujoo 			ctx->spec |= EXT4_SPEC_mb_optimize_scan;
237027b38686SOjaswin Mujoo 		} else if (result.int_32 == 0) {
237127b38686SOjaswin Mujoo 			ctx_clear_mount_opt2(ctx, EXT4_MOUNT2_MB_OPTIMIZE_SCAN);
237227b38686SOjaswin Mujoo 			ctx->spec |= EXT4_SPEC_mb_optimize_scan;
237327b38686SOjaswin Mujoo 		} else {
2374da812f61SLukas Czerner 			ext4_msg(NULL, KERN_WARNING,
2375196e402aSHarshad Shirwadkar 				 "mb_optimize_scan should be set to 0 or 1.");
2376da812f61SLukas Czerner 			return -EINVAL;
2377196e402aSHarshad Shirwadkar 		}
2378ba2e524dSLukas Czerner 		return 0;
2379ba2e524dSLukas Czerner 	}
2380ba2e524dSLukas Czerner 
2381ba2e524dSLukas Czerner 	/*
2382ba2e524dSLukas Czerner 	 * At this point we should only be getting options requiring MOPT_SET,
2383ba2e524dSLukas Czerner 	 * or MOPT_CLEAR. Anything else is a bug
2384ba2e524dSLukas Czerner 	 */
2385ba2e524dSLukas Czerner 	if (m->token == Opt_err) {
2386ba2e524dSLukas Czerner 		ext4_msg(NULL, KERN_WARNING, "buggy handling of option %s",
2387ba2e524dSLukas Czerner 			 param->key);
2388ba2e524dSLukas Czerner 		WARN_ON(1);
2389ba2e524dSLukas Czerner 		return -EINVAL;
2390ba2e524dSLukas Czerner 	}
2391ba2e524dSLukas Czerner 
2392ba2e524dSLukas Czerner 	else {
2393461c3af0SLukas Czerner 		unsigned int set = 0;
2394461c3af0SLukas Czerner 
2395461c3af0SLukas Czerner 		if ((param->type == fs_value_is_flag) ||
2396461c3af0SLukas Czerner 		    result.uint_32 > 0)
2397461c3af0SLukas Czerner 			set = 1;
2398461c3af0SLukas Czerner 
239926092bf5STheodore Ts'o 		if (m->flags & MOPT_CLEAR)
2400461c3af0SLukas Czerner 			set = !set;
240126092bf5STheodore Ts'o 		else if (unlikely(!(m->flags & MOPT_SET))) {
2402da812f61SLukas Czerner 			ext4_msg(NULL, KERN_WARNING,
2403461c3af0SLukas Czerner 				 "buggy handling of option %s",
2404461c3af0SLukas Czerner 				 param->key);
240526092bf5STheodore Ts'o 			WARN_ON(1);
2406da812f61SLukas Czerner 			return -EINVAL;
240726092bf5STheodore Ts'o 		}
2408995a3ed6SHarshad Shirwadkar 		if (m->flags & MOPT_2) {
2409461c3af0SLukas Czerner 			if (set != 0)
24106e47a3ccSLukas Czerner 				ctx_set_mount_opt2(ctx, m->mount_opt);
2411995a3ed6SHarshad Shirwadkar 			else
24126e47a3ccSLukas Czerner 				ctx_clear_mount_opt2(ctx, m->mount_opt);
2413995a3ed6SHarshad Shirwadkar 		} else {
2414461c3af0SLukas Czerner 			if (set != 0)
24156e47a3ccSLukas Czerner 				ctx_set_mount_opt(ctx, m->mount_opt);
241626092bf5STheodore Ts'o 			else
24176e47a3ccSLukas Czerner 				ctx_clear_mount_opt(ctx, m->mount_opt);
241826092bf5STheodore Ts'o 		}
2419995a3ed6SHarshad Shirwadkar 	}
2420ba2e524dSLukas Czerner 
242102f960f8SLukas Czerner 	return 0;
242226092bf5STheodore Ts'o }
242326092bf5STheodore Ts'o 
24247edfd85bSLukas Czerner static int parse_options(struct fs_context *fc, char *options)
2425ac27a0ecSDave Kleikamp {
2426461c3af0SLukas Czerner 	struct fs_parameter param;
2427461c3af0SLukas Czerner 	int ret;
2428461c3af0SLukas Czerner 	char *key;
2429ac27a0ecSDave Kleikamp 
2430ac27a0ecSDave Kleikamp 	if (!options)
24317edfd85bSLukas Czerner 		return 0;
2432461c3af0SLukas Czerner 
2433461c3af0SLukas Czerner 	while ((key = strsep(&options, ",")) != NULL) {
2434461c3af0SLukas Czerner 		if (*key) {
2435461c3af0SLukas Czerner 			size_t v_len = 0;
2436461c3af0SLukas Czerner 			char *value = strchr(key, '=');
2437461c3af0SLukas Czerner 
2438461c3af0SLukas Czerner 			param.type = fs_value_is_flag;
2439461c3af0SLukas Czerner 			param.string = NULL;
2440461c3af0SLukas Czerner 
2441461c3af0SLukas Czerner 			if (value) {
2442461c3af0SLukas Czerner 				if (value == key)
2443ac27a0ecSDave Kleikamp 					continue;
2444461c3af0SLukas Czerner 
2445461c3af0SLukas Czerner 				*value++ = 0;
2446461c3af0SLukas Czerner 				v_len = strlen(value);
2447461c3af0SLukas Czerner 				param.string = kmemdup_nul(value, v_len,
2448461c3af0SLukas Czerner 							   GFP_KERNEL);
2449461c3af0SLukas Czerner 				if (!param.string)
24507edfd85bSLukas Czerner 					return -ENOMEM;
2451461c3af0SLukas Czerner 				param.type = fs_value_is_string;
2452461c3af0SLukas Czerner 			}
2453461c3af0SLukas Czerner 
2454461c3af0SLukas Czerner 			param.key = key;
2455461c3af0SLukas Czerner 			param.size = v_len;
2456461c3af0SLukas Czerner 
245702f960f8SLukas Czerner 			ret = ext4_parse_param(fc, &param);
2458461c3af0SLukas Czerner 			if (param.string)
2459461c3af0SLukas Czerner 				kfree(param.string);
2460461c3af0SLukas Czerner 			if (ret < 0)
24617edfd85bSLukas Czerner 				return ret;
2462ac27a0ecSDave Kleikamp 		}
2463461c3af0SLukas Czerner 	}
2464461c3af0SLukas Czerner 
24657edfd85bSLukas Czerner 	ret = ext4_validate_options(fc);
2466da812f61SLukas Czerner 	if (ret < 0)
24677edfd85bSLukas Czerner 		return ret;
24687edfd85bSLukas Czerner 
24697edfd85bSLukas Czerner 	return 0;
24707edfd85bSLukas Czerner }
24717edfd85bSLukas Czerner 
24727edfd85bSLukas Czerner static int parse_apply_sb_mount_options(struct super_block *sb,
24737edfd85bSLukas Czerner 					struct ext4_fs_context *m_ctx)
24747edfd85bSLukas Czerner {
24757edfd85bSLukas Czerner 	struct ext4_sb_info *sbi = EXT4_SB(sb);
24767edfd85bSLukas Czerner 	char *s_mount_opts = NULL;
24777edfd85bSLukas Czerner 	struct ext4_fs_context *s_ctx = NULL;
24787edfd85bSLukas Czerner 	struct fs_context *fc = NULL;
24797edfd85bSLukas Czerner 	int ret = -ENOMEM;
24807edfd85bSLukas Czerner 
24817edfd85bSLukas Czerner 	if (!sbi->s_es->s_mount_opts[0])
2482da812f61SLukas Czerner 		return 0;
2483da812f61SLukas Czerner 
24847edfd85bSLukas Czerner 	s_mount_opts = kstrndup(sbi->s_es->s_mount_opts,
24857edfd85bSLukas Czerner 				sizeof(sbi->s_es->s_mount_opts),
24867edfd85bSLukas Czerner 				GFP_KERNEL);
24877edfd85bSLukas Czerner 	if (!s_mount_opts)
24887edfd85bSLukas Czerner 		return ret;
2489e6e268cbSLukas Czerner 
24907edfd85bSLukas Czerner 	fc = kzalloc(sizeof(struct fs_context), GFP_KERNEL);
24917edfd85bSLukas Czerner 	if (!fc)
24927edfd85bSLukas Czerner 		goto out_free;
2493e6e268cbSLukas Czerner 
24947edfd85bSLukas Czerner 	s_ctx = kzalloc(sizeof(struct ext4_fs_context), GFP_KERNEL);
24957edfd85bSLukas Czerner 	if (!s_ctx)
24967edfd85bSLukas Czerner 		goto out_free;
24977edfd85bSLukas Czerner 
24987edfd85bSLukas Czerner 	fc->fs_private = s_ctx;
24997edfd85bSLukas Czerner 	fc->s_fs_info = sbi;
25007edfd85bSLukas Czerner 
25017edfd85bSLukas Czerner 	ret = parse_options(fc, s_mount_opts);
25027edfd85bSLukas Czerner 	if (ret < 0)
25037edfd85bSLukas Czerner 		goto parse_failed;
25047edfd85bSLukas Czerner 
25057edfd85bSLukas Czerner 	ret = ext4_check_opt_consistency(fc, sb);
25067edfd85bSLukas Czerner 	if (ret < 0) {
25077edfd85bSLukas Czerner parse_failed:
25087edfd85bSLukas Czerner 		ext4_msg(sb, KERN_WARNING,
25097edfd85bSLukas Czerner 			 "failed to parse options in superblock: %s",
25107edfd85bSLukas Czerner 			 s_mount_opts);
25117edfd85bSLukas Czerner 		ret = 0;
25127edfd85bSLukas Czerner 		goto out_free;
25137edfd85bSLukas Czerner 	}
25147edfd85bSLukas Czerner 
25157edfd85bSLukas Czerner 	if (s_ctx->spec & EXT4_SPEC_JOURNAL_DEV)
25167edfd85bSLukas Czerner 		m_ctx->journal_devnum = s_ctx->journal_devnum;
25177edfd85bSLukas Czerner 	if (s_ctx->spec & EXT4_SPEC_JOURNAL_IOPRIO)
25187edfd85bSLukas Czerner 		m_ctx->journal_ioprio = s_ctx->journal_ioprio;
25197edfd85bSLukas Czerner 
252085456054SEric Biggers 	ext4_apply_options(fc, sb);
252185456054SEric Biggers 	ret = 0;
25227edfd85bSLukas Czerner 
25237edfd85bSLukas Czerner out_free:
2524c069db76SEric Biggers 	if (fc) {
2525c069db76SEric Biggers 		ext4_fc_free(fc);
25267edfd85bSLukas Czerner 		kfree(fc);
2527c069db76SEric Biggers 	}
25287edfd85bSLukas Czerner 	kfree(s_mount_opts);
25297edfd85bSLukas Czerner 	return ret;
25304c94bff9SLukas Czerner }
25314c94bff9SLukas Czerner 
/*
 * Transfer journaled quota settings from the parsed context in @fc to the
 * superblock info of @sb.
 *
 * Does nothing when the filesystem has the quota feature or when the kernel
 * is built without CONFIG_QUOTA.  For every quota type whose file name was
 * specified, the name pointer is moved from the context into
 * sbi->s_qf_names[] (the context slot is cleared) and the previously
 * installed name, if any, is released via kfree_rcu().  A non-NULL new name
 * also sets the QUOTA mount option.
 */
static void ext4_apply_quota_options(struct fs_context *fc,
				     struct super_block *sb)
{
#ifdef CONFIG_QUOTA
	struct ext4_sb_info *sbi = EXT4_SB(sb);
	struct ext4_fs_context *ctx = fc->fs_private;
	int type;

	if (ext4_has_feature_quota(sb))
		return;

	if (ctx->spec & EXT4_SPEC_JQUOTA) {
		for (type = 0; type < EXT4_MAXQUOTAS; type++) {
			char *new_name, *old_name;

			/* Skip quota types not mentioned in the options */
			if ((ctx->qname_spec & (1 << type)) == 0)
				continue;

			/* Take the name away from the context; may be NULL */
			new_name = ctx->s_qf_names[type];
			ctx->s_qf_names[type] = NULL;
			if (new_name)
				set_opt(sb, QUOTA);

			old_name = rcu_replace_pointer(sbi->s_qf_names[type],
						new_name,
						lockdep_is_held(&sb->s_umount));
			if (old_name)
				kfree_rcu(old_name);
		}
	}

	if (ctx->spec & EXT4_SPEC_JQFMT)
		sbi->s_jquota_fmt = ctx->s_jquota_fmt;
#endif
}
2565e6e268cbSLukas Czerner 
/*
 * Check quota settings consistency.
 *
 * Verifies that the quota-related options parsed into the context of @fc
 * can be combined with the current state of @sb.  Returns 0 when they are
 * acceptable and -EINVAL (after logging the reason) otherwise.  Without
 * CONFIG_QUOTA this always returns 0.
 *
 * As a side effect the USRQUOTA/GRPQUOTA mount options are cleared in the
 * context when a journaled quota file name exists for that quota type.
 */
static int ext4_check_quota_consistency(struct fs_context *fc,
					struct super_block *sb)
{
#ifdef CONFIG_QUOTA
	struct ext4_sb_info *sbi = EXT4_SB(sb);
	struct ext4_fs_context *ctx = fc->fs_private;
	bool quota_feature = ext4_has_feature_quota(sb);
	bool quota_loaded = sb_any_quota_loaded(sb);
	bool usr_file, grp_file, legacy_usr, legacy_grp;
	int quota_flags = EXT4_MOUNT_QUOTA | EXT4_MOUNT_USRQUOTA |
			  EXT4_MOUNT_GRPQUOTA | EXT4_MOUNT_PRJQUOTA;
	int type;

	/*
	 * We do the test below only for project quotas. 'usrquota' and
	 * 'grpquota' mount options are allowed even without quota feature
	 * to support legacy quotas in quota files.
	 */
	if (ctx_test_mount_opt(ctx, EXT4_MOUNT_PRJQUOTA) &&
	    !ext4_has_feature_project(sb)) {
		ext4_msg(NULL, KERN_ERR, "Project quota feature not enabled. "
			 "Cannot enable project quota enforcement.");
		return -EINVAL;
	}

	/* Quota options were touched but none is left set while loaded */
	if (quota_loaded &&
	    (ctx->mask_s_mount_opt & quota_flags) &&
	    !ctx_test_mount_opt(ctx, quota_flags))
		goto err_quota_change;

	if (ctx->spec & EXT4_SPEC_JQUOTA) {
		for (type = 0; type < EXT4_MAXQUOTAS; type++) {
			if ((ctx->qname_spec & (1 << type)) == 0)
				continue;

			/* Adding or dropping a file name while quota is on */
			if (quota_loaded &&
			    !sbi->s_qf_names[type] != !ctx->s_qf_names[type])
				goto err_jquota_change;

			/* Both present: they have to name the same file */
			if (sbi->s_qf_names[type] && ctx->s_qf_names[type] &&
			    strcmp(get_qf_name(sb, sbi, type),
				   ctx->s_qf_names[type]) != 0)
				goto err_jquota_specified;
		}

		if (quota_feature) {
			ext4_msg(NULL, KERN_INFO,
				 "Journaled quota options ignored when "
				 "QUOTA feature is enabled");
			return 0;
		}
	}

	if (ctx->spec & EXT4_SPEC_JQFMT) {
		if (quota_loaded && sbi->s_jquota_fmt != ctx->s_jquota_fmt)
			goto err_jquota_change;
		if (quota_feature) {
			ext4_msg(NULL, KERN_INFO, "Quota format mount options "
				 "ignored when QUOTA feature is enabled");
			return 0;
		}
	}

	/* Make sure we don't mix old and new quota format */
	usr_file = (get_qf_name(sb, sbi, USRQUOTA) ||
		    ctx->s_qf_names[USRQUOTA]);
	grp_file = (get_qf_name(sb, sbi, GRPQUOTA) ||
		    ctx->s_qf_names[GRPQUOTA]);

	legacy_usr = (ctx_test_mount_opt(ctx, EXT4_MOUNT_USRQUOTA) ||
		      test_opt(sb, USRQUOTA));
	legacy_grp = (ctx_test_mount_opt(ctx, EXT4_MOUNT_GRPQUOTA) ||
		      test_opt(sb, GRPQUOTA));

	/* A quota file name overrides the plain option of the same type */
	if (usr_file) {
		ctx_clear_mount_opt(ctx, EXT4_MOUNT_USRQUOTA);
		legacy_usr = false;
	}
	if (grp_file) {
		ctx_clear_mount_opt(ctx, EXT4_MOUNT_GRPQUOTA);
		legacy_grp = false;
	}

	/* No quota file names at all: nothing further to check */
	if (!usr_file && !grp_file)
		return 0;

	if (legacy_usr || legacy_grp) {
		ext4_msg(NULL, KERN_ERR, "old and new quota "
			 "format mixing");
		return -EINVAL;
	}

	if (!(ctx->spec & EXT4_SPEC_JQFMT) && !sbi->s_jquota_fmt) {
		ext4_msg(NULL, KERN_ERR, "journaled quota format "
			 "not specified");
		return -EINVAL;
	}

	return 0;

err_quota_change:
	ext4_msg(NULL, KERN_ERR,
		 "Cannot change quota options when quota turned on");
	return -EINVAL;
err_jquota_change:
	ext4_msg(NULL, KERN_ERR, "Cannot change journaled quota "
		 "options when quota turned on");
	return -EINVAL;
err_jquota_specified:
	ext4_msg(NULL, KERN_ERR, "%s quota file already specified",
		 QTYPE2NAME(type));
	return -EINVAL;
#else
	return 0;
#endif
}
2686e6e268cbSLukas Czerner 
26875f41fdaeSEric Biggers static int ext4_check_test_dummy_encryption(const struct fs_context *fc,
26885f41fdaeSEric Biggers 					    struct super_block *sb)
26895f41fdaeSEric Biggers {
26905f41fdaeSEric Biggers 	const struct ext4_fs_context *ctx = fc->fs_private;
26915f41fdaeSEric Biggers 	const struct ext4_sb_info *sbi = EXT4_SB(sb);
26925f41fdaeSEric Biggers 
269385456054SEric Biggers 	if (!fscrypt_is_dummy_policy_set(&ctx->dummy_enc_policy))
26945f41fdaeSEric Biggers 		return 0;
26955f41fdaeSEric Biggers 
26965f41fdaeSEric Biggers 	if (!ext4_has_feature_encrypt(sb)) {
26975f41fdaeSEric Biggers 		ext4_msg(NULL, KERN_WARNING,
26985f41fdaeSEric Biggers 			 "test_dummy_encryption requires encrypt feature");
26995f41fdaeSEric Biggers 		return -EINVAL;
27005f41fdaeSEric Biggers 	}
27015f41fdaeSEric Biggers 	/*
27025f41fdaeSEric Biggers 	 * This mount option is just for testing, and it's not worthwhile to
27035f41fdaeSEric Biggers 	 * implement the extra complexity (e.g. RCU protection) that would be
27045f41fdaeSEric Biggers 	 * needed to allow it to be set or changed during remount.  We do allow
27055f41fdaeSEric Biggers 	 * it to be specified during remount, but only if there is no change.
27065f41fdaeSEric Biggers 	 */
270785456054SEric Biggers 	if (fc->purpose == FS_CONTEXT_FOR_RECONFIGURE) {
270885456054SEric Biggers 		if (fscrypt_dummy_policies_equal(&sbi->s_dummy_enc_policy,
270985456054SEric Biggers 						 &ctx->dummy_enc_policy))
271085456054SEric Biggers 			return 0;
27115f41fdaeSEric Biggers 		ext4_msg(NULL, KERN_WARNING,
271285456054SEric Biggers 			 "Can't set or change test_dummy_encryption on remount");
27135f41fdaeSEric Biggers 		return -EINVAL;
27145f41fdaeSEric Biggers 	}
271585456054SEric Biggers 	/* Also make sure s_mount_opts didn't contain a conflicting value. */
271685456054SEric Biggers 	if (fscrypt_is_dummy_policy_set(&sbi->s_dummy_enc_policy)) {
271785456054SEric Biggers 		if (fscrypt_dummy_policies_equal(&sbi->s_dummy_enc_policy,
271885456054SEric Biggers 						 &ctx->dummy_enc_policy))
27195f41fdaeSEric Biggers 			return 0;
272085456054SEric Biggers 		ext4_msg(NULL, KERN_WARNING,
272185456054SEric Biggers 			 "Conflicting test_dummy_encryption options");
272285456054SEric Biggers 		return -EINVAL;
272385456054SEric Biggers 	}
27247959eb19SEric Biggers 	return 0;
272585456054SEric Biggers }
272685456054SEric Biggers 
272785456054SEric Biggers static void ext4_apply_test_dummy_encryption(struct ext4_fs_context *ctx,
272885456054SEric Biggers 					     struct super_block *sb)
272985456054SEric Biggers {
273085456054SEric Biggers 	if (!fscrypt_is_dummy_policy_set(&ctx->dummy_enc_policy) ||
273185456054SEric Biggers 	    /* if already set, it was already verified to be the same */
273285456054SEric Biggers 	    fscrypt_is_dummy_policy_set(&EXT4_SB(sb)->s_dummy_enc_policy))
273385456054SEric Biggers 		return;
273485456054SEric Biggers 	EXT4_SB(sb)->s_dummy_enc_policy = ctx->dummy_enc_policy;
273585456054SEric Biggers 	memset(&ctx->dummy_enc_policy, 0, sizeof(ctx->dummy_enc_policy));
273685456054SEric Biggers 	ext4_msg(sb, KERN_WARNING, "Test dummy encryption mode enabled");
27375f41fdaeSEric Biggers }
27385f41fdaeSEric Biggers 
2739b6bd2435SLukas Czerner static int ext4_check_opt_consistency(struct fs_context *fc,
2740b6bd2435SLukas Czerner 				      struct super_block *sb)
2741b6bd2435SLukas Czerner {
2742b6bd2435SLukas Czerner 	struct ext4_fs_context *ctx = fc->fs_private;
27436e47a3ccSLukas Czerner 	struct ext4_sb_info *sbi = fc->s_fs_info;
27446e47a3ccSLukas Czerner 	int is_remount = fc->purpose == FS_CONTEXT_FOR_RECONFIGURE;
27455f41fdaeSEric Biggers 	int err;
2746b6bd2435SLukas Czerner 
2747b6bd2435SLukas Czerner 	if ((ctx->opt_flags & MOPT_NO_EXT2) && IS_EXT2_SB(sb)) {
2748b6bd2435SLukas Czerner 		ext4_msg(NULL, KERN_ERR,
2749b6bd2435SLukas Czerner 			 "Mount option(s) incompatible with ext2");
2750b6bd2435SLukas Czerner 		return -EINVAL;
2751b6bd2435SLukas Czerner 	}
2752b6bd2435SLukas Czerner 	if ((ctx->opt_flags & MOPT_NO_EXT3) && IS_EXT3_SB(sb)) {
2753b6bd2435SLukas Czerner 		ext4_msg(NULL, KERN_ERR,
2754b6bd2435SLukas Czerner 			 "Mount option(s) incompatible with ext3");
2755b6bd2435SLukas Czerner 		return -EINVAL;
2756b6bd2435SLukas Czerner 	}
2757b6bd2435SLukas Czerner 
27586e47a3ccSLukas Czerner 	if (ctx->s_want_extra_isize >
27596e47a3ccSLukas Czerner 	    (sbi->s_inode_size - EXT4_GOOD_OLD_INODE_SIZE)) {
27606e47a3ccSLukas Czerner 		ext4_msg(NULL, KERN_ERR,
27616e47a3ccSLukas Czerner 			 "Invalid want_extra_isize %d",
27626e47a3ccSLukas Czerner 			 ctx->s_want_extra_isize);
27636e47a3ccSLukas Czerner 		return -EINVAL;
27646e47a3ccSLukas Czerner 	}
27656e47a3ccSLukas Czerner 
27666e47a3ccSLukas Czerner 	if (ctx_test_mount_opt(ctx, EXT4_MOUNT_DIOREAD_NOLOCK)) {
27676e47a3ccSLukas Czerner 		int blocksize =
27686e47a3ccSLukas Czerner 			BLOCK_SIZE << le32_to_cpu(sbi->s_es->s_log_block_size);
27696e47a3ccSLukas Czerner 		if (blocksize < PAGE_SIZE)
27706e47a3ccSLukas Czerner 			ext4_msg(NULL, KERN_WARNING, "Warning: mounting with an "
27716e47a3ccSLukas Czerner 				 "experimental mount option 'dioread_nolock' "
27726e47a3ccSLukas Czerner 				 "for blocksize < PAGE_SIZE");
27736e47a3ccSLukas Czerner 	}
27746e47a3ccSLukas Czerner 
27755f41fdaeSEric Biggers 	err = ext4_check_test_dummy_encryption(fc, sb);
27765f41fdaeSEric Biggers 	if (err)
27775f41fdaeSEric Biggers 		return err;
27786e47a3ccSLukas Czerner 
27796e47a3ccSLukas Czerner 	if ((ctx->spec & EXT4_SPEC_DATAJ) && is_remount) {
27806e47a3ccSLukas Czerner 		if (!sbi->s_journal) {
27816e47a3ccSLukas Czerner 			ext4_msg(NULL, KERN_WARNING,
27826e47a3ccSLukas Czerner 				 "Remounting file system with no journal "
27836e47a3ccSLukas Czerner 				 "so ignoring journalled data option");
27846e47a3ccSLukas Czerner 			ctx_clear_mount_opt(ctx, EXT4_MOUNT_DATA_FLAGS);
27854c246728SLukas Czerner 		} else if (ctx_test_mount_opt(ctx, EXT4_MOUNT_DATA_FLAGS) !=
27864c246728SLukas Czerner 			   test_opt(sb, DATA_FLAGS)) {
27876e47a3ccSLukas Czerner 			ext4_msg(NULL, KERN_ERR, "Cannot change data mode "
27886e47a3ccSLukas Czerner 				 "on remount");
27896e47a3ccSLukas Czerner 			return -EINVAL;
27906e47a3ccSLukas Czerner 		}
27916e47a3ccSLukas Czerner 	}
27926e47a3ccSLukas Czerner 
27936e47a3ccSLukas Czerner 	if (is_remount) {
27946e47a3ccSLukas Czerner 		if (ctx_test_mount_opt(ctx, EXT4_MOUNT_DAX_ALWAYS) &&
27956e47a3ccSLukas Czerner 		    (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_JOURNAL_DATA)) {
27966e47a3ccSLukas Czerner 			ext4_msg(NULL, KERN_ERR, "can't mount with "
27976e47a3ccSLukas Czerner 				 "both data=journal and dax");
27986e47a3ccSLukas Czerner 			return -EINVAL;
27996e47a3ccSLukas Czerner 		}
28006e47a3ccSLukas Czerner 
28016e47a3ccSLukas Czerner 		if (ctx_test_mount_opt(ctx, EXT4_MOUNT_DAX_ALWAYS) &&
28026e47a3ccSLukas Czerner 		    (!(sbi->s_mount_opt & EXT4_MOUNT_DAX_ALWAYS) ||
28036e47a3ccSLukas Czerner 		     (sbi->s_mount_opt2 & EXT4_MOUNT2_DAX_NEVER))) {
28046e47a3ccSLukas Czerner fail_dax_change_remount:
28056e47a3ccSLukas Czerner 			ext4_msg(NULL, KERN_ERR, "can't change "
28066e47a3ccSLukas Czerner 				 "dax mount option while remounting");
28076e47a3ccSLukas Czerner 			return -EINVAL;
28086e47a3ccSLukas Czerner 		} else if (ctx_test_mount_opt2(ctx, EXT4_MOUNT2_DAX_NEVER) &&
28096e47a3ccSLukas Czerner 			 (!(sbi->s_mount_opt2 & EXT4_MOUNT2_DAX_NEVER) ||
28106e47a3ccSLukas Czerner 			  (sbi->s_mount_opt & EXT4_MOUNT_DAX_ALWAYS))) {
28116e47a3ccSLukas Czerner 			goto fail_dax_change_remount;
28126e47a3ccSLukas Czerner 		} else if (ctx_test_mount_opt2(ctx, EXT4_MOUNT2_DAX_INODE) &&
28136e47a3ccSLukas Czerner 			   ((sbi->s_mount_opt & EXT4_MOUNT_DAX_ALWAYS) ||
28146e47a3ccSLukas Czerner 			    (sbi->s_mount_opt2 & EXT4_MOUNT2_DAX_NEVER) ||
28156e47a3ccSLukas Czerner 			    !(sbi->s_mount_opt2 & EXT4_MOUNT2_DAX_INODE))) {
28166e47a3ccSLukas Czerner 			goto fail_dax_change_remount;
28176e47a3ccSLukas Czerner 		}
28186e47a3ccSLukas Czerner 	}
28196e47a3ccSLukas Czerner 
2820b6bd2435SLukas Czerner 	return ext4_check_quota_consistency(fc, sb);
2821b6bd2435SLukas Czerner }
2822b6bd2435SLukas Czerner 
282385456054SEric Biggers static void ext4_apply_options(struct fs_context *fc, struct super_block *sb)
28246e47a3ccSLukas Czerner {
28256e47a3ccSLukas Czerner 	struct ext4_fs_context *ctx = fc->fs_private;
28266e47a3ccSLukas Czerner 	struct ext4_sb_info *sbi = fc->s_fs_info;
28276e47a3ccSLukas Czerner 
28286e47a3ccSLukas Czerner 	sbi->s_mount_opt &= ~ctx->mask_s_mount_opt;
28296e47a3ccSLukas Czerner 	sbi->s_mount_opt |= ctx->vals_s_mount_opt;
28306e47a3ccSLukas Czerner 	sbi->s_mount_opt2 &= ~ctx->mask_s_mount_opt2;
28316e47a3ccSLukas Czerner 	sbi->s_mount_opt2 |= ctx->vals_s_mount_opt2;
28326e47a3ccSLukas Czerner 	sbi->s_mount_flags &= ~ctx->mask_s_mount_flags;
28336e47a3ccSLukas Czerner 	sbi->s_mount_flags |= ctx->vals_s_mount_flags;
28346e47a3ccSLukas Czerner 	sb->s_flags &= ~ctx->mask_s_flags;
28356e47a3ccSLukas Czerner 	sb->s_flags |= ctx->vals_s_flags;
28366e47a3ccSLukas Czerner 
28376e47a3ccSLukas Czerner #define APPLY(X) ({ if (ctx->spec & EXT4_SPEC_##X) sbi->X = ctx->X; })
28386e47a3ccSLukas Czerner 	APPLY(s_commit_interval);
28396e47a3ccSLukas Czerner 	APPLY(s_stripe);
28406e47a3ccSLukas Czerner 	APPLY(s_max_batch_time);
28416e47a3ccSLukas Czerner 	APPLY(s_min_batch_time);
28426e47a3ccSLukas Czerner 	APPLY(s_want_extra_isize);
28436e47a3ccSLukas Czerner 	APPLY(s_inode_readahead_blks);
28446e47a3ccSLukas Czerner 	APPLY(s_max_dir_size_kb);
28456e47a3ccSLukas Czerner 	APPLY(s_li_wait_mult);
28466e47a3ccSLukas Czerner 	APPLY(s_resgid);
28476e47a3ccSLukas Czerner 	APPLY(s_resuid);
28486e47a3ccSLukas Czerner 
28496e47a3ccSLukas Czerner #ifdef CONFIG_EXT4_DEBUG
28506e47a3ccSLukas Czerner 	APPLY(s_fc_debug_max_replay);
28516e47a3ccSLukas Czerner #endif
28526e47a3ccSLukas Czerner 
28536e47a3ccSLukas Czerner 	ext4_apply_quota_options(fc, sb);
285485456054SEric Biggers 	ext4_apply_test_dummy_encryption(ctx, sb);
28556e47a3ccSLukas Czerner }
28566e47a3ccSLukas Czerner 
28576e47a3ccSLukas Czerner 
/*
 * Validate the combination of quota options held in the context of @fc.
 *
 * When a journaled quota file name was given for a quota type, the plain
 * usrquota/grpquota option of that same type is cleared.  If a plain option
 * is still set for the other type while a file name exists, the old and new
 * formats are being mixed and -EINVAL is returned.
 *
 * Returns 1 when the options are acceptable (always, without CONFIG_QUOTA)
 * and -EINVAL otherwise.
 */
static int ext4_validate_options(struct fs_context *fc)
{
#ifdef CONFIG_QUOTA
	struct ext4_fs_context *ctx = fc->fs_private;
	const char *usr_file = ctx->s_qf_names[USRQUOTA];
	const char *grp_file = ctx->s_qf_names[GRPQUOTA];

	/* No journaled quota file names: nothing can conflict */
	if (!usr_file && !grp_file)
		return 1;

	if (usr_file && ctx_test_mount_opt(ctx, EXT4_MOUNT_USRQUOTA))
		ctx_clear_mount_opt(ctx, EXT4_MOUNT_USRQUOTA);

	if (grp_file && ctx_test_mount_opt(ctx, EXT4_MOUNT_GRPQUOTA))
		ctx_clear_mount_opt(ctx, EXT4_MOUNT_GRPQUOTA);

	/* Anything still set belongs to a type without a file name */
	if (ctx_test_mount_opt(ctx, EXT4_MOUNT_USRQUOTA) ||
	    ctx_test_mount_opt(ctx, EXT4_MOUNT_GRPQUOTA)) {
		ext4_msg(NULL, KERN_ERR, "old and new quota "
			 "format mixing");
		return -EINVAL;
	}
#endif
	return 1;
}
2884ac27a0ecSDave Kleikamp 
/*
 * Emit the journaled quota options of @sb into @seq: ",jqfmt=<name>" when a
 * journaled quota format is set, followed by "usrjquota" / "grpjquota" for
 * each quota file name that is present.  Emits nothing without CONFIG_QUOTA.
 */
static inline void ext4_show_quota_options(struct seq_file *seq,
					   struct super_block *sb)
{
#if defined(CONFIG_QUOTA)
	struct ext4_sb_info *sbi = EXT4_SB(sb);
	const char *usr_file, *grp_file;

	if (sbi->s_jquota_fmt) {
		/* Unrecognised formats are printed with an empty name */
		const char *fmt = "";

		if (sbi->s_jquota_fmt == QFMT_VFS_OLD)
			fmt = "vfsold";
		else if (sbi->s_jquota_fmt == QFMT_VFS_V0)
			fmt = "vfsv0";
		else if (sbi->s_jquota_fmt == QFMT_VFS_V1)
			fmt = "vfsv1";

		seq_printf(seq, ",jqfmt=%s", fmt);
	}

	/* The quota file names are read under the RCU read lock */
	rcu_read_lock();
	usr_file = rcu_dereference(sbi->s_qf_names[USRQUOTA]);
	grp_file = rcu_dereference(sbi->s_qf_names[GRPQUOTA]);
	if (usr_file)
		seq_show_option(seq, "usrjquota", usr_file);
	if (grp_file)
		seq_show_option(seq, "grpjquota", grp_file);
	rcu_read_unlock();
#endif
}
29192adf6da8STheodore Ts'o 
29205a916be1STheodore Ts'o static const char *token2str(int token)
29215a916be1STheodore Ts'o {
292297d8a670SLukas Czerner 	const struct fs_parameter_spec *spec;
29235a916be1STheodore Ts'o 
292497d8a670SLukas Czerner 	for (spec = ext4_param_specs; spec->name != NULL; spec++)
292597d8a670SLukas Czerner 		if (spec->opt == token && !spec->type)
29265a916be1STheodore Ts'o 			break;
292797d8a670SLukas Czerner 	return spec->name;
29285a916be1STheodore Ts'o }
29295a916be1STheodore Ts'o 
29302adf6da8STheodore Ts'o /*
29312adf6da8STheodore Ts'o  * Show an option if
29322adf6da8STheodore Ts'o  *  - it's set to a non-default value OR
29332adf6da8STheodore Ts'o  *  - if the per-sb default is different from the global default
29342adf6da8STheodore Ts'o  */
293566acdcf4STheodore Ts'o static int _ext4_show_options(struct seq_file *seq, struct super_block *sb,
293666acdcf4STheodore Ts'o 			      int nodefs)
29372adf6da8STheodore Ts'o {
29382adf6da8STheodore Ts'o 	struct ext4_sb_info *sbi = EXT4_SB(sb);
29392adf6da8STheodore Ts'o 	struct ext4_super_block *es = sbi->s_es;
2940e3645d72SZhang Yi 	int def_errors;
29415a916be1STheodore Ts'o 	const struct mount_opts *m;
294266acdcf4STheodore Ts'o 	char sep = nodefs ? '\n' : ',';
29432adf6da8STheodore Ts'o 
294466acdcf4STheodore Ts'o #define SEQ_OPTS_PUTS(str) seq_printf(seq, "%c" str, sep)
294566acdcf4STheodore Ts'o #define SEQ_OPTS_PRINT(str, arg) seq_printf(seq, "%c" str, sep, arg)
29462adf6da8STheodore Ts'o 
29472adf6da8STheodore Ts'o 	if (sbi->s_sb_block != 1)
29485a916be1STheodore Ts'o 		SEQ_OPTS_PRINT("sb=%llu", sbi->s_sb_block);
29495a916be1STheodore Ts'o 
29505a916be1STheodore Ts'o 	for (m = ext4_mount_opts; m->token != Opt_err; m++) {
29515a916be1STheodore Ts'o 		int want_set = m->flags & MOPT_SET;
2952e3645d72SZhang Yi 		int opt_2 = m->flags & MOPT_2;
2953e3645d72SZhang Yi 		unsigned int mount_opt, def_mount_opt;
2954e3645d72SZhang Yi 
29555a916be1STheodore Ts'o 		if (((m->flags & (MOPT_SET|MOPT_CLEAR)) == 0) ||
2956ba2e524dSLukas Czerner 		    m->flags & MOPT_SKIP)
29575a916be1STheodore Ts'o 			continue;
2958e3645d72SZhang Yi 
2959e3645d72SZhang Yi 		if (opt_2) {
2960e3645d72SZhang Yi 			mount_opt = sbi->s_mount_opt2;
2961e3645d72SZhang Yi 			def_mount_opt = sbi->s_def_mount_opt2;
2962e3645d72SZhang Yi 		} else {
2963e3645d72SZhang Yi 			mount_opt = sbi->s_mount_opt;
2964e3645d72SZhang Yi 			def_mount_opt = sbi->s_def_mount_opt;
2965e3645d72SZhang Yi 		}
2966e3645d72SZhang Yi 		/* skip if same as the default */
2967e3645d72SZhang Yi 		if (!nodefs && !(m->mount_opt & (mount_opt ^ def_mount_opt)))
2968e3645d72SZhang Yi 			continue;
2969e3645d72SZhang Yi 		/* select Opt_noFoo vs Opt_Foo */
29705a916be1STheodore Ts'o 		if ((want_set &&
2971e3645d72SZhang Yi 		     (mount_opt & m->mount_opt) != m->mount_opt) ||
2972e3645d72SZhang Yi 		    (!want_set && (mount_opt & m->mount_opt)))
2973e3645d72SZhang Yi 			continue;
29745a916be1STheodore Ts'o 		SEQ_OPTS_PRINT("%s", token2str(m->token));
29755a916be1STheodore Ts'o 	}
29765a916be1STheodore Ts'o 
297708cefc7aSEric W. Biederman 	if (nodefs || !uid_eq(sbi->s_resuid, make_kuid(&init_user_ns, EXT4_DEF_RESUID)) ||
29785a916be1STheodore Ts'o 	    le16_to_cpu(es->s_def_resuid) != EXT4_DEF_RESUID)
297908cefc7aSEric W. Biederman 		SEQ_OPTS_PRINT("resuid=%u",
298008cefc7aSEric W. Biederman 				from_kuid_munged(&init_user_ns, sbi->s_resuid));
298108cefc7aSEric W. Biederman 	if (nodefs || !gid_eq(sbi->s_resgid, make_kgid(&init_user_ns, EXT4_DEF_RESGID)) ||
29825a916be1STheodore Ts'o 	    le16_to_cpu(es->s_def_resgid) != EXT4_DEF_RESGID)
298308cefc7aSEric W. Biederman 		SEQ_OPTS_PRINT("resgid=%u",
298408cefc7aSEric W. Biederman 				from_kgid_munged(&init_user_ns, sbi->s_resgid));
298566acdcf4STheodore Ts'o 	def_errors = nodefs ? -1 : le16_to_cpu(es->s_errors);
29865a916be1STheodore Ts'o 	if (test_opt(sb, ERRORS_RO) && def_errors != EXT4_ERRORS_RO)
29875a916be1STheodore Ts'o 		SEQ_OPTS_PUTS("errors=remount-ro");
29882adf6da8STheodore Ts'o 	if (test_opt(sb, ERRORS_CONT) && def_errors != EXT4_ERRORS_CONTINUE)
29895a916be1STheodore Ts'o 		SEQ_OPTS_PUTS("errors=continue");
29902adf6da8STheodore Ts'o 	if (test_opt(sb, ERRORS_PANIC) && def_errors != EXT4_ERRORS_PANIC)
29915a916be1STheodore Ts'o 		SEQ_OPTS_PUTS("errors=panic");
299266acdcf4STheodore Ts'o 	if (nodefs || sbi->s_commit_interval != JBD2_DEFAULT_MAX_COMMIT_AGE*HZ)
29935a916be1STheodore Ts'o 		SEQ_OPTS_PRINT("commit=%lu", sbi->s_commit_interval / HZ);
299466acdcf4STheodore Ts'o 	if (nodefs || sbi->s_min_batch_time != EXT4_DEF_MIN_BATCH_TIME)
29955a916be1STheodore Ts'o 		SEQ_OPTS_PRINT("min_batch_time=%u", sbi->s_min_batch_time);
299666acdcf4STheodore Ts'o 	if (nodefs || sbi->s_max_batch_time != EXT4_DEF_MAX_BATCH_TIME)
29975a916be1STheodore Ts'o 		SEQ_OPTS_PRINT("max_batch_time=%u", sbi->s_max_batch_time);
299866acdcf4STheodore Ts'o 	if (nodefs || sbi->s_stripe)
29995a916be1STheodore Ts'o 		SEQ_OPTS_PRINT("stripe=%lu", sbi->s_stripe);
300068afa7e0STyson Nottingham 	if (nodefs || EXT4_MOUNT_DATA_FLAGS &
3001e3645d72SZhang Yi 			(sbi->s_mount_opt ^ sbi->s_def_mount_opt)) {
30022adf6da8STheodore Ts'o 		if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_JOURNAL_DATA)
30035a916be1STheodore Ts'o 			SEQ_OPTS_PUTS("data=journal");
30042adf6da8STheodore Ts'o 		else if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_ORDERED_DATA)
30055a916be1STheodore Ts'o 			SEQ_OPTS_PUTS("data=ordered");
30062adf6da8STheodore Ts'o 		else if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_WRITEBACK_DATA)
30075a916be1STheodore Ts'o 			SEQ_OPTS_PUTS("data=writeback");
30085a916be1STheodore Ts'o 	}
300966acdcf4STheodore Ts'o 	if (nodefs ||
301066acdcf4STheodore Ts'o 	    sbi->s_inode_readahead_blks != EXT4_DEF_INODE_READAHEAD_BLKS)
30115a916be1STheodore Ts'o 		SEQ_OPTS_PRINT("inode_readahead_blks=%u",
30122adf6da8STheodore Ts'o 			       sbi->s_inode_readahead_blks);
30132adf6da8STheodore Ts'o 
3014ceec0376STyson Nottingham 	if (test_opt(sb, INIT_INODE_TABLE) && (nodefs ||
301566acdcf4STheodore Ts'o 		       (sbi->s_li_wait_mult != EXT4_DEF_LI_WAIT_MULT)))
30165a916be1STheodore Ts'o 		SEQ_OPTS_PRINT("init_itable=%u", sbi->s_li_wait_mult);
3017df981d03STheodore Ts'o 	if (nodefs || sbi->s_max_dir_size_kb)
3018df981d03STheodore Ts'o 		SEQ_OPTS_PRINT("max_dir_size_kb=%u", sbi->s_max_dir_size_kb);
30197915a861SAles Novak 	if (test_opt(sb, DATA_ERR_ABORT))
30207915a861SAles Novak 		SEQ_OPTS_PUTS("data_err=abort");
3021ed318a6cSEric Biggers 
3022ed318a6cSEric Biggers 	fscrypt_show_test_dummy_encryption(seq, sep, sb);
30232adf6da8STheodore Ts'o 
30244f74d15fSEric Biggers 	if (sb->s_flags & SB_INLINECRYPT)
30254f74d15fSEric Biggers 		SEQ_OPTS_PUTS("inlinecrypt");
30264f74d15fSEric Biggers 
30279cb20f94SIra Weiny 	if (test_opt(sb, DAX_ALWAYS)) {
30289cb20f94SIra Weiny 		if (IS_EXT2_SB(sb))
30299cb20f94SIra Weiny 			SEQ_OPTS_PUTS("dax");
30309cb20f94SIra Weiny 		else
30319cb20f94SIra Weiny 			SEQ_OPTS_PUTS("dax=always");
30329cb20f94SIra Weiny 	} else if (test_opt2(sb, DAX_NEVER)) {
30339cb20f94SIra Weiny 		SEQ_OPTS_PUTS("dax=never");
30349cb20f94SIra Weiny 	} else if (test_opt2(sb, DAX_INODE)) {
30359cb20f94SIra Weiny 		SEQ_OPTS_PUTS("dax=inode");
30369cb20f94SIra Weiny 	}
30373fa5d23eSOjaswin Mujoo 
30383fa5d23eSOjaswin Mujoo 	if (sbi->s_groups_count >= MB_DEFAULT_LINEAR_SCAN_THRESHOLD &&
30393fa5d23eSOjaswin Mujoo 			!test_opt2(sb, MB_OPTIMIZE_SCAN)) {
30403fa5d23eSOjaswin Mujoo 		SEQ_OPTS_PUTS("mb_optimize_scan=0");
30413fa5d23eSOjaswin Mujoo 	} else if (sbi->s_groups_count < MB_DEFAULT_LINEAR_SCAN_THRESHOLD &&
30423fa5d23eSOjaswin Mujoo 			test_opt2(sb, MB_OPTIMIZE_SCAN)) {
30433fa5d23eSOjaswin Mujoo 		SEQ_OPTS_PUTS("mb_optimize_scan=1");
30443fa5d23eSOjaswin Mujoo 	}
30453fa5d23eSOjaswin Mujoo 
30462adf6da8STheodore Ts'o 	ext4_show_quota_options(seq, sb);
30472adf6da8STheodore Ts'o 	return 0;
30482adf6da8STheodore Ts'o }
30492adf6da8STheodore Ts'o 
305066acdcf4STheodore Ts'o static int ext4_show_options(struct seq_file *seq, struct dentry *root)
305166acdcf4STheodore Ts'o {
305266acdcf4STheodore Ts'o 	return _ext4_show_options(seq, root->d_sb, 0);
305366acdcf4STheodore Ts'o }
305466acdcf4STheodore Ts'o 
3055ebd173beSTheodore Ts'o int ext4_seq_options_show(struct seq_file *seq, void *offset)
305666acdcf4STheodore Ts'o {
305766acdcf4STheodore Ts'o 	struct super_block *sb = seq->private;
305866acdcf4STheodore Ts'o 	int rc;
305966acdcf4STheodore Ts'o 
3060bc98a42cSDavid Howells 	seq_puts(seq, sb_rdonly(sb) ? "ro" : "rw");
306166acdcf4STheodore Ts'o 	rc = _ext4_show_options(seq, sb, 1);
306266acdcf4STheodore Ts'o 	seq_puts(seq, "\n");
306366acdcf4STheodore Ts'o 	return rc;
306466acdcf4STheodore Ts'o }
306566acdcf4STheodore Ts'o 
3066617ba13bSMingming Cao static int ext4_setup_super(struct super_block *sb, struct ext4_super_block *es,
3067ac27a0ecSDave Kleikamp 			    int read_only)
3068ac27a0ecSDave Kleikamp {
3069617ba13bSMingming Cao 	struct ext4_sb_info *sbi = EXT4_SB(sb);
3070c89128a0SJaegeuk Kim 	int err = 0;
3071ac27a0ecSDave Kleikamp 
3072617ba13bSMingming Cao 	if (le32_to_cpu(es->s_rev_level) > EXT4_MAX_SUPP_REV) {
3073b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "revision level too high, "
3074b31e1552SEric Sandeen 			 "forcing read-only mode");
3075c89128a0SJaegeuk Kim 		err = -EROFS;
30765adaccacSyangerkun 		goto done;
3077ac27a0ecSDave Kleikamp 	}
3078ac27a0ecSDave Kleikamp 	if (read_only)
3079281b5995STheodore Ts'o 		goto done;
3080617ba13bSMingming Cao 	if (!(sbi->s_mount_state & EXT4_VALID_FS))
3081b31e1552SEric Sandeen 		ext4_msg(sb, KERN_WARNING, "warning: mounting unchecked fs, "
3082b31e1552SEric Sandeen 			 "running e2fsck is recommended");
3083c8b459f4SLukas Czerner 	else if (sbi->s_mount_state & EXT4_ERROR_FS)
3084b31e1552SEric Sandeen 		ext4_msg(sb, KERN_WARNING,
3085b31e1552SEric Sandeen 			 "warning: mounting fs with errors, "
3086b31e1552SEric Sandeen 			 "running e2fsck is recommended");
3087ed3ce80aSTao Ma 	else if ((__s16) le16_to_cpu(es->s_max_mnt_count) > 0 &&
3088ac27a0ecSDave Kleikamp 		 le16_to_cpu(es->s_mnt_count) >=
3089ac27a0ecSDave Kleikamp 		 (unsigned short) (__s16) le16_to_cpu(es->s_max_mnt_count))
3090b31e1552SEric Sandeen 		ext4_msg(sb, KERN_WARNING,
3091b31e1552SEric Sandeen 			 "warning: maximal mount count reached, "
3092b31e1552SEric Sandeen 			 "running e2fsck is recommended");
3093ac27a0ecSDave Kleikamp 	else if (le32_to_cpu(es->s_checkinterval) &&
30946a0678a7SArnd Bergmann 		 (ext4_get_tstamp(es, s_lastcheck) +
30956a0678a7SArnd Bergmann 		  le32_to_cpu(es->s_checkinterval) <= ktime_get_real_seconds()))
3096b31e1552SEric Sandeen 		ext4_msg(sb, KERN_WARNING,
3097b31e1552SEric Sandeen 			 "warning: checktime reached, "
3098b31e1552SEric Sandeen 			 "running e2fsck is recommended");
30990390131bSFrank Mayhar 	if (!sbi->s_journal)
3100216c34b2SMarcin Slusarz 		es->s_state &= cpu_to_le16(~EXT4_VALID_FS);
3101ac27a0ecSDave Kleikamp 	if (!(__s16) le16_to_cpu(es->s_max_mnt_count))
3102617ba13bSMingming Cao 		es->s_max_mnt_count = cpu_to_le16(EXT4_DFL_MAX_MNT_COUNT);
3103e8546d06SMarcin Slusarz 	le16_add_cpu(&es->s_mnt_count, 1);
31046a0678a7SArnd Bergmann 	ext4_update_tstamp(es, s_mtime);
310502f310fcSJan Kara 	if (sbi->s_journal) {
3106e2b911c5SDarrick J. Wong 		ext4_set_feature_journal_needs_recovery(sb);
310702f310fcSJan Kara 		if (ext4_has_feature_orphan_file(sb))
310802f310fcSJan Kara 			ext4_set_feature_orphan_present(sb);
310902f310fcSJan Kara 	}
3110ac27a0ecSDave Kleikamp 
31114392fbc4SJan Kara 	err = ext4_commit_super(sb);
3112281b5995STheodore Ts'o done:
3113ac27a0ecSDave Kleikamp 	if (test_opt(sb, DEBUG))
3114a9df9a49STheodore Ts'o 		printk(KERN_INFO "[EXT4 FS bs=%lu, gc=%u, "
3115a2595b8aSTheodore Ts'o 				"bpg=%lu, ipg=%lu, mo=%04x, mo2=%04x]\n",
3116ac27a0ecSDave Kleikamp 			sb->s_blocksize,
3117ac27a0ecSDave Kleikamp 			sbi->s_groups_count,
3118617ba13bSMingming Cao 			EXT4_BLOCKS_PER_GROUP(sb),
3119617ba13bSMingming Cao 			EXT4_INODES_PER_GROUP(sb),
3120a2595b8aSTheodore Ts'o 			sbi->s_mount_opt, sbi->s_mount_opt2);
3121c89128a0SJaegeuk Kim 	return err;
3122ac27a0ecSDave Kleikamp }
3123ac27a0ecSDave Kleikamp 
3124117fff10STheodore Ts'o int ext4_alloc_flex_bg_array(struct super_block *sb, ext4_group_t ngroup)
3125117fff10STheodore Ts'o {
3126117fff10STheodore Ts'o 	struct ext4_sb_info *sbi = EXT4_SB(sb);
31277c990728SSuraj Jitindar Singh 	struct flex_groups **old_groups, **new_groups;
312837b0b6b8SDan Carpenter 	int size, i, j;
3129117fff10STheodore Ts'o 
3130117fff10STheodore Ts'o 	if (!sbi->s_log_groups_per_flex)
3131117fff10STheodore Ts'o 		return 0;
3132117fff10STheodore Ts'o 
3133117fff10STheodore Ts'o 	size = ext4_flex_group(sbi, ngroup - 1) + 1;
3134117fff10STheodore Ts'o 	if (size <= sbi->s_flex_groups_allocated)
3135117fff10STheodore Ts'o 		return 0;
3136117fff10STheodore Ts'o 
31377c990728SSuraj Jitindar Singh 	new_groups = kvzalloc(roundup_pow_of_two(size *
31387c990728SSuraj Jitindar Singh 			      sizeof(*sbi->s_flex_groups)), GFP_KERNEL);
3139117fff10STheodore Ts'o 	if (!new_groups) {
31407c990728SSuraj Jitindar Singh 		ext4_msg(sb, KERN_ERR,
31417c990728SSuraj Jitindar Singh 			 "not enough memory for %d flex group pointers", size);
3142117fff10STheodore Ts'o 		return -ENOMEM;
3143117fff10STheodore Ts'o 	}
31447c990728SSuraj Jitindar Singh 	for (i = sbi->s_flex_groups_allocated; i < size; i++) {
31457c990728SSuraj Jitindar Singh 		new_groups[i] = kvzalloc(roundup_pow_of_two(
31467c990728SSuraj Jitindar Singh 					 sizeof(struct flex_groups)),
31477c990728SSuraj Jitindar Singh 					 GFP_KERNEL);
31487c990728SSuraj Jitindar Singh 		if (!new_groups[i]) {
314937b0b6b8SDan Carpenter 			for (j = sbi->s_flex_groups_allocated; j < i; j++)
315037b0b6b8SDan Carpenter 				kvfree(new_groups[j]);
31517c990728SSuraj Jitindar Singh 			kvfree(new_groups);
31527c990728SSuraj Jitindar Singh 			ext4_msg(sb, KERN_ERR,
31537c990728SSuraj Jitindar Singh 				 "not enough memory for %d flex groups", size);
31547c990728SSuraj Jitindar Singh 			return -ENOMEM;
3155117fff10STheodore Ts'o 		}
31567c990728SSuraj Jitindar Singh 	}
31577c990728SSuraj Jitindar Singh 	rcu_read_lock();
31587c990728SSuraj Jitindar Singh 	old_groups = rcu_dereference(sbi->s_flex_groups);
31597c990728SSuraj Jitindar Singh 	if (old_groups)
31607c990728SSuraj Jitindar Singh 		memcpy(new_groups, old_groups,
31617c990728SSuraj Jitindar Singh 		       (sbi->s_flex_groups_allocated *
31627c990728SSuraj Jitindar Singh 			sizeof(struct flex_groups *)));
31637c990728SSuraj Jitindar Singh 	rcu_read_unlock();
31647c990728SSuraj Jitindar Singh 	rcu_assign_pointer(sbi->s_flex_groups, new_groups);
31657c990728SSuraj Jitindar Singh 	sbi->s_flex_groups_allocated = size;
31667c990728SSuraj Jitindar Singh 	if (old_groups)
31677c990728SSuraj Jitindar Singh 		ext4_kvfree_array_rcu(old_groups);
3168117fff10STheodore Ts'o 	return 0;
3169117fff10STheodore Ts'o }
3170117fff10STheodore Ts'o 
3171772cb7c8SJose R. Santos static int ext4_fill_flex_info(struct super_block *sb)
3172772cb7c8SJose R. Santos {
3173772cb7c8SJose R. Santos 	struct ext4_sb_info *sbi = EXT4_SB(sb);
3174772cb7c8SJose R. Santos 	struct ext4_group_desc *gdp = NULL;
31757c990728SSuraj Jitindar Singh 	struct flex_groups *fg;
3176772cb7c8SJose R. Santos 	ext4_group_t flex_group;
3177117fff10STheodore Ts'o 	int i, err;
3178772cb7c8SJose R. Santos 
3179503358aeSTheodore Ts'o 	sbi->s_log_groups_per_flex = sbi->s_es->s_log_groups_per_flex;
3180d50f2ab6SXi Wang 	if (sbi->s_log_groups_per_flex < 1 || sbi->s_log_groups_per_flex > 31) {
3181772cb7c8SJose R. Santos 		sbi->s_log_groups_per_flex = 0;
3182772cb7c8SJose R. Santos 		return 1;
3183772cb7c8SJose R. Santos 	}
3184772cb7c8SJose R. Santos 
3185117fff10STheodore Ts'o 	err = ext4_alloc_flex_bg_array(sb, sbi->s_groups_count);
3186117fff10STheodore Ts'o 	if (err)
3187772cb7c8SJose R. Santos 		goto failed;
3188772cb7c8SJose R. Santos 
3189772cb7c8SJose R. Santos 	for (i = 0; i < sbi->s_groups_count; i++) {
319088b6edd1STheodore Ts'o 		gdp = ext4_get_group_desc(sb, i, NULL);
3191772cb7c8SJose R. Santos 
3192772cb7c8SJose R. Santos 		flex_group = ext4_flex_group(sbi, i);
31937c990728SSuraj Jitindar Singh 		fg = sbi_array_rcu_deref(sbi, s_flex_groups, flex_group);
31947c990728SSuraj Jitindar Singh 		atomic_add(ext4_free_inodes_count(sb, gdp), &fg->free_inodes);
319590ba983fSTheodore Ts'o 		atomic64_add(ext4_free_group_clusters(sb, gdp),
31967c990728SSuraj Jitindar Singh 			     &fg->free_clusters);
31977c990728SSuraj Jitindar Singh 		atomic_add(ext4_used_dirs_count(sb, gdp), &fg->used_dirs);
3198772cb7c8SJose R. Santos 	}
3199772cb7c8SJose R. Santos 
3200772cb7c8SJose R. Santos 	return 1;
3201772cb7c8SJose R. Santos failed:
3202772cb7c8SJose R. Santos 	return 0;
3203772cb7c8SJose R. Santos }
3204772cb7c8SJose R. Santos 
3205e2b911c5SDarrick J. Wong static __le16 ext4_group_desc_csum(struct super_block *sb, __u32 block_group,
3206717d50e4SAndreas Dilger 				   struct ext4_group_desc *gdp)
3207717d50e4SAndreas Dilger {
3208b47820edSDaeho Jeong 	int offset = offsetof(struct ext4_group_desc, bg_checksum);
3209717d50e4SAndreas Dilger 	__u16 crc = 0;
3210717d50e4SAndreas Dilger 	__le32 le_group = cpu_to_le32(block_group);
3211e2b911c5SDarrick J. Wong 	struct ext4_sb_info *sbi = EXT4_SB(sb);
3212717d50e4SAndreas Dilger 
32139aa5d32bSDmitry Monakhov 	if (ext4_has_metadata_csum(sbi->s_sb)) {
3214feb0ab32SDarrick J. Wong 		/* Use new metadata_csum algorithm */
3215feb0ab32SDarrick J. Wong 		__u32 csum32;
3216b47820edSDaeho Jeong 		__u16 dummy_csum = 0;
3217feb0ab32SDarrick J. Wong 
3218feb0ab32SDarrick J. Wong 		csum32 = ext4_chksum(sbi, sbi->s_csum_seed, (__u8 *)&le_group,
3219feb0ab32SDarrick J. Wong 				     sizeof(le_group));
3220b47820edSDaeho Jeong 		csum32 = ext4_chksum(sbi, csum32, (__u8 *)gdp, offset);
3221b47820edSDaeho Jeong 		csum32 = ext4_chksum(sbi, csum32, (__u8 *)&dummy_csum,
3222b47820edSDaeho Jeong 				     sizeof(dummy_csum));
3223b47820edSDaeho Jeong 		offset += sizeof(dummy_csum);
3224b47820edSDaeho Jeong 		if (offset < sbi->s_desc_size)
3225b47820edSDaeho Jeong 			csum32 = ext4_chksum(sbi, csum32, (__u8 *)gdp + offset,
3226b47820edSDaeho Jeong 					     sbi->s_desc_size - offset);
3227feb0ab32SDarrick J. Wong 
3228feb0ab32SDarrick J. Wong 		crc = csum32 & 0xFFFF;
3229feb0ab32SDarrick J. Wong 		goto out;
3230feb0ab32SDarrick J. Wong 	}
3231feb0ab32SDarrick J. Wong 
3232feb0ab32SDarrick J. Wong 	/* old crc16 code */
3233e2b911c5SDarrick J. Wong 	if (!ext4_has_feature_gdt_csum(sb))
3234813d32f9SDarrick J. Wong 		return 0;
3235813d32f9SDarrick J. Wong 
3236717d50e4SAndreas Dilger 	crc = crc16(~0, sbi->s_es->s_uuid, sizeof(sbi->s_es->s_uuid));
3237717d50e4SAndreas Dilger 	crc = crc16(crc, (__u8 *)&le_group, sizeof(le_group));
3238717d50e4SAndreas Dilger 	crc = crc16(crc, (__u8 *)gdp, offset);
3239717d50e4SAndreas Dilger 	offset += sizeof(gdp->bg_checksum); /* skip checksum */
3240717d50e4SAndreas Dilger 	/* for checksum of struct ext4_group_desc do the rest...*/
3241e2b911c5SDarrick J. Wong 	if (ext4_has_feature_64bit(sb) &&
3242717d50e4SAndreas Dilger 	    offset < le16_to_cpu(sbi->s_es->s_desc_size))
3243717d50e4SAndreas Dilger 		crc = crc16(crc, (__u8 *)gdp + offset,
3244717d50e4SAndreas Dilger 			    le16_to_cpu(sbi->s_es->s_desc_size) -
3245717d50e4SAndreas Dilger 				offset);
3246717d50e4SAndreas Dilger 
3247feb0ab32SDarrick J. Wong out:
3248717d50e4SAndreas Dilger 	return cpu_to_le16(crc);
3249717d50e4SAndreas Dilger }
3250717d50e4SAndreas Dilger 
3251feb0ab32SDarrick J. Wong int ext4_group_desc_csum_verify(struct super_block *sb, __u32 block_group,
3252717d50e4SAndreas Dilger 				struct ext4_group_desc *gdp)
3253717d50e4SAndreas Dilger {
3254feb0ab32SDarrick J. Wong 	if (ext4_has_group_desc_csum(sb) &&
3255e2b911c5SDarrick J. Wong 	    (gdp->bg_checksum != ext4_group_desc_csum(sb, block_group, gdp)))
3256717d50e4SAndreas Dilger 		return 0;
3257717d50e4SAndreas Dilger 
3258717d50e4SAndreas Dilger 	return 1;
3259717d50e4SAndreas Dilger }
3260717d50e4SAndreas Dilger 
3261feb0ab32SDarrick J. Wong void ext4_group_desc_csum_set(struct super_block *sb, __u32 block_group,
3262feb0ab32SDarrick J. Wong 			      struct ext4_group_desc *gdp)
3263feb0ab32SDarrick J. Wong {
3264feb0ab32SDarrick J. Wong 	if (!ext4_has_group_desc_csum(sb))
3265feb0ab32SDarrick J. Wong 		return;
3266e2b911c5SDarrick J. Wong 	gdp->bg_checksum = ext4_group_desc_csum(sb, block_group, gdp);
3267feb0ab32SDarrick J. Wong }
3268feb0ab32SDarrick J. Wong 
3269ac27a0ecSDave Kleikamp /* Called at mount-time, super-block is locked */
3270bfff6873SLukas Czerner static int ext4_check_descriptors(struct super_block *sb,
3271829fa70dSTheodore Ts'o 				  ext4_fsblk_t sb_block,
3272bfff6873SLukas Czerner 				  ext4_group_t *first_not_zeroed)
3273ac27a0ecSDave Kleikamp {
3274617ba13bSMingming Cao 	struct ext4_sb_info *sbi = EXT4_SB(sb);
3275617ba13bSMingming Cao 	ext4_fsblk_t first_block = le32_to_cpu(sbi->s_es->s_first_data_block);
3276617ba13bSMingming Cao 	ext4_fsblk_t last_block;
327744de022cSTheodore Ts'o 	ext4_fsblk_t last_bg_block = sb_block + ext4_bg_num_gdb(sb, 0);
3278bd81d8eeSLaurent Vivier 	ext4_fsblk_t block_bitmap;
3279bd81d8eeSLaurent Vivier 	ext4_fsblk_t inode_bitmap;
3280bd81d8eeSLaurent Vivier 	ext4_fsblk_t inode_table;
3281ce421581SJose R. Santos 	int flexbg_flag = 0;
3282bfff6873SLukas Czerner 	ext4_group_t i, grp = sbi->s_groups_count;
3283ac27a0ecSDave Kleikamp 
3284e2b911c5SDarrick J. Wong 	if (ext4_has_feature_flex_bg(sb))
3285ce421581SJose R. Santos 		flexbg_flag = 1;
3286ce421581SJose R. Santos 
3287617ba13bSMingming Cao 	ext4_debug("Checking group descriptors");
3288ac27a0ecSDave Kleikamp 
3289197cd65aSAkinobu Mita 	for (i = 0; i < sbi->s_groups_count; i++) {
3290197cd65aSAkinobu Mita 		struct ext4_group_desc *gdp = ext4_get_group_desc(sb, i, NULL);
3291197cd65aSAkinobu Mita 
3292ce421581SJose R. Santos 		if (i == sbi->s_groups_count - 1 || flexbg_flag)
3293bd81d8eeSLaurent Vivier 			last_block = ext4_blocks_count(sbi->s_es) - 1;
3294ac27a0ecSDave Kleikamp 		else
3295ac27a0ecSDave Kleikamp 			last_block = first_block +
3296617ba13bSMingming Cao 				(EXT4_BLOCKS_PER_GROUP(sb) - 1);
3297ac27a0ecSDave Kleikamp 
3298bfff6873SLukas Czerner 		if ((grp == sbi->s_groups_count) &&
3299bfff6873SLukas Czerner 		   !(gdp->bg_flags & cpu_to_le16(EXT4_BG_INODE_ZEROED)))
3300bfff6873SLukas Czerner 			grp = i;
3301bfff6873SLukas Czerner 
33028fadc143SAlexandre Ratchov 		block_bitmap = ext4_block_bitmap(sb, gdp);
3303829fa70dSTheodore Ts'o 		if (block_bitmap == sb_block) {
3304829fa70dSTheodore Ts'o 			ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: "
3305829fa70dSTheodore Ts'o 				 "Block bitmap for group %u overlaps "
3306829fa70dSTheodore Ts'o 				 "superblock", i);
330718db4b4eSTheodore Ts'o 			if (!sb_rdonly(sb))
330818db4b4eSTheodore Ts'o 				return 0;
3309829fa70dSTheodore Ts'o 		}
331077260807STheodore Ts'o 		if (block_bitmap >= sb_block + 1 &&
331177260807STheodore Ts'o 		    block_bitmap <= last_bg_block) {
331277260807STheodore Ts'o 			ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: "
331377260807STheodore Ts'o 				 "Block bitmap for group %u overlaps "
331477260807STheodore Ts'o 				 "block group descriptors", i);
331577260807STheodore Ts'o 			if (!sb_rdonly(sb))
331677260807STheodore Ts'o 				return 0;
331777260807STheodore Ts'o 		}
33182b2d6d01STheodore Ts'o 		if (block_bitmap < first_block || block_bitmap > last_block) {
3319b31e1552SEric Sandeen 			ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: "
3320a9df9a49STheodore Ts'o 			       "Block bitmap for group %u not in group "
3321b31e1552SEric Sandeen 			       "(block %llu)!", i, block_bitmap);
3322ac27a0ecSDave Kleikamp 			return 0;
3323ac27a0ecSDave Kleikamp 		}
33248fadc143SAlexandre Ratchov 		inode_bitmap = ext4_inode_bitmap(sb, gdp);
3325829fa70dSTheodore Ts'o 		if (inode_bitmap == sb_block) {
3326829fa70dSTheodore Ts'o 			ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: "
3327829fa70dSTheodore Ts'o 				 "Inode bitmap for group %u overlaps "
3328829fa70dSTheodore Ts'o 				 "superblock", i);
332918db4b4eSTheodore Ts'o 			if (!sb_rdonly(sb))
333018db4b4eSTheodore Ts'o 				return 0;
3331829fa70dSTheodore Ts'o 		}
333277260807STheodore Ts'o 		if (inode_bitmap >= sb_block + 1 &&
333377260807STheodore Ts'o 		    inode_bitmap <= last_bg_block) {
333477260807STheodore Ts'o 			ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: "
333577260807STheodore Ts'o 				 "Inode bitmap for group %u overlaps "
333677260807STheodore Ts'o 				 "block group descriptors", i);
333777260807STheodore Ts'o 			if (!sb_rdonly(sb))
333877260807STheodore Ts'o 				return 0;
333977260807STheodore Ts'o 		}
33402b2d6d01STheodore Ts'o 		if (inode_bitmap < first_block || inode_bitmap > last_block) {
3341b31e1552SEric Sandeen 			ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: "
3342a9df9a49STheodore Ts'o 			       "Inode bitmap for group %u not in group "
3343b31e1552SEric Sandeen 			       "(block %llu)!", i, inode_bitmap);
3344ac27a0ecSDave Kleikamp 			return 0;
3345ac27a0ecSDave Kleikamp 		}
33468fadc143SAlexandre Ratchov 		inode_table = ext4_inode_table(sb, gdp);
3347829fa70dSTheodore Ts'o 		if (inode_table == sb_block) {
3348829fa70dSTheodore Ts'o 			ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: "
3349829fa70dSTheodore Ts'o 				 "Inode table for group %u overlaps "
3350829fa70dSTheodore Ts'o 				 "superblock", i);
335118db4b4eSTheodore Ts'o 			if (!sb_rdonly(sb))
335218db4b4eSTheodore Ts'o 				return 0;
3353829fa70dSTheodore Ts'o 		}
335477260807STheodore Ts'o 		if (inode_table >= sb_block + 1 &&
335577260807STheodore Ts'o 		    inode_table <= last_bg_block) {
335677260807STheodore Ts'o 			ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: "
335777260807STheodore Ts'o 				 "Inode table for group %u overlaps "
335877260807STheodore Ts'o 				 "block group descriptors", i);
335977260807STheodore Ts'o 			if (!sb_rdonly(sb))
336077260807STheodore Ts'o 				return 0;
336177260807STheodore Ts'o 		}
3362bd81d8eeSLaurent Vivier 		if (inode_table < first_block ||
33632b2d6d01STheodore Ts'o 		    inode_table + sbi->s_itb_per_group - 1 > last_block) {
3364b31e1552SEric Sandeen 			ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: "
3365a9df9a49STheodore Ts'o 			       "Inode table for group %u not in group "
3366b31e1552SEric Sandeen 			       "(block %llu)!", i, inode_table);
3367ac27a0ecSDave Kleikamp 			return 0;
3368ac27a0ecSDave Kleikamp 		}
3369955ce5f5SAneesh Kumar K.V 		ext4_lock_group(sb, i);
3370feb0ab32SDarrick J. Wong 		if (!ext4_group_desc_csum_verify(sb, i, gdp)) {
3371b31e1552SEric Sandeen 			ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: "
3372b31e1552SEric Sandeen 				 "Checksum for group %u failed (%u!=%u)",
3373e2b911c5SDarrick J. Wong 				 i, le16_to_cpu(ext4_group_desc_csum(sb, i,
3374fd2d4291SAvantika Mathur 				     gdp)), le16_to_cpu(gdp->bg_checksum));
3375bc98a42cSDavid Howells 			if (!sb_rdonly(sb)) {
3376955ce5f5SAneesh Kumar K.V 				ext4_unlock_group(sb, i);
3377717d50e4SAndreas Dilger 				return 0;
3378717d50e4SAndreas Dilger 			}
33797ee1ec4cSLi Zefan 		}
3380955ce5f5SAneesh Kumar K.V 		ext4_unlock_group(sb, i);
3381ce421581SJose R. Santos 		if (!flexbg_flag)
3382617ba13bSMingming Cao 			first_block += EXT4_BLOCKS_PER_GROUP(sb);
3383ac27a0ecSDave Kleikamp 	}
3384bfff6873SLukas Czerner 	if (NULL != first_not_zeroed)
3385bfff6873SLukas Czerner 		*first_not_zeroed = grp;
3386ac27a0ecSDave Kleikamp 	return 1;
3387ac27a0ecSDave Kleikamp }
3388ac27a0ecSDave Kleikamp 
3389cd2291a4SEric Sandeen /*
3390cd2291a4SEric Sandeen  * Maximal extent format file size.
3391cd2291a4SEric Sandeen  * Resulting logical blkno at s_maxbytes must fit in our on-disk
3392cd2291a4SEric Sandeen  * extent format containers, within a sector_t, and within i_blocks
3393cd2291a4SEric Sandeen  * in the vfs.  ext4 inode has 48 bits of i_block in fsblock units,
3394cd2291a4SEric Sandeen  * so that won't be a limiting factor.
3395cd2291a4SEric Sandeen  *
3396f17722f9SLukas Czerner  * However there is other limiting factor. We do store extents in the form
3397f17722f9SLukas Czerner  * of starting block and length, hence the resulting length of the extent
3398f17722f9SLukas Czerner  * covering maximum file size must fit into on-disk format containers as
3399f17722f9SLukas Czerner  * well. Given that length is always by 1 unit bigger than max unit (because
3400f17722f9SLukas Czerner  * we count 0 as well) we have to lower the s_maxbytes by one fs block.
3401f17722f9SLukas Czerner  *
3402cd2291a4SEric Sandeen  * Note, this does *not* consider any metadata overhead for vfs i_blocks.
3403cd2291a4SEric Sandeen  */
3404f287a1a5STheodore Ts'o static loff_t ext4_max_size(int blkbits, int has_huge_files)
3405cd2291a4SEric Sandeen {
3406cd2291a4SEric Sandeen 	loff_t res;
3407cd2291a4SEric Sandeen 	loff_t upper_limit = MAX_LFS_FILESIZE;
3408cd2291a4SEric Sandeen 
340972deb455SChristoph Hellwig 	BUILD_BUG_ON(sizeof(blkcnt_t) < sizeof(u64));
341072deb455SChristoph Hellwig 
341172deb455SChristoph Hellwig 	if (!has_huge_files) {
3412cd2291a4SEric Sandeen 		upper_limit = (1LL << 32) - 1;
3413cd2291a4SEric Sandeen 
3414cd2291a4SEric Sandeen 		/* total blocks in file system block size */
3415cd2291a4SEric Sandeen 		upper_limit >>= (blkbits - 9);
3416cd2291a4SEric Sandeen 		upper_limit <<= blkbits;
3417cd2291a4SEric Sandeen 	}
3418cd2291a4SEric Sandeen 
3419f17722f9SLukas Czerner 	/*
3420f17722f9SLukas Czerner 	 * 32-bit extent-start container, ee_block. We lower the maxbytes
3421f17722f9SLukas Czerner 	 * by one fs block, so ee_len can cover the extent of maximum file
3422f17722f9SLukas Czerner 	 * size
3423f17722f9SLukas Czerner 	 */
3424f17722f9SLukas Czerner 	res = (1LL << 32) - 1;
3425cd2291a4SEric Sandeen 	res <<= blkbits;
3426cd2291a4SEric Sandeen 
3427cd2291a4SEric Sandeen 	/* Sanity check against vm- & vfs- imposed limits */
3428cd2291a4SEric Sandeen 	if (res > upper_limit)
3429cd2291a4SEric Sandeen 		res = upper_limit;
3430cd2291a4SEric Sandeen 
3431cd2291a4SEric Sandeen 	return res;
3432cd2291a4SEric Sandeen }
3433ac27a0ecSDave Kleikamp 
3434ac27a0ecSDave Kleikamp /*
3435cd2291a4SEric Sandeen  * Maximal bitmap file size.  There is a direct, and {,double-,triple-}indirect
34360fc1b451SAneesh Kumar K.V  * block limit, and also a limit of (2^48 - 1) 512-byte sectors in i_blocks.
34370fc1b451SAneesh Kumar K.V  * We need to be 1 filesystem block less than the 2^48 sector limit.
3438ac27a0ecSDave Kleikamp  */
3439f287a1a5STheodore Ts'o static loff_t ext4_max_bitmap_size(int bits, int has_huge_files)
3440ac27a0ecSDave Kleikamp {
34415c93e8ecSZhang Yi 	loff_t upper_limit, res = EXT4_NDIR_BLOCKS;
34420fc1b451SAneesh Kumar K.V 	int meta_blocks;
34435c93e8ecSZhang Yi 	unsigned int ppb = 1 << (bits - 2);
344475ca6ad4SRitesh Harjani 
344575ca6ad4SRitesh Harjani 	/*
344675ca6ad4SRitesh Harjani 	 * This is calculated to be the largest file size for a dense, block
34470b8e58a1SAndreas Dilger 	 * mapped file such that the file's total number of 512-byte sectors,
34480b8e58a1SAndreas Dilger 	 * including data and all indirect blocks, does not exceed (2^48 - 1).
34490b8e58a1SAndreas Dilger 	 *
34500b8e58a1SAndreas Dilger 	 * __u32 i_blocks_lo and _u16 i_blocks_high represent the total
34510b8e58a1SAndreas Dilger 	 * number of 512-byte sectors of the file.
34520fc1b451SAneesh Kumar K.V 	 */
345372deb455SChristoph Hellwig 	if (!has_huge_files) {
34540fc1b451SAneesh Kumar K.V 		/*
345572deb455SChristoph Hellwig 		 * !has_huge_files or implies that the inode i_block field
345672deb455SChristoph Hellwig 		 * represents total file blocks in 2^32 512-byte sectors ==
345772deb455SChristoph Hellwig 		 * size of vfs inode i_blocks * 8
34580fc1b451SAneesh Kumar K.V 		 */
34590fc1b451SAneesh Kumar K.V 		upper_limit = (1LL << 32) - 1;
34600fc1b451SAneesh Kumar K.V 
34610fc1b451SAneesh Kumar K.V 		/* total blocks in file system block size */
34620fc1b451SAneesh Kumar K.V 		upper_limit >>= (bits - 9);
34630fc1b451SAneesh Kumar K.V 
34640fc1b451SAneesh Kumar K.V 	} else {
34658180a562SAneesh Kumar K.V 		/*
34668180a562SAneesh Kumar K.V 		 * We use 48 bit ext4_inode i_blocks
34678180a562SAneesh Kumar K.V 		 * With EXT4_HUGE_FILE_FL set the i_blocks
34688180a562SAneesh Kumar K.V 		 * represent total number of blocks in
34698180a562SAneesh Kumar K.V 		 * file system block size
34708180a562SAneesh Kumar K.V 		 */
34710fc1b451SAneesh Kumar K.V 		upper_limit = (1LL << 48) - 1;
34720fc1b451SAneesh Kumar K.V 
34730fc1b451SAneesh Kumar K.V 	}
34740fc1b451SAneesh Kumar K.V 
34755c93e8ecSZhang Yi 	/* Compute how many blocks we can address by block tree */
34765c93e8ecSZhang Yi 	res += ppb;
34775c93e8ecSZhang Yi 	res += ppb * ppb;
34785c93e8ecSZhang Yi 	res += ((loff_t)ppb) * ppb * ppb;
34795c93e8ecSZhang Yi 	/* Compute how many metadata blocks are needed */
34805c93e8ecSZhang Yi 	meta_blocks = 1;
34815c93e8ecSZhang Yi 	meta_blocks += 1 + ppb;
34825c93e8ecSZhang Yi 	meta_blocks += 1 + ppb + ppb * ppb;
34835c93e8ecSZhang Yi 	/* Does block tree limit file size? */
34845c93e8ecSZhang Yi 	if (res + meta_blocks <= upper_limit)
34855c93e8ecSZhang Yi 		goto check_lfs;
34865c93e8ecSZhang Yi 
34875c93e8ecSZhang Yi 	res = upper_limit;
34885c93e8ecSZhang Yi 	/* How many metadata blocks are needed for addressing upper_limit? */
34895c93e8ecSZhang Yi 	upper_limit -= EXT4_NDIR_BLOCKS;
34900fc1b451SAneesh Kumar K.V 	/* indirect blocks */
34910fc1b451SAneesh Kumar K.V 	meta_blocks = 1;
34925c93e8ecSZhang Yi 	upper_limit -= ppb;
34930fc1b451SAneesh Kumar K.V 	/* double indirect blocks */
34945c93e8ecSZhang Yi 	if (upper_limit < ppb * ppb) {
34955c93e8ecSZhang Yi 		meta_blocks += 1 + DIV_ROUND_UP_ULL(upper_limit, ppb);
34965c93e8ecSZhang Yi 		res -= meta_blocks;
34975c93e8ecSZhang Yi 		goto check_lfs;
34985c93e8ecSZhang Yi 	}
34995c93e8ecSZhang Yi 	meta_blocks += 1 + ppb;
35005c93e8ecSZhang Yi 	upper_limit -= ppb * ppb;
35015c93e8ecSZhang Yi 	/* tripple indirect blocks for the rest */
35025c93e8ecSZhang Yi 	meta_blocks += 1 + DIV_ROUND_UP_ULL(upper_limit, ppb) +
35035c93e8ecSZhang Yi 		DIV_ROUND_UP_ULL(upper_limit, ppb*ppb);
35045c93e8ecSZhang Yi 	res -= meta_blocks;
35055c93e8ecSZhang Yi check_lfs:
3506ac27a0ecSDave Kleikamp 	res <<= bits;
35070fc1b451SAneesh Kumar K.V 	if (res > MAX_LFS_FILESIZE)
35080fc1b451SAneesh Kumar K.V 		res = MAX_LFS_FILESIZE;
35090fc1b451SAneesh Kumar K.V 
35105c93e8ecSZhang Yi 	return res;
3511ac27a0ecSDave Kleikamp }
3512ac27a0ecSDave Kleikamp 
3513617ba13bSMingming Cao static ext4_fsblk_t descriptor_loc(struct super_block *sb,
351470bbb3e0SAndrew Morton 				   ext4_fsblk_t logical_sb_block, int nr)
3515ac27a0ecSDave Kleikamp {
3516617ba13bSMingming Cao 	struct ext4_sb_info *sbi = EXT4_SB(sb);
3517fd2d4291SAvantika Mathur 	ext4_group_t bg, first_meta_bg;
3518ac27a0ecSDave Kleikamp 	int has_super = 0;
3519ac27a0ecSDave Kleikamp 
3520ac27a0ecSDave Kleikamp 	first_meta_bg = le32_to_cpu(sbi->s_es->s_first_meta_bg);
3521ac27a0ecSDave Kleikamp 
3522e2b911c5SDarrick J. Wong 	if (!ext4_has_feature_meta_bg(sb) || nr < first_meta_bg)
352370bbb3e0SAndrew Morton 		return logical_sb_block + nr + 1;
3524ac27a0ecSDave Kleikamp 	bg = sbi->s_desc_per_block * nr;
3525617ba13bSMingming Cao 	if (ext4_bg_has_super(sb, bg))
3526ac27a0ecSDave Kleikamp 		has_super = 1;
35270b8e58a1SAndreas Dilger 
3528bd63f6b0SDarrick J. Wong 	/*
3529bd63f6b0SDarrick J. Wong 	 * If we have a meta_bg fs with 1k blocks, group 0's GDT is at
3530bd63f6b0SDarrick J. Wong 	 * block 2, not 1.  If s_first_data_block == 0 (bigalloc is enabled
3531bd63f6b0SDarrick J. Wong 	 * on modern mke2fs or blksize > 1k on older mke2fs) then we must
3532bd63f6b0SDarrick J. Wong 	 * compensate.
3533bd63f6b0SDarrick J. Wong 	 */
3534bd63f6b0SDarrick J. Wong 	if (sb->s_blocksize == 1024 && nr == 0 &&
353549598e04SJun Piao 	    le32_to_cpu(sbi->s_es->s_first_data_block) == 0)
3536bd63f6b0SDarrick J. Wong 		has_super++;
3537bd63f6b0SDarrick J. Wong 
3538617ba13bSMingming Cao 	return (has_super + ext4_group_first_block_no(sb, bg));
3539ac27a0ecSDave Kleikamp }
3540ac27a0ecSDave Kleikamp 
3541c9de560dSAlex Tomas /**
3542c9de560dSAlex Tomas  * ext4_get_stripe_size: Get the stripe size.
3543c9de560dSAlex Tomas  * @sbi: In memory super block info
3544c9de560dSAlex Tomas  *
3545c9de560dSAlex Tomas  * If we have specified it via mount option, then
3546c9de560dSAlex Tomas  * use the mount option value. If the value specified at mount time is
3547c9de560dSAlex Tomas  * greater than the blocks per group use the super block value.
3548c9de560dSAlex Tomas  * If the super block value is greater than blocks per group return 0.
3549c9de560dSAlex Tomas  * Allocator needs it be less than blocks per group.
3550c9de560dSAlex Tomas  *
3551c9de560dSAlex Tomas  */
3552c9de560dSAlex Tomas static unsigned long ext4_get_stripe_size(struct ext4_sb_info *sbi)
3553c9de560dSAlex Tomas {
3554c9de560dSAlex Tomas 	unsigned long stride = le16_to_cpu(sbi->s_es->s_raid_stride);
3555c9de560dSAlex Tomas 	unsigned long stripe_width =
3556c9de560dSAlex Tomas 			le32_to_cpu(sbi->s_es->s_raid_stripe_width);
35573eb08658SDan Ehrenberg 	int ret;
3558c9de560dSAlex Tomas 
3559c9de560dSAlex Tomas 	if (sbi->s_stripe && sbi->s_stripe <= sbi->s_blocks_per_group)
35603eb08658SDan Ehrenberg 		ret = sbi->s_stripe;
35615469d7c3SJan Kara 	else if (stripe_width && stripe_width <= sbi->s_blocks_per_group)
35623eb08658SDan Ehrenberg 		ret = stripe_width;
35635469d7c3SJan Kara 	else if (stride && stride <= sbi->s_blocks_per_group)
35643eb08658SDan Ehrenberg 		ret = stride;
35653eb08658SDan Ehrenberg 	else
35663eb08658SDan Ehrenberg 		ret = 0;
3567c9de560dSAlex Tomas 
35683eb08658SDan Ehrenberg 	/*
35693eb08658SDan Ehrenberg 	 * If the stripe width is 1, this makes no sense and
35703eb08658SDan Ehrenberg 	 * we set it to 0 to turn off stripe handling code.
35713eb08658SDan Ehrenberg 	 */
35723eb08658SDan Ehrenberg 	if (ret <= 1)
35733eb08658SDan Ehrenberg 		ret = 0;
3574c9de560dSAlex Tomas 
35753eb08658SDan Ehrenberg 	return ret;
3576c9de560dSAlex Tomas }
3577ac27a0ecSDave Kleikamp 
3578a13fb1a4SEric Sandeen /*
3579a13fb1a4SEric Sandeen  * Check whether this filesystem can be mounted based on
3580a13fb1a4SEric Sandeen  * the features present and the RDONLY/RDWR mount requested.
3581a13fb1a4SEric Sandeen  * Returns 1 if this filesystem can be mounted as requested,
3582a13fb1a4SEric Sandeen  * 0 if it cannot be.
3583a13fb1a4SEric Sandeen  */
358425c6d98fSJan Kara int ext4_feature_set_ok(struct super_block *sb, int readonly)
3585a13fb1a4SEric Sandeen {
3586e2b911c5SDarrick J. Wong 	if (ext4_has_unknown_ext4_incompat_features(sb)) {
3587a13fb1a4SEric Sandeen 		ext4_msg(sb, KERN_ERR,
3588a13fb1a4SEric Sandeen 			"Couldn't mount because of "
3589a13fb1a4SEric Sandeen 			"unsupported optional features (%x)",
3590a13fb1a4SEric Sandeen 			(le32_to_cpu(EXT4_SB(sb)->s_es->s_feature_incompat) &
3591a13fb1a4SEric Sandeen 			~EXT4_FEATURE_INCOMPAT_SUPP));
3592a13fb1a4SEric Sandeen 		return 0;
3593a13fb1a4SEric Sandeen 	}
3594a13fb1a4SEric Sandeen 
35955298d4bfSChristoph Hellwig #if !IS_ENABLED(CONFIG_UNICODE)
3596c83ad55eSGabriel Krisman Bertazi 	if (ext4_has_feature_casefold(sb)) {
3597c83ad55eSGabriel Krisman Bertazi 		ext4_msg(sb, KERN_ERR,
3598c83ad55eSGabriel Krisman Bertazi 			 "Filesystem with casefold feature cannot be "
3599c83ad55eSGabriel Krisman Bertazi 			 "mounted without CONFIG_UNICODE");
3600c83ad55eSGabriel Krisman Bertazi 		return 0;
3601c83ad55eSGabriel Krisman Bertazi 	}
3602c83ad55eSGabriel Krisman Bertazi #endif
3603c83ad55eSGabriel Krisman Bertazi 
3604a13fb1a4SEric Sandeen 	if (readonly)
3605a13fb1a4SEric Sandeen 		return 1;
3606a13fb1a4SEric Sandeen 
3607e2b911c5SDarrick J. Wong 	if (ext4_has_feature_readonly(sb)) {
36082cb5cc8bSDarrick J. Wong 		ext4_msg(sb, KERN_INFO, "filesystem is read-only");
36091751e8a6SLinus Torvalds 		sb->s_flags |= SB_RDONLY;
36102cb5cc8bSDarrick J. Wong 		return 1;
36112cb5cc8bSDarrick J. Wong 	}
36122cb5cc8bSDarrick J. Wong 
3613a13fb1a4SEric Sandeen 	/* Check that feature set is OK for a read-write mount */
3614e2b911c5SDarrick J. Wong 	if (ext4_has_unknown_ext4_ro_compat_features(sb)) {
3615a13fb1a4SEric Sandeen 		ext4_msg(sb, KERN_ERR, "couldn't mount RDWR because of "
3616a13fb1a4SEric Sandeen 			 "unsupported optional features (%x)",
3617a13fb1a4SEric Sandeen 			 (le32_to_cpu(EXT4_SB(sb)->s_es->s_feature_ro_compat) &
3618a13fb1a4SEric Sandeen 				~EXT4_FEATURE_RO_COMPAT_SUPP));
3619a13fb1a4SEric Sandeen 		return 0;
3620a13fb1a4SEric Sandeen 	}
3621e2b911c5SDarrick J. Wong 	if (ext4_has_feature_bigalloc(sb) && !ext4_has_feature_extents(sb)) {
3622bab08ab9STheodore Ts'o 		ext4_msg(sb, KERN_ERR,
3623bab08ab9STheodore Ts'o 			 "Can't support bigalloc feature without "
3624bab08ab9STheodore Ts'o 			 "extents feature\n");
3625bab08ab9STheodore Ts'o 		return 0;
3626bab08ab9STheodore Ts'o 	}
36277c319d32SAditya Kali 
36289db176bcSJan Kara #if !IS_ENABLED(CONFIG_QUOTA) || !IS_ENABLED(CONFIG_QFMT_V2)
3629d65d87a0STheodore Ts'o 	if (!readonly && (ext4_has_feature_quota(sb) ||
3630d65d87a0STheodore Ts'o 			  ext4_has_feature_project(sb))) {
36317c319d32SAditya Kali 		ext4_msg(sb, KERN_ERR,
3632d65d87a0STheodore Ts'o 			 "The kernel was not built with CONFIG_QUOTA and CONFIG_QFMT_V2");
3633689c958cSLi Xi 		return 0;
3634689c958cSLi Xi 	}
36357c319d32SAditya Kali #endif  /* CONFIG_QUOTA */
3636a13fb1a4SEric Sandeen 	return 1;
3637a13fb1a4SEric Sandeen }
3638a13fb1a4SEric Sandeen 
363966e61a9eSTheodore Ts'o /*
364066e61a9eSTheodore Ts'o  * This function is called once a day if we have errors logged
364166e61a9eSTheodore Ts'o  * on the file system
364266e61a9eSTheodore Ts'o  */
3643235699a8SKees Cook static void print_daily_error_info(struct timer_list *t)
364466e61a9eSTheodore Ts'o {
3645235699a8SKees Cook 	struct ext4_sb_info *sbi = from_timer(sbi, t, s_err_report);
3646235699a8SKees Cook 	struct super_block *sb = sbi->s_sb;
3647235699a8SKees Cook 	struct ext4_super_block *es = sbi->s_es;
364866e61a9eSTheodore Ts'o 
364966e61a9eSTheodore Ts'o 	if (es->s_error_count)
3650ae0f78deSTheodore Ts'o 		/* fsck newer than v1.41.13 is needed to clean this condition. */
3651ae0f78deSTheodore Ts'o 		ext4_msg(sb, KERN_NOTICE, "error count since last fsck: %u",
365266e61a9eSTheodore Ts'o 			 le32_to_cpu(es->s_error_count));
365366e61a9eSTheodore Ts'o 	if (es->s_first_error_time) {
36546a0678a7SArnd Bergmann 		printk(KERN_NOTICE "EXT4-fs (%s): initial error at time %llu: %.*s:%d",
36556a0678a7SArnd Bergmann 		       sb->s_id,
36566a0678a7SArnd Bergmann 		       ext4_get_tstamp(es, s_first_error_time),
365766e61a9eSTheodore Ts'o 		       (int) sizeof(es->s_first_error_func),
365866e61a9eSTheodore Ts'o 		       es->s_first_error_func,
365966e61a9eSTheodore Ts'o 		       le32_to_cpu(es->s_first_error_line));
366066e61a9eSTheodore Ts'o 		if (es->s_first_error_ino)
3661651e1c3bSJoe Perches 			printk(KERN_CONT ": inode %u",
366266e61a9eSTheodore Ts'o 			       le32_to_cpu(es->s_first_error_ino));
366366e61a9eSTheodore Ts'o 		if (es->s_first_error_block)
3664651e1c3bSJoe Perches 			printk(KERN_CONT ": block %llu", (unsigned long long)
366566e61a9eSTheodore Ts'o 			       le64_to_cpu(es->s_first_error_block));
3666651e1c3bSJoe Perches 		printk(KERN_CONT "\n");
366766e61a9eSTheodore Ts'o 	}
366866e61a9eSTheodore Ts'o 	if (es->s_last_error_time) {
36696a0678a7SArnd Bergmann 		printk(KERN_NOTICE "EXT4-fs (%s): last error at time %llu: %.*s:%d",
36706a0678a7SArnd Bergmann 		       sb->s_id,
36716a0678a7SArnd Bergmann 		       ext4_get_tstamp(es, s_last_error_time),
367266e61a9eSTheodore Ts'o 		       (int) sizeof(es->s_last_error_func),
367366e61a9eSTheodore Ts'o 		       es->s_last_error_func,
367466e61a9eSTheodore Ts'o 		       le32_to_cpu(es->s_last_error_line));
367566e61a9eSTheodore Ts'o 		if (es->s_last_error_ino)
3676651e1c3bSJoe Perches 			printk(KERN_CONT ": inode %u",
367766e61a9eSTheodore Ts'o 			       le32_to_cpu(es->s_last_error_ino));
367866e61a9eSTheodore Ts'o 		if (es->s_last_error_block)
3679651e1c3bSJoe Perches 			printk(KERN_CONT ": block %llu", (unsigned long long)
368066e61a9eSTheodore Ts'o 			       le64_to_cpu(es->s_last_error_block));
3681651e1c3bSJoe Perches 		printk(KERN_CONT "\n");
368266e61a9eSTheodore Ts'o 	}
368366e61a9eSTheodore Ts'o 	mod_timer(&sbi->s_err_report, jiffies + 24*60*60*HZ);  /* Once a day */
368466e61a9eSTheodore Ts'o }
368566e61a9eSTheodore Ts'o 
3686bfff6873SLukas Czerner /* Find next suitable group and run ext4_init_inode_table */
3687bfff6873SLukas Czerner static int ext4_run_li_request(struct ext4_li_request *elr)
3688bfff6873SLukas Czerner {
3689bfff6873SLukas Czerner 	struct ext4_group_desc *gdp = NULL;
36903d392b26STheodore Ts'o 	struct super_block *sb = elr->lr_super;
36913d392b26STheodore Ts'o 	ext4_group_t ngroups = EXT4_SB(sb)->s_groups_count;
36923d392b26STheodore Ts'o 	ext4_group_t group = elr->lr_next_group;
36933d392b26STheodore Ts'o 	unsigned int prefetch_ios = 0;
3694bfff6873SLukas Czerner 	int ret = 0;
369539fec688SShaoying Xu 	u64 start_time;
3696bfff6873SLukas Czerner 
36973d392b26STheodore Ts'o 	if (elr->lr_mode == EXT4_LI_MODE_PREFETCH_BBITMAP) {
36983d392b26STheodore Ts'o 		elr->lr_next_group = ext4_mb_prefetch(sb, group,
36993d392b26STheodore Ts'o 				EXT4_SB(sb)->s_mb_prefetch, &prefetch_ios);
37003d392b26STheodore Ts'o 		if (prefetch_ios)
37013d392b26STheodore Ts'o 			ext4_mb_prefetch_fini(sb, elr->lr_next_group,
37023d392b26STheodore Ts'o 					      prefetch_ios);
37033d392b26STheodore Ts'o 		trace_ext4_prefetch_bitmaps(sb, group, elr->lr_next_group,
37043d392b26STheodore Ts'o 					    prefetch_ios);
37053d392b26STheodore Ts'o 		if (group >= elr->lr_next_group) {
37063d392b26STheodore Ts'o 			ret = 1;
37073d392b26STheodore Ts'o 			if (elr->lr_first_not_zeroed != ngroups &&
37083d392b26STheodore Ts'o 			    !sb_rdonly(sb) && test_opt(sb, INIT_INODE_TABLE)) {
37093d392b26STheodore Ts'o 				elr->lr_next_group = elr->lr_first_not_zeroed;
37103d392b26STheodore Ts'o 				elr->lr_mode = EXT4_LI_MODE_ITABLE;
37113d392b26STheodore Ts'o 				ret = 0;
37123d392b26STheodore Ts'o 			}
37133d392b26STheodore Ts'o 		}
37143d392b26STheodore Ts'o 		return ret;
37153d392b26STheodore Ts'o 	}
3716bfff6873SLukas Czerner 
37173d392b26STheodore Ts'o 	for (; group < ngroups; group++) {
3718bfff6873SLukas Czerner 		gdp = ext4_get_group_desc(sb, group, NULL);
3719bfff6873SLukas Czerner 		if (!gdp) {
3720bfff6873SLukas Czerner 			ret = 1;
3721bfff6873SLukas Czerner 			break;
3722bfff6873SLukas Czerner 		}
3723bfff6873SLukas Czerner 
3724bfff6873SLukas Czerner 		if (!(gdp->bg_flags & cpu_to_le16(EXT4_BG_INODE_ZEROED)))
3725bfff6873SLukas Czerner 			break;
3726bfff6873SLukas Czerner 	}
3727bfff6873SLukas Czerner 
37287f511862STheodore Ts'o 	if (group >= ngroups)
3729bfff6873SLukas Czerner 		ret = 1;
3730bfff6873SLukas Czerner 
3731bfff6873SLukas Czerner 	if (!ret) {
373239fec688SShaoying Xu 		start_time = ktime_get_real_ns();
3733bfff6873SLukas Czerner 		ret = ext4_init_inode_table(sb, group,
3734bfff6873SLukas Czerner 					    elr->lr_timeout ? 0 : 1);
37353d392b26STheodore Ts'o 		trace_ext4_lazy_itable_init(sb, group);
3736bfff6873SLukas Czerner 		if (elr->lr_timeout == 0) {
373739fec688SShaoying Xu 			elr->lr_timeout = nsecs_to_jiffies((ktime_get_real_ns() - start_time) *
373839fec688SShaoying Xu 				EXT4_SB(elr->lr_super)->s_li_wait_mult);
3739bfff6873SLukas Czerner 		}
3740bfff6873SLukas Czerner 		elr->lr_next_sched = jiffies + elr->lr_timeout;
3741bfff6873SLukas Czerner 		elr->lr_next_group = group + 1;
3742bfff6873SLukas Czerner 	}
3743bfff6873SLukas Czerner 	return ret;
3744bfff6873SLukas Czerner }
3745bfff6873SLukas Czerner 
3746bfff6873SLukas Czerner /*
3747bfff6873SLukas Czerner  * Remove lr_request from the list_request and free the
37484ed5c033SLukas Czerner  * request structure. Should be called with li_list_mtx held
3749bfff6873SLukas Czerner  */
3750bfff6873SLukas Czerner static void ext4_remove_li_request(struct ext4_li_request *elr)
3751bfff6873SLukas Czerner {
3752bfff6873SLukas Czerner 	if (!elr)
3753bfff6873SLukas Czerner 		return;
3754bfff6873SLukas Czerner 
3755bfff6873SLukas Czerner 	list_del(&elr->lr_request);
37563d392b26STheodore Ts'o 	EXT4_SB(elr->lr_super)->s_li_request = NULL;
3757bfff6873SLukas Czerner 	kfree(elr);
3758bfff6873SLukas Czerner }
3759bfff6873SLukas Czerner 
3760bfff6873SLukas Czerner static void ext4_unregister_li_request(struct super_block *sb)
3761bfff6873SLukas Czerner {
37621bb933fbSLukas Czerner 	mutex_lock(&ext4_li_mtx);
37631bb933fbSLukas Czerner 	if (!ext4_li_info) {
37641bb933fbSLukas Czerner 		mutex_unlock(&ext4_li_mtx);
3765bfff6873SLukas Czerner 		return;
37661bb933fbSLukas Czerner 	}
3767bfff6873SLukas Czerner 
3768bfff6873SLukas Czerner 	mutex_lock(&ext4_li_info->li_list_mtx);
37691bb933fbSLukas Czerner 	ext4_remove_li_request(EXT4_SB(sb)->s_li_request);
3770bfff6873SLukas Czerner 	mutex_unlock(&ext4_li_info->li_list_mtx);
37711bb933fbSLukas Czerner 	mutex_unlock(&ext4_li_mtx);
3772bfff6873SLukas Czerner }
3773bfff6873SLukas Czerner 
37748f1f7453SEric Sandeen static struct task_struct *ext4_lazyinit_task;
37758f1f7453SEric Sandeen 
3776bfff6873SLukas Czerner /*
3777bfff6873SLukas Czerner  * This is the function where ext4lazyinit thread lives. It walks
3778bfff6873SLukas Czerner  * through the request list searching for next scheduled filesystem.
3779bfff6873SLukas Czerner  * When such a fs is found, run the lazy initialization request
3780bfff6873SLukas Czerner  * (ext4_rn_li_request) and keep track of the time spend in this
3781bfff6873SLukas Czerner  * function. Based on that time we compute next schedule time of
3782bfff6873SLukas Czerner  * the request. When walking through the list is complete, compute
3783bfff6873SLukas Czerner  * next waking time and put itself into sleep.
3784bfff6873SLukas Czerner  */
3785bfff6873SLukas Czerner static int ext4_lazyinit_thread(void *arg)
3786bfff6873SLukas Czerner {
3787c30365b9SYu Zhe 	struct ext4_lazy_init *eli = arg;
3788bfff6873SLukas Czerner 	struct list_head *pos, *n;
3789bfff6873SLukas Czerner 	struct ext4_li_request *elr;
37904ed5c033SLukas Czerner 	unsigned long next_wakeup, cur;
3791bfff6873SLukas Czerner 
3792bfff6873SLukas Czerner 	BUG_ON(NULL == eli);
37933b575495SLalith Rajendran 	set_freezable();
3794bfff6873SLukas Czerner 
3795bfff6873SLukas Czerner cont_thread:
3796bfff6873SLukas Czerner 	while (true) {
3797bfff6873SLukas Czerner 		next_wakeup = MAX_JIFFY_OFFSET;
3798bfff6873SLukas Czerner 
3799bfff6873SLukas Czerner 		mutex_lock(&eli->li_list_mtx);
3800bfff6873SLukas Czerner 		if (list_empty(&eli->li_request_list)) {
3801bfff6873SLukas Czerner 			mutex_unlock(&eli->li_list_mtx);
3802bfff6873SLukas Czerner 			goto exit_thread;
3803bfff6873SLukas Czerner 		}
3804bfff6873SLukas Czerner 		list_for_each_safe(pos, n, &eli->li_request_list) {
3805e22834f0SDmitry Monakhov 			int err = 0;
3806e22834f0SDmitry Monakhov 			int progress = 0;
3807bfff6873SLukas Czerner 			elr = list_entry(pos, struct ext4_li_request,
3808bfff6873SLukas Czerner 					 lr_request);
3809bfff6873SLukas Czerner 
3810e22834f0SDmitry Monakhov 			if (time_before(jiffies, elr->lr_next_sched)) {
3811e22834f0SDmitry Monakhov 				if (time_before(elr->lr_next_sched, next_wakeup))
3812e22834f0SDmitry Monakhov 					next_wakeup = elr->lr_next_sched;
3813e22834f0SDmitry Monakhov 				continue;
3814e22834f0SDmitry Monakhov 			}
3815e22834f0SDmitry Monakhov 			if (down_read_trylock(&elr->lr_super->s_umount)) {
3816e22834f0SDmitry Monakhov 				if (sb_start_write_trylock(elr->lr_super)) {
3817e22834f0SDmitry Monakhov 					progress = 1;
3818e22834f0SDmitry Monakhov 					/*
3819e22834f0SDmitry Monakhov 					 * We hold sb->s_umount, sb can not
3820e22834f0SDmitry Monakhov 					 * be removed from the list, it is
3821e22834f0SDmitry Monakhov 					 * now safe to drop li_list_mtx
3822e22834f0SDmitry Monakhov 					 */
3823e22834f0SDmitry Monakhov 					mutex_unlock(&eli->li_list_mtx);
3824e22834f0SDmitry Monakhov 					err = ext4_run_li_request(elr);
3825e22834f0SDmitry Monakhov 					sb_end_write(elr->lr_super);
3826e22834f0SDmitry Monakhov 					mutex_lock(&eli->li_list_mtx);
3827e22834f0SDmitry Monakhov 					n = pos->next;
3828e22834f0SDmitry Monakhov 				}
3829e22834f0SDmitry Monakhov 				up_read((&elr->lr_super->s_umount));
3830e22834f0SDmitry Monakhov 			}
3831b2c78cd0STheodore Ts'o 			/* error, remove the lazy_init job */
3832e22834f0SDmitry Monakhov 			if (err) {
3833bfff6873SLukas Czerner 				ext4_remove_li_request(elr);
3834bfff6873SLukas Czerner 				continue;
3835bfff6873SLukas Czerner 			}
3836e22834f0SDmitry Monakhov 			if (!progress) {
3837e22834f0SDmitry Monakhov 				elr->lr_next_sched = jiffies +
38388032bf12SJason A. Donenfeld 					get_random_u32_below(EXT4_DEF_LI_MAX_START_DELAY * HZ);
3839b2c78cd0STheodore Ts'o 			}
3840bfff6873SLukas Czerner 			if (time_before(elr->lr_next_sched, next_wakeup))
3841bfff6873SLukas Czerner 				next_wakeup = elr->lr_next_sched;
3842bfff6873SLukas Czerner 		}
3843bfff6873SLukas Czerner 		mutex_unlock(&eli->li_list_mtx);
3844bfff6873SLukas Czerner 
3845a0acae0eSTejun Heo 		try_to_freeze();
3846bfff6873SLukas Czerner 
38474ed5c033SLukas Czerner 		cur = jiffies;
38484ed5c033SLukas Czerner 		if ((time_after_eq(cur, next_wakeup)) ||
3849f4245bd4SLukas Czerner 		    (MAX_JIFFY_OFFSET == next_wakeup)) {
3850bfff6873SLukas Czerner 			cond_resched();
3851bfff6873SLukas Czerner 			continue;
3852bfff6873SLukas Czerner 		}
3853bfff6873SLukas Czerner 
38544ed5c033SLukas Czerner 		schedule_timeout_interruptible(next_wakeup - cur);
38554ed5c033SLukas Czerner 
38568f1f7453SEric Sandeen 		if (kthread_should_stop()) {
38578f1f7453SEric Sandeen 			ext4_clear_request_list();
38588f1f7453SEric Sandeen 			goto exit_thread;
38598f1f7453SEric Sandeen 		}
3860bfff6873SLukas Czerner 	}
3861bfff6873SLukas Czerner 
3862bfff6873SLukas Czerner exit_thread:
3863bfff6873SLukas Czerner 	/*
3864bfff6873SLukas Czerner 	 * It looks like the request list is empty, but we need
3865bfff6873SLukas Czerner 	 * to check it under the li_list_mtx lock, to prevent any
3866bfff6873SLukas Czerner 	 * additions into it, and of course we should lock ext4_li_mtx
3867bfff6873SLukas Czerner 	 * to atomically free the list and ext4_li_info, because at
3868bfff6873SLukas Czerner 	 * this point another ext4 filesystem could be registering
3869bfff6873SLukas Czerner 	 * new one.
3870bfff6873SLukas Czerner 	 */
3871bfff6873SLukas Czerner 	mutex_lock(&ext4_li_mtx);
3872bfff6873SLukas Czerner 	mutex_lock(&eli->li_list_mtx);
3873bfff6873SLukas Czerner 	if (!list_empty(&eli->li_request_list)) {
3874bfff6873SLukas Czerner 		mutex_unlock(&eli->li_list_mtx);
3875bfff6873SLukas Czerner 		mutex_unlock(&ext4_li_mtx);
3876bfff6873SLukas Czerner 		goto cont_thread;
3877bfff6873SLukas Czerner 	}
3878bfff6873SLukas Czerner 	mutex_unlock(&eli->li_list_mtx);
3879bfff6873SLukas Czerner 	kfree(ext4_li_info);
3880bfff6873SLukas Czerner 	ext4_li_info = NULL;
3881bfff6873SLukas Czerner 	mutex_unlock(&ext4_li_mtx);
3882bfff6873SLukas Czerner 
3883bfff6873SLukas Czerner 	return 0;
3884bfff6873SLukas Czerner }
3885bfff6873SLukas Czerner 
3886bfff6873SLukas Czerner static void ext4_clear_request_list(void)
3887bfff6873SLukas Czerner {
3888bfff6873SLukas Czerner 	struct list_head *pos, *n;
3889bfff6873SLukas Czerner 	struct ext4_li_request *elr;
3890bfff6873SLukas Czerner 
3891bfff6873SLukas Czerner 	mutex_lock(&ext4_li_info->li_list_mtx);
3892bfff6873SLukas Czerner 	list_for_each_safe(pos, n, &ext4_li_info->li_request_list) {
3893bfff6873SLukas Czerner 		elr = list_entry(pos, struct ext4_li_request,
3894bfff6873SLukas Czerner 				 lr_request);
3895bfff6873SLukas Czerner 		ext4_remove_li_request(elr);
3896bfff6873SLukas Czerner 	}
3897bfff6873SLukas Czerner 	mutex_unlock(&ext4_li_info->li_list_mtx);
3898bfff6873SLukas Czerner }
3899bfff6873SLukas Czerner 
3900bfff6873SLukas Czerner static int ext4_run_lazyinit_thread(void)
3901bfff6873SLukas Czerner {
39028f1f7453SEric Sandeen 	ext4_lazyinit_task = kthread_run(ext4_lazyinit_thread,
39038f1f7453SEric Sandeen 					 ext4_li_info, "ext4lazyinit");
39048f1f7453SEric Sandeen 	if (IS_ERR(ext4_lazyinit_task)) {
39058f1f7453SEric Sandeen 		int err = PTR_ERR(ext4_lazyinit_task);
3906bfff6873SLukas Czerner 		ext4_clear_request_list();
3907bfff6873SLukas Czerner 		kfree(ext4_li_info);
3908bfff6873SLukas Czerner 		ext4_li_info = NULL;
390992b97816STheodore Ts'o 		printk(KERN_CRIT "EXT4-fs: error %d creating inode table "
3910bfff6873SLukas Czerner 				 "initialization thread\n",
3911bfff6873SLukas Czerner 				 err);
3912bfff6873SLukas Czerner 		return err;
3913bfff6873SLukas Czerner 	}
3914bfff6873SLukas Czerner 	ext4_li_info->li_state |= EXT4_LAZYINIT_RUNNING;
3915bfff6873SLukas Czerner 	return 0;
3916bfff6873SLukas Czerner }
3917bfff6873SLukas Czerner 
3918bfff6873SLukas Czerner /*
3919bfff6873SLukas Czerner  * Check whether it make sense to run itable init. thread or not.
3920bfff6873SLukas Czerner  * If there is at least one uninitialized inode table, return
3921bfff6873SLukas Czerner  * corresponding group number, else the loop goes through all
3922bfff6873SLukas Czerner  * groups and return total number of groups.
3923bfff6873SLukas Czerner  */
3924bfff6873SLukas Czerner static ext4_group_t ext4_has_uninit_itable(struct super_block *sb)
3925bfff6873SLukas Czerner {
3926bfff6873SLukas Czerner 	ext4_group_t group, ngroups = EXT4_SB(sb)->s_groups_count;
3927bfff6873SLukas Czerner 	struct ext4_group_desc *gdp = NULL;
3928bfff6873SLukas Czerner 
39298844618dSTheodore Ts'o 	if (!ext4_has_group_desc_csum(sb))
39308844618dSTheodore Ts'o 		return ngroups;
39318844618dSTheodore Ts'o 
3932bfff6873SLukas Czerner 	for (group = 0; group < ngroups; group++) {
3933bfff6873SLukas Czerner 		gdp = ext4_get_group_desc(sb, group, NULL);
3934bfff6873SLukas Czerner 		if (!gdp)
3935bfff6873SLukas Czerner 			continue;
3936bfff6873SLukas Czerner 
393750122847STheodore Ts'o 		if (!(gdp->bg_flags & cpu_to_le16(EXT4_BG_INODE_ZEROED)))
3938bfff6873SLukas Czerner 			break;
3939bfff6873SLukas Czerner 	}
3940bfff6873SLukas Czerner 
3941bfff6873SLukas Czerner 	return group;
3942bfff6873SLukas Czerner }
3943bfff6873SLukas Czerner 
3944bfff6873SLukas Czerner static int ext4_li_info_new(void)
3945bfff6873SLukas Czerner {
3946bfff6873SLukas Czerner 	struct ext4_lazy_init *eli = NULL;
3947bfff6873SLukas Czerner 
3948bfff6873SLukas Czerner 	eli = kzalloc(sizeof(*eli), GFP_KERNEL);
3949bfff6873SLukas Czerner 	if (!eli)
3950bfff6873SLukas Czerner 		return -ENOMEM;
3951bfff6873SLukas Czerner 
3952bfff6873SLukas Czerner 	INIT_LIST_HEAD(&eli->li_request_list);
3953bfff6873SLukas Czerner 	mutex_init(&eli->li_list_mtx);
3954bfff6873SLukas Czerner 
3955bfff6873SLukas Czerner 	eli->li_state |= EXT4_LAZYINIT_QUIT;
3956bfff6873SLukas Czerner 
3957bfff6873SLukas Czerner 	ext4_li_info = eli;
3958bfff6873SLukas Czerner 
3959bfff6873SLukas Czerner 	return 0;
3960bfff6873SLukas Czerner }
3961bfff6873SLukas Czerner 
3962bfff6873SLukas Czerner static struct ext4_li_request *ext4_li_request_new(struct super_block *sb,
3963bfff6873SLukas Czerner 					    ext4_group_t start)
3964bfff6873SLukas Czerner {
3965bfff6873SLukas Czerner 	struct ext4_li_request *elr;
3966bfff6873SLukas Czerner 
3967bfff6873SLukas Czerner 	elr = kzalloc(sizeof(*elr), GFP_KERNEL);
3968bfff6873SLukas Czerner 	if (!elr)
3969bfff6873SLukas Czerner 		return NULL;
3970bfff6873SLukas Czerner 
3971bfff6873SLukas Czerner 	elr->lr_super = sb;
39723d392b26STheodore Ts'o 	elr->lr_first_not_zeroed = start;
397321175ca4SHarshad Shirwadkar 	if (test_opt(sb, NO_PREFETCH_BLOCK_BITMAPS)) {
39743d392b26STheodore Ts'o 		elr->lr_mode = EXT4_LI_MODE_ITABLE;
3975bfff6873SLukas Czerner 		elr->lr_next_group = start;
397621175ca4SHarshad Shirwadkar 	} else {
397721175ca4SHarshad Shirwadkar 		elr->lr_mode = EXT4_LI_MODE_PREFETCH_BBITMAP;
39783d392b26STheodore Ts'o 	}
3979bfff6873SLukas Czerner 
3980bfff6873SLukas Czerner 	/*
3981bfff6873SLukas Czerner 	 * Randomize first schedule time of the request to
3982bfff6873SLukas Czerner 	 * spread the inode table initialization requests
3983bfff6873SLukas Czerner 	 * better.
3984bfff6873SLukas Czerner 	 */
39858032bf12SJason A. Donenfeld 	elr->lr_next_sched = jiffies + get_random_u32_below(EXT4_DEF_LI_MAX_START_DELAY * HZ);
3986bfff6873SLukas Czerner 	return elr;
3987bfff6873SLukas Czerner }
3988bfff6873SLukas Czerner 
39897f511862STheodore Ts'o int ext4_register_li_request(struct super_block *sb,
3990bfff6873SLukas Czerner 			     ext4_group_t first_not_zeroed)
3991bfff6873SLukas Czerner {
3992bfff6873SLukas Czerner 	struct ext4_sb_info *sbi = EXT4_SB(sb);
39937f511862STheodore Ts'o 	struct ext4_li_request *elr = NULL;
399449598e04SJun Piao 	ext4_group_t ngroups = sbi->s_groups_count;
39956c5a6cb9SAndrew Morton 	int ret = 0;
3996bfff6873SLukas Czerner 
39977f511862STheodore Ts'o 	mutex_lock(&ext4_li_mtx);
399851ce6511SLukas Czerner 	if (sbi->s_li_request != NULL) {
399951ce6511SLukas Czerner 		/*
400051ce6511SLukas Czerner 		 * Reset timeout so it can be computed again, because
400151ce6511SLukas Czerner 		 * s_li_wait_mult might have changed.
400251ce6511SLukas Czerner 		 */
400351ce6511SLukas Czerner 		sbi->s_li_request->lr_timeout = 0;
40047f511862STheodore Ts'o 		goto out;
400551ce6511SLukas Czerner 	}
4006bfff6873SLukas Czerner 
4007426d15adSJosh Triplett 	if (sb_rdonly(sb) ||
4008426d15adSJosh Triplett 	    (test_opt(sb, NO_PREFETCH_BLOCK_BITMAPS) &&
4009426d15adSJosh Triplett 	     (first_not_zeroed == ngroups || !test_opt(sb, INIT_INODE_TABLE))))
40107f511862STheodore Ts'o 		goto out;
4011bfff6873SLukas Czerner 
4012bfff6873SLukas Czerner 	elr = ext4_li_request_new(sb, first_not_zeroed);
40137f511862STheodore Ts'o 	if (!elr) {
40147f511862STheodore Ts'o 		ret = -ENOMEM;
40157f511862STheodore Ts'o 		goto out;
40167f511862STheodore Ts'o 	}
4017bfff6873SLukas Czerner 
4018bfff6873SLukas Czerner 	if (NULL == ext4_li_info) {
4019bfff6873SLukas Czerner 		ret = ext4_li_info_new();
4020bfff6873SLukas Czerner 		if (ret)
4021bfff6873SLukas Czerner 			goto out;
4022bfff6873SLukas Czerner 	}
4023bfff6873SLukas Czerner 
4024bfff6873SLukas Czerner 	mutex_lock(&ext4_li_info->li_list_mtx);
4025bfff6873SLukas Czerner 	list_add(&elr->lr_request, &ext4_li_info->li_request_list);
4026bfff6873SLukas Czerner 	mutex_unlock(&ext4_li_info->li_list_mtx);
4027bfff6873SLukas Czerner 
4028bfff6873SLukas Czerner 	sbi->s_li_request = elr;
402946e4690bSTao Ma 	/*
403046e4690bSTao Ma 	 * set elr to NULL here since it has been inserted to
403146e4690bSTao Ma 	 * the request_list and the removal and free of it is
403246e4690bSTao Ma 	 * handled by ext4_clear_request_list from now on.
403346e4690bSTao Ma 	 */
403446e4690bSTao Ma 	elr = NULL;
4035bfff6873SLukas Czerner 
4036bfff6873SLukas Czerner 	if (!(ext4_li_info->li_state & EXT4_LAZYINIT_RUNNING)) {
4037bfff6873SLukas Czerner 		ret = ext4_run_lazyinit_thread();
4038bfff6873SLukas Czerner 		if (ret)
4039bfff6873SLukas Czerner 			goto out;
4040bfff6873SLukas Czerner 	}
4041bfff6873SLukas Czerner out:
4042bfff6873SLukas Czerner 	mutex_unlock(&ext4_li_mtx);
4043beed5ecbSNicolas Kaiser 	if (ret)
4044bfff6873SLukas Czerner 		kfree(elr);
4045bfff6873SLukas Czerner 	return ret;
4046bfff6873SLukas Czerner }
4047bfff6873SLukas Czerner 
4048bfff6873SLukas Czerner /*
4049bfff6873SLukas Czerner  * We do not need to lock anything since this is called on
4050bfff6873SLukas Czerner  * module unload.
4051bfff6873SLukas Czerner  */
4052bfff6873SLukas Czerner static void ext4_destroy_lazyinit_thread(void)
4053bfff6873SLukas Czerner {
4054bfff6873SLukas Czerner 	/*
4055bfff6873SLukas Czerner 	 * If thread exited earlier
4056bfff6873SLukas Czerner 	 * there's nothing to be done.
4057bfff6873SLukas Czerner 	 */
40588f1f7453SEric Sandeen 	if (!ext4_li_info || !ext4_lazyinit_task)
4059bfff6873SLukas Czerner 		return;
4060bfff6873SLukas Czerner 
40618f1f7453SEric Sandeen 	kthread_stop(ext4_lazyinit_task);
4062bfff6873SLukas Czerner }
4063bfff6873SLukas Czerner 
406425ed6e8aSDarrick J. Wong static int set_journal_csum_feature_set(struct super_block *sb)
406525ed6e8aSDarrick J. Wong {
406625ed6e8aSDarrick J. Wong 	int ret = 1;
406725ed6e8aSDarrick J. Wong 	int compat, incompat;
406825ed6e8aSDarrick J. Wong 	struct ext4_sb_info *sbi = EXT4_SB(sb);
406925ed6e8aSDarrick J. Wong 
40709aa5d32bSDmitry Monakhov 	if (ext4_has_metadata_csum(sb)) {
4071db9ee220SDarrick J. Wong 		/* journal checksum v3 */
407225ed6e8aSDarrick J. Wong 		compat = 0;
4073db9ee220SDarrick J. Wong 		incompat = JBD2_FEATURE_INCOMPAT_CSUM_V3;
407425ed6e8aSDarrick J. Wong 	} else {
407525ed6e8aSDarrick J. Wong 		/* journal checksum v1 */
407625ed6e8aSDarrick J. Wong 		compat = JBD2_FEATURE_COMPAT_CHECKSUM;
407725ed6e8aSDarrick J. Wong 		incompat = 0;
407825ed6e8aSDarrick J. Wong 	}
407925ed6e8aSDarrick J. Wong 
4080feb8c6d3SDarrick J. Wong 	jbd2_journal_clear_features(sbi->s_journal,
4081feb8c6d3SDarrick J. Wong 			JBD2_FEATURE_COMPAT_CHECKSUM, 0,
4082feb8c6d3SDarrick J. Wong 			JBD2_FEATURE_INCOMPAT_CSUM_V3 |
4083feb8c6d3SDarrick J. Wong 			JBD2_FEATURE_INCOMPAT_CSUM_V2);
408425ed6e8aSDarrick J. Wong 	if (test_opt(sb, JOURNAL_ASYNC_COMMIT)) {
408525ed6e8aSDarrick J. Wong 		ret = jbd2_journal_set_features(sbi->s_journal,
408625ed6e8aSDarrick J. Wong 				compat, 0,
408725ed6e8aSDarrick J. Wong 				JBD2_FEATURE_INCOMPAT_ASYNC_COMMIT |
408825ed6e8aSDarrick J. Wong 				incompat);
408925ed6e8aSDarrick J. Wong 	} else if (test_opt(sb, JOURNAL_CHECKSUM)) {
409025ed6e8aSDarrick J. Wong 		ret = jbd2_journal_set_features(sbi->s_journal,
409125ed6e8aSDarrick J. Wong 				compat, 0,
409225ed6e8aSDarrick J. Wong 				incompat);
409325ed6e8aSDarrick J. Wong 		jbd2_journal_clear_features(sbi->s_journal, 0, 0,
409425ed6e8aSDarrick J. Wong 				JBD2_FEATURE_INCOMPAT_ASYNC_COMMIT);
409525ed6e8aSDarrick J. Wong 	} else {
4096feb8c6d3SDarrick J. Wong 		jbd2_journal_clear_features(sbi->s_journal, 0, 0,
4097feb8c6d3SDarrick J. Wong 				JBD2_FEATURE_INCOMPAT_ASYNC_COMMIT);
409825ed6e8aSDarrick J. Wong 	}
409925ed6e8aSDarrick J. Wong 
410025ed6e8aSDarrick J. Wong 	return ret;
410125ed6e8aSDarrick J. Wong }
410225ed6e8aSDarrick J. Wong 
4103952fc18eSTheodore Ts'o /*
4104952fc18eSTheodore Ts'o  * Note: calculating the overhead so we can be compatible with
4105952fc18eSTheodore Ts'o  * historical BSD practice is quite difficult in the face of
4106952fc18eSTheodore Ts'o  * clusters/bigalloc.  This is because multiple metadata blocks from
4107952fc18eSTheodore Ts'o  * different block group can end up in the same allocation cluster.
4108952fc18eSTheodore Ts'o  * Calculating the exact overhead in the face of clustered allocation
4109952fc18eSTheodore Ts'o  * requires either O(all block bitmaps) in memory or O(number of block
4110952fc18eSTheodore Ts'o  * groups**2) in time.  We will still calculate the superblock for
4111952fc18eSTheodore Ts'o  * older file systems --- and if we come across with a bigalloc file
4112952fc18eSTheodore Ts'o  * system with zero in s_overhead_clusters the estimate will be close to
4113952fc18eSTheodore Ts'o  * correct especially for very large cluster sizes --- but for newer
4114952fc18eSTheodore Ts'o  * file systems, it's better to calculate this figure once at mkfs
4115952fc18eSTheodore Ts'o  * time, and store it in the superblock.  If the superblock value is
4116952fc18eSTheodore Ts'o  * present (even for non-bigalloc file systems), we will use it.
4117952fc18eSTheodore Ts'o  */
4118952fc18eSTheodore Ts'o static int count_overhead(struct super_block *sb, ext4_group_t grp,
4119952fc18eSTheodore Ts'o 			  char *buf)
4120952fc18eSTheodore Ts'o {
4121952fc18eSTheodore Ts'o 	struct ext4_sb_info	*sbi = EXT4_SB(sb);
4122952fc18eSTheodore Ts'o 	struct ext4_group_desc	*gdp;
4123952fc18eSTheodore Ts'o 	ext4_fsblk_t		first_block, last_block, b;
4124952fc18eSTheodore Ts'o 	ext4_group_t		i, ngroups = ext4_get_groups_count(sb);
4125952fc18eSTheodore Ts'o 	int			s, j, count = 0;
412610b01ee9STheodore Ts'o 	int			has_super = ext4_bg_has_super(sb, grp);
4127952fc18eSTheodore Ts'o 
4128e2b911c5SDarrick J. Wong 	if (!ext4_has_feature_bigalloc(sb))
412910b01ee9STheodore Ts'o 		return (has_super + ext4_bg_num_gdb(sb, grp) +
413010b01ee9STheodore Ts'o 			(has_super ? le16_to_cpu(sbi->s_es->s_reserved_gdt_blocks) : 0) +
41310548bbb8STheodore Ts'o 			sbi->s_itb_per_group + 2);
41320548bbb8STheodore Ts'o 
4133952fc18eSTheodore Ts'o 	first_block = le32_to_cpu(sbi->s_es->s_first_data_block) +
4134952fc18eSTheodore Ts'o 		(grp * EXT4_BLOCKS_PER_GROUP(sb));
4135952fc18eSTheodore Ts'o 	last_block = first_block + EXT4_BLOCKS_PER_GROUP(sb) - 1;
4136952fc18eSTheodore Ts'o 	for (i = 0; i < ngroups; i++) {
4137952fc18eSTheodore Ts'o 		gdp = ext4_get_group_desc(sb, i, NULL);
4138952fc18eSTheodore Ts'o 		b = ext4_block_bitmap(sb, gdp);
4139952fc18eSTheodore Ts'o 		if (b >= first_block && b <= last_block) {
4140952fc18eSTheodore Ts'o 			ext4_set_bit(EXT4_B2C(sbi, b - first_block), buf);
4141952fc18eSTheodore Ts'o 			count++;
4142952fc18eSTheodore Ts'o 		}
4143952fc18eSTheodore Ts'o 		b = ext4_inode_bitmap(sb, gdp);
4144952fc18eSTheodore Ts'o 		if (b >= first_block && b <= last_block) {
4145952fc18eSTheodore Ts'o 			ext4_set_bit(EXT4_B2C(sbi, b - first_block), buf);
4146952fc18eSTheodore Ts'o 			count++;
4147952fc18eSTheodore Ts'o 		}
4148952fc18eSTheodore Ts'o 		b = ext4_inode_table(sb, gdp);
4149952fc18eSTheodore Ts'o 		if (b >= first_block && b + sbi->s_itb_per_group <= last_block)
4150952fc18eSTheodore Ts'o 			for (j = 0; j < sbi->s_itb_per_group; j++, b++) {
4151952fc18eSTheodore Ts'o 				int c = EXT4_B2C(sbi, b - first_block);
4152952fc18eSTheodore Ts'o 				ext4_set_bit(c, buf);
4153952fc18eSTheodore Ts'o 				count++;
4154952fc18eSTheodore Ts'o 			}
4155952fc18eSTheodore Ts'o 		if (i != grp)
4156952fc18eSTheodore Ts'o 			continue;
4157952fc18eSTheodore Ts'o 		s = 0;
4158952fc18eSTheodore Ts'o 		if (ext4_bg_has_super(sb, grp)) {
4159952fc18eSTheodore Ts'o 			ext4_set_bit(s++, buf);
4160952fc18eSTheodore Ts'o 			count++;
4161952fc18eSTheodore Ts'o 		}
4162c48ae41bSTheodore Ts'o 		j = ext4_bg_num_gdb(sb, grp);
4163c48ae41bSTheodore Ts'o 		if (s + j > EXT4_BLOCKS_PER_GROUP(sb)) {
4164c48ae41bSTheodore Ts'o 			ext4_error(sb, "Invalid number of block group "
4165c48ae41bSTheodore Ts'o 				   "descriptor blocks: %d", j);
4166c48ae41bSTheodore Ts'o 			j = EXT4_BLOCKS_PER_GROUP(sb) - s;
4167952fc18eSTheodore Ts'o 		}
4168c48ae41bSTheodore Ts'o 		count += j;
4169c48ae41bSTheodore Ts'o 		for (; j > 0; j--)
4170c48ae41bSTheodore Ts'o 			ext4_set_bit(EXT4_B2C(sbi, s++), buf);
4171952fc18eSTheodore Ts'o 	}
4172952fc18eSTheodore Ts'o 	if (!count)
4173952fc18eSTheodore Ts'o 		return 0;
4174952fc18eSTheodore Ts'o 	return EXT4_CLUSTERS_PER_GROUP(sb) -
4175952fc18eSTheodore Ts'o 		ext4_count_free(buf, EXT4_CLUSTERS_PER_GROUP(sb) / 8);
4176952fc18eSTheodore Ts'o }
4177952fc18eSTheodore Ts'o 
4178952fc18eSTheodore Ts'o /*
4179952fc18eSTheodore Ts'o  * Compute the overhead and stash it in sbi->s_overhead
4180952fc18eSTheodore Ts'o  */
4181952fc18eSTheodore Ts'o int ext4_calculate_overhead(struct super_block *sb)
4182952fc18eSTheodore Ts'o {
4183952fc18eSTheodore Ts'o 	struct ext4_sb_info *sbi = EXT4_SB(sb);
4184952fc18eSTheodore Ts'o 	struct ext4_super_block *es = sbi->s_es;
41853c816dedSEric Whitney 	struct inode *j_inode;
41863c816dedSEric Whitney 	unsigned int j_blocks, j_inum = le32_to_cpu(es->s_journal_inum);
4187952fc18eSTheodore Ts'o 	ext4_group_t i, ngroups = ext4_get_groups_count(sb);
4188952fc18eSTheodore Ts'o 	ext4_fsblk_t overhead = 0;
41894fdb5543SDmitry Monakhov 	char *buf = (char *) get_zeroed_page(GFP_NOFS);
4190952fc18eSTheodore Ts'o 
4191952fc18eSTheodore Ts'o 	if (!buf)
4192952fc18eSTheodore Ts'o 		return -ENOMEM;
4193952fc18eSTheodore Ts'o 
4194952fc18eSTheodore Ts'o 	/*
4195952fc18eSTheodore Ts'o 	 * Compute the overhead (FS structures).  This is constant
4196952fc18eSTheodore Ts'o 	 * for a given filesystem unless the number of block groups
4197952fc18eSTheodore Ts'o 	 * changes so we cache the previous value until it does.
4198952fc18eSTheodore Ts'o 	 */
4199952fc18eSTheodore Ts'o 
4200952fc18eSTheodore Ts'o 	/*
4201952fc18eSTheodore Ts'o 	 * All of the blocks before first_data_block are overhead
4202952fc18eSTheodore Ts'o 	 */
4203952fc18eSTheodore Ts'o 	overhead = EXT4_B2C(sbi, le32_to_cpu(es->s_first_data_block));
4204952fc18eSTheodore Ts'o 
4205952fc18eSTheodore Ts'o 	/*
4206952fc18eSTheodore Ts'o 	 * Add the overhead found in each block group
4207952fc18eSTheodore Ts'o 	 */
4208952fc18eSTheodore Ts'o 	for (i = 0; i < ngroups; i++) {
4209952fc18eSTheodore Ts'o 		int blks;
4210952fc18eSTheodore Ts'o 
4211952fc18eSTheodore Ts'o 		blks = count_overhead(sb, i, buf);
4212952fc18eSTheodore Ts'o 		overhead += blks;
4213952fc18eSTheodore Ts'o 		if (blks)
4214952fc18eSTheodore Ts'o 			memset(buf, 0, PAGE_SIZE);
4215952fc18eSTheodore Ts'o 		cond_resched();
4216952fc18eSTheodore Ts'o 	}
42173c816dedSEric Whitney 
42183c816dedSEric Whitney 	/*
42193c816dedSEric Whitney 	 * Add the internal journal blocks whether the journal has been
42203c816dedSEric Whitney 	 * loaded or not
42213c816dedSEric Whitney 	 */
4222ee7ed3aaSChunguang Xu 	if (sbi->s_journal && !sbi->s_journal_bdev)
4223ede7dc7fSHarshad Shirwadkar 		overhead += EXT4_NUM_B2C(sbi, sbi->s_journal->j_total_len);
4224f1eec3b0SRitesh Harjani 	else if (ext4_has_feature_journal(sb) && !sbi->s_journal && j_inum) {
4225f1eec3b0SRitesh Harjani 		/* j_inum for internal journal is non-zero */
42263c816dedSEric Whitney 		j_inode = ext4_get_journal_inode(sb, j_inum);
42273c816dedSEric Whitney 		if (j_inode) {
42283c816dedSEric Whitney 			j_blocks = j_inode->i_size >> sb->s_blocksize_bits;
42293c816dedSEric Whitney 			overhead += EXT4_NUM_B2C(sbi, j_blocks);
42303c816dedSEric Whitney 			iput(j_inode);
42313c816dedSEric Whitney 		} else {
42323c816dedSEric Whitney 			ext4_msg(sb, KERN_ERR, "can't get journal size");
42333c816dedSEric Whitney 		}
42343c816dedSEric Whitney 	}
4235952fc18eSTheodore Ts'o 	sbi->s_overhead = overhead;
4236952fc18eSTheodore Ts'o 	smp_wmb();
4237952fc18eSTheodore Ts'o 	free_page((unsigned long) buf);
4238952fc18eSTheodore Ts'o 	return 0;
4239952fc18eSTheodore Ts'o }
4240952fc18eSTheodore Ts'o 
4241b5799018STheodore Ts'o static void ext4_set_resv_clusters(struct super_block *sb)
424227dd4385SLukas Czerner {
424327dd4385SLukas Czerner 	ext4_fsblk_t resv_clusters;
4244b5799018STheodore Ts'o 	struct ext4_sb_info *sbi = EXT4_SB(sb);
424527dd4385SLukas Czerner 
424627dd4385SLukas Czerner 	/*
424730fac0f7SJan Kara 	 * There's no need to reserve anything when we aren't using extents.
424830fac0f7SJan Kara 	 * The space estimates are exact, there are no unwritten extents,
424930fac0f7SJan Kara 	 * hole punching doesn't need new metadata... This is needed especially
425030fac0f7SJan Kara 	 * to keep ext2/3 backward compatibility.
425130fac0f7SJan Kara 	 */
4252e2b911c5SDarrick J. Wong 	if (!ext4_has_feature_extents(sb))
4253b5799018STheodore Ts'o 		return;
425430fac0f7SJan Kara 	/*
425527dd4385SLukas Czerner 	 * By default we reserve 2% or 4096 clusters, whichever is smaller.
425627dd4385SLukas Czerner 	 * This should cover the situations where we can not afford to run
425727dd4385SLukas Czerner 	 * out of space like for example punch hole, or converting
4258556615dcSLukas Czerner 	 * unwritten extents in delalloc path. In most cases such
425927dd4385SLukas Czerner 	 * allocation would require 1, or 2 blocks, higher numbers are
426027dd4385SLukas Czerner 	 * very rare.
426127dd4385SLukas Czerner 	 */
4262b5799018STheodore Ts'o 	resv_clusters = (ext4_blocks_count(sbi->s_es) >>
4263b5799018STheodore Ts'o 			 sbi->s_cluster_bits);
426427dd4385SLukas Czerner 
426527dd4385SLukas Czerner 	do_div(resv_clusters, 50);
426627dd4385SLukas Czerner 	resv_clusters = min_t(ext4_fsblk_t, resv_clusters, 4096);
426727dd4385SLukas Czerner 
4268b5799018STheodore Ts'o 	atomic64_set(&sbi->s_resv_clusters, resv_clusters);
426927dd4385SLukas Czerner }
427027dd4385SLukas Czerner 
/*
 * Return a short constant string naming the quota mode of @sb:
 * "disabled" when the kernel is built without CONFIG_QUOTA, "none" when
 * the file system is not quota capable, "journalled" when a journal is
 * present and quota is journalled, and "writeback" otherwise.
 */
static const char *ext4_quota_mode(struct super_block *sb)
{
#ifdef CONFIG_QUOTA
	if (!ext4_quota_capable(sb))
		return "none";

	return (EXT4_SB(sb)->s_journal && ext4_is_quota_journalled(sb)) ?
		"journalled" : "writeback";
#else
	return "disabled";
#endif
}
4285ca9b404fSRoman Anufriev 
4286188c299eSJan Kara static void ext4_setup_csum_trigger(struct super_block *sb,
4287188c299eSJan Kara 				    enum ext4_journal_trigger_type type,
4288188c299eSJan Kara 				    void (*trigger)(
4289188c299eSJan Kara 					struct jbd2_buffer_trigger_type *type,
4290188c299eSJan Kara 					struct buffer_head *bh,
4291188c299eSJan Kara 					void *mapped_data,
4292188c299eSJan Kara 					size_t size))
4293188c299eSJan Kara {
4294188c299eSJan Kara 	struct ext4_sb_info *sbi = EXT4_SB(sb);
4295188c299eSJan Kara 
4296188c299eSJan Kara 	sbi->s_journal_triggers[type].sb = sb;
4297188c299eSJan Kara 	sbi->s_journal_triggers[type].tr_triggers.t_frozen = trigger;
4298188c299eSJan Kara }
4299188c299eSJan Kara 
43007edfd85bSLukas Czerner static void ext4_free_sbi(struct ext4_sb_info *sbi)
4301ac27a0ecSDave Kleikamp {
43027edfd85bSLukas Czerner 	if (!sbi)
43037edfd85bSLukas Czerner 		return;
43047edfd85bSLukas Czerner 
43057edfd85bSLukas Czerner 	kfree(sbi->s_blockgroup_lock);
43068012b866SShiyang Ruan 	fs_put_dax(sbi->s_daxdev, NULL);
43077edfd85bSLukas Czerner 	kfree(sbi);
43087edfd85bSLukas Czerner }
43097edfd85bSLukas Czerner 
43107edfd85bSLukas Czerner static struct ext4_sb_info *ext4_alloc_sbi(struct super_block *sb)
43117edfd85bSLukas Czerner {
43127edfd85bSLukas Czerner 	struct ext4_sb_info *sbi;
43137edfd85bSLukas Czerner 
43147edfd85bSLukas Czerner 	sbi = kzalloc(sizeof(*sbi), GFP_KERNEL);
43157edfd85bSLukas Czerner 	if (!sbi)
43167edfd85bSLukas Czerner 		return NULL;
43177edfd85bSLukas Czerner 
43188012b866SShiyang Ruan 	sbi->s_daxdev = fs_dax_get_by_bdev(sb->s_bdev, &sbi->s_dax_part_off,
43198012b866SShiyang Ruan 					   NULL, NULL);
43207edfd85bSLukas Czerner 
43217edfd85bSLukas Czerner 	sbi->s_blockgroup_lock =
43227edfd85bSLukas Czerner 		kzalloc(sizeof(struct blockgroup_lock), GFP_KERNEL);
43237edfd85bSLukas Czerner 
43247edfd85bSLukas Czerner 	if (!sbi->s_blockgroup_lock)
43257edfd85bSLukas Czerner 		goto err_out;
43267edfd85bSLukas Czerner 
43277edfd85bSLukas Czerner 	sb->s_fs_info = sbi;
43287edfd85bSLukas Czerner 	sbi->s_sb = sb;
43297edfd85bSLukas Czerner 	return sbi;
43307edfd85bSLukas Czerner err_out:
43318012b866SShiyang Ruan 	fs_put_dax(sbi->s_daxdev, NULL);
43327edfd85bSLukas Czerner 	kfree(sbi);
43337edfd85bSLukas Czerner 	return NULL;
43347edfd85bSLukas Czerner }
43357edfd85bSLukas Czerner 
43365f6d662dSJason Yan static void ext4_set_def_opts(struct super_block *sb,
43375f6d662dSJason Yan 			      struct ext4_super_block *es)
43385f6d662dSJason Yan {
43395f6d662dSJason Yan 	unsigned long def_mount_opts;
43405f6d662dSJason Yan 
43415f6d662dSJason Yan 	/* Set defaults before we parse the mount options */
43425f6d662dSJason Yan 	def_mount_opts = le32_to_cpu(es->s_default_mount_opts);
43435f6d662dSJason Yan 	set_opt(sb, INIT_INODE_TABLE);
43445f6d662dSJason Yan 	if (def_mount_opts & EXT4_DEFM_DEBUG)
43455f6d662dSJason Yan 		set_opt(sb, DEBUG);
43465f6d662dSJason Yan 	if (def_mount_opts & EXT4_DEFM_BSDGROUPS)
43475f6d662dSJason Yan 		set_opt(sb, GRPID);
43485f6d662dSJason Yan 	if (def_mount_opts & EXT4_DEFM_UID16)
43495f6d662dSJason Yan 		set_opt(sb, NO_UID32);
43505f6d662dSJason Yan 	/* xattr user namespace & acls are now defaulted on */
43515f6d662dSJason Yan 	set_opt(sb, XATTR_USER);
43525f6d662dSJason Yan #ifdef CONFIG_EXT4_FS_POSIX_ACL
43535f6d662dSJason Yan 	set_opt(sb, POSIX_ACL);
43545f6d662dSJason Yan #endif
43555f6d662dSJason Yan 	if (ext4_has_feature_fast_commit(sb))
43565f6d662dSJason Yan 		set_opt2(sb, JOURNAL_FAST_COMMIT);
43575f6d662dSJason Yan 	/* don't forget to enable journal_csum when metadata_csum is enabled. */
43585f6d662dSJason Yan 	if (ext4_has_metadata_csum(sb))
43595f6d662dSJason Yan 		set_opt(sb, JOURNAL_CHECKSUM);
43605f6d662dSJason Yan 
43615f6d662dSJason Yan 	if ((def_mount_opts & EXT4_DEFM_JMODE) == EXT4_DEFM_JMODE_DATA)
43625f6d662dSJason Yan 		set_opt(sb, JOURNAL_DATA);
43635f6d662dSJason Yan 	else if ((def_mount_opts & EXT4_DEFM_JMODE) == EXT4_DEFM_JMODE_ORDERED)
43645f6d662dSJason Yan 		set_opt(sb, ORDERED_DATA);
43655f6d662dSJason Yan 	else if ((def_mount_opts & EXT4_DEFM_JMODE) == EXT4_DEFM_JMODE_WBACK)
43665f6d662dSJason Yan 		set_opt(sb, WRITEBACK_DATA);
43675f6d662dSJason Yan 
43685f6d662dSJason Yan 	if (le16_to_cpu(es->s_errors) == EXT4_ERRORS_PANIC)
43695f6d662dSJason Yan 		set_opt(sb, ERRORS_PANIC);
43705f6d662dSJason Yan 	else if (le16_to_cpu(es->s_errors) == EXT4_ERRORS_CONTINUE)
43715f6d662dSJason Yan 		set_opt(sb, ERRORS_CONT);
43725f6d662dSJason Yan 	else
43735f6d662dSJason Yan 		set_opt(sb, ERRORS_RO);
43745f6d662dSJason Yan 	/* block_validity enabled by default; disable with noblock_validity */
43755f6d662dSJason Yan 	set_opt(sb, BLOCK_VALIDITY);
43765f6d662dSJason Yan 	if (def_mount_opts & EXT4_DEFM_DISCARD)
43775f6d662dSJason Yan 		set_opt(sb, DISCARD);
43785f6d662dSJason Yan 
43795f6d662dSJason Yan 	if ((def_mount_opts & EXT4_DEFM_NOBARRIER) == 0)
43805f6d662dSJason Yan 		set_opt(sb, BARRIER);
43815f6d662dSJason Yan 
43825f6d662dSJason Yan 	/*
43835f6d662dSJason Yan 	 * enable delayed allocation by default
43845f6d662dSJason Yan 	 * Use -o nodelalloc to turn it off
43855f6d662dSJason Yan 	 */
43865f6d662dSJason Yan 	if (!IS_EXT3_SB(sb) && !IS_EXT2_SB(sb) &&
43875f6d662dSJason Yan 	    ((def_mount_opts & EXT4_DEFM_NODELALLOC) == 0))
43885f6d662dSJason Yan 		set_opt(sb, DELALLOC);
43893df11e27SJason Yan 
43903df11e27SJason Yan 	if (sb->s_blocksize == PAGE_SIZE)
43913df11e27SJason Yan 		set_opt(sb, DIOREAD_NOLOCK);
43925f6d662dSJason Yan }
43935f6d662dSJason Yan 
4394c8267c51SJason Yan static int ext4_handle_clustersize(struct super_block *sb)
43954a8557b0SJason Yan {
43964a8557b0SJason Yan 	struct ext4_sb_info *sbi = EXT4_SB(sb);
43974a8557b0SJason Yan 	struct ext4_super_block *es = sbi->s_es;
43984a8557b0SJason Yan 	int clustersize;
43994a8557b0SJason Yan 
44004a8557b0SJason Yan 	/* Handle clustersize */
44014a8557b0SJason Yan 	clustersize = BLOCK_SIZE << le32_to_cpu(es->s_log_cluster_size);
44024a8557b0SJason Yan 	if (ext4_has_feature_bigalloc(sb)) {
4403c8267c51SJason Yan 		if (clustersize < sb->s_blocksize) {
44044a8557b0SJason Yan 			ext4_msg(sb, KERN_ERR,
44054a8557b0SJason Yan 				 "cluster size (%d) smaller than "
4406c8267c51SJason Yan 				 "block size (%lu)", clustersize, sb->s_blocksize);
44074a8557b0SJason Yan 			return -EINVAL;
44084a8557b0SJason Yan 		}
44094a8557b0SJason Yan 		sbi->s_cluster_bits = le32_to_cpu(es->s_log_cluster_size) -
44104a8557b0SJason Yan 			le32_to_cpu(es->s_log_block_size);
44114a8557b0SJason Yan 		sbi->s_clusters_per_group =
44124a8557b0SJason Yan 			le32_to_cpu(es->s_clusters_per_group);
4413c8267c51SJason Yan 		if (sbi->s_clusters_per_group > sb->s_blocksize * 8) {
44144a8557b0SJason Yan 			ext4_msg(sb, KERN_ERR,
44154a8557b0SJason Yan 				 "#clusters per group too big: %lu",
44164a8557b0SJason Yan 				 sbi->s_clusters_per_group);
44174a8557b0SJason Yan 			return -EINVAL;
44184a8557b0SJason Yan 		}
44194a8557b0SJason Yan 		if (sbi->s_blocks_per_group !=
4420c8267c51SJason Yan 		    (sbi->s_clusters_per_group * (clustersize / sb->s_blocksize))) {
44214a8557b0SJason Yan 			ext4_msg(sb, KERN_ERR, "blocks per group (%lu) and "
44224a8557b0SJason Yan 				 "clusters per group (%lu) inconsistent",
44234a8557b0SJason Yan 				 sbi->s_blocks_per_group,
44244a8557b0SJason Yan 				 sbi->s_clusters_per_group);
44254a8557b0SJason Yan 			return -EINVAL;
44264a8557b0SJason Yan 		}
44274a8557b0SJason Yan 	} else {
4428c8267c51SJason Yan 		if (clustersize != sb->s_blocksize) {
44294a8557b0SJason Yan 			ext4_msg(sb, KERN_ERR,
44304a8557b0SJason Yan 				 "fragment/cluster size (%d) != "
4431c8267c51SJason Yan 				 "block size (%lu)", clustersize, sb->s_blocksize);
44324a8557b0SJason Yan 			return -EINVAL;
44334a8557b0SJason Yan 		}
4434c8267c51SJason Yan 		if (sbi->s_blocks_per_group > sb->s_blocksize * 8) {
44354a8557b0SJason Yan 			ext4_msg(sb, KERN_ERR,
44364a8557b0SJason Yan 				 "#blocks per group too big: %lu",
44374a8557b0SJason Yan 				 sbi->s_blocks_per_group);
44384a8557b0SJason Yan 			return -EINVAL;
44394a8557b0SJason Yan 		}
44404a8557b0SJason Yan 		sbi->s_clusters_per_group = sbi->s_blocks_per_group;
44414a8557b0SJason Yan 		sbi->s_cluster_bits = 0;
44424a8557b0SJason Yan 	}
4443c8267c51SJason Yan 	sbi->s_cluster_ratio = clustersize / sb->s_blocksize;
44444a8557b0SJason Yan 
44454a8557b0SJason Yan 	/* Do we have standard group size of clustersize * 8 blocks ? */
44464a8557b0SJason Yan 	if (sbi->s_blocks_per_group == clustersize << 3)
44474a8557b0SJason Yan 		set_opt2(sb, STD_GROUP_SIZE);
44484a8557b0SJason Yan 
44494a8557b0SJason Yan 	return 0;
44504a8557b0SJason Yan }
44514a8557b0SJason Yan 
4452f7314a67SJason Yan static void ext4_fast_commit_init(struct super_block *sb)
4453f7314a67SJason Yan {
4454f7314a67SJason Yan 	struct ext4_sb_info *sbi = EXT4_SB(sb);
4455f7314a67SJason Yan 
4456f7314a67SJason Yan 	/* Initialize fast commit stuff */
4457f7314a67SJason Yan 	atomic_set(&sbi->s_fc_subtid, 0);
4458f7314a67SJason Yan 	INIT_LIST_HEAD(&sbi->s_fc_q[FC_Q_MAIN]);
4459f7314a67SJason Yan 	INIT_LIST_HEAD(&sbi->s_fc_q[FC_Q_STAGING]);
4460f7314a67SJason Yan 	INIT_LIST_HEAD(&sbi->s_fc_dentry_q[FC_Q_MAIN]);
4461f7314a67SJason Yan 	INIT_LIST_HEAD(&sbi->s_fc_dentry_q[FC_Q_STAGING]);
4462f7314a67SJason Yan 	sbi->s_fc_bytes = 0;
4463f7314a67SJason Yan 	ext4_clear_mount_flag(sb, EXT4_MF_FC_INELIGIBLE);
4464f7314a67SJason Yan 	sbi->s_fc_ineligible_tid = 0;
4465f7314a67SJason Yan 	spin_lock_init(&sbi->s_fc_lock);
4466f7314a67SJason Yan 	memset(&sbi->s_fc_stats, 0, sizeof(sbi->s_fc_stats));
4467f7314a67SJason Yan 	sbi->s_fc_replay_state.fc_regions = NULL;
4468f7314a67SJason Yan 	sbi->s_fc_replay_state.fc_regions_size = 0;
4469f7314a67SJason Yan 	sbi->s_fc_replay_state.fc_regions_used = 0;
4470f7314a67SJason Yan 	sbi->s_fc_replay_state.fc_regions_valid = 0;
4471f7314a67SJason Yan 	sbi->s_fc_replay_state.fc_modified_inodes = NULL;
4472f7314a67SJason Yan 	sbi->s_fc_replay_state.fc_modified_inodes_size = 0;
4473f7314a67SJason Yan 	sbi->s_fc_replay_state.fc_modified_inodes_used = 0;
4474f7314a67SJason Yan }
4475f7314a67SJason Yan 
44760e495f7cSJason Yan static int ext4_inode_info_init(struct super_block *sb,
4477c8267c51SJason Yan 				struct ext4_super_block *es)
44780e495f7cSJason Yan {
44790e495f7cSJason Yan 	struct ext4_sb_info *sbi = EXT4_SB(sb);
44800e495f7cSJason Yan 
44810e495f7cSJason Yan 	if (le32_to_cpu(es->s_rev_level) == EXT4_GOOD_OLD_REV) {
44820e495f7cSJason Yan 		sbi->s_inode_size = EXT4_GOOD_OLD_INODE_SIZE;
44830e495f7cSJason Yan 		sbi->s_first_ino = EXT4_GOOD_OLD_FIRST_INO;
44840e495f7cSJason Yan 	} else {
44850e495f7cSJason Yan 		sbi->s_inode_size = le16_to_cpu(es->s_inode_size);
44860e495f7cSJason Yan 		sbi->s_first_ino = le32_to_cpu(es->s_first_ino);
44870e495f7cSJason Yan 		if (sbi->s_first_ino < EXT4_GOOD_OLD_FIRST_INO) {
44880e495f7cSJason Yan 			ext4_msg(sb, KERN_ERR, "invalid first ino: %u",
44890e495f7cSJason Yan 				 sbi->s_first_ino);
44900e495f7cSJason Yan 			return -EINVAL;
44910e495f7cSJason Yan 		}
44920e495f7cSJason Yan 		if ((sbi->s_inode_size < EXT4_GOOD_OLD_INODE_SIZE) ||
44930e495f7cSJason Yan 		    (!is_power_of_2(sbi->s_inode_size)) ||
4494c8267c51SJason Yan 		    (sbi->s_inode_size > sb->s_blocksize)) {
44950e495f7cSJason Yan 			ext4_msg(sb, KERN_ERR,
44960e495f7cSJason Yan 			       "unsupported inode size: %d",
44970e495f7cSJason Yan 			       sbi->s_inode_size);
4498c8267c51SJason Yan 			ext4_msg(sb, KERN_ERR, "blocksize: %lu", sb->s_blocksize);
44990e495f7cSJason Yan 			return -EINVAL;
45000e495f7cSJason Yan 		}
45010e495f7cSJason Yan 		/*
45020e495f7cSJason Yan 		 * i_atime_extra is the last extra field available for
45030e495f7cSJason Yan 		 * [acm]times in struct ext4_inode. Checking for that
45040e495f7cSJason Yan 		 * field should suffice to ensure we have extra space
45050e495f7cSJason Yan 		 * for all three.
45060e495f7cSJason Yan 		 */
45070e495f7cSJason Yan 		if (sbi->s_inode_size >= offsetof(struct ext4_inode, i_atime_extra) +
45080e495f7cSJason Yan 			sizeof(((struct ext4_inode *)0)->i_atime_extra)) {
45090e495f7cSJason Yan 			sb->s_time_gran = 1;
45100e495f7cSJason Yan 			sb->s_time_max = EXT4_EXTRA_TIMESTAMP_MAX;
45110e495f7cSJason Yan 		} else {
45120e495f7cSJason Yan 			sb->s_time_gran = NSEC_PER_SEC;
45130e495f7cSJason Yan 			sb->s_time_max = EXT4_NON_EXTRA_TIMESTAMP_MAX;
45140e495f7cSJason Yan 		}
45150e495f7cSJason Yan 		sb->s_time_min = EXT4_TIMESTAMP_MIN;
45160e495f7cSJason Yan 	}
45170e495f7cSJason Yan 
45180e495f7cSJason Yan 	if (sbi->s_inode_size > EXT4_GOOD_OLD_INODE_SIZE) {
45190e495f7cSJason Yan 		sbi->s_want_extra_isize = sizeof(struct ext4_inode) -
45200e495f7cSJason Yan 			EXT4_GOOD_OLD_INODE_SIZE;
45210e495f7cSJason Yan 		if (ext4_has_feature_extra_isize(sb)) {
45220e495f7cSJason Yan 			unsigned v, max = (sbi->s_inode_size -
45230e495f7cSJason Yan 					   EXT4_GOOD_OLD_INODE_SIZE);
45240e495f7cSJason Yan 
45250e495f7cSJason Yan 			v = le16_to_cpu(es->s_want_extra_isize);
45260e495f7cSJason Yan 			if (v > max) {
45270e495f7cSJason Yan 				ext4_msg(sb, KERN_ERR,
45280e495f7cSJason Yan 					 "bad s_want_extra_isize: %d", v);
45290e495f7cSJason Yan 				return -EINVAL;
45300e495f7cSJason Yan 			}
45310e495f7cSJason Yan 			if (sbi->s_want_extra_isize < v)
45320e495f7cSJason Yan 				sbi->s_want_extra_isize = v;
45330e495f7cSJason Yan 
45340e495f7cSJason Yan 			v = le16_to_cpu(es->s_min_extra_isize);
45350e495f7cSJason Yan 			if (v > max) {
45360e495f7cSJason Yan 				ext4_msg(sb, KERN_ERR,
45370e495f7cSJason Yan 					 "bad s_min_extra_isize: %d", v);
45380e495f7cSJason Yan 				return -EINVAL;
45390e495f7cSJason Yan 			}
45400e495f7cSJason Yan 			if (sbi->s_want_extra_isize < v)
45410e495f7cSJason Yan 				sbi->s_want_extra_isize = v;
45420e495f7cSJason Yan 		}
45430e495f7cSJason Yan 	}
45440e495f7cSJason Yan 
45450e495f7cSJason Yan 	return 0;
45460e495f7cSJason Yan }
45470e495f7cSJason Yan 
454839c135b0SJason Yan #if IS_ENABLED(CONFIG_UNICODE)
454939c135b0SJason Yan static int ext4_encoding_init(struct super_block *sb, struct ext4_super_block *es)
455039c135b0SJason Yan {
455139c135b0SJason Yan 	const struct ext4_sb_encodings *encoding_info;
455239c135b0SJason Yan 	struct unicode_map *encoding;
455339c135b0SJason Yan 	__u16 encoding_flags = le16_to_cpu(es->s_encoding_flags);
455439c135b0SJason Yan 
455539c135b0SJason Yan 	if (!ext4_has_feature_casefold(sb) || sb->s_encoding)
455639c135b0SJason Yan 		return 0;
455739c135b0SJason Yan 
455839c135b0SJason Yan 	encoding_info = ext4_sb_read_encoding(es);
455939c135b0SJason Yan 	if (!encoding_info) {
456039c135b0SJason Yan 		ext4_msg(sb, KERN_ERR,
456139c135b0SJason Yan 			"Encoding requested by superblock is unknown");
456239c135b0SJason Yan 		return -EINVAL;
456339c135b0SJason Yan 	}
456439c135b0SJason Yan 
456539c135b0SJason Yan 	encoding = utf8_load(encoding_info->version);
456639c135b0SJason Yan 	if (IS_ERR(encoding)) {
456739c135b0SJason Yan 		ext4_msg(sb, KERN_ERR,
456839c135b0SJason Yan 			"can't mount with superblock charset: %s-%u.%u.%u "
456939c135b0SJason Yan 			"not supported by the kernel. flags: 0x%x.",
457039c135b0SJason Yan 			encoding_info->name,
457139c135b0SJason Yan 			unicode_major(encoding_info->version),
457239c135b0SJason Yan 			unicode_minor(encoding_info->version),
457339c135b0SJason Yan 			unicode_rev(encoding_info->version),
457439c135b0SJason Yan 			encoding_flags);
457539c135b0SJason Yan 		return -EINVAL;
457639c135b0SJason Yan 	}
457739c135b0SJason Yan 	ext4_msg(sb, KERN_INFO,"Using encoding defined by superblock: "
457839c135b0SJason Yan 		"%s-%u.%u.%u with flags 0x%hx", encoding_info->name,
457939c135b0SJason Yan 		unicode_major(encoding_info->version),
458039c135b0SJason Yan 		unicode_minor(encoding_info->version),
458139c135b0SJason Yan 		unicode_rev(encoding_info->version),
458239c135b0SJason Yan 		encoding_flags);
458339c135b0SJason Yan 
458439c135b0SJason Yan 	sb->s_encoding = encoding;
458539c135b0SJason Yan 	sb->s_encoding_flags = encoding_flags;
458639c135b0SJason Yan 
458739c135b0SJason Yan 	return 0;
458839c135b0SJason Yan }
458939c135b0SJason Yan #else
459039c135b0SJason Yan static inline int ext4_encoding_init(struct super_block *sb, struct ext4_super_block *es)
459139c135b0SJason Yan {
459239c135b0SJason Yan 	return 0;
459339c135b0SJason Yan }
459439c135b0SJason Yan #endif
459539c135b0SJason Yan 
4596b26458d1SJason Yan static int ext4_init_metadata_csum(struct super_block *sb, struct ext4_super_block *es)
4597b26458d1SJason Yan {
4598b26458d1SJason Yan 	struct ext4_sb_info *sbi = EXT4_SB(sb);
4599b26458d1SJason Yan 
4600b26458d1SJason Yan 	/* Warn if metadata_csum and gdt_csum are both set. */
4601b26458d1SJason Yan 	if (ext4_has_feature_metadata_csum(sb) &&
4602b26458d1SJason Yan 	    ext4_has_feature_gdt_csum(sb))
4603b26458d1SJason Yan 		ext4_warning(sb, "metadata_csum and uninit_bg are "
4604b26458d1SJason Yan 			     "redundant flags; please run fsck.");
4605b26458d1SJason Yan 
4606b26458d1SJason Yan 	/* Check for a known checksum algorithm */
4607b26458d1SJason Yan 	if (!ext4_verify_csum_type(sb, es)) {
4608b26458d1SJason Yan 		ext4_msg(sb, KERN_ERR, "VFS: Found ext4 filesystem with "
4609b26458d1SJason Yan 			 "unknown checksum algorithm.");
4610b26458d1SJason Yan 		return -EINVAL;
4611b26458d1SJason Yan 	}
4612b26458d1SJason Yan 	ext4_setup_csum_trigger(sb, EXT4_JTR_ORPHAN_FILE,
4613b26458d1SJason Yan 				ext4_orphan_file_block_trigger);
4614b26458d1SJason Yan 
4615b26458d1SJason Yan 	/* Load the checksum driver */
4616b26458d1SJason Yan 	sbi->s_chksum_driver = crypto_alloc_shash("crc32c", 0, 0);
4617b26458d1SJason Yan 	if (IS_ERR(sbi->s_chksum_driver)) {
4618b26458d1SJason Yan 		int ret = PTR_ERR(sbi->s_chksum_driver);
4619b26458d1SJason Yan 		ext4_msg(sb, KERN_ERR, "Cannot load crc32c driver.");
4620b26458d1SJason Yan 		sbi->s_chksum_driver = NULL;
4621b26458d1SJason Yan 		return ret;
4622b26458d1SJason Yan 	}
4623b26458d1SJason Yan 
4624b26458d1SJason Yan 	/* Check superblock checksum */
4625b26458d1SJason Yan 	if (!ext4_superblock_csum_verify(sb, es)) {
4626b26458d1SJason Yan 		ext4_msg(sb, KERN_ERR, "VFS: Found ext4 filesystem with "
4627b26458d1SJason Yan 			 "invalid superblock checksum.  Run e2fsck?");
4628b26458d1SJason Yan 		return -EFSBADCRC;
4629b26458d1SJason Yan 	}
4630b26458d1SJason Yan 
4631b26458d1SJason Yan 	/* Precompute checksum seed for all metadata */
4632b26458d1SJason Yan 	if (ext4_has_feature_csum_seed(sb))
4633b26458d1SJason Yan 		sbi->s_csum_seed = le32_to_cpu(es->s_checksum_seed);
4634b26458d1SJason Yan 	else if (ext4_has_metadata_csum(sb) || ext4_has_feature_ea_inode(sb))
4635b26458d1SJason Yan 		sbi->s_csum_seed = ext4_chksum(sbi, ~0, es->s_uuid,
4636b26458d1SJason Yan 					       sizeof(es->s_uuid));
4637b26458d1SJason Yan 	return 0;
4638b26458d1SJason Yan }
4639b26458d1SJason Yan 
4640d7f3542bSJason Yan static int ext4_check_feature_compatibility(struct super_block *sb,
4641d7f3542bSJason Yan 					    struct ext4_super_block *es,
4642d7f3542bSJason Yan 					    int silent)
4643d7f3542bSJason Yan {
4644*54902099SJason Yan 	struct ext4_sb_info *sbi = EXT4_SB(sb);
4645*54902099SJason Yan 
4646d7f3542bSJason Yan 	if (le32_to_cpu(es->s_rev_level) == EXT4_GOOD_OLD_REV &&
4647d7f3542bSJason Yan 	    (ext4_has_compat_features(sb) ||
4648d7f3542bSJason Yan 	     ext4_has_ro_compat_features(sb) ||
4649d7f3542bSJason Yan 	     ext4_has_incompat_features(sb)))
4650d7f3542bSJason Yan 		ext4_msg(sb, KERN_WARNING,
4651d7f3542bSJason Yan 		       "feature flags set on rev 0 fs, "
4652d7f3542bSJason Yan 		       "running e2fsck is recommended");
4653d7f3542bSJason Yan 
4654d7f3542bSJason Yan 	if (es->s_creator_os == cpu_to_le32(EXT4_OS_HURD)) {
4655d7f3542bSJason Yan 		set_opt2(sb, HURD_COMPAT);
4656d7f3542bSJason Yan 		if (ext4_has_feature_64bit(sb)) {
4657d7f3542bSJason Yan 			ext4_msg(sb, KERN_ERR,
4658d7f3542bSJason Yan 				 "The Hurd can't support 64-bit file systems");
4659d7f3542bSJason Yan 			return -EINVAL;
4660d7f3542bSJason Yan 		}
4661d7f3542bSJason Yan 
4662d7f3542bSJason Yan 		/*
4663d7f3542bSJason Yan 		 * ea_inode feature uses l_i_version field which is not
4664d7f3542bSJason Yan 		 * available in HURD_COMPAT mode.
4665d7f3542bSJason Yan 		 */
4666d7f3542bSJason Yan 		if (ext4_has_feature_ea_inode(sb)) {
4667d7f3542bSJason Yan 			ext4_msg(sb, KERN_ERR,
4668d7f3542bSJason Yan 				 "ea_inode feature is not supported for Hurd");
4669d7f3542bSJason Yan 			return -EINVAL;
4670d7f3542bSJason Yan 		}
4671d7f3542bSJason Yan 	}
4672d7f3542bSJason Yan 
4673d7f3542bSJason Yan 	if (IS_EXT2_SB(sb)) {
4674d7f3542bSJason Yan 		if (ext2_feature_set_ok(sb))
4675d7f3542bSJason Yan 			ext4_msg(sb, KERN_INFO, "mounting ext2 file system "
4676d7f3542bSJason Yan 				 "using the ext4 subsystem");
4677d7f3542bSJason Yan 		else {
4678d7f3542bSJason Yan 			/*
4679d7f3542bSJason Yan 			 * If we're probing be silent, if this looks like
4680d7f3542bSJason Yan 			 * it's actually an ext[34] filesystem.
4681d7f3542bSJason Yan 			 */
4682d7f3542bSJason Yan 			if (silent && ext4_feature_set_ok(sb, sb_rdonly(sb)))
4683d7f3542bSJason Yan 				return -EINVAL;
4684d7f3542bSJason Yan 			ext4_msg(sb, KERN_ERR, "couldn't mount as ext2 due "
4685d7f3542bSJason Yan 				 "to feature incompatibilities");
4686d7f3542bSJason Yan 			return -EINVAL;
4687d7f3542bSJason Yan 		}
4688d7f3542bSJason Yan 	}
4689d7f3542bSJason Yan 
4690d7f3542bSJason Yan 	if (IS_EXT3_SB(sb)) {
4691d7f3542bSJason Yan 		if (ext3_feature_set_ok(sb))
4692d7f3542bSJason Yan 			ext4_msg(sb, KERN_INFO, "mounting ext3 file system "
4693d7f3542bSJason Yan 				 "using the ext4 subsystem");
4694d7f3542bSJason Yan 		else {
4695d7f3542bSJason Yan 			/*
4696d7f3542bSJason Yan 			 * If we're probing be silent, if this looks like
4697d7f3542bSJason Yan 			 * it's actually an ext4 filesystem.
4698d7f3542bSJason Yan 			 */
4699d7f3542bSJason Yan 			if (silent && ext4_feature_set_ok(sb, sb_rdonly(sb)))
4700d7f3542bSJason Yan 				return -EINVAL;
4701d7f3542bSJason Yan 			ext4_msg(sb, KERN_ERR, "couldn't mount as ext3 due "
4702d7f3542bSJason Yan 				 "to feature incompatibilities");
4703d7f3542bSJason Yan 			return -EINVAL;
4704d7f3542bSJason Yan 		}
4705d7f3542bSJason Yan 	}
4706d7f3542bSJason Yan 
4707d7f3542bSJason Yan 	/*
4708d7f3542bSJason Yan 	 * Check feature flags regardless of the revision level, since we
4709d7f3542bSJason Yan 	 * previously didn't change the revision level when setting the flags,
4710d7f3542bSJason Yan 	 * so there is a chance incompat flags are set on a rev 0 filesystem.
4711d7f3542bSJason Yan 	 */
4712d7f3542bSJason Yan 	if (!ext4_feature_set_ok(sb, (sb_rdonly(sb))))
4713d7f3542bSJason Yan 		return -EINVAL;
4714d7f3542bSJason Yan 
4715*54902099SJason Yan 	if (sbi->s_daxdev) {
4716*54902099SJason Yan 		if (sb->s_blocksize == PAGE_SIZE)
4717*54902099SJason Yan 			set_bit(EXT4_FLAGS_BDEV_IS_DAX, &sbi->s_ext4_flags);
4718*54902099SJason Yan 		else
4719*54902099SJason Yan 			ext4_msg(sb, KERN_ERR, "unsupported blocksize for DAX\n");
4720*54902099SJason Yan 	}
4721*54902099SJason Yan 
4722*54902099SJason Yan 	if (sbi->s_mount_opt & EXT4_MOUNT_DAX_ALWAYS) {
4723*54902099SJason Yan 		if (ext4_has_feature_inline_data(sb)) {
4724*54902099SJason Yan 			ext4_msg(sb, KERN_ERR, "Cannot use DAX on a filesystem"
4725*54902099SJason Yan 					" that may contain inline data");
4726*54902099SJason Yan 			return -EINVAL;
4727*54902099SJason Yan 		}
4728*54902099SJason Yan 		if (!test_bit(EXT4_FLAGS_BDEV_IS_DAX, &sbi->s_ext4_flags)) {
4729*54902099SJason Yan 			ext4_msg(sb, KERN_ERR,
4730*54902099SJason Yan 				"DAX unsupported by block device.");
4731*54902099SJason Yan 			return -EINVAL;
4732*54902099SJason Yan 		}
4733*54902099SJason Yan 	}
4734*54902099SJason Yan 
4735*54902099SJason Yan 	if (ext4_has_feature_encrypt(sb) && es->s_encryption_level) {
4736*54902099SJason Yan 		ext4_msg(sb, KERN_ERR, "Unsupported encryption level %d",
4737*54902099SJason Yan 			 es->s_encryption_level);
4738*54902099SJason Yan 		return -EINVAL;
4739*54902099SJason Yan 	}
4740*54902099SJason Yan 
4741d7f3542bSJason Yan 	return 0;
4742d7f3542bSJason Yan }
4743d7f3542bSJason Yan 
474468e62439SJason Yan static int ext4_check_geometry(struct super_block *sb,
4745bc62dbf9SJason Yan 			       struct ext4_super_block *es)
4746bc62dbf9SJason Yan {
4747bc62dbf9SJason Yan 	struct ext4_sb_info *sbi = EXT4_SB(sb);
4748bc62dbf9SJason Yan 	__u64 blocks_count;
4749269e9226SJason Yan 	int err;
4750269e9226SJason Yan 
4751269e9226SJason Yan 	if (le16_to_cpu(sbi->s_es->s_reserved_gdt_blocks) > (sb->s_blocksize / 4)) {
4752269e9226SJason Yan 		ext4_msg(sb, KERN_ERR,
4753269e9226SJason Yan 			 "Number of reserved GDT blocks insanely large: %d",
4754269e9226SJason Yan 			 le16_to_cpu(sbi->s_es->s_reserved_gdt_blocks));
4755269e9226SJason Yan 		return -EINVAL;
4756269e9226SJason Yan 	}
4757269e9226SJason Yan 	/*
4758269e9226SJason Yan 	 * Test whether we have more sectors than will fit in sector_t,
4759269e9226SJason Yan 	 * and whether the max offset is addressable by the page cache.
4760269e9226SJason Yan 	 */
4761269e9226SJason Yan 	err = generic_check_addressable(sb->s_blocksize_bits,
4762269e9226SJason Yan 					ext4_blocks_count(es));
4763269e9226SJason Yan 	if (err) {
4764269e9226SJason Yan 		ext4_msg(sb, KERN_ERR, "filesystem"
4765269e9226SJason Yan 			 " too large to mount safely on this system");
4766269e9226SJason Yan 		return err;
4767269e9226SJason Yan 	}
4768bc62dbf9SJason Yan 
4769bc62dbf9SJason Yan 	/* check blocks count against device size */
4770bc62dbf9SJason Yan 	blocks_count = sb_bdev_nr_blocks(sb);
4771bc62dbf9SJason Yan 	if (blocks_count && ext4_blocks_count(es) > blocks_count) {
4772bc62dbf9SJason Yan 		ext4_msg(sb, KERN_WARNING, "bad geometry: block count %llu "
4773bc62dbf9SJason Yan 		       "exceeds size of device (%llu blocks)",
4774bc62dbf9SJason Yan 		       ext4_blocks_count(es), blocks_count);
4775bc62dbf9SJason Yan 		return -EINVAL;
4776bc62dbf9SJason Yan 	}
4777bc62dbf9SJason Yan 
4778bc62dbf9SJason Yan 	/*
4779bc62dbf9SJason Yan 	 * It makes no sense for the first data block to be beyond the end
4780bc62dbf9SJason Yan 	 * of the filesystem.
4781bc62dbf9SJason Yan 	 */
4782bc62dbf9SJason Yan 	if (le32_to_cpu(es->s_first_data_block) >= ext4_blocks_count(es)) {
4783bc62dbf9SJason Yan 		ext4_msg(sb, KERN_WARNING, "bad geometry: first data "
4784bc62dbf9SJason Yan 			 "block %u is beyond end of filesystem (%llu)",
4785bc62dbf9SJason Yan 			 le32_to_cpu(es->s_first_data_block),
4786bc62dbf9SJason Yan 			 ext4_blocks_count(es));
4787bc62dbf9SJason Yan 		return -EINVAL;
4788bc62dbf9SJason Yan 	}
4789bc62dbf9SJason Yan 	if ((es->s_first_data_block == 0) && (es->s_log_block_size == 0) &&
4790bc62dbf9SJason Yan 	    (sbi->s_cluster_ratio == 1)) {
4791bc62dbf9SJason Yan 		ext4_msg(sb, KERN_WARNING, "bad geometry: first data "
4792bc62dbf9SJason Yan 			 "block is 0 with a 1k block and cluster size");
4793bc62dbf9SJason Yan 		return -EINVAL;
4794bc62dbf9SJason Yan 	}
4795bc62dbf9SJason Yan 
4796bc62dbf9SJason Yan 	blocks_count = (ext4_blocks_count(es) -
4797bc62dbf9SJason Yan 			le32_to_cpu(es->s_first_data_block) +
4798bc62dbf9SJason Yan 			EXT4_BLOCKS_PER_GROUP(sb) - 1);
4799bc62dbf9SJason Yan 	do_div(blocks_count, EXT4_BLOCKS_PER_GROUP(sb));
4800bc62dbf9SJason Yan 	if (blocks_count > ((uint64_t)1<<32) - EXT4_DESC_PER_BLOCK(sb)) {
4801bc62dbf9SJason Yan 		ext4_msg(sb, KERN_WARNING, "groups count too large: %llu "
4802bc62dbf9SJason Yan 		       "(block count %llu, first data block %u, "
4803bc62dbf9SJason Yan 		       "blocks per group %lu)", blocks_count,
4804bc62dbf9SJason Yan 		       ext4_blocks_count(es),
4805bc62dbf9SJason Yan 		       le32_to_cpu(es->s_first_data_block),
4806bc62dbf9SJason Yan 		       EXT4_BLOCKS_PER_GROUP(sb));
4807bc62dbf9SJason Yan 		return -EINVAL;
4808bc62dbf9SJason Yan 	}
4809bc62dbf9SJason Yan 	sbi->s_groups_count = blocks_count;
4810bc62dbf9SJason Yan 	sbi->s_blockfile_groups = min_t(ext4_group_t, sbi->s_groups_count,
4811bc62dbf9SJason Yan 			(EXT4_MAX_BLOCK_FILE_PHYS / EXT4_BLOCKS_PER_GROUP(sb)));
4812bc62dbf9SJason Yan 	if (((u64)sbi->s_groups_count * sbi->s_inodes_per_group) !=
4813bc62dbf9SJason Yan 	    le32_to_cpu(es->s_inodes_count)) {
4814bc62dbf9SJason Yan 		ext4_msg(sb, KERN_ERR, "inodes count not valid: %u vs %llu",
4815bc62dbf9SJason Yan 			 le32_to_cpu(es->s_inodes_count),
4816bc62dbf9SJason Yan 			 ((u64)sbi->s_groups_count * sbi->s_inodes_per_group));
4817bc62dbf9SJason Yan 		return -EINVAL;
4818bc62dbf9SJason Yan 	}
4819bc62dbf9SJason Yan 
4820bc62dbf9SJason Yan 	return 0;
4821bc62dbf9SJason Yan }
4822bc62dbf9SJason Yan 
4823a4e6a511SJason Yan static int ext4_group_desc_init(struct super_block *sb,
4824a4e6a511SJason Yan 				struct ext4_super_block *es,
4825a4e6a511SJason Yan 				ext4_fsblk_t logical_sb_block,
4826a4e6a511SJason Yan 				ext4_group_t *first_not_zeroed)
4827a4e6a511SJason Yan {
4828a4e6a511SJason Yan 	struct ext4_sb_info *sbi = EXT4_SB(sb);
4829a4e6a511SJason Yan 	unsigned int db_count;
4830a4e6a511SJason Yan 	ext4_fsblk_t block;
4831a4e6a511SJason Yan 	int i;
4832a4e6a511SJason Yan 
4833a4e6a511SJason Yan 	db_count = (sbi->s_groups_count + EXT4_DESC_PER_BLOCK(sb) - 1) /
4834a4e6a511SJason Yan 		   EXT4_DESC_PER_BLOCK(sb);
4835a4e6a511SJason Yan 	if (ext4_has_feature_meta_bg(sb)) {
4836a4e6a511SJason Yan 		if (le32_to_cpu(es->s_first_meta_bg) > db_count) {
4837a4e6a511SJason Yan 			ext4_msg(sb, KERN_WARNING,
4838a4e6a511SJason Yan 				 "first meta block group too large: %u "
4839a4e6a511SJason Yan 				 "(group descriptor block count %u)",
4840a4e6a511SJason Yan 				 le32_to_cpu(es->s_first_meta_bg), db_count);
4841a4e6a511SJason Yan 			return -EINVAL;
4842a4e6a511SJason Yan 		}
4843a4e6a511SJason Yan 	}
4844a4e6a511SJason Yan 	rcu_assign_pointer(sbi->s_group_desc,
4845a4e6a511SJason Yan 			   kvmalloc_array(db_count,
4846a4e6a511SJason Yan 					  sizeof(struct buffer_head *),
4847a4e6a511SJason Yan 					  GFP_KERNEL));
4848a4e6a511SJason Yan 	if (sbi->s_group_desc == NULL) {
4849a4e6a511SJason Yan 		ext4_msg(sb, KERN_ERR, "not enough memory");
4850a4e6a511SJason Yan 		return -ENOMEM;
4851a4e6a511SJason Yan 	}
4852a4e6a511SJason Yan 
4853a4e6a511SJason Yan 	bgl_lock_init(sbi->s_blockgroup_lock);
4854a4e6a511SJason Yan 
4855a4e6a511SJason Yan 	/* Pre-read the descriptors into the buffer cache */
4856a4e6a511SJason Yan 	for (i = 0; i < db_count; i++) {
4857a4e6a511SJason Yan 		block = descriptor_loc(sb, logical_sb_block, i);
4858a4e6a511SJason Yan 		ext4_sb_breadahead_unmovable(sb, block);
4859a4e6a511SJason Yan 	}
4860a4e6a511SJason Yan 
4861a4e6a511SJason Yan 	for (i = 0; i < db_count; i++) {
4862a4e6a511SJason Yan 		struct buffer_head *bh;
4863a4e6a511SJason Yan 
4864a4e6a511SJason Yan 		block = descriptor_loc(sb, logical_sb_block, i);
4865a4e6a511SJason Yan 		bh = ext4_sb_bread_unmovable(sb, block);
4866a4e6a511SJason Yan 		if (IS_ERR(bh)) {
4867a4e6a511SJason Yan 			ext4_msg(sb, KERN_ERR,
4868a4e6a511SJason Yan 			       "can't read group descriptor %d", i);
4869a4e6a511SJason Yan 			sbi->s_gdb_count = i;
4870172e344eSYe Bin 			return PTR_ERR(bh);
4871a4e6a511SJason Yan 		}
4872a4e6a511SJason Yan 		rcu_read_lock();
4873a4e6a511SJason Yan 		rcu_dereference(sbi->s_group_desc)[i] = bh;
4874a4e6a511SJason Yan 		rcu_read_unlock();
4875a4e6a511SJason Yan 	}
4876a4e6a511SJason Yan 	sbi->s_gdb_count = db_count;
4877a4e6a511SJason Yan 	if (!ext4_check_descriptors(sb, logical_sb_block, first_not_zeroed)) {
4878a4e6a511SJason Yan 		ext4_msg(sb, KERN_ERR, "group descriptors corrupted!");
4879172e344eSYe Bin 		return -EFSCORRUPTED;
4880a4e6a511SJason Yan 	}
4881172e344eSYe Bin 
4882a4e6a511SJason Yan 	return 0;
4883a4e6a511SJason Yan }
4884a4e6a511SJason Yan 
48859c1dd22dSJason Yan static int ext4_load_and_init_journal(struct super_block *sb,
48869c1dd22dSJason Yan 				      struct ext4_super_block *es,
48879c1dd22dSJason Yan 				      struct ext4_fs_context *ctx)
48889c1dd22dSJason Yan {
48899c1dd22dSJason Yan 	struct ext4_sb_info *sbi = EXT4_SB(sb);
48909c1dd22dSJason Yan 	int err;
48919c1dd22dSJason Yan 
48929c1dd22dSJason Yan 	err = ext4_load_journal(sb, es, ctx->journal_devnum);
48939c1dd22dSJason Yan 	if (err)
48949c1dd22dSJason Yan 		return err;
48959c1dd22dSJason Yan 
48969c1dd22dSJason Yan 	if (ext4_has_feature_64bit(sb) &&
48979c1dd22dSJason Yan 	    !jbd2_journal_set_features(EXT4_SB(sb)->s_journal, 0, 0,
48989c1dd22dSJason Yan 				       JBD2_FEATURE_INCOMPAT_64BIT)) {
48999c1dd22dSJason Yan 		ext4_msg(sb, KERN_ERR, "Failed to set 64-bit journal feature");
49009c1dd22dSJason Yan 		goto out;
49019c1dd22dSJason Yan 	}
49029c1dd22dSJason Yan 
49039c1dd22dSJason Yan 	if (!set_journal_csum_feature_set(sb)) {
49049c1dd22dSJason Yan 		ext4_msg(sb, KERN_ERR, "Failed to set journal checksum "
49059c1dd22dSJason Yan 			 "feature set");
49069c1dd22dSJason Yan 		goto out;
49079c1dd22dSJason Yan 	}
49089c1dd22dSJason Yan 
49099c1dd22dSJason Yan 	if (test_opt2(sb, JOURNAL_FAST_COMMIT) &&
49109c1dd22dSJason Yan 		!jbd2_journal_set_features(EXT4_SB(sb)->s_journal, 0, 0,
49119c1dd22dSJason Yan 					  JBD2_FEATURE_INCOMPAT_FAST_COMMIT)) {
49129c1dd22dSJason Yan 		ext4_msg(sb, KERN_ERR,
49139c1dd22dSJason Yan 			"Failed to set fast commit journal feature");
49149c1dd22dSJason Yan 		goto out;
49159c1dd22dSJason Yan 	}
49169c1dd22dSJason Yan 
49179c1dd22dSJason Yan 	/* We have now updated the journal if required, so we can
49189c1dd22dSJason Yan 	 * validate the data journaling mode. */
49199c1dd22dSJason Yan 	switch (test_opt(sb, DATA_FLAGS)) {
49209c1dd22dSJason Yan 	case 0:
49219c1dd22dSJason Yan 		/* No mode set, assume a default based on the journal
49229c1dd22dSJason Yan 		 * capabilities: ORDERED_DATA if the journal can
49239c1dd22dSJason Yan 		 * cope, else JOURNAL_DATA
49249c1dd22dSJason Yan 		 */
49259c1dd22dSJason Yan 		if (jbd2_journal_check_available_features
49269c1dd22dSJason Yan 		    (sbi->s_journal, 0, 0, JBD2_FEATURE_INCOMPAT_REVOKE)) {
49279c1dd22dSJason Yan 			set_opt(sb, ORDERED_DATA);
49289c1dd22dSJason Yan 			sbi->s_def_mount_opt |= EXT4_MOUNT_ORDERED_DATA;
49299c1dd22dSJason Yan 		} else {
49309c1dd22dSJason Yan 			set_opt(sb, JOURNAL_DATA);
49319c1dd22dSJason Yan 			sbi->s_def_mount_opt |= EXT4_MOUNT_JOURNAL_DATA;
49329c1dd22dSJason Yan 		}
49339c1dd22dSJason Yan 		break;
49349c1dd22dSJason Yan 
49359c1dd22dSJason Yan 	case EXT4_MOUNT_ORDERED_DATA:
49369c1dd22dSJason Yan 	case EXT4_MOUNT_WRITEBACK_DATA:
49379c1dd22dSJason Yan 		if (!jbd2_journal_check_available_features
49389c1dd22dSJason Yan 		    (sbi->s_journal, 0, 0, JBD2_FEATURE_INCOMPAT_REVOKE)) {
49399c1dd22dSJason Yan 			ext4_msg(sb, KERN_ERR, "Journal does not support "
49409c1dd22dSJason Yan 			       "requested data journaling mode");
49419c1dd22dSJason Yan 			goto out;
49429c1dd22dSJason Yan 		}
49439c1dd22dSJason Yan 		break;
49449c1dd22dSJason Yan 	default:
49459c1dd22dSJason Yan 		break;
49469c1dd22dSJason Yan 	}
49479c1dd22dSJason Yan 
49489c1dd22dSJason Yan 	if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_ORDERED_DATA &&
49499c1dd22dSJason Yan 	    test_opt(sb, JOURNAL_ASYNC_COMMIT)) {
49509c1dd22dSJason Yan 		ext4_msg(sb, KERN_ERR, "can't mount with "
49519c1dd22dSJason Yan 			"journal_async_commit in data=ordered mode");
49529c1dd22dSJason Yan 		goto out;
49539c1dd22dSJason Yan 	}
49549c1dd22dSJason Yan 
49559c1dd22dSJason Yan 	set_task_ioprio(sbi->s_journal->j_task, ctx->journal_ioprio);
49569c1dd22dSJason Yan 
49579c1dd22dSJason Yan 	sbi->s_journal->j_submit_inode_data_buffers =
49589c1dd22dSJason Yan 		ext4_journal_submit_inode_data_buffers;
49599c1dd22dSJason Yan 	sbi->s_journal->j_finish_inode_data_buffers =
49609c1dd22dSJason Yan 		ext4_journal_finish_inode_data_buffers;
49619c1dd22dSJason Yan 
49629c1dd22dSJason Yan 	return 0;
49639c1dd22dSJason Yan 
49649c1dd22dSJason Yan out:
49659c1dd22dSJason Yan 	/* flush s_error_work before journal destroy. */
49669c1dd22dSJason Yan 	flush_work(&sbi->s_error_work);
49679c1dd22dSJason Yan 	jbd2_journal_destroy(sbi->s_journal);
49689c1dd22dSJason Yan 	sbi->s_journal = NULL;
49699f2a1d9fSJason Yan 	return -EINVAL;
49709c1dd22dSJason Yan }
49719c1dd22dSJason Yan 
497268e62439SJason Yan static int ext4_check_journal_data_mode(struct super_block *sb)
4973a5991e53SJason Yan {
4974a5991e53SJason Yan 	if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_JOURNAL_DATA) {
4975a5991e53SJason Yan 		printk_once(KERN_WARNING "EXT4-fs: Warning: mounting with "
4976a5991e53SJason Yan 			    "data=journal disables delayed allocation, "
4977a5991e53SJason Yan 			    "dioread_nolock, O_DIRECT and fast_commit support!\n");
4978a5991e53SJason Yan 		/* can't mount with both data=journal and dioread_nolock. */
4979a5991e53SJason Yan 		clear_opt(sb, DIOREAD_NOLOCK);
4980a5991e53SJason Yan 		clear_opt2(sb, JOURNAL_FAST_COMMIT);
4981a5991e53SJason Yan 		if (test_opt2(sb, EXPLICIT_DELALLOC)) {
4982a5991e53SJason Yan 			ext4_msg(sb, KERN_ERR, "can't mount with "
4983a5991e53SJason Yan 				 "both data=journal and delalloc");
4984a5991e53SJason Yan 			return -EINVAL;
4985a5991e53SJason Yan 		}
4986a5991e53SJason Yan 		if (test_opt(sb, DAX_ALWAYS)) {
4987a5991e53SJason Yan 			ext4_msg(sb, KERN_ERR, "can't mount with "
4988a5991e53SJason Yan 				 "both data=journal and dax");
4989a5991e53SJason Yan 			return -EINVAL;
4990a5991e53SJason Yan 		}
4991a5991e53SJason Yan 		if (ext4_has_feature_encrypt(sb)) {
4992a5991e53SJason Yan 			ext4_msg(sb, KERN_WARNING,
4993a5991e53SJason Yan 				 "encrypted files will use data=ordered "
4994a5991e53SJason Yan 				 "instead of data journaling mode");
4995a5991e53SJason Yan 		}
4996a5991e53SJason Yan 		if (test_opt(sb, DELALLOC))
4997a5991e53SJason Yan 			clear_opt(sb, DELALLOC);
4998a5991e53SJason Yan 	} else {
4999a5991e53SJason Yan 		sb->s_iflags |= SB_I_CGROUPWB;
5000a5991e53SJason Yan 	}
5001a5991e53SJason Yan 
5002a5991e53SJason Yan 	return 0;
5003a5991e53SJason Yan }
5004a5991e53SJason Yan 
5005a7a79c29SJason Yan static int ext4_load_super(struct super_block *sb, ext4_fsblk_t *lsb,
5006a7a79c29SJason Yan 			   int silent)
5007a7a79c29SJason Yan {
5008a7a79c29SJason Yan 	struct ext4_sb_info *sbi = EXT4_SB(sb);
5009a7a79c29SJason Yan 	struct ext4_super_block *es;
5010a7a79c29SJason Yan 	ext4_fsblk_t logical_sb_block;
5011a7a79c29SJason Yan 	unsigned long offset = 0;
5012a7a79c29SJason Yan 	struct buffer_head *bh;
5013a7a79c29SJason Yan 	int ret = -EINVAL;
5014a7a79c29SJason Yan 	int blocksize;
5015a7a79c29SJason Yan 
5016a7a79c29SJason Yan 	blocksize = sb_min_blocksize(sb, EXT4_MIN_BLOCK_SIZE);
5017a7a79c29SJason Yan 	if (!blocksize) {
5018a7a79c29SJason Yan 		ext4_msg(sb, KERN_ERR, "unable to set blocksize");
5019a7a79c29SJason Yan 		return -EINVAL;
5020a7a79c29SJason Yan 	}
5021a7a79c29SJason Yan 
5022a7a79c29SJason Yan 	/*
5023a7a79c29SJason Yan 	 * The ext4 superblock will not be buffer aligned for other than 1kB
5024a7a79c29SJason Yan 	 * block sizes.  We need to calculate the offset from buffer start.
5025a7a79c29SJason Yan 	 */
5026a7a79c29SJason Yan 	if (blocksize != EXT4_MIN_BLOCK_SIZE) {
5027a7a79c29SJason Yan 		logical_sb_block = sbi->s_sb_block * EXT4_MIN_BLOCK_SIZE;
5028a7a79c29SJason Yan 		offset = do_div(logical_sb_block, blocksize);
5029a7a79c29SJason Yan 	} else {
5030a7a79c29SJason Yan 		logical_sb_block = sbi->s_sb_block;
5031a7a79c29SJason Yan 	}
5032a7a79c29SJason Yan 
5033a7a79c29SJason Yan 	bh = ext4_sb_bread_unmovable(sb, logical_sb_block);
5034a7a79c29SJason Yan 	if (IS_ERR(bh)) {
5035a7a79c29SJason Yan 		ext4_msg(sb, KERN_ERR, "unable to read superblock");
5036a7a79c29SJason Yan 		return PTR_ERR(bh);
5037a7a79c29SJason Yan 	}
5038a7a79c29SJason Yan 	/*
5039a7a79c29SJason Yan 	 * Note: s_es must be initialized as soon as possible because
5040a7a79c29SJason Yan 	 *       some ext4 macro-instructions depend on its value
5041a7a79c29SJason Yan 	 */
5042a7a79c29SJason Yan 	es = (struct ext4_super_block *) (bh->b_data + offset);
5043a7a79c29SJason Yan 	sbi->s_es = es;
5044a7a79c29SJason Yan 	sb->s_magic = le16_to_cpu(es->s_magic);
5045a7a79c29SJason Yan 	if (sb->s_magic != EXT4_SUPER_MAGIC) {
5046a7a79c29SJason Yan 		if (!silent)
5047a7a79c29SJason Yan 			ext4_msg(sb, KERN_ERR, "VFS: Can't find ext4 filesystem");
5048a7a79c29SJason Yan 		goto out;
5049a7a79c29SJason Yan 	}
5050a7a79c29SJason Yan 
5051a7a79c29SJason Yan 	if (le32_to_cpu(es->s_log_block_size) >
5052a7a79c29SJason Yan 	    (EXT4_MAX_BLOCK_LOG_SIZE - EXT4_MIN_BLOCK_LOG_SIZE)) {
5053a7a79c29SJason Yan 		ext4_msg(sb, KERN_ERR,
5054a7a79c29SJason Yan 			 "Invalid log block size: %u",
5055a7a79c29SJason Yan 			 le32_to_cpu(es->s_log_block_size));
5056a7a79c29SJason Yan 		goto out;
5057a7a79c29SJason Yan 	}
5058a7a79c29SJason Yan 	if (le32_to_cpu(es->s_log_cluster_size) >
5059a7a79c29SJason Yan 	    (EXT4_MAX_CLUSTER_LOG_SIZE - EXT4_MIN_BLOCK_LOG_SIZE)) {
5060a7a79c29SJason Yan 		ext4_msg(sb, KERN_ERR,
5061a7a79c29SJason Yan 			 "Invalid log cluster size: %u",
5062a7a79c29SJason Yan 			 le32_to_cpu(es->s_log_cluster_size));
5063a7a79c29SJason Yan 		goto out;
5064a7a79c29SJason Yan 	}
5065a7a79c29SJason Yan 
5066a7a79c29SJason Yan 	blocksize = EXT4_MIN_BLOCK_SIZE << le32_to_cpu(es->s_log_block_size);
5067a7a79c29SJason Yan 
5068a7a79c29SJason Yan 	/*
5069a7a79c29SJason Yan 	 * If the default block size is not the same as the real block size,
5070a7a79c29SJason Yan 	 * we need to reload it.
5071a7a79c29SJason Yan 	 */
5072a7a79c29SJason Yan 	if (sb->s_blocksize == blocksize) {
5073a7a79c29SJason Yan 		*lsb = logical_sb_block;
5074a7a79c29SJason Yan 		sbi->s_sbh = bh;
5075a7a79c29SJason Yan 		return 0;
5076a7a79c29SJason Yan 	}
5077a7a79c29SJason Yan 
5078a7a79c29SJason Yan 	/*
5079a7a79c29SJason Yan 	 * bh must be released before kill_bdev(), otherwise
5080a7a79c29SJason Yan 	 * it won't be freed and its page also. kill_bdev()
5081a7a79c29SJason Yan 	 * is called by sb_set_blocksize().
5082a7a79c29SJason Yan 	 */
5083a7a79c29SJason Yan 	brelse(bh);
5084a7a79c29SJason Yan 	/* Validate the filesystem blocksize */
5085a7a79c29SJason Yan 	if (!sb_set_blocksize(sb, blocksize)) {
5086a7a79c29SJason Yan 		ext4_msg(sb, KERN_ERR, "bad block size %d",
5087a7a79c29SJason Yan 				blocksize);
5088a7a79c29SJason Yan 		bh = NULL;
5089a7a79c29SJason Yan 		goto out;
5090a7a79c29SJason Yan 	}
5091a7a79c29SJason Yan 
5092a7a79c29SJason Yan 	logical_sb_block = sbi->s_sb_block * EXT4_MIN_BLOCK_SIZE;
5093a7a79c29SJason Yan 	offset = do_div(logical_sb_block, blocksize);
5094a7a79c29SJason Yan 	bh = ext4_sb_bread_unmovable(sb, logical_sb_block);
5095a7a79c29SJason Yan 	if (IS_ERR(bh)) {
5096a7a79c29SJason Yan 		ext4_msg(sb, KERN_ERR, "Can't read superblock on 2nd try");
5097a7a79c29SJason Yan 		ret = PTR_ERR(bh);
5098a7a79c29SJason Yan 		bh = NULL;
5099a7a79c29SJason Yan 		goto out;
5100a7a79c29SJason Yan 	}
5101a7a79c29SJason Yan 	es = (struct ext4_super_block *)(bh->b_data + offset);
5102a7a79c29SJason Yan 	sbi->s_es = es;
5103a7a79c29SJason Yan 	if (es->s_magic != cpu_to_le16(EXT4_SUPER_MAGIC)) {
5104a7a79c29SJason Yan 		ext4_msg(sb, KERN_ERR, "Magic mismatch, very weird!");
5105a7a79c29SJason Yan 		goto out;
5106a7a79c29SJason Yan 	}
5107a7a79c29SJason Yan 	*lsb = logical_sb_block;
5108a7a79c29SJason Yan 	sbi->s_sbh = bh;
5109a7a79c29SJason Yan 	return 0;
5110a7a79c29SJason Yan out:
5111a7a79c29SJason Yan 	brelse(bh);
5112a7a79c29SJason Yan 	return ret;
5113a7a79c29SJason Yan }
5114a7a79c29SJason Yan 
5115db9345d9SJason Yan static void ext4_hash_info_init(struct super_block *sb)
5116db9345d9SJason Yan {
5117db9345d9SJason Yan 	struct ext4_sb_info *sbi = EXT4_SB(sb);
5118db9345d9SJason Yan 	struct ext4_super_block *es = sbi->s_es;
5119db9345d9SJason Yan 	unsigned int i;
5120db9345d9SJason Yan 
5121db9345d9SJason Yan 	for (i = 0; i < 4; i++)
5122db9345d9SJason Yan 		sbi->s_hash_seed[i] = le32_to_cpu(es->s_hash_seed[i]);
5123db9345d9SJason Yan 
5124db9345d9SJason Yan 	sbi->s_def_hash_version = es->s_def_hash_version;
5125db9345d9SJason Yan 	if (ext4_has_feature_dir_index(sb)) {
5126db9345d9SJason Yan 		i = le32_to_cpu(es->s_flags);
5127db9345d9SJason Yan 		if (i & EXT2_FLAGS_UNSIGNED_HASH)
5128db9345d9SJason Yan 			sbi->s_hash_unsigned = 3;
5129db9345d9SJason Yan 		else if ((i & EXT2_FLAGS_SIGNED_HASH) == 0) {
5130db9345d9SJason Yan #ifdef __CHAR_UNSIGNED__
5131db9345d9SJason Yan 			if (!sb_rdonly(sb))
5132db9345d9SJason Yan 				es->s_flags |=
5133db9345d9SJason Yan 					cpu_to_le32(EXT2_FLAGS_UNSIGNED_HASH);
5134db9345d9SJason Yan 			sbi->s_hash_unsigned = 3;
5135db9345d9SJason Yan #else
5136db9345d9SJason Yan 			if (!sb_rdonly(sb))
5137db9345d9SJason Yan 				es->s_flags |=
5138db9345d9SJason Yan 					cpu_to_le32(EXT2_FLAGS_SIGNED_HASH);
5139db9345d9SJason Yan #endif
5140db9345d9SJason Yan 		}
5141db9345d9SJason Yan 	}
5142db9345d9SJason Yan }
5143db9345d9SJason Yan 
5144107d2be9SJason Yan static int ext4_block_group_meta_init(struct super_block *sb, int silent)
5145107d2be9SJason Yan {
5146107d2be9SJason Yan 	struct ext4_sb_info *sbi = EXT4_SB(sb);
5147107d2be9SJason Yan 	struct ext4_super_block *es = sbi->s_es;
5148107d2be9SJason Yan 	int has_huge_files;
5149107d2be9SJason Yan 
5150107d2be9SJason Yan 	has_huge_files = ext4_has_feature_huge_file(sb);
5151107d2be9SJason Yan 	sbi->s_bitmap_maxbytes = ext4_max_bitmap_size(sb->s_blocksize_bits,
5152107d2be9SJason Yan 						      has_huge_files);
5153107d2be9SJason Yan 	sb->s_maxbytes = ext4_max_size(sb->s_blocksize_bits, has_huge_files);
5154107d2be9SJason Yan 
5155107d2be9SJason Yan 	sbi->s_desc_size = le16_to_cpu(es->s_desc_size);
5156107d2be9SJason Yan 	if (ext4_has_feature_64bit(sb)) {
5157107d2be9SJason Yan 		if (sbi->s_desc_size < EXT4_MIN_DESC_SIZE_64BIT ||
5158107d2be9SJason Yan 		    sbi->s_desc_size > EXT4_MAX_DESC_SIZE ||
5159107d2be9SJason Yan 		    !is_power_of_2(sbi->s_desc_size)) {
5160107d2be9SJason Yan 			ext4_msg(sb, KERN_ERR,
5161107d2be9SJason Yan 			       "unsupported descriptor size %lu",
5162107d2be9SJason Yan 			       sbi->s_desc_size);
5163107d2be9SJason Yan 			return -EINVAL;
5164107d2be9SJason Yan 		}
5165107d2be9SJason Yan 	} else
5166107d2be9SJason Yan 		sbi->s_desc_size = EXT4_MIN_DESC_SIZE;
5167107d2be9SJason Yan 
5168107d2be9SJason Yan 	sbi->s_blocks_per_group = le32_to_cpu(es->s_blocks_per_group);
5169107d2be9SJason Yan 	sbi->s_inodes_per_group = le32_to_cpu(es->s_inodes_per_group);
5170107d2be9SJason Yan 
5171107d2be9SJason Yan 	sbi->s_inodes_per_block = sb->s_blocksize / EXT4_INODE_SIZE(sb);
5172107d2be9SJason Yan 	if (sbi->s_inodes_per_block == 0 || sbi->s_blocks_per_group == 0) {
5173107d2be9SJason Yan 		if (!silent)
5174107d2be9SJason Yan 			ext4_msg(sb, KERN_ERR, "VFS: Can't find ext4 filesystem");
5175107d2be9SJason Yan 		return -EINVAL;
5176107d2be9SJason Yan 	}
5177107d2be9SJason Yan 	if (sbi->s_inodes_per_group < sbi->s_inodes_per_block ||
5178107d2be9SJason Yan 	    sbi->s_inodes_per_group > sb->s_blocksize * 8) {
5179107d2be9SJason Yan 		ext4_msg(sb, KERN_ERR, "invalid inodes per group: %lu\n",
5180107d2be9SJason Yan 			 sbi->s_inodes_per_group);
5181107d2be9SJason Yan 		return -EINVAL;
5182107d2be9SJason Yan 	}
5183107d2be9SJason Yan 	sbi->s_itb_per_group = sbi->s_inodes_per_group /
5184107d2be9SJason Yan 					sbi->s_inodes_per_block;
5185107d2be9SJason Yan 	sbi->s_desc_per_block = sb->s_blocksize / EXT4_DESC_SIZE(sb);
5186107d2be9SJason Yan 	sbi->s_mount_state = le16_to_cpu(es->s_state) & ~EXT4_FC_REPLAY;
5187107d2be9SJason Yan 	sbi->s_addr_per_block_bits = ilog2(EXT4_ADDR_PER_BLOCK(sb));
5188107d2be9SJason Yan 	sbi->s_desc_per_block_bits = ilog2(EXT4_DESC_PER_BLOCK(sb));
5189107d2be9SJason Yan 
5190107d2be9SJason Yan 	return 0;
5191107d2be9SJason Yan }
5192107d2be9SJason Yan 
5193960e0ab6SLukas Czerner static int __ext4_fill_super(struct fs_context *fc, struct super_block *sb)
51947edfd85bSLukas Czerner {
5195617ba13bSMingming Cao 	struct ext4_super_block *es = NULL;
51967edfd85bSLukas Czerner 	struct ext4_sb_info *sbi = EXT4_SB(sb);
519770bbb3e0SAndrew Morton 	ext4_fsblk_t logical_sb_block;
5198ac27a0ecSDave Kleikamp 	struct inode *root;
5199dcc7dae3SCyrill Gorcunov 	int ret = -ENOMEM;
52004ec11028STheodore Ts'o 	unsigned int i;
5201107d2be9SJason Yan 	int needs_recovery;
520207aa2ea1SLukas Czerner 	int err = 0;
5203bfff6873SLukas Czerner 	ext4_group_t first_not_zeroed;
52047edfd85bSLukas Czerner 	struct ext4_fs_context *ctx = fc->fs_private;
5205960e0ab6SLukas Czerner 	int silent = fc->sb_flags & SB_SILENT;
5206b237e304SHarshad Shirwadkar 
5207b237e304SHarshad Shirwadkar 	/* Set defaults for the variables that will be set during parsing */
5208e4e58e5dSOjaswin Mujoo 	if (!(ctx->spec & EXT4_SPEC_JOURNAL_IOPRIO))
52097edfd85bSLukas Czerner 		ctx->journal_ioprio = DEFAULT_JOURNAL_IOPRIO;
5210ac27a0ecSDave Kleikamp 
5211240799cdSTheodore Ts'o 	sbi->s_inode_readahead_blks = EXT4_DEF_INODE_READAHEAD_BLKS;
5212f613dfcbSTheodore Ts'o 	sbi->s_sectors_written_start =
52138446fe92SChristoph Hellwig 		part_stat_read(sb->s_bdev, sectors[STAT_WRITE]);
5214ac27a0ecSDave Kleikamp 
521507aa2ea1SLukas Czerner 	/* -EINVAL is default */
5216dcc7dae3SCyrill Gorcunov 	ret = -EINVAL;
5217a7a79c29SJason Yan 	err = ext4_load_super(sb, &logical_sb_block, silent);
5218a7a79c29SJason Yan 	if (err)
5219ac27a0ecSDave Kleikamp 		goto out_fail;
5220ac27a0ecSDave Kleikamp 
5221a7a79c29SJason Yan 	es = sbi->s_es;
5222afc32f7eSTheodore Ts'o 	sbi->s_kbytes_written = le64_to_cpu(es->s_kbytes_written);
5223ac27a0ecSDave Kleikamp 
5224b26458d1SJason Yan 	err = ext4_init_metadata_csum(sb, es);
5225b26458d1SJason Yan 	if (err)
5226a5fc5119SJason Yan 		goto failed_mount;
5227a9c47317SDarrick J. Wong 
52285f6d662dSJason Yan 	ext4_set_def_opts(sb, es);
5229ac27a0ecSDave Kleikamp 
523008cefc7aSEric W. Biederman 	sbi->s_resuid = make_kuid(&init_user_ns, le16_to_cpu(es->s_def_resuid));
523108cefc7aSEric W. Biederman 	sbi->s_resgid = make_kgid(&init_user_ns, le16_to_cpu(es->s_def_resgid));
523230773840STheodore Ts'o 	sbi->s_commit_interval = JBD2_DEFAULT_MAX_COMMIT_AGE * HZ;
523330773840STheodore Ts'o 	sbi->s_min_batch_time = EXT4_DEF_MIN_BATCH_TIME;
523430773840STheodore Ts'o 	sbi->s_max_batch_time = EXT4_DEF_MAX_BATCH_TIME;
5235ac27a0ecSDave Kleikamp 
523651ce6511SLukas Czerner 	/*
523751ce6511SLukas Czerner 	 * set default s_li_wait_mult for lazyinit, for the case there is
523851ce6511SLukas Czerner 	 * no mount option specified.
523951ce6511SLukas Czerner 	 */
524051ce6511SLukas Czerner 	sbi->s_li_wait_mult = EXT4_DEF_LI_WAIT_MULT;
524151ce6511SLukas Czerner 
5242c8267c51SJason Yan 	if (ext4_inode_info_init(sb, es))
52439803387cSTheodore Ts'o 		goto failed_mount;
52449803387cSTheodore Ts'o 
52457edfd85bSLukas Czerner 	err = parse_apply_sb_mount_options(sb, ctx);
52467edfd85bSLukas Czerner 	if (err < 0)
52475aee0f8aSTheodore Ts'o 		goto failed_mount;
52487edfd85bSLukas Czerner 
52495a916be1STheodore Ts'o 	sbi->s_def_mount_opt = sbi->s_mount_opt;
5250e3645d72SZhang Yi 	sbi->s_def_mount_opt2 = sbi->s_mount_opt2;
52517edfd85bSLukas Czerner 
52527edfd85bSLukas Czerner 	err = ext4_check_opt_consistency(fc, sb);
52537edfd85bSLukas Czerner 	if (err < 0)
52547edfd85bSLukas Czerner 		goto failed_mount;
52557edfd85bSLukas Czerner 
525685456054SEric Biggers 	ext4_apply_options(fc, sb);
5257ac27a0ecSDave Kleikamp 
525839c135b0SJason Yan 	if (ext4_encoding_init(sb, es))
5259c83ad55eSGabriel Krisman Bertazi 		goto failed_mount;
5260c83ad55eSGabriel Krisman Bertazi 
526168e62439SJason Yan 	if (ext4_check_journal_data_mode(sb))
526256889787STheodore Ts'o 		goto failed_mount;
526356889787STheodore Ts'o 
52641751e8a6SLinus Torvalds 	sb->s_flags = (sb->s_flags & ~SB_POSIXACL) |
52651751e8a6SLinus Torvalds 		(test_opt(sb, POSIX_ACL) ? SB_POSIXACL : 0);
5266ac27a0ecSDave Kleikamp 
52671ff20307SJeff Layton 	/* i_version is always enabled now */
52681ff20307SJeff Layton 	sb->s_flags |= SB_I_VERSION;
52691ff20307SJeff Layton 
5270d7f3542bSJason Yan 	if (ext4_check_feature_compatibility(sb, es, silent))
5271ac27a0ecSDave Kleikamp 		goto failed_mount;
5272a13fb1a4SEric Sandeen 
5273107d2be9SJason Yan 	if (ext4_block_group_meta_init(sb, silent))
52740d1ee42fSAlexandre Ratchov 		goto failed_mount;
52750b8e58a1SAndreas Dilger 
5276db9345d9SJason Yan 	ext4_hash_info_init(sb);
5277ac27a0ecSDave Kleikamp 
5278c8267c51SJason Yan 	if (ext4_handle_clustersize(sb))
5279281b5995STheodore Ts'o 		goto failed_mount;
5280960fd856STheodore Ts'o 
528168e62439SJason Yan 	if (ext4_check_geometry(sb, es))
52820f2ddca6SFrom: Thiemo Nagel 		goto failed_mount;
52830f2ddca6SFrom: Thiemo Nagel 
5284235699a8SKees Cook 	timer_setup(&sbi->s_err_report, print_daily_error_info, 0);
5285c92dc856SJan Kara 	spin_lock_init(&sbi->s_error_lock);
5286c92dc856SJan Kara 	INIT_WORK(&sbi->s_error_work, flush_stashed_error_work);
528704496411STao Ma 
5288172e344eSYe Bin 	err = ext4_group_desc_init(sb, es, logical_sb_block, &first_not_zeroed);
5289172e344eSYe Bin 	if (err)
5290172e344eSYe Bin 		goto failed_mount3;
5291172e344eSYe Bin 
5292a75ae78fSDmitry Monakhov 	/* Register extent status tree shrinker */
5293eb68d0e2SZheng Liu 	if (ext4_es_register_shrinker(sbi))
5294ce7e010aSTheodore Ts'o 		goto failed_mount3;
5295ce7e010aSTheodore Ts'o 
5296c9de560dSAlex Tomas 	sbi->s_stripe = ext4_get_stripe_size(sbi);
529767a5da56SZheng Liu 	sbi->s_extent_max_zeroout_kb = 32;
5298c9de560dSAlex Tomas 
5299f9ae9cf5STheodore Ts'o 	/*
5300f9ae9cf5STheodore Ts'o 	 * set up enough so that it can read an inode
5301f9ae9cf5STheodore Ts'o 	 */
5302f9ae9cf5STheodore Ts'o 	sb->s_op = &ext4_sops;
5303617ba13bSMingming Cao 	sb->s_export_op = &ext4_export_ops;
5304617ba13bSMingming Cao 	sb->s_xattr = ext4_xattr_handlers;
5305643fa961SChandan Rajendra #ifdef CONFIG_FS_ENCRYPTION
5306a7550b30SJaegeuk Kim 	sb->s_cop = &ext4_cryptops;
5307ffcc4182SEric Biggers #endif
5308c93d8f88SEric Biggers #ifdef CONFIG_FS_VERITY
5309c93d8f88SEric Biggers 	sb->s_vop = &ext4_verityops;
5310c93d8f88SEric Biggers #endif
5311ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
5312617ba13bSMingming Cao 	sb->dq_op = &ext4_quota_operations;
5313e2b911c5SDarrick J. Wong 	if (ext4_has_feature_quota(sb))
53141fa5efe3SJan Kara 		sb->s_qcop = &dquot_quotactl_sysfile_ops;
5315262b4662SJan Kara 	else
5316262b4662SJan Kara 		sb->s_qcop = &ext4_qctl_operations;
5317689c958cSLi Xi 	sb->s_quota_types = QTYPE_MASK_USR | QTYPE_MASK_GRP | QTYPE_MASK_PRJ;
5318ac27a0ecSDave Kleikamp #endif
531985787090SChristoph Hellwig 	memcpy(&sb->s_uuid, es->s_uuid, sizeof(es->s_uuid));
5320f2fa2ffcSAneesh Kumar K.V 
5321ac27a0ecSDave Kleikamp 	INIT_LIST_HEAD(&sbi->s_orphan); /* unlinked but open files */
53223b9d4ed2STheodore Ts'o 	mutex_init(&sbi->s_orphan_lock);
5323ac27a0ecSDave Kleikamp 
5324f7314a67SJason Yan 	ext4_fast_commit_init(sb);
5325aa75f4d3SHarshad Shirwadkar 
5326ac27a0ecSDave Kleikamp 	sb->s_root = NULL;
5327ac27a0ecSDave Kleikamp 
5328ac27a0ecSDave Kleikamp 	needs_recovery = (es->s_last_orphan != 0 ||
532902f310fcSJan Kara 			  ext4_has_feature_orphan_present(sb) ||
5330e2b911c5SDarrick J. Wong 			  ext4_has_feature_journal_needs_recovery(sb));
5331ac27a0ecSDave Kleikamp 
5332bc98a42cSDavid Howells 	if (ext4_has_feature_mmp(sb) && !sb_rdonly(sb))
5333c5e06d10SJohann Lombardi 		if (ext4_multi_mount_protect(sb, le64_to_cpu(es->s_mmp_block)))
533450460fe8SDarrick J. Wong 			goto failed_mount3a;
5335c5e06d10SJohann Lombardi 
5336ac27a0ecSDave Kleikamp 	/*
5337ac27a0ecSDave Kleikamp 	 * The first inode we look at is the journal inode.  Don't try
5338ac27a0ecSDave Kleikamp 	 * root first: it may be modified in the journal!
5339ac27a0ecSDave Kleikamp 	 */
5340e2b911c5SDarrick J. Wong 	if (!test_opt(sb, NOLOAD) && ext4_has_feature_journal(sb)) {
53419c1dd22dSJason Yan 		err = ext4_load_and_init_journal(sb, es, ctx);
53424753d8a2STheodore Ts'o 		if (err)
534350460fe8SDarrick J. Wong 			goto failed_mount3a;
5344bc98a42cSDavid Howells 	} else if (test_opt(sb, NOLOAD) && !sb_rdonly(sb) &&
5345e2b911c5SDarrick J. Wong 		   ext4_has_feature_journal_needs_recovery(sb)) {
5346b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "required journal recovery "
5347b31e1552SEric Sandeen 		       "suppressed and not mounted read-only");
534843bd6f1bSJason Yan 		goto failed_mount3a;
5349ac27a0ecSDave Kleikamp 	} else {
53501e381f60SDmitry Monakhov 		/* Nojournal mode, all journal mount options are illegal */
53511e381f60SDmitry Monakhov 		if (test_opt(sb, JOURNAL_ASYNC_COMMIT)) {
53521e381f60SDmitry Monakhov 			ext4_msg(sb, KERN_ERR, "can't mount with "
53531e381f60SDmitry Monakhov 				 "journal_async_commit, fs mounted w/o journal");
535443bd6f1bSJason Yan 			goto failed_mount3a;
53551e381f60SDmitry Monakhov 		}
535689481b5fSBaokun Li 
535789481b5fSBaokun Li 		if (test_opt2(sb, EXPLICIT_JOURNAL_CHECKSUM)) {
535889481b5fSBaokun Li 			ext4_msg(sb, KERN_ERR, "can't mount with "
535989481b5fSBaokun Li 				 "journal_checksum, fs mounted w/o journal");
536089481b5fSBaokun Li 			goto failed_mount3a;
536189481b5fSBaokun Li 		}
53621e381f60SDmitry Monakhov 		if (sbi->s_commit_interval != JBD2_DEFAULT_MAX_COMMIT_AGE*HZ) {
53631e381f60SDmitry Monakhov 			ext4_msg(sb, KERN_ERR, "can't mount with "
53641e381f60SDmitry Monakhov 				 "commit=%lu, fs mounted w/o journal",
53651e381f60SDmitry Monakhov 				 sbi->s_commit_interval / HZ);
536643bd6f1bSJason Yan 			goto failed_mount3a;
53671e381f60SDmitry Monakhov 		}
53681e381f60SDmitry Monakhov 		if (EXT4_MOUNT_DATA_FLAGS &
53691e381f60SDmitry Monakhov 		    (sbi->s_mount_opt ^ sbi->s_def_mount_opt)) {
53701e381f60SDmitry Monakhov 			ext4_msg(sb, KERN_ERR, "can't mount with "
53711e381f60SDmitry Monakhov 				 "data=, fs mounted w/o journal");
537243bd6f1bSJason Yan 			goto failed_mount3a;
53731e381f60SDmitry Monakhov 		}
537450b29d8fSDebabrata Banerjee 		sbi->s_def_mount_opt &= ~EXT4_MOUNT_JOURNAL_CHECKSUM;
53751e381f60SDmitry Monakhov 		clear_opt(sb, JOURNAL_CHECKSUM);
5376fd8c37ecSTheodore Ts'o 		clear_opt(sb, DATA_FLAGS);
5377995a3ed6SHarshad Shirwadkar 		clear_opt2(sb, JOURNAL_FAST_COMMIT);
53780390131bSFrank Mayhar 		sbi->s_journal = NULL;
53790390131bSFrank Mayhar 		needs_recovery = 0;
5380ac27a0ecSDave Kleikamp 	}
5381ac27a0ecSDave Kleikamp 
5382cdb7ee4cSTahsin Erdogan 	if (!test_opt(sb, NO_MBCACHE)) {
538347387409STahsin Erdogan 		sbi->s_ea_block_cache = ext4_xattr_create_cache();
538447387409STahsin Erdogan 		if (!sbi->s_ea_block_cache) {
5385cdb7ee4cSTahsin Erdogan 			ext4_msg(sb, KERN_ERR,
5386cdb7ee4cSTahsin Erdogan 				 "Failed to create ea_block_cache");
53879c191f70ST Makphaibulchoke 			goto failed_mount_wq;
53889c191f70ST Makphaibulchoke 		}
53899c191f70ST Makphaibulchoke 
5390dec214d0STahsin Erdogan 		if (ext4_has_feature_ea_inode(sb)) {
5391dec214d0STahsin Erdogan 			sbi->s_ea_inode_cache = ext4_xattr_create_cache();
5392dec214d0STahsin Erdogan 			if (!sbi->s_ea_inode_cache) {
5393dec214d0STahsin Erdogan 				ext4_msg(sb, KERN_ERR,
5394dec214d0STahsin Erdogan 					 "Failed to create ea_inode_cache");
5395dec214d0STahsin Erdogan 				goto failed_mount_wq;
5396dec214d0STahsin Erdogan 			}
5397dec214d0STahsin Erdogan 		}
5398cdb7ee4cSTahsin Erdogan 	}
5399dec214d0STahsin Erdogan 
5400fd89d5f2STejun Heo 	/*
5401952fc18eSTheodore Ts'o 	 * Get the # of file system overhead blocks from the
5402952fc18eSTheodore Ts'o 	 * superblock if present.
5403952fc18eSTheodore Ts'o 	 */
5404952fc18eSTheodore Ts'o 	sbi->s_overhead = le32_to_cpu(es->s_overhead_clusters);
540585d825dbSTheodore Ts'o 	/* ignore the precalculated value if it is ridiculous */
540685d825dbSTheodore Ts'o 	if (sbi->s_overhead > ext4_blocks_count(es))
540785d825dbSTheodore Ts'o 		sbi->s_overhead = 0;
540885d825dbSTheodore Ts'o 	/*
540985d825dbSTheodore Ts'o 	 * If the bigalloc feature is not enabled recalculating the
541085d825dbSTheodore Ts'o 	 * overhead doesn't take long, so we might as well just redo
541185d825dbSTheodore Ts'o 	 * it to make sure we are using the correct value.
541285d825dbSTheodore Ts'o 	 */
541385d825dbSTheodore Ts'o 	if (!ext4_has_feature_bigalloc(sb))
541485d825dbSTheodore Ts'o 		sbi->s_overhead = 0;
541585d825dbSTheodore Ts'o 	if (sbi->s_overhead == 0) {
541607aa2ea1SLukas Czerner 		err = ext4_calculate_overhead(sb);
541707aa2ea1SLukas Czerner 		if (err)
5418952fc18eSTheodore Ts'o 			goto failed_mount_wq;
5419952fc18eSTheodore Ts'o 	}
5420952fc18eSTheodore Ts'o 
5421952fc18eSTheodore Ts'o 	/*
5422fd89d5f2STejun Heo 	 * The maximum number of concurrent works can be high and
5423fd89d5f2STejun Heo 	 * concurrency isn't really necessary.  Limit it to 1.
5424fd89d5f2STejun Heo 	 */
54252e8fa54eSJan Kara 	EXT4_SB(sb)->rsv_conversion_wq =
54262e8fa54eSJan Kara 		alloc_workqueue("ext4-rsv-conversion", WQ_MEM_RECLAIM | WQ_UNBOUND, 1);
54272e8fa54eSJan Kara 	if (!EXT4_SB(sb)->rsv_conversion_wq) {
54282e8fa54eSJan Kara 		printk(KERN_ERR "EXT4-fs: failed to create workqueue\n");
542907aa2ea1SLukas Czerner 		ret = -ENOMEM;
54302e8fa54eSJan Kara 		goto failed_mount4;
54312e8fa54eSJan Kara 	}
54322e8fa54eSJan Kara 
5433ac27a0ecSDave Kleikamp 	/*
5434dab291afSMingming Cao 	 * The jbd2_journal_load will have done any necessary log recovery,
5435ac27a0ecSDave Kleikamp 	 * so we can safely mount the rest of the filesystem now.
5436ac27a0ecSDave Kleikamp 	 */
5437ac27a0ecSDave Kleikamp 
54388a363970STheodore Ts'o 	root = ext4_iget(sb, EXT4_ROOT_INO, EXT4_IGET_SPECIAL);
54391d1fe1eeSDavid Howells 	if (IS_ERR(root)) {
5440b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "get root inode failed");
54411d1fe1eeSDavid Howells 		ret = PTR_ERR(root);
544232a9bb57SManish Katiyar 		root = NULL;
5443ac27a0ecSDave Kleikamp 		goto failed_mount4;
5444ac27a0ecSDave Kleikamp 	}
5445ac27a0ecSDave Kleikamp 	if (!S_ISDIR(root->i_mode) || !root->i_blocks || !root->i_size) {
5446b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "corrupt root inode, run e2fsck");
544794bf608aSAl Viro 		iput(root);
5448ac27a0ecSDave Kleikamp 		goto failed_mount4;
5449ac27a0ecSDave Kleikamp 	}
5450b886ee3eSGabriel Krisman Bertazi 
545148fde701SAl Viro 	sb->s_root = d_make_root(root);
54521d1fe1eeSDavid Howells 	if (!sb->s_root) {
5453b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "get root dentry failed");
54541d1fe1eeSDavid Howells 		ret = -ENOMEM;
54551d1fe1eeSDavid Howells 		goto failed_mount4;
54561d1fe1eeSDavid Howells 	}
5457ac27a0ecSDave Kleikamp 
5458c89128a0SJaegeuk Kim 	ret = ext4_setup_super(sb, es, sb_rdonly(sb));
5459c89128a0SJaegeuk Kim 	if (ret == -EROFS) {
54601751e8a6SLinus Torvalds 		sb->s_flags |= SB_RDONLY;
5461c89128a0SJaegeuk Kim 		ret = 0;
5462c89128a0SJaegeuk Kim 	} else if (ret)
5463c89128a0SJaegeuk Kim 		goto failed_mount4a;
5464ef7f3835SKalpak Shah 
5465b5799018STheodore Ts'o 	ext4_set_resv_clusters(sb);
546627dd4385SLukas Czerner 
54670f5bde1dSJan Kara 	if (test_opt(sb, BLOCK_VALIDITY)) {
54686fd058f7STheodore Ts'o 		err = ext4_setup_system_zone(sb);
54696fd058f7STheodore Ts'o 		if (err) {
5470b31e1552SEric Sandeen 			ext4_msg(sb, KERN_ERR, "failed to initialize system "
5471fbe845ddSCurt Wohlgemuth 				 "zone (%d)", err);
5472f9ae9cf5STheodore Ts'o 			goto failed_mount4a;
5473f9ae9cf5STheodore Ts'o 		}
54740f5bde1dSJan Kara 	}
54758016e29fSHarshad Shirwadkar 	ext4_fc_replay_cleanup(sb);
5476f9ae9cf5STheodore Ts'o 
5477f9ae9cf5STheodore Ts'o 	ext4_ext_init(sb);
5478196e402aSHarshad Shirwadkar 
5479196e402aSHarshad Shirwadkar 	/*
5480196e402aSHarshad Shirwadkar 	 * Enable optimize_scan if number of groups is > threshold. This can be
5481196e402aSHarshad Shirwadkar 	 * turned off by passing "mb_optimize_scan=0". This can also be
5482196e402aSHarshad Shirwadkar 	 * turned on forcefully by passing "mb_optimize_scan=1".
5483196e402aSHarshad Shirwadkar 	 */
548427b38686SOjaswin Mujoo 	if (!(ctx->spec & EXT4_SPEC_mb_optimize_scan)) {
548527b38686SOjaswin Mujoo 		if (sbi->s_groups_count >= MB_DEFAULT_LINEAR_SCAN_THRESHOLD)
5486196e402aSHarshad Shirwadkar 			set_opt2(sb, MB_OPTIMIZE_SCAN);
548727b38686SOjaswin Mujoo 		else
5488196e402aSHarshad Shirwadkar 			clear_opt2(sb, MB_OPTIMIZE_SCAN);
548927b38686SOjaswin Mujoo 	}
5490196e402aSHarshad Shirwadkar 
5491f9ae9cf5STheodore Ts'o 	err = ext4_mb_init(sb);
5492f9ae9cf5STheodore Ts'o 	if (err) {
5493f9ae9cf5STheodore Ts'o 		ext4_msg(sb, KERN_ERR, "failed to initialize mballoc (%d)",
5494f9ae9cf5STheodore Ts'o 			 err);
5495dcf2d804STao Ma 		goto failed_mount5;
5496c2774d84SAneesh Kumar K.V 	}
5497c2774d84SAneesh Kumar K.V 
5498027f14f5STheodore Ts'o 	/*
5499027f14f5STheodore Ts'o 	 * We can only set up the journal commit callback once
5500027f14f5STheodore Ts'o 	 * mballoc is initialized
5501027f14f5STheodore Ts'o 	 */
5502027f14f5STheodore Ts'o 	if (sbi->s_journal)
5503027f14f5STheodore Ts'o 		sbi->s_journal->j_commit_callback =
5504027f14f5STheodore Ts'o 			ext4_journal_commit_callback;
5505027f14f5STheodore Ts'o 
55061f79467cSJason Yan 	if (ext4_percpu_param_init(sbi))
5507d5e03cbbSTheodore Ts'o 		goto failed_mount6;
5508d5e03cbbSTheodore Ts'o 
5509e2b911c5SDarrick J. Wong 	if (ext4_has_feature_flex_bg(sb))
5510d5e03cbbSTheodore Ts'o 		if (!ext4_fill_flex_info(sb)) {
5511d5e03cbbSTheodore Ts'o 			ext4_msg(sb, KERN_ERR,
5512d5e03cbbSTheodore Ts'o 			       "unable to initialize "
5513d5e03cbbSTheodore Ts'o 			       "flex_bg meta info!");
55148f6840c4SYang Yingliang 			ret = -ENOMEM;
5515d5e03cbbSTheodore Ts'o 			goto failed_mount6;
5516d5e03cbbSTheodore Ts'o 		}
5517d5e03cbbSTheodore Ts'o 
5518bfff6873SLukas Czerner 	err = ext4_register_li_request(sb, first_not_zeroed);
5519bfff6873SLukas Czerner 	if (err)
5520dcf2d804STao Ma 		goto failed_mount6;
5521bfff6873SLukas Czerner 
5522b5799018STheodore Ts'o 	err = ext4_register_sysfs(sb);
5523dcf2d804STao Ma 	if (err)
5524dcf2d804STao Ma 		goto failed_mount7;
55253197ebdbSTheodore Ts'o 
552602f310fcSJan Kara 	err = ext4_init_orphan_info(sb);
552702f310fcSJan Kara 	if (err)
552802f310fcSJan Kara 		goto failed_mount8;
55299b2ff357SJan Kara #ifdef CONFIG_QUOTA
55309b2ff357SJan Kara 	/* Enable quota usage during mount. */
5531bc98a42cSDavid Howells 	if (ext4_has_feature_quota(sb) && !sb_rdonly(sb)) {
55329b2ff357SJan Kara 		err = ext4_enable_quotas(sb);
55339b2ff357SJan Kara 		if (err)
553402f310fcSJan Kara 			goto failed_mount9;
55359b2ff357SJan Kara 	}
55369b2ff357SJan Kara #endif  /* CONFIG_QUOTA */
55379b2ff357SJan Kara 
5538bc71726cSzhangyi (F) 	/*
5539bc71726cSzhangyi (F) 	 * Save the original bdev mapping's wb_err value which could be
5540bc71726cSzhangyi (F) 	 * used to detect the metadata async write error.
5541bc71726cSzhangyi (F) 	 */
5542bc71726cSzhangyi (F) 	spin_lock_init(&sbi->s_bdev_wb_lock);
5543bc71726cSzhangyi (F) 	errseq_check_and_advance(&sb->s_bdev->bd_inode->i_mapping->wb_err,
5544bc71726cSzhangyi (F) 				 &sbi->s_bdev_wb_err);
5545bc71726cSzhangyi (F) 	sb->s_bdev->bd_super = sb;
5546617ba13bSMingming Cao 	EXT4_SB(sb)->s_mount_state |= EXT4_ORPHAN_FS;
5547617ba13bSMingming Cao 	ext4_orphan_cleanup(sb, es);
5548617ba13bSMingming Cao 	EXT4_SB(sb)->s_mount_state &= ~EXT4_ORPHAN_FS;
55499b6641ddSYe Bin 	/*
55509b6641ddSYe Bin 	 * Update the checksum after updating free space/inode counters and
55519b6641ddSYe Bin 	 * ext4_orphan_cleanup. Otherwise the superblock can have an incorrect
55529b6641ddSYe Bin 	 * checksum in the buffer cache until it is written out and
55539b6641ddSYe Bin 	 * e2fsprogs programs trying to open a file system immediately
55549b6641ddSYe Bin 	 * after it is mounted can fail.
55559b6641ddSYe Bin 	 */
55569b6641ddSYe Bin 	ext4_superblock_csum_set(sb);
55570390131bSFrank Mayhar 	if (needs_recovery) {
5558b31e1552SEric Sandeen 		ext4_msg(sb, KERN_INFO, "recovery complete");
555911215630SJan Kara 		err = ext4_mark_recovery_complete(sb, es);
556011215630SJan Kara 		if (err)
556102f310fcSJan Kara 			goto failed_mount9;
55620390131bSFrank Mayhar 	}
55630390131bSFrank Mayhar 
556470200574SChristoph Hellwig 	if (test_opt(sb, DISCARD) && !bdev_max_discard_sectors(sb->s_bdev))
556579add3a3SLukas Czerner 		ext4_msg(sb, KERN_WARNING,
556670200574SChristoph Hellwig 			 "mounting with \"discard\" option, but the device does not support discard");
556779add3a3SLukas Czerner 
556866e61a9eSTheodore Ts'o 	if (es->s_error_count)
556966e61a9eSTheodore Ts'o 		mod_timer(&sbi->s_err_report, jiffies + 300*HZ); /* 5 minutes */
5570ac27a0ecSDave Kleikamp 
5571efbed4dcSTheodore Ts'o 	/* Enable message ratelimiting. Default is 10 messages per 5 secs. */
5572efbed4dcSTheodore Ts'o 	ratelimit_state_init(&sbi->s_err_ratelimit_state, 5 * HZ, 10);
5573efbed4dcSTheodore Ts'o 	ratelimit_state_init(&sbi->s_warning_ratelimit_state, 5 * HZ, 10);
5574efbed4dcSTheodore Ts'o 	ratelimit_state_init(&sbi->s_msg_ratelimit_state, 5 * HZ, 10);
55751cf006edSDmitry Monakhov 	atomic_set(&sbi->s_warning_count, 0);
55761cf006edSDmitry Monakhov 	atomic_set(&sbi->s_msg_count, 0);
5577efbed4dcSTheodore Ts'o 
5578ac27a0ecSDave Kleikamp 	return 0;
5579ac27a0ecSDave Kleikamp 
558002f310fcSJan Kara failed_mount9:
558102f310fcSJan Kara 	ext4_release_orphan_info(sb);
558272ba7450STheodore Ts'o failed_mount8:
5583ebd173beSTheodore Ts'o 	ext4_unregister_sysfs(sb);
5584cb8d53d2SEric Biggers 	kobject_put(&sbi->s_kobj);
5585dcf2d804STao Ma failed_mount7:
5586dcf2d804STao Ma 	ext4_unregister_li_request(sb);
5587dcf2d804STao Ma failed_mount6:
5588f9ae9cf5STheodore Ts'o 	ext4_mb_release(sb);
5589dcbf8758SJason Yan 	ext4_flex_groups_free(sbi);
55901f79467cSJason Yan 	ext4_percpu_param_destroy(sbi);
559100764937SAzat Khuzhin failed_mount5:
5592f9ae9cf5STheodore Ts'o 	ext4_ext_release(sb);
5593f9ae9cf5STheodore Ts'o 	ext4_release_system_zone(sb);
5594f9ae9cf5STheodore Ts'o failed_mount4a:
559594bf608aSAl Viro 	dput(sb->s_root);
559632a9bb57SManish Katiyar 	sb->s_root = NULL;
559794bf608aSAl Viro failed_mount4:
5598b31e1552SEric Sandeen 	ext4_msg(sb, KERN_ERR, "mount failed");
55992e8fa54eSJan Kara 	if (EXT4_SB(sb)->rsv_conversion_wq)
56002e8fa54eSJan Kara 		destroy_workqueue(EXT4_SB(sb)->rsv_conversion_wq);
56014c0425ffSMingming Cao failed_mount_wq:
5602dec214d0STahsin Erdogan 	ext4_xattr_destroy_cache(sbi->s_ea_inode_cache);
5603dec214d0STahsin Erdogan 	sbi->s_ea_inode_cache = NULL;
560450c15df6SChengguang Xu 
560547387409STahsin Erdogan 	ext4_xattr_destroy_cache(sbi->s_ea_block_cache);
560647387409STahsin Erdogan 	sbi->s_ea_block_cache = NULL;
560750c15df6SChengguang Xu 
56080390131bSFrank Mayhar 	if (sbi->s_journal) {
5609bb9464e0Syangerkun 		/* flush s_error_work before journal destroy. */
5610bb9464e0Syangerkun 		flush_work(&sbi->s_error_work);
5611dab291afSMingming Cao 		jbd2_journal_destroy(sbi->s_journal);
561247b4a50bSJan Kara 		sbi->s_journal = NULL;
56130390131bSFrank Mayhar 	}
561450460fe8SDarrick J. Wong failed_mount3a:
5615d3922a77SZheng Liu 	ext4_es_unregister_shrinker(sbi);
5616eb68d0e2SZheng Liu failed_mount3:
5617bb9464e0Syangerkun 	/* flush s_error_work before sbi destroy */
5618c92dc856SJan Kara 	flush_work(&sbi->s_error_work);
56192a4ae3bcSJan Kara 	del_timer_sync(&sbi->s_err_report);
5620618f0031SPavel Skripkin 	ext4_stop_mmpd(sbi);
5621a4e6a511SJason Yan 	ext4_group_desc_free(sbi);
5622ac27a0ecSDave Kleikamp failed_mount:
56230441984aSDarrick J. Wong 	if (sbi->s_chksum_driver)
56240441984aSDarrick J. Wong 		crypto_free_shash(sbi->s_chksum_driver);
5625c83ad55eSGabriel Krisman Bertazi 
56265298d4bfSChristoph Hellwig #if IS_ENABLED(CONFIG_UNICODE)
5627f8f4acb6SDaniel Rosenberg 	utf8_unload(sb->s_encoding);
5628c83ad55eSGabriel Krisman Bertazi #endif
5629c83ad55eSGabriel Krisman Bertazi 
5630ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
5631a2d4a646SJan Kara 	for (i = 0; i < EXT4_MAXQUOTAS; i++)
56320ba33facSTheodore Ts'o 		kfree(get_qf_name(sb, sbi, i));
5633ac27a0ecSDave Kleikamp #endif
5634ac4acb1fSEric Biggers 	fscrypt_free_dummy_policy(&sbi->s_dummy_enc_policy);
5635afd09b61SAlexey Makhalov 	/* ext4_blkdev_remove() calls kill_bdev(), release bh before it. */
5636a7a79c29SJason Yan 	brelse(sbi->s_sbh);
5637afd09b61SAlexey Makhalov 	ext4_blkdev_remove(sbi);
5638ac27a0ecSDave Kleikamp out_fail:
5639ac27a0ecSDave Kleikamp 	sb->s_fs_info = NULL;
564007aa2ea1SLukas Czerner 	return err ? err : ret;
5641ac27a0ecSDave Kleikamp }
5642ac27a0ecSDave Kleikamp 
5643cebe85d5SLukas Czerner static int ext4_fill_super(struct super_block *sb, struct fs_context *fc)
56447edfd85bSLukas Czerner {
5645cebe85d5SLukas Czerner 	struct ext4_fs_context *ctx = fc->fs_private;
56467edfd85bSLukas Czerner 	struct ext4_sb_info *sbi;
56477edfd85bSLukas Czerner 	const char *descr;
5648cebe85d5SLukas Czerner 	int ret;
56497edfd85bSLukas Czerner 
5650cebe85d5SLukas Czerner 	sbi = ext4_alloc_sbi(sb);
5651cebe85d5SLukas Czerner 	if (!sbi)
56527c268d4cSLukas Czerner 		return -ENOMEM;
5653cebe85d5SLukas Czerner 
5654cebe85d5SLukas Czerner 	fc->s_fs_info = sbi;
56557edfd85bSLukas Czerner 
56567edfd85bSLukas Czerner 	/* Cleanup superblock name */
56577edfd85bSLukas Czerner 	strreplace(sb->s_id, '/', '!');
56587edfd85bSLukas Czerner 
56597edfd85bSLukas Czerner 	sbi->s_sb_block = 1;	/* Default super block location */
5660cebe85d5SLukas Czerner 	if (ctx->spec & EXT4_SPEC_s_sb_block)
5661cebe85d5SLukas Czerner 		sbi->s_sb_block = ctx->s_sb_block;
56627edfd85bSLukas Czerner 
5663960e0ab6SLukas Czerner 	ret = __ext4_fill_super(fc, sb);
56647edfd85bSLukas Czerner 	if (ret < 0)
56657edfd85bSLukas Czerner 		goto free_sbi;
56667edfd85bSLukas Czerner 
5667cebe85d5SLukas Czerner 	if (sbi->s_journal) {
56687edfd85bSLukas Czerner 		if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_JOURNAL_DATA)
56697edfd85bSLukas Czerner 			descr = " journalled data mode";
56707edfd85bSLukas Czerner 		else if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_ORDERED_DATA)
56717edfd85bSLukas Czerner 			descr = " ordered data mode";
56727edfd85bSLukas Czerner 		else
56737edfd85bSLukas Czerner 			descr = " writeback data mode";
56747edfd85bSLukas Czerner 	} else
56757edfd85bSLukas Czerner 		descr = "out journal";
56767edfd85bSLukas Czerner 
56777edfd85bSLukas Czerner 	if (___ratelimit(&ext4_mount_msg_ratelimit, "EXT4-fs mount"))
5678bb0fbc78SLukas Czerner 		ext4_msg(sb, KERN_INFO, "mounted filesystem %pU with%s. "
5679bb0fbc78SLukas Czerner 			 "Quota mode: %s.", &sb->s_uuid, descr,
5680bb0fbc78SLukas Czerner 			 ext4_quota_mode(sb));
56817edfd85bSLukas Czerner 
5682eb705421STheodore Ts'o 	/* Update the s_overhead_clusters if necessary */
5683827891a3STheodore Ts'o 	ext4_update_overhead(sb, false);
56847edfd85bSLukas Czerner 	return 0;
5685cebe85d5SLukas Czerner 
56867edfd85bSLukas Czerner free_sbi:
56877edfd85bSLukas Czerner 	ext4_free_sbi(sbi);
5688cebe85d5SLukas Czerner 	fc->s_fs_info = NULL;
56897edfd85bSLukas Czerner 	return ret;
56907edfd85bSLukas Czerner }
56917edfd85bSLukas Czerner 
5692cebe85d5SLukas Czerner static int ext4_get_tree(struct fs_context *fc)
5693cebe85d5SLukas Czerner {
5694cebe85d5SLukas Czerner 	return get_tree_bdev(fc, ext4_fill_super);
5695cebe85d5SLukas Czerner }
5696cebe85d5SLukas Czerner 
5697ac27a0ecSDave Kleikamp /*
5698ac27a0ecSDave Kleikamp  * Setup any per-fs journal parameters now.  We'll do this both on
5699ac27a0ecSDave Kleikamp  * initial mount, once the journal has been initialised but before we've
5700ac27a0ecSDave Kleikamp  * done any recovery; and again on any subsequent remount.
5701ac27a0ecSDave Kleikamp  */
5702617ba13bSMingming Cao static void ext4_init_journal_params(struct super_block *sb, journal_t *journal)
5703ac27a0ecSDave Kleikamp {
5704617ba13bSMingming Cao 	struct ext4_sb_info *sbi = EXT4_SB(sb);
5705ac27a0ecSDave Kleikamp 
5706ac27a0ecSDave Kleikamp 	journal->j_commit_interval = sbi->s_commit_interval;
570730773840STheodore Ts'o 	journal->j_min_batch_time = sbi->s_min_batch_time;
570830773840STheodore Ts'o 	journal->j_max_batch_time = sbi->s_max_batch_time;
57096866d7b3SHarshad Shirwadkar 	ext4_fc_init(sb, journal);
5710ac27a0ecSDave Kleikamp 
5711a931da6aSTheodore Ts'o 	write_lock(&journal->j_state_lock);
5712ac27a0ecSDave Kleikamp 	if (test_opt(sb, BARRIER))
5713dab291afSMingming Cao 		journal->j_flags |= JBD2_BARRIER;
5714ac27a0ecSDave Kleikamp 	else
5715dab291afSMingming Cao 		journal->j_flags &= ~JBD2_BARRIER;
57165bf5683aSHidehiro Kawai 	if (test_opt(sb, DATA_ERR_ABORT))
57175bf5683aSHidehiro Kawai 		journal->j_flags |= JBD2_ABORT_ON_SYNCDATA_ERR;
57185bf5683aSHidehiro Kawai 	else
57195bf5683aSHidehiro Kawai 		journal->j_flags &= ~JBD2_ABORT_ON_SYNCDATA_ERR;
5720a931da6aSTheodore Ts'o 	write_unlock(&journal->j_state_lock);
5721ac27a0ecSDave Kleikamp }
5722ac27a0ecSDave Kleikamp 
5723c6cb7e77SEric Whitney static struct inode *ext4_get_journal_inode(struct super_block *sb,
5724ac27a0ecSDave Kleikamp 					     unsigned int journal_inum)
5725ac27a0ecSDave Kleikamp {
5726ac27a0ecSDave Kleikamp 	struct inode *journal_inode;
5727ac27a0ecSDave Kleikamp 
5728c6cb7e77SEric Whitney 	/*
5729c6cb7e77SEric Whitney 	 * Test for the existence of a valid inode on disk.  Bad things
5730c6cb7e77SEric Whitney 	 * happen if we iget() an unused inode, as the subsequent iput()
5731c6cb7e77SEric Whitney 	 * will try to delete it.
5732c6cb7e77SEric Whitney 	 */
57338a363970STheodore Ts'o 	journal_inode = ext4_iget(sb, journal_inum, EXT4_IGET_SPECIAL);
57341d1fe1eeSDavid Howells 	if (IS_ERR(journal_inode)) {
5735b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "no journal found");
5736ac27a0ecSDave Kleikamp 		return NULL;
5737ac27a0ecSDave Kleikamp 	}
5738ac27a0ecSDave Kleikamp 	if (!journal_inode->i_nlink) {
5739ac27a0ecSDave Kleikamp 		make_bad_inode(journal_inode);
5740ac27a0ecSDave Kleikamp 		iput(journal_inode);
5741b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "journal inode is deleted");
5742ac27a0ecSDave Kleikamp 		return NULL;
5743ac27a0ecSDave Kleikamp 	}
5744ac27a0ecSDave Kleikamp 
57454978c659SJan Kara 	ext4_debug("Journal inode found at %p: %lld bytes\n",
5746ac27a0ecSDave Kleikamp 		  journal_inode, journal_inode->i_size);
5747105c78e1SEric Biggers 	if (!S_ISREG(journal_inode->i_mode) || IS_ENCRYPTED(journal_inode)) {
5748b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "invalid journal inode");
5749ac27a0ecSDave Kleikamp 		iput(journal_inode);
5750ac27a0ecSDave Kleikamp 		return NULL;
5751ac27a0ecSDave Kleikamp 	}
5752c6cb7e77SEric Whitney 	return journal_inode;
5753c6cb7e77SEric Whitney }
5754c6cb7e77SEric Whitney 
575562913ae9STheodore Ts'o static int ext4_journal_bmap(journal_t *journal, sector_t *block)
575662913ae9STheodore Ts'o {
575762913ae9STheodore Ts'o 	struct ext4_map_blocks map;
575862913ae9STheodore Ts'o 	int ret;
575962913ae9STheodore Ts'o 
576062913ae9STheodore Ts'o 	if (journal->j_inode == NULL)
576162913ae9STheodore Ts'o 		return 0;
576262913ae9STheodore Ts'o 
576362913ae9STheodore Ts'o 	map.m_lblk = *block;
576462913ae9STheodore Ts'o 	map.m_len = 1;
576562913ae9STheodore Ts'o 	ret = ext4_map_blocks(NULL, journal->j_inode, &map, 0);
576662913ae9STheodore Ts'o 	if (ret <= 0) {
576762913ae9STheodore Ts'o 		ext4_msg(journal->j_inode->i_sb, KERN_CRIT,
576862913ae9STheodore Ts'o 			 "journal bmap failed: block %llu ret %d\n",
576962913ae9STheodore Ts'o 			 *block, ret);
577062913ae9STheodore Ts'o 		jbd2_journal_abort(journal, ret ? ret : -EIO);
577162913ae9STheodore Ts'o 		return ret;
577262913ae9STheodore Ts'o 	}
577362913ae9STheodore Ts'o 	*block = map.m_pblk;
577462913ae9STheodore Ts'o 	return 0;
577562913ae9STheodore Ts'o }
577662913ae9STheodore Ts'o 
5777c6cb7e77SEric Whitney static journal_t *ext4_get_journal(struct super_block *sb,
5778c6cb7e77SEric Whitney 				   unsigned int journal_inum)
5779c6cb7e77SEric Whitney {
5780c6cb7e77SEric Whitney 	struct inode *journal_inode;
5781c6cb7e77SEric Whitney 	journal_t *journal;
5782c6cb7e77SEric Whitney 
578311215630SJan Kara 	if (WARN_ON_ONCE(!ext4_has_feature_journal(sb)))
578411215630SJan Kara 		return NULL;
5785c6cb7e77SEric Whitney 
5786c6cb7e77SEric Whitney 	journal_inode = ext4_get_journal_inode(sb, journal_inum);
5787c6cb7e77SEric Whitney 	if (!journal_inode)
5788c6cb7e77SEric Whitney 		return NULL;
5789ac27a0ecSDave Kleikamp 
5790dab291afSMingming Cao 	journal = jbd2_journal_init_inode(journal_inode);
5791ac27a0ecSDave Kleikamp 	if (!journal) {
5792b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "Could not load journal inode");
5793ac27a0ecSDave Kleikamp 		iput(journal_inode);
5794ac27a0ecSDave Kleikamp 		return NULL;
5795ac27a0ecSDave Kleikamp 	}
5796ac27a0ecSDave Kleikamp 	journal->j_private = sb;
579762913ae9STheodore Ts'o 	journal->j_bmap = ext4_journal_bmap;
5798617ba13bSMingming Cao 	ext4_init_journal_params(sb, journal);
5799ac27a0ecSDave Kleikamp 	return journal;
5800ac27a0ecSDave Kleikamp }
5801ac27a0ecSDave Kleikamp 
5802617ba13bSMingming Cao static journal_t *ext4_get_dev_journal(struct super_block *sb,
5803ac27a0ecSDave Kleikamp 				       dev_t j_dev)
5804ac27a0ecSDave Kleikamp {
5805ac27a0ecSDave Kleikamp 	struct buffer_head *bh;
5806ac27a0ecSDave Kleikamp 	journal_t *journal;
5807617ba13bSMingming Cao 	ext4_fsblk_t start;
5808617ba13bSMingming Cao 	ext4_fsblk_t len;
5809ac27a0ecSDave Kleikamp 	int hblock, blocksize;
5810617ba13bSMingming Cao 	ext4_fsblk_t sb_block;
5811ac27a0ecSDave Kleikamp 	unsigned long offset;
5812617ba13bSMingming Cao 	struct ext4_super_block *es;
5813ac27a0ecSDave Kleikamp 	struct block_device *bdev;
5814ac27a0ecSDave Kleikamp 
581511215630SJan Kara 	if (WARN_ON_ONCE(!ext4_has_feature_journal(sb)))
581611215630SJan Kara 		return NULL;
58170390131bSFrank Mayhar 
5818b31e1552SEric Sandeen 	bdev = ext4_blkdev_get(j_dev, sb);
5819ac27a0ecSDave Kleikamp 	if (bdev == NULL)
5820ac27a0ecSDave Kleikamp 		return NULL;
5821ac27a0ecSDave Kleikamp 
5822ac27a0ecSDave Kleikamp 	blocksize = sb->s_blocksize;
5823e1defc4fSMartin K. Petersen 	hblock = bdev_logical_block_size(bdev);
5824ac27a0ecSDave Kleikamp 	if (blocksize < hblock) {
5825b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR,
5826b31e1552SEric Sandeen 			"blocksize too small for journal device");
5827ac27a0ecSDave Kleikamp 		goto out_bdev;
5828ac27a0ecSDave Kleikamp 	}
5829ac27a0ecSDave Kleikamp 
5830617ba13bSMingming Cao 	sb_block = EXT4_MIN_BLOCK_SIZE / blocksize;
5831617ba13bSMingming Cao 	offset = EXT4_MIN_BLOCK_SIZE % blocksize;
5832ac27a0ecSDave Kleikamp 	set_blocksize(bdev, blocksize);
5833ac27a0ecSDave Kleikamp 	if (!(bh = __bread(bdev, sb_block, blocksize))) {
5834b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "couldn't read superblock of "
5835b31e1552SEric Sandeen 		       "external journal");
5836ac27a0ecSDave Kleikamp 		goto out_bdev;
5837ac27a0ecSDave Kleikamp 	}
5838ac27a0ecSDave Kleikamp 
58392716b802STheodore Ts'o 	es = (struct ext4_super_block *) (bh->b_data + offset);
5840617ba13bSMingming Cao 	if ((le16_to_cpu(es->s_magic) != EXT4_SUPER_MAGIC) ||
5841ac27a0ecSDave Kleikamp 	    !(le32_to_cpu(es->s_feature_incompat) &
5842617ba13bSMingming Cao 	      EXT4_FEATURE_INCOMPAT_JOURNAL_DEV)) {
5843b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "external journal has "
5844b31e1552SEric Sandeen 					"bad superblock");
5845ac27a0ecSDave Kleikamp 		brelse(bh);
5846ac27a0ecSDave Kleikamp 		goto out_bdev;
5847ac27a0ecSDave Kleikamp 	}
5848ac27a0ecSDave Kleikamp 
5849df4763beSDarrick J. Wong 	if ((le32_to_cpu(es->s_feature_ro_compat) &
5850df4763beSDarrick J. Wong 	     EXT4_FEATURE_RO_COMPAT_METADATA_CSUM) &&
5851df4763beSDarrick J. Wong 	    es->s_checksum != ext4_superblock_csum(sb, es)) {
5852df4763beSDarrick J. Wong 		ext4_msg(sb, KERN_ERR, "external journal has "
5853df4763beSDarrick J. Wong 				       "corrupt superblock");
5854df4763beSDarrick J. Wong 		brelse(bh);
5855df4763beSDarrick J. Wong 		goto out_bdev;
5856df4763beSDarrick J. Wong 	}
5857df4763beSDarrick J. Wong 
5858617ba13bSMingming Cao 	if (memcmp(EXT4_SB(sb)->s_es->s_journal_uuid, es->s_uuid, 16)) {
5859b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "journal UUID does not match");
5860ac27a0ecSDave Kleikamp 		brelse(bh);
5861ac27a0ecSDave Kleikamp 		goto out_bdev;
5862ac27a0ecSDave Kleikamp 	}
5863ac27a0ecSDave Kleikamp 
5864bd81d8eeSLaurent Vivier 	len = ext4_blocks_count(es);
5865ac27a0ecSDave Kleikamp 	start = sb_block + 1;
5866ac27a0ecSDave Kleikamp 	brelse(bh);	/* we're done with the superblock */
5867ac27a0ecSDave Kleikamp 
5868dab291afSMingming Cao 	journal = jbd2_journal_init_dev(bdev, sb->s_bdev,
5869ac27a0ecSDave Kleikamp 					start, len, blocksize);
5870ac27a0ecSDave Kleikamp 	if (!journal) {
5871b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "failed to create device journal");
5872ac27a0ecSDave Kleikamp 		goto out_bdev;
5873ac27a0ecSDave Kleikamp 	}
5874ac27a0ecSDave Kleikamp 	journal->j_private = sb;
58752d069c08Szhangyi (F) 	if (ext4_read_bh_lock(journal->j_sb_buffer, REQ_META | REQ_PRIO, true)) {
5876b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "I/O error on journal device");
5877ac27a0ecSDave Kleikamp 		goto out_journal;
5878ac27a0ecSDave Kleikamp 	}
5879ac27a0ecSDave Kleikamp 	if (be32_to_cpu(journal->j_superblock->s_nr_users) != 1) {
5880b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "External journal has more than one "
5881b31e1552SEric Sandeen 					"user (unsupported) - %d",
5882ac27a0ecSDave Kleikamp 			be32_to_cpu(journal->j_superblock->s_nr_users));
5883ac27a0ecSDave Kleikamp 		goto out_journal;
5884ac27a0ecSDave Kleikamp 	}
5885ee7ed3aaSChunguang Xu 	EXT4_SB(sb)->s_journal_bdev = bdev;
5886617ba13bSMingming Cao 	ext4_init_journal_params(sb, journal);
5887ac27a0ecSDave Kleikamp 	return journal;
58880b8e58a1SAndreas Dilger 
5889ac27a0ecSDave Kleikamp out_journal:
5890dab291afSMingming Cao 	jbd2_journal_destroy(journal);
5891ac27a0ecSDave Kleikamp out_bdev:
5892617ba13bSMingming Cao 	ext4_blkdev_put(bdev);
5893ac27a0ecSDave Kleikamp 	return NULL;
5894ac27a0ecSDave Kleikamp }
5895ac27a0ecSDave Kleikamp 
5896617ba13bSMingming Cao static int ext4_load_journal(struct super_block *sb,
5897617ba13bSMingming Cao 			     struct ext4_super_block *es,
5898ac27a0ecSDave Kleikamp 			     unsigned long journal_devnum)
5899ac27a0ecSDave Kleikamp {
5900ac27a0ecSDave Kleikamp 	journal_t *journal;
5901ac27a0ecSDave Kleikamp 	unsigned int journal_inum = le32_to_cpu(es->s_journal_inum);
5902ac27a0ecSDave Kleikamp 	dev_t journal_dev;
5903ac27a0ecSDave Kleikamp 	int err = 0;
5904ac27a0ecSDave Kleikamp 	int really_read_only;
5905273108faSLukas Czerner 	int journal_dev_ro;
5906ac27a0ecSDave Kleikamp 
590711215630SJan Kara 	if (WARN_ON_ONCE(!ext4_has_feature_journal(sb)))
590811215630SJan Kara 		return -EFSCORRUPTED;
59090390131bSFrank Mayhar 
5910ac27a0ecSDave Kleikamp 	if (journal_devnum &&
5911ac27a0ecSDave Kleikamp 	    journal_devnum != le32_to_cpu(es->s_journal_dev)) {
5912b31e1552SEric Sandeen 		ext4_msg(sb, KERN_INFO, "external journal device major/minor "
5913b31e1552SEric Sandeen 			"numbers have changed");
5914ac27a0ecSDave Kleikamp 		journal_dev = new_decode_dev(journal_devnum);
5915ac27a0ecSDave Kleikamp 	} else
5916ac27a0ecSDave Kleikamp 		journal_dev = new_decode_dev(le32_to_cpu(es->s_journal_dev));
5917ac27a0ecSDave Kleikamp 
5918273108faSLukas Czerner 	if (journal_inum && journal_dev) {
5919273108faSLukas Czerner 		ext4_msg(sb, KERN_ERR,
5920273108faSLukas Czerner 			 "filesystem has both journal inode and journal device!");
5921273108faSLukas Czerner 		return -EINVAL;
5922273108faSLukas Czerner 	}
5923273108faSLukas Czerner 
5924273108faSLukas Czerner 	if (journal_inum) {
5925273108faSLukas Czerner 		journal = ext4_get_journal(sb, journal_inum);
5926273108faSLukas Czerner 		if (!journal)
5927273108faSLukas Czerner 			return -EINVAL;
5928273108faSLukas Czerner 	} else {
5929273108faSLukas Czerner 		journal = ext4_get_dev_journal(sb, journal_dev);
5930273108faSLukas Czerner 		if (!journal)
5931273108faSLukas Czerner 			return -EINVAL;
5932273108faSLukas Czerner 	}
5933273108faSLukas Czerner 
5934273108faSLukas Czerner 	journal_dev_ro = bdev_read_only(journal->j_dev);
5935273108faSLukas Czerner 	really_read_only = bdev_read_only(sb->s_bdev) | journal_dev_ro;
5936273108faSLukas Czerner 
5937273108faSLukas Czerner 	if (journal_dev_ro && !sb_rdonly(sb)) {
5938273108faSLukas Czerner 		ext4_msg(sb, KERN_ERR,
5939273108faSLukas Czerner 			 "journal device read-only, try mounting with '-o ro'");
5940273108faSLukas Czerner 		err = -EROFS;
5941273108faSLukas Czerner 		goto err_out;
5942273108faSLukas Czerner 	}
5943ac27a0ecSDave Kleikamp 
5944ac27a0ecSDave Kleikamp 	/*
5945ac27a0ecSDave Kleikamp 	 * Are we loading a blank journal or performing recovery after a
5946ac27a0ecSDave Kleikamp 	 * crash?  For recovery, we need to check in advance whether we
5947ac27a0ecSDave Kleikamp 	 * can get read-write access to the device.
5948ac27a0ecSDave Kleikamp 	 */
5949e2b911c5SDarrick J. Wong 	if (ext4_has_feature_journal_needs_recovery(sb)) {
5950bc98a42cSDavid Howells 		if (sb_rdonly(sb)) {
5951b31e1552SEric Sandeen 			ext4_msg(sb, KERN_INFO, "INFO: recovery "
5952b31e1552SEric Sandeen 					"required on readonly filesystem");
5953ac27a0ecSDave Kleikamp 			if (really_read_only) {
5954b31e1552SEric Sandeen 				ext4_msg(sb, KERN_ERR, "write access "
5955d98bf8cdSSimon Ruderich 					"unavailable, cannot proceed "
5956d98bf8cdSSimon Ruderich 					"(try mounting with noload)");
5957273108faSLukas Czerner 				err = -EROFS;
5958273108faSLukas Czerner 				goto err_out;
5959ac27a0ecSDave Kleikamp 			}
5960b31e1552SEric Sandeen 			ext4_msg(sb, KERN_INFO, "write access will "
5961b31e1552SEric Sandeen 			       "be enabled during recovery");
5962ac27a0ecSDave Kleikamp 		}
5963ac27a0ecSDave Kleikamp 	}
5964ac27a0ecSDave Kleikamp 
596590576c0bSTheodore Ts'o 	if (!(journal->j_flags & JBD2_BARRIER))
5966b31e1552SEric Sandeen 		ext4_msg(sb, KERN_INFO, "barriers disabled");
59674776004fSTheodore Ts'o 
5968e2b911c5SDarrick J. Wong 	if (!ext4_has_feature_journal_needs_recovery(sb))
5969dab291afSMingming Cao 		err = jbd2_journal_wipe(journal, !really_read_only);
59701c13d5c0STheodore Ts'o 	if (!err) {
59711c13d5c0STheodore Ts'o 		char *save = kmalloc(EXT4_S_ERR_LEN, GFP_KERNEL);
5972eee00237SYe Bin 
59731c13d5c0STheodore Ts'o 		if (save)
59741c13d5c0STheodore Ts'o 			memcpy(save, ((char *) es) +
59751c13d5c0STheodore Ts'o 			       EXT4_S_ERR_START, EXT4_S_ERR_LEN);
5976dab291afSMingming Cao 		err = jbd2_journal_load(journal);
59771c13d5c0STheodore Ts'o 		if (save)
59781c13d5c0STheodore Ts'o 			memcpy(((char *) es) + EXT4_S_ERR_START,
59791c13d5c0STheodore Ts'o 			       save, EXT4_S_ERR_LEN);
59801c13d5c0STheodore Ts'o 		kfree(save);
5981eee00237SYe Bin 		es->s_state |= cpu_to_le16(EXT4_SB(sb)->s_mount_state &
5982eee00237SYe Bin 					   EXT4_ERROR_FS);
5983eee00237SYe Bin 		/* Write out restored error information to the superblock */
5984eee00237SYe Bin 		if (!bdev_read_only(sb->s_bdev)) {
5985eee00237SYe Bin 			int err2;
5986eee00237SYe Bin 			err2 = ext4_commit_super(sb);
5987eee00237SYe Bin 			err = err ? : err2;
5988eee00237SYe Bin 		}
59891c13d5c0STheodore Ts'o 	}
5990ac27a0ecSDave Kleikamp 
5991ac27a0ecSDave Kleikamp 	if (err) {
5992b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "error loading journal");
5993273108faSLukas Czerner 		goto err_out;
5994ac27a0ecSDave Kleikamp 	}
5995ac27a0ecSDave Kleikamp 
5996617ba13bSMingming Cao 	EXT4_SB(sb)->s_journal = journal;
599711215630SJan Kara 	err = ext4_clear_journal_err(sb, es);
599811215630SJan Kara 	if (err) {
599911215630SJan Kara 		EXT4_SB(sb)->s_journal = NULL;
600011215630SJan Kara 		jbd2_journal_destroy(journal);
600111215630SJan Kara 		return err;
600211215630SJan Kara 	}
6003ac27a0ecSDave Kleikamp 
6004c41303ceSMaciej Żenczykowski 	if (!really_read_only && journal_devnum &&
6005ac27a0ecSDave Kleikamp 	    journal_devnum != le32_to_cpu(es->s_journal_dev)) {
6006ac27a0ecSDave Kleikamp 		es->s_journal_dev = cpu_to_le32(journal_devnum);
60073039d8b8SBaokun Li 		ext4_commit_super(sb);
60083039d8b8SBaokun Li 	}
60093039d8b8SBaokun Li 	if (!really_read_only && journal_inum &&
60103039d8b8SBaokun Li 	    journal_inum != le32_to_cpu(es->s_journal_inum)) {
60113039d8b8SBaokun Li 		es->s_journal_inum = cpu_to_le32(journal_inum);
60124392fbc4SJan Kara 		ext4_commit_super(sb);
6013ac27a0ecSDave Kleikamp 	}
6014ac27a0ecSDave Kleikamp 
6015ac27a0ecSDave Kleikamp 	return 0;
6016273108faSLukas Czerner 
6017273108faSLukas Czerner err_out:
6018273108faSLukas Czerner 	jbd2_journal_destroy(journal);
6019273108faSLukas Czerner 	return err;
6020ac27a0ecSDave Kleikamp }
6021ac27a0ecSDave Kleikamp 
60222d01ddc8SJan Kara /* Copy state of EXT4_SB(sb) into buffer for on-disk superblock */
60232d01ddc8SJan Kara static void ext4_update_super(struct super_block *sb)
6024ac27a0ecSDave Kleikamp {
6025c92dc856SJan Kara 	struct ext4_sb_info *sbi = EXT4_SB(sb);
6026e92ad03fSJan Kara 	struct ext4_super_block *es = sbi->s_es;
6027e92ad03fSJan Kara 	struct buffer_head *sbh = sbi->s_sbh;
6028ac27a0ecSDave Kleikamp 
602905c2c00fSJan Kara 	lock_buffer(sbh);
6030a17712c8SJon Derrick 	/*
603171290b36STheodore Ts'o 	 * If the file system is mounted read-only, don't update the
603271290b36STheodore Ts'o 	 * superblock write time.  This avoids updating the superblock
603371290b36STheodore Ts'o 	 * write time when we are mounting the root file system
603471290b36STheodore Ts'o 	 * read/only but we need to replay the journal; at that point,
603571290b36STheodore Ts'o 	 * for people who are east of GMT and who make their clock
603671290b36STheodore Ts'o 	 * tick in localtime for Windows bug-for-bug compatibility,
603771290b36STheodore Ts'o 	 * the clock is set in the future, and this will cause e2fsck
603871290b36STheodore Ts'o 	 * to complain and force a full file system check.
603971290b36STheodore Ts'o 	 */
60401751e8a6SLinus Torvalds 	if (!(sb->s_flags & SB_RDONLY))
60416a0678a7SArnd Bergmann 		ext4_update_tstamp(es, s_wtime);
6042afc32f7eSTheodore Ts'o 	es->s_kbytes_written =
6043e92ad03fSJan Kara 		cpu_to_le64(sbi->s_kbytes_written +
60448446fe92SChristoph Hellwig 		    ((part_stat_read(sb->s_bdev, sectors[STAT_WRITE]) -
6045e92ad03fSJan Kara 		      sbi->s_sectors_written_start) >> 1));
6046e92ad03fSJan Kara 	if (percpu_counter_initialized(&sbi->s_freeclusters_counter))
604757042651STheodore Ts'o 		ext4_free_blocks_count_set(es,
6048e92ad03fSJan Kara 			EXT4_C2B(sbi, percpu_counter_sum_positive(
6049e92ad03fSJan Kara 				&sbi->s_freeclusters_counter)));
6050e92ad03fSJan Kara 	if (percpu_counter_initialized(&sbi->s_freeinodes_counter))
60517f93cff9STheodore Ts'o 		es->s_free_inodes_count =
60527f93cff9STheodore Ts'o 			cpu_to_le32(percpu_counter_sum_positive(
6053e92ad03fSJan Kara 				&sbi->s_freeinodes_counter));
6054c92dc856SJan Kara 	/* Copy error information to the on-disk superblock */
6055c92dc856SJan Kara 	spin_lock(&sbi->s_error_lock);
6056c92dc856SJan Kara 	if (sbi->s_add_error_count > 0) {
6057c92dc856SJan Kara 		es->s_state |= cpu_to_le16(EXT4_ERROR_FS);
6058c92dc856SJan Kara 		if (!es->s_first_error_time && !es->s_first_error_time_hi) {
6059c92dc856SJan Kara 			__ext4_update_tstamp(&es->s_first_error_time,
6060c92dc856SJan Kara 					     &es->s_first_error_time_hi,
6061c92dc856SJan Kara 					     sbi->s_first_error_time);
6062c92dc856SJan Kara 			strncpy(es->s_first_error_func, sbi->s_first_error_func,
6063c92dc856SJan Kara 				sizeof(es->s_first_error_func));
6064c92dc856SJan Kara 			es->s_first_error_line =
6065c92dc856SJan Kara 				cpu_to_le32(sbi->s_first_error_line);
6066c92dc856SJan Kara 			es->s_first_error_ino =
6067c92dc856SJan Kara 				cpu_to_le32(sbi->s_first_error_ino);
6068c92dc856SJan Kara 			es->s_first_error_block =
6069c92dc856SJan Kara 				cpu_to_le64(sbi->s_first_error_block);
6070c92dc856SJan Kara 			es->s_first_error_errcode =
6071c92dc856SJan Kara 				ext4_errno_to_code(sbi->s_first_error_code);
6072c92dc856SJan Kara 		}
6073c92dc856SJan Kara 		__ext4_update_tstamp(&es->s_last_error_time,
6074c92dc856SJan Kara 				     &es->s_last_error_time_hi,
6075c92dc856SJan Kara 				     sbi->s_last_error_time);
6076c92dc856SJan Kara 		strncpy(es->s_last_error_func, sbi->s_last_error_func,
6077c92dc856SJan Kara 			sizeof(es->s_last_error_func));
6078c92dc856SJan Kara 		es->s_last_error_line = cpu_to_le32(sbi->s_last_error_line);
6079c92dc856SJan Kara 		es->s_last_error_ino = cpu_to_le32(sbi->s_last_error_ino);
6080c92dc856SJan Kara 		es->s_last_error_block = cpu_to_le64(sbi->s_last_error_block);
6081c92dc856SJan Kara 		es->s_last_error_errcode =
6082c92dc856SJan Kara 				ext4_errno_to_code(sbi->s_last_error_code);
6083c92dc856SJan Kara 		/*
6084c92dc856SJan Kara 		 * Start the daily error reporting function if it hasn't been
6085c92dc856SJan Kara 		 * started already
6086c92dc856SJan Kara 		 */
6087c92dc856SJan Kara 		if (!es->s_error_count)
6088c92dc856SJan Kara 			mod_timer(&sbi->s_err_report, jiffies + 24*60*60*HZ);
6089c92dc856SJan Kara 		le32_add_cpu(&es->s_error_count, sbi->s_add_error_count);
6090c92dc856SJan Kara 		sbi->s_add_error_count = 0;
6091c92dc856SJan Kara 	}
6092c92dc856SJan Kara 	spin_unlock(&sbi->s_error_lock);
6093c92dc856SJan Kara 
609406db49e6STheodore Ts'o 	ext4_superblock_csum_set(sb);
60952d01ddc8SJan Kara 	unlock_buffer(sbh);
60962d01ddc8SJan Kara }
60972d01ddc8SJan Kara 
60982d01ddc8SJan Kara static int ext4_commit_super(struct super_block *sb)
60992d01ddc8SJan Kara {
61002d01ddc8SJan Kara 	struct buffer_head *sbh = EXT4_SB(sb)->s_sbh;
61012d01ddc8SJan Kara 
6102f88f1466SFengnan Chang 	if (!sbh)
6103f88f1466SFengnan Chang 		return -EINVAL;
6104f88f1466SFengnan Chang 	if (block_device_ejected(sb))
6105f88f1466SFengnan Chang 		return -ENODEV;
61062d01ddc8SJan Kara 
61072d01ddc8SJan Kara 	ext4_update_super(sb);
61082d01ddc8SJan Kara 
610915baa7dcSZhang Yi 	lock_buffer(sbh);
611015baa7dcSZhang Yi 	/* Buffer got discarded which means block device got invalidated */
611115baa7dcSZhang Yi 	if (!buffer_mapped(sbh)) {
611215baa7dcSZhang Yi 		unlock_buffer(sbh);
611315baa7dcSZhang Yi 		return -EIO;
611415baa7dcSZhang Yi 	}
611515baa7dcSZhang Yi 
6116e8680786STheodore Ts'o 	if (buffer_write_io_error(sbh) || !buffer_uptodate(sbh)) {
61174743f839SPranay Kr. Srivastava 		/*
61184743f839SPranay Kr. Srivastava 		 * Oh, dear.  A previous attempt to write the
61194743f839SPranay Kr. Srivastava 		 * superblock failed.  This could happen because the
61204743f839SPranay Kr. Srivastava 		 * USB device was yanked out.  Or it could happen to
61214743f839SPranay Kr. Srivastava 		 * be a transient write error and maybe the block will
61224743f839SPranay Kr. Srivastava 		 * be remapped.  Nothing we can do but to retry the
61234743f839SPranay Kr. Srivastava 		 * write and hope for the best.
61244743f839SPranay Kr. Srivastava 		 */
61254743f839SPranay Kr. Srivastava 		ext4_msg(sb, KERN_ERR, "previous I/O error to "
61264743f839SPranay Kr. Srivastava 		       "superblock detected");
61274743f839SPranay Kr. Srivastava 		clear_buffer_write_io_error(sbh);
61284743f839SPranay Kr. Srivastava 		set_buffer_uptodate(sbh);
61294743f839SPranay Kr. Srivastava 	}
613015baa7dcSZhang Yi 	get_bh(sbh);
613115baa7dcSZhang Yi 	/* Clear potential dirty bit if it was journalled update */
613215baa7dcSZhang Yi 	clear_buffer_dirty(sbh);
613315baa7dcSZhang Yi 	sbh->b_end_io = end_buffer_write_sync;
61341420c4a5SBart Van Assche 	submit_bh(REQ_OP_WRITE | REQ_SYNC |
61351420c4a5SBart Van Assche 		  (test_opt(sb, BARRIER) ? REQ_FUA : 0), sbh);
613615baa7dcSZhang Yi 	wait_on_buffer(sbh);
6137c89128a0SJaegeuk Kim 	if (buffer_write_io_error(sbh)) {
6138b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "I/O error while writing "
6139b31e1552SEric Sandeen 		       "superblock");
6140914258bfSTheodore Ts'o 		clear_buffer_write_io_error(sbh);
6141914258bfSTheodore Ts'o 		set_buffer_uptodate(sbh);
614215baa7dcSZhang Yi 		return -EIO;
6143914258bfSTheodore Ts'o 	}
614415baa7dcSZhang Yi 	return 0;
6145ac27a0ecSDave Kleikamp }
6146ac27a0ecSDave Kleikamp 
6147ac27a0ecSDave Kleikamp /*
6148ac27a0ecSDave Kleikamp  * Have we just finished recovery?  If so, and if we are mounting (or
6149ac27a0ecSDave Kleikamp  * remounting) the filesystem readonly, then we will end up with a
6150ac27a0ecSDave Kleikamp  * consistent fs on disk.  Record that fact.
6151ac27a0ecSDave Kleikamp  */
615211215630SJan Kara static int ext4_mark_recovery_complete(struct super_block *sb,
6153617ba13bSMingming Cao 				       struct ext4_super_block *es)
6154ac27a0ecSDave Kleikamp {
615511215630SJan Kara 	int err;
6156617ba13bSMingming Cao 	journal_t *journal = EXT4_SB(sb)->s_journal;
6157ac27a0ecSDave Kleikamp 
6158e2b911c5SDarrick J. Wong 	if (!ext4_has_feature_journal(sb)) {
615911215630SJan Kara 		if (journal != NULL) {
616011215630SJan Kara 			ext4_error(sb, "Journal got removed while the fs was "
616111215630SJan Kara 				   "mounted!");
616211215630SJan Kara 			return -EFSCORRUPTED;
616311215630SJan Kara 		}
616411215630SJan Kara 		return 0;
61650390131bSFrank Mayhar 	}
6166dab291afSMingming Cao 	jbd2_journal_lock_updates(journal);
616701d5d965SLeah Rumancik 	err = jbd2_journal_flush(journal, 0);
616811215630SJan Kara 	if (err < 0)
61697ffe1ea8SHidehiro Kawai 		goto out;
61707ffe1ea8SHidehiro Kawai 
617102f310fcSJan Kara 	if (sb_rdonly(sb) && (ext4_has_feature_journal_needs_recovery(sb) ||
617202f310fcSJan Kara 	    ext4_has_feature_orphan_present(sb))) {
617302f310fcSJan Kara 		if (!ext4_orphan_file_empty(sb)) {
617402f310fcSJan Kara 			ext4_error(sb, "Orphan file not empty on read-only fs.");
617502f310fcSJan Kara 			err = -EFSCORRUPTED;
617602f310fcSJan Kara 			goto out;
617702f310fcSJan Kara 		}
6178e2b911c5SDarrick J. Wong 		ext4_clear_feature_journal_needs_recovery(sb);
617902f310fcSJan Kara 		ext4_clear_feature_orphan_present(sb);
61804392fbc4SJan Kara 		ext4_commit_super(sb);
6181ac27a0ecSDave Kleikamp 	}
61827ffe1ea8SHidehiro Kawai out:
6183dab291afSMingming Cao 	jbd2_journal_unlock_updates(journal);
618411215630SJan Kara 	return err;
6185ac27a0ecSDave Kleikamp }
6186ac27a0ecSDave Kleikamp 
6187ac27a0ecSDave Kleikamp /*
6188ac27a0ecSDave Kleikamp  * If we are mounting (or read-write remounting) a filesystem whose journal
6189ac27a0ecSDave Kleikamp  * has recorded an error from a previous lifetime, move that error to the
6190ac27a0ecSDave Kleikamp  * main filesystem now.
6191ac27a0ecSDave Kleikamp  */
619211215630SJan Kara static int ext4_clear_journal_err(struct super_block *sb,
6193617ba13bSMingming Cao 				   struct ext4_super_block *es)
6194ac27a0ecSDave Kleikamp {
6195ac27a0ecSDave Kleikamp 	journal_t *journal;
6196ac27a0ecSDave Kleikamp 	int j_errno;
6197ac27a0ecSDave Kleikamp 	const char *errstr;
6198ac27a0ecSDave Kleikamp 
619911215630SJan Kara 	if (!ext4_has_feature_journal(sb)) {
620011215630SJan Kara 		ext4_error(sb, "Journal got removed while the fs was mounted!");
620111215630SJan Kara 		return -EFSCORRUPTED;
620211215630SJan Kara 	}
62030390131bSFrank Mayhar 
6204617ba13bSMingming Cao 	journal = EXT4_SB(sb)->s_journal;
6205ac27a0ecSDave Kleikamp 
6206ac27a0ecSDave Kleikamp 	/*
6207ac27a0ecSDave Kleikamp 	 * Now check for any error status which may have been recorded in the
6208617ba13bSMingming Cao 	 * journal by a prior ext4_error() or ext4_abort()
6209ac27a0ecSDave Kleikamp 	 */
6210ac27a0ecSDave Kleikamp 
6211dab291afSMingming Cao 	j_errno = jbd2_journal_errno(journal);
6212ac27a0ecSDave Kleikamp 	if (j_errno) {
6213ac27a0ecSDave Kleikamp 		char nbuf[16];
6214ac27a0ecSDave Kleikamp 
6215617ba13bSMingming Cao 		errstr = ext4_decode_error(sb, j_errno, nbuf);
621612062dddSEric Sandeen 		ext4_warning(sb, "Filesystem error recorded "
6217ac27a0ecSDave Kleikamp 			     "from previous mount: %s", errstr);
6218ac27a0ecSDave Kleikamp 
6219617ba13bSMingming Cao 		EXT4_SB(sb)->s_mount_state |= EXT4_ERROR_FS;
6220617ba13bSMingming Cao 		es->s_state |= cpu_to_le16(EXT4_ERROR_FS);
6221f57886caSYe Bin 		j_errno = ext4_commit_super(sb);
6222f57886caSYe Bin 		if (j_errno)
6223f57886caSYe Bin 			return j_errno;
6224f57886caSYe Bin 		ext4_warning(sb, "Marked fs in need of filesystem check.");
6225ac27a0ecSDave Kleikamp 
6226dab291afSMingming Cao 		jbd2_journal_clear_err(journal);
6227d796c52eSTheodore Ts'o 		jbd2_journal_update_sb_errno(journal);
6228ac27a0ecSDave Kleikamp 	}
622911215630SJan Kara 	return 0;
6230ac27a0ecSDave Kleikamp }
6231ac27a0ecSDave Kleikamp 
6232ac27a0ecSDave Kleikamp /*
6233ac27a0ecSDave Kleikamp  * Force the running and committing transactions to commit,
6234ac27a0ecSDave Kleikamp  * and wait on the commit.
6235ac27a0ecSDave Kleikamp  */
6236617ba13bSMingming Cao int ext4_force_commit(struct super_block *sb)
6237ac27a0ecSDave Kleikamp {
6238ac27a0ecSDave Kleikamp 	journal_t *journal;
6239ac27a0ecSDave Kleikamp 
6240bc98a42cSDavid Howells 	if (sb_rdonly(sb))
6241ac27a0ecSDave Kleikamp 		return 0;
6242ac27a0ecSDave Kleikamp 
6243617ba13bSMingming Cao 	journal = EXT4_SB(sb)->s_journal;
6244b1deefc9SGuo Chao 	return ext4_journal_force_commit(journal);
6245ac27a0ecSDave Kleikamp }
6246ac27a0ecSDave Kleikamp 
6247617ba13bSMingming Cao static int ext4_sync_fs(struct super_block *sb, int wait)
6248ac27a0ecSDave Kleikamp {
624914ce0cb4STheodore Ts'o 	int ret = 0;
62509eddacf9SJan Kara 	tid_t target;
625106a407f1SDmitry Monakhov 	bool needs_barrier = false;
62528d5d02e6SMingming Cao 	struct ext4_sb_info *sbi = EXT4_SB(sb);
6253ac27a0ecSDave Kleikamp 
625449598e04SJun Piao 	if (unlikely(ext4_forced_shutdown(sbi)))
62550db1ff22STheodore Ts'o 		return 0;
62560db1ff22STheodore Ts'o 
62579bffad1eSTheodore Ts'o 	trace_ext4_sync_fs(sb, wait);
62582e8fa54eSJan Kara 	flush_workqueue(sbi->rsv_conversion_wq);
6259a1177825SJan Kara 	/*
6260a1177825SJan Kara 	 * Writeback quota in non-journalled quota case - journalled quota has
6261a1177825SJan Kara 	 * no dirty dquots
6262a1177825SJan Kara 	 */
6263a1177825SJan Kara 	dquot_writeback_dquots(sb, -1);
626406a407f1SDmitry Monakhov 	/*
626506a407f1SDmitry Monakhov 	 * Data writeback is possible w/o journal transaction, so barrier must
626606a407f1SDmitry Monakhov 	 * being sent at the end of the function. But we can skip it if
626706a407f1SDmitry Monakhov 	 * transaction_commit will do it for us.
626806a407f1SDmitry Monakhov 	 */
6269bda32530STheodore Ts'o 	if (sbi->s_journal) {
627006a407f1SDmitry Monakhov 		target = jbd2_get_latest_transaction(sbi->s_journal);
627106a407f1SDmitry Monakhov 		if (wait && sbi->s_journal->j_flags & JBD2_BARRIER &&
627206a407f1SDmitry Monakhov 		    !jbd2_trans_will_send_data_barrier(sbi->s_journal, target))
627306a407f1SDmitry Monakhov 			needs_barrier = true;
627406a407f1SDmitry Monakhov 
62758d5d02e6SMingming Cao 		if (jbd2_journal_start_commit(sbi->s_journal, &target)) {
6276ac27a0ecSDave Kleikamp 			if (wait)
6277bda32530STheodore Ts'o 				ret = jbd2_log_wait_commit(sbi->s_journal,
6278bda32530STheodore Ts'o 							   target);
62790390131bSFrank Mayhar 		}
6280bda32530STheodore Ts'o 	} else if (wait && test_opt(sb, BARRIER))
6281bda32530STheodore Ts'o 		needs_barrier = true;
628206a407f1SDmitry Monakhov 	if (needs_barrier) {
628306a407f1SDmitry Monakhov 		int err;
6284c6bf3f0eSChristoph Hellwig 		err = blkdev_issue_flush(sb->s_bdev);
628506a407f1SDmitry Monakhov 		if (!ret)
628606a407f1SDmitry Monakhov 			ret = err;
628706a407f1SDmitry Monakhov 	}
628806a407f1SDmitry Monakhov 
628906a407f1SDmitry Monakhov 	return ret;
629006a407f1SDmitry Monakhov }
629106a407f1SDmitry Monakhov 
6292ac27a0ecSDave Kleikamp /*
6293ac27a0ecSDave Kleikamp  * LVM calls this function before a (read-only) snapshot is created.  This
6294ac27a0ecSDave Kleikamp  * gives us a chance to flush the journal completely and mark the fs clean.
6295be4f27d3SYongqiang Yang  *
6296be4f27d3SYongqiang Yang  * Note that only this function cannot bring a filesystem to be in a clean
62978e8ad8a5SJan Kara  * state independently. It relies on upper layer to stop all data & metadata
62988e8ad8a5SJan Kara  * modifications.
6299ac27a0ecSDave Kleikamp  */
6300c4be0c1dSTakashi Sato static int ext4_freeze(struct super_block *sb)
6301ac27a0ecSDave Kleikamp {
6302c4be0c1dSTakashi Sato 	int error = 0;
6303c4be0c1dSTakashi Sato 	journal_t *journal;
6304ac27a0ecSDave Kleikamp 
6305bc98a42cSDavid Howells 	if (sb_rdonly(sb))
63069ca92389STheodore Ts'o 		return 0;
63079ca92389STheodore Ts'o 
6308c4be0c1dSTakashi Sato 	journal = EXT4_SB(sb)->s_journal;
6309ac27a0ecSDave Kleikamp 
6310bb044576STheodore Ts'o 	if (journal) {
6311ac27a0ecSDave Kleikamp 		/* Now we set up the journal barrier. */
6312dab291afSMingming Cao 		jbd2_journal_lock_updates(journal);
63137ffe1ea8SHidehiro Kawai 
63147ffe1ea8SHidehiro Kawai 		/*
6315bb044576STheodore Ts'o 		 * Don't clear the needs_recovery flag if we failed to
6316bb044576STheodore Ts'o 		 * flush the journal.
63177ffe1ea8SHidehiro Kawai 		 */
631801d5d965SLeah Rumancik 		error = jbd2_journal_flush(journal, 0);
63196b0310fbSEric Sandeen 		if (error < 0)
63206b0310fbSEric Sandeen 			goto out;
6321ac27a0ecSDave Kleikamp 
6322ac27a0ecSDave Kleikamp 		/* Journal blocked and flushed, clear needs_recovery flag. */
6323e2b911c5SDarrick J. Wong 		ext4_clear_feature_journal_needs_recovery(sb);
632402f310fcSJan Kara 		if (ext4_orphan_file_empty(sb))
632502f310fcSJan Kara 			ext4_clear_feature_orphan_present(sb);
6326c642dc9eSEric Sandeen 	}
6327c642dc9eSEric Sandeen 
63284392fbc4SJan Kara 	error = ext4_commit_super(sb);
63296b0310fbSEric Sandeen out:
6330bb044576STheodore Ts'o 	if (journal)
63318e8ad8a5SJan Kara 		/* we rely on upper layer to stop further updates */
6332bb044576STheodore Ts'o 		jbd2_journal_unlock_updates(journal);
63336b0310fbSEric Sandeen 	return error;
6334ac27a0ecSDave Kleikamp }
6335ac27a0ecSDave Kleikamp 
6336ac27a0ecSDave Kleikamp /*
6337ac27a0ecSDave Kleikamp  * Called by LVM after the snapshot is done.  We need to reset the RECOVER
6338ac27a0ecSDave Kleikamp  * flag here, even though the filesystem is not technically dirty yet.
6339ac27a0ecSDave Kleikamp  */
6340c4be0c1dSTakashi Sato static int ext4_unfreeze(struct super_block *sb)
6341ac27a0ecSDave Kleikamp {
6342bc98a42cSDavid Howells 	if (sb_rdonly(sb) || ext4_forced_shutdown(EXT4_SB(sb)))
63439ca92389STheodore Ts'o 		return 0;
63449ca92389STheodore Ts'o 
6345c642dc9eSEric Sandeen 	if (EXT4_SB(sb)->s_journal) {
63469ca92389STheodore Ts'o 		/* Reset the needs_recovery flag before the fs is unlocked. */
6347e2b911c5SDarrick J. Wong 		ext4_set_feature_journal_needs_recovery(sb);
634802f310fcSJan Kara 		if (ext4_has_feature_orphan_file(sb))
634902f310fcSJan Kara 			ext4_set_feature_orphan_present(sb);
6350c642dc9eSEric Sandeen 	}
6351c642dc9eSEric Sandeen 
63524392fbc4SJan Kara 	ext4_commit_super(sb);
6353c4be0c1dSTakashi Sato 	return 0;
6354ac27a0ecSDave Kleikamp }
6355ac27a0ecSDave Kleikamp 
6356673c6100STheodore Ts'o /*
6357673c6100STheodore Ts'o  * Structure to save mount options for ext4_remount's benefit
6358673c6100STheodore Ts'o  */
6359673c6100STheodore Ts'o struct ext4_mount_options {
6360673c6100STheodore Ts'o 	unsigned long s_mount_opt;
6361a2595b8aSTheodore Ts'o 	unsigned long s_mount_opt2;
636208cefc7aSEric W. Biederman 	kuid_t s_resuid;
636308cefc7aSEric W. Biederman 	kgid_t s_resgid;
6364673c6100STheodore Ts'o 	unsigned long s_commit_interval;
6365673c6100STheodore Ts'o 	u32 s_min_batch_time, s_max_batch_time;
6366673c6100STheodore Ts'o #ifdef CONFIG_QUOTA
6367673c6100STheodore Ts'o 	int s_jquota_fmt;
6368a2d4a646SJan Kara 	char *s_qf_names[EXT4_MAXQUOTAS];
6369673c6100STheodore Ts'o #endif
6370673c6100STheodore Ts'o };
6371673c6100STheodore Ts'o 
6372960e0ab6SLukas Czerner static int __ext4_remount(struct fs_context *fc, struct super_block *sb)
6373ac27a0ecSDave Kleikamp {
63747edfd85bSLukas Czerner 	struct ext4_fs_context *ctx = fc->fs_private;
6375617ba13bSMingming Cao 	struct ext4_super_block *es;
6376617ba13bSMingming Cao 	struct ext4_sb_info *sbi = EXT4_SB(sb);
6377960e0ab6SLukas Czerner 	unsigned long old_sb_flags;
6378617ba13bSMingming Cao 	struct ext4_mount_options old_opts;
63798a266467STheodore Ts'o 	ext4_group_t g;
6380c5e06d10SJohann Lombardi 	int err = 0;
6381ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
63823bbef91bSAustin Kim 	int enable_quota = 0;
638303dafb5fSChen Gang 	int i, j;
638433458eabSTheodore Ts'o 	char *to_free[EXT4_MAXQUOTAS];
6385ac27a0ecSDave Kleikamp #endif
6386b237e304SHarshad Shirwadkar 
638721ac738eSChengguang Xu 
6388ac27a0ecSDave Kleikamp 	/* Store the original options */
6389ac27a0ecSDave Kleikamp 	old_sb_flags = sb->s_flags;
6390ac27a0ecSDave Kleikamp 	old_opts.s_mount_opt = sbi->s_mount_opt;
6391a2595b8aSTheodore Ts'o 	old_opts.s_mount_opt2 = sbi->s_mount_opt2;
6392ac27a0ecSDave Kleikamp 	old_opts.s_resuid = sbi->s_resuid;
6393ac27a0ecSDave Kleikamp 	old_opts.s_resgid = sbi->s_resgid;
6394ac27a0ecSDave Kleikamp 	old_opts.s_commit_interval = sbi->s_commit_interval;
639530773840STheodore Ts'o 	old_opts.s_min_batch_time = sbi->s_min_batch_time;
639630773840STheodore Ts'o 	old_opts.s_max_batch_time = sbi->s_max_batch_time;
6397ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
6398ac27a0ecSDave Kleikamp 	old_opts.s_jquota_fmt = sbi->s_jquota_fmt;
6399a2d4a646SJan Kara 	for (i = 0; i < EXT4_MAXQUOTAS; i++)
640003dafb5fSChen Gang 		if (sbi->s_qf_names[i]) {
640133458eabSTheodore Ts'o 			char *qf_name = get_qf_name(sb, sbi, i);
640233458eabSTheodore Ts'o 
640333458eabSTheodore Ts'o 			old_opts.s_qf_names[i] = kstrdup(qf_name, GFP_KERNEL);
640403dafb5fSChen Gang 			if (!old_opts.s_qf_names[i]) {
640503dafb5fSChen Gang 				for (j = 0; j < i; j++)
640603dafb5fSChen Gang 					kfree(old_opts.s_qf_names[j]);
640703dafb5fSChen Gang 				return -ENOMEM;
640803dafb5fSChen Gang 			}
640903dafb5fSChen Gang 		} else
641003dafb5fSChen Gang 			old_opts.s_qf_names[i] = NULL;
6411ac27a0ecSDave Kleikamp #endif
6412e4e58e5dSOjaswin Mujoo 	if (!(ctx->spec & EXT4_SPEC_JOURNAL_IOPRIO)) {
6413b3881f74STheodore Ts'o 		if (sbi->s_journal && sbi->s_journal->j_task->io_context)
64147edfd85bSLukas Czerner 			ctx->journal_ioprio =
6415b237e304SHarshad Shirwadkar 				sbi->s_journal->j_task->io_context->ioprio;
6416e4e58e5dSOjaswin Mujoo 		else
6417e4e58e5dSOjaswin Mujoo 			ctx->journal_ioprio = DEFAULT_JOURNAL_IOPRIO;
6418e4e58e5dSOjaswin Mujoo 
6419e4e58e5dSOjaswin Mujoo 	}
6420ac27a0ecSDave Kleikamp 
64217edfd85bSLukas Czerner 	ext4_apply_options(fc, sb);
6422ac27a0ecSDave Kleikamp 
64236b992ff2SDarrick J. Wong 	if ((old_opts.s_mount_opt & EXT4_MOUNT_JOURNAL_CHECKSUM) ^
64246b992ff2SDarrick J. Wong 	    test_opt(sb, JOURNAL_CHECKSUM)) {
64256b992ff2SDarrick J. Wong 		ext4_msg(sb, KERN_ERR, "changing journal_checksum "
64262d5b86e0SEric Sandeen 			 "during remount not supported; ignoring");
64272d5b86e0SEric Sandeen 		sbi->s_mount_opt ^= EXT4_MOUNT_JOURNAL_CHECKSUM;
6428c6d3d56dSDarrick J. Wong 	}
6429c6d3d56dSDarrick J. Wong 
64306ae6514bSPiotr Sarna 	if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_JOURNAL_DATA) {
64316ae6514bSPiotr Sarna 		if (test_opt2(sb, EXPLICIT_DELALLOC)) {
64326ae6514bSPiotr Sarna 			ext4_msg(sb, KERN_ERR, "can't mount with "
64336ae6514bSPiotr Sarna 				 "both data=journal and delalloc");
64346ae6514bSPiotr Sarna 			err = -EINVAL;
64356ae6514bSPiotr Sarna 			goto restore_opts;
64366ae6514bSPiotr Sarna 		}
64376ae6514bSPiotr Sarna 		if (test_opt(sb, DIOREAD_NOLOCK)) {
64386ae6514bSPiotr Sarna 			ext4_msg(sb, KERN_ERR, "can't mount with "
64396ae6514bSPiotr Sarna 				 "both data=journal and dioread_nolock");
64406ae6514bSPiotr Sarna 			err = -EINVAL;
64416ae6514bSPiotr Sarna 			goto restore_opts;
64426ae6514bSPiotr Sarna 		}
6443ab04df78SJan Kara 	} else if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_ORDERED_DATA) {
6444ab04df78SJan Kara 		if (test_opt(sb, JOURNAL_ASYNC_COMMIT)) {
6445ab04df78SJan Kara 			ext4_msg(sb, KERN_ERR, "can't mount with "
6446ab04df78SJan Kara 				"journal_async_commit in data=ordered mode");
6447ab04df78SJan Kara 			err = -EINVAL;
6448ab04df78SJan Kara 			goto restore_opts;
6449ab04df78SJan Kara 		}
6450923ae0ffSRoss Zwisler 	}
6451923ae0ffSRoss Zwisler 
6452cdb7ee4cSTahsin Erdogan 	if ((sbi->s_mount_opt ^ old_opts.s_mount_opt) & EXT4_MOUNT_NO_MBCACHE) {
6453cdb7ee4cSTahsin Erdogan 		ext4_msg(sb, KERN_ERR, "can't enable nombcache during remount");
6454cdb7ee4cSTahsin Erdogan 		err = -EINVAL;
6455cdb7ee4cSTahsin Erdogan 		goto restore_opts;
6456cdb7ee4cSTahsin Erdogan 	}
6457cdb7ee4cSTahsin Erdogan 
64589b5f6c9bSHarshad Shirwadkar 	if (ext4_test_mount_flag(sb, EXT4_MF_FS_ABORTED))
6459124e7c61SGabriel Krisman Bertazi 		ext4_abort(sb, ESHUTDOWN, "Abort forced by user");
6460ac27a0ecSDave Kleikamp 
64611751e8a6SLinus Torvalds 	sb->s_flags = (sb->s_flags & ~SB_POSIXACL) |
64621751e8a6SLinus Torvalds 		(test_opt(sb, POSIX_ACL) ? SB_POSIXACL : 0);
6463ac27a0ecSDave Kleikamp 
6464ac27a0ecSDave Kleikamp 	es = sbi->s_es;
6465ac27a0ecSDave Kleikamp 
6466b3881f74STheodore Ts'o 	if (sbi->s_journal) {
6467617ba13bSMingming Cao 		ext4_init_journal_params(sb, sbi->s_journal);
64687edfd85bSLukas Czerner 		set_task_ioprio(sbi->s_journal->j_task, ctx->journal_ioprio);
6469b3881f74STheodore Ts'o 	}
6470ac27a0ecSDave Kleikamp 
6471c92dc856SJan Kara 	/* Flush outstanding errors before changing fs state */
6472c92dc856SJan Kara 	flush_work(&sbi->s_error_work);
6473c92dc856SJan Kara 
6474960e0ab6SLukas Czerner 	if ((bool)(fc->sb_flags & SB_RDONLY) != sb_rdonly(sb)) {
64759b5f6c9bSHarshad Shirwadkar 		if (ext4_test_mount_flag(sb, EXT4_MF_FS_ABORTED)) {
6476ac27a0ecSDave Kleikamp 			err = -EROFS;
6477ac27a0ecSDave Kleikamp 			goto restore_opts;
6478ac27a0ecSDave Kleikamp 		}
6479ac27a0ecSDave Kleikamp 
6480960e0ab6SLukas Czerner 		if (fc->sb_flags & SB_RDONLY) {
648138c03b34STheodore Ts'o 			err = sync_filesystem(sb);
648238c03b34STheodore Ts'o 			if (err < 0)
648338c03b34STheodore Ts'o 				goto restore_opts;
64840f0dd62fSChristoph Hellwig 			err = dquot_suspend(sb, -1);
64850f0dd62fSChristoph Hellwig 			if (err < 0)
6486c79d967dSChristoph Hellwig 				goto restore_opts;
6487c79d967dSChristoph Hellwig 
6488ac27a0ecSDave Kleikamp 			/*
6489ac27a0ecSDave Kleikamp 			 * First of all, the unconditional stuff we have to do
6490ac27a0ecSDave Kleikamp 			 * to disable replay of the journal when we next remount
6491ac27a0ecSDave Kleikamp 			 */
64921751e8a6SLinus Torvalds 			sb->s_flags |= SB_RDONLY;
6493ac27a0ecSDave Kleikamp 
6494ac27a0ecSDave Kleikamp 			/*
6495ac27a0ecSDave Kleikamp 			 * OK, test if we are remounting a valid rw partition
6496ac27a0ecSDave Kleikamp 			 * readonly, and if so set the rdonly flag and then
6497ac27a0ecSDave Kleikamp 			 * mark the partition as valid again.
6498ac27a0ecSDave Kleikamp 			 */
6499617ba13bSMingming Cao 			if (!(es->s_state & cpu_to_le16(EXT4_VALID_FS)) &&
6500617ba13bSMingming Cao 			    (sbi->s_mount_state & EXT4_VALID_FS))
6501ac27a0ecSDave Kleikamp 				es->s_state = cpu_to_le16(sbi->s_mount_state);
6502ac27a0ecSDave Kleikamp 
650311215630SJan Kara 			if (sbi->s_journal) {
650411215630SJan Kara 				/*
650511215630SJan Kara 				 * We let remount-ro finish even if marking fs
650611215630SJan Kara 				 * as clean failed...
650711215630SJan Kara 				 */
6508617ba13bSMingming Cao 				ext4_mark_recovery_complete(sb, es);
650911215630SJan Kara 			}
6510ac27a0ecSDave Kleikamp 		} else {
6511a13fb1a4SEric Sandeen 			/* Make sure we can mount this feature set readwrite */
6512e2b911c5SDarrick J. Wong 			if (ext4_has_feature_readonly(sb) ||
65132cb5cc8bSDarrick J. Wong 			    !ext4_feature_set_ok(sb, 0)) {
6514ac27a0ecSDave Kleikamp 				err = -EROFS;
6515ac27a0ecSDave Kleikamp 				goto restore_opts;
6516ac27a0ecSDave Kleikamp 			}
6517ead6596bSEric Sandeen 			/*
65188a266467STheodore Ts'o 			 * Make sure the group descriptor checksums
65190b8e58a1SAndreas Dilger 			 * are sane.  If they aren't, refuse to remount r/w.
65208a266467STheodore Ts'o 			 */
65218a266467STheodore Ts'o 			for (g = 0; g < sbi->s_groups_count; g++) {
65228a266467STheodore Ts'o 				struct ext4_group_desc *gdp =
65238a266467STheodore Ts'o 					ext4_get_group_desc(sb, g, NULL);
65248a266467STheodore Ts'o 
6525feb0ab32SDarrick J. Wong 				if (!ext4_group_desc_csum_verify(sb, g, gdp)) {
6526b31e1552SEric Sandeen 					ext4_msg(sb, KERN_ERR,
6527b31e1552SEric Sandeen 	       "ext4_remount: Checksum for group %u failed (%u!=%u)",
6528e2b911c5SDarrick J. Wong 		g, le16_to_cpu(ext4_group_desc_csum(sb, g, gdp)),
65298a266467STheodore Ts'o 					       le16_to_cpu(gdp->bg_checksum));
65306a797d27SDarrick J. Wong 					err = -EFSBADCRC;
65318a266467STheodore Ts'o 					goto restore_opts;
65328a266467STheodore Ts'o 				}
65338a266467STheodore Ts'o 			}
65348a266467STheodore Ts'o 
65358a266467STheodore Ts'o 			/*
6536ead6596bSEric Sandeen 			 * If we have an unprocessed orphan list hanging
6537ead6596bSEric Sandeen 			 * around from a previously readonly bdev mount,
6538ead6596bSEric Sandeen 			 * require a full umount/remount for now.
6539ead6596bSEric Sandeen 			 */
654002f310fcSJan Kara 			if (es->s_last_orphan || !ext4_orphan_file_empty(sb)) {
6541b31e1552SEric Sandeen 				ext4_msg(sb, KERN_WARNING, "Couldn't "
6542ead6596bSEric Sandeen 				       "remount RDWR because of unprocessed "
6543ead6596bSEric Sandeen 				       "orphan inode list.  Please "
6544b31e1552SEric Sandeen 				       "umount/remount instead");
6545ead6596bSEric Sandeen 				err = -EINVAL;
6546ead6596bSEric Sandeen 				goto restore_opts;
6547ead6596bSEric Sandeen 			}
6548ead6596bSEric Sandeen 
6549ac27a0ecSDave Kleikamp 			/*
6550ac27a0ecSDave Kleikamp 			 * Mounting a RDONLY partition read-write, so reread
6551ac27a0ecSDave Kleikamp 			 * and store the current valid flag.  (It may have
6552ac27a0ecSDave Kleikamp 			 * been changed by e2fsck since we originally mounted
6553ac27a0ecSDave Kleikamp 			 * the partition.)
6554ac27a0ecSDave Kleikamp 			 */
655511215630SJan Kara 			if (sbi->s_journal) {
655611215630SJan Kara 				err = ext4_clear_journal_err(sb, es);
655711215630SJan Kara 				if (err)
655811215630SJan Kara 					goto restore_opts;
655911215630SJan Kara 			}
6560c878bea3STheodore Ts'o 			sbi->s_mount_state = (le16_to_cpu(es->s_state) &
6561c878bea3STheodore Ts'o 					      ~EXT4_FC_REPLAY);
6562c89128a0SJaegeuk Kim 
6563c89128a0SJaegeuk Kim 			err = ext4_setup_super(sb, es, 0);
6564c89128a0SJaegeuk Kim 			if (err)
6565c89128a0SJaegeuk Kim 				goto restore_opts;
6566c89128a0SJaegeuk Kim 
65671751e8a6SLinus Torvalds 			sb->s_flags &= ~SB_RDONLY;
6568e2b911c5SDarrick J. Wong 			if (ext4_has_feature_mmp(sb))
6569c5e06d10SJohann Lombardi 				if (ext4_multi_mount_protect(sb,
6570c5e06d10SJohann Lombardi 						le64_to_cpu(es->s_mmp_block))) {
6571c5e06d10SJohann Lombardi 					err = -EROFS;
6572c5e06d10SJohann Lombardi 					goto restore_opts;
6573c5e06d10SJohann Lombardi 				}
65743bbef91bSAustin Kim #ifdef CONFIG_QUOTA
6575c79d967dSChristoph Hellwig 			enable_quota = 1;
65763bbef91bSAustin Kim #endif
6577ac27a0ecSDave Kleikamp 		}
6578ac27a0ecSDave Kleikamp 	}
6579bfff6873SLukas Czerner 
6580bfff6873SLukas Czerner 	/*
6581bfff6873SLukas Czerner 	 * Reinitialize lazy itable initialization thread based on
6582bfff6873SLukas Czerner 	 * current settings
6583bfff6873SLukas Czerner 	 */
6584bc98a42cSDavid Howells 	if (sb_rdonly(sb) || !test_opt(sb, INIT_INODE_TABLE))
6585bfff6873SLukas Czerner 		ext4_unregister_li_request(sb);
6586bfff6873SLukas Czerner 	else {
6587bfff6873SLukas Czerner 		ext4_group_t first_not_zeroed;
6588bfff6873SLukas Czerner 		first_not_zeroed = ext4_has_uninit_itable(sb);
6589bfff6873SLukas Czerner 		ext4_register_li_request(sb, first_not_zeroed);
6590bfff6873SLukas Czerner 	}
6591bfff6873SLukas Czerner 
65920f5bde1dSJan Kara 	/*
65930f5bde1dSJan Kara 	 * Handle creation of system zone data early because it can fail.
65940f5bde1dSJan Kara 	 * Releasing of existing data is done when we are sure remount will
65950f5bde1dSJan Kara 	 * succeed.
65960f5bde1dSJan Kara 	 */
6597dd0db94fSChunguang Xu 	if (test_opt(sb, BLOCK_VALIDITY) && !sbi->s_system_blks) {
6598d176b1f6SJan Kara 		err = ext4_setup_system_zone(sb);
6599d176b1f6SJan Kara 		if (err)
6600d176b1f6SJan Kara 			goto restore_opts;
66010f5bde1dSJan Kara 	}
6602d176b1f6SJan Kara 
6603c89128a0SJaegeuk Kim 	if (sbi->s_journal == NULL && !(old_sb_flags & SB_RDONLY)) {
66044392fbc4SJan Kara 		err = ext4_commit_super(sb);
6605c89128a0SJaegeuk Kim 		if (err)
6606c89128a0SJaegeuk Kim 			goto restore_opts;
6607c89128a0SJaegeuk Kim 	}
66080390131bSFrank Mayhar 
6609ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
6610ac27a0ecSDave Kleikamp 	/* Release old quota file names */
6611a2d4a646SJan Kara 	for (i = 0; i < EXT4_MAXQUOTAS; i++)
6612ac27a0ecSDave Kleikamp 		kfree(old_opts.s_qf_names[i]);
66137c319d32SAditya Kali 	if (enable_quota) {
66147c319d32SAditya Kali 		if (sb_any_quota_suspended(sb))
66150f0dd62fSChristoph Hellwig 			dquot_resume(sb, -1);
6616e2b911c5SDarrick J. Wong 		else if (ext4_has_feature_quota(sb)) {
66177c319d32SAditya Kali 			err = ext4_enable_quotas(sb);
661807724f98STheodore Ts'o 			if (err)
66197c319d32SAditya Kali 				goto restore_opts;
66207c319d32SAditya Kali 		}
66217c319d32SAditya Kali 	}
66227c319d32SAditya Kali #endif
6623dd0db94fSChunguang Xu 	if (!test_opt(sb, BLOCK_VALIDITY) && sbi->s_system_blks)
66240f5bde1dSJan Kara 		ext4_release_system_zone(sb);
6625d4c402d9SCurt Wohlgemuth 
662661bb4a1cSTheodore Ts'o 	if (!ext4_has_feature_mmp(sb) || sb_rdonly(sb))
662761bb4a1cSTheodore Ts'o 		ext4_stop_mmpd(sbi);
662861bb4a1cSTheodore Ts'o 
6629ac27a0ecSDave Kleikamp 	return 0;
66300b8e58a1SAndreas Dilger 
6631ac27a0ecSDave Kleikamp restore_opts:
6632ac27a0ecSDave Kleikamp 	sb->s_flags = old_sb_flags;
6633ac27a0ecSDave Kleikamp 	sbi->s_mount_opt = old_opts.s_mount_opt;
6634a2595b8aSTheodore Ts'o 	sbi->s_mount_opt2 = old_opts.s_mount_opt2;
6635ac27a0ecSDave Kleikamp 	sbi->s_resuid = old_opts.s_resuid;
6636ac27a0ecSDave Kleikamp 	sbi->s_resgid = old_opts.s_resgid;
6637ac27a0ecSDave Kleikamp 	sbi->s_commit_interval = old_opts.s_commit_interval;
663830773840STheodore Ts'o 	sbi->s_min_batch_time = old_opts.s_min_batch_time;
663930773840STheodore Ts'o 	sbi->s_max_batch_time = old_opts.s_max_batch_time;
6640dd0db94fSChunguang Xu 	if (!test_opt(sb, BLOCK_VALIDITY) && sbi->s_system_blks)
66410f5bde1dSJan Kara 		ext4_release_system_zone(sb);
6642ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
6643ac27a0ecSDave Kleikamp 	sbi->s_jquota_fmt = old_opts.s_jquota_fmt;
6644a2d4a646SJan Kara 	for (i = 0; i < EXT4_MAXQUOTAS; i++) {
664533458eabSTheodore Ts'o 		to_free[i] = get_qf_name(sb, sbi, i);
664633458eabSTheodore Ts'o 		rcu_assign_pointer(sbi->s_qf_names[i], old_opts.s_qf_names[i]);
6647ac27a0ecSDave Kleikamp 	}
664833458eabSTheodore Ts'o 	synchronize_rcu();
664933458eabSTheodore Ts'o 	for (i = 0; i < EXT4_MAXQUOTAS; i++)
665033458eabSTheodore Ts'o 		kfree(to_free[i]);
6651ac27a0ecSDave Kleikamp #endif
665261bb4a1cSTheodore Ts'o 	if (!ext4_has_feature_mmp(sb) || sb_rdonly(sb))
665361bb4a1cSTheodore Ts'o 		ext4_stop_mmpd(sbi);
6654ac27a0ecSDave Kleikamp 	return err;
6655ac27a0ecSDave Kleikamp }
6656ac27a0ecSDave Kleikamp 
6657cebe85d5SLukas Czerner static int ext4_reconfigure(struct fs_context *fc)
66587edfd85bSLukas Czerner {
6659cebe85d5SLukas Czerner 	struct super_block *sb = fc->root->d_sb;
66607edfd85bSLukas Czerner 	int ret;
66617edfd85bSLukas Czerner 
6662cebe85d5SLukas Czerner 	fc->s_fs_info = EXT4_SB(sb);
66637edfd85bSLukas Czerner 
6664cebe85d5SLukas Czerner 	ret = ext4_check_opt_consistency(fc, sb);
66657edfd85bSLukas Czerner 	if (ret < 0)
66667edfd85bSLukas Czerner 		return ret;
6667cebe85d5SLukas Czerner 
6668960e0ab6SLukas Czerner 	ret = __ext4_remount(fc, sb);
6669cebe85d5SLukas Czerner 	if (ret < 0)
6670cebe85d5SLukas Czerner 		return ret;
6671cebe85d5SLukas Czerner 
6672bb0fbc78SLukas Czerner 	ext4_msg(sb, KERN_INFO, "re-mounted %pU. Quota mode: %s.",
6673bb0fbc78SLukas Czerner 		 &sb->s_uuid, ext4_quota_mode(sb));
6674cebe85d5SLukas Czerner 
6675cebe85d5SLukas Czerner 	return 0;
66767edfd85bSLukas Czerner }
66777edfd85bSLukas Czerner 
6678689c958cSLi Xi #ifdef CONFIG_QUOTA
6679689c958cSLi Xi static int ext4_statfs_project(struct super_block *sb,
6680689c958cSLi Xi 			       kprojid_t projid, struct kstatfs *buf)
6681689c958cSLi Xi {
6682689c958cSLi Xi 	struct kqid qid;
6683689c958cSLi Xi 	struct dquot *dquot;
6684689c958cSLi Xi 	u64 limit;
6685689c958cSLi Xi 	u64 curblock;
6686689c958cSLi Xi 
6687689c958cSLi Xi 	qid = make_kqid_projid(projid);
6688689c958cSLi Xi 	dquot = dqget(sb, qid);
6689689c958cSLi Xi 	if (IS_ERR(dquot))
6690689c958cSLi Xi 		return PTR_ERR(dquot);
66917b9ca4c6SJan Kara 	spin_lock(&dquot->dq_dqb_lock);
6692689c958cSLi Xi 
6693a08fe66eSChengguang Xu 	limit = min_not_zero(dquot->dq_dqb.dqb_bsoftlimit,
6694a08fe66eSChengguang Xu 			     dquot->dq_dqb.dqb_bhardlimit);
669557c32ea4SChengguang Xu 	limit >>= sb->s_blocksize_bits;
669657c32ea4SChengguang Xu 
6697689c958cSLi Xi 	if (limit && buf->f_blocks > limit) {
6698f06925c7SKonstantin Khlebnikov 		curblock = (dquot->dq_dqb.dqb_curspace +
6699f06925c7SKonstantin Khlebnikov 			    dquot->dq_dqb.dqb_rsvspace) >> sb->s_blocksize_bits;
6700689c958cSLi Xi 		buf->f_blocks = limit;
6701689c958cSLi Xi 		buf->f_bfree = buf->f_bavail =
6702689c958cSLi Xi 			(buf->f_blocks > curblock) ?
6703689c958cSLi Xi 			 (buf->f_blocks - curblock) : 0;
6704689c958cSLi Xi 	}
6705689c958cSLi Xi 
6706a08fe66eSChengguang Xu 	limit = min_not_zero(dquot->dq_dqb.dqb_isoftlimit,
6707a08fe66eSChengguang Xu 			     dquot->dq_dqb.dqb_ihardlimit);
6708689c958cSLi Xi 	if (limit && buf->f_files > limit) {
6709689c958cSLi Xi 		buf->f_files = limit;
6710689c958cSLi Xi 		buf->f_ffree =
6711689c958cSLi Xi 			(buf->f_files > dquot->dq_dqb.dqb_curinodes) ?
6712689c958cSLi Xi 			 (buf->f_files - dquot->dq_dqb.dqb_curinodes) : 0;
6713689c958cSLi Xi 	}
6714689c958cSLi Xi 
67157b9ca4c6SJan Kara 	spin_unlock(&dquot->dq_dqb_lock);
6716689c958cSLi Xi 	dqput(dquot);
6717689c958cSLi Xi 	return 0;
6718689c958cSLi Xi }
6719689c958cSLi Xi #endif
6720689c958cSLi Xi 
6721617ba13bSMingming Cao static int ext4_statfs(struct dentry *dentry, struct kstatfs *buf)
6722ac27a0ecSDave Kleikamp {
6723ac27a0ecSDave Kleikamp 	struct super_block *sb = dentry->d_sb;
6724617ba13bSMingming Cao 	struct ext4_sb_info *sbi = EXT4_SB(sb);
6725617ba13bSMingming Cao 	struct ext4_super_block *es = sbi->s_es;
672627dd4385SLukas Czerner 	ext4_fsblk_t overhead = 0, resv_blocks;
6727d02a9391SKazuya Mio 	s64 bfree;
672827dd4385SLukas Czerner 	resv_blocks = EXT4_C2B(sbi, atomic64_read(&sbi->s_resv_clusters));
6729ac27a0ecSDave Kleikamp 
6730952fc18eSTheodore Ts'o 	if (!test_opt(sb, MINIX_DF))
6731952fc18eSTheodore Ts'o 		overhead = sbi->s_overhead;
6732ac27a0ecSDave Kleikamp 
6733617ba13bSMingming Cao 	buf->f_type = EXT4_SUPER_MAGIC;
6734ac27a0ecSDave Kleikamp 	buf->f_bsize = sb->s_blocksize;
6735b72f78cbSEric Sandeen 	buf->f_blocks = ext4_blocks_count(es) - EXT4_C2B(sbi, overhead);
673657042651STheodore Ts'o 	bfree = percpu_counter_sum_positive(&sbi->s_freeclusters_counter) -
673757042651STheodore Ts'o 		percpu_counter_sum_positive(&sbi->s_dirtyclusters_counter);
6738d02a9391SKazuya Mio 	/* prevent underflow in case that few free space is available */
673957042651STheodore Ts'o 	buf->f_bfree = EXT4_C2B(sbi, max_t(s64, bfree, 0));
674027dd4385SLukas Czerner 	buf->f_bavail = buf->f_bfree -
674127dd4385SLukas Czerner 			(ext4_r_blocks_count(es) + resv_blocks);
674227dd4385SLukas Czerner 	if (buf->f_bfree < (ext4_r_blocks_count(es) + resv_blocks))
6743ac27a0ecSDave Kleikamp 		buf->f_bavail = 0;
6744ac27a0ecSDave Kleikamp 	buf->f_files = le32_to_cpu(es->s_inodes_count);
674552d9f3b4SPeter Zijlstra 	buf->f_ffree = percpu_counter_sum_positive(&sbi->s_freeinodes_counter);
6746617ba13bSMingming Cao 	buf->f_namelen = EXT4_NAME_LEN;
67479591c3a3SAmir Goldstein 	buf->f_fsid = uuid_to_fsid(es->s_uuid);
67480b8e58a1SAndreas Dilger 
6749689c958cSLi Xi #ifdef CONFIG_QUOTA
6750689c958cSLi Xi 	if (ext4_test_inode_flag(dentry->d_inode, EXT4_INODE_PROJINHERIT) &&
6751689c958cSLi Xi 	    sb_has_quota_limits_enabled(sb, PRJQUOTA))
6752689c958cSLi Xi 		ext4_statfs_project(sb, EXT4_I(dentry->d_inode)->i_projid, buf);
6753689c958cSLi Xi #endif
6754ac27a0ecSDave Kleikamp 	return 0;
6755ac27a0ecSDave Kleikamp }
6756ac27a0ecSDave Kleikamp 
6757ac27a0ecSDave Kleikamp 
6758ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
6759ac27a0ecSDave Kleikamp 
6760bc8230eeSJan Kara /*
6761bc8230eeSJan Kara  * Helper functions so that transaction is started before we acquire dqio_sem
6762bc8230eeSJan Kara  * to keep correct lock ordering of transaction > dqio_sem
6763bc8230eeSJan Kara  */
6764ac27a0ecSDave Kleikamp static inline struct inode *dquot_to_inode(struct dquot *dquot)
6765ac27a0ecSDave Kleikamp {
67664c376dcaSEric W. Biederman 	return sb_dqopt(dquot->dq_sb)->files[dquot->dq_id.type];
6767ac27a0ecSDave Kleikamp }
6768ac27a0ecSDave Kleikamp 
6769617ba13bSMingming Cao static int ext4_write_dquot(struct dquot *dquot)
6770ac27a0ecSDave Kleikamp {
6771ac27a0ecSDave Kleikamp 	int ret, err;
6772ac27a0ecSDave Kleikamp 	handle_t *handle;
6773ac27a0ecSDave Kleikamp 	struct inode *inode;
6774ac27a0ecSDave Kleikamp 
6775ac27a0ecSDave Kleikamp 	inode = dquot_to_inode(dquot);
67769924a92aSTheodore Ts'o 	handle = ext4_journal_start(inode, EXT4_HT_QUOTA,
6777617ba13bSMingming Cao 				    EXT4_QUOTA_TRANS_BLOCKS(dquot->dq_sb));
6778ac27a0ecSDave Kleikamp 	if (IS_ERR(handle))
6779ac27a0ecSDave Kleikamp 		return PTR_ERR(handle);
6780ac27a0ecSDave Kleikamp 	ret = dquot_commit(dquot);
6781617ba13bSMingming Cao 	err = ext4_journal_stop(handle);
6782ac27a0ecSDave Kleikamp 	if (!ret)
6783ac27a0ecSDave Kleikamp 		ret = err;
6784ac27a0ecSDave Kleikamp 	return ret;
6785ac27a0ecSDave Kleikamp }
6786ac27a0ecSDave Kleikamp 
6787617ba13bSMingming Cao static int ext4_acquire_dquot(struct dquot *dquot)
6788ac27a0ecSDave Kleikamp {
6789ac27a0ecSDave Kleikamp 	int ret, err;
6790ac27a0ecSDave Kleikamp 	handle_t *handle;
6791ac27a0ecSDave Kleikamp 
67929924a92aSTheodore Ts'o 	handle = ext4_journal_start(dquot_to_inode(dquot), EXT4_HT_QUOTA,
6793617ba13bSMingming Cao 				    EXT4_QUOTA_INIT_BLOCKS(dquot->dq_sb));
6794ac27a0ecSDave Kleikamp 	if (IS_ERR(handle))
6795ac27a0ecSDave Kleikamp 		return PTR_ERR(handle);
6796ac27a0ecSDave Kleikamp 	ret = dquot_acquire(dquot);
6797617ba13bSMingming Cao 	err = ext4_journal_stop(handle);
6798ac27a0ecSDave Kleikamp 	if (!ret)
6799ac27a0ecSDave Kleikamp 		ret = err;
6800ac27a0ecSDave Kleikamp 	return ret;
6801ac27a0ecSDave Kleikamp }
6802ac27a0ecSDave Kleikamp 
6803617ba13bSMingming Cao static int ext4_release_dquot(struct dquot *dquot)
6804ac27a0ecSDave Kleikamp {
6805ac27a0ecSDave Kleikamp 	int ret, err;
6806ac27a0ecSDave Kleikamp 	handle_t *handle;
6807ac27a0ecSDave Kleikamp 
68089924a92aSTheodore Ts'o 	handle = ext4_journal_start(dquot_to_inode(dquot), EXT4_HT_QUOTA,
6809617ba13bSMingming Cao 				    EXT4_QUOTA_DEL_BLOCKS(dquot->dq_sb));
68109c3013e9SJan Kara 	if (IS_ERR(handle)) {
68119c3013e9SJan Kara 		/* Release dquot anyway to avoid endless cycle in dqput() */
68129c3013e9SJan Kara 		dquot_release(dquot);
6813ac27a0ecSDave Kleikamp 		return PTR_ERR(handle);
68149c3013e9SJan Kara 	}
6815ac27a0ecSDave Kleikamp 	ret = dquot_release(dquot);
6816617ba13bSMingming Cao 	err = ext4_journal_stop(handle);
6817ac27a0ecSDave Kleikamp 	if (!ret)
6818ac27a0ecSDave Kleikamp 		ret = err;
6819ac27a0ecSDave Kleikamp 	return ret;
6820ac27a0ecSDave Kleikamp }
6821ac27a0ecSDave Kleikamp 
6822617ba13bSMingming Cao static int ext4_mark_dquot_dirty(struct dquot *dquot)
6823ac27a0ecSDave Kleikamp {
6824262b4662SJan Kara 	struct super_block *sb = dquot->dq_sb;
6825262b4662SJan Kara 
6826f177ee08SRoman Anufriev 	if (ext4_is_quota_journalled(sb)) {
6827ac27a0ecSDave Kleikamp 		dquot_mark_dquot_dirty(dquot);
6828617ba13bSMingming Cao 		return ext4_write_dquot(dquot);
6829ac27a0ecSDave Kleikamp 	} else {
6830ac27a0ecSDave Kleikamp 		return dquot_mark_dquot_dirty(dquot);
6831ac27a0ecSDave Kleikamp 	}
6832ac27a0ecSDave Kleikamp }
6833ac27a0ecSDave Kleikamp 
6834617ba13bSMingming Cao static int ext4_write_info(struct super_block *sb, int type)
6835ac27a0ecSDave Kleikamp {
6836ac27a0ecSDave Kleikamp 	int ret, err;
6837ac27a0ecSDave Kleikamp 	handle_t *handle;
6838ac27a0ecSDave Kleikamp 
6839ac27a0ecSDave Kleikamp 	/* Data block + inode block */
6840f9c1f248SBaokun Li 	handle = ext4_journal_start_sb(sb, EXT4_HT_QUOTA, 2);
6841ac27a0ecSDave Kleikamp 	if (IS_ERR(handle))
6842ac27a0ecSDave Kleikamp 		return PTR_ERR(handle);
6843ac27a0ecSDave Kleikamp 	ret = dquot_commit_info(sb, type);
6844617ba13bSMingming Cao 	err = ext4_journal_stop(handle);
6845ac27a0ecSDave Kleikamp 	if (!ret)
6846ac27a0ecSDave Kleikamp 		ret = err;
6847ac27a0ecSDave Kleikamp 	return ret;
6848ac27a0ecSDave Kleikamp }
6849ac27a0ecSDave Kleikamp 
6850daf647d2STheodore Ts'o static void lockdep_set_quota_inode(struct inode *inode, int subclass)
6851daf647d2STheodore Ts'o {
6852daf647d2STheodore Ts'o 	struct ext4_inode_info *ei = EXT4_I(inode);
6853daf647d2STheodore Ts'o 
6854daf647d2STheodore Ts'o 	/* The first argument of lockdep_set_subclass has to be
6855daf647d2STheodore Ts'o 	 * *exactly* the same as the argument to init_rwsem() --- in
6856daf647d2STheodore Ts'o 	 * this case, in init_once() --- or lockdep gets unhappy
6857daf647d2STheodore Ts'o 	 * because the name of the lock is set using the
6858daf647d2STheodore Ts'o 	 * stringification of the argument to init_rwsem().
6859daf647d2STheodore Ts'o 	 */
6860daf647d2STheodore Ts'o 	(void) ei;	/* shut up clang warning if !CONFIG_LOCKDEP */
6861daf647d2STheodore Ts'o 	lockdep_set_subclass(&ei->i_data_sem, subclass);
6862daf647d2STheodore Ts'o }
6863daf647d2STheodore Ts'o 
6864ac27a0ecSDave Kleikamp /*
6865ac27a0ecSDave Kleikamp  * Standard function to be called on quota_on
6866ac27a0ecSDave Kleikamp  */
6867617ba13bSMingming Cao static int ext4_quota_on(struct super_block *sb, int type, int format_id,
68688c54ca9cSAl Viro 			 const struct path *path)
6869ac27a0ecSDave Kleikamp {
6870ac27a0ecSDave Kleikamp 	int err;
6871ac27a0ecSDave Kleikamp 
6872ac27a0ecSDave Kleikamp 	if (!test_opt(sb, QUOTA))
6873ac27a0ecSDave Kleikamp 		return -EINVAL;
68740623543bSJan Kara 
6875ac27a0ecSDave Kleikamp 	/* Quotafile not on the same filesystem? */
6876d8c9584eSAl Viro 	if (path->dentry->d_sb != sb)
6877ac27a0ecSDave Kleikamp 		return -EXDEV;
6878e0770e91SJan Kara 
6879e0770e91SJan Kara 	/* Quota already enabled for this file? */
6880e0770e91SJan Kara 	if (IS_NOQUOTA(d_inode(path->dentry)))
6881e0770e91SJan Kara 		return -EBUSY;
6882e0770e91SJan Kara 
68830623543bSJan Kara 	/* Journaling quota? */
68840623543bSJan Kara 	if (EXT4_SB(sb)->s_qf_names[type]) {
68852b2d6d01STheodore Ts'o 		/* Quotafile not in fs root? */
6886f00c9e44SJan Kara 		if (path->dentry->d_parent != sb->s_root)
6887b31e1552SEric Sandeen 			ext4_msg(sb, KERN_WARNING,
6888b31e1552SEric Sandeen 				"Quota file not on filesystem root. "
6889b31e1552SEric Sandeen 				"Journaled quota will not work");
689091389240SJan Kara 		sb_dqopt(sb)->flags |= DQUOT_NOLIST_DIRTY;
689191389240SJan Kara 	} else {
689291389240SJan Kara 		/*
689391389240SJan Kara 		 * Clear the flag just in case mount options changed since
689491389240SJan Kara 		 * last time.
689591389240SJan Kara 		 */
689691389240SJan Kara 		sb_dqopt(sb)->flags &= ~DQUOT_NOLIST_DIRTY;
68970623543bSJan Kara 	}
68980623543bSJan Kara 
6899daf647d2STheodore Ts'o 	lockdep_set_quota_inode(path->dentry->d_inode, I_DATA_SEM_QUOTA);
6900daf647d2STheodore Ts'o 	err = dquot_quota_on(sb, type, format_id, path);
690115fc69bbSJan Kara 	if (!err) {
6902957153fcSJan Kara 		struct inode *inode = d_inode(path->dentry);
6903957153fcSJan Kara 		handle_t *handle;
6904957153fcSJan Kara 
690561a92987SJan Kara 		/*
690661a92987SJan Kara 		 * Set inode flags to prevent userspace from messing with quota
690761a92987SJan Kara 		 * files. If this fails, we return success anyway since quotas
690861a92987SJan Kara 		 * are already enabled and this is not a hard failure.
690961a92987SJan Kara 		 */
6910957153fcSJan Kara 		inode_lock(inode);
6911957153fcSJan Kara 		handle = ext4_journal_start(inode, EXT4_HT_QUOTA, 1);
6912957153fcSJan Kara 		if (IS_ERR(handle))
6913957153fcSJan Kara 			goto unlock_inode;
6914957153fcSJan Kara 		EXT4_I(inode)->i_flags |= EXT4_NOATIME_FL | EXT4_IMMUTABLE_FL;
6915957153fcSJan Kara 		inode_set_flags(inode, S_NOATIME | S_IMMUTABLE,
6916957153fcSJan Kara 				S_NOATIME | S_IMMUTABLE);
69174209ae12SHarshad Shirwadkar 		err = ext4_mark_inode_dirty(handle, inode);
6918957153fcSJan Kara 		ext4_journal_stop(handle);
6919957153fcSJan Kara 	unlock_inode:
6920957153fcSJan Kara 		inode_unlock(inode);
692115fc69bbSJan Kara 		if (err)
692215fc69bbSJan Kara 			dquot_quota_off(sb, type);
6923957153fcSJan Kara 	}
692415fc69bbSJan Kara 	if (err)
692515fc69bbSJan Kara 		lockdep_set_quota_inode(path->dentry->d_inode,
692615fc69bbSJan Kara 					     I_DATA_SEM_NORMAL);
6927daf647d2STheodore Ts'o 	return err;
6928ac27a0ecSDave Kleikamp }
6929ac27a0ecSDave Kleikamp 
693007342ec2SBaokun Li static inline bool ext4_check_quota_inum(int type, unsigned long qf_inum)
693107342ec2SBaokun Li {
693207342ec2SBaokun Li 	switch (type) {
693307342ec2SBaokun Li 	case USRQUOTA:
693407342ec2SBaokun Li 		return qf_inum == EXT4_USR_QUOTA_INO;
693507342ec2SBaokun Li 	case GRPQUOTA:
693607342ec2SBaokun Li 		return qf_inum == EXT4_GRP_QUOTA_INO;
693707342ec2SBaokun Li 	case PRJQUOTA:
693807342ec2SBaokun Li 		return qf_inum >= EXT4_GOOD_OLD_FIRST_INO;
693907342ec2SBaokun Li 	default:
694007342ec2SBaokun Li 		BUG();
694107342ec2SBaokun Li 	}
694207342ec2SBaokun Li }
694307342ec2SBaokun Li 
69447c319d32SAditya Kali static int ext4_quota_enable(struct super_block *sb, int type, int format_id,
69457c319d32SAditya Kali 			     unsigned int flags)
69467c319d32SAditya Kali {
69477c319d32SAditya Kali 	int err;
69487c319d32SAditya Kali 	struct inode *qf_inode;
6949a2d4a646SJan Kara 	unsigned long qf_inums[EXT4_MAXQUOTAS] = {
69507c319d32SAditya Kali 		le32_to_cpu(EXT4_SB(sb)->s_es->s_usr_quota_inum),
6951689c958cSLi Xi 		le32_to_cpu(EXT4_SB(sb)->s_es->s_grp_quota_inum),
6952689c958cSLi Xi 		le32_to_cpu(EXT4_SB(sb)->s_es->s_prj_quota_inum)
69537c319d32SAditya Kali 	};
69547c319d32SAditya Kali 
6955e2b911c5SDarrick J. Wong 	BUG_ON(!ext4_has_feature_quota(sb));
69567c319d32SAditya Kali 
69577c319d32SAditya Kali 	if (!qf_inums[type])
69587c319d32SAditya Kali 		return -EPERM;
69597c319d32SAditya Kali 
696007342ec2SBaokun Li 	if (!ext4_check_quota_inum(type, qf_inums[type])) {
696107342ec2SBaokun Li 		ext4_error(sb, "Bad quota inum: %lu, type: %d",
696207342ec2SBaokun Li 				qf_inums[type], type);
696307342ec2SBaokun Li 		return -EUCLEAN;
696407342ec2SBaokun Li 	}
696507342ec2SBaokun Li 
69668a363970STheodore Ts'o 	qf_inode = ext4_iget(sb, qf_inums[type], EXT4_IGET_SPECIAL);
69677c319d32SAditya Kali 	if (IS_ERR(qf_inode)) {
696807342ec2SBaokun Li 		ext4_error(sb, "Bad quota inode: %lu, type: %d",
696907342ec2SBaokun Li 				qf_inums[type], type);
69707c319d32SAditya Kali 		return PTR_ERR(qf_inode);
69717c319d32SAditya Kali 	}
69727c319d32SAditya Kali 
6973bcb13850SJan Kara 	/* Don't account quota for quota files to avoid recursion */
6974bcb13850SJan Kara 	qf_inode->i_flags |= S_NOQUOTA;
6975daf647d2STheodore Ts'o 	lockdep_set_quota_inode(qf_inode, I_DATA_SEM_QUOTA);
69767212b95eSJan Kara 	err = dquot_load_quota_inode(qf_inode, type, format_id, flags);
6977daf647d2STheodore Ts'o 	if (err)
6978daf647d2STheodore Ts'o 		lockdep_set_quota_inode(qf_inode, I_DATA_SEM_NORMAL);
697961157b24SPan Bian 	iput(qf_inode);
69807c319d32SAditya Kali 
69817c319d32SAditya Kali 	return err;
69827c319d32SAditya Kali }
69837c319d32SAditya Kali 
69847c319d32SAditya Kali /* Enable usage tracking for all quota types. */
698525c6d98fSJan Kara int ext4_enable_quotas(struct super_block *sb)
69867c319d32SAditya Kali {
69877c319d32SAditya Kali 	int type, err = 0;
6988a2d4a646SJan Kara 	unsigned long qf_inums[EXT4_MAXQUOTAS] = {
69897c319d32SAditya Kali 		le32_to_cpu(EXT4_SB(sb)->s_es->s_usr_quota_inum),
6990689c958cSLi Xi 		le32_to_cpu(EXT4_SB(sb)->s_es->s_grp_quota_inum),
6991689c958cSLi Xi 		le32_to_cpu(EXT4_SB(sb)->s_es->s_prj_quota_inum)
69927c319d32SAditya Kali 	};
699349da9392SJan Kara 	bool quota_mopt[EXT4_MAXQUOTAS] = {
699449da9392SJan Kara 		test_opt(sb, USRQUOTA),
699549da9392SJan Kara 		test_opt(sb, GRPQUOTA),
699649da9392SJan Kara 		test_opt(sb, PRJQUOTA),
699749da9392SJan Kara 	};
69987c319d32SAditya Kali 
699991389240SJan Kara 	sb_dqopt(sb)->flags |= DQUOT_QUOTA_SYS_FILE | DQUOT_NOLIST_DIRTY;
7000a2d4a646SJan Kara 	for (type = 0; type < EXT4_MAXQUOTAS; type++) {
70017c319d32SAditya Kali 		if (qf_inums[type]) {
70027c319d32SAditya Kali 			err = ext4_quota_enable(sb, type, QFMT_VFS_V1,
700349da9392SJan Kara 				DQUOT_USAGE_ENABLED |
700449da9392SJan Kara 				(quota_mopt[type] ? DQUOT_LIMITS_ENABLED : 0));
70057c319d32SAditya Kali 			if (err) {
70067c319d32SAditya Kali 				ext4_warning(sb,
700772ba7450STheodore Ts'o 					"Failed to enable quota tracking "
700807342ec2SBaokun Li 					"(type=%d, err=%d, ino=%lu). "
700907342ec2SBaokun Li 					"Please run e2fsck to fix.", type,
701007342ec2SBaokun Li 					err, qf_inums[type]);
70114013d47aSJan Kara 				for (type--; type >= 0; type--) {
70124013d47aSJan Kara 					struct inode *inode;
70134013d47aSJan Kara 
70144013d47aSJan Kara 					inode = sb_dqopt(sb)->files[type];
70154013d47aSJan Kara 					if (inode)
70164013d47aSJan Kara 						inode = igrab(inode);
70177f144fd0SJunichi Uekawa 					dquot_quota_off(sb, type);
70184013d47aSJan Kara 					if (inode) {
70194013d47aSJan Kara 						lockdep_set_quota_inode(inode,
70204013d47aSJan Kara 							I_DATA_SEM_NORMAL);
70214013d47aSJan Kara 						iput(inode);
70224013d47aSJan Kara 					}
70234013d47aSJan Kara 				}
70247f144fd0SJunichi Uekawa 
70257c319d32SAditya Kali 				return err;
70267c319d32SAditya Kali 			}
70277c319d32SAditya Kali 		}
70287c319d32SAditya Kali 	}
70297c319d32SAditya Kali 	return 0;
70307c319d32SAditya Kali }
70317c319d32SAditya Kali 
7032ca0e05e4SDmitry Monakhov static int ext4_quota_off(struct super_block *sb, int type)
7033ca0e05e4SDmitry Monakhov {
703421f97697SJan Kara 	struct inode *inode = sb_dqopt(sb)->files[type];
703521f97697SJan Kara 	handle_t *handle;
7036957153fcSJan Kara 	int err;
703721f97697SJan Kara 
703887009d86SDmitry Monakhov 	/* Force all delayed allocation blocks to be allocated.
703987009d86SDmitry Monakhov 	 * Caller already holds s_umount sem */
704087009d86SDmitry Monakhov 	if (test_opt(sb, DELALLOC))
7041ca0e05e4SDmitry Monakhov 		sync_filesystem(sb);
7042ca0e05e4SDmitry Monakhov 
7043957153fcSJan Kara 	if (!inode || !igrab(inode))
70440b268590SAmir Goldstein 		goto out;
70450b268590SAmir Goldstein 
7046957153fcSJan Kara 	err = dquot_quota_off(sb, type);
7047964edf66SJan Kara 	if (err || ext4_has_feature_quota(sb))
7048957153fcSJan Kara 		goto out_put;
7049957153fcSJan Kara 
7050957153fcSJan Kara 	inode_lock(inode);
705161a92987SJan Kara 	/*
705261a92987SJan Kara 	 * Update modification times of quota files when userspace can
705361a92987SJan Kara 	 * start looking at them. If we fail, we return success anyway since
705461a92987SJan Kara 	 * this is not a hard failure and quotas are already disabled.
705561a92987SJan Kara 	 */
70569924a92aSTheodore Ts'o 	handle = ext4_journal_start(inode, EXT4_HT_QUOTA, 1);
70574209ae12SHarshad Shirwadkar 	if (IS_ERR(handle)) {
70584209ae12SHarshad Shirwadkar 		err = PTR_ERR(handle);
7059957153fcSJan Kara 		goto out_unlock;
70604209ae12SHarshad Shirwadkar 	}
7061957153fcSJan Kara 	EXT4_I(inode)->i_flags &= ~(EXT4_NOATIME_FL | EXT4_IMMUTABLE_FL);
7062957153fcSJan Kara 	inode_set_flags(inode, 0, S_NOATIME | S_IMMUTABLE);
7063eeca7ea1SDeepa Dinamani 	inode->i_mtime = inode->i_ctime = current_time(inode);
70644209ae12SHarshad Shirwadkar 	err = ext4_mark_inode_dirty(handle, inode);
706521f97697SJan Kara 	ext4_journal_stop(handle);
7066957153fcSJan Kara out_unlock:
7067957153fcSJan Kara 	inode_unlock(inode);
7068957153fcSJan Kara out_put:
7069964edf66SJan Kara 	lockdep_set_quota_inode(inode, I_DATA_SEM_NORMAL);
7070957153fcSJan Kara 	iput(inode);
7071957153fcSJan Kara 	return err;
707221f97697SJan Kara out:
7073ca0e05e4SDmitry Monakhov 	return dquot_quota_off(sb, type);
7074ca0e05e4SDmitry Monakhov }
7075ca0e05e4SDmitry Monakhov 
7076ac27a0ecSDave Kleikamp /* Read data from quotafile - avoid pagecache and such because we cannot afford
7077ac27a0ecSDave Kleikamp  * acquiring the locks... As quota files are never truncated and quota code
7078ac27a0ecSDave Kleikamp  * itself serializes the operations (and no one else should touch the files)
7079ac27a0ecSDave Kleikamp  * we don't have to be afraid of races */
7080617ba13bSMingming Cao static ssize_t ext4_quota_read(struct super_block *sb, int type, char *data,
7081ac27a0ecSDave Kleikamp 			       size_t len, loff_t off)
7082ac27a0ecSDave Kleikamp {
7083ac27a0ecSDave Kleikamp 	struct inode *inode = sb_dqopt(sb)->files[type];
7084725d26d3SAneesh Kumar K.V 	ext4_lblk_t blk = off >> EXT4_BLOCK_SIZE_BITS(sb);
7085ac27a0ecSDave Kleikamp 	int offset = off & (sb->s_blocksize - 1);
7086ac27a0ecSDave Kleikamp 	int tocopy;
7087ac27a0ecSDave Kleikamp 	size_t toread;
7088ac27a0ecSDave Kleikamp 	struct buffer_head *bh;
7089ac27a0ecSDave Kleikamp 	loff_t i_size = i_size_read(inode);
7090ac27a0ecSDave Kleikamp 
7091ac27a0ecSDave Kleikamp 	if (off > i_size)
7092ac27a0ecSDave Kleikamp 		return 0;
7093ac27a0ecSDave Kleikamp 	if (off+len > i_size)
7094ac27a0ecSDave Kleikamp 		len = i_size-off;
7095ac27a0ecSDave Kleikamp 	toread = len;
7096ac27a0ecSDave Kleikamp 	while (toread > 0) {
709766267814SJiangshan Yi 		tocopy = min_t(unsigned long, sb->s_blocksize - offset, toread);
70981c215028STheodore Ts'o 		bh = ext4_bread(NULL, inode, blk, 0);
70991c215028STheodore Ts'o 		if (IS_ERR(bh))
71001c215028STheodore Ts'o 			return PTR_ERR(bh);
7101ac27a0ecSDave Kleikamp 		if (!bh)	/* A hole? */
7102ac27a0ecSDave Kleikamp 			memset(data, 0, tocopy);
7103ac27a0ecSDave Kleikamp 		else
7104ac27a0ecSDave Kleikamp 			memcpy(data, bh->b_data+offset, tocopy);
7105ac27a0ecSDave Kleikamp 		brelse(bh);
7106ac27a0ecSDave Kleikamp 		offset = 0;
7107ac27a0ecSDave Kleikamp 		toread -= tocopy;
7108ac27a0ecSDave Kleikamp 		data += tocopy;
7109ac27a0ecSDave Kleikamp 		blk++;
7110ac27a0ecSDave Kleikamp 	}
7111ac27a0ecSDave Kleikamp 	return len;
7112ac27a0ecSDave Kleikamp }
7113ac27a0ecSDave Kleikamp 
7114ac27a0ecSDave Kleikamp /* Write to quotafile (we know the transaction is already started and has
7115ac27a0ecSDave Kleikamp  * enough credits) */
7116617ba13bSMingming Cao static ssize_t ext4_quota_write(struct super_block *sb, int type,
7117ac27a0ecSDave Kleikamp 				const char *data, size_t len, loff_t off)
7118ac27a0ecSDave Kleikamp {
7119ac27a0ecSDave Kleikamp 	struct inode *inode = sb_dqopt(sb)->files[type];
7120725d26d3SAneesh Kumar K.V 	ext4_lblk_t blk = off >> EXT4_BLOCK_SIZE_BITS(sb);
71214209ae12SHarshad Shirwadkar 	int err = 0, err2 = 0, offset = off & (sb->s_blocksize - 1);
7122c5e298aeSTheodore Ts'o 	int retries = 0;
7123ac27a0ecSDave Kleikamp 	struct buffer_head *bh;
7124ac27a0ecSDave Kleikamp 	handle_t *handle = journal_current_handle();
7125ac27a0ecSDave Kleikamp 
7126380a0091SYe Bin 	if (!handle) {
7127b31e1552SEric Sandeen 		ext4_msg(sb, KERN_WARNING, "Quota write (off=%llu, len=%llu)"
7128b31e1552SEric Sandeen 			" cancelled because transaction is not started",
71299c3013e9SJan Kara 			(unsigned long long)off, (unsigned long long)len);
71309c3013e9SJan Kara 		return -EIO;
71319c3013e9SJan Kara 	}
713267eeb568SDmitry Monakhov 	/*
713367eeb568SDmitry Monakhov 	 * Since we account only one data block in transaction credits,
713467eeb568SDmitry Monakhov 	 * then it is impossible to cross a block boundary.
713567eeb568SDmitry Monakhov 	 */
713667eeb568SDmitry Monakhov 	if (sb->s_blocksize - offset < len) {
713767eeb568SDmitry Monakhov 		ext4_msg(sb, KERN_WARNING, "Quota write (off=%llu, len=%llu)"
713867eeb568SDmitry Monakhov 			" cancelled because not block aligned",
713967eeb568SDmitry Monakhov 			(unsigned long long)off, (unsigned long long)len);
714067eeb568SDmitry Monakhov 		return -EIO;
714167eeb568SDmitry Monakhov 	}
714267eeb568SDmitry Monakhov 
7143c5e298aeSTheodore Ts'o 	do {
7144c5e298aeSTheodore Ts'o 		bh = ext4_bread(handle, inode, blk,
7145c5e298aeSTheodore Ts'o 				EXT4_GET_BLOCKS_CREATE |
7146c5e298aeSTheodore Ts'o 				EXT4_GET_BLOCKS_METADATA_NOFAIL);
714745586c70SMasahiro Yamada 	} while (PTR_ERR(bh) == -ENOSPC &&
7148c5e298aeSTheodore Ts'o 		 ext4_should_retry_alloc(inode->i_sb, &retries));
71491c215028STheodore Ts'o 	if (IS_ERR(bh))
71501c215028STheodore Ts'o 		return PTR_ERR(bh);
7151ac27a0ecSDave Kleikamp 	if (!bh)
7152ac27a0ecSDave Kleikamp 		goto out;
71535d601255Sliang xie 	BUFFER_TRACE(bh, "get write access");
7154188c299eSJan Kara 	err = ext4_journal_get_write_access(handle, sb, bh, EXT4_JTR_NONE);
7155ac27a0ecSDave Kleikamp 	if (err) {
7156ac27a0ecSDave Kleikamp 		brelse(bh);
71571c215028STheodore Ts'o 		return err;
7158ac27a0ecSDave Kleikamp 	}
7159ac27a0ecSDave Kleikamp 	lock_buffer(bh);
716067eeb568SDmitry Monakhov 	memcpy(bh->b_data+offset, data, len);
7161ac27a0ecSDave Kleikamp 	flush_dcache_page(bh->b_page);
7162ac27a0ecSDave Kleikamp 	unlock_buffer(bh);
71630390131bSFrank Mayhar 	err = ext4_handle_dirty_metadata(handle, NULL, bh);
7164ac27a0ecSDave Kleikamp 	brelse(bh);
7165ac27a0ecSDave Kleikamp out:
716667eeb568SDmitry Monakhov 	if (inode->i_size < off + len) {
716767eeb568SDmitry Monakhov 		i_size_write(inode, off + len);
7168617ba13bSMingming Cao 		EXT4_I(inode)->i_disksize = inode->i_size;
71694209ae12SHarshad Shirwadkar 		err2 = ext4_mark_inode_dirty(handle, inode);
71704209ae12SHarshad Shirwadkar 		if (unlikely(err2 && !err))
71714209ae12SHarshad Shirwadkar 			err = err2;
717221f97697SJan Kara 	}
71734209ae12SHarshad Shirwadkar 	return err ? err : len;
7174ac27a0ecSDave Kleikamp }
7175ac27a0ecSDave Kleikamp #endif
7176ac27a0ecSDave Kleikamp 
#if !defined(CONFIG_EXT2_FS) && !defined(CONFIG_EXT2_FS_MODULE) && defined(CONFIG_EXT4_USE_FOR_EXT2)
/* Register ext2_fs_type; a failure is only logged, never propagated. */
static inline void register_as_ext2(void)
{
	int err = register_filesystem(&ext2_fs_type);

	if (!err)
		return;
	printk(KERN_WARNING
	       "EXT4-fs: Unable to register as ext2 (%d)\n", err);
}

/* Undo register_as_ext2(). */
static inline void unregister_as_ext2(void)
{
	unregister_filesystem(&ext2_fs_type);
}

/*
 * Return 1 if the feature set of @sb is acceptable for an ext2 mount,
 * 0 otherwise.  Unknown incompat features always disqualify; unknown
 * ro_compat features only matter when the superblock is not read-only.
 */
static inline int ext2_feature_set_ok(struct super_block *sb)
{
	if (ext4_has_unknown_ext2_incompat_features(sb))
		return 0;
	if (sb_rdonly(sb))
		return 1;
	return !ext4_has_unknown_ext2_ro_compat_features(sb);
}
#else
/* This configuration does not use ext4 for ext2: provide no-op stubs. */
static inline void register_as_ext2(void) { }
static inline void unregister_as_ext2(void) { }
static inline int ext2_feature_set_ok(struct super_block *sb) { return 0; }
#endif
720624b58424STheodore Ts'o 
720724b58424STheodore Ts'o static inline void register_as_ext3(void)
720824b58424STheodore Ts'o {
720924b58424STheodore Ts'o 	int err = register_filesystem(&ext3_fs_type);
721024b58424STheodore Ts'o 	if (err)
721124b58424STheodore Ts'o 		printk(KERN_WARNING
721224b58424STheodore Ts'o 		       "EXT4-fs: Unable to register as ext3 (%d)\n", err);
721324b58424STheodore Ts'o }
721424b58424STheodore Ts'o 
/* Undo register_as_ext3() by unregistering ext3_fs_type. */
static inline void unregister_as_ext3(void)
{
	unregister_filesystem(&ext3_fs_type);
}
72192035e776STheodore Ts'o 
/*
 * Return 1 if the feature set of @sb is acceptable for an ext3 mount,
 * 0 otherwise.  The journal feature is mandatory and unknown incompat
 * features always disqualify; unknown ro_compat features only matter when
 * the superblock is not read-only.
 */
static inline int ext3_feature_set_ok(struct super_block *sb)
{
	if (ext4_has_unknown_ext3_incompat_features(sb) ||
	    !ext4_has_feature_journal(sb))
		return 0;
	if (sb_rdonly(sb))
		return 1;
	return !ext4_has_unknown_ext3_ro_compat_features(sb);
}
723224b58424STheodore Ts'o 
723303010a33STheodore Ts'o static struct file_system_type ext4_fs_type = {
7234ac27a0ecSDave Kleikamp 	.owner			= THIS_MODULE,
723503010a33STheodore Ts'o 	.name			= "ext4",
7236cebe85d5SLukas Czerner 	.init_fs_context	= ext4_init_fs_context,
7237cebe85d5SLukas Czerner 	.parameters		= ext4_param_specs,
7238ac27a0ecSDave Kleikamp 	.kill_sb		= kill_block_super,
723914f3db55SChristian Brauner 	.fs_flags		= FS_REQUIRES_DEV | FS_ALLOW_IDMAP,
7240ac27a0ecSDave Kleikamp };
72417f78e035SEric W. Biederman MODULE_ALIAS_FS("ext4");
7242ac27a0ecSDave Kleikamp 
7243e9e3bcecSEric Sandeen /* Shared across all ext4 file systems */
7244e9e3bcecSEric Sandeen wait_queue_head_t ext4__ioend_wq[EXT4_WQ_HASH_SZ];
7245e9e3bcecSEric Sandeen 
72465dabfc78STheodore Ts'o static int __init ext4_init_fs(void)
7247ac27a0ecSDave Kleikamp {
7248e9e3bcecSEric Sandeen 	int i, err;
7249c9de560dSAlex Tomas 
7250e294a537STheodore Ts'o 	ratelimit_state_init(&ext4_mount_msg_ratelimit, 30 * HZ, 64);
725107c0c5d8SAl Viro 	ext4_li_info = NULL;
725207c0c5d8SAl Viro 
72539a4c8019SCarlos Maiolino 	/* Build-time check for flags consistency */
725412e9b892SDmitry Monakhov 	ext4_check_flag_values();
7255e9e3bcecSEric Sandeen 
7256e142d052SJan Kara 	for (i = 0; i < EXT4_WQ_HASH_SZ; i++)
7257e9e3bcecSEric Sandeen 		init_waitqueue_head(&ext4__ioend_wq[i]);
7258e9e3bcecSEric Sandeen 
725951865fdaSZheng Liu 	err = ext4_init_es();
72606fd058f7STheodore Ts'o 	if (err)
72616fd058f7STheodore Ts'o 		return err;
726251865fdaSZheng Liu 
72631dc0aa46SEric Whitney 	err = ext4_init_pending();
72641dc0aa46SEric Whitney 	if (err)
726522cfe4b4SEric Biggers 		goto out7;
726622cfe4b4SEric Biggers 
726722cfe4b4SEric Biggers 	err = ext4_init_post_read_processing();
726822cfe4b4SEric Biggers 	if (err)
72691dc0aa46SEric Whitney 		goto out6;
72701dc0aa46SEric Whitney 
727151865fdaSZheng Liu 	err = ext4_init_pageio();
727251865fdaSZheng Liu 	if (err)
7273b5799018STheodore Ts'o 		goto out5;
727451865fdaSZheng Liu 
72755dabfc78STheodore Ts'o 	err = ext4_init_system_zone();
7276bd2d0210STheodore Ts'o 	if (err)
7277b5799018STheodore Ts'o 		goto out4;
7278857ac889SLukas Czerner 
7279b5799018STheodore Ts'o 	err = ext4_init_sysfs();
7280dd68314cSTheodore Ts'o 	if (err)
7281b5799018STheodore Ts'o 		goto out3;
7282857ac889SLukas Czerner 
72835dabfc78STheodore Ts'o 	err = ext4_init_mballoc();
7284ac27a0ecSDave Kleikamp 	if (err)
7285c9de560dSAlex Tomas 		goto out2;
7286ac27a0ecSDave Kleikamp 	err = init_inodecache();
7287ac27a0ecSDave Kleikamp 	if (err)
7288ac27a0ecSDave Kleikamp 		goto out1;
7289aa75f4d3SHarshad Shirwadkar 
7290aa75f4d3SHarshad Shirwadkar 	err = ext4_fc_init_dentry_cache();
7291aa75f4d3SHarshad Shirwadkar 	if (err)
7292aa75f4d3SHarshad Shirwadkar 		goto out05;
7293aa75f4d3SHarshad Shirwadkar 
729424b58424STheodore Ts'o 	register_as_ext3();
72952035e776STheodore Ts'o 	register_as_ext2();
729603010a33STheodore Ts'o 	err = register_filesystem(&ext4_fs_type);
7297ac27a0ecSDave Kleikamp 	if (err)
7298ac27a0ecSDave Kleikamp 		goto out;
7299bfff6873SLukas Czerner 
7300ac27a0ecSDave Kleikamp 	return 0;
7301ac27a0ecSDave Kleikamp out:
730224b58424STheodore Ts'o 	unregister_as_ext2();
730324b58424STheodore Ts'o 	unregister_as_ext3();
7304ab047d51SSebastian Andrzej Siewior 	ext4_fc_destroy_dentry_cache();
7305aa75f4d3SHarshad Shirwadkar out05:
7306ac27a0ecSDave Kleikamp 	destroy_inodecache();
7307ac27a0ecSDave Kleikamp out1:
73085dabfc78STheodore Ts'o 	ext4_exit_mballoc();
73099c191f70ST Makphaibulchoke out2:
7310b5799018STheodore Ts'o 	ext4_exit_sysfs();
7311b5799018STheodore Ts'o out3:
7312dd68314cSTheodore Ts'o 	ext4_exit_system_zone();
7313b5799018STheodore Ts'o out4:
73145dabfc78STheodore Ts'o 	ext4_exit_pageio();
7315b5799018STheodore Ts'o out5:
731622cfe4b4SEric Biggers 	ext4_exit_post_read_processing();
73171dc0aa46SEric Whitney out6:
731822cfe4b4SEric Biggers 	ext4_exit_pending();
731922cfe4b4SEric Biggers out7:
732051865fdaSZheng Liu 	ext4_exit_es();
732151865fdaSZheng Liu 
7322ac27a0ecSDave Kleikamp 	return err;
7323ac27a0ecSDave Kleikamp }
7324ac27a0ecSDave Kleikamp 
73255dabfc78STheodore Ts'o static void __exit ext4_exit_fs(void)
7326ac27a0ecSDave Kleikamp {
7327bfff6873SLukas Czerner 	ext4_destroy_lazyinit_thread();
732824b58424STheodore Ts'o 	unregister_as_ext2();
732924b58424STheodore Ts'o 	unregister_as_ext3();
733003010a33STheodore Ts'o 	unregister_filesystem(&ext4_fs_type);
7331ab047d51SSebastian Andrzej Siewior 	ext4_fc_destroy_dentry_cache();
7332ac27a0ecSDave Kleikamp 	destroy_inodecache();
73335dabfc78STheodore Ts'o 	ext4_exit_mballoc();
7334b5799018STheodore Ts'o 	ext4_exit_sysfs();
73355dabfc78STheodore Ts'o 	ext4_exit_system_zone();
73365dabfc78STheodore Ts'o 	ext4_exit_pageio();
733722cfe4b4SEric Biggers 	ext4_exit_post_read_processing();
7338dd12ed14SEric Sandeen 	ext4_exit_es();
73391dc0aa46SEric Whitney 	ext4_exit_pending();
7340ac27a0ecSDave Kleikamp }
7341ac27a0ecSDave Kleikamp 
/* Module metadata and the init/exit entry points defined above. */
MODULE_AUTHOR("Remy Card, Stephen Tweedie, Andrew Morton, Andreas Dilger, Theodore Ts'o and others");
MODULE_DESCRIPTION("Fourth Extended Filesystem");
MODULE_LICENSE("GPL");
/* NOTE(review): presumably asks for crc32c to be loaded before this module - confirm */
MODULE_SOFTDEP("pre: crc32c");
module_init(ext4_init_fs)
module_exit(ext4_exit_fs)
7348