xref: /linux/fs/ext4/super.c (revision 1dc0aa46e74a3366e12f426b7caaca477853e9c3)
1f5166768STheodore Ts'o // SPDX-License-Identifier: GPL-2.0
2ac27a0ecSDave Kleikamp /*
3617ba13bSMingming Cao  *  linux/fs/ext4/super.c
4ac27a0ecSDave Kleikamp  *
5ac27a0ecSDave Kleikamp  * Copyright (C) 1992, 1993, 1994, 1995
6ac27a0ecSDave Kleikamp  * Remy Card (card@masi.ibp.fr)
7ac27a0ecSDave Kleikamp  * Laboratoire MASI - Institut Blaise Pascal
8ac27a0ecSDave Kleikamp  * Universite Pierre et Marie Curie (Paris VI)
9ac27a0ecSDave Kleikamp  *
10ac27a0ecSDave Kleikamp  *  from
11ac27a0ecSDave Kleikamp  *
12ac27a0ecSDave Kleikamp  *  linux/fs/minix/inode.c
13ac27a0ecSDave Kleikamp  *
14ac27a0ecSDave Kleikamp  *  Copyright (C) 1991, 1992  Linus Torvalds
15ac27a0ecSDave Kleikamp  *
16ac27a0ecSDave Kleikamp  *  Big-endian to little-endian byte-swapping/bitmaps by
17ac27a0ecSDave Kleikamp  *        David S. Miller (davem@caip.rutgers.edu), 1995
18ac27a0ecSDave Kleikamp  */
19ac27a0ecSDave Kleikamp 
20ac27a0ecSDave Kleikamp #include <linux/module.h>
21ac27a0ecSDave Kleikamp #include <linux/string.h>
22ac27a0ecSDave Kleikamp #include <linux/fs.h>
23ac27a0ecSDave Kleikamp #include <linux/time.h>
24c5ca7c76STheodore Ts'o #include <linux/vmalloc.h>
25ac27a0ecSDave Kleikamp #include <linux/slab.h>
26ac27a0ecSDave Kleikamp #include <linux/init.h>
27ac27a0ecSDave Kleikamp #include <linux/blkdev.h>
2866114cadSTejun Heo #include <linux/backing-dev.h>
29ac27a0ecSDave Kleikamp #include <linux/parser.h>
30ac27a0ecSDave Kleikamp #include <linux/buffer_head.h>
31a5694255SChristoph Hellwig #include <linux/exportfs.h>
32ac27a0ecSDave Kleikamp #include <linux/vfs.h>
33ac27a0ecSDave Kleikamp #include <linux/random.h>
34ac27a0ecSDave Kleikamp #include <linux/mount.h>
35ac27a0ecSDave Kleikamp #include <linux/namei.h>
36ac27a0ecSDave Kleikamp #include <linux/quotaops.h>
37ac27a0ecSDave Kleikamp #include <linux/seq_file.h>
383197ebdbSTheodore Ts'o #include <linux/ctype.h>
391330593eSVignesh Babu #include <linux/log2.h>
40717d50e4SAndreas Dilger #include <linux/crc16.h>
41ef510424SDan Williams #include <linux/dax.h>
427abc52c2SDan Magenheimer #include <linux/cleancache.h>
437c0f6ba6SLinus Torvalds #include <linux/uaccess.h>
44ee73f9a5SJeff Layton #include <linux/iversion.h>
45ac27a0ecSDave Kleikamp 
46bfff6873SLukas Czerner #include <linux/kthread.h>
47bfff6873SLukas Czerner #include <linux/freezer.h>
48bfff6873SLukas Czerner 
493dcf5451SChristoph Hellwig #include "ext4.h"
504a092d73STheodore Ts'o #include "ext4_extents.h"	/* Needed for trace points definition */
513dcf5451SChristoph Hellwig #include "ext4_jbd2.h"
52ac27a0ecSDave Kleikamp #include "xattr.h"
53ac27a0ecSDave Kleikamp #include "acl.h"
543661d286STheodore Ts'o #include "mballoc.h"
550c9ec4beSDarrick J. Wong #include "fsmap.h"
56ac27a0ecSDave Kleikamp 
579bffad1eSTheodore Ts'o #define CREATE_TRACE_POINTS
589bffad1eSTheodore Ts'o #include <trace/events/ext4.h>
599bffad1eSTheodore Ts'o 
600b75a840SLukas Czerner static struct ext4_lazy_init *ext4_li_info;
610b75a840SLukas Czerner static struct mutex ext4_li_mtx;
62e294a537STheodore Ts'o static struct ratelimit_state ext4_mount_msg_ratelimit;
639f6200bbSTheodore Ts'o 
64617ba13bSMingming Cao static int ext4_load_journal(struct super_block *, struct ext4_super_block *,
65ac27a0ecSDave Kleikamp 			     unsigned long journal_devnum);
662adf6da8STheodore Ts'o static int ext4_show_options(struct seq_file *seq, struct dentry *root);
67e2d67052STheodore Ts'o static int ext4_commit_super(struct super_block *sb, int sync);
68617ba13bSMingming Cao static void ext4_mark_recovery_complete(struct super_block *sb,
69617ba13bSMingming Cao 					struct ext4_super_block *es);
70617ba13bSMingming Cao static void ext4_clear_journal_err(struct super_block *sb,
71617ba13bSMingming Cao 				   struct ext4_super_block *es);
72617ba13bSMingming Cao static int ext4_sync_fs(struct super_block *sb, int wait);
73617ba13bSMingming Cao static int ext4_remount(struct super_block *sb, int *flags, char *data);
74617ba13bSMingming Cao static int ext4_statfs(struct dentry *dentry, struct kstatfs *buf);
75c4be0c1dSTakashi Sato static int ext4_unfreeze(struct super_block *sb);
76c4be0c1dSTakashi Sato static int ext4_freeze(struct super_block *sb);
77152a0836SAl Viro static struct dentry *ext4_mount(struct file_system_type *fs_type, int flags,
78152a0836SAl Viro 		       const char *dev_name, void *data);
792035e776STheodore Ts'o static inline int ext2_feature_set_ok(struct super_block *sb);
802035e776STheodore Ts'o static inline int ext3_feature_set_ok(struct super_block *sb);
81d39195c3SAmir Goldstein static int ext4_feature_set_ok(struct super_block *sb, int readonly);
82bfff6873SLukas Czerner static void ext4_destroy_lazyinit_thread(void);
83bfff6873SLukas Czerner static void ext4_unregister_li_request(struct super_block *sb);
848f1f7453SEric Sandeen static void ext4_clear_request_list(void);
85c6cb7e77SEric Whitney static struct inode *ext4_get_journal_inode(struct super_block *sb,
86c6cb7e77SEric Whitney 					    unsigned int journal_inum);
87ac27a0ecSDave Kleikamp 
88e74031fdSJan Kara /*
89e74031fdSJan Kara  * Lock ordering
90e74031fdSJan Kara  *
91e74031fdSJan Kara  * Note the difference between i_mmap_sem (EXT4_I(inode)->i_mmap_sem) and
92e74031fdSJan Kara  * i_mmap_rwsem (inode->i_mmap_rwsem)!
93e74031fdSJan Kara  *
94e74031fdSJan Kara  * page fault path:
95e74031fdSJan Kara  * mmap_sem -> sb_start_pagefault -> i_mmap_sem (r) -> transaction start ->
96e74031fdSJan Kara  *   page lock -> i_data_sem (rw)
97e74031fdSJan Kara  *
98e74031fdSJan Kara  * buffered write path:
99e74031fdSJan Kara  * sb_start_write -> i_mutex -> mmap_sem
100e74031fdSJan Kara  * sb_start_write -> i_mutex -> transaction start -> page lock ->
101e74031fdSJan Kara  *   i_data_sem (rw)
102e74031fdSJan Kara  *
103e74031fdSJan Kara  * truncate:
1041d39834fSNikolay Borisov  * sb_start_write -> i_mutex -> i_mmap_sem (w) -> i_mmap_rwsem (w) -> page lock
1051d39834fSNikolay Borisov  * sb_start_write -> i_mutex -> i_mmap_sem (w) -> transaction start ->
1061d39834fSNikolay Borisov  *   i_data_sem (rw)
107e74031fdSJan Kara  *
108e74031fdSJan Kara  * direct IO:
1091d39834fSNikolay Borisov  * sb_start_write -> i_mutex -> mmap_sem
1101d39834fSNikolay Borisov  * sb_start_write -> i_mutex -> transaction start -> i_data_sem (rw)
111e74031fdSJan Kara  *
112e74031fdSJan Kara  * writepages:
113e74031fdSJan Kara  * transaction start -> page lock(s) -> i_data_sem (rw)
114e74031fdSJan Kara  */
115e74031fdSJan Kara 
/*
 * When no native ext2 driver is configured (neither built in nor as a
 * module) and CONFIG_EXT4_USE_FOR_EXT2 is set, define an "ext2" filesystem
 * type whose mount entry point is ext4_mount().  IS_EXT2_SB() then tests
 * whether the superblock's block device is held by that type; in every
 * other configuration it is the constant 0.
 */
#if !defined(CONFIG_EXT2_FS) && !defined(CONFIG_EXT2_FS_MODULE) && defined(CONFIG_EXT4_USE_FOR_EXT2)
static struct file_system_type ext2_fs_type = {
	.name		= "ext2",
	.owner		= THIS_MODULE,
	.fs_flags	= FS_REQUIRES_DEV,
	.mount		= ext4_mount,
	.kill_sb	= kill_block_super,
};
MODULE_ALIAS_FS("ext2");
MODULE_ALIAS("ext2");
#define IS_EXT2_SB(sb) ((sb)->s_bdev->bd_holder == &ext2_fs_type)
#else
#define IS_EXT2_SB(sb) (0)
#endif
1302035e776STheodore Ts'o 
1312035e776STheodore Ts'o 
132ba69f9abSJan Kara static struct file_system_type ext3_fs_type = {
133ba69f9abSJan Kara 	.owner		= THIS_MODULE,
134ba69f9abSJan Kara 	.name		= "ext3",
135152a0836SAl Viro 	.mount		= ext4_mount,
136ba69f9abSJan Kara 	.kill_sb	= kill_block_super,
137ba69f9abSJan Kara 	.fs_flags	= FS_REQUIRES_DEV,
138ba69f9abSJan Kara };
1397f78e035SEric W. Biederman MODULE_ALIAS_FS("ext3");
140fa7614ddSEric W. Biederman MODULE_ALIAS("ext3");
141ba69f9abSJan Kara #define IS_EXT3_SB(sb) ((sb)->s_bdev->bd_holder == &ext3_fs_type)
142bd81d8eeSLaurent Vivier 
143d25425f8SDarrick J. Wong static int ext4_verify_csum_type(struct super_block *sb,
144d25425f8SDarrick J. Wong 				 struct ext4_super_block *es)
145d25425f8SDarrick J. Wong {
146e2b911c5SDarrick J. Wong 	if (!ext4_has_feature_metadata_csum(sb))
147d25425f8SDarrick J. Wong 		return 1;
148d25425f8SDarrick J. Wong 
149d25425f8SDarrick J. Wong 	return es->s_checksum_type == EXT4_CRC32C_CHKSUM;
150d25425f8SDarrick J. Wong }
151d25425f8SDarrick J. Wong 
152a9c47317SDarrick J. Wong static __le32 ext4_superblock_csum(struct super_block *sb,
153a9c47317SDarrick J. Wong 				   struct ext4_super_block *es)
154a9c47317SDarrick J. Wong {
155a9c47317SDarrick J. Wong 	struct ext4_sb_info *sbi = EXT4_SB(sb);
156a9c47317SDarrick J. Wong 	int offset = offsetof(struct ext4_super_block, s_checksum);
157a9c47317SDarrick J. Wong 	__u32 csum;
158a9c47317SDarrick J. Wong 
159a9c47317SDarrick J. Wong 	csum = ext4_chksum(sbi, ~0, (char *)es, offset);
160a9c47317SDarrick J. Wong 
161a9c47317SDarrick J. Wong 	return cpu_to_le32(csum);
162a9c47317SDarrick J. Wong }
163a9c47317SDarrick J. Wong 
164c197855eSStephen Hemminger static int ext4_superblock_csum_verify(struct super_block *sb,
165a9c47317SDarrick J. Wong 				       struct ext4_super_block *es)
166a9c47317SDarrick J. Wong {
1679aa5d32bSDmitry Monakhov 	if (!ext4_has_metadata_csum(sb))
168a9c47317SDarrick J. Wong 		return 1;
169a9c47317SDarrick J. Wong 
170a9c47317SDarrick J. Wong 	return es->s_checksum == ext4_superblock_csum(sb, es);
171a9c47317SDarrick J. Wong }
172a9c47317SDarrick J. Wong 
17306db49e6STheodore Ts'o void ext4_superblock_csum_set(struct super_block *sb)
174a9c47317SDarrick J. Wong {
17506db49e6STheodore Ts'o 	struct ext4_super_block *es = EXT4_SB(sb)->s_es;
17606db49e6STheodore Ts'o 
1779aa5d32bSDmitry Monakhov 	if (!ext4_has_metadata_csum(sb))
178a9c47317SDarrick J. Wong 		return;
179a9c47317SDarrick J. Wong 
180a9c47317SDarrick J. Wong 	es->s_checksum = ext4_superblock_csum(sb, es);
181a9c47317SDarrick J. Wong }
182a9c47317SDarrick J. Wong 
1839933fc0aSTheodore Ts'o void *ext4_kvmalloc(size_t size, gfp_t flags)
1849933fc0aSTheodore Ts'o {
1859933fc0aSTheodore Ts'o 	void *ret;
1869933fc0aSTheodore Ts'o 
1878be04b93SJoe Perches 	ret = kmalloc(size, flags | __GFP_NOWARN);
1889933fc0aSTheodore Ts'o 	if (!ret)
1899933fc0aSTheodore Ts'o 		ret = __vmalloc(size, flags, PAGE_KERNEL);
1909933fc0aSTheodore Ts'o 	return ret;
1919933fc0aSTheodore Ts'o }
1929933fc0aSTheodore Ts'o 
1939933fc0aSTheodore Ts'o void *ext4_kvzalloc(size_t size, gfp_t flags)
1949933fc0aSTheodore Ts'o {
1959933fc0aSTheodore Ts'o 	void *ret;
1969933fc0aSTheodore Ts'o 
1978be04b93SJoe Perches 	ret = kzalloc(size, flags | __GFP_NOWARN);
1989933fc0aSTheodore Ts'o 	if (!ret)
1999933fc0aSTheodore Ts'o 		ret = __vmalloc(size, flags | __GFP_ZERO, PAGE_KERNEL);
2009933fc0aSTheodore Ts'o 	return ret;
2019933fc0aSTheodore Ts'o }
2029933fc0aSTheodore Ts'o 
2038fadc143SAlexandre Ratchov ext4_fsblk_t ext4_block_bitmap(struct super_block *sb,
2048fadc143SAlexandre Ratchov 			       struct ext4_group_desc *bg)
205bd81d8eeSLaurent Vivier {
2063a14589cSAneesh Kumar K.V 	return le32_to_cpu(bg->bg_block_bitmap_lo) |
2078fadc143SAlexandre Ratchov 		(EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT ?
2088fadc143SAlexandre Ratchov 		 (ext4_fsblk_t)le32_to_cpu(bg->bg_block_bitmap_hi) << 32 : 0);
209bd81d8eeSLaurent Vivier }
210bd81d8eeSLaurent Vivier 
2118fadc143SAlexandre Ratchov ext4_fsblk_t ext4_inode_bitmap(struct super_block *sb,
2128fadc143SAlexandre Ratchov 			       struct ext4_group_desc *bg)
213bd81d8eeSLaurent Vivier {
2145272f837SAneesh Kumar K.V 	return le32_to_cpu(bg->bg_inode_bitmap_lo) |
2158fadc143SAlexandre Ratchov 		(EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT ?
2168fadc143SAlexandre Ratchov 		 (ext4_fsblk_t)le32_to_cpu(bg->bg_inode_bitmap_hi) << 32 : 0);
217bd81d8eeSLaurent Vivier }
218bd81d8eeSLaurent Vivier 
2198fadc143SAlexandre Ratchov ext4_fsblk_t ext4_inode_table(struct super_block *sb,
2208fadc143SAlexandre Ratchov 			      struct ext4_group_desc *bg)
221bd81d8eeSLaurent Vivier {
2225272f837SAneesh Kumar K.V 	return le32_to_cpu(bg->bg_inode_table_lo) |
2238fadc143SAlexandre Ratchov 		(EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT ?
2248fadc143SAlexandre Ratchov 		 (ext4_fsblk_t)le32_to_cpu(bg->bg_inode_table_hi) << 32 : 0);
225bd81d8eeSLaurent Vivier }
226bd81d8eeSLaurent Vivier 
227021b65bbSTheodore Ts'o __u32 ext4_free_group_clusters(struct super_block *sb,
228560671a0SAneesh Kumar K.V 			       struct ext4_group_desc *bg)
229560671a0SAneesh Kumar K.V {
230560671a0SAneesh Kumar K.V 	return le16_to_cpu(bg->bg_free_blocks_count_lo) |
231560671a0SAneesh Kumar K.V 		(EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT ?
232560671a0SAneesh Kumar K.V 		 (__u32)le16_to_cpu(bg->bg_free_blocks_count_hi) << 16 : 0);
233560671a0SAneesh Kumar K.V }
234560671a0SAneesh Kumar K.V 
235560671a0SAneesh Kumar K.V __u32 ext4_free_inodes_count(struct super_block *sb,
236560671a0SAneesh Kumar K.V 			      struct ext4_group_desc *bg)
237560671a0SAneesh Kumar K.V {
238560671a0SAneesh Kumar K.V 	return le16_to_cpu(bg->bg_free_inodes_count_lo) |
239560671a0SAneesh Kumar K.V 		(EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT ?
240560671a0SAneesh Kumar K.V 		 (__u32)le16_to_cpu(bg->bg_free_inodes_count_hi) << 16 : 0);
241560671a0SAneesh Kumar K.V }
242560671a0SAneesh Kumar K.V 
243560671a0SAneesh Kumar K.V __u32 ext4_used_dirs_count(struct super_block *sb,
244560671a0SAneesh Kumar K.V 			      struct ext4_group_desc *bg)
245560671a0SAneesh Kumar K.V {
246560671a0SAneesh Kumar K.V 	return le16_to_cpu(bg->bg_used_dirs_count_lo) |
247560671a0SAneesh Kumar K.V 		(EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT ?
248560671a0SAneesh Kumar K.V 		 (__u32)le16_to_cpu(bg->bg_used_dirs_count_hi) << 16 : 0);
249560671a0SAneesh Kumar K.V }
250560671a0SAneesh Kumar K.V 
251560671a0SAneesh Kumar K.V __u32 ext4_itable_unused_count(struct super_block *sb,
252560671a0SAneesh Kumar K.V 			      struct ext4_group_desc *bg)
253560671a0SAneesh Kumar K.V {
254560671a0SAneesh Kumar K.V 	return le16_to_cpu(bg->bg_itable_unused_lo) |
255560671a0SAneesh Kumar K.V 		(EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT ?
256560671a0SAneesh Kumar K.V 		 (__u32)le16_to_cpu(bg->bg_itable_unused_hi) << 16 : 0);
257560671a0SAneesh Kumar K.V }
258560671a0SAneesh Kumar K.V 
2598fadc143SAlexandre Ratchov void ext4_block_bitmap_set(struct super_block *sb,
2608fadc143SAlexandre Ratchov 			   struct ext4_group_desc *bg, ext4_fsblk_t blk)
261bd81d8eeSLaurent Vivier {
2623a14589cSAneesh Kumar K.V 	bg->bg_block_bitmap_lo = cpu_to_le32((u32)blk);
2638fadc143SAlexandre Ratchov 	if (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT)
2648fadc143SAlexandre Ratchov 		bg->bg_block_bitmap_hi = cpu_to_le32(blk >> 32);
265bd81d8eeSLaurent Vivier }
266bd81d8eeSLaurent Vivier 
2678fadc143SAlexandre Ratchov void ext4_inode_bitmap_set(struct super_block *sb,
2688fadc143SAlexandre Ratchov 			   struct ext4_group_desc *bg, ext4_fsblk_t blk)
269bd81d8eeSLaurent Vivier {
2705272f837SAneesh Kumar K.V 	bg->bg_inode_bitmap_lo  = cpu_to_le32((u32)blk);
2718fadc143SAlexandre Ratchov 	if (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT)
2728fadc143SAlexandre Ratchov 		bg->bg_inode_bitmap_hi = cpu_to_le32(blk >> 32);
273bd81d8eeSLaurent Vivier }
274bd81d8eeSLaurent Vivier 
2758fadc143SAlexandre Ratchov void ext4_inode_table_set(struct super_block *sb,
2768fadc143SAlexandre Ratchov 			  struct ext4_group_desc *bg, ext4_fsblk_t blk)
277bd81d8eeSLaurent Vivier {
2785272f837SAneesh Kumar K.V 	bg->bg_inode_table_lo = cpu_to_le32((u32)blk);
2798fadc143SAlexandre Ratchov 	if (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT)
2808fadc143SAlexandre Ratchov 		bg->bg_inode_table_hi = cpu_to_le32(blk >> 32);
281bd81d8eeSLaurent Vivier }
282bd81d8eeSLaurent Vivier 
283021b65bbSTheodore Ts'o void ext4_free_group_clusters_set(struct super_block *sb,
284560671a0SAneesh Kumar K.V 				  struct ext4_group_desc *bg, __u32 count)
285560671a0SAneesh Kumar K.V {
286560671a0SAneesh Kumar K.V 	bg->bg_free_blocks_count_lo = cpu_to_le16((__u16)count);
287560671a0SAneesh Kumar K.V 	if (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT)
288560671a0SAneesh Kumar K.V 		bg->bg_free_blocks_count_hi = cpu_to_le16(count >> 16);
289560671a0SAneesh Kumar K.V }
290560671a0SAneesh Kumar K.V 
291560671a0SAneesh Kumar K.V void ext4_free_inodes_set(struct super_block *sb,
292560671a0SAneesh Kumar K.V 			  struct ext4_group_desc *bg, __u32 count)
293560671a0SAneesh Kumar K.V {
294560671a0SAneesh Kumar K.V 	bg->bg_free_inodes_count_lo = cpu_to_le16((__u16)count);
295560671a0SAneesh Kumar K.V 	if (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT)
296560671a0SAneesh Kumar K.V 		bg->bg_free_inodes_count_hi = cpu_to_le16(count >> 16);
297560671a0SAneesh Kumar K.V }
298560671a0SAneesh Kumar K.V 
299560671a0SAneesh Kumar K.V void ext4_used_dirs_set(struct super_block *sb,
300560671a0SAneesh Kumar K.V 			  struct ext4_group_desc *bg, __u32 count)
301560671a0SAneesh Kumar K.V {
302560671a0SAneesh Kumar K.V 	bg->bg_used_dirs_count_lo = cpu_to_le16((__u16)count);
303560671a0SAneesh Kumar K.V 	if (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT)
304560671a0SAneesh Kumar K.V 		bg->bg_used_dirs_count_hi = cpu_to_le16(count >> 16);
305560671a0SAneesh Kumar K.V }
306560671a0SAneesh Kumar K.V 
307560671a0SAneesh Kumar K.V void ext4_itable_unused_set(struct super_block *sb,
308560671a0SAneesh Kumar K.V 			  struct ext4_group_desc *bg, __u32 count)
309560671a0SAneesh Kumar K.V {
310560671a0SAneesh Kumar K.V 	bg->bg_itable_unused_lo = cpu_to_le16((__u16)count);
311560671a0SAneesh Kumar K.V 	if (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT)
312560671a0SAneesh Kumar K.V 		bg->bg_itable_unused_hi = cpu_to_le16(count >> 16);
313560671a0SAneesh Kumar K.V }
314560671a0SAneesh Kumar K.V 
3156a0678a7SArnd Bergmann static void __ext4_update_tstamp(__le32 *lo, __u8 *hi)
3166a0678a7SArnd Bergmann {
3176a0678a7SArnd Bergmann 	time64_t now = ktime_get_real_seconds();
3186a0678a7SArnd Bergmann 
3196a0678a7SArnd Bergmann 	now = clamp_val(now, 0, (1ull << 40) - 1);
3206a0678a7SArnd Bergmann 
3216a0678a7SArnd Bergmann 	*lo = cpu_to_le32(lower_32_bits(now));
3226a0678a7SArnd Bergmann 	*hi = upper_32_bits(now);
3236a0678a7SArnd Bergmann }
3246a0678a7SArnd Bergmann 
3256a0678a7SArnd Bergmann static time64_t __ext4_get_tstamp(__le32 *lo, __u8 *hi)
3266a0678a7SArnd Bergmann {
3276a0678a7SArnd Bergmann 	return ((time64_t)(*hi) << 32) + le32_to_cpu(*lo);
3286a0678a7SArnd Bergmann }
/*
 * Field-name wrappers: for a superblock member such as s_last_error_time,
 * pass the addresses of (es)->field and its (es)->field_hi companion to
 * the helpers above.
 */
#define ext4_update_tstamp(es, field) \
	__ext4_update_tstamp(&(es)->field, &(es)->field ## _hi)
#define ext4_get_tstamp(es, field) \
	__ext4_get_tstamp(&(es)->field, &(es)->field ## _hi)
333d3d1faf6SCurt Wohlgemuth 
3341c13d5c0STheodore Ts'o static void __save_error_info(struct super_block *sb, const char *func,
3351c13d5c0STheodore Ts'o 			    unsigned int line)
3361c13d5c0STheodore Ts'o {
3371c13d5c0STheodore Ts'o 	struct ext4_super_block *es = EXT4_SB(sb)->s_es;
3381c13d5c0STheodore Ts'o 
3391c13d5c0STheodore Ts'o 	EXT4_SB(sb)->s_mount_state |= EXT4_ERROR_FS;
3401b46617bSTheodore Ts'o 	if (bdev_read_only(sb->s_bdev))
3411b46617bSTheodore Ts'o 		return;
3421c13d5c0STheodore Ts'o 	es->s_state |= cpu_to_le16(EXT4_ERROR_FS);
3436a0678a7SArnd Bergmann 	ext4_update_tstamp(es, s_last_error_time);
3441c13d5c0STheodore Ts'o 	strncpy(es->s_last_error_func, func, sizeof(es->s_last_error_func));
3451c13d5c0STheodore Ts'o 	es->s_last_error_line = cpu_to_le32(line);
3461c13d5c0STheodore Ts'o 	if (!es->s_first_error_time) {
3471c13d5c0STheodore Ts'o 		es->s_first_error_time = es->s_last_error_time;
3486a0678a7SArnd Bergmann 		es->s_first_error_time_hi = es->s_last_error_time_hi;
3491c13d5c0STheodore Ts'o 		strncpy(es->s_first_error_func, func,
3501c13d5c0STheodore Ts'o 			sizeof(es->s_first_error_func));
3511c13d5c0STheodore Ts'o 		es->s_first_error_line = cpu_to_le32(line);
3521c13d5c0STheodore Ts'o 		es->s_first_error_ino = es->s_last_error_ino;
3531c13d5c0STheodore Ts'o 		es->s_first_error_block = es->s_last_error_block;
3541c13d5c0STheodore Ts'o 	}
35566e61a9eSTheodore Ts'o 	/*
35666e61a9eSTheodore Ts'o 	 * Start the daily error reporting function if it hasn't been
35766e61a9eSTheodore Ts'o 	 * started already
35866e61a9eSTheodore Ts'o 	 */
35966e61a9eSTheodore Ts'o 	if (!es->s_error_count)
36066e61a9eSTheodore Ts'o 		mod_timer(&EXT4_SB(sb)->s_err_report, jiffies + 24*60*60*HZ);
361ba39ebb6SWei Yongjun 	le32_add_cpu(&es->s_error_count, 1);
3621c13d5c0STheodore Ts'o }
3631c13d5c0STheodore Ts'o 
/*
 * Record the error in the superblock via __save_error_info() and then call
 * ext4_commit_super() with sync = 1.  The commit's return value is ignored.
 */
static void save_error_info(struct super_block *sb, const char *func,
			    unsigned int line)
{
	__save_error_info(sb, func, line);

	ext4_commit_super(sb, 1);
}
3701c13d5c0STheodore Ts'o 
371bdfe0cbdSTheodore Ts'o /*
372bdfe0cbdSTheodore Ts'o  * The del_gendisk() function uninitializes the disk-specific data
373bdfe0cbdSTheodore Ts'o  * structures, including the bdi structure, without telling anyone
374bdfe0cbdSTheodore Ts'o  * else.  Once this happens, any attempt to call mark_buffer_dirty()
375bdfe0cbdSTheodore Ts'o  * (for example, by ext4_commit_super), will cause a kernel OOPS.
376bdfe0cbdSTheodore Ts'o  * This is a kludge to prevent these oops until we can put in a proper
377bdfe0cbdSTheodore Ts'o  * hook in del_gendisk() to inform the VFS and file system layers.
378bdfe0cbdSTheodore Ts'o  */
379bdfe0cbdSTheodore Ts'o static int block_device_ejected(struct super_block *sb)
380bdfe0cbdSTheodore Ts'o {
381bdfe0cbdSTheodore Ts'o 	struct inode *bd_inode = sb->s_bdev->bd_inode;
382bdfe0cbdSTheodore Ts'o 	struct backing_dev_info *bdi = inode_to_bdi(bd_inode);
383bdfe0cbdSTheodore Ts'o 
384bdfe0cbdSTheodore Ts'o 	return bdi->dev == NULL;
385bdfe0cbdSTheodore Ts'o }
386bdfe0cbdSTheodore Ts'o 
38718aadd47SBobi Jam static void ext4_journal_commit_callback(journal_t *journal, transaction_t *txn)
38818aadd47SBobi Jam {
38918aadd47SBobi Jam 	struct super_block		*sb = journal->j_private;
39018aadd47SBobi Jam 	struct ext4_sb_info		*sbi = EXT4_SB(sb);
39118aadd47SBobi Jam 	int				error = is_journal_aborted(journal);
3925d3ee208SDmitry Monakhov 	struct ext4_journal_cb_entry	*jce;
39318aadd47SBobi Jam 
3945d3ee208SDmitry Monakhov 	BUG_ON(txn->t_state == T_FINISHED);
395a0154344SDaeho Jeong 
396a0154344SDaeho Jeong 	ext4_process_freed_data(sb, txn->t_tid);
397a0154344SDaeho Jeong 
39818aadd47SBobi Jam 	spin_lock(&sbi->s_md_lock);
3995d3ee208SDmitry Monakhov 	while (!list_empty(&txn->t_private_list)) {
4005d3ee208SDmitry Monakhov 		jce = list_entry(txn->t_private_list.next,
4015d3ee208SDmitry Monakhov 				 struct ext4_journal_cb_entry, jce_list);
40218aadd47SBobi Jam 		list_del_init(&jce->jce_list);
40318aadd47SBobi Jam 		spin_unlock(&sbi->s_md_lock);
40418aadd47SBobi Jam 		jce->jce_func(sb, jce, error);
40518aadd47SBobi Jam 		spin_lock(&sbi->s_md_lock);
40618aadd47SBobi Jam 	}
40718aadd47SBobi Jam 	spin_unlock(&sbi->s_md_lock);
40818aadd47SBobi Jam }
4091c13d5c0STheodore Ts'o 
410ac27a0ecSDave Kleikamp /* Deal with the reporting of failure conditions on a filesystem such as
411ac27a0ecSDave Kleikamp  * inconsistencies detected or read IO failures.
412ac27a0ecSDave Kleikamp  *
413ac27a0ecSDave Kleikamp  * On ext2, we can store the error state of the filesystem in the
414617ba13bSMingming Cao  * superblock.  That is not possible on ext4, because we may have other
415ac27a0ecSDave Kleikamp  * write ordering constraints on the superblock which prevent us from
416ac27a0ecSDave Kleikamp  * writing it out straight away; and given that the journal is about to
417ac27a0ecSDave Kleikamp  * be aborted, we can't rely on the current, or future, transactions to
418ac27a0ecSDave Kleikamp  * write out the superblock safely.
419ac27a0ecSDave Kleikamp  *
420dab291afSMingming Cao  * We'll just use the jbd2_journal_abort() error code to record an error in
421d6b198bcSThadeu Lima de Souza Cascardo  * the journal instead.  On recovery, the journal will complain about
422ac27a0ecSDave Kleikamp  * that error until we've noted it down and cleared it.
423ac27a0ecSDave Kleikamp  */
424ac27a0ecSDave Kleikamp 
425617ba13bSMingming Cao static void ext4_handle_error(struct super_block *sb)
426ac27a0ecSDave Kleikamp {
427327eaf73STheodore Ts'o 	if (test_opt(sb, WARN_ON_ERROR))
428327eaf73STheodore Ts'o 		WARN_ON_ONCE(1);
429327eaf73STheodore Ts'o 
430bc98a42cSDavid Howells 	if (sb_rdonly(sb))
431ac27a0ecSDave Kleikamp 		return;
432ac27a0ecSDave Kleikamp 
433ac27a0ecSDave Kleikamp 	if (!test_opt(sb, ERRORS_CONT)) {
434617ba13bSMingming Cao 		journal_t *journal = EXT4_SB(sb)->s_journal;
435ac27a0ecSDave Kleikamp 
4364ab2f15bSTheodore Ts'o 		EXT4_SB(sb)->s_mount_flags |= EXT4_MF_FS_ABORTED;
437ac27a0ecSDave Kleikamp 		if (journal)
438dab291afSMingming Cao 			jbd2_journal_abort(journal, -EIO);
439ac27a0ecSDave Kleikamp 	}
440ac27a0ecSDave Kleikamp 	if (test_opt(sb, ERRORS_RO)) {
441b31e1552SEric Sandeen 		ext4_msg(sb, KERN_CRIT, "Remounting filesystem read-only");
4424418e141SDmitry Monakhov 		/*
4434418e141SDmitry Monakhov 		 * Make sure updated value of ->s_mount_flags will be visible
4444418e141SDmitry Monakhov 		 * before ->s_flags update
4454418e141SDmitry Monakhov 		 */
4464418e141SDmitry Monakhov 		smp_wmb();
4471751e8a6SLinus Torvalds 		sb->s_flags |= SB_RDONLY;
448ac27a0ecSDave Kleikamp 	}
4494327ba52SDaeho Jeong 	if (test_opt(sb, ERRORS_PANIC)) {
4504327ba52SDaeho Jeong 		if (EXT4_SB(sb)->s_journal &&
4514327ba52SDaeho Jeong 		  !(EXT4_SB(sb)->s_journal->j_flags & JBD2_REC_ERR))
4524327ba52SDaeho Jeong 			return;
453617ba13bSMingming Cao 		panic("EXT4-fs (device %s): panic forced after error\n",
454ac27a0ecSDave Kleikamp 			sb->s_id);
455ac27a0ecSDave Kleikamp 	}
4564327ba52SDaeho Jeong }
457ac27a0ecSDave Kleikamp 
/* Rate-limit check for error messages, using the per-superblock state. */
#define ext4_error_ratelimit(sb)					\
	___ratelimit(&(EXT4_SB(sb)->s_err_ratelimit_state), "EXT4-fs error")
461efbed4dcSTheodore Ts'o 
46212062dddSEric Sandeen void __ext4_error(struct super_block *sb, const char *function,
463c398eda0STheodore Ts'o 		  unsigned int line, const char *fmt, ...)
464ac27a0ecSDave Kleikamp {
4650ff2ea7dSJoe Perches 	struct va_format vaf;
466ac27a0ecSDave Kleikamp 	va_list args;
467ac27a0ecSDave Kleikamp 
4680db1ff22STheodore Ts'o 	if (unlikely(ext4_forced_shutdown(EXT4_SB(sb))))
4690db1ff22STheodore Ts'o 		return;
4700db1ff22STheodore Ts'o 
471ccf0f32aSTheodore Ts'o 	trace_ext4_error(sb, function, line);
472efbed4dcSTheodore Ts'o 	if (ext4_error_ratelimit(sb)) {
473ac27a0ecSDave Kleikamp 		va_start(args, fmt);
4740ff2ea7dSJoe Perches 		vaf.fmt = fmt;
4750ff2ea7dSJoe Perches 		vaf.va = &args;
476efbed4dcSTheodore Ts'o 		printk(KERN_CRIT
477efbed4dcSTheodore Ts'o 		       "EXT4-fs error (device %s): %s:%d: comm %s: %pV\n",
4780ff2ea7dSJoe Perches 		       sb->s_id, function, line, current->comm, &vaf);
479ac27a0ecSDave Kleikamp 		va_end(args);
480efbed4dcSTheodore Ts'o 	}
481f3fc0210STheodore Ts'o 	save_error_info(sb, function, line);
482617ba13bSMingming Cao 	ext4_handle_error(sb);
483ac27a0ecSDave Kleikamp }
484ac27a0ecSDave Kleikamp 
485e7c96e8eSJoe Perches void __ext4_error_inode(struct inode *inode, const char *function,
486c398eda0STheodore Ts'o 			unsigned int line, ext4_fsblk_t block,
487273df556SFrank Mayhar 			const char *fmt, ...)
488273df556SFrank Mayhar {
489273df556SFrank Mayhar 	va_list args;
490f7c21177STheodore Ts'o 	struct va_format vaf;
4911c13d5c0STheodore Ts'o 	struct ext4_super_block *es = EXT4_SB(inode->i_sb)->s_es;
492273df556SFrank Mayhar 
4930db1ff22STheodore Ts'o 	if (unlikely(ext4_forced_shutdown(EXT4_SB(inode->i_sb))))
4940db1ff22STheodore Ts'o 		return;
4950db1ff22STheodore Ts'o 
496ccf0f32aSTheodore Ts'o 	trace_ext4_error(inode->i_sb, function, line);
4971c13d5c0STheodore Ts'o 	es->s_last_error_ino = cpu_to_le32(inode->i_ino);
4981c13d5c0STheodore Ts'o 	es->s_last_error_block = cpu_to_le64(block);
499efbed4dcSTheodore Ts'o 	if (ext4_error_ratelimit(inode->i_sb)) {
500273df556SFrank Mayhar 		va_start(args, fmt);
501f7c21177STheodore Ts'o 		vaf.fmt = fmt;
502f7c21177STheodore Ts'o 		vaf.va = &args;
503c398eda0STheodore Ts'o 		if (block)
504d9ee81daSJoe Perches 			printk(KERN_CRIT "EXT4-fs error (device %s): %s:%d: "
505d9ee81daSJoe Perches 			       "inode #%lu: block %llu: comm %s: %pV\n",
506d9ee81daSJoe Perches 			       inode->i_sb->s_id, function, line, inode->i_ino,
507d9ee81daSJoe Perches 			       block, current->comm, &vaf);
508d9ee81daSJoe Perches 		else
509d9ee81daSJoe Perches 			printk(KERN_CRIT "EXT4-fs error (device %s): %s:%d: "
510d9ee81daSJoe Perches 			       "inode #%lu: comm %s: %pV\n",
511d9ee81daSJoe Perches 			       inode->i_sb->s_id, function, line, inode->i_ino,
512d9ee81daSJoe Perches 			       current->comm, &vaf);
513273df556SFrank Mayhar 		va_end(args);
514efbed4dcSTheodore Ts'o 	}
515efbed4dcSTheodore Ts'o 	save_error_info(inode->i_sb, function, line);
516273df556SFrank Mayhar 	ext4_handle_error(inode->i_sb);
517273df556SFrank Mayhar }
518273df556SFrank Mayhar 
519e7c96e8eSJoe Perches void __ext4_error_file(struct file *file, const char *function,
520f7c21177STheodore Ts'o 		       unsigned int line, ext4_fsblk_t block,
521f7c21177STheodore Ts'o 		       const char *fmt, ...)
522273df556SFrank Mayhar {
523273df556SFrank Mayhar 	va_list args;
524f7c21177STheodore Ts'o 	struct va_format vaf;
5251c13d5c0STheodore Ts'o 	struct ext4_super_block *es;
526496ad9aaSAl Viro 	struct inode *inode = file_inode(file);
527273df556SFrank Mayhar 	char pathname[80], *path;
528273df556SFrank Mayhar 
5290db1ff22STheodore Ts'o 	if (unlikely(ext4_forced_shutdown(EXT4_SB(inode->i_sb))))
5300db1ff22STheodore Ts'o 		return;
5310db1ff22STheodore Ts'o 
532ccf0f32aSTheodore Ts'o 	trace_ext4_error(inode->i_sb, function, line);
5331c13d5c0STheodore Ts'o 	es = EXT4_SB(inode->i_sb)->s_es;
5341c13d5c0STheodore Ts'o 	es->s_last_error_ino = cpu_to_le32(inode->i_ino);
535efbed4dcSTheodore Ts'o 	if (ext4_error_ratelimit(inode->i_sb)) {
5369bf39ab2SMiklos Szeredi 		path = file_path(file, pathname, sizeof(pathname));
537f9a62d09SDan Carpenter 		if (IS_ERR(path))
538273df556SFrank Mayhar 			path = "(unknown)";
539f7c21177STheodore Ts'o 		va_start(args, fmt);
540f7c21177STheodore Ts'o 		vaf.fmt = fmt;
541f7c21177STheodore Ts'o 		vaf.va = &args;
542d9ee81daSJoe Perches 		if (block)
543d9ee81daSJoe Perches 			printk(KERN_CRIT
544d9ee81daSJoe Perches 			       "EXT4-fs error (device %s): %s:%d: inode #%lu: "
545d9ee81daSJoe Perches 			       "block %llu: comm %s: path %s: %pV\n",
546d9ee81daSJoe Perches 			       inode->i_sb->s_id, function, line, inode->i_ino,
547d9ee81daSJoe Perches 			       block, current->comm, path, &vaf);
548d9ee81daSJoe Perches 		else
549d9ee81daSJoe Perches 			printk(KERN_CRIT
550d9ee81daSJoe Perches 			       "EXT4-fs error (device %s): %s:%d: inode #%lu: "
551d9ee81daSJoe Perches 			       "comm %s: path %s: %pV\n",
552d9ee81daSJoe Perches 			       inode->i_sb->s_id, function, line, inode->i_ino,
553d9ee81daSJoe Perches 			       current->comm, path, &vaf);
554273df556SFrank Mayhar 		va_end(args);
555efbed4dcSTheodore Ts'o 	}
556efbed4dcSTheodore Ts'o 	save_error_info(inode->i_sb, function, line);
557273df556SFrank Mayhar 	ext4_handle_error(inode->i_sb);
558273df556SFrank Mayhar }
559273df556SFrank Mayhar 
560722887ddSTheodore Ts'o const char *ext4_decode_error(struct super_block *sb, int errno,
561ac27a0ecSDave Kleikamp 			      char nbuf[16])
562ac27a0ecSDave Kleikamp {
563ac27a0ecSDave Kleikamp 	char *errstr = NULL;
564ac27a0ecSDave Kleikamp 
565ac27a0ecSDave Kleikamp 	switch (errno) {
5666a797d27SDarrick J. Wong 	case -EFSCORRUPTED:
5676a797d27SDarrick J. Wong 		errstr = "Corrupt filesystem";
5686a797d27SDarrick J. Wong 		break;
5696a797d27SDarrick J. Wong 	case -EFSBADCRC:
5706a797d27SDarrick J. Wong 		errstr = "Filesystem failed CRC";
5716a797d27SDarrick J. Wong 		break;
572ac27a0ecSDave Kleikamp 	case -EIO:
573ac27a0ecSDave Kleikamp 		errstr = "IO failure";
574ac27a0ecSDave Kleikamp 		break;
575ac27a0ecSDave Kleikamp 	case -ENOMEM:
576ac27a0ecSDave Kleikamp 		errstr = "Out of memory";
577ac27a0ecSDave Kleikamp 		break;
578ac27a0ecSDave Kleikamp 	case -EROFS:
57978f1ddbbSTheodore Ts'o 		if (!sb || (EXT4_SB(sb)->s_journal &&
58078f1ddbbSTheodore Ts'o 			    EXT4_SB(sb)->s_journal->j_flags & JBD2_ABORT))
581ac27a0ecSDave Kleikamp 			errstr = "Journal has aborted";
582ac27a0ecSDave Kleikamp 		else
583ac27a0ecSDave Kleikamp 			errstr = "Readonly filesystem";
584ac27a0ecSDave Kleikamp 		break;
585ac27a0ecSDave Kleikamp 	default:
586ac27a0ecSDave Kleikamp 		/* If the caller passed in an extra buffer for unknown
587ac27a0ecSDave Kleikamp 		 * errors, textualise them now.  Else we just return
588ac27a0ecSDave Kleikamp 		 * NULL. */
589ac27a0ecSDave Kleikamp 		if (nbuf) {
590ac27a0ecSDave Kleikamp 			/* Check for truncated error codes... */
591ac27a0ecSDave Kleikamp 			if (snprintf(nbuf, 16, "error %d", -errno) >= 0)
592ac27a0ecSDave Kleikamp 				errstr = nbuf;
593ac27a0ecSDave Kleikamp 		}
594ac27a0ecSDave Kleikamp 		break;
595ac27a0ecSDave Kleikamp 	}
596ac27a0ecSDave Kleikamp 
597ac27a0ecSDave Kleikamp 	return errstr;
598ac27a0ecSDave Kleikamp }
599ac27a0ecSDave Kleikamp 
600617ba13bSMingming Cao /* __ext4_std_error decodes expected errors from journaling functions
601ac27a0ecSDave Kleikamp  * automatically and invokes the appropriate error response.  */
602ac27a0ecSDave Kleikamp 
603c398eda0STheodore Ts'o void __ext4_std_error(struct super_block *sb, const char *function,
604c398eda0STheodore Ts'o 		      unsigned int line, int errno)
605ac27a0ecSDave Kleikamp {
606ac27a0ecSDave Kleikamp 	char nbuf[16];
607ac27a0ecSDave Kleikamp 	const char *errstr;
608ac27a0ecSDave Kleikamp 
6090db1ff22STheodore Ts'o 	if (unlikely(ext4_forced_shutdown(EXT4_SB(sb))))
6100db1ff22STheodore Ts'o 		return;
6110db1ff22STheodore Ts'o 
612ac27a0ecSDave Kleikamp 	/* Special case: if the error is EROFS, and we're not already
613ac27a0ecSDave Kleikamp 	 * inside a transaction, then there's really no point in logging
614ac27a0ecSDave Kleikamp 	 * an error. */
615bc98a42cSDavid Howells 	if (errno == -EROFS && journal_current_handle() == NULL && sb_rdonly(sb))
616ac27a0ecSDave Kleikamp 		return;
617ac27a0ecSDave Kleikamp 
618efbed4dcSTheodore Ts'o 	if (ext4_error_ratelimit(sb)) {
619617ba13bSMingming Cao 		errstr = ext4_decode_error(sb, errno, nbuf);
620c398eda0STheodore Ts'o 		printk(KERN_CRIT "EXT4-fs error (device %s) in %s:%d: %s\n",
621c398eda0STheodore Ts'o 		       sb->s_id, function, line, errstr);
622efbed4dcSTheodore Ts'o 	}
623ac27a0ecSDave Kleikamp 
624efbed4dcSTheodore Ts'o 	save_error_info(sb, function, line);
625617ba13bSMingming Cao 	ext4_handle_error(sb);
626ac27a0ecSDave Kleikamp }
627ac27a0ecSDave Kleikamp 
628ac27a0ecSDave Kleikamp /*
629617ba13bSMingming Cao  * ext4_abort is a much stronger failure handler than ext4_error.  The
630ac27a0ecSDave Kleikamp  * abort function may be used to deal with unrecoverable failures such
631ac27a0ecSDave Kleikamp  * as journal IO errors or ENOMEM at a critical moment in log management.
632ac27a0ecSDave Kleikamp  *
633ac27a0ecSDave Kleikamp  * We unconditionally force the filesystem into an ABORT|READONLY state,
634ac27a0ecSDave Kleikamp  * unless the error response on the fs has been set to panic in which
635ac27a0ecSDave Kleikamp  * case we take the easy way out and panic immediately.
636ac27a0ecSDave Kleikamp  */
637ac27a0ecSDave Kleikamp 
638c67d859eSTheodore Ts'o void __ext4_abort(struct super_block *sb, const char *function,
639c398eda0STheodore Ts'o 		unsigned int line, const char *fmt, ...)
640ac27a0ecSDave Kleikamp {
641651e1c3bSJoe Perches 	struct va_format vaf;
642ac27a0ecSDave Kleikamp 	va_list args;
643ac27a0ecSDave Kleikamp 
6440db1ff22STheodore Ts'o 	if (unlikely(ext4_forced_shutdown(EXT4_SB(sb))))
6450db1ff22STheodore Ts'o 		return;
6460db1ff22STheodore Ts'o 
6471c13d5c0STheodore Ts'o 	save_error_info(sb, function, line);
648ac27a0ecSDave Kleikamp 	va_start(args, fmt);
649651e1c3bSJoe Perches 	vaf.fmt = fmt;
650651e1c3bSJoe Perches 	vaf.va = &args;
651651e1c3bSJoe Perches 	printk(KERN_CRIT "EXT4-fs error (device %s): %s:%d: %pV\n",
652651e1c3bSJoe Perches 	       sb->s_id, function, line, &vaf);
653ac27a0ecSDave Kleikamp 	va_end(args);
654ac27a0ecSDave Kleikamp 
655bc98a42cSDavid Howells 	if (sb_rdonly(sb) == 0) {
656b31e1552SEric Sandeen 		ext4_msg(sb, KERN_CRIT, "Remounting filesystem read-only");
6574ab2f15bSTheodore Ts'o 		EXT4_SB(sb)->s_mount_flags |= EXT4_MF_FS_ABORTED;
6584418e141SDmitry Monakhov 		/*
6594418e141SDmitry Monakhov 		 * Make sure updated value of ->s_mount_flags will be visible
6604418e141SDmitry Monakhov 		 * before ->s_flags update
6614418e141SDmitry Monakhov 		 */
6624418e141SDmitry Monakhov 		smp_wmb();
6631751e8a6SLinus Torvalds 		sb->s_flags |= SB_RDONLY;
664ef2cabf7SHidehiro Kawai 		if (EXT4_SB(sb)->s_journal)
665dab291afSMingming Cao 			jbd2_journal_abort(EXT4_SB(sb)->s_journal, -EIO);
6661c13d5c0STheodore Ts'o 		save_error_info(sb, function, line);
6671c13d5c0STheodore Ts'o 	}
6684327ba52SDaeho Jeong 	if (test_opt(sb, ERRORS_PANIC)) {
6694327ba52SDaeho Jeong 		if (EXT4_SB(sb)->s_journal &&
6704327ba52SDaeho Jeong 		  !(EXT4_SB(sb)->s_journal->j_flags & JBD2_REC_ERR))
6714327ba52SDaeho Jeong 			return;
6721c13d5c0STheodore Ts'o 		panic("EXT4-fs panic from previous error\n");
673ac27a0ecSDave Kleikamp 	}
6744327ba52SDaeho Jeong }
675ac27a0ecSDave Kleikamp 
676e7c96e8eSJoe Perches void __ext4_msg(struct super_block *sb,
677e7c96e8eSJoe Perches 		const char *prefix, const char *fmt, ...)
678b31e1552SEric Sandeen {
6790ff2ea7dSJoe Perches 	struct va_format vaf;
680b31e1552SEric Sandeen 	va_list args;
681b31e1552SEric Sandeen 
682efbed4dcSTheodore Ts'o 	if (!___ratelimit(&(EXT4_SB(sb)->s_msg_ratelimit_state), "EXT4-fs"))
683efbed4dcSTheodore Ts'o 		return;
684efbed4dcSTheodore Ts'o 
685b31e1552SEric Sandeen 	va_start(args, fmt);
6860ff2ea7dSJoe Perches 	vaf.fmt = fmt;
6870ff2ea7dSJoe Perches 	vaf.va = &args;
6880ff2ea7dSJoe Perches 	printk("%sEXT4-fs (%s): %pV\n", prefix, sb->s_id, &vaf);
689b31e1552SEric Sandeen 	va_end(args);
690b31e1552SEric Sandeen }
691b31e1552SEric Sandeen 
692b03a2f7eSAndreas Dilger #define ext4_warning_ratelimit(sb)					\
693b03a2f7eSAndreas Dilger 		___ratelimit(&(EXT4_SB(sb)->s_warning_ratelimit_state),	\
694b03a2f7eSAndreas Dilger 			     "EXT4-fs warning")
695b03a2f7eSAndreas Dilger 
69612062dddSEric Sandeen void __ext4_warning(struct super_block *sb, const char *function,
697c398eda0STheodore Ts'o 		    unsigned int line, const char *fmt, ...)
698ac27a0ecSDave Kleikamp {
6990ff2ea7dSJoe Perches 	struct va_format vaf;
700ac27a0ecSDave Kleikamp 	va_list args;
701ac27a0ecSDave Kleikamp 
702b03a2f7eSAndreas Dilger 	if (!ext4_warning_ratelimit(sb))
703efbed4dcSTheodore Ts'o 		return;
704efbed4dcSTheodore Ts'o 
705ac27a0ecSDave Kleikamp 	va_start(args, fmt);
7060ff2ea7dSJoe Perches 	vaf.fmt = fmt;
7070ff2ea7dSJoe Perches 	vaf.va = &args;
7080ff2ea7dSJoe Perches 	printk(KERN_WARNING "EXT4-fs warning (device %s): %s:%d: %pV\n",
7090ff2ea7dSJoe Perches 	       sb->s_id, function, line, &vaf);
710ac27a0ecSDave Kleikamp 	va_end(args);
711ac27a0ecSDave Kleikamp }
712ac27a0ecSDave Kleikamp 
713b03a2f7eSAndreas Dilger void __ext4_warning_inode(const struct inode *inode, const char *function,
714b03a2f7eSAndreas Dilger 			  unsigned int line, const char *fmt, ...)
715b03a2f7eSAndreas Dilger {
716b03a2f7eSAndreas Dilger 	struct va_format vaf;
717b03a2f7eSAndreas Dilger 	va_list args;
718b03a2f7eSAndreas Dilger 
719b03a2f7eSAndreas Dilger 	if (!ext4_warning_ratelimit(inode->i_sb))
720b03a2f7eSAndreas Dilger 		return;
721b03a2f7eSAndreas Dilger 
722b03a2f7eSAndreas Dilger 	va_start(args, fmt);
723b03a2f7eSAndreas Dilger 	vaf.fmt = fmt;
724b03a2f7eSAndreas Dilger 	vaf.va = &args;
725b03a2f7eSAndreas Dilger 	printk(KERN_WARNING "EXT4-fs warning (device %s): %s:%d: "
726b03a2f7eSAndreas Dilger 	       "inode #%lu: comm %s: %pV\n", inode->i_sb->s_id,
727b03a2f7eSAndreas Dilger 	       function, line, inode->i_ino, current->comm, &vaf);
728b03a2f7eSAndreas Dilger 	va_end(args);
729b03a2f7eSAndreas Dilger }
730b03a2f7eSAndreas Dilger 
731e29136f8STheodore Ts'o void __ext4_grp_locked_error(const char *function, unsigned int line,
732e29136f8STheodore Ts'o 			     struct super_block *sb, ext4_group_t grp,
733e29136f8STheodore Ts'o 			     unsigned long ino, ext4_fsblk_t block,
734e29136f8STheodore Ts'o 			     const char *fmt, ...)
7355d1b1b3fSAneesh Kumar K.V __releases(bitlock)
7365d1b1b3fSAneesh Kumar K.V __acquires(bitlock)
7375d1b1b3fSAneesh Kumar K.V {
7380ff2ea7dSJoe Perches 	struct va_format vaf;
7395d1b1b3fSAneesh Kumar K.V 	va_list args;
7405d1b1b3fSAneesh Kumar K.V 	struct ext4_super_block *es = EXT4_SB(sb)->s_es;
7415d1b1b3fSAneesh Kumar K.V 
7420db1ff22STheodore Ts'o 	if (unlikely(ext4_forced_shutdown(EXT4_SB(sb))))
7430db1ff22STheodore Ts'o 		return;
7440db1ff22STheodore Ts'o 
745ccf0f32aSTheodore Ts'o 	trace_ext4_error(sb, function, line);
7461c13d5c0STheodore Ts'o 	es->s_last_error_ino = cpu_to_le32(ino);
7471c13d5c0STheodore Ts'o 	es->s_last_error_block = cpu_to_le64(block);
7481c13d5c0STheodore Ts'o 	__save_error_info(sb, function, line);
7490ff2ea7dSJoe Perches 
750efbed4dcSTheodore Ts'o 	if (ext4_error_ratelimit(sb)) {
7515d1b1b3fSAneesh Kumar K.V 		va_start(args, fmt);
7520ff2ea7dSJoe Perches 		vaf.fmt = fmt;
7530ff2ea7dSJoe Perches 		vaf.va = &args;
75421149d61SRobin Dong 		printk(KERN_CRIT "EXT4-fs error (device %s): %s:%d: group %u, ",
755e29136f8STheodore Ts'o 		       sb->s_id, function, line, grp);
756e29136f8STheodore Ts'o 		if (ino)
7570ff2ea7dSJoe Perches 			printk(KERN_CONT "inode %lu: ", ino);
758e29136f8STheodore Ts'o 		if (block)
759efbed4dcSTheodore Ts'o 			printk(KERN_CONT "block %llu:",
760efbed4dcSTheodore Ts'o 			       (unsigned long long) block);
7610ff2ea7dSJoe Perches 		printk(KERN_CONT "%pV\n", &vaf);
7625d1b1b3fSAneesh Kumar K.V 		va_end(args);
763efbed4dcSTheodore Ts'o 	}
7645d1b1b3fSAneesh Kumar K.V 
765327eaf73STheodore Ts'o 	if (test_opt(sb, WARN_ON_ERROR))
766327eaf73STheodore Ts'o 		WARN_ON_ONCE(1);
767327eaf73STheodore Ts'o 
7685d1b1b3fSAneesh Kumar K.V 	if (test_opt(sb, ERRORS_CONT)) {
769e2d67052STheodore Ts'o 		ext4_commit_super(sb, 0);
7705d1b1b3fSAneesh Kumar K.V 		return;
7715d1b1b3fSAneesh Kumar K.V 	}
7721c13d5c0STheodore Ts'o 
7735d1b1b3fSAneesh Kumar K.V 	ext4_unlock_group(sb, grp);
77406f29cc8SZhouyi Zhou 	ext4_commit_super(sb, 1);
7755d1b1b3fSAneesh Kumar K.V 	ext4_handle_error(sb);
7765d1b1b3fSAneesh Kumar K.V 	/*
7775d1b1b3fSAneesh Kumar K.V 	 * We only get here in the ERRORS_RO case; relocking the group
7785d1b1b3fSAneesh Kumar K.V 	 * may be dangerous, but nothing bad will happen since the
7795d1b1b3fSAneesh Kumar K.V 	 * filesystem will have already been marked read/only and the
7805d1b1b3fSAneesh Kumar K.V 	 * journal has been aborted.  We return 1 as a hint to callers
7815d1b1b3fSAneesh Kumar K.V 	 * who might what to use the return value from
78225985edcSLucas De Marchi 	 * ext4_grp_locked_error() to distinguish between the
7835d1b1b3fSAneesh Kumar K.V 	 * ERRORS_CONT and ERRORS_RO case, and perhaps return more
7845d1b1b3fSAneesh Kumar K.V 	 * aggressively from the ext4 function in question, with a
7855d1b1b3fSAneesh Kumar K.V 	 * more appropriate error code.
7865d1b1b3fSAneesh Kumar K.V 	 */
7875d1b1b3fSAneesh Kumar K.V 	ext4_lock_group(sb, grp);
7885d1b1b3fSAneesh Kumar K.V 	return;
7895d1b1b3fSAneesh Kumar K.V }
7905d1b1b3fSAneesh Kumar K.V 
791db79e6d1SWang Shilong void ext4_mark_group_bitmap_corrupted(struct super_block *sb,
792db79e6d1SWang Shilong 				     ext4_group_t group,
793db79e6d1SWang Shilong 				     unsigned int flags)
794db79e6d1SWang Shilong {
795db79e6d1SWang Shilong 	struct ext4_sb_info *sbi = EXT4_SB(sb);
796db79e6d1SWang Shilong 	struct ext4_group_info *grp = ext4_get_group_info(sb, group);
797db79e6d1SWang Shilong 	struct ext4_group_desc *gdp = ext4_get_group_desc(sb, group, NULL);
7989af0b3d1SWang Shilong 	int ret;
799db79e6d1SWang Shilong 
8009af0b3d1SWang Shilong 	if (flags & EXT4_GROUP_INFO_BBITMAP_CORRUPT) {
8019af0b3d1SWang Shilong 		ret = ext4_test_and_set_bit(EXT4_GROUP_INFO_BBITMAP_CORRUPT_BIT,
8029af0b3d1SWang Shilong 					    &grp->bb_state);
8039af0b3d1SWang Shilong 		if (!ret)
804db79e6d1SWang Shilong 			percpu_counter_sub(&sbi->s_freeclusters_counter,
805db79e6d1SWang Shilong 					   grp->bb_free);
806db79e6d1SWang Shilong 	}
807db79e6d1SWang Shilong 
8089af0b3d1SWang Shilong 	if (flags & EXT4_GROUP_INFO_IBITMAP_CORRUPT) {
8099af0b3d1SWang Shilong 		ret = ext4_test_and_set_bit(EXT4_GROUP_INFO_IBITMAP_CORRUPT_BIT,
8109af0b3d1SWang Shilong 					    &grp->bb_state);
8119af0b3d1SWang Shilong 		if (!ret && gdp) {
812db79e6d1SWang Shilong 			int count;
813db79e6d1SWang Shilong 
814db79e6d1SWang Shilong 			count = ext4_free_inodes_count(sb, gdp);
815db79e6d1SWang Shilong 			percpu_counter_sub(&sbi->s_freeinodes_counter,
816db79e6d1SWang Shilong 					   count);
817db79e6d1SWang Shilong 		}
818db79e6d1SWang Shilong 	}
819db79e6d1SWang Shilong }
820db79e6d1SWang Shilong 
821617ba13bSMingming Cao void ext4_update_dynamic_rev(struct super_block *sb)
822ac27a0ecSDave Kleikamp {
823617ba13bSMingming Cao 	struct ext4_super_block *es = EXT4_SB(sb)->s_es;
824ac27a0ecSDave Kleikamp 
825617ba13bSMingming Cao 	if (le32_to_cpu(es->s_rev_level) > EXT4_GOOD_OLD_REV)
826ac27a0ecSDave Kleikamp 		return;
827ac27a0ecSDave Kleikamp 
82812062dddSEric Sandeen 	ext4_warning(sb,
829ac27a0ecSDave Kleikamp 		     "updating to rev %d because of new feature flag, "
830ac27a0ecSDave Kleikamp 		     "running e2fsck is recommended",
831617ba13bSMingming Cao 		     EXT4_DYNAMIC_REV);
832ac27a0ecSDave Kleikamp 
833617ba13bSMingming Cao 	es->s_first_ino = cpu_to_le32(EXT4_GOOD_OLD_FIRST_INO);
834617ba13bSMingming Cao 	es->s_inode_size = cpu_to_le16(EXT4_GOOD_OLD_INODE_SIZE);
835617ba13bSMingming Cao 	es->s_rev_level = cpu_to_le32(EXT4_DYNAMIC_REV);
836ac27a0ecSDave Kleikamp 	/* leave es->s_feature_*compat flags alone */
837ac27a0ecSDave Kleikamp 	/* es->s_uuid will be set by e2fsck if empty */
838ac27a0ecSDave Kleikamp 
839ac27a0ecSDave Kleikamp 	/*
840ac27a0ecSDave Kleikamp 	 * The rest of the superblock fields should be zero, and if not it
841ac27a0ecSDave Kleikamp 	 * means they are likely already in use, so leave them alone.  We
842ac27a0ecSDave Kleikamp 	 * can leave it up to e2fsck to clean up any inconsistencies there.
843ac27a0ecSDave Kleikamp 	 */
844ac27a0ecSDave Kleikamp }
845ac27a0ecSDave Kleikamp 
846ac27a0ecSDave Kleikamp /*
847ac27a0ecSDave Kleikamp  * Open the external journal device
848ac27a0ecSDave Kleikamp  */
849b31e1552SEric Sandeen static struct block_device *ext4_blkdev_get(dev_t dev, struct super_block *sb)
850ac27a0ecSDave Kleikamp {
851ac27a0ecSDave Kleikamp 	struct block_device *bdev;
852ac27a0ecSDave Kleikamp 	char b[BDEVNAME_SIZE];
853ac27a0ecSDave Kleikamp 
854d4d77629STejun Heo 	bdev = blkdev_get_by_dev(dev, FMODE_READ|FMODE_WRITE|FMODE_EXCL, sb);
855ac27a0ecSDave Kleikamp 	if (IS_ERR(bdev))
856ac27a0ecSDave Kleikamp 		goto fail;
857ac27a0ecSDave Kleikamp 	return bdev;
858ac27a0ecSDave Kleikamp 
859ac27a0ecSDave Kleikamp fail:
860b31e1552SEric Sandeen 	ext4_msg(sb, KERN_ERR, "failed to open journal device %s: %ld",
861ac27a0ecSDave Kleikamp 			__bdevname(dev, b), PTR_ERR(bdev));
862ac27a0ecSDave Kleikamp 	return NULL;
863ac27a0ecSDave Kleikamp }
864ac27a0ecSDave Kleikamp 
865ac27a0ecSDave Kleikamp /*
866ac27a0ecSDave Kleikamp  * Release the journal device
867ac27a0ecSDave Kleikamp  */
8684385bab1SAl Viro static void ext4_blkdev_put(struct block_device *bdev)
869ac27a0ecSDave Kleikamp {
8704385bab1SAl Viro 	blkdev_put(bdev, FMODE_READ|FMODE_WRITE|FMODE_EXCL);
871ac27a0ecSDave Kleikamp }
872ac27a0ecSDave Kleikamp 
8734385bab1SAl Viro static void ext4_blkdev_remove(struct ext4_sb_info *sbi)
874ac27a0ecSDave Kleikamp {
875ac27a0ecSDave Kleikamp 	struct block_device *bdev;
876ac27a0ecSDave Kleikamp 	bdev = sbi->journal_bdev;
877ac27a0ecSDave Kleikamp 	if (bdev) {
8784385bab1SAl Viro 		ext4_blkdev_put(bdev);
879ac27a0ecSDave Kleikamp 		sbi->journal_bdev = NULL;
880ac27a0ecSDave Kleikamp 	}
881ac27a0ecSDave Kleikamp }
882ac27a0ecSDave Kleikamp 
883ac27a0ecSDave Kleikamp static inline struct inode *orphan_list_entry(struct list_head *l)
884ac27a0ecSDave Kleikamp {
885617ba13bSMingming Cao 	return &list_entry(l, struct ext4_inode_info, i_orphan)->vfs_inode;
886ac27a0ecSDave Kleikamp }
887ac27a0ecSDave Kleikamp 
888617ba13bSMingming Cao static void dump_orphan_list(struct super_block *sb, struct ext4_sb_info *sbi)
889ac27a0ecSDave Kleikamp {
890ac27a0ecSDave Kleikamp 	struct list_head *l;
891ac27a0ecSDave Kleikamp 
892b31e1552SEric Sandeen 	ext4_msg(sb, KERN_ERR, "sb orphan head is %d",
893ac27a0ecSDave Kleikamp 		 le32_to_cpu(sbi->s_es->s_last_orphan));
894ac27a0ecSDave Kleikamp 
895ac27a0ecSDave Kleikamp 	printk(KERN_ERR "sb_info orphan list:\n");
896ac27a0ecSDave Kleikamp 	list_for_each(l, &sbi->s_orphan) {
897ac27a0ecSDave Kleikamp 		struct inode *inode = orphan_list_entry(l);
898ac27a0ecSDave Kleikamp 		printk(KERN_ERR "  "
899ac27a0ecSDave Kleikamp 		       "inode %s:%lu at %p: mode %o, nlink %d, next %d\n",
900ac27a0ecSDave Kleikamp 		       inode->i_sb->s_id, inode->i_ino, inode,
901ac27a0ecSDave Kleikamp 		       inode->i_mode, inode->i_nlink,
902ac27a0ecSDave Kleikamp 		       NEXT_ORPHAN(inode));
903ac27a0ecSDave Kleikamp 	}
904ac27a0ecSDave Kleikamp }
905ac27a0ecSDave Kleikamp 
#ifdef CONFIG_QUOTA
static int ext4_quota_off(struct super_block *sb, int type);

/*
 * Turn off every quota type at unmount time.  ext4's own quota_off routine
 * is used so that inode flags etc. get cleared; its return value is
 * ignored.
 */
static inline void ext4_quota_off_umount(struct super_block *sb)
{
	int qtype;

	for (qtype = 0; qtype < EXT4_MAXQUOTAS; qtype++)
		ext4_quota_off(sb, qtype);
}
#else
/* Without CONFIG_QUOTA there is nothing to turn off. */
static inline void ext4_quota_off_umount(struct super_block *sb)
{
}
#endif
922957153fcSJan Kara 
923617ba13bSMingming Cao static void ext4_put_super(struct super_block *sb)
924ac27a0ecSDave Kleikamp {
925617ba13bSMingming Cao 	struct ext4_sb_info *sbi = EXT4_SB(sb);
926617ba13bSMingming Cao 	struct ext4_super_block *es = sbi->s_es;
92797abd7d4STheodore Ts'o 	int aborted = 0;
928ef2cabf7SHidehiro Kawai 	int i, err;
929ac27a0ecSDave Kleikamp 
930857ac889SLukas Czerner 	ext4_unregister_li_request(sb);
931957153fcSJan Kara 	ext4_quota_off_umount(sb);
932e0ccfd95SChristoph Hellwig 
9332e8fa54eSJan Kara 	destroy_workqueue(sbi->rsv_conversion_wq);
9344c0425ffSMingming Cao 
9350390131bSFrank Mayhar 	if (sbi->s_journal) {
93697abd7d4STheodore Ts'o 		aborted = is_journal_aborted(sbi->s_journal);
937ef2cabf7SHidehiro Kawai 		err = jbd2_journal_destroy(sbi->s_journal);
93847b4a50bSJan Kara 		sbi->s_journal = NULL;
93997abd7d4STheodore Ts'o 		if ((err < 0) && !aborted)
940c67d859eSTheodore Ts'o 			ext4_abort(sb, "Couldn't clean up the journal");
9410390131bSFrank Mayhar 	}
942d4edac31SJosef Bacik 
943ebd173beSTheodore Ts'o 	ext4_unregister_sysfs(sb);
944d3922a77SZheng Liu 	ext4_es_unregister_shrinker(sbi);
9459105bb14SAl Viro 	del_timer_sync(&sbi->s_err_report);
946d4edac31SJosef Bacik 	ext4_release_system_zone(sb);
947d4edac31SJosef Bacik 	ext4_mb_release(sb);
948d4edac31SJosef Bacik 	ext4_ext_release(sb);
949d4edac31SJosef Bacik 
950bc98a42cSDavid Howells 	if (!sb_rdonly(sb) && !aborted) {
951e2b911c5SDarrick J. Wong 		ext4_clear_feature_journal_needs_recovery(sb);
952ac27a0ecSDave Kleikamp 		es->s_state = cpu_to_le16(sbi->s_mount_state);
953ac27a0ecSDave Kleikamp 	}
954bc98a42cSDavid Howells 	if (!sb_rdonly(sb))
955a8e25a83SArtem Bityutskiy 		ext4_commit_super(sb, 1);
956a8e25a83SArtem Bityutskiy 
957ac27a0ecSDave Kleikamp 	for (i = 0; i < sbi->s_gdb_count; i++)
958ac27a0ecSDave Kleikamp 		brelse(sbi->s_group_desc[i]);
959b93b41d4SAl Viro 	kvfree(sbi->s_group_desc);
960b93b41d4SAl Viro 	kvfree(sbi->s_flex_groups);
96157042651STheodore Ts'o 	percpu_counter_destroy(&sbi->s_freeclusters_counter);
962ac27a0ecSDave Kleikamp 	percpu_counter_destroy(&sbi->s_freeinodes_counter);
963ac27a0ecSDave Kleikamp 	percpu_counter_destroy(&sbi->s_dirs_counter);
96457042651STheodore Ts'o 	percpu_counter_destroy(&sbi->s_dirtyclusters_counter);
965c8585c6fSDaeho Jeong 	percpu_free_rwsem(&sbi->s_journal_flag_rwsem);
966ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
967a2d4a646SJan Kara 	for (i = 0; i < EXT4_MAXQUOTAS; i++)
968ac27a0ecSDave Kleikamp 		kfree(sbi->s_qf_names[i]);
969ac27a0ecSDave Kleikamp #endif
970ac27a0ecSDave Kleikamp 
971ac27a0ecSDave Kleikamp 	/* Debugging code just in case the in-memory inode orphan list
972ac27a0ecSDave Kleikamp 	 * isn't empty.  The on-disk one can be non-empty if we've
973ac27a0ecSDave Kleikamp 	 * detected an error and taken the fs readonly, but the
974ac27a0ecSDave Kleikamp 	 * in-memory list had better be clean by this point. */
975ac27a0ecSDave Kleikamp 	if (!list_empty(&sbi->s_orphan))
976ac27a0ecSDave Kleikamp 		dump_orphan_list(sb, sbi);
977ac27a0ecSDave Kleikamp 	J_ASSERT(list_empty(&sbi->s_orphan));
978ac27a0ecSDave Kleikamp 
97989d96a6fSTheodore Ts'o 	sync_blockdev(sb->s_bdev);
980f98393a6SPeter Zijlstra 	invalidate_bdev(sb->s_bdev);
981ac27a0ecSDave Kleikamp 	if (sbi->journal_bdev && sbi->journal_bdev != sb->s_bdev) {
982ac27a0ecSDave Kleikamp 		/*
983ac27a0ecSDave Kleikamp 		 * Invalidate the journal device's buffers.  We don't want them
984ac27a0ecSDave Kleikamp 		 * floating about in memory - the physical journal device may
985ac27a0ecSDave Kleikamp 		 * hotswapped, and it breaks the `ro-after' testing code.
986ac27a0ecSDave Kleikamp 		 */
987ac27a0ecSDave Kleikamp 		sync_blockdev(sbi->journal_bdev);
988f98393a6SPeter Zijlstra 		invalidate_bdev(sbi->journal_bdev);
989617ba13bSMingming Cao 		ext4_blkdev_remove(sbi);
990ac27a0ecSDave Kleikamp 	}
991dec214d0STahsin Erdogan 	if (sbi->s_ea_inode_cache) {
992dec214d0STahsin Erdogan 		ext4_xattr_destroy_cache(sbi->s_ea_inode_cache);
993dec214d0STahsin Erdogan 		sbi->s_ea_inode_cache = NULL;
994dec214d0STahsin Erdogan 	}
99547387409STahsin Erdogan 	if (sbi->s_ea_block_cache) {
99647387409STahsin Erdogan 		ext4_xattr_destroy_cache(sbi->s_ea_block_cache);
99747387409STahsin Erdogan 		sbi->s_ea_block_cache = NULL;
9989c191f70ST Makphaibulchoke 	}
999c5e06d10SJohann Lombardi 	if (sbi->s_mmp_tsk)
1000c5e06d10SJohann Lombardi 		kthread_stop(sbi->s_mmp_tsk);
10019060dd2cSEric Sandeen 	brelse(sbi->s_sbh);
1002ac27a0ecSDave Kleikamp 	sb->s_fs_info = NULL;
10033197ebdbSTheodore Ts'o 	/*
10043197ebdbSTheodore Ts'o 	 * Now that we are completely done shutting down the
10053197ebdbSTheodore Ts'o 	 * superblock, we need to actually destroy the kobject.
10063197ebdbSTheodore Ts'o 	 */
10073197ebdbSTheodore Ts'o 	kobject_put(&sbi->s_kobj);
10083197ebdbSTheodore Ts'o 	wait_for_completion(&sbi->s_kobj_unregister);
10090441984aSDarrick J. Wong 	if (sbi->s_chksum_driver)
10100441984aSDarrick J. Wong 		crypto_free_shash(sbi->s_chksum_driver);
1011705895b6SPekka Enberg 	kfree(sbi->s_blockgroup_lock);
10125e405595SDan Williams 	fs_put_dax(sbi->s_daxdev);
1013ac27a0ecSDave Kleikamp 	kfree(sbi);
1014ac27a0ecSDave Kleikamp }
1015ac27a0ecSDave Kleikamp 
1016e18b890bSChristoph Lameter static struct kmem_cache *ext4_inode_cachep;
1017ac27a0ecSDave Kleikamp 
1018ac27a0ecSDave Kleikamp /*
1019ac27a0ecSDave Kleikamp  * Called inside transaction, so use GFP_NOFS
1020ac27a0ecSDave Kleikamp  */
1021617ba13bSMingming Cao static struct inode *ext4_alloc_inode(struct super_block *sb)
1022ac27a0ecSDave Kleikamp {
1023617ba13bSMingming Cao 	struct ext4_inode_info *ei;
1024ac27a0ecSDave Kleikamp 
1025e6b4f8daSChristoph Lameter 	ei = kmem_cache_alloc(ext4_inode_cachep, GFP_NOFS);
1026ac27a0ecSDave Kleikamp 	if (!ei)
1027ac27a0ecSDave Kleikamp 		return NULL;
10280b8e58a1SAndreas Dilger 
1029ee73f9a5SJeff Layton 	inode_set_iversion(&ei->vfs_inode, 1);
1030202ee5dfSTheodore Ts'o 	spin_lock_init(&ei->i_raw_lock);
1031c9de560dSAlex Tomas 	INIT_LIST_HEAD(&ei->i_prealloc_list);
1032c9de560dSAlex Tomas 	spin_lock_init(&ei->i_prealloc_lock);
10339a26b661SZheng Liu 	ext4_es_init_tree(&ei->i_es_tree);
10349a26b661SZheng Liu 	rwlock_init(&ei->i_es_lock);
1035edaa53caSZheng Liu 	INIT_LIST_HEAD(&ei->i_es_list);
1036eb68d0e2SZheng Liu 	ei->i_es_all_nr = 0;
1037edaa53caSZheng Liu 	ei->i_es_shk_nr = 0;
1038dd475925SJan Kara 	ei->i_es_shrink_lblk = 0;
1039d2a17637SMingming Cao 	ei->i_reserved_data_blocks = 0;
10409d0be502STheodore Ts'o 	ei->i_da_metadata_calc_len = 0;
10417e731bc9STheodore Ts'o 	ei->i_da_metadata_calc_last_lblock = 0;
1042d2a17637SMingming Cao 	spin_lock_init(&(ei->i_block_reservation_lock));
1043*1dc0aa46SEric Whitney 	ext4_init_pending_tree(&ei->i_pending_tree);
1044a9e7f447SDmitry Monakhov #ifdef CONFIG_QUOTA
1045a9e7f447SDmitry Monakhov 	ei->i_reserved_quota = 0;
104696c7e0d9SJan Kara 	memset(&ei->i_dquot, 0, sizeof(ei->i_dquot));
1047a9e7f447SDmitry Monakhov #endif
10488aefcd55STheodore Ts'o 	ei->jinode = NULL;
10492e8fa54eSJan Kara 	INIT_LIST_HEAD(&ei->i_rsv_conversion_list);
1050744692dcSJiaying Zhang 	spin_lock_init(&ei->i_completed_io_lock);
1051b436b9beSJan Kara 	ei->i_sync_tid = 0;
1052b436b9beSJan Kara 	ei->i_datasync_tid = 0;
1053e27f41e1SDmitry Monakhov 	atomic_set(&ei->i_unwritten, 0);
10542e8fa54eSJan Kara 	INIT_WORK(&ei->i_rsv_conversion_work, ext4_end_io_rsv_work);
1055ac27a0ecSDave Kleikamp 	return &ei->vfs_inode;
1056ac27a0ecSDave Kleikamp }
1057ac27a0ecSDave Kleikamp 
/*
 * Defer the drop decision to generic_drop_inode() and emit a tracepoint
 * with the outcome.
 */
static int ext4_drop_inode(struct inode *inode)
{
	const int should_drop = generic_drop_inode(inode);

	trace_ext4_drop_inode(inode, should_drop);

	return should_drop;
}
10657ff9c073STheodore Ts'o 
1066fa0d7e3dSNick Piggin static void ext4_i_callback(struct rcu_head *head)
1067fa0d7e3dSNick Piggin {
1068fa0d7e3dSNick Piggin 	struct inode *inode = container_of(head, struct inode, i_rcu);
1069fa0d7e3dSNick Piggin 	kmem_cache_free(ext4_inode_cachep, EXT4_I(inode));
1070fa0d7e3dSNick Piggin }
1071fa0d7e3dSNick Piggin 
1072617ba13bSMingming Cao static void ext4_destroy_inode(struct inode *inode)
1073ac27a0ecSDave Kleikamp {
10749f7dd93dSVasily Averin 	if (!list_empty(&(EXT4_I(inode)->i_orphan))) {
1075b31e1552SEric Sandeen 		ext4_msg(inode->i_sb, KERN_ERR,
1076b31e1552SEric Sandeen 			 "Inode %lu (%p): orphan list check failed!",
1077b31e1552SEric Sandeen 			 inode->i_ino, EXT4_I(inode));
10789f7dd93dSVasily Averin 		print_hex_dump(KERN_INFO, "", DUMP_PREFIX_ADDRESS, 16, 4,
10799f7dd93dSVasily Averin 				EXT4_I(inode), sizeof(struct ext4_inode_info),
10809f7dd93dSVasily Averin 				true);
10819f7dd93dSVasily Averin 		dump_stack();
10829f7dd93dSVasily Averin 	}
1083fa0d7e3dSNick Piggin 	call_rcu(&inode->i_rcu, ext4_i_callback);
1084ac27a0ecSDave Kleikamp }
1085ac27a0ecSDave Kleikamp 
108651cc5068SAlexey Dobriyan static void init_once(void *foo)
1087ac27a0ecSDave Kleikamp {
1088617ba13bSMingming Cao 	struct ext4_inode_info *ei = (struct ext4_inode_info *) foo;
1089ac27a0ecSDave Kleikamp 
1090ac27a0ecSDave Kleikamp 	INIT_LIST_HEAD(&ei->i_orphan);
1091ac27a0ecSDave Kleikamp 	init_rwsem(&ei->xattr_sem);
10920e855ac8SAneesh Kumar K.V 	init_rwsem(&ei->i_data_sem);
1093ea3d7209SJan Kara 	init_rwsem(&ei->i_mmap_sem);
1094ac27a0ecSDave Kleikamp 	inode_init_once(&ei->vfs_inode);
1095ac27a0ecSDave Kleikamp }
1096ac27a0ecSDave Kleikamp 
1097e67bc2b3SFabian Frederick static int __init init_inodecache(void)
1098ac27a0ecSDave Kleikamp {
1099f8dd7c70SDavid Windsor 	ext4_inode_cachep = kmem_cache_create_usercopy("ext4_inode_cache",
1100f8dd7c70SDavid Windsor 				sizeof(struct ext4_inode_info), 0,
1101f8dd7c70SDavid Windsor 				(SLAB_RECLAIM_ACCOUNT|SLAB_MEM_SPREAD|
1102f8dd7c70SDavid Windsor 					SLAB_ACCOUNT),
1103f8dd7c70SDavid Windsor 				offsetof(struct ext4_inode_info, i_data),
1104f8dd7c70SDavid Windsor 				sizeof_field(struct ext4_inode_info, i_data),
110520c2df83SPaul Mundt 				init_once);
1106617ba13bSMingming Cao 	if (ext4_inode_cachep == NULL)
1107ac27a0ecSDave Kleikamp 		return -ENOMEM;
1108ac27a0ecSDave Kleikamp 	return 0;
1109ac27a0ecSDave Kleikamp }
1110ac27a0ecSDave Kleikamp 
1111ac27a0ecSDave Kleikamp static void destroy_inodecache(void)
1112ac27a0ecSDave Kleikamp {
11138c0a8537SKirill A. Shutemov 	/*
11148c0a8537SKirill A. Shutemov 	 * Make sure all delayed rcu free inodes are flushed before we
11158c0a8537SKirill A. Shutemov 	 * destroy cache.
11168c0a8537SKirill A. Shutemov 	 */
11178c0a8537SKirill A. Shutemov 	rcu_barrier();
1118617ba13bSMingming Cao 	kmem_cache_destroy(ext4_inode_cachep);
1119ac27a0ecSDave Kleikamp }
1120ac27a0ecSDave Kleikamp 
11210930fcc1SAl Viro void ext4_clear_inode(struct inode *inode)
1122ac27a0ecSDave Kleikamp {
11230930fcc1SAl Viro 	invalidate_inode_buffers(inode);
1124dbd5768fSJan Kara 	clear_inode(inode);
11259f754758SChristoph Hellwig 	dquot_drop(inode);
1126c2ea3fdeSTheodore Ts'o 	ext4_discard_preallocations(inode);
112751865fdaSZheng Liu 	ext4_es_remove_extent(inode, 0, EXT_MAX_BLOCKS);
11288aefcd55STheodore Ts'o 	if (EXT4_I(inode)->jinode) {
11298aefcd55STheodore Ts'o 		jbd2_journal_release_jbd_inode(EXT4_JOURNAL(inode),
11308aefcd55STheodore Ts'o 					       EXT4_I(inode)->jinode);
11318aefcd55STheodore Ts'o 		jbd2_free_inode(EXT4_I(inode)->jinode);
11328aefcd55STheodore Ts'o 		EXT4_I(inode)->jinode = NULL;
11338aefcd55STheodore Ts'o 	}
11343d204e24SEric Biggers 	fscrypt_put_encryption_info(inode);
1135ac27a0ecSDave Kleikamp }
1136ac27a0ecSDave Kleikamp 
11371b961ac0SChristoph Hellwig static struct inode *ext4_nfs_get_inode(struct super_block *sb,
11381b961ac0SChristoph Hellwig 					u64 ino, u32 generation)
1139ac27a0ecSDave Kleikamp {
1140ac27a0ecSDave Kleikamp 	struct inode *inode;
1141ac27a0ecSDave Kleikamp 
1142617ba13bSMingming Cao 	if (ino < EXT4_FIRST_INO(sb) && ino != EXT4_ROOT_INO)
1143ac27a0ecSDave Kleikamp 		return ERR_PTR(-ESTALE);
1144617ba13bSMingming Cao 	if (ino > le32_to_cpu(EXT4_SB(sb)->s_es->s_inodes_count))
1145ac27a0ecSDave Kleikamp 		return ERR_PTR(-ESTALE);
1146ac27a0ecSDave Kleikamp 
1147ac27a0ecSDave Kleikamp 	/* iget isn't really right if the inode is currently unallocated!!
1148ac27a0ecSDave Kleikamp 	 *
1149617ba13bSMingming Cao 	 * ext4_read_inode will return a bad_inode if the inode had been
1150ac27a0ecSDave Kleikamp 	 * deleted, so we should be safe.
1151ac27a0ecSDave Kleikamp 	 *
1152ac27a0ecSDave Kleikamp 	 * Currently we don't know the generation for parent directory, so
1153ac27a0ecSDave Kleikamp 	 * a generation of 0 means "accept any"
1154ac27a0ecSDave Kleikamp 	 */
1155f4bb2981STheodore Ts'o 	inode = ext4_iget_normal(sb, ino);
11561d1fe1eeSDavid Howells 	if (IS_ERR(inode))
11571d1fe1eeSDavid Howells 		return ERR_CAST(inode);
11581d1fe1eeSDavid Howells 	if (generation && inode->i_generation != generation) {
1159ac27a0ecSDave Kleikamp 		iput(inode);
1160ac27a0ecSDave Kleikamp 		return ERR_PTR(-ESTALE);
1161ac27a0ecSDave Kleikamp 	}
11621b961ac0SChristoph Hellwig 
11631b961ac0SChristoph Hellwig 	return inode;
1164ac27a0ecSDave Kleikamp }
11651b961ac0SChristoph Hellwig 
11661b961ac0SChristoph Hellwig static struct dentry *ext4_fh_to_dentry(struct super_block *sb, struct fid *fid,
11671b961ac0SChristoph Hellwig 					int fh_len, int fh_type)
11681b961ac0SChristoph Hellwig {
11691b961ac0SChristoph Hellwig 	return generic_fh_to_dentry(sb, fid, fh_len, fh_type,
11701b961ac0SChristoph Hellwig 				    ext4_nfs_get_inode);
11711b961ac0SChristoph Hellwig }
11721b961ac0SChristoph Hellwig 
11731b961ac0SChristoph Hellwig static struct dentry *ext4_fh_to_parent(struct super_block *sb, struct fid *fid,
11741b961ac0SChristoph Hellwig 					int fh_len, int fh_type)
11751b961ac0SChristoph Hellwig {
11761b961ac0SChristoph Hellwig 	return generic_fh_to_parent(sb, fid, fh_len, fh_type,
11771b961ac0SChristoph Hellwig 				    ext4_nfs_get_inode);
1178ac27a0ecSDave Kleikamp }
1179ac27a0ecSDave Kleikamp 
1180c39a7f84SToshiyuki Okajima /*
1181c39a7f84SToshiyuki Okajima  * Try to release metadata pages (indirect blocks, directories) which are
1182c39a7f84SToshiyuki Okajima  * mapped via the block device.  Since these pages could have journal heads
1183c39a7f84SToshiyuki Okajima  * which would prevent try_to_free_buffers() from freeing them, we must use
1184c39a7f84SToshiyuki Okajima  * jbd2 layer's try_to_free_buffers() function to release them.
1185c39a7f84SToshiyuki Okajima  */
11860b8e58a1SAndreas Dilger static int bdev_try_to_free_page(struct super_block *sb, struct page *page,
11870b8e58a1SAndreas Dilger 				 gfp_t wait)
1188c39a7f84SToshiyuki Okajima {
1189c39a7f84SToshiyuki Okajima 	journal_t *journal = EXT4_SB(sb)->s_journal;
1190c39a7f84SToshiyuki Okajima 
1191c39a7f84SToshiyuki Okajima 	WARN_ON(PageChecked(page));
1192c39a7f84SToshiyuki Okajima 	if (!page_has_buffers(page))
1193c39a7f84SToshiyuki Okajima 		return 0;
1194c39a7f84SToshiyuki Okajima 	if (journal)
1195c39a7f84SToshiyuki Okajima 		return jbd2_journal_try_to_free_buffers(journal, page,
1196d0164adcSMel Gorman 						wait & ~__GFP_DIRECT_RECLAIM);
1197c39a7f84SToshiyuki Okajima 	return try_to_free_buffers(page);
1198c39a7f84SToshiyuki Okajima }
1199c39a7f84SToshiyuki Okajima 
1200a7550b30SJaegeuk Kim #ifdef CONFIG_EXT4_FS_ENCRYPTION
1201a7550b30SJaegeuk Kim static int ext4_get_context(struct inode *inode, void *ctx, size_t len)
1202a7550b30SJaegeuk Kim {
1203a7550b30SJaegeuk Kim 	return ext4_xattr_get(inode, EXT4_XATTR_INDEX_ENCRYPTION,
1204a7550b30SJaegeuk Kim 				 EXT4_XATTR_NAME_ENCRYPTION_CONTEXT, ctx, len);
1205a7550b30SJaegeuk Kim }
1206a7550b30SJaegeuk Kim 
1207a7550b30SJaegeuk Kim static int ext4_set_context(struct inode *inode, const void *ctx, size_t len,
1208a7550b30SJaegeuk Kim 							void *fs_data)
1209a7550b30SJaegeuk Kim {
12102f8f5e76SEric Biggers 	handle_t *handle = fs_data;
1211c1a5d5f6STahsin Erdogan 	int res, res2, credits, retries = 0;
1212a7550b30SJaegeuk Kim 
12139ce0151aSEric Biggers 	/*
12149ce0151aSEric Biggers 	 * Encrypting the root directory is not allowed because e2fsck expects
12159ce0151aSEric Biggers 	 * lost+found to exist and be unencrypted, and encrypting the root
12169ce0151aSEric Biggers 	 * directory would imply encrypting the lost+found directory as well as
12179ce0151aSEric Biggers 	 * the filename "lost+found" itself.
12189ce0151aSEric Biggers 	 */
12199ce0151aSEric Biggers 	if (inode->i_ino == EXT4_ROOT_INO)
12209ce0151aSEric Biggers 		return -EPERM;
1221a7550b30SJaegeuk Kim 
12227d3e06a8SRoss Zwisler 	if (WARN_ON_ONCE(IS_DAX(inode) && i_size_read(inode)))
12237d3e06a8SRoss Zwisler 		return -EINVAL;
12247d3e06a8SRoss Zwisler 
122594840e3cSEric Biggers 	res = ext4_convert_inline_data(inode);
122694840e3cSEric Biggers 	if (res)
122794840e3cSEric Biggers 		return res;
122894840e3cSEric Biggers 
12292f8f5e76SEric Biggers 	/*
12302f8f5e76SEric Biggers 	 * If a journal handle was specified, then the encryption context is
12312f8f5e76SEric Biggers 	 * being set on a new inode via inheritance and is part of a larger
12322f8f5e76SEric Biggers 	 * transaction to create the inode.  Otherwise the encryption context is
12332f8f5e76SEric Biggers 	 * being set on an existing inode in its own transaction.  Only in the
12342f8f5e76SEric Biggers 	 * latter case should the "retry on ENOSPC" logic be used.
12352f8f5e76SEric Biggers 	 */
12362f8f5e76SEric Biggers 
12372f8f5e76SEric Biggers 	if (handle) {
12382f8f5e76SEric Biggers 		res = ext4_xattr_set_handle(handle, inode,
12392f8f5e76SEric Biggers 					    EXT4_XATTR_INDEX_ENCRYPTION,
12402f8f5e76SEric Biggers 					    EXT4_XATTR_NAME_ENCRYPTION_CONTEXT,
12412f8f5e76SEric Biggers 					    ctx, len, 0);
1242a7550b30SJaegeuk Kim 		if (!res) {
1243a7550b30SJaegeuk Kim 			ext4_set_inode_flag(inode, EXT4_INODE_ENCRYPT);
1244a7550b30SJaegeuk Kim 			ext4_clear_inode_state(inode,
1245a7550b30SJaegeuk Kim 					EXT4_STATE_MAY_INLINE_DATA);
1246a3caa24bSJan Kara 			/*
12472ee6a576SEric Biggers 			 * Update inode->i_flags - S_ENCRYPTED will be enabled,
12482ee6a576SEric Biggers 			 * S_DAX may be disabled
1249a3caa24bSJan Kara 			 */
1250a3caa24bSJan Kara 			ext4_set_inode_flags(inode);
1251a7550b30SJaegeuk Kim 		}
1252a7550b30SJaegeuk Kim 		return res;
1253a7550b30SJaegeuk Kim 	}
1254a7550b30SJaegeuk Kim 
1255b8cb5a54STahsin Erdogan 	res = dquot_initialize(inode);
1256b8cb5a54STahsin Erdogan 	if (res)
1257b8cb5a54STahsin Erdogan 		return res;
12582f8f5e76SEric Biggers retry:
1259af65207cSTahsin Erdogan 	res = ext4_xattr_set_credits(inode, len, false /* is_create */,
1260af65207cSTahsin Erdogan 				     &credits);
1261dec214d0STahsin Erdogan 	if (res)
1262dec214d0STahsin Erdogan 		return res;
1263dec214d0STahsin Erdogan 
1264c1a5d5f6STahsin Erdogan 	handle = ext4_journal_start(inode, EXT4_HT_MISC, credits);
1265a7550b30SJaegeuk Kim 	if (IS_ERR(handle))
1266a7550b30SJaegeuk Kim 		return PTR_ERR(handle);
1267a7550b30SJaegeuk Kim 
12682f8f5e76SEric Biggers 	res = ext4_xattr_set_handle(handle, inode, EXT4_XATTR_INDEX_ENCRYPTION,
12692f8f5e76SEric Biggers 				    EXT4_XATTR_NAME_ENCRYPTION_CONTEXT,
12702f8f5e76SEric Biggers 				    ctx, len, 0);
1271a7550b30SJaegeuk Kim 	if (!res) {
1272a7550b30SJaegeuk Kim 		ext4_set_inode_flag(inode, EXT4_INODE_ENCRYPT);
12732ee6a576SEric Biggers 		/*
12742ee6a576SEric Biggers 		 * Update inode->i_flags - S_ENCRYPTED will be enabled,
12752ee6a576SEric Biggers 		 * S_DAX may be disabled
12762ee6a576SEric Biggers 		 */
1277a3caa24bSJan Kara 		ext4_set_inode_flags(inode);
1278a7550b30SJaegeuk Kim 		res = ext4_mark_inode_dirty(handle, inode);
1279a7550b30SJaegeuk Kim 		if (res)
1280a7550b30SJaegeuk Kim 			EXT4_ERROR_INODE(inode, "Failed to mark inode dirty");
1281a7550b30SJaegeuk Kim 	}
1282a7550b30SJaegeuk Kim 	res2 = ext4_journal_stop(handle);
12832f8f5e76SEric Biggers 
12842f8f5e76SEric Biggers 	if (res == -ENOSPC && ext4_should_retry_alloc(inode->i_sb, &retries))
12852f8f5e76SEric Biggers 		goto retry;
1286a7550b30SJaegeuk Kim 	if (!res)
1287a7550b30SJaegeuk Kim 		res = res2;
1288a7550b30SJaegeuk Kim 	return res;
1289a7550b30SJaegeuk Kim }
1290a7550b30SJaegeuk Kim 
1291c250b7ddSEric Biggers static bool ext4_dummy_context(struct inode *inode)
1292a7550b30SJaegeuk Kim {
1293a7550b30SJaegeuk Kim 	return DUMMY_ENCRYPTION_ENABLED(EXT4_SB(inode->i_sb));
1294a7550b30SJaegeuk Kim }
1295a7550b30SJaegeuk Kim 
12966f69f0edSEric Biggers static const struct fscrypt_operations ext4_cryptops = {
1297a5d431efSEric Biggers 	.key_prefix		= "ext4:",
1298a7550b30SJaegeuk Kim 	.get_context		= ext4_get_context,
1299a7550b30SJaegeuk Kim 	.set_context		= ext4_set_context,
1300a7550b30SJaegeuk Kim 	.dummy_context		= ext4_dummy_context,
1301a7550b30SJaegeuk Kim 	.empty_dir		= ext4_empty_dir,
1302e12ee683SEric Biggers 	.max_namelen		= EXT4_NAME_LEN,
1303a7550b30SJaegeuk Kim };
1304a7550b30SJaegeuk Kim #endif
1305a7550b30SJaegeuk Kim 
1306ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
1307d6006186SEric Biggers static const char * const quotatypes[] = INITQFNAMES;
1308689c958cSLi Xi #define QTYPE2NAME(t) (quotatypes[t])
1309ac27a0ecSDave Kleikamp 
1310617ba13bSMingming Cao static int ext4_write_dquot(struct dquot *dquot);
1311617ba13bSMingming Cao static int ext4_acquire_dquot(struct dquot *dquot);
1312617ba13bSMingming Cao static int ext4_release_dquot(struct dquot *dquot);
1313617ba13bSMingming Cao static int ext4_mark_dquot_dirty(struct dquot *dquot);
1314617ba13bSMingming Cao static int ext4_write_info(struct super_block *sb, int type);
13156f28e087SJan Kara static int ext4_quota_on(struct super_block *sb, int type, int format_id,
13168c54ca9cSAl Viro 			 const struct path *path);
1317617ba13bSMingming Cao static int ext4_quota_on_mount(struct super_block *sb, int type);
1318617ba13bSMingming Cao static ssize_t ext4_quota_read(struct super_block *sb, int type, char *data,
1319ac27a0ecSDave Kleikamp 			       size_t len, loff_t off);
1320617ba13bSMingming Cao static ssize_t ext4_quota_write(struct super_block *sb, int type,
1321ac27a0ecSDave Kleikamp 				const char *data, size_t len, loff_t off);
13227c319d32SAditya Kali static int ext4_quota_enable(struct super_block *sb, int type, int format_id,
13237c319d32SAditya Kali 			     unsigned int flags);
13247c319d32SAditya Kali static int ext4_enable_quotas(struct super_block *sb);
13258f0e8746STheodore Ts'o static int ext4_get_next_id(struct super_block *sb, struct kqid *qid);
1326ac27a0ecSDave Kleikamp 
132796c7e0d9SJan Kara static struct dquot **ext4_get_dquots(struct inode *inode)
132896c7e0d9SJan Kara {
132996c7e0d9SJan Kara 	return EXT4_I(inode)->i_dquot;
133096c7e0d9SJan Kara }
133196c7e0d9SJan Kara 
133261e225dcSAlexey Dobriyan static const struct dquot_operations ext4_quota_operations = {
133360e58e0fSMingming Cao 	.get_reserved_space	= ext4_get_reserved_space,
1334617ba13bSMingming Cao 	.write_dquot		= ext4_write_dquot,
1335617ba13bSMingming Cao 	.acquire_dquot		= ext4_acquire_dquot,
1336617ba13bSMingming Cao 	.release_dquot		= ext4_release_dquot,
1337617ba13bSMingming Cao 	.mark_dirty		= ext4_mark_dquot_dirty,
1338a5b5ee32SJan Kara 	.write_info		= ext4_write_info,
1339a5b5ee32SJan Kara 	.alloc_dquot		= dquot_alloc,
1340a5b5ee32SJan Kara 	.destroy_dquot		= dquot_destroy,
1341040cb378SLi Xi 	.get_projid		= ext4_get_projid,
13427a9ca53aSTahsin Erdogan 	.get_inode_usage	= ext4_get_inode_usage,
13438f0e8746STheodore Ts'o 	.get_next_id		= ext4_get_next_id,
1344ac27a0ecSDave Kleikamp };
1345ac27a0ecSDave Kleikamp 
13460d54b217SAlexey Dobriyan static const struct quotactl_ops ext4_qctl_operations = {
1347617ba13bSMingming Cao 	.quota_on	= ext4_quota_on,
1348ca0e05e4SDmitry Monakhov 	.quota_off	= ext4_quota_off,
1349287a8095SChristoph Hellwig 	.quota_sync	= dquot_quota_sync,
13500a240339SJan Kara 	.get_state	= dquot_get_state,
1351287a8095SChristoph Hellwig 	.set_info	= dquot_set_dqinfo,
1352287a8095SChristoph Hellwig 	.get_dqblk	= dquot_get_dqblk,
13536332b9b5SEric Sandeen 	.set_dqblk	= dquot_set_dqblk,
13546332b9b5SEric Sandeen 	.get_nextdqblk	= dquot_get_next_dqblk,
1355ac27a0ecSDave Kleikamp };
1356ac27a0ecSDave Kleikamp #endif
1357ac27a0ecSDave Kleikamp 
1358ee9b6d61SJosef 'Jeff' Sipek static const struct super_operations ext4_sops = {
1359617ba13bSMingming Cao 	.alloc_inode	= ext4_alloc_inode,
1360617ba13bSMingming Cao 	.destroy_inode	= ext4_destroy_inode,
1361617ba13bSMingming Cao 	.write_inode	= ext4_write_inode,
1362617ba13bSMingming Cao 	.dirty_inode	= ext4_dirty_inode,
13637ff9c073STheodore Ts'o 	.drop_inode	= ext4_drop_inode,
13640930fcc1SAl Viro 	.evict_inode	= ext4_evict_inode,
1365617ba13bSMingming Cao 	.put_super	= ext4_put_super,
1366617ba13bSMingming Cao 	.sync_fs	= ext4_sync_fs,
1367c4be0c1dSTakashi Sato 	.freeze_fs	= ext4_freeze,
1368c4be0c1dSTakashi Sato 	.unfreeze_fs	= ext4_unfreeze,
1369617ba13bSMingming Cao 	.statfs		= ext4_statfs,
1370617ba13bSMingming Cao 	.remount_fs	= ext4_remount,
1371617ba13bSMingming Cao 	.show_options	= ext4_show_options,
1372ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
1373617ba13bSMingming Cao 	.quota_read	= ext4_quota_read,
1374617ba13bSMingming Cao 	.quota_write	= ext4_quota_write,
137596c7e0d9SJan Kara 	.get_dquots	= ext4_get_dquots,
1376ac27a0ecSDave Kleikamp #endif
1377c39a7f84SToshiyuki Okajima 	.bdev_try_to_free_page = bdev_try_to_free_page,
1378ac27a0ecSDave Kleikamp };
1379ac27a0ecSDave Kleikamp 
138039655164SChristoph Hellwig static const struct export_operations ext4_export_ops = {
13811b961ac0SChristoph Hellwig 	.fh_to_dentry = ext4_fh_to_dentry,
13821b961ac0SChristoph Hellwig 	.fh_to_parent = ext4_fh_to_parent,
1383617ba13bSMingming Cao 	.get_parent = ext4_get_parent,
1384ac27a0ecSDave Kleikamp };
1385ac27a0ecSDave Kleikamp 
/*
 * Token identifiers for mount options.  The "tokens" pattern table maps
 * option strings to these values and ext4_mount_opts[] describes how most of
 * them are applied.  Opt_err terminates both tables.
 */
enum {
	Opt_bsd_df, Opt_minix_df,
	Opt_grpid, Opt_nogrpid,
	Opt_resgid, Opt_resuid,
	Opt_sb,
	Opt_err_cont, Opt_err_panic, Opt_err_ro,
	Opt_nouid32, Opt_debug, Opt_removed,
	Opt_user_xattr, Opt_nouser_xattr,
	Opt_acl, Opt_noacl,
	Opt_auto_da_alloc, Opt_noauto_da_alloc,
	Opt_noload,
	Opt_commit, Opt_min_batch_time, Opt_max_batch_time,
	Opt_journal_dev, Opt_journal_path,
	Opt_journal_checksum, Opt_journal_async_commit,
	Opt_abort,
	Opt_data_journal, Opt_data_ordered, Opt_data_writeback,
	Opt_data_err_abort, Opt_data_err_ignore,
	Opt_test_dummy_encryption,
	Opt_usrjquota, Opt_grpjquota,
	Opt_offusrjquota, Opt_offgrpjquota,
	Opt_jqfmt_vfsold, Opt_jqfmt_vfsv0, Opt_jqfmt_vfsv1,
	Opt_quota, Opt_noquota,
	Opt_barrier, Opt_nobarrier,
	Opt_err,
	Opt_usrquota, Opt_grpquota, Opt_prjquota,
	Opt_i_version, Opt_dax, Opt_stripe,
	Opt_delalloc, Opt_nodelalloc,
	Opt_warn_on_error, Opt_nowarn_on_error,
	Opt_mblk_io_submit,
	Opt_lazytime, Opt_nolazytime,
	Opt_debug_want_extra_isize,
	Opt_nomblk_io_submit,
	Opt_block_validity, Opt_noblock_validity,
	Opt_inode_readahead_blks, Opt_journal_ioprio,
	Opt_dioread_nolock, Opt_dioread_lock,
	Opt_discard, Opt_nodiscard,
	Opt_init_itable, Opt_noinit_itable,
	Opt_max_dir_size_kb, Opt_nojournal_checksum, Opt_nombcache,
};
1409ac27a0ecSDave Kleikamp 
1410a447c093SSteven Whitehouse static const match_table_t tokens = {
1411ac27a0ecSDave Kleikamp 	{Opt_bsd_df, "bsddf"},
1412ac27a0ecSDave Kleikamp 	{Opt_minix_df, "minixdf"},
1413ac27a0ecSDave Kleikamp 	{Opt_grpid, "grpid"},
1414ac27a0ecSDave Kleikamp 	{Opt_grpid, "bsdgroups"},
1415ac27a0ecSDave Kleikamp 	{Opt_nogrpid, "nogrpid"},
1416ac27a0ecSDave Kleikamp 	{Opt_nogrpid, "sysvgroups"},
1417ac27a0ecSDave Kleikamp 	{Opt_resgid, "resgid=%u"},
1418ac27a0ecSDave Kleikamp 	{Opt_resuid, "resuid=%u"},
1419ac27a0ecSDave Kleikamp 	{Opt_sb, "sb=%u"},
1420ac27a0ecSDave Kleikamp 	{Opt_err_cont, "errors=continue"},
1421ac27a0ecSDave Kleikamp 	{Opt_err_panic, "errors=panic"},
1422ac27a0ecSDave Kleikamp 	{Opt_err_ro, "errors=remount-ro"},
1423ac27a0ecSDave Kleikamp 	{Opt_nouid32, "nouid32"},
1424ac27a0ecSDave Kleikamp 	{Opt_debug, "debug"},
142572578c33STheodore Ts'o 	{Opt_removed, "oldalloc"},
142672578c33STheodore Ts'o 	{Opt_removed, "orlov"},
1427ac27a0ecSDave Kleikamp 	{Opt_user_xattr, "user_xattr"},
1428ac27a0ecSDave Kleikamp 	{Opt_nouser_xattr, "nouser_xattr"},
1429ac27a0ecSDave Kleikamp 	{Opt_acl, "acl"},
1430ac27a0ecSDave Kleikamp 	{Opt_noacl, "noacl"},
1431e3bb52aeSEric Sandeen 	{Opt_noload, "norecovery"},
14325a916be1STheodore Ts'o 	{Opt_noload, "noload"},
143372578c33STheodore Ts'o 	{Opt_removed, "nobh"},
143472578c33STheodore Ts'o 	{Opt_removed, "bh"},
1435ac27a0ecSDave Kleikamp 	{Opt_commit, "commit=%u"},
143630773840STheodore Ts'o 	{Opt_min_batch_time, "min_batch_time=%u"},
143730773840STheodore Ts'o 	{Opt_max_batch_time, "max_batch_time=%u"},
1438ac27a0ecSDave Kleikamp 	{Opt_journal_dev, "journal_dev=%u"},
1439ad4eec61SEric Sandeen 	{Opt_journal_path, "journal_path=%s"},
1440818d276cSGirish Shilamkar 	{Opt_journal_checksum, "journal_checksum"},
1441c6d3d56dSDarrick J. Wong 	{Opt_nojournal_checksum, "nojournal_checksum"},
1442818d276cSGirish Shilamkar 	{Opt_journal_async_commit, "journal_async_commit"},
1443ac27a0ecSDave Kleikamp 	{Opt_abort, "abort"},
1444ac27a0ecSDave Kleikamp 	{Opt_data_journal, "data=journal"},
1445ac27a0ecSDave Kleikamp 	{Opt_data_ordered, "data=ordered"},
1446ac27a0ecSDave Kleikamp 	{Opt_data_writeback, "data=writeback"},
14475bf5683aSHidehiro Kawai 	{Opt_data_err_abort, "data_err=abort"},
14485bf5683aSHidehiro Kawai 	{Opt_data_err_ignore, "data_err=ignore"},
1449ac27a0ecSDave Kleikamp 	{Opt_offusrjquota, "usrjquota="},
1450ac27a0ecSDave Kleikamp 	{Opt_usrjquota, "usrjquota=%s"},
1451ac27a0ecSDave Kleikamp 	{Opt_offgrpjquota, "grpjquota="},
1452ac27a0ecSDave Kleikamp 	{Opt_grpjquota, "grpjquota=%s"},
1453ac27a0ecSDave Kleikamp 	{Opt_jqfmt_vfsold, "jqfmt=vfsold"},
1454ac27a0ecSDave Kleikamp 	{Opt_jqfmt_vfsv0, "jqfmt=vfsv0"},
14555a20bdfcSJan Kara 	{Opt_jqfmt_vfsv1, "jqfmt=vfsv1"},
1456ac27a0ecSDave Kleikamp 	{Opt_grpquota, "grpquota"},
1457ac27a0ecSDave Kleikamp 	{Opt_noquota, "noquota"},
1458ac27a0ecSDave Kleikamp 	{Opt_quota, "quota"},
1459ac27a0ecSDave Kleikamp 	{Opt_usrquota, "usrquota"},
146049da9392SJan Kara 	{Opt_prjquota, "prjquota"},
1461ac27a0ecSDave Kleikamp 	{Opt_barrier, "barrier=%u"},
146206705bffSTheodore Ts'o 	{Opt_barrier, "barrier"},
146306705bffSTheodore Ts'o 	{Opt_nobarrier, "nobarrier"},
146425ec56b5SJean Noel Cordenner 	{Opt_i_version, "i_version"},
1465923ae0ffSRoss Zwisler 	{Opt_dax, "dax"},
1466c9de560dSAlex Tomas 	{Opt_stripe, "stripe=%u"},
146764769240SAlex Tomas 	{Opt_delalloc, "delalloc"},
1468327eaf73STheodore Ts'o 	{Opt_warn_on_error, "warn_on_error"},
1469327eaf73STheodore Ts'o 	{Opt_nowarn_on_error, "nowarn_on_error"},
1470a26f4992STheodore Ts'o 	{Opt_lazytime, "lazytime"},
1471a26f4992STheodore Ts'o 	{Opt_nolazytime, "nolazytime"},
1472670e9875STheodore Ts'o 	{Opt_debug_want_extra_isize, "debug_want_extra_isize=%u"},
1473dd919b98SAneesh Kumar K.V 	{Opt_nodelalloc, "nodelalloc"},
147436ade451SJan Kara 	{Opt_removed, "mblk_io_submit"},
147536ade451SJan Kara 	{Opt_removed, "nomblk_io_submit"},
14766fd058f7STheodore Ts'o 	{Opt_block_validity, "block_validity"},
14776fd058f7STheodore Ts'o 	{Opt_noblock_validity, "noblock_validity"},
1478240799cdSTheodore Ts'o 	{Opt_inode_readahead_blks, "inode_readahead_blks=%u"},
1479b3881f74STheodore Ts'o 	{Opt_journal_ioprio, "journal_ioprio=%u"},
1480afd4672dSTheodore Ts'o 	{Opt_auto_da_alloc, "auto_da_alloc=%u"},
148106705bffSTheodore Ts'o 	{Opt_auto_da_alloc, "auto_da_alloc"},
148206705bffSTheodore Ts'o 	{Opt_noauto_da_alloc, "noauto_da_alloc"},
1483744692dcSJiaying Zhang 	{Opt_dioread_nolock, "dioread_nolock"},
1484744692dcSJiaying Zhang 	{Opt_dioread_lock, "dioread_lock"},
14855328e635SEric Sandeen 	{Opt_discard, "discard"},
14865328e635SEric Sandeen 	{Opt_nodiscard, "nodiscard"},
1487fc6cb1cdSTheodore Ts'o 	{Opt_init_itable, "init_itable=%u"},
1488fc6cb1cdSTheodore Ts'o 	{Opt_init_itable, "init_itable"},
1489fc6cb1cdSTheodore Ts'o 	{Opt_noinit_itable, "noinit_itable"},
1490df981d03STheodore Ts'o 	{Opt_max_dir_size_kb, "max_dir_size_kb=%u"},
14916ddb2447STheodore Ts'o 	{Opt_test_dummy_encryption, "test_dummy_encryption"},
1492cdb7ee4cSTahsin Erdogan 	{Opt_nombcache, "nombcache"},
1493cdb7ee4cSTahsin Erdogan 	{Opt_nombcache, "no_mbcache"},	/* for backward compatibility */
1494c7198b9cSTheodore Ts'o 	{Opt_removed, "check=none"},	/* mount option from ext2/3 */
1495c7198b9cSTheodore Ts'o 	{Opt_removed, "nocheck"},	/* mount option from ext2/3 */
1496c7198b9cSTheodore Ts'o 	{Opt_removed, "reservation"},	/* mount option from ext2/3 */
1497c7198b9cSTheodore Ts'o 	{Opt_removed, "noreservation"}, /* mount option from ext2/3 */
1498c7198b9cSTheodore Ts'o 	{Opt_removed, "journal=%u"},	/* mount option from ext2/3 */
1499f3f12faaSJosef Bacik 	{Opt_err, NULL},
1500ac27a0ecSDave Kleikamp };
1501ac27a0ecSDave Kleikamp 
1502617ba13bSMingming Cao static ext4_fsblk_t get_sb_block(void **data)
1503ac27a0ecSDave Kleikamp {
1504617ba13bSMingming Cao 	ext4_fsblk_t	sb_block;
1505ac27a0ecSDave Kleikamp 	char		*options = (char *) *data;
1506ac27a0ecSDave Kleikamp 
1507ac27a0ecSDave Kleikamp 	if (!options || strncmp(options, "sb=", 3) != 0)
1508ac27a0ecSDave Kleikamp 		return 1;	/* Default location */
15090b8e58a1SAndreas Dilger 
1510ac27a0ecSDave Kleikamp 	options += 3;
15110b8e58a1SAndreas Dilger 	/* TODO: use simple_strtoll with >32bit ext4 */
1512ac27a0ecSDave Kleikamp 	sb_block = simple_strtoul(options, &options, 0);
1513ac27a0ecSDave Kleikamp 	if (*options && *options != ',') {
15144776004fSTheodore Ts'o 		printk(KERN_ERR "EXT4-fs: Invalid sb specification: %s\n",
1515ac27a0ecSDave Kleikamp 		       (char *) *data);
1516ac27a0ecSDave Kleikamp 		return 1;
1517ac27a0ecSDave Kleikamp 	}
1518ac27a0ecSDave Kleikamp 	if (*options == ',')
1519ac27a0ecSDave Kleikamp 		options++;
1520ac27a0ecSDave Kleikamp 	*data = (void *) options;
15210b8e58a1SAndreas Dilger 
1522ac27a0ecSDave Kleikamp 	return sb_block;
1523ac27a0ecSDave Kleikamp }
1524ac27a0ecSDave Kleikamp 
/* Default journal I/O priority: best-effort class, level 3. */
#define DEFAULT_JOURNAL_IOPRIO (IOPRIO_PRIO_VALUE(IOPRIO_CLASS_BE, 3))

/*
 * Format string for the warning about a deprecated mount option.  It takes
 * two %s arguments: the option text, then what follows "will be removed by".
 */
static const char deprecated_msg[] =
	"Mount option \"%s\" will be removed by %s\n"
	"Contact linux-ext4@vger.kernel.org if you think we should keep it.\n";
1529b3881f74STheodore Ts'o 
153056c50f11SDmitry Monakhov #ifdef CONFIG_QUOTA
153156c50f11SDmitry Monakhov static int set_qf_name(struct super_block *sb, int qtype, substring_t *args)
153256c50f11SDmitry Monakhov {
153356c50f11SDmitry Monakhov 	struct ext4_sb_info *sbi = EXT4_SB(sb);
153456c50f11SDmitry Monakhov 	char *qname;
153503dafb5fSChen Gang 	int ret = -1;
153656c50f11SDmitry Monakhov 
153756c50f11SDmitry Monakhov 	if (sb_any_quota_loaded(sb) &&
153856c50f11SDmitry Monakhov 		!sbi->s_qf_names[qtype]) {
153956c50f11SDmitry Monakhov 		ext4_msg(sb, KERN_ERR,
154056c50f11SDmitry Monakhov 			"Cannot change journaled "
154156c50f11SDmitry Monakhov 			"quota options when quota turned on");
154257f73c2cSTheodore Ts'o 		return -1;
154356c50f11SDmitry Monakhov 	}
1544e2b911c5SDarrick J. Wong 	if (ext4_has_feature_quota(sb)) {
1545c325a67cSTheodore Ts'o 		ext4_msg(sb, KERN_INFO, "Journaled quota options "
1546c325a67cSTheodore Ts'o 			 "ignored when QUOTA feature is enabled");
1547c325a67cSTheodore Ts'o 		return 1;
1548262b4662SJan Kara 	}
154956c50f11SDmitry Monakhov 	qname = match_strdup(args);
155056c50f11SDmitry Monakhov 	if (!qname) {
155156c50f11SDmitry Monakhov 		ext4_msg(sb, KERN_ERR,
155256c50f11SDmitry Monakhov 			"Not enough memory for storing quotafile name");
155357f73c2cSTheodore Ts'o 		return -1;
155456c50f11SDmitry Monakhov 	}
155503dafb5fSChen Gang 	if (sbi->s_qf_names[qtype]) {
155603dafb5fSChen Gang 		if (strcmp(sbi->s_qf_names[qtype], qname) == 0)
155703dafb5fSChen Gang 			ret = 1;
155803dafb5fSChen Gang 		else
155956c50f11SDmitry Monakhov 			ext4_msg(sb, KERN_ERR,
156003dafb5fSChen Gang 				 "%s quota file already specified",
156103dafb5fSChen Gang 				 QTYPE2NAME(qtype));
156203dafb5fSChen Gang 		goto errout;
156356c50f11SDmitry Monakhov 	}
156403dafb5fSChen Gang 	if (strchr(qname, '/')) {
156556c50f11SDmitry Monakhov 		ext4_msg(sb, KERN_ERR,
156656c50f11SDmitry Monakhov 			"quotafile must be on filesystem root");
156703dafb5fSChen Gang 		goto errout;
156856c50f11SDmitry Monakhov 	}
156903dafb5fSChen Gang 	sbi->s_qf_names[qtype] = qname;
1570fd8c37ecSTheodore Ts'o 	set_opt(sb, QUOTA);
157156c50f11SDmitry Monakhov 	return 1;
157203dafb5fSChen Gang errout:
157303dafb5fSChen Gang 	kfree(qname);
157403dafb5fSChen Gang 	return ret;
157556c50f11SDmitry Monakhov }
157656c50f11SDmitry Monakhov 
157756c50f11SDmitry Monakhov static int clear_qf_name(struct super_block *sb, int qtype)
157856c50f11SDmitry Monakhov {
157956c50f11SDmitry Monakhov 
158056c50f11SDmitry Monakhov 	struct ext4_sb_info *sbi = EXT4_SB(sb);
158156c50f11SDmitry Monakhov 
158256c50f11SDmitry Monakhov 	if (sb_any_quota_loaded(sb) &&
158356c50f11SDmitry Monakhov 		sbi->s_qf_names[qtype]) {
158456c50f11SDmitry Monakhov 		ext4_msg(sb, KERN_ERR, "Cannot change journaled quota options"
158556c50f11SDmitry Monakhov 			" when quota turned on");
158657f73c2cSTheodore Ts'o 		return -1;
158756c50f11SDmitry Monakhov 	}
158803dafb5fSChen Gang 	kfree(sbi->s_qf_names[qtype]);
158956c50f11SDmitry Monakhov 	sbi->s_qf_names[qtype] = NULL;
159056c50f11SDmitry Monakhov 	return 1;
159156c50f11SDmitry Monakhov }
159256c50f11SDmitry Monakhov #endif
159356c50f11SDmitry Monakhov 
/*
 * Bits for the "flags" member of struct mount_opts.  Each entry of
 * ext4_mount_opts[] combines these to describe how its option is handled.
 */
#define MOPT_SET	0x0001
#define MOPT_CLEAR	0x0002
#define MOPT_NOSUPPORT	0x0004
#define MOPT_EXPLICIT	0x0008
#define MOPT_CLEAR_ERR	0x0010
#define MOPT_GTE0	0x0020
#define MOPT_DATAJ	0x0080
#define MOPT_NO_EXT2	0x0100
#define MOPT_NO_EXT3	0x0200
#define MOPT_EXT4_ONLY	(MOPT_NO_EXT2 | MOPT_NO_EXT3)
#define MOPT_STRING	0x0400

/*
 * Quota-related flags.  Without CONFIG_QUOTA both collapse to
 * MOPT_NOSUPPORT; with it, MOPT_Q adds no bit and MOPT_QFMT has its own.
 */
#ifdef CONFIG_QUOTA
#define MOPT_Q		0
#define MOPT_QFMT	0x0040
#else
#define MOPT_Q		MOPT_NOSUPPORT
#define MOPT_QFMT	MOPT_NOSUPPORT
#endif
161226092bf5STheodore Ts'o 
161326092bf5STheodore Ts'o static const struct mount_opts {
161426092bf5STheodore Ts'o 	int	token;
161526092bf5STheodore Ts'o 	int	mount_opt;
161626092bf5STheodore Ts'o 	int	flags;
161726092bf5STheodore Ts'o } ext4_mount_opts[] = {
161826092bf5STheodore Ts'o 	{Opt_minix_df, EXT4_MOUNT_MINIX_DF, MOPT_SET},
161926092bf5STheodore Ts'o 	{Opt_bsd_df, EXT4_MOUNT_MINIX_DF, MOPT_CLEAR},
162026092bf5STheodore Ts'o 	{Opt_grpid, EXT4_MOUNT_GRPID, MOPT_SET},
162126092bf5STheodore Ts'o 	{Opt_nogrpid, EXT4_MOUNT_GRPID, MOPT_CLEAR},
162226092bf5STheodore Ts'o 	{Opt_block_validity, EXT4_MOUNT_BLOCK_VALIDITY, MOPT_SET},
162326092bf5STheodore Ts'o 	{Opt_noblock_validity, EXT4_MOUNT_BLOCK_VALIDITY, MOPT_CLEAR},
16248dc0aa8cSTheodore Ts'o 	{Opt_dioread_nolock, EXT4_MOUNT_DIOREAD_NOLOCK,
16258dc0aa8cSTheodore Ts'o 	 MOPT_EXT4_ONLY | MOPT_SET},
16268dc0aa8cSTheodore Ts'o 	{Opt_dioread_lock, EXT4_MOUNT_DIOREAD_NOLOCK,
16278dc0aa8cSTheodore Ts'o 	 MOPT_EXT4_ONLY | MOPT_CLEAR},
162826092bf5STheodore Ts'o 	{Opt_discard, EXT4_MOUNT_DISCARD, MOPT_SET},
162926092bf5STheodore Ts'o 	{Opt_nodiscard, EXT4_MOUNT_DISCARD, MOPT_CLEAR},
16308dc0aa8cSTheodore Ts'o 	{Opt_delalloc, EXT4_MOUNT_DELALLOC,
16318dc0aa8cSTheodore Ts'o 	 MOPT_EXT4_ONLY | MOPT_SET | MOPT_EXPLICIT},
16328dc0aa8cSTheodore Ts'o 	{Opt_nodelalloc, EXT4_MOUNT_DELALLOC,
163359d9fa5cSTheodore Ts'o 	 MOPT_EXT4_ONLY | MOPT_CLEAR},
1634327eaf73STheodore Ts'o 	{Opt_warn_on_error, EXT4_MOUNT_WARN_ON_ERROR, MOPT_SET},
1635327eaf73STheodore Ts'o 	{Opt_nowarn_on_error, EXT4_MOUNT_WARN_ON_ERROR, MOPT_CLEAR},
1636c6d3d56dSDarrick J. Wong 	{Opt_nojournal_checksum, EXT4_MOUNT_JOURNAL_CHECKSUM,
1637c6d3d56dSDarrick J. Wong 	 MOPT_EXT4_ONLY | MOPT_CLEAR},
16388dc0aa8cSTheodore Ts'o 	{Opt_journal_checksum, EXT4_MOUNT_JOURNAL_CHECKSUM,
16391e381f60SDmitry Monakhov 	 MOPT_EXT4_ONLY | MOPT_SET | MOPT_EXPLICIT},
164026092bf5STheodore Ts'o 	{Opt_journal_async_commit, (EXT4_MOUNT_JOURNAL_ASYNC_COMMIT |
16418dc0aa8cSTheodore Ts'o 				    EXT4_MOUNT_JOURNAL_CHECKSUM),
16421e381f60SDmitry Monakhov 	 MOPT_EXT4_ONLY | MOPT_SET | MOPT_EXPLICIT},
16438dc0aa8cSTheodore Ts'o 	{Opt_noload, EXT4_MOUNT_NOLOAD, MOPT_NO_EXT2 | MOPT_SET},
164426092bf5STheodore Ts'o 	{Opt_err_panic, EXT4_MOUNT_ERRORS_PANIC, MOPT_SET | MOPT_CLEAR_ERR},
164526092bf5STheodore Ts'o 	{Opt_err_ro, EXT4_MOUNT_ERRORS_RO, MOPT_SET | MOPT_CLEAR_ERR},
164626092bf5STheodore Ts'o 	{Opt_err_cont, EXT4_MOUNT_ERRORS_CONT, MOPT_SET | MOPT_CLEAR_ERR},
16478dc0aa8cSTheodore Ts'o 	{Opt_data_err_abort, EXT4_MOUNT_DATA_ERR_ABORT,
16487915a861SAles Novak 	 MOPT_NO_EXT2},
16498dc0aa8cSTheodore Ts'o 	{Opt_data_err_ignore, EXT4_MOUNT_DATA_ERR_ABORT,
16507915a861SAles Novak 	 MOPT_NO_EXT2},
165126092bf5STheodore Ts'o 	{Opt_barrier, EXT4_MOUNT_BARRIER, MOPT_SET},
165226092bf5STheodore Ts'o 	{Opt_nobarrier, EXT4_MOUNT_BARRIER, MOPT_CLEAR},
165326092bf5STheodore Ts'o 	{Opt_noauto_da_alloc, EXT4_MOUNT_NO_AUTO_DA_ALLOC, MOPT_SET},
165426092bf5STheodore Ts'o 	{Opt_auto_da_alloc, EXT4_MOUNT_NO_AUTO_DA_ALLOC, MOPT_CLEAR},
165526092bf5STheodore Ts'o 	{Opt_noinit_itable, EXT4_MOUNT_INIT_INODE_TABLE, MOPT_CLEAR},
165626092bf5STheodore Ts'o 	{Opt_commit, 0, MOPT_GTE0},
165726092bf5STheodore Ts'o 	{Opt_max_batch_time, 0, MOPT_GTE0},
165826092bf5STheodore Ts'o 	{Opt_min_batch_time, 0, MOPT_GTE0},
165926092bf5STheodore Ts'o 	{Opt_inode_readahead_blks, 0, MOPT_GTE0},
166026092bf5STheodore Ts'o 	{Opt_init_itable, 0, MOPT_GTE0},
1661923ae0ffSRoss Zwisler 	{Opt_dax, EXT4_MOUNT_DAX, MOPT_SET},
166226092bf5STheodore Ts'o 	{Opt_stripe, 0, MOPT_GTE0},
16630efb3b23SJan Kara 	{Opt_resuid, 0, MOPT_GTE0},
16640efb3b23SJan Kara 	{Opt_resgid, 0, MOPT_GTE0},
16655ba92bcfSCarlos Maiolino 	{Opt_journal_dev, 0, MOPT_NO_EXT2 | MOPT_GTE0},
16665ba92bcfSCarlos Maiolino 	{Opt_journal_path, 0, MOPT_NO_EXT2 | MOPT_STRING},
16675ba92bcfSCarlos Maiolino 	{Opt_journal_ioprio, 0, MOPT_NO_EXT2 | MOPT_GTE0},
16688dc0aa8cSTheodore Ts'o 	{Opt_data_journal, EXT4_MOUNT_JOURNAL_DATA, MOPT_NO_EXT2 | MOPT_DATAJ},
16698dc0aa8cSTheodore Ts'o 	{Opt_data_ordered, EXT4_MOUNT_ORDERED_DATA, MOPT_NO_EXT2 | MOPT_DATAJ},
16708dc0aa8cSTheodore Ts'o 	{Opt_data_writeback, EXT4_MOUNT_WRITEBACK_DATA,
16718dc0aa8cSTheodore Ts'o 	 MOPT_NO_EXT2 | MOPT_DATAJ},
167226092bf5STheodore Ts'o 	{Opt_user_xattr, EXT4_MOUNT_XATTR_USER, MOPT_SET},
167326092bf5STheodore Ts'o 	{Opt_nouser_xattr, EXT4_MOUNT_XATTR_USER, MOPT_CLEAR},
167426092bf5STheodore Ts'o #ifdef CONFIG_EXT4_FS_POSIX_ACL
167526092bf5STheodore Ts'o 	{Opt_acl, EXT4_MOUNT_POSIX_ACL, MOPT_SET},
167626092bf5STheodore Ts'o 	{Opt_noacl, EXT4_MOUNT_POSIX_ACL, MOPT_CLEAR},
167726092bf5STheodore Ts'o #else
167826092bf5STheodore Ts'o 	{Opt_acl, 0, MOPT_NOSUPPORT},
167926092bf5STheodore Ts'o 	{Opt_noacl, 0, MOPT_NOSUPPORT},
168026092bf5STheodore Ts'o #endif
168126092bf5STheodore Ts'o 	{Opt_nouid32, EXT4_MOUNT_NO_UID32, MOPT_SET},
168226092bf5STheodore Ts'o 	{Opt_debug, EXT4_MOUNT_DEBUG, MOPT_SET},
1683670e9875STheodore Ts'o 	{Opt_debug_want_extra_isize, 0, MOPT_GTE0},
168426092bf5STheodore Ts'o 	{Opt_quota, EXT4_MOUNT_QUOTA | EXT4_MOUNT_USRQUOTA, MOPT_SET | MOPT_Q},
168526092bf5STheodore Ts'o 	{Opt_usrquota, EXT4_MOUNT_QUOTA | EXT4_MOUNT_USRQUOTA,
168626092bf5STheodore Ts'o 							MOPT_SET | MOPT_Q},
168726092bf5STheodore Ts'o 	{Opt_grpquota, EXT4_MOUNT_QUOTA | EXT4_MOUNT_GRPQUOTA,
168826092bf5STheodore Ts'o 							MOPT_SET | MOPT_Q},
168949da9392SJan Kara 	{Opt_prjquota, EXT4_MOUNT_QUOTA | EXT4_MOUNT_PRJQUOTA,
169049da9392SJan Kara 							MOPT_SET | MOPT_Q},
169126092bf5STheodore Ts'o 	{Opt_noquota, (EXT4_MOUNT_QUOTA | EXT4_MOUNT_USRQUOTA |
169249da9392SJan Kara 		       EXT4_MOUNT_GRPQUOTA | EXT4_MOUNT_PRJQUOTA),
169349da9392SJan Kara 							MOPT_CLEAR | MOPT_Q},
169426092bf5STheodore Ts'o 	{Opt_usrjquota, 0, MOPT_Q},
169526092bf5STheodore Ts'o 	{Opt_grpjquota, 0, MOPT_Q},
169626092bf5STheodore Ts'o 	{Opt_offusrjquota, 0, MOPT_Q},
169726092bf5STheodore Ts'o 	{Opt_offgrpjquota, 0, MOPT_Q},
169826092bf5STheodore Ts'o 	{Opt_jqfmt_vfsold, QFMT_VFS_OLD, MOPT_QFMT},
169926092bf5STheodore Ts'o 	{Opt_jqfmt_vfsv0, QFMT_VFS_V0, MOPT_QFMT},
170026092bf5STheodore Ts'o 	{Opt_jqfmt_vfsv1, QFMT_VFS_V1, MOPT_QFMT},
1701df981d03STheodore Ts'o 	{Opt_max_dir_size_kb, 0, MOPT_GTE0},
17026ddb2447STheodore Ts'o 	{Opt_test_dummy_encryption, 0, MOPT_GTE0},
1703cdb7ee4cSTahsin Erdogan 	{Opt_nombcache, EXT4_MOUNT_NO_MBCACHE, MOPT_SET},
170426092bf5STheodore Ts'o 	{Opt_err, 0, 0}
170526092bf5STheodore Ts'o };
170626092bf5STheodore Ts'o 
170726092bf5STheodore Ts'o static int handle_mount_opt(struct super_block *sb, char *opt, int token,
170826092bf5STheodore Ts'o 			    substring_t *args, unsigned long *journal_devnum,
170926092bf5STheodore Ts'o 			    unsigned int *journal_ioprio, int is_remount)
171026092bf5STheodore Ts'o {
171126092bf5STheodore Ts'o 	struct ext4_sb_info *sbi = EXT4_SB(sb);
171226092bf5STheodore Ts'o 	const struct mount_opts *m;
171308cefc7aSEric W. Biederman 	kuid_t uid;
171408cefc7aSEric W. Biederman 	kgid_t gid;
171526092bf5STheodore Ts'o 	int arg = 0;
171626092bf5STheodore Ts'o 
171757f73c2cSTheodore Ts'o #ifdef CONFIG_QUOTA
171857f73c2cSTheodore Ts'o 	if (token == Opt_usrjquota)
171957f73c2cSTheodore Ts'o 		return set_qf_name(sb, USRQUOTA, &args[0]);
172057f73c2cSTheodore Ts'o 	else if (token == Opt_grpjquota)
172157f73c2cSTheodore Ts'o 		return set_qf_name(sb, GRPQUOTA, &args[0]);
172257f73c2cSTheodore Ts'o 	else if (token == Opt_offusrjquota)
172357f73c2cSTheodore Ts'o 		return clear_qf_name(sb, USRQUOTA);
172457f73c2cSTheodore Ts'o 	else if (token == Opt_offgrpjquota)
172557f73c2cSTheodore Ts'o 		return clear_qf_name(sb, GRPQUOTA);
172657f73c2cSTheodore Ts'o #endif
172726092bf5STheodore Ts'o 	switch (token) {
1728f7048605STheodore Ts'o 	case Opt_noacl:
1729f7048605STheodore Ts'o 	case Opt_nouser_xattr:
1730f7048605STheodore Ts'o 		ext4_msg(sb, KERN_WARNING, deprecated_msg, opt, "3.5");
1731f7048605STheodore Ts'o 		break;
173226092bf5STheodore Ts'o 	case Opt_sb:
173326092bf5STheodore Ts'o 		return 1;	/* handled by get_sb_block() */
173426092bf5STheodore Ts'o 	case Opt_removed:
17355f3633e3SJan Kara 		ext4_msg(sb, KERN_WARNING, "Ignoring removed %s option", opt);
173626092bf5STheodore Ts'o 		return 1;
173726092bf5STheodore Ts'o 	case Opt_abort:
173826092bf5STheodore Ts'o 		sbi->s_mount_flags |= EXT4_MF_FS_ABORTED;
173926092bf5STheodore Ts'o 		return 1;
174026092bf5STheodore Ts'o 	case Opt_i_version:
1741357fdad0SMatthew Garrett 		sb->s_flags |= SB_I_VERSION;
174226092bf5STheodore Ts'o 		return 1;
1743a26f4992STheodore Ts'o 	case Opt_lazytime:
17441751e8a6SLinus Torvalds 		sb->s_flags |= SB_LAZYTIME;
1745a26f4992STheodore Ts'o 		return 1;
1746a26f4992STheodore Ts'o 	case Opt_nolazytime:
17471751e8a6SLinus Torvalds 		sb->s_flags &= ~SB_LAZYTIME;
1748a26f4992STheodore Ts'o 		return 1;
174926092bf5STheodore Ts'o 	}
175026092bf5STheodore Ts'o 
17515f3633e3SJan Kara 	for (m = ext4_mount_opts; m->token != Opt_err; m++)
17525f3633e3SJan Kara 		if (token == m->token)
17535f3633e3SJan Kara 			break;
17545f3633e3SJan Kara 
17555f3633e3SJan Kara 	if (m->token == Opt_err) {
17565f3633e3SJan Kara 		ext4_msg(sb, KERN_ERR, "Unrecognized mount option \"%s\" "
17575f3633e3SJan Kara 			 "or missing value", opt);
17585f3633e3SJan Kara 		return -1;
17595f3633e3SJan Kara 	}
17605f3633e3SJan Kara 
17618dc0aa8cSTheodore Ts'o 	if ((m->flags & MOPT_NO_EXT2) && IS_EXT2_SB(sb)) {
17628dc0aa8cSTheodore Ts'o 		ext4_msg(sb, KERN_ERR,
17638dc0aa8cSTheodore Ts'o 			 "Mount option \"%s\" incompatible with ext2", opt);
17648dc0aa8cSTheodore Ts'o 		return -1;
17658dc0aa8cSTheodore Ts'o 	}
17668dc0aa8cSTheodore Ts'o 	if ((m->flags & MOPT_NO_EXT3) && IS_EXT3_SB(sb)) {
17678dc0aa8cSTheodore Ts'o 		ext4_msg(sb, KERN_ERR,
17688dc0aa8cSTheodore Ts'o 			 "Mount option \"%s\" incompatible with ext3", opt);
17698dc0aa8cSTheodore Ts'o 		return -1;
17708dc0aa8cSTheodore Ts'o 	}
17718dc0aa8cSTheodore Ts'o 
1772ad4eec61SEric Sandeen 	if (args->from && !(m->flags & MOPT_STRING) && match_int(args, &arg))
17730efb3b23SJan Kara 		return -1;
177426092bf5STheodore Ts'o 	if (args->from && (m->flags & MOPT_GTE0) && (arg < 0))
177526092bf5STheodore Ts'o 		return -1;
1776c93cf2d7SDmitry Monakhov 	if (m->flags & MOPT_EXPLICIT) {
1777c93cf2d7SDmitry Monakhov 		if (m->mount_opt & EXT4_MOUNT_DELALLOC) {
177826092bf5STheodore Ts'o 			set_opt2(sb, EXPLICIT_DELALLOC);
17791e381f60SDmitry Monakhov 		} else if (m->mount_opt & EXT4_MOUNT_JOURNAL_CHECKSUM) {
17801e381f60SDmitry Monakhov 			set_opt2(sb, EXPLICIT_JOURNAL_CHECKSUM);
1781c93cf2d7SDmitry Monakhov 		} else
1782c93cf2d7SDmitry Monakhov 			return -1;
1783c93cf2d7SDmitry Monakhov 	}
178426092bf5STheodore Ts'o 	if (m->flags & MOPT_CLEAR_ERR)
178526092bf5STheodore Ts'o 		clear_opt(sb, ERRORS_MASK);
178626092bf5STheodore Ts'o 	if (token == Opt_noquota && sb_any_quota_loaded(sb)) {
178726092bf5STheodore Ts'o 		ext4_msg(sb, KERN_ERR, "Cannot change quota "
178826092bf5STheodore Ts'o 			 "options when quota turned on");
178926092bf5STheodore Ts'o 		return -1;
179026092bf5STheodore Ts'o 	}
179126092bf5STheodore Ts'o 
179226092bf5STheodore Ts'o 	if (m->flags & MOPT_NOSUPPORT) {
179326092bf5STheodore Ts'o 		ext4_msg(sb, KERN_ERR, "%s option not supported", opt);
179426092bf5STheodore Ts'o 	} else if (token == Opt_commit) {
179526092bf5STheodore Ts'o 		if (arg == 0)
179626092bf5STheodore Ts'o 			arg = JBD2_DEFAULT_MAX_COMMIT_AGE;
179726092bf5STheodore Ts'o 		sbi->s_commit_interval = HZ * arg;
1798670e9875STheodore Ts'o 	} else if (token == Opt_debug_want_extra_isize) {
1799670e9875STheodore Ts'o 		sbi->s_want_extra_isize = arg;
180026092bf5STheodore Ts'o 	} else if (token == Opt_max_batch_time) {
180126092bf5STheodore Ts'o 		sbi->s_max_batch_time = arg;
180226092bf5STheodore Ts'o 	} else if (token == Opt_min_batch_time) {
180326092bf5STheodore Ts'o 		sbi->s_min_batch_time = arg;
180426092bf5STheodore Ts'o 	} else if (token == Opt_inode_readahead_blks) {
1805e33e60eaSJan Kara 		if (arg && (arg > (1 << 30) || !is_power_of_2(arg))) {
1806e33e60eaSJan Kara 			ext4_msg(sb, KERN_ERR,
1807e33e60eaSJan Kara 				 "EXT4-fs: inode_readahead_blks must be "
1808e33e60eaSJan Kara 				 "0 or a power of 2 smaller than 2^31");
180926092bf5STheodore Ts'o 			return -1;
181026092bf5STheodore Ts'o 		}
181126092bf5STheodore Ts'o 		sbi->s_inode_readahead_blks = arg;
181226092bf5STheodore Ts'o 	} else if (token == Opt_init_itable) {
181326092bf5STheodore Ts'o 		set_opt(sb, INIT_INODE_TABLE);
181426092bf5STheodore Ts'o 		if (!args->from)
181526092bf5STheodore Ts'o 			arg = EXT4_DEF_LI_WAIT_MULT;
181626092bf5STheodore Ts'o 		sbi->s_li_wait_mult = arg;
1817df981d03STheodore Ts'o 	} else if (token == Opt_max_dir_size_kb) {
1818df981d03STheodore Ts'o 		sbi->s_max_dir_size_kb = arg;
181926092bf5STheodore Ts'o 	} else if (token == Opt_stripe) {
182026092bf5STheodore Ts'o 		sbi->s_stripe = arg;
18210efb3b23SJan Kara 	} else if (token == Opt_resuid) {
18220efb3b23SJan Kara 		uid = make_kuid(current_user_ns(), arg);
18230efb3b23SJan Kara 		if (!uid_valid(uid)) {
18245f3633e3SJan Kara 			ext4_msg(sb, KERN_ERR, "Invalid uid value %d", arg);
18250efb3b23SJan Kara 			return -1;
18260efb3b23SJan Kara 		}
18270efb3b23SJan Kara 		sbi->s_resuid = uid;
18280efb3b23SJan Kara 	} else if (token == Opt_resgid) {
18290efb3b23SJan Kara 		gid = make_kgid(current_user_ns(), arg);
18300efb3b23SJan Kara 		if (!gid_valid(gid)) {
18315f3633e3SJan Kara 			ext4_msg(sb, KERN_ERR, "Invalid gid value %d", arg);
18320efb3b23SJan Kara 			return -1;
18330efb3b23SJan Kara 		}
18340efb3b23SJan Kara 		sbi->s_resgid = gid;
18350efb3b23SJan Kara 	} else if (token == Opt_journal_dev) {
18360efb3b23SJan Kara 		if (is_remount) {
18370efb3b23SJan Kara 			ext4_msg(sb, KERN_ERR,
18380efb3b23SJan Kara 				 "Cannot specify journal on remount");
18390efb3b23SJan Kara 			return -1;
18400efb3b23SJan Kara 		}
18410efb3b23SJan Kara 		*journal_devnum = arg;
1842ad4eec61SEric Sandeen 	} else if (token == Opt_journal_path) {
1843ad4eec61SEric Sandeen 		char *journal_path;
1844ad4eec61SEric Sandeen 		struct inode *journal_inode;
1845ad4eec61SEric Sandeen 		struct path path;
1846ad4eec61SEric Sandeen 		int error;
1847ad4eec61SEric Sandeen 
1848ad4eec61SEric Sandeen 		if (is_remount) {
1849ad4eec61SEric Sandeen 			ext4_msg(sb, KERN_ERR,
1850ad4eec61SEric Sandeen 				 "Cannot specify journal on remount");
1851ad4eec61SEric Sandeen 			return -1;
1852ad4eec61SEric Sandeen 		}
1853ad4eec61SEric Sandeen 		journal_path = match_strdup(&args[0]);
1854ad4eec61SEric Sandeen 		if (!journal_path) {
1855ad4eec61SEric Sandeen 			ext4_msg(sb, KERN_ERR, "error: could not dup "
1856ad4eec61SEric Sandeen 				"journal device string");
1857ad4eec61SEric Sandeen 			return -1;
1858ad4eec61SEric Sandeen 		}
1859ad4eec61SEric Sandeen 
1860ad4eec61SEric Sandeen 		error = kern_path(journal_path, LOOKUP_FOLLOW, &path);
1861ad4eec61SEric Sandeen 		if (error) {
1862ad4eec61SEric Sandeen 			ext4_msg(sb, KERN_ERR, "error: could not find "
1863ad4eec61SEric Sandeen 				"journal device path: error %d", error);
1864ad4eec61SEric Sandeen 			kfree(journal_path);
1865ad4eec61SEric Sandeen 			return -1;
1866ad4eec61SEric Sandeen 		}
1867ad4eec61SEric Sandeen 
18682b0143b5SDavid Howells 		journal_inode = d_inode(path.dentry);
1869ad4eec61SEric Sandeen 		if (!S_ISBLK(journal_inode->i_mode)) {
1870ad4eec61SEric Sandeen 			ext4_msg(sb, KERN_ERR, "error: journal path %s "
1871ad4eec61SEric Sandeen 				"is not a block device", journal_path);
1872ad4eec61SEric Sandeen 			path_put(&path);
1873ad4eec61SEric Sandeen 			kfree(journal_path);
1874ad4eec61SEric Sandeen 			return -1;
1875ad4eec61SEric Sandeen 		}
1876ad4eec61SEric Sandeen 
1877ad4eec61SEric Sandeen 		*journal_devnum = new_encode_dev(journal_inode->i_rdev);
1878ad4eec61SEric Sandeen 		path_put(&path);
1879ad4eec61SEric Sandeen 		kfree(journal_path);
18800efb3b23SJan Kara 	} else if (token == Opt_journal_ioprio) {
18810efb3b23SJan Kara 		if (arg > 7) {
18825f3633e3SJan Kara 			ext4_msg(sb, KERN_ERR, "Invalid journal IO priority"
18830efb3b23SJan Kara 				 " (must be 0-7)");
18840efb3b23SJan Kara 			return -1;
18850efb3b23SJan Kara 		}
18860efb3b23SJan Kara 		*journal_ioprio =
18870efb3b23SJan Kara 			IOPRIO_PRIO_VALUE(IOPRIO_CLASS_BE, arg);
18886ddb2447STheodore Ts'o 	} else if (token == Opt_test_dummy_encryption) {
18896ddb2447STheodore Ts'o #ifdef CONFIG_EXT4_FS_ENCRYPTION
18906ddb2447STheodore Ts'o 		sbi->s_mount_flags |= EXT4_MF_TEST_DUMMY_ENCRYPTION;
18916ddb2447STheodore Ts'o 		ext4_msg(sb, KERN_WARNING,
18926ddb2447STheodore Ts'o 			 "Test dummy encryption mode enabled");
18936ddb2447STheodore Ts'o #else
18946ddb2447STheodore Ts'o 		ext4_msg(sb, KERN_WARNING,
18956ddb2447STheodore Ts'o 			 "Test dummy encryption mount option ignored");
18966ddb2447STheodore Ts'o #endif
189726092bf5STheodore Ts'o 	} else if (m->flags & MOPT_DATAJ) {
189826092bf5STheodore Ts'o 		if (is_remount) {
189926092bf5STheodore Ts'o 			if (!sbi->s_journal)
190026092bf5STheodore Ts'o 				ext4_msg(sb, KERN_WARNING, "Remounting file system with no journal so ignoring journalled data option");
19015f3633e3SJan Kara 			else if (test_opt(sb, DATA_FLAGS) != m->mount_opt) {
190226092bf5STheodore Ts'o 				ext4_msg(sb, KERN_ERR,
190326092bf5STheodore Ts'o 					 "Cannot change data mode on remount");
190426092bf5STheodore Ts'o 				return -1;
190526092bf5STheodore Ts'o 			}
190626092bf5STheodore Ts'o 		} else {
190726092bf5STheodore Ts'o 			clear_opt(sb, DATA_FLAGS);
190826092bf5STheodore Ts'o 			sbi->s_mount_opt |= m->mount_opt;
190926092bf5STheodore Ts'o 		}
191026092bf5STheodore Ts'o #ifdef CONFIG_QUOTA
191126092bf5STheodore Ts'o 	} else if (m->flags & MOPT_QFMT) {
191226092bf5STheodore Ts'o 		if (sb_any_quota_loaded(sb) &&
191326092bf5STheodore Ts'o 		    sbi->s_jquota_fmt != m->mount_opt) {
19145f3633e3SJan Kara 			ext4_msg(sb, KERN_ERR, "Cannot change journaled "
19155f3633e3SJan Kara 				 "quota options when quota turned on");
191626092bf5STheodore Ts'o 			return -1;
191726092bf5STheodore Ts'o 		}
1918e2b911c5SDarrick J. Wong 		if (ext4_has_feature_quota(sb)) {
1919c325a67cSTheodore Ts'o 			ext4_msg(sb, KERN_INFO,
1920c325a67cSTheodore Ts'o 				 "Quota format mount options ignored "
1921262b4662SJan Kara 				 "when QUOTA feature is enabled");
1922c325a67cSTheodore Ts'o 			return 1;
1923262b4662SJan Kara 		}
192426092bf5STheodore Ts'o 		sbi->s_jquota_fmt = m->mount_opt;
192526092bf5STheodore Ts'o #endif
1926923ae0ffSRoss Zwisler 	} else if (token == Opt_dax) {
1927ef83b6e8SDan Williams #ifdef CONFIG_FS_DAX
1928ef83b6e8SDan Williams 		ext4_msg(sb, KERN_WARNING,
1929ef83b6e8SDan Williams 		"DAX enabled. Warning: EXPERIMENTAL, use at your own risk");
1930ef83b6e8SDan Williams 			sbi->s_mount_opt |= m->mount_opt;
1931ef83b6e8SDan Williams #else
1932923ae0ffSRoss Zwisler 		ext4_msg(sb, KERN_INFO, "dax option not supported");
1933923ae0ffSRoss Zwisler 		return -1;
1934923ae0ffSRoss Zwisler #endif
19357915a861SAles Novak 	} else if (token == Opt_data_err_abort) {
19367915a861SAles Novak 		sbi->s_mount_opt |= m->mount_opt;
19377915a861SAles Novak 	} else if (token == Opt_data_err_ignore) {
19387915a861SAles Novak 		sbi->s_mount_opt &= ~m->mount_opt;
193926092bf5STheodore Ts'o 	} else {
194026092bf5STheodore Ts'o 		if (!args->from)
194126092bf5STheodore Ts'o 			arg = 1;
194226092bf5STheodore Ts'o 		if (m->flags & MOPT_CLEAR)
194326092bf5STheodore Ts'o 			arg = !arg;
194426092bf5STheodore Ts'o 		else if (unlikely(!(m->flags & MOPT_SET))) {
194526092bf5STheodore Ts'o 			ext4_msg(sb, KERN_WARNING,
194626092bf5STheodore Ts'o 				 "buggy handling of option %s", opt);
194726092bf5STheodore Ts'o 			WARN_ON(1);
194826092bf5STheodore Ts'o 			return -1;
194926092bf5STheodore Ts'o 		}
195026092bf5STheodore Ts'o 		if (arg != 0)
195126092bf5STheodore Ts'o 			sbi->s_mount_opt |= m->mount_opt;
195226092bf5STheodore Ts'o 		else
195326092bf5STheodore Ts'o 			sbi->s_mount_opt &= ~m->mount_opt;
195426092bf5STheodore Ts'o 	}
195526092bf5STheodore Ts'o 	return 1;
195626092bf5STheodore Ts'o }
195726092bf5STheodore Ts'o 
1958ac27a0ecSDave Kleikamp static int parse_options(char *options, struct super_block *sb,
1959c3191067STheodore Ts'o 			 unsigned long *journal_devnum,
1960b3881f74STheodore Ts'o 			 unsigned int *journal_ioprio,
1961661aa520SEric Sandeen 			 int is_remount)
1962ac27a0ecSDave Kleikamp {
1963617ba13bSMingming Cao 	struct ext4_sb_info *sbi = EXT4_SB(sb);
1964ac27a0ecSDave Kleikamp 	char *p;
1965ac27a0ecSDave Kleikamp 	substring_t args[MAX_OPT_ARGS];
196626092bf5STheodore Ts'o 	int token;
1967ac27a0ecSDave Kleikamp 
1968ac27a0ecSDave Kleikamp 	if (!options)
1969ac27a0ecSDave Kleikamp 		return 1;
1970ac27a0ecSDave Kleikamp 
1971ac27a0ecSDave Kleikamp 	while ((p = strsep(&options, ",")) != NULL) {
1972ac27a0ecSDave Kleikamp 		if (!*p)
1973ac27a0ecSDave Kleikamp 			continue;
197415121c18SEric Sandeen 		/*
197515121c18SEric Sandeen 		 * Initialize args struct so we know whether arg was
197615121c18SEric Sandeen 		 * found; some options take optional arguments.
197715121c18SEric Sandeen 		 */
1978caecd0afSSachin Kamat 		args[0].to = args[0].from = NULL;
1979ac27a0ecSDave Kleikamp 		token = match_token(p, tokens, args);
198026092bf5STheodore Ts'o 		if (handle_mount_opt(sb, p, token, args, journal_devnum,
198126092bf5STheodore Ts'o 				     journal_ioprio, is_remount) < 0)
1982ac27a0ecSDave Kleikamp 			return 0;
1983ac27a0ecSDave Kleikamp 	}
1984ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
198549da9392SJan Kara 	/*
198649da9392SJan Kara 	 * We do the test below only for project quotas. 'usrquota' and
198749da9392SJan Kara 	 * 'grpquota' mount options are allowed even without quota feature
198849da9392SJan Kara 	 * to support legacy quotas in quota files.
198949da9392SJan Kara 	 */
199049da9392SJan Kara 	if (test_opt(sb, PRJQUOTA) && !ext4_has_feature_project(sb)) {
199149da9392SJan Kara 		ext4_msg(sb, KERN_ERR, "Project quota feature not enabled. "
199249da9392SJan Kara 			 "Cannot enable project quota enforcement.");
199349da9392SJan Kara 		return 0;
199449da9392SJan Kara 	}
199549da9392SJan Kara 	if (sbi->s_qf_names[USRQUOTA] || sbi->s_qf_names[GRPQUOTA]) {
1996482a7425SDmitry Monakhov 		if (test_opt(sb, USRQUOTA) && sbi->s_qf_names[USRQUOTA])
1997fd8c37ecSTheodore Ts'o 			clear_opt(sb, USRQUOTA);
1998ac27a0ecSDave Kleikamp 
1999482a7425SDmitry Monakhov 		if (test_opt(sb, GRPQUOTA) && sbi->s_qf_names[GRPQUOTA])
2000fd8c37ecSTheodore Ts'o 			clear_opt(sb, GRPQUOTA);
2001ac27a0ecSDave Kleikamp 
200256c50f11SDmitry Monakhov 		if (test_opt(sb, GRPQUOTA) || test_opt(sb, USRQUOTA)) {
2003b31e1552SEric Sandeen 			ext4_msg(sb, KERN_ERR, "old and new quota "
2004b31e1552SEric Sandeen 					"format mixing");
2005ac27a0ecSDave Kleikamp 			return 0;
2006ac27a0ecSDave Kleikamp 		}
2007ac27a0ecSDave Kleikamp 
2008ac27a0ecSDave Kleikamp 		if (!sbi->s_jquota_fmt) {
2009b31e1552SEric Sandeen 			ext4_msg(sb, KERN_ERR, "journaled quota format "
2010b31e1552SEric Sandeen 					"not specified");
2011ac27a0ecSDave Kleikamp 			return 0;
2012ac27a0ecSDave Kleikamp 		}
2013ac27a0ecSDave Kleikamp 	}
2014ac27a0ecSDave Kleikamp #endif
2015261cb20cSJan Kara 	if (test_opt(sb, DIOREAD_NOLOCK)) {
2016261cb20cSJan Kara 		int blocksize =
2017261cb20cSJan Kara 			BLOCK_SIZE << le32_to_cpu(sbi->s_es->s_log_block_size);
2018261cb20cSJan Kara 
201909cbfeafSKirill A. Shutemov 		if (blocksize < PAGE_SIZE) {
2020261cb20cSJan Kara 			ext4_msg(sb, KERN_ERR, "can't mount with "
2021261cb20cSJan Kara 				 "dioread_nolock if block size != PAGE_SIZE");
2022261cb20cSJan Kara 			return 0;
2023261cb20cSJan Kara 		}
2024261cb20cSJan Kara 	}
2025ac27a0ecSDave Kleikamp 	return 1;
2026ac27a0ecSDave Kleikamp }
2027ac27a0ecSDave Kleikamp 
/*
 * Append the journaled-quota related options (jqfmt=, usrjquota=,
 * grpjquota=) that are currently set on @sb to @seq.  Compiles to an empty
 * function when CONFIG_QUOTA is not defined.
 */
static inline void ext4_show_quota_options(struct seq_file *seq,
					   struct super_block *sb)
{
#if defined(CONFIG_QUOTA)
	struct ext4_sb_info *sbi = EXT4_SB(sb);

	if (sbi->s_jquota_fmt) {
		/* Unknown format values are printed with an empty name. */
		char *name = "";

		if (sbi->s_jquota_fmt == QFMT_VFS_OLD)
			name = "vfsold";
		else if (sbi->s_jquota_fmt == QFMT_VFS_V0)
			name = "vfsv0";
		else if (sbi->s_jquota_fmt == QFMT_VFS_V1)
			name = "vfsv1";

		seq_printf(seq, ",jqfmt=%s", name);
	}

	if (sbi->s_qf_names[USRQUOTA])
		seq_show_option(seq, "usrjquota", sbi->s_qf_names[USRQUOTA]);

	if (sbi->s_qf_names[GRPQUOTA])
		seq_show_option(seq, "grpjquota", sbi->s_qf_names[GRPQUOTA]);
#endif
}
20582adf6da8STheodore Ts'o 
20595a916be1STheodore Ts'o static const char *token2str(int token)
20605a916be1STheodore Ts'o {
206150df9fd5SHerton Ronaldo Krzesinski 	const struct match_token *t;
20625a916be1STheodore Ts'o 
20635a916be1STheodore Ts'o 	for (t = tokens; t->token != Opt_err; t++)
20645a916be1STheodore Ts'o 		if (t->token == token && !strchr(t->pattern, '='))
20655a916be1STheodore Ts'o 			break;
20665a916be1STheodore Ts'o 	return t->pattern;
20675a916be1STheodore Ts'o }
20685a916be1STheodore Ts'o 
20692adf6da8STheodore Ts'o /*
20702adf6da8STheodore Ts'o  * Show an option if
20712adf6da8STheodore Ts'o  *  - it's set to a non-default value OR
20722adf6da8STheodore Ts'o  *  - if the per-sb default is different from the global default
20732adf6da8STheodore Ts'o  */
207466acdcf4STheodore Ts'o static int _ext4_show_options(struct seq_file *seq, struct super_block *sb,
207566acdcf4STheodore Ts'o 			      int nodefs)
20762adf6da8STheodore Ts'o {
20772adf6da8STheodore Ts'o 	struct ext4_sb_info *sbi = EXT4_SB(sb);
20782adf6da8STheodore Ts'o 	struct ext4_super_block *es = sbi->s_es;
207968afa7e0STyson Nottingham 	int def_errors, def_mount_opt = sbi->s_def_mount_opt;
20805a916be1STheodore Ts'o 	const struct mount_opts *m;
208166acdcf4STheodore Ts'o 	char sep = nodefs ? '\n' : ',';
20822adf6da8STheodore Ts'o 
208366acdcf4STheodore Ts'o #define SEQ_OPTS_PUTS(str) seq_printf(seq, "%c" str, sep)
208466acdcf4STheodore Ts'o #define SEQ_OPTS_PRINT(str, arg) seq_printf(seq, "%c" str, sep, arg)
20852adf6da8STheodore Ts'o 
20862adf6da8STheodore Ts'o 	if (sbi->s_sb_block != 1)
20875a916be1STheodore Ts'o 		SEQ_OPTS_PRINT("sb=%llu", sbi->s_sb_block);
20885a916be1STheodore Ts'o 
20895a916be1STheodore Ts'o 	for (m = ext4_mount_opts; m->token != Opt_err; m++) {
20905a916be1STheodore Ts'o 		int want_set = m->flags & MOPT_SET;
20915a916be1STheodore Ts'o 		if (((m->flags & (MOPT_SET|MOPT_CLEAR)) == 0) ||
20925a916be1STheodore Ts'o 		    (m->flags & MOPT_CLEAR_ERR))
20935a916be1STheodore Ts'o 			continue;
209468afa7e0STyson Nottingham 		if (!nodefs && !(m->mount_opt & (sbi->s_mount_opt ^ def_mount_opt)))
20955a916be1STheodore Ts'o 			continue; /* skip if same as the default */
20965a916be1STheodore Ts'o 		if ((want_set &&
20975a916be1STheodore Ts'o 		     (sbi->s_mount_opt & m->mount_opt) != m->mount_opt) ||
20985a916be1STheodore Ts'o 		    (!want_set && (sbi->s_mount_opt & m->mount_opt)))
20995a916be1STheodore Ts'o 			continue; /* select Opt_noFoo vs Opt_Foo */
21005a916be1STheodore Ts'o 		SEQ_OPTS_PRINT("%s", token2str(m->token));
21015a916be1STheodore Ts'o 	}
21025a916be1STheodore Ts'o 
210308cefc7aSEric W. Biederman 	if (nodefs || !uid_eq(sbi->s_resuid, make_kuid(&init_user_ns, EXT4_DEF_RESUID)) ||
21045a916be1STheodore Ts'o 	    le16_to_cpu(es->s_def_resuid) != EXT4_DEF_RESUID)
210508cefc7aSEric W. Biederman 		SEQ_OPTS_PRINT("resuid=%u",
210608cefc7aSEric W. Biederman 				from_kuid_munged(&init_user_ns, sbi->s_resuid));
210708cefc7aSEric W. Biederman 	if (nodefs || !gid_eq(sbi->s_resgid, make_kgid(&init_user_ns, EXT4_DEF_RESGID)) ||
21085a916be1STheodore Ts'o 	    le16_to_cpu(es->s_def_resgid) != EXT4_DEF_RESGID)
210908cefc7aSEric W. Biederman 		SEQ_OPTS_PRINT("resgid=%u",
211008cefc7aSEric W. Biederman 				from_kgid_munged(&init_user_ns, sbi->s_resgid));
211166acdcf4STheodore Ts'o 	def_errors = nodefs ? -1 : le16_to_cpu(es->s_errors);
21125a916be1STheodore Ts'o 	if (test_opt(sb, ERRORS_RO) && def_errors != EXT4_ERRORS_RO)
21135a916be1STheodore Ts'o 		SEQ_OPTS_PUTS("errors=remount-ro");
21142adf6da8STheodore Ts'o 	if (test_opt(sb, ERRORS_CONT) && def_errors != EXT4_ERRORS_CONTINUE)
21155a916be1STheodore Ts'o 		SEQ_OPTS_PUTS("errors=continue");
21162adf6da8STheodore Ts'o 	if (test_opt(sb, ERRORS_PANIC) && def_errors != EXT4_ERRORS_PANIC)
21175a916be1STheodore Ts'o 		SEQ_OPTS_PUTS("errors=panic");
211866acdcf4STheodore Ts'o 	if (nodefs || sbi->s_commit_interval != JBD2_DEFAULT_MAX_COMMIT_AGE*HZ)
21195a916be1STheodore Ts'o 		SEQ_OPTS_PRINT("commit=%lu", sbi->s_commit_interval / HZ);
212066acdcf4STheodore Ts'o 	if (nodefs || sbi->s_min_batch_time != EXT4_DEF_MIN_BATCH_TIME)
21215a916be1STheodore Ts'o 		SEQ_OPTS_PRINT("min_batch_time=%u", sbi->s_min_batch_time);
212266acdcf4STheodore Ts'o 	if (nodefs || sbi->s_max_batch_time != EXT4_DEF_MAX_BATCH_TIME)
21235a916be1STheodore Ts'o 		SEQ_OPTS_PRINT("max_batch_time=%u", sbi->s_max_batch_time);
2124357fdad0SMatthew Garrett 	if (sb->s_flags & SB_I_VERSION)
21255a916be1STheodore Ts'o 		SEQ_OPTS_PUTS("i_version");
212666acdcf4STheodore Ts'o 	if (nodefs || sbi->s_stripe)
21275a916be1STheodore Ts'o 		SEQ_OPTS_PRINT("stripe=%lu", sbi->s_stripe);
212868afa7e0STyson Nottingham 	if (nodefs || EXT4_MOUNT_DATA_FLAGS &
212968afa7e0STyson Nottingham 			(sbi->s_mount_opt ^ def_mount_opt)) {
21302adf6da8STheodore Ts'o 		if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_JOURNAL_DATA)
21315a916be1STheodore Ts'o 			SEQ_OPTS_PUTS("data=journal");
21322adf6da8STheodore Ts'o 		else if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_ORDERED_DATA)
21335a916be1STheodore Ts'o 			SEQ_OPTS_PUTS("data=ordered");
21342adf6da8STheodore Ts'o 		else if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_WRITEBACK_DATA)
21355a916be1STheodore Ts'o 			SEQ_OPTS_PUTS("data=writeback");
21365a916be1STheodore Ts'o 	}
213766acdcf4STheodore Ts'o 	if (nodefs ||
213866acdcf4STheodore Ts'o 	    sbi->s_inode_readahead_blks != EXT4_DEF_INODE_READAHEAD_BLKS)
21395a916be1STheodore Ts'o 		SEQ_OPTS_PRINT("inode_readahead_blks=%u",
21402adf6da8STheodore Ts'o 			       sbi->s_inode_readahead_blks);
21412adf6da8STheodore Ts'o 
2142ceec0376STyson Nottingham 	if (test_opt(sb, INIT_INODE_TABLE) && (nodefs ||
214366acdcf4STheodore Ts'o 		       (sbi->s_li_wait_mult != EXT4_DEF_LI_WAIT_MULT)))
21445a916be1STheodore Ts'o 		SEQ_OPTS_PRINT("init_itable=%u", sbi->s_li_wait_mult);
2145df981d03STheodore Ts'o 	if (nodefs || sbi->s_max_dir_size_kb)
2146df981d03STheodore Ts'o 		SEQ_OPTS_PRINT("max_dir_size_kb=%u", sbi->s_max_dir_size_kb);
21477915a861SAles Novak 	if (test_opt(sb, DATA_ERR_ABORT))
21487915a861SAles Novak 		SEQ_OPTS_PUTS("data_err=abort");
2149338affb5SEric Biggers 	if (DUMMY_ENCRYPTION_ENABLED(sbi))
2150338affb5SEric Biggers 		SEQ_OPTS_PUTS("test_dummy_encryption");
21512adf6da8STheodore Ts'o 
21522adf6da8STheodore Ts'o 	ext4_show_quota_options(seq, sb);
21532adf6da8STheodore Ts'o 	return 0;
21542adf6da8STheodore Ts'o }
21552adf6da8STheodore Ts'o 
215666acdcf4STheodore Ts'o static int ext4_show_options(struct seq_file *seq, struct dentry *root)
215766acdcf4STheodore Ts'o {
215866acdcf4STheodore Ts'o 	return _ext4_show_options(seq, root->d_sb, 0);
215966acdcf4STheodore Ts'o }
216066acdcf4STheodore Ts'o 
2161ebd173beSTheodore Ts'o int ext4_seq_options_show(struct seq_file *seq, void *offset)
216266acdcf4STheodore Ts'o {
216366acdcf4STheodore Ts'o 	struct super_block *sb = seq->private;
216466acdcf4STheodore Ts'o 	int rc;
216566acdcf4STheodore Ts'o 
2166bc98a42cSDavid Howells 	seq_puts(seq, sb_rdonly(sb) ? "ro" : "rw");
216766acdcf4STheodore Ts'o 	rc = _ext4_show_options(seq, sb, 1);
216866acdcf4STheodore Ts'o 	seq_puts(seq, "\n");
216966acdcf4STheodore Ts'o 	return rc;
217066acdcf4STheodore Ts'o }
217166acdcf4STheodore Ts'o 
2172617ba13bSMingming Cao static int ext4_setup_super(struct super_block *sb, struct ext4_super_block *es,
2173ac27a0ecSDave Kleikamp 			    int read_only)
2174ac27a0ecSDave Kleikamp {
2175617ba13bSMingming Cao 	struct ext4_sb_info *sbi = EXT4_SB(sb);
2176c89128a0SJaegeuk Kim 	int err = 0;
2177ac27a0ecSDave Kleikamp 
2178617ba13bSMingming Cao 	if (le32_to_cpu(es->s_rev_level) > EXT4_MAX_SUPP_REV) {
2179b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "revision level too high, "
2180b31e1552SEric Sandeen 			 "forcing read-only mode");
2181c89128a0SJaegeuk Kim 		err = -EROFS;
2182ac27a0ecSDave Kleikamp 	}
2183ac27a0ecSDave Kleikamp 	if (read_only)
2184281b5995STheodore Ts'o 		goto done;
2185617ba13bSMingming Cao 	if (!(sbi->s_mount_state & EXT4_VALID_FS))
2186b31e1552SEric Sandeen 		ext4_msg(sb, KERN_WARNING, "warning: mounting unchecked fs, "
2187b31e1552SEric Sandeen 			 "running e2fsck is recommended");
2188c8b459f4SLukas Czerner 	else if (sbi->s_mount_state & EXT4_ERROR_FS)
2189b31e1552SEric Sandeen 		ext4_msg(sb, KERN_WARNING,
2190b31e1552SEric Sandeen 			 "warning: mounting fs with errors, "
2191b31e1552SEric Sandeen 			 "running e2fsck is recommended");
2192ed3ce80aSTao Ma 	else if ((__s16) le16_to_cpu(es->s_max_mnt_count) > 0 &&
2193ac27a0ecSDave Kleikamp 		 le16_to_cpu(es->s_mnt_count) >=
2194ac27a0ecSDave Kleikamp 		 (unsigned short) (__s16) le16_to_cpu(es->s_max_mnt_count))
2195b31e1552SEric Sandeen 		ext4_msg(sb, KERN_WARNING,
2196b31e1552SEric Sandeen 			 "warning: maximal mount count reached, "
2197b31e1552SEric Sandeen 			 "running e2fsck is recommended");
2198ac27a0ecSDave Kleikamp 	else if (le32_to_cpu(es->s_checkinterval) &&
21996a0678a7SArnd Bergmann 		 (ext4_get_tstamp(es, s_lastcheck) +
22006a0678a7SArnd Bergmann 		  le32_to_cpu(es->s_checkinterval) <= ktime_get_real_seconds()))
2201b31e1552SEric Sandeen 		ext4_msg(sb, KERN_WARNING,
2202b31e1552SEric Sandeen 			 "warning: checktime reached, "
2203b31e1552SEric Sandeen 			 "running e2fsck is recommended");
22040390131bSFrank Mayhar 	if (!sbi->s_journal)
2205216c34b2SMarcin Slusarz 		es->s_state &= cpu_to_le16(~EXT4_VALID_FS);
2206ac27a0ecSDave Kleikamp 	if (!(__s16) le16_to_cpu(es->s_max_mnt_count))
2207617ba13bSMingming Cao 		es->s_max_mnt_count = cpu_to_le16(EXT4_DFL_MAX_MNT_COUNT);
2208e8546d06SMarcin Slusarz 	le16_add_cpu(&es->s_mnt_count, 1);
22096a0678a7SArnd Bergmann 	ext4_update_tstamp(es, s_mtime);
2210617ba13bSMingming Cao 	ext4_update_dynamic_rev(sb);
22110390131bSFrank Mayhar 	if (sbi->s_journal)
2212e2b911c5SDarrick J. Wong 		ext4_set_feature_journal_needs_recovery(sb);
2213ac27a0ecSDave Kleikamp 
2214c89128a0SJaegeuk Kim 	err = ext4_commit_super(sb, 1);
2215281b5995STheodore Ts'o done:
2216ac27a0ecSDave Kleikamp 	if (test_opt(sb, DEBUG))
2217a9df9a49STheodore Ts'o 		printk(KERN_INFO "[EXT4 FS bs=%lu, gc=%u, "
2218a2595b8aSTheodore Ts'o 				"bpg=%lu, ipg=%lu, mo=%04x, mo2=%04x]\n",
2219ac27a0ecSDave Kleikamp 			sb->s_blocksize,
2220ac27a0ecSDave Kleikamp 			sbi->s_groups_count,
2221617ba13bSMingming Cao 			EXT4_BLOCKS_PER_GROUP(sb),
2222617ba13bSMingming Cao 			EXT4_INODES_PER_GROUP(sb),
2223a2595b8aSTheodore Ts'o 			sbi->s_mount_opt, sbi->s_mount_opt2);
2224ac27a0ecSDave Kleikamp 
22257abc52c2SDan Magenheimer 	cleancache_init_fs(sb);
2226c89128a0SJaegeuk Kim 	return err;
2227ac27a0ecSDave Kleikamp }
2228ac27a0ecSDave Kleikamp 
2229117fff10STheodore Ts'o int ext4_alloc_flex_bg_array(struct super_block *sb, ext4_group_t ngroup)
2230117fff10STheodore Ts'o {
2231117fff10STheodore Ts'o 	struct ext4_sb_info *sbi = EXT4_SB(sb);
2232117fff10STheodore Ts'o 	struct flex_groups *new_groups;
2233117fff10STheodore Ts'o 	int size;
2234117fff10STheodore Ts'o 
2235117fff10STheodore Ts'o 	if (!sbi->s_log_groups_per_flex)
2236117fff10STheodore Ts'o 		return 0;
2237117fff10STheodore Ts'o 
2238117fff10STheodore Ts'o 	size = ext4_flex_group(sbi, ngroup - 1) + 1;
2239117fff10STheodore Ts'o 	if (size <= sbi->s_flex_groups_allocated)
2240117fff10STheodore Ts'o 		return 0;
2241117fff10STheodore Ts'o 
2242117fff10STheodore Ts'o 	size = roundup_pow_of_two(size * sizeof(struct flex_groups));
2243a7c3e901SMichal Hocko 	new_groups = kvzalloc(size, GFP_KERNEL);
2244117fff10STheodore Ts'o 	if (!new_groups) {
2245117fff10STheodore Ts'o 		ext4_msg(sb, KERN_ERR, "not enough memory for %d flex groups",
2246117fff10STheodore Ts'o 			 size / (int) sizeof(struct flex_groups));
2247117fff10STheodore Ts'o 		return -ENOMEM;
2248117fff10STheodore Ts'o 	}
2249117fff10STheodore Ts'o 
2250117fff10STheodore Ts'o 	if (sbi->s_flex_groups) {
2251117fff10STheodore Ts'o 		memcpy(new_groups, sbi->s_flex_groups,
2252117fff10STheodore Ts'o 		       (sbi->s_flex_groups_allocated *
2253117fff10STheodore Ts'o 			sizeof(struct flex_groups)));
2254b93b41d4SAl Viro 		kvfree(sbi->s_flex_groups);
2255117fff10STheodore Ts'o 	}
2256117fff10STheodore Ts'o 	sbi->s_flex_groups = new_groups;
2257117fff10STheodore Ts'o 	sbi->s_flex_groups_allocated = size / sizeof(struct flex_groups);
2258117fff10STheodore Ts'o 	return 0;
2259117fff10STheodore Ts'o }
2260117fff10STheodore Ts'o 
2261772cb7c8SJose R. Santos static int ext4_fill_flex_info(struct super_block *sb)
2262772cb7c8SJose R. Santos {
2263772cb7c8SJose R. Santos 	struct ext4_sb_info *sbi = EXT4_SB(sb);
2264772cb7c8SJose R. Santos 	struct ext4_group_desc *gdp = NULL;
2265772cb7c8SJose R. Santos 	ext4_group_t flex_group;
2266117fff10STheodore Ts'o 	int i, err;
2267772cb7c8SJose R. Santos 
2268503358aeSTheodore Ts'o 	sbi->s_log_groups_per_flex = sbi->s_es->s_log_groups_per_flex;
2269d50f2ab6SXi Wang 	if (sbi->s_log_groups_per_flex < 1 || sbi->s_log_groups_per_flex > 31) {
2270772cb7c8SJose R. Santos 		sbi->s_log_groups_per_flex = 0;
2271772cb7c8SJose R. Santos 		return 1;
2272772cb7c8SJose R. Santos 	}
2273772cb7c8SJose R. Santos 
2274117fff10STheodore Ts'o 	err = ext4_alloc_flex_bg_array(sb, sbi->s_groups_count);
2275117fff10STheodore Ts'o 	if (err)
2276772cb7c8SJose R. Santos 		goto failed;
2277772cb7c8SJose R. Santos 
2278772cb7c8SJose R. Santos 	for (i = 0; i < sbi->s_groups_count; i++) {
227988b6edd1STheodore Ts'o 		gdp = ext4_get_group_desc(sb, i, NULL);
2280772cb7c8SJose R. Santos 
2281772cb7c8SJose R. Santos 		flex_group = ext4_flex_group(sbi, i);
22827ad9bb65STheodore Ts'o 		atomic_add(ext4_free_inodes_count(sb, gdp),
22837ad9bb65STheodore Ts'o 			   &sbi->s_flex_groups[flex_group].free_inodes);
228490ba983fSTheodore Ts'o 		atomic64_add(ext4_free_group_clusters(sb, gdp),
228524aaa8efSTheodore Ts'o 			     &sbi->s_flex_groups[flex_group].free_clusters);
22867ad9bb65STheodore Ts'o 		atomic_add(ext4_used_dirs_count(sb, gdp),
22877ad9bb65STheodore Ts'o 			   &sbi->s_flex_groups[flex_group].used_dirs);
2288772cb7c8SJose R. Santos 	}
2289772cb7c8SJose R. Santos 
2290772cb7c8SJose R. Santos 	return 1;
2291772cb7c8SJose R. Santos failed:
2292772cb7c8SJose R. Santos 	return 0;
2293772cb7c8SJose R. Santos }
2294772cb7c8SJose R. Santos 
2295e2b911c5SDarrick J. Wong static __le16 ext4_group_desc_csum(struct super_block *sb, __u32 block_group,
2296717d50e4SAndreas Dilger 				   struct ext4_group_desc *gdp)
2297717d50e4SAndreas Dilger {
2298b47820edSDaeho Jeong 	int offset = offsetof(struct ext4_group_desc, bg_checksum);
2299717d50e4SAndreas Dilger 	__u16 crc = 0;
2300717d50e4SAndreas Dilger 	__le32 le_group = cpu_to_le32(block_group);
2301e2b911c5SDarrick J. Wong 	struct ext4_sb_info *sbi = EXT4_SB(sb);
2302717d50e4SAndreas Dilger 
23039aa5d32bSDmitry Monakhov 	if (ext4_has_metadata_csum(sbi->s_sb)) {
2304feb0ab32SDarrick J. Wong 		/* Use new metadata_csum algorithm */
2305feb0ab32SDarrick J. Wong 		__u32 csum32;
2306b47820edSDaeho Jeong 		__u16 dummy_csum = 0;
2307feb0ab32SDarrick J. Wong 
2308feb0ab32SDarrick J. Wong 		csum32 = ext4_chksum(sbi, sbi->s_csum_seed, (__u8 *)&le_group,
2309feb0ab32SDarrick J. Wong 				     sizeof(le_group));
2310b47820edSDaeho Jeong 		csum32 = ext4_chksum(sbi, csum32, (__u8 *)gdp, offset);
2311b47820edSDaeho Jeong 		csum32 = ext4_chksum(sbi, csum32, (__u8 *)&dummy_csum,
2312b47820edSDaeho Jeong 				     sizeof(dummy_csum));
2313b47820edSDaeho Jeong 		offset += sizeof(dummy_csum);
2314b47820edSDaeho Jeong 		if (offset < sbi->s_desc_size)
2315b47820edSDaeho Jeong 			csum32 = ext4_chksum(sbi, csum32, (__u8 *)gdp + offset,
2316b47820edSDaeho Jeong 					     sbi->s_desc_size - offset);
2317feb0ab32SDarrick J. Wong 
2318feb0ab32SDarrick J. Wong 		crc = csum32 & 0xFFFF;
2319feb0ab32SDarrick J. Wong 		goto out;
2320feb0ab32SDarrick J. Wong 	}
2321feb0ab32SDarrick J. Wong 
2322feb0ab32SDarrick J. Wong 	/* old crc16 code */
2323e2b911c5SDarrick J. Wong 	if (!ext4_has_feature_gdt_csum(sb))
2324813d32f9SDarrick J. Wong 		return 0;
2325813d32f9SDarrick J. Wong 
2326717d50e4SAndreas Dilger 	crc = crc16(~0, sbi->s_es->s_uuid, sizeof(sbi->s_es->s_uuid));
2327717d50e4SAndreas Dilger 	crc = crc16(crc, (__u8 *)&le_group, sizeof(le_group));
2328717d50e4SAndreas Dilger 	crc = crc16(crc, (__u8 *)gdp, offset);
2329717d50e4SAndreas Dilger 	offset += sizeof(gdp->bg_checksum); /* skip checksum */
2330717d50e4SAndreas Dilger 	/* for checksum of struct ext4_group_desc do the rest...*/
2331e2b911c5SDarrick J. Wong 	if (ext4_has_feature_64bit(sb) &&
2332717d50e4SAndreas Dilger 	    offset < le16_to_cpu(sbi->s_es->s_desc_size))
2333717d50e4SAndreas Dilger 		crc = crc16(crc, (__u8 *)gdp + offset,
2334717d50e4SAndreas Dilger 			    le16_to_cpu(sbi->s_es->s_desc_size) -
2335717d50e4SAndreas Dilger 				offset);
2336717d50e4SAndreas Dilger 
2337feb0ab32SDarrick J. Wong out:
2338717d50e4SAndreas Dilger 	return cpu_to_le16(crc);
2339717d50e4SAndreas Dilger }
2340717d50e4SAndreas Dilger 
2341feb0ab32SDarrick J. Wong int ext4_group_desc_csum_verify(struct super_block *sb, __u32 block_group,
2342717d50e4SAndreas Dilger 				struct ext4_group_desc *gdp)
2343717d50e4SAndreas Dilger {
2344feb0ab32SDarrick J. Wong 	if (ext4_has_group_desc_csum(sb) &&
2345e2b911c5SDarrick J. Wong 	    (gdp->bg_checksum != ext4_group_desc_csum(sb, block_group, gdp)))
2346717d50e4SAndreas Dilger 		return 0;
2347717d50e4SAndreas Dilger 
2348717d50e4SAndreas Dilger 	return 1;
2349717d50e4SAndreas Dilger }
2350717d50e4SAndreas Dilger 
2351feb0ab32SDarrick J. Wong void ext4_group_desc_csum_set(struct super_block *sb, __u32 block_group,
2352feb0ab32SDarrick J. Wong 			      struct ext4_group_desc *gdp)
2353feb0ab32SDarrick J. Wong {
2354feb0ab32SDarrick J. Wong 	if (!ext4_has_group_desc_csum(sb))
2355feb0ab32SDarrick J. Wong 		return;
2356e2b911c5SDarrick J. Wong 	gdp->bg_checksum = ext4_group_desc_csum(sb, block_group, gdp);
2357feb0ab32SDarrick J. Wong }
2358feb0ab32SDarrick J. Wong 
2359ac27a0ecSDave Kleikamp /* Called at mount-time, super-block is locked */
2360bfff6873SLukas Czerner static int ext4_check_descriptors(struct super_block *sb,
2361829fa70dSTheodore Ts'o 				  ext4_fsblk_t sb_block,
2362bfff6873SLukas Czerner 				  ext4_group_t *first_not_zeroed)
2363ac27a0ecSDave Kleikamp {
2364617ba13bSMingming Cao 	struct ext4_sb_info *sbi = EXT4_SB(sb);
2365617ba13bSMingming Cao 	ext4_fsblk_t first_block = le32_to_cpu(sbi->s_es->s_first_data_block);
2366617ba13bSMingming Cao 	ext4_fsblk_t last_block;
236744de022cSTheodore Ts'o 	ext4_fsblk_t last_bg_block = sb_block + ext4_bg_num_gdb(sb, 0);
2368bd81d8eeSLaurent Vivier 	ext4_fsblk_t block_bitmap;
2369bd81d8eeSLaurent Vivier 	ext4_fsblk_t inode_bitmap;
2370bd81d8eeSLaurent Vivier 	ext4_fsblk_t inode_table;
2371ce421581SJose R. Santos 	int flexbg_flag = 0;
2372bfff6873SLukas Czerner 	ext4_group_t i, grp = sbi->s_groups_count;
2373ac27a0ecSDave Kleikamp 
2374e2b911c5SDarrick J. Wong 	if (ext4_has_feature_flex_bg(sb))
2375ce421581SJose R. Santos 		flexbg_flag = 1;
2376ce421581SJose R. Santos 
2377617ba13bSMingming Cao 	ext4_debug("Checking group descriptors");
2378ac27a0ecSDave Kleikamp 
2379197cd65aSAkinobu Mita 	for (i = 0; i < sbi->s_groups_count; i++) {
2380197cd65aSAkinobu Mita 		struct ext4_group_desc *gdp = ext4_get_group_desc(sb, i, NULL);
2381197cd65aSAkinobu Mita 
2382ce421581SJose R. Santos 		if (i == sbi->s_groups_count - 1 || flexbg_flag)
2383bd81d8eeSLaurent Vivier 			last_block = ext4_blocks_count(sbi->s_es) - 1;
2384ac27a0ecSDave Kleikamp 		else
2385ac27a0ecSDave Kleikamp 			last_block = first_block +
2386617ba13bSMingming Cao 				(EXT4_BLOCKS_PER_GROUP(sb) - 1);
2387ac27a0ecSDave Kleikamp 
2388bfff6873SLukas Czerner 		if ((grp == sbi->s_groups_count) &&
2389bfff6873SLukas Czerner 		   !(gdp->bg_flags & cpu_to_le16(EXT4_BG_INODE_ZEROED)))
2390bfff6873SLukas Czerner 			grp = i;
2391bfff6873SLukas Czerner 
23928fadc143SAlexandre Ratchov 		block_bitmap = ext4_block_bitmap(sb, gdp);
2393829fa70dSTheodore Ts'o 		if (block_bitmap == sb_block) {
2394829fa70dSTheodore Ts'o 			ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: "
2395829fa70dSTheodore Ts'o 				 "Block bitmap for group %u overlaps "
2396829fa70dSTheodore Ts'o 				 "superblock", i);
239718db4b4eSTheodore Ts'o 			if (!sb_rdonly(sb))
239818db4b4eSTheodore Ts'o 				return 0;
2399829fa70dSTheodore Ts'o 		}
240077260807STheodore Ts'o 		if (block_bitmap >= sb_block + 1 &&
240177260807STheodore Ts'o 		    block_bitmap <= last_bg_block) {
240277260807STheodore Ts'o 			ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: "
240377260807STheodore Ts'o 				 "Block bitmap for group %u overlaps "
240477260807STheodore Ts'o 				 "block group descriptors", i);
240577260807STheodore Ts'o 			if (!sb_rdonly(sb))
240677260807STheodore Ts'o 				return 0;
240777260807STheodore Ts'o 		}
24082b2d6d01STheodore Ts'o 		if (block_bitmap < first_block || block_bitmap > last_block) {
2409b31e1552SEric Sandeen 			ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: "
2410a9df9a49STheodore Ts'o 			       "Block bitmap for group %u not in group "
2411b31e1552SEric Sandeen 			       "(block %llu)!", i, block_bitmap);
2412ac27a0ecSDave Kleikamp 			return 0;
2413ac27a0ecSDave Kleikamp 		}
24148fadc143SAlexandre Ratchov 		inode_bitmap = ext4_inode_bitmap(sb, gdp);
2415829fa70dSTheodore Ts'o 		if (inode_bitmap == sb_block) {
2416829fa70dSTheodore Ts'o 			ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: "
2417829fa70dSTheodore Ts'o 				 "Inode bitmap for group %u overlaps "
2418829fa70dSTheodore Ts'o 				 "superblock", i);
241918db4b4eSTheodore Ts'o 			if (!sb_rdonly(sb))
242018db4b4eSTheodore Ts'o 				return 0;
2421829fa70dSTheodore Ts'o 		}
242277260807STheodore Ts'o 		if (inode_bitmap >= sb_block + 1 &&
242377260807STheodore Ts'o 		    inode_bitmap <= last_bg_block) {
242477260807STheodore Ts'o 			ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: "
242577260807STheodore Ts'o 				 "Inode bitmap for group %u overlaps "
242677260807STheodore Ts'o 				 "block group descriptors", i);
242777260807STheodore Ts'o 			if (!sb_rdonly(sb))
242877260807STheodore Ts'o 				return 0;
242977260807STheodore Ts'o 		}
24302b2d6d01STheodore Ts'o 		if (inode_bitmap < first_block || inode_bitmap > last_block) {
2431b31e1552SEric Sandeen 			ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: "
2432a9df9a49STheodore Ts'o 			       "Inode bitmap for group %u not in group "
2433b31e1552SEric Sandeen 			       "(block %llu)!", i, inode_bitmap);
2434ac27a0ecSDave Kleikamp 			return 0;
2435ac27a0ecSDave Kleikamp 		}
24368fadc143SAlexandre Ratchov 		inode_table = ext4_inode_table(sb, gdp);
2437829fa70dSTheodore Ts'o 		if (inode_table == sb_block) {
2438829fa70dSTheodore Ts'o 			ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: "
2439829fa70dSTheodore Ts'o 				 "Inode table for group %u overlaps "
2440829fa70dSTheodore Ts'o 				 "superblock", i);
244118db4b4eSTheodore Ts'o 			if (!sb_rdonly(sb))
244218db4b4eSTheodore Ts'o 				return 0;
2443829fa70dSTheodore Ts'o 		}
244477260807STheodore Ts'o 		if (inode_table >= sb_block + 1 &&
244577260807STheodore Ts'o 		    inode_table <= last_bg_block) {
244677260807STheodore Ts'o 			ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: "
244777260807STheodore Ts'o 				 "Inode table for group %u overlaps "
244877260807STheodore Ts'o 				 "block group descriptors", i);
244977260807STheodore Ts'o 			if (!sb_rdonly(sb))
245077260807STheodore Ts'o 				return 0;
245177260807STheodore Ts'o 		}
2452bd81d8eeSLaurent Vivier 		if (inode_table < first_block ||
24532b2d6d01STheodore Ts'o 		    inode_table + sbi->s_itb_per_group - 1 > last_block) {
2454b31e1552SEric Sandeen 			ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: "
2455a9df9a49STheodore Ts'o 			       "Inode table for group %u not in group "
2456b31e1552SEric Sandeen 			       "(block %llu)!", i, inode_table);
2457ac27a0ecSDave Kleikamp 			return 0;
2458ac27a0ecSDave Kleikamp 		}
2459955ce5f5SAneesh Kumar K.V 		ext4_lock_group(sb, i);
2460feb0ab32SDarrick J. Wong 		if (!ext4_group_desc_csum_verify(sb, i, gdp)) {
2461b31e1552SEric Sandeen 			ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: "
2462b31e1552SEric Sandeen 				 "Checksum for group %u failed (%u!=%u)",
2463e2b911c5SDarrick J. Wong 				 i, le16_to_cpu(ext4_group_desc_csum(sb, i,
2464fd2d4291SAvantika Mathur 				     gdp)), le16_to_cpu(gdp->bg_checksum));
2465bc98a42cSDavid Howells 			if (!sb_rdonly(sb)) {
2466955ce5f5SAneesh Kumar K.V 				ext4_unlock_group(sb, i);
2467717d50e4SAndreas Dilger 				return 0;
2468717d50e4SAndreas Dilger 			}
24697ee1ec4cSLi Zefan 		}
2470955ce5f5SAneesh Kumar K.V 		ext4_unlock_group(sb, i);
2471ce421581SJose R. Santos 		if (!flexbg_flag)
2472617ba13bSMingming Cao 			first_block += EXT4_BLOCKS_PER_GROUP(sb);
2473ac27a0ecSDave Kleikamp 	}
2474bfff6873SLukas Czerner 	if (NULL != first_not_zeroed)
2475bfff6873SLukas Czerner 		*first_not_zeroed = grp;
2476ac27a0ecSDave Kleikamp 	return 1;
2477ac27a0ecSDave Kleikamp }
2478ac27a0ecSDave Kleikamp 
2479617ba13bSMingming Cao /* ext4_orphan_cleanup() walks a singly-linked list of inodes (starting at
2480ac27a0ecSDave Kleikamp  * the superblock) which were deleted from all directories, but held open by
2481ac27a0ecSDave Kleikamp  * a process at the time of a crash.  We walk the list and try to delete these
2482ac27a0ecSDave Kleikamp  * inodes at recovery time (only with a read-write filesystem).
2483ac27a0ecSDave Kleikamp  *
2484ac27a0ecSDave Kleikamp  * In order to keep the orphan inode chain consistent during traversal (in
2485ac27a0ecSDave Kleikamp  * case of crash during recovery), we link each inode into the superblock
2486ac27a0ecSDave Kleikamp  * orphan list_head and handle it the same way as an inode deletion during
2487ac27a0ecSDave Kleikamp  * normal operation (which journals the operations for us).
2488ac27a0ecSDave Kleikamp  *
2489ac27a0ecSDave Kleikamp  * We only do an iget() and an iput() on each inode, which is very safe if we
2490ac27a0ecSDave Kleikamp  * accidentally point at an in-use or already deleted inode.  The worst that
2491ac27a0ecSDave Kleikamp  * can happen in this case is that we get a "bit already cleared" message from
2492617ba13bSMingming Cao  * ext4_free_inode().  The only reason we would point at a wrong inode is if
2493ac27a0ecSDave Kleikamp  * e2fsck was run on this filesystem, and it must have already done the orphan
2494ac27a0ecSDave Kleikamp  * inode cleanup for us, so we can safely abort without any further action.
2495ac27a0ecSDave Kleikamp  */
2496617ba13bSMingming Cao static void ext4_orphan_cleanup(struct super_block *sb,
2497617ba13bSMingming Cao 				struct ext4_super_block *es)
2498ac27a0ecSDave Kleikamp {
2499ac27a0ecSDave Kleikamp 	unsigned int s_flags = sb->s_flags;
25002c98eb5eSTheodore Ts'o 	int ret, nr_orphans = 0, nr_truncates = 0;
2501ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
250295f1fda4Szhangyi (F) 	int quota_update = 0;
2503ac27a0ecSDave Kleikamp 	int i;
2504ac27a0ecSDave Kleikamp #endif
2505ac27a0ecSDave Kleikamp 	if (!es->s_last_orphan) {
2506ac27a0ecSDave Kleikamp 		jbd_debug(4, "no orphan inodes to clean up\n");
2507ac27a0ecSDave Kleikamp 		return;
2508ac27a0ecSDave Kleikamp 	}
2509ac27a0ecSDave Kleikamp 
2510a8f48a95SEric Sandeen 	if (bdev_read_only(sb->s_bdev)) {
2511b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "write access "
2512b31e1552SEric Sandeen 			"unavailable, skipping orphan cleanup");
2513a8f48a95SEric Sandeen 		return;
2514a8f48a95SEric Sandeen 	}
2515a8f48a95SEric Sandeen 
2516d39195c3SAmir Goldstein 	/* Check if feature set would not allow a r/w mount */
2517d39195c3SAmir Goldstein 	if (!ext4_feature_set_ok(sb, 0)) {
2518d39195c3SAmir Goldstein 		ext4_msg(sb, KERN_INFO, "Skipping orphan cleanup due to "
2519d39195c3SAmir Goldstein 			 "unknown ROCOMPAT features");
2520d39195c3SAmir Goldstein 		return;
2521d39195c3SAmir Goldstein 	}
2522d39195c3SAmir Goldstein 
2523617ba13bSMingming Cao 	if (EXT4_SB(sb)->s_mount_state & EXT4_ERROR_FS) {
2524c25f9bc6SEric Sandeen 		/* don't clear list on RO mount w/ errors */
25251751e8a6SLinus Torvalds 		if (es->s_last_orphan && !(s_flags & SB_RDONLY)) {
252684474976SDmitry Monakhov 			ext4_msg(sb, KERN_INFO, "Errors on filesystem, "
2527ac27a0ecSDave Kleikamp 				  "clearing orphan list.\n");
2528ac27a0ecSDave Kleikamp 			es->s_last_orphan = 0;
2529c25f9bc6SEric Sandeen 		}
2530ac27a0ecSDave Kleikamp 		jbd_debug(1, "Skipping orphan recovery on fs with errors.\n");
2531ac27a0ecSDave Kleikamp 		return;
2532ac27a0ecSDave Kleikamp 	}
2533ac27a0ecSDave Kleikamp 
25341751e8a6SLinus Torvalds 	if (s_flags & SB_RDONLY) {
2535b31e1552SEric Sandeen 		ext4_msg(sb, KERN_INFO, "orphan cleanup on readonly fs");
25361751e8a6SLinus Torvalds 		sb->s_flags &= ~SB_RDONLY;
2537ac27a0ecSDave Kleikamp 	}
2538ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
2539ac27a0ecSDave Kleikamp 	/* Needed for iput() to work correctly and not trash data */
25401751e8a6SLinus Torvalds 	sb->s_flags |= SB_ACTIVE;
254195f1fda4Szhangyi (F) 
254295f1fda4Szhangyi (F) 	/*
254395f1fda4Szhangyi (F) 	 * Turn on quotas which were not enabled for read-only mounts if
254495f1fda4Szhangyi (F) 	 * filesystem has quota feature, so that they are updated correctly.
254595f1fda4Szhangyi (F) 	 */
25461751e8a6SLinus Torvalds 	if (ext4_has_feature_quota(sb) && (s_flags & SB_RDONLY)) {
254795f1fda4Szhangyi (F) 		int ret = ext4_enable_quotas(sb);
254895f1fda4Szhangyi (F) 
254995f1fda4Szhangyi (F) 		if (!ret)
255095f1fda4Szhangyi (F) 			quota_update = 1;
255195f1fda4Szhangyi (F) 		else
255295f1fda4Szhangyi (F) 			ext4_msg(sb, KERN_ERR,
255395f1fda4Szhangyi (F) 				"Cannot turn on quotas: error %d", ret);
255495f1fda4Szhangyi (F) 	}
255595f1fda4Szhangyi (F) 
255695f1fda4Szhangyi (F) 	/* Turn on journaled quotas used for old sytle */
2557a2d4a646SJan Kara 	for (i = 0; i < EXT4_MAXQUOTAS; i++) {
2558617ba13bSMingming Cao 		if (EXT4_SB(sb)->s_qf_names[i]) {
2559617ba13bSMingming Cao 			int ret = ext4_quota_on_mount(sb, i);
256095f1fda4Szhangyi (F) 
256195f1fda4Szhangyi (F) 			if (!ret)
256295f1fda4Szhangyi (F) 				quota_update = 1;
256395f1fda4Szhangyi (F) 			else
2564b31e1552SEric Sandeen 				ext4_msg(sb, KERN_ERR,
2565b31e1552SEric Sandeen 					"Cannot turn on journaled "
256695f1fda4Szhangyi (F) 					"quota: type %d: error %d", i, ret);
2567ac27a0ecSDave Kleikamp 		}
2568ac27a0ecSDave Kleikamp 	}
2569ac27a0ecSDave Kleikamp #endif
2570ac27a0ecSDave Kleikamp 
2571ac27a0ecSDave Kleikamp 	while (es->s_last_orphan) {
2572ac27a0ecSDave Kleikamp 		struct inode *inode;
2573ac27a0ecSDave Kleikamp 
2574c65d5c6cSVegard Nossum 		/*
2575c65d5c6cSVegard Nossum 		 * We may have encountered an error during cleanup; if
2576c65d5c6cSVegard Nossum 		 * so, skip the rest.
2577c65d5c6cSVegard Nossum 		 */
2578c65d5c6cSVegard Nossum 		if (EXT4_SB(sb)->s_mount_state & EXT4_ERROR_FS) {
2579c65d5c6cSVegard Nossum 			jbd_debug(1, "Skipping orphan recovery on fs with errors.\n");
2580c65d5c6cSVegard Nossum 			es->s_last_orphan = 0;
2581c65d5c6cSVegard Nossum 			break;
2582c65d5c6cSVegard Nossum 		}
2583c65d5c6cSVegard Nossum 
258497bd42b9SJosef Bacik 		inode = ext4_orphan_get(sb, le32_to_cpu(es->s_last_orphan));
258597bd42b9SJosef Bacik 		if (IS_ERR(inode)) {
2586ac27a0ecSDave Kleikamp 			es->s_last_orphan = 0;
2587ac27a0ecSDave Kleikamp 			break;
2588ac27a0ecSDave Kleikamp 		}
2589ac27a0ecSDave Kleikamp 
2590617ba13bSMingming Cao 		list_add(&EXT4_I(inode)->i_orphan, &EXT4_SB(sb)->s_orphan);
2591871a2931SChristoph Hellwig 		dquot_initialize(inode);
2592ac27a0ecSDave Kleikamp 		if (inode->i_nlink) {
2593566370a2SPaul Taysom 			if (test_opt(sb, DEBUG))
2594b31e1552SEric Sandeen 				ext4_msg(sb, KERN_DEBUG,
2595b31e1552SEric Sandeen 					"%s: truncating inode %lu to %lld bytes",
259646e665e9SHarvey Harrison 					__func__, inode->i_ino, inode->i_size);
2597e5f8eab8STheodore Ts'o 			jbd_debug(2, "truncating inode %lu to %lld bytes\n",
2598ac27a0ecSDave Kleikamp 				  inode->i_ino, inode->i_size);
25995955102cSAl Viro 			inode_lock(inode);
260055f252c9SLukas Czerner 			truncate_inode_pages(inode->i_mapping, inode->i_size);
26012c98eb5eSTheodore Ts'o 			ret = ext4_truncate(inode);
26022c98eb5eSTheodore Ts'o 			if (ret)
26032c98eb5eSTheodore Ts'o 				ext4_std_error(inode->i_sb, ret);
26045955102cSAl Viro 			inode_unlock(inode);
2605ac27a0ecSDave Kleikamp 			nr_truncates++;
2606ac27a0ecSDave Kleikamp 		} else {
2607566370a2SPaul Taysom 			if (test_opt(sb, DEBUG))
2608b31e1552SEric Sandeen 				ext4_msg(sb, KERN_DEBUG,
2609b31e1552SEric Sandeen 					"%s: deleting unreferenced inode %lu",
261046e665e9SHarvey Harrison 					__func__, inode->i_ino);
2611ac27a0ecSDave Kleikamp 			jbd_debug(2, "deleting unreferenced inode %lu\n",
2612ac27a0ecSDave Kleikamp 				  inode->i_ino);
2613ac27a0ecSDave Kleikamp 			nr_orphans++;
2614ac27a0ecSDave Kleikamp 		}
2615ac27a0ecSDave Kleikamp 		iput(inode);  /* The delete magic happens here! */
2616ac27a0ecSDave Kleikamp 	}
2617ac27a0ecSDave Kleikamp 
2618ac27a0ecSDave Kleikamp #define PLURAL(x) (x), ((x) == 1) ? "" : "s"
2619ac27a0ecSDave Kleikamp 
2620ac27a0ecSDave Kleikamp 	if (nr_orphans)
2621b31e1552SEric Sandeen 		ext4_msg(sb, KERN_INFO, "%d orphan inode%s deleted",
2622b31e1552SEric Sandeen 		       PLURAL(nr_orphans));
2623ac27a0ecSDave Kleikamp 	if (nr_truncates)
2624b31e1552SEric Sandeen 		ext4_msg(sb, KERN_INFO, "%d truncate%s cleaned up",
2625b31e1552SEric Sandeen 		       PLURAL(nr_truncates));
2626ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
262795f1fda4Szhangyi (F) 	/* Turn off quotas if they were enabled for orphan cleanup */
262895f1fda4Szhangyi (F) 	if (quota_update) {
2629a2d4a646SJan Kara 		for (i = 0; i < EXT4_MAXQUOTAS; i++) {
263095f1fda4Szhangyi (F) 			if (sb_dqopt(sb)->files[i])
2631287a8095SChristoph Hellwig 				dquot_quota_off(sb, i);
2632ac27a0ecSDave Kleikamp 		}
263395f1fda4Szhangyi (F) 	}
2634ac27a0ecSDave Kleikamp #endif
26351751e8a6SLinus Torvalds 	sb->s_flags = s_flags; /* Restore SB_RDONLY status */
2636ac27a0ecSDave Kleikamp }
26370b8e58a1SAndreas Dilger 
2638cd2291a4SEric Sandeen /*
2639cd2291a4SEric Sandeen  * Maximal extent format file size.
2640cd2291a4SEric Sandeen  * Resulting logical blkno at s_maxbytes must fit in our on-disk
2641cd2291a4SEric Sandeen  * extent format containers, within a sector_t, and within i_blocks
2642cd2291a4SEric Sandeen  * in the vfs.  ext4 inode has 48 bits of i_block in fsblock units,
2643cd2291a4SEric Sandeen  * so that won't be a limiting factor.
2644cd2291a4SEric Sandeen  *
2645f17722f9SLukas Czerner  * However there is other limiting factor. We do store extents in the form
2646f17722f9SLukas Czerner  * of starting block and length, hence the resulting length of the extent
2647f17722f9SLukas Czerner  * covering maximum file size must fit into on-disk format containers as
2648f17722f9SLukas Czerner  * well. Given that length is always by 1 unit bigger than max unit (because
2649f17722f9SLukas Czerner  * we count 0 as well) we have to lower the s_maxbytes by one fs block.
2650f17722f9SLukas Czerner  *
2651cd2291a4SEric Sandeen  * Note, this does *not* consider any metadata overhead for vfs i_blocks.
2652cd2291a4SEric Sandeen  */
2653f287a1a5STheodore Ts'o static loff_t ext4_max_size(int blkbits, int has_huge_files)
2654cd2291a4SEric Sandeen {
2655cd2291a4SEric Sandeen 	loff_t res;
2656cd2291a4SEric Sandeen 	loff_t upper_limit = MAX_LFS_FILESIZE;
2657cd2291a4SEric Sandeen 
2658cd2291a4SEric Sandeen 	/* small i_blocks in vfs inode? */
2659f287a1a5STheodore Ts'o 	if (!has_huge_files || sizeof(blkcnt_t) < sizeof(u64)) {
2660cd2291a4SEric Sandeen 		/*
266190c699a9SBartlomiej Zolnierkiewicz 		 * CONFIG_LBDAF is not enabled implies the inode
2662cd2291a4SEric Sandeen 		 * i_block represent total blocks in 512 bytes
2663cd2291a4SEric Sandeen 		 * 32 == size of vfs inode i_blocks * 8
2664cd2291a4SEric Sandeen 		 */
2665cd2291a4SEric Sandeen 		upper_limit = (1LL << 32) - 1;
2666cd2291a4SEric Sandeen 
2667cd2291a4SEric Sandeen 		/* total blocks in file system block size */
2668cd2291a4SEric Sandeen 		upper_limit >>= (blkbits - 9);
2669cd2291a4SEric Sandeen 		upper_limit <<= blkbits;
2670cd2291a4SEric Sandeen 	}
2671cd2291a4SEric Sandeen 
2672f17722f9SLukas Czerner 	/*
2673f17722f9SLukas Czerner 	 * 32-bit extent-start container, ee_block. We lower the maxbytes
2674f17722f9SLukas Czerner 	 * by one fs block, so ee_len can cover the extent of maximum file
2675f17722f9SLukas Czerner 	 * size
2676f17722f9SLukas Czerner 	 */
2677f17722f9SLukas Czerner 	res = (1LL << 32) - 1;
2678cd2291a4SEric Sandeen 	res <<= blkbits;
2679cd2291a4SEric Sandeen 
2680cd2291a4SEric Sandeen 	/* Sanity check against vm- & vfs- imposed limits */
2681cd2291a4SEric Sandeen 	if (res > upper_limit)
2682cd2291a4SEric Sandeen 		res = upper_limit;
2683cd2291a4SEric Sandeen 
2684cd2291a4SEric Sandeen 	return res;
2685cd2291a4SEric Sandeen }
2686ac27a0ecSDave Kleikamp 
2687ac27a0ecSDave Kleikamp /*
2688cd2291a4SEric Sandeen  * Maximal bitmap file size.  There is a direct, and {,double-,triple-}indirect
26890fc1b451SAneesh Kumar K.V  * block limit, and also a limit of (2^48 - 1) 512-byte sectors in i_blocks.
26900fc1b451SAneesh Kumar K.V  * We need to be 1 filesystem block less than the 2^48 sector limit.
2691ac27a0ecSDave Kleikamp  */
2692f287a1a5STheodore Ts'o static loff_t ext4_max_bitmap_size(int bits, int has_huge_files)
2693ac27a0ecSDave Kleikamp {
2694617ba13bSMingming Cao 	loff_t res = EXT4_NDIR_BLOCKS;
26950fc1b451SAneesh Kumar K.V 	int meta_blocks;
26960fc1b451SAneesh Kumar K.V 	loff_t upper_limit;
26970b8e58a1SAndreas Dilger 	/* This is calculated to be the largest file size for a dense, block
26980b8e58a1SAndreas Dilger 	 * mapped file such that the file's total number of 512-byte sectors,
26990b8e58a1SAndreas Dilger 	 * including data and all indirect blocks, does not exceed (2^48 - 1).
27000b8e58a1SAndreas Dilger 	 *
27010b8e58a1SAndreas Dilger 	 * __u32 i_blocks_lo and _u16 i_blocks_high represent the total
27020b8e58a1SAndreas Dilger 	 * number of 512-byte sectors of the file.
27030fc1b451SAneesh Kumar K.V 	 */
27040fc1b451SAneesh Kumar K.V 
2705f287a1a5STheodore Ts'o 	if (!has_huge_files || sizeof(blkcnt_t) < sizeof(u64)) {
27060fc1b451SAneesh Kumar K.V 		/*
270790c699a9SBartlomiej Zolnierkiewicz 		 * !has_huge_files or CONFIG_LBDAF not enabled implies that
27080b8e58a1SAndreas Dilger 		 * the inode i_block field represents total file blocks in
27090b8e58a1SAndreas Dilger 		 * 2^32 512-byte sectors == size of vfs inode i_blocks * 8
27100fc1b451SAneesh Kumar K.V 		 */
27110fc1b451SAneesh Kumar K.V 		upper_limit = (1LL << 32) - 1;
27120fc1b451SAneesh Kumar K.V 
27130fc1b451SAneesh Kumar K.V 		/* total blocks in file system block size */
27140fc1b451SAneesh Kumar K.V 		upper_limit >>= (bits - 9);
27150fc1b451SAneesh Kumar K.V 
27160fc1b451SAneesh Kumar K.V 	} else {
27178180a562SAneesh Kumar K.V 		/*
27188180a562SAneesh Kumar K.V 		 * We use 48 bit ext4_inode i_blocks
27198180a562SAneesh Kumar K.V 		 * With EXT4_HUGE_FILE_FL set the i_blocks
27208180a562SAneesh Kumar K.V 		 * represent total number of blocks in
27218180a562SAneesh Kumar K.V 		 * file system block size
27228180a562SAneesh Kumar K.V 		 */
27230fc1b451SAneesh Kumar K.V 		upper_limit = (1LL << 48) - 1;
27240fc1b451SAneesh Kumar K.V 
27250fc1b451SAneesh Kumar K.V 	}
27260fc1b451SAneesh Kumar K.V 
27270fc1b451SAneesh Kumar K.V 	/* indirect blocks */
27280fc1b451SAneesh Kumar K.V 	meta_blocks = 1;
27290fc1b451SAneesh Kumar K.V 	/* double indirect blocks */
27300fc1b451SAneesh Kumar K.V 	meta_blocks += 1 + (1LL << (bits-2));
27310fc1b451SAneesh Kumar K.V 	/* tripple indirect blocks */
27320fc1b451SAneesh Kumar K.V 	meta_blocks += 1 + (1LL << (bits-2)) + (1LL << (2*(bits-2)));
27330fc1b451SAneesh Kumar K.V 
27340fc1b451SAneesh Kumar K.V 	upper_limit -= meta_blocks;
27350fc1b451SAneesh Kumar K.V 	upper_limit <<= bits;
2736ac27a0ecSDave Kleikamp 
2737ac27a0ecSDave Kleikamp 	res += 1LL << (bits-2);
2738ac27a0ecSDave Kleikamp 	res += 1LL << (2*(bits-2));
2739ac27a0ecSDave Kleikamp 	res += 1LL << (3*(bits-2));
2740ac27a0ecSDave Kleikamp 	res <<= bits;
2741ac27a0ecSDave Kleikamp 	if (res > upper_limit)
2742ac27a0ecSDave Kleikamp 		res = upper_limit;
27430fc1b451SAneesh Kumar K.V 
27440fc1b451SAneesh Kumar K.V 	if (res > MAX_LFS_FILESIZE)
27450fc1b451SAneesh Kumar K.V 		res = MAX_LFS_FILESIZE;
27460fc1b451SAneesh Kumar K.V 
2747ac27a0ecSDave Kleikamp 	return res;
2748ac27a0ecSDave Kleikamp }
2749ac27a0ecSDave Kleikamp 
2750617ba13bSMingming Cao static ext4_fsblk_t descriptor_loc(struct super_block *sb,
275170bbb3e0SAndrew Morton 				   ext4_fsblk_t logical_sb_block, int nr)
2752ac27a0ecSDave Kleikamp {
2753617ba13bSMingming Cao 	struct ext4_sb_info *sbi = EXT4_SB(sb);
2754fd2d4291SAvantika Mathur 	ext4_group_t bg, first_meta_bg;
2755ac27a0ecSDave Kleikamp 	int has_super = 0;
2756ac27a0ecSDave Kleikamp 
2757ac27a0ecSDave Kleikamp 	first_meta_bg = le32_to_cpu(sbi->s_es->s_first_meta_bg);
2758ac27a0ecSDave Kleikamp 
2759e2b911c5SDarrick J. Wong 	if (!ext4_has_feature_meta_bg(sb) || nr < first_meta_bg)
276070bbb3e0SAndrew Morton 		return logical_sb_block + nr + 1;
2761ac27a0ecSDave Kleikamp 	bg = sbi->s_desc_per_block * nr;
2762617ba13bSMingming Cao 	if (ext4_bg_has_super(sb, bg))
2763ac27a0ecSDave Kleikamp 		has_super = 1;
27640b8e58a1SAndreas Dilger 
2765bd63f6b0SDarrick J. Wong 	/*
2766bd63f6b0SDarrick J. Wong 	 * If we have a meta_bg fs with 1k blocks, group 0's GDT is at
2767bd63f6b0SDarrick J. Wong 	 * block 2, not 1.  If s_first_data_block == 0 (bigalloc is enabled
2768bd63f6b0SDarrick J. Wong 	 * on modern mke2fs or blksize > 1k on older mke2fs) then we must
2769bd63f6b0SDarrick J. Wong 	 * compensate.
2770bd63f6b0SDarrick J. Wong 	 */
2771bd63f6b0SDarrick J. Wong 	if (sb->s_blocksize == 1024 && nr == 0 &&
277249598e04SJun Piao 	    le32_to_cpu(sbi->s_es->s_first_data_block) == 0)
2773bd63f6b0SDarrick J. Wong 		has_super++;
2774bd63f6b0SDarrick J. Wong 
2775617ba13bSMingming Cao 	return (has_super + ext4_group_first_block_no(sb, bg));
2776ac27a0ecSDave Kleikamp }
2777ac27a0ecSDave Kleikamp 
2778c9de560dSAlex Tomas /**
2779c9de560dSAlex Tomas  * ext4_get_stripe_size: Get the stripe size.
2780c9de560dSAlex Tomas  * @sbi: In memory super block info
2781c9de560dSAlex Tomas  *
2782c9de560dSAlex Tomas  * If we have specified it via mount option, then
2783c9de560dSAlex Tomas  * use the mount option value. If the value specified at mount time is
2784c9de560dSAlex Tomas  * greater than the blocks per group use the super block value.
2785c9de560dSAlex Tomas  * If the super block value is greater than blocks per group return 0.
2786c9de560dSAlex Tomas  * Allocator needs it be less than blocks per group.
2787c9de560dSAlex Tomas  *
2788c9de560dSAlex Tomas  */
2789c9de560dSAlex Tomas static unsigned long ext4_get_stripe_size(struct ext4_sb_info *sbi)
2790c9de560dSAlex Tomas {
2791c9de560dSAlex Tomas 	unsigned long stride = le16_to_cpu(sbi->s_es->s_raid_stride);
2792c9de560dSAlex Tomas 	unsigned long stripe_width =
2793c9de560dSAlex Tomas 			le32_to_cpu(sbi->s_es->s_raid_stripe_width);
27943eb08658SDan Ehrenberg 	int ret;
2795c9de560dSAlex Tomas 
2796c9de560dSAlex Tomas 	if (sbi->s_stripe && sbi->s_stripe <= sbi->s_blocks_per_group)
27973eb08658SDan Ehrenberg 		ret = sbi->s_stripe;
27985469d7c3SJan Kara 	else if (stripe_width && stripe_width <= sbi->s_blocks_per_group)
27993eb08658SDan Ehrenberg 		ret = stripe_width;
28005469d7c3SJan Kara 	else if (stride && stride <= sbi->s_blocks_per_group)
28013eb08658SDan Ehrenberg 		ret = stride;
28023eb08658SDan Ehrenberg 	else
28033eb08658SDan Ehrenberg 		ret = 0;
2804c9de560dSAlex Tomas 
28053eb08658SDan Ehrenberg 	/*
28063eb08658SDan Ehrenberg 	 * If the stripe width is 1, this makes no sense and
28073eb08658SDan Ehrenberg 	 * we set it to 0 to turn off stripe handling code.
28083eb08658SDan Ehrenberg 	 */
28093eb08658SDan Ehrenberg 	if (ret <= 1)
28103eb08658SDan Ehrenberg 		ret = 0;
2811c9de560dSAlex Tomas 
28123eb08658SDan Ehrenberg 	return ret;
2813c9de560dSAlex Tomas }
2814ac27a0ecSDave Kleikamp 
2815a13fb1a4SEric Sandeen /*
2816a13fb1a4SEric Sandeen  * Check whether this filesystem can be mounted based on
2817a13fb1a4SEric Sandeen  * the features present and the RDONLY/RDWR mount requested.
2818a13fb1a4SEric Sandeen  * Returns 1 if this filesystem can be mounted as requested,
2819a13fb1a4SEric Sandeen  * 0 if it cannot be.
2820a13fb1a4SEric Sandeen  */
2821a13fb1a4SEric Sandeen static int ext4_feature_set_ok(struct super_block *sb, int readonly)
2822a13fb1a4SEric Sandeen {
2823e2b911c5SDarrick J. Wong 	if (ext4_has_unknown_ext4_incompat_features(sb)) {
2824a13fb1a4SEric Sandeen 		ext4_msg(sb, KERN_ERR,
2825a13fb1a4SEric Sandeen 			"Couldn't mount because of "
2826a13fb1a4SEric Sandeen 			"unsupported optional features (%x)",
2827a13fb1a4SEric Sandeen 			(le32_to_cpu(EXT4_SB(sb)->s_es->s_feature_incompat) &
2828a13fb1a4SEric Sandeen 			~EXT4_FEATURE_INCOMPAT_SUPP));
2829a13fb1a4SEric Sandeen 		return 0;
2830a13fb1a4SEric Sandeen 	}
2831a13fb1a4SEric Sandeen 
2832a13fb1a4SEric Sandeen 	if (readonly)
2833a13fb1a4SEric Sandeen 		return 1;
2834a13fb1a4SEric Sandeen 
2835e2b911c5SDarrick J. Wong 	if (ext4_has_feature_readonly(sb)) {
28362cb5cc8bSDarrick J. Wong 		ext4_msg(sb, KERN_INFO, "filesystem is read-only");
28371751e8a6SLinus Torvalds 		sb->s_flags |= SB_RDONLY;
28382cb5cc8bSDarrick J. Wong 		return 1;
28392cb5cc8bSDarrick J. Wong 	}
28402cb5cc8bSDarrick J. Wong 
2841a13fb1a4SEric Sandeen 	/* Check that feature set is OK for a read-write mount */
2842e2b911c5SDarrick J. Wong 	if (ext4_has_unknown_ext4_ro_compat_features(sb)) {
2843a13fb1a4SEric Sandeen 		ext4_msg(sb, KERN_ERR, "couldn't mount RDWR because of "
2844a13fb1a4SEric Sandeen 			 "unsupported optional features (%x)",
2845a13fb1a4SEric Sandeen 			 (le32_to_cpu(EXT4_SB(sb)->s_es->s_feature_ro_compat) &
2846a13fb1a4SEric Sandeen 				~EXT4_FEATURE_RO_COMPAT_SUPP));
2847a13fb1a4SEric Sandeen 		return 0;
2848a13fb1a4SEric Sandeen 	}
2849a13fb1a4SEric Sandeen 	/*
2850a13fb1a4SEric Sandeen 	 * Large file size enabled file system can only be mounted
2851a13fb1a4SEric Sandeen 	 * read-write on 32-bit systems if kernel is built with CONFIG_LBDAF
2852a13fb1a4SEric Sandeen 	 */
2853e2b911c5SDarrick J. Wong 	if (ext4_has_feature_huge_file(sb)) {
2854a13fb1a4SEric Sandeen 		if (sizeof(blkcnt_t) < sizeof(u64)) {
2855a13fb1a4SEric Sandeen 			ext4_msg(sb, KERN_ERR, "Filesystem with huge files "
2856a13fb1a4SEric Sandeen 				 "cannot be mounted RDWR without "
2857a13fb1a4SEric Sandeen 				 "CONFIG_LBDAF");
2858a13fb1a4SEric Sandeen 			return 0;
2859a13fb1a4SEric Sandeen 		}
2860a13fb1a4SEric Sandeen 	}
2861e2b911c5SDarrick J. Wong 	if (ext4_has_feature_bigalloc(sb) && !ext4_has_feature_extents(sb)) {
2862bab08ab9STheodore Ts'o 		ext4_msg(sb, KERN_ERR,
2863bab08ab9STheodore Ts'o 			 "Can't support bigalloc feature without "
2864bab08ab9STheodore Ts'o 			 "extents feature\n");
2865bab08ab9STheodore Ts'o 		return 0;
2866bab08ab9STheodore Ts'o 	}
28677c319d32SAditya Kali 
28687c319d32SAditya Kali #ifndef CONFIG_QUOTA
2869e2b911c5SDarrick J. Wong 	if (ext4_has_feature_quota(sb) && !readonly) {
28707c319d32SAditya Kali 		ext4_msg(sb, KERN_ERR,
28717c319d32SAditya Kali 			 "Filesystem with quota feature cannot be mounted RDWR "
28727c319d32SAditya Kali 			 "without CONFIG_QUOTA");
28737c319d32SAditya Kali 		return 0;
28747c319d32SAditya Kali 	}
2875689c958cSLi Xi 	if (ext4_has_feature_project(sb) && !readonly) {
2876689c958cSLi Xi 		ext4_msg(sb, KERN_ERR,
2877689c958cSLi Xi 			 "Filesystem with project quota feature cannot be mounted RDWR "
2878689c958cSLi Xi 			 "without CONFIG_QUOTA");
2879689c958cSLi Xi 		return 0;
2880689c958cSLi Xi 	}
28817c319d32SAditya Kali #endif  /* CONFIG_QUOTA */
2882a13fb1a4SEric Sandeen 	return 1;
2883a13fb1a4SEric Sandeen }
2884a13fb1a4SEric Sandeen 
288566e61a9eSTheodore Ts'o /*
288666e61a9eSTheodore Ts'o  * This function is called once a day if we have errors logged
288766e61a9eSTheodore Ts'o  * on the file system
288866e61a9eSTheodore Ts'o  */
2889235699a8SKees Cook static void print_daily_error_info(struct timer_list *t)
289066e61a9eSTheodore Ts'o {
2891235699a8SKees Cook 	struct ext4_sb_info *sbi = from_timer(sbi, t, s_err_report);
2892235699a8SKees Cook 	struct super_block *sb = sbi->s_sb;
2893235699a8SKees Cook 	struct ext4_super_block *es = sbi->s_es;
289466e61a9eSTheodore Ts'o 
289566e61a9eSTheodore Ts'o 	if (es->s_error_count)
2896ae0f78deSTheodore Ts'o 		/* fsck newer than v1.41.13 is needed to clean this condition. */
2897ae0f78deSTheodore Ts'o 		ext4_msg(sb, KERN_NOTICE, "error count since last fsck: %u",
289866e61a9eSTheodore Ts'o 			 le32_to_cpu(es->s_error_count));
289966e61a9eSTheodore Ts'o 	if (es->s_first_error_time) {
29006a0678a7SArnd Bergmann 		printk(KERN_NOTICE "EXT4-fs (%s): initial error at time %llu: %.*s:%d",
29016a0678a7SArnd Bergmann 		       sb->s_id,
29026a0678a7SArnd Bergmann 		       ext4_get_tstamp(es, s_first_error_time),
290366e61a9eSTheodore Ts'o 		       (int) sizeof(es->s_first_error_func),
290466e61a9eSTheodore Ts'o 		       es->s_first_error_func,
290566e61a9eSTheodore Ts'o 		       le32_to_cpu(es->s_first_error_line));
290666e61a9eSTheodore Ts'o 		if (es->s_first_error_ino)
2907651e1c3bSJoe Perches 			printk(KERN_CONT ": inode %u",
290866e61a9eSTheodore Ts'o 			       le32_to_cpu(es->s_first_error_ino));
290966e61a9eSTheodore Ts'o 		if (es->s_first_error_block)
2910651e1c3bSJoe Perches 			printk(KERN_CONT ": block %llu", (unsigned long long)
291166e61a9eSTheodore Ts'o 			       le64_to_cpu(es->s_first_error_block));
2912651e1c3bSJoe Perches 		printk(KERN_CONT "\n");
291366e61a9eSTheodore Ts'o 	}
291466e61a9eSTheodore Ts'o 	if (es->s_last_error_time) {
29156a0678a7SArnd Bergmann 		printk(KERN_NOTICE "EXT4-fs (%s): last error at time %llu: %.*s:%d",
29166a0678a7SArnd Bergmann 		       sb->s_id,
29176a0678a7SArnd Bergmann 		       ext4_get_tstamp(es, s_last_error_time),
291866e61a9eSTheodore Ts'o 		       (int) sizeof(es->s_last_error_func),
291966e61a9eSTheodore Ts'o 		       es->s_last_error_func,
292066e61a9eSTheodore Ts'o 		       le32_to_cpu(es->s_last_error_line));
292166e61a9eSTheodore Ts'o 		if (es->s_last_error_ino)
2922651e1c3bSJoe Perches 			printk(KERN_CONT ": inode %u",
292366e61a9eSTheodore Ts'o 			       le32_to_cpu(es->s_last_error_ino));
292466e61a9eSTheodore Ts'o 		if (es->s_last_error_block)
2925651e1c3bSJoe Perches 			printk(KERN_CONT ": block %llu", (unsigned long long)
292666e61a9eSTheodore Ts'o 			       le64_to_cpu(es->s_last_error_block));
2927651e1c3bSJoe Perches 		printk(KERN_CONT "\n");
292866e61a9eSTheodore Ts'o 	}
292966e61a9eSTheodore Ts'o 	mod_timer(&sbi->s_err_report, jiffies + 24*60*60*HZ);  /* Once a day */
293066e61a9eSTheodore Ts'o }
293166e61a9eSTheodore Ts'o 
2932bfff6873SLukas Czerner /* Find next suitable group and run ext4_init_inode_table */
2933bfff6873SLukas Czerner static int ext4_run_li_request(struct ext4_li_request *elr)
2934bfff6873SLukas Czerner {
2935bfff6873SLukas Czerner 	struct ext4_group_desc *gdp = NULL;
2936bfff6873SLukas Czerner 	ext4_group_t group, ngroups;
2937bfff6873SLukas Czerner 	struct super_block *sb;
2938bfff6873SLukas Czerner 	unsigned long timeout = 0;
2939bfff6873SLukas Czerner 	int ret = 0;
2940bfff6873SLukas Czerner 
2941bfff6873SLukas Czerner 	sb = elr->lr_super;
2942bfff6873SLukas Czerner 	ngroups = EXT4_SB(sb)->s_groups_count;
2943bfff6873SLukas Czerner 
2944bfff6873SLukas Czerner 	for (group = elr->lr_next_group; group < ngroups; group++) {
2945bfff6873SLukas Czerner 		gdp = ext4_get_group_desc(sb, group, NULL);
2946bfff6873SLukas Czerner 		if (!gdp) {
2947bfff6873SLukas Czerner 			ret = 1;
2948bfff6873SLukas Czerner 			break;
2949bfff6873SLukas Czerner 		}
2950bfff6873SLukas Czerner 
2951bfff6873SLukas Czerner 		if (!(gdp->bg_flags & cpu_to_le16(EXT4_BG_INODE_ZEROED)))
2952bfff6873SLukas Czerner 			break;
2953bfff6873SLukas Czerner 	}
2954bfff6873SLukas Czerner 
29557f511862STheodore Ts'o 	if (group >= ngroups)
2956bfff6873SLukas Czerner 		ret = 1;
2957bfff6873SLukas Czerner 
2958bfff6873SLukas Czerner 	if (!ret) {
2959bfff6873SLukas Czerner 		timeout = jiffies;
2960bfff6873SLukas Czerner 		ret = ext4_init_inode_table(sb, group,
2961bfff6873SLukas Czerner 					    elr->lr_timeout ? 0 : 1);
2962bfff6873SLukas Czerner 		if (elr->lr_timeout == 0) {
296351ce6511SLukas Czerner 			timeout = (jiffies - timeout) *
296451ce6511SLukas Czerner 				  elr->lr_sbi->s_li_wait_mult;
2965bfff6873SLukas Czerner 			elr->lr_timeout = timeout;
2966bfff6873SLukas Czerner 		}
2967bfff6873SLukas Czerner 		elr->lr_next_sched = jiffies + elr->lr_timeout;
2968bfff6873SLukas Czerner 		elr->lr_next_group = group + 1;
2969bfff6873SLukas Czerner 	}
2970bfff6873SLukas Czerner 	return ret;
2971bfff6873SLukas Czerner }
2972bfff6873SLukas Czerner 
2973bfff6873SLukas Czerner /*
2974bfff6873SLukas Czerner  * Remove lr_request from the list_request and free the
29754ed5c033SLukas Czerner  * request structure. Should be called with li_list_mtx held
2976bfff6873SLukas Czerner  */
2977bfff6873SLukas Czerner static void ext4_remove_li_request(struct ext4_li_request *elr)
2978bfff6873SLukas Czerner {
2979bfff6873SLukas Czerner 	struct ext4_sb_info *sbi;
2980bfff6873SLukas Czerner 
2981bfff6873SLukas Czerner 	if (!elr)
2982bfff6873SLukas Czerner 		return;
2983bfff6873SLukas Czerner 
2984bfff6873SLukas Czerner 	sbi = elr->lr_sbi;
2985bfff6873SLukas Czerner 
2986bfff6873SLukas Czerner 	list_del(&elr->lr_request);
2987bfff6873SLukas Czerner 	sbi->s_li_request = NULL;
2988bfff6873SLukas Czerner 	kfree(elr);
2989bfff6873SLukas Czerner }
2990bfff6873SLukas Czerner 
2991bfff6873SLukas Czerner static void ext4_unregister_li_request(struct super_block *sb)
2992bfff6873SLukas Czerner {
29931bb933fbSLukas Czerner 	mutex_lock(&ext4_li_mtx);
29941bb933fbSLukas Czerner 	if (!ext4_li_info) {
29951bb933fbSLukas Czerner 		mutex_unlock(&ext4_li_mtx);
2996bfff6873SLukas Czerner 		return;
29971bb933fbSLukas Czerner 	}
2998bfff6873SLukas Czerner 
2999bfff6873SLukas Czerner 	mutex_lock(&ext4_li_info->li_list_mtx);
30001bb933fbSLukas Czerner 	ext4_remove_li_request(EXT4_SB(sb)->s_li_request);
3001bfff6873SLukas Czerner 	mutex_unlock(&ext4_li_info->li_list_mtx);
30021bb933fbSLukas Czerner 	mutex_unlock(&ext4_li_mtx);
3003bfff6873SLukas Czerner }
3004bfff6873SLukas Czerner 
30058f1f7453SEric Sandeen static struct task_struct *ext4_lazyinit_task;
30068f1f7453SEric Sandeen 
3007bfff6873SLukas Czerner /*
3008bfff6873SLukas Czerner  * This is the function where ext4lazyinit thread lives. It walks
3009bfff6873SLukas Czerner  * through the request list searching for next scheduled filesystem.
3010bfff6873SLukas Czerner  * When such a fs is found, run the lazy initialization request
3011bfff6873SLukas Czerner  * (ext4_rn_li_request) and keep track of the time spend in this
3012bfff6873SLukas Czerner  * function. Based on that time we compute next schedule time of
3013bfff6873SLukas Czerner  * the request. When walking through the list is complete, compute
3014bfff6873SLukas Czerner  * next waking time and put itself into sleep.
3015bfff6873SLukas Czerner  */
3016bfff6873SLukas Czerner static int ext4_lazyinit_thread(void *arg)
3017bfff6873SLukas Czerner {
3018bfff6873SLukas Czerner 	struct ext4_lazy_init *eli = (struct ext4_lazy_init *)arg;
3019bfff6873SLukas Czerner 	struct list_head *pos, *n;
3020bfff6873SLukas Czerner 	struct ext4_li_request *elr;
30214ed5c033SLukas Czerner 	unsigned long next_wakeup, cur;
3022bfff6873SLukas Czerner 
3023bfff6873SLukas Czerner 	BUG_ON(NULL == eli);
3024bfff6873SLukas Czerner 
3025bfff6873SLukas Czerner cont_thread:
3026bfff6873SLukas Czerner 	while (true) {
3027bfff6873SLukas Czerner 		next_wakeup = MAX_JIFFY_OFFSET;
3028bfff6873SLukas Czerner 
3029bfff6873SLukas Czerner 		mutex_lock(&eli->li_list_mtx);
3030bfff6873SLukas Czerner 		if (list_empty(&eli->li_request_list)) {
3031bfff6873SLukas Czerner 			mutex_unlock(&eli->li_list_mtx);
3032bfff6873SLukas Czerner 			goto exit_thread;
3033bfff6873SLukas Czerner 		}
3034bfff6873SLukas Czerner 		list_for_each_safe(pos, n, &eli->li_request_list) {
3035e22834f0SDmitry Monakhov 			int err = 0;
3036e22834f0SDmitry Monakhov 			int progress = 0;
3037bfff6873SLukas Czerner 			elr = list_entry(pos, struct ext4_li_request,
3038bfff6873SLukas Czerner 					 lr_request);
3039bfff6873SLukas Czerner 
3040e22834f0SDmitry Monakhov 			if (time_before(jiffies, elr->lr_next_sched)) {
3041e22834f0SDmitry Monakhov 				if (time_before(elr->lr_next_sched, next_wakeup))
3042e22834f0SDmitry Monakhov 					next_wakeup = elr->lr_next_sched;
3043e22834f0SDmitry Monakhov 				continue;
3044e22834f0SDmitry Monakhov 			}
3045e22834f0SDmitry Monakhov 			if (down_read_trylock(&elr->lr_super->s_umount)) {
3046e22834f0SDmitry Monakhov 				if (sb_start_write_trylock(elr->lr_super)) {
3047e22834f0SDmitry Monakhov 					progress = 1;
3048e22834f0SDmitry Monakhov 					/*
3049e22834f0SDmitry Monakhov 					 * We hold sb->s_umount, sb can not
3050e22834f0SDmitry Monakhov 					 * be removed from the list, it is
3051e22834f0SDmitry Monakhov 					 * now safe to drop li_list_mtx
3052e22834f0SDmitry Monakhov 					 */
3053e22834f0SDmitry Monakhov 					mutex_unlock(&eli->li_list_mtx);
3054e22834f0SDmitry Monakhov 					err = ext4_run_li_request(elr);
3055e22834f0SDmitry Monakhov 					sb_end_write(elr->lr_super);
3056e22834f0SDmitry Monakhov 					mutex_lock(&eli->li_list_mtx);
3057e22834f0SDmitry Monakhov 					n = pos->next;
3058e22834f0SDmitry Monakhov 				}
3059e22834f0SDmitry Monakhov 				up_read((&elr->lr_super->s_umount));
3060e22834f0SDmitry Monakhov 			}
3061b2c78cd0STheodore Ts'o 			/* error, remove the lazy_init job */
3062e22834f0SDmitry Monakhov 			if (err) {
3063bfff6873SLukas Czerner 				ext4_remove_li_request(elr);
3064bfff6873SLukas Czerner 				continue;
3065bfff6873SLukas Czerner 			}
3066e22834f0SDmitry Monakhov 			if (!progress) {
3067e22834f0SDmitry Monakhov 				elr->lr_next_sched = jiffies +
3068e22834f0SDmitry Monakhov 					(prandom_u32()
3069e22834f0SDmitry Monakhov 					 % (EXT4_DEF_LI_MAX_START_DELAY * HZ));
3070b2c78cd0STheodore Ts'o 			}
3071bfff6873SLukas Czerner 			if (time_before(elr->lr_next_sched, next_wakeup))
3072bfff6873SLukas Czerner 				next_wakeup = elr->lr_next_sched;
3073bfff6873SLukas Czerner 		}
3074bfff6873SLukas Czerner 		mutex_unlock(&eli->li_list_mtx);
3075bfff6873SLukas Czerner 
3076a0acae0eSTejun Heo 		try_to_freeze();
3077bfff6873SLukas Czerner 
30784ed5c033SLukas Czerner 		cur = jiffies;
30794ed5c033SLukas Czerner 		if ((time_after_eq(cur, next_wakeup)) ||
3080f4245bd4SLukas Czerner 		    (MAX_JIFFY_OFFSET == next_wakeup)) {
3081bfff6873SLukas Czerner 			cond_resched();
3082bfff6873SLukas Czerner 			continue;
3083bfff6873SLukas Czerner 		}
3084bfff6873SLukas Czerner 
30854ed5c033SLukas Czerner 		schedule_timeout_interruptible(next_wakeup - cur);
30864ed5c033SLukas Czerner 
30878f1f7453SEric Sandeen 		if (kthread_should_stop()) {
30888f1f7453SEric Sandeen 			ext4_clear_request_list();
30898f1f7453SEric Sandeen 			goto exit_thread;
30908f1f7453SEric Sandeen 		}
3091bfff6873SLukas Czerner 	}
3092bfff6873SLukas Czerner 
3093bfff6873SLukas Czerner exit_thread:
3094bfff6873SLukas Czerner 	/*
3095bfff6873SLukas Czerner 	 * It looks like the request list is empty, but we need
3096bfff6873SLukas Czerner 	 * to check it under the li_list_mtx lock, to prevent any
3097bfff6873SLukas Czerner 	 * additions into it, and of course we should lock ext4_li_mtx
3098bfff6873SLukas Czerner 	 * to atomically free the list and ext4_li_info, because at
3099bfff6873SLukas Czerner 	 * this point another ext4 filesystem could be registering
3100bfff6873SLukas Czerner 	 * new one.
3101bfff6873SLukas Czerner 	 */
3102bfff6873SLukas Czerner 	mutex_lock(&ext4_li_mtx);
3103bfff6873SLukas Czerner 	mutex_lock(&eli->li_list_mtx);
3104bfff6873SLukas Czerner 	if (!list_empty(&eli->li_request_list)) {
3105bfff6873SLukas Czerner 		mutex_unlock(&eli->li_list_mtx);
3106bfff6873SLukas Czerner 		mutex_unlock(&ext4_li_mtx);
3107bfff6873SLukas Czerner 		goto cont_thread;
3108bfff6873SLukas Czerner 	}
3109bfff6873SLukas Czerner 	mutex_unlock(&eli->li_list_mtx);
3110bfff6873SLukas Czerner 	kfree(ext4_li_info);
3111bfff6873SLukas Czerner 	ext4_li_info = NULL;
3112bfff6873SLukas Czerner 	mutex_unlock(&ext4_li_mtx);
3113bfff6873SLukas Czerner 
3114bfff6873SLukas Czerner 	return 0;
3115bfff6873SLukas Czerner }
3116bfff6873SLukas Czerner 
3117bfff6873SLukas Czerner static void ext4_clear_request_list(void)
3118bfff6873SLukas Czerner {
3119bfff6873SLukas Czerner 	struct list_head *pos, *n;
3120bfff6873SLukas Czerner 	struct ext4_li_request *elr;
3121bfff6873SLukas Czerner 
3122bfff6873SLukas Czerner 	mutex_lock(&ext4_li_info->li_list_mtx);
3123bfff6873SLukas Czerner 	list_for_each_safe(pos, n, &ext4_li_info->li_request_list) {
3124bfff6873SLukas Czerner 		elr = list_entry(pos, struct ext4_li_request,
3125bfff6873SLukas Czerner 				 lr_request);
3126bfff6873SLukas Czerner 		ext4_remove_li_request(elr);
3127bfff6873SLukas Czerner 	}
3128bfff6873SLukas Czerner 	mutex_unlock(&ext4_li_info->li_list_mtx);
3129bfff6873SLukas Czerner }
3130bfff6873SLukas Czerner 
3131bfff6873SLukas Czerner static int ext4_run_lazyinit_thread(void)
3132bfff6873SLukas Czerner {
31338f1f7453SEric Sandeen 	ext4_lazyinit_task = kthread_run(ext4_lazyinit_thread,
31348f1f7453SEric Sandeen 					 ext4_li_info, "ext4lazyinit");
31358f1f7453SEric Sandeen 	if (IS_ERR(ext4_lazyinit_task)) {
31368f1f7453SEric Sandeen 		int err = PTR_ERR(ext4_lazyinit_task);
3137bfff6873SLukas Czerner 		ext4_clear_request_list();
3138bfff6873SLukas Czerner 		kfree(ext4_li_info);
3139bfff6873SLukas Czerner 		ext4_li_info = NULL;
314092b97816STheodore Ts'o 		printk(KERN_CRIT "EXT4-fs: error %d creating inode table "
3141bfff6873SLukas Czerner 				 "initialization thread\n",
3142bfff6873SLukas Czerner 				 err);
3143bfff6873SLukas Czerner 		return err;
3144bfff6873SLukas Czerner 	}
3145bfff6873SLukas Czerner 	ext4_li_info->li_state |= EXT4_LAZYINIT_RUNNING;
3146bfff6873SLukas Czerner 	return 0;
3147bfff6873SLukas Czerner }
3148bfff6873SLukas Czerner 
3149bfff6873SLukas Czerner /*
3150bfff6873SLukas Czerner  * Check whether it make sense to run itable init. thread or not.
3151bfff6873SLukas Czerner  * If there is at least one uninitialized inode table, return
3152bfff6873SLukas Czerner  * corresponding group number, else the loop goes through all
3153bfff6873SLukas Czerner  * groups and return total number of groups.
3154bfff6873SLukas Czerner  */
3155bfff6873SLukas Czerner static ext4_group_t ext4_has_uninit_itable(struct super_block *sb)
3156bfff6873SLukas Czerner {
3157bfff6873SLukas Czerner 	ext4_group_t group, ngroups = EXT4_SB(sb)->s_groups_count;
3158bfff6873SLukas Czerner 	struct ext4_group_desc *gdp = NULL;
3159bfff6873SLukas Czerner 
31608844618dSTheodore Ts'o 	if (!ext4_has_group_desc_csum(sb))
31618844618dSTheodore Ts'o 		return ngroups;
31628844618dSTheodore Ts'o 
3163bfff6873SLukas Czerner 	for (group = 0; group < ngroups; group++) {
3164bfff6873SLukas Czerner 		gdp = ext4_get_group_desc(sb, group, NULL);
3165bfff6873SLukas Czerner 		if (!gdp)
3166bfff6873SLukas Czerner 			continue;
3167bfff6873SLukas Czerner 
316850122847STheodore Ts'o 		if (!(gdp->bg_flags & cpu_to_le16(EXT4_BG_INODE_ZEROED)))
3169bfff6873SLukas Czerner 			break;
3170bfff6873SLukas Czerner 	}
3171bfff6873SLukas Czerner 
3172bfff6873SLukas Czerner 	return group;
3173bfff6873SLukas Czerner }
3174bfff6873SLukas Czerner 
3175bfff6873SLukas Czerner static int ext4_li_info_new(void)
3176bfff6873SLukas Czerner {
3177bfff6873SLukas Czerner 	struct ext4_lazy_init *eli = NULL;
3178bfff6873SLukas Czerner 
3179bfff6873SLukas Czerner 	eli = kzalloc(sizeof(*eli), GFP_KERNEL);
3180bfff6873SLukas Czerner 	if (!eli)
3181bfff6873SLukas Czerner 		return -ENOMEM;
3182bfff6873SLukas Czerner 
3183bfff6873SLukas Czerner 	INIT_LIST_HEAD(&eli->li_request_list);
3184bfff6873SLukas Czerner 	mutex_init(&eli->li_list_mtx);
3185bfff6873SLukas Czerner 
3186bfff6873SLukas Czerner 	eli->li_state |= EXT4_LAZYINIT_QUIT;
3187bfff6873SLukas Czerner 
3188bfff6873SLukas Czerner 	ext4_li_info = eli;
3189bfff6873SLukas Czerner 
3190bfff6873SLukas Czerner 	return 0;
3191bfff6873SLukas Czerner }
3192bfff6873SLukas Czerner 
3193bfff6873SLukas Czerner static struct ext4_li_request *ext4_li_request_new(struct super_block *sb,
3194bfff6873SLukas Czerner 					    ext4_group_t start)
3195bfff6873SLukas Czerner {
3196bfff6873SLukas Czerner 	struct ext4_sb_info *sbi = EXT4_SB(sb);
3197bfff6873SLukas Czerner 	struct ext4_li_request *elr;
3198bfff6873SLukas Czerner 
3199bfff6873SLukas Czerner 	elr = kzalloc(sizeof(*elr), GFP_KERNEL);
3200bfff6873SLukas Czerner 	if (!elr)
3201bfff6873SLukas Czerner 		return NULL;
3202bfff6873SLukas Czerner 
3203bfff6873SLukas Czerner 	elr->lr_super = sb;
3204bfff6873SLukas Czerner 	elr->lr_sbi = sbi;
3205bfff6873SLukas Czerner 	elr->lr_next_group = start;
3206bfff6873SLukas Czerner 
3207bfff6873SLukas Czerner 	/*
3208bfff6873SLukas Czerner 	 * Randomize first schedule time of the request to
3209bfff6873SLukas Czerner 	 * spread the inode table initialization requests
3210bfff6873SLukas Czerner 	 * better.
3211bfff6873SLukas Czerner 	 */
3212dd1f723bSTheodore Ts'o 	elr->lr_next_sched = jiffies + (prandom_u32() %
3213dd1f723bSTheodore Ts'o 				(EXT4_DEF_LI_MAX_START_DELAY * HZ));
3214bfff6873SLukas Czerner 	return elr;
3215bfff6873SLukas Czerner }
3216bfff6873SLukas Czerner 
32177f511862STheodore Ts'o int ext4_register_li_request(struct super_block *sb,
3218bfff6873SLukas Czerner 			     ext4_group_t first_not_zeroed)
3219bfff6873SLukas Czerner {
3220bfff6873SLukas Czerner 	struct ext4_sb_info *sbi = EXT4_SB(sb);
32217f511862STheodore Ts'o 	struct ext4_li_request *elr = NULL;
322249598e04SJun Piao 	ext4_group_t ngroups = sbi->s_groups_count;
32236c5a6cb9SAndrew Morton 	int ret = 0;
3224bfff6873SLukas Czerner 
32257f511862STheodore Ts'o 	mutex_lock(&ext4_li_mtx);
322651ce6511SLukas Czerner 	if (sbi->s_li_request != NULL) {
322751ce6511SLukas Czerner 		/*
322851ce6511SLukas Czerner 		 * Reset timeout so it can be computed again, because
322951ce6511SLukas Czerner 		 * s_li_wait_mult might have changed.
323051ce6511SLukas Czerner 		 */
323151ce6511SLukas Czerner 		sbi->s_li_request->lr_timeout = 0;
32327f511862STheodore Ts'o 		goto out;
323351ce6511SLukas Czerner 	}
3234bfff6873SLukas Czerner 
3235bc98a42cSDavid Howells 	if (first_not_zeroed == ngroups || sb_rdonly(sb) ||
323655ff3840STao Ma 	    !test_opt(sb, INIT_INODE_TABLE))
32377f511862STheodore Ts'o 		goto out;
3238bfff6873SLukas Czerner 
3239bfff6873SLukas Czerner 	elr = ext4_li_request_new(sb, first_not_zeroed);
32407f511862STheodore Ts'o 	if (!elr) {
32417f511862STheodore Ts'o 		ret = -ENOMEM;
32427f511862STheodore Ts'o 		goto out;
32437f511862STheodore Ts'o 	}
3244bfff6873SLukas Czerner 
3245bfff6873SLukas Czerner 	if (NULL == ext4_li_info) {
3246bfff6873SLukas Czerner 		ret = ext4_li_info_new();
3247bfff6873SLukas Czerner 		if (ret)
3248bfff6873SLukas Czerner 			goto out;
3249bfff6873SLukas Czerner 	}
3250bfff6873SLukas Czerner 
3251bfff6873SLukas Czerner 	mutex_lock(&ext4_li_info->li_list_mtx);
3252bfff6873SLukas Czerner 	list_add(&elr->lr_request, &ext4_li_info->li_request_list);
3253bfff6873SLukas Czerner 	mutex_unlock(&ext4_li_info->li_list_mtx);
3254bfff6873SLukas Czerner 
3255bfff6873SLukas Czerner 	sbi->s_li_request = elr;
325646e4690bSTao Ma 	/*
325746e4690bSTao Ma 	 * set elr to NULL here since it has been inserted to
325846e4690bSTao Ma 	 * the request_list and the removal and free of it is
325946e4690bSTao Ma 	 * handled by ext4_clear_request_list from now on.
326046e4690bSTao Ma 	 */
326146e4690bSTao Ma 	elr = NULL;
3262bfff6873SLukas Czerner 
3263bfff6873SLukas Czerner 	if (!(ext4_li_info->li_state & EXT4_LAZYINIT_RUNNING)) {
3264bfff6873SLukas Czerner 		ret = ext4_run_lazyinit_thread();
3265bfff6873SLukas Czerner 		if (ret)
3266bfff6873SLukas Czerner 			goto out;
3267bfff6873SLukas Czerner 	}
3268bfff6873SLukas Czerner out:
3269bfff6873SLukas Czerner 	mutex_unlock(&ext4_li_mtx);
3270beed5ecbSNicolas Kaiser 	if (ret)
3271bfff6873SLukas Czerner 		kfree(elr);
3272bfff6873SLukas Czerner 	return ret;
3273bfff6873SLukas Czerner }
3274bfff6873SLukas Czerner 
3275bfff6873SLukas Czerner /*
3276bfff6873SLukas Czerner  * We do not need to lock anything since this is called on
3277bfff6873SLukas Czerner  * module unload.
3278bfff6873SLukas Czerner  */
3279bfff6873SLukas Czerner static void ext4_destroy_lazyinit_thread(void)
3280bfff6873SLukas Czerner {
3281bfff6873SLukas Czerner 	/*
3282bfff6873SLukas Czerner 	 * If thread exited earlier
3283bfff6873SLukas Czerner 	 * there's nothing to be done.
3284bfff6873SLukas Czerner 	 */
32858f1f7453SEric Sandeen 	if (!ext4_li_info || !ext4_lazyinit_task)
3286bfff6873SLukas Czerner 		return;
3287bfff6873SLukas Czerner 
32888f1f7453SEric Sandeen 	kthread_stop(ext4_lazyinit_task);
3289bfff6873SLukas Czerner }
3290bfff6873SLukas Czerner 
329125ed6e8aSDarrick J. Wong static int set_journal_csum_feature_set(struct super_block *sb)
329225ed6e8aSDarrick J. Wong {
329325ed6e8aSDarrick J. Wong 	int ret = 1;
329425ed6e8aSDarrick J. Wong 	int compat, incompat;
329525ed6e8aSDarrick J. Wong 	struct ext4_sb_info *sbi = EXT4_SB(sb);
329625ed6e8aSDarrick J. Wong 
32979aa5d32bSDmitry Monakhov 	if (ext4_has_metadata_csum(sb)) {
3298db9ee220SDarrick J. Wong 		/* journal checksum v3 */
329925ed6e8aSDarrick J. Wong 		compat = 0;
3300db9ee220SDarrick J. Wong 		incompat = JBD2_FEATURE_INCOMPAT_CSUM_V3;
330125ed6e8aSDarrick J. Wong 	} else {
330225ed6e8aSDarrick J. Wong 		/* journal checksum v1 */
330325ed6e8aSDarrick J. Wong 		compat = JBD2_FEATURE_COMPAT_CHECKSUM;
330425ed6e8aSDarrick J. Wong 		incompat = 0;
330525ed6e8aSDarrick J. Wong 	}
330625ed6e8aSDarrick J. Wong 
3307feb8c6d3SDarrick J. Wong 	jbd2_journal_clear_features(sbi->s_journal,
3308feb8c6d3SDarrick J. Wong 			JBD2_FEATURE_COMPAT_CHECKSUM, 0,
3309feb8c6d3SDarrick J. Wong 			JBD2_FEATURE_INCOMPAT_CSUM_V3 |
3310feb8c6d3SDarrick J. Wong 			JBD2_FEATURE_INCOMPAT_CSUM_V2);
331125ed6e8aSDarrick J. Wong 	if (test_opt(sb, JOURNAL_ASYNC_COMMIT)) {
331225ed6e8aSDarrick J. Wong 		ret = jbd2_journal_set_features(sbi->s_journal,
331325ed6e8aSDarrick J. Wong 				compat, 0,
331425ed6e8aSDarrick J. Wong 				JBD2_FEATURE_INCOMPAT_ASYNC_COMMIT |
331525ed6e8aSDarrick J. Wong 				incompat);
331625ed6e8aSDarrick J. Wong 	} else if (test_opt(sb, JOURNAL_CHECKSUM)) {
331725ed6e8aSDarrick J. Wong 		ret = jbd2_journal_set_features(sbi->s_journal,
331825ed6e8aSDarrick J. Wong 				compat, 0,
331925ed6e8aSDarrick J. Wong 				incompat);
332025ed6e8aSDarrick J. Wong 		jbd2_journal_clear_features(sbi->s_journal, 0, 0,
332125ed6e8aSDarrick J. Wong 				JBD2_FEATURE_INCOMPAT_ASYNC_COMMIT);
332225ed6e8aSDarrick J. Wong 	} else {
3323feb8c6d3SDarrick J. Wong 		jbd2_journal_clear_features(sbi->s_journal, 0, 0,
3324feb8c6d3SDarrick J. Wong 				JBD2_FEATURE_INCOMPAT_ASYNC_COMMIT);
332525ed6e8aSDarrick J. Wong 	}
332625ed6e8aSDarrick J. Wong 
332725ed6e8aSDarrick J. Wong 	return ret;
332825ed6e8aSDarrick J. Wong }
332925ed6e8aSDarrick J. Wong 
3330952fc18eSTheodore Ts'o /*
3331952fc18eSTheodore Ts'o  * Note: calculating the overhead so we can be compatible with
3332952fc18eSTheodore Ts'o  * historical BSD practice is quite difficult in the face of
3333952fc18eSTheodore Ts'o  * clusters/bigalloc.  This is because multiple metadata blocks from
3334952fc18eSTheodore Ts'o  * different block group can end up in the same allocation cluster.
3335952fc18eSTheodore Ts'o  * Calculating the exact overhead in the face of clustered allocation
3336952fc18eSTheodore Ts'o  * requires either O(all block bitmaps) in memory or O(number of block
3337952fc18eSTheodore Ts'o  * groups**2) in time.  We will still calculate the superblock for
3338952fc18eSTheodore Ts'o  * older file systems --- and if we come across with a bigalloc file
3339952fc18eSTheodore Ts'o  * system with zero in s_overhead_clusters the estimate will be close to
3340952fc18eSTheodore Ts'o  * correct especially for very large cluster sizes --- but for newer
3341952fc18eSTheodore Ts'o  * file systems, it's better to calculate this figure once at mkfs
3342952fc18eSTheodore Ts'o  * time, and store it in the superblock.  If the superblock value is
3343952fc18eSTheodore Ts'o  * present (even for non-bigalloc file systems), we will use it.
3344952fc18eSTheodore Ts'o  */
3345952fc18eSTheodore Ts'o static int count_overhead(struct super_block *sb, ext4_group_t grp,
3346952fc18eSTheodore Ts'o 			  char *buf)
3347952fc18eSTheodore Ts'o {
3348952fc18eSTheodore Ts'o 	struct ext4_sb_info	*sbi = EXT4_SB(sb);
3349952fc18eSTheodore Ts'o 	struct ext4_group_desc	*gdp;
3350952fc18eSTheodore Ts'o 	ext4_fsblk_t		first_block, last_block, b;
3351952fc18eSTheodore Ts'o 	ext4_group_t		i, ngroups = ext4_get_groups_count(sb);
3352952fc18eSTheodore Ts'o 	int			s, j, count = 0;
3353952fc18eSTheodore Ts'o 
3354e2b911c5SDarrick J. Wong 	if (!ext4_has_feature_bigalloc(sb))
33550548bbb8STheodore Ts'o 		return (ext4_bg_has_super(sb, grp) + ext4_bg_num_gdb(sb, grp) +
33560548bbb8STheodore Ts'o 			sbi->s_itb_per_group + 2);
33570548bbb8STheodore Ts'o 
3358952fc18eSTheodore Ts'o 	first_block = le32_to_cpu(sbi->s_es->s_first_data_block) +
3359952fc18eSTheodore Ts'o 		(grp * EXT4_BLOCKS_PER_GROUP(sb));
3360952fc18eSTheodore Ts'o 	last_block = first_block + EXT4_BLOCKS_PER_GROUP(sb) - 1;
3361952fc18eSTheodore Ts'o 	for (i = 0; i < ngroups; i++) {
3362952fc18eSTheodore Ts'o 		gdp = ext4_get_group_desc(sb, i, NULL);
3363952fc18eSTheodore Ts'o 		b = ext4_block_bitmap(sb, gdp);
3364952fc18eSTheodore Ts'o 		if (b >= first_block && b <= last_block) {
3365952fc18eSTheodore Ts'o 			ext4_set_bit(EXT4_B2C(sbi, b - first_block), buf);
3366952fc18eSTheodore Ts'o 			count++;
3367952fc18eSTheodore Ts'o 		}
3368952fc18eSTheodore Ts'o 		b = ext4_inode_bitmap(sb, gdp);
3369952fc18eSTheodore Ts'o 		if (b >= first_block && b <= last_block) {
3370952fc18eSTheodore Ts'o 			ext4_set_bit(EXT4_B2C(sbi, b - first_block), buf);
3371952fc18eSTheodore Ts'o 			count++;
3372952fc18eSTheodore Ts'o 		}
3373952fc18eSTheodore Ts'o 		b = ext4_inode_table(sb, gdp);
3374952fc18eSTheodore Ts'o 		if (b >= first_block && b + sbi->s_itb_per_group <= last_block)
3375952fc18eSTheodore Ts'o 			for (j = 0; j < sbi->s_itb_per_group; j++, b++) {
3376952fc18eSTheodore Ts'o 				int c = EXT4_B2C(sbi, b - first_block);
3377952fc18eSTheodore Ts'o 				ext4_set_bit(c, buf);
3378952fc18eSTheodore Ts'o 				count++;
3379952fc18eSTheodore Ts'o 			}
3380952fc18eSTheodore Ts'o 		if (i != grp)
3381952fc18eSTheodore Ts'o 			continue;
3382952fc18eSTheodore Ts'o 		s = 0;
3383952fc18eSTheodore Ts'o 		if (ext4_bg_has_super(sb, grp)) {
3384952fc18eSTheodore Ts'o 			ext4_set_bit(s++, buf);
3385952fc18eSTheodore Ts'o 			count++;
3386952fc18eSTheodore Ts'o 		}
3387c48ae41bSTheodore Ts'o 		j = ext4_bg_num_gdb(sb, grp);
3388c48ae41bSTheodore Ts'o 		if (s + j > EXT4_BLOCKS_PER_GROUP(sb)) {
3389c48ae41bSTheodore Ts'o 			ext4_error(sb, "Invalid number of block group "
3390c48ae41bSTheodore Ts'o 				   "descriptor blocks: %d", j);
3391c48ae41bSTheodore Ts'o 			j = EXT4_BLOCKS_PER_GROUP(sb) - s;
3392952fc18eSTheodore Ts'o 		}
3393c48ae41bSTheodore Ts'o 		count += j;
3394c48ae41bSTheodore Ts'o 		for (; j > 0; j--)
3395c48ae41bSTheodore Ts'o 			ext4_set_bit(EXT4_B2C(sbi, s++), buf);
3396952fc18eSTheodore Ts'o 	}
3397952fc18eSTheodore Ts'o 	if (!count)
3398952fc18eSTheodore Ts'o 		return 0;
3399952fc18eSTheodore Ts'o 	return EXT4_CLUSTERS_PER_GROUP(sb) -
3400952fc18eSTheodore Ts'o 		ext4_count_free(buf, EXT4_CLUSTERS_PER_GROUP(sb) / 8);
3401952fc18eSTheodore Ts'o }
3402952fc18eSTheodore Ts'o 
3403952fc18eSTheodore Ts'o /*
3404952fc18eSTheodore Ts'o  * Compute the overhead and stash it in sbi->s_overhead
3405952fc18eSTheodore Ts'o  */
3406952fc18eSTheodore Ts'o int ext4_calculate_overhead(struct super_block *sb)
3407952fc18eSTheodore Ts'o {
3408952fc18eSTheodore Ts'o 	struct ext4_sb_info *sbi = EXT4_SB(sb);
3409952fc18eSTheodore Ts'o 	struct ext4_super_block *es = sbi->s_es;
34103c816dedSEric Whitney 	struct inode *j_inode;
34113c816dedSEric Whitney 	unsigned int j_blocks, j_inum = le32_to_cpu(es->s_journal_inum);
3412952fc18eSTheodore Ts'o 	ext4_group_t i, ngroups = ext4_get_groups_count(sb);
3413952fc18eSTheodore Ts'o 	ext4_fsblk_t overhead = 0;
34144fdb5543SDmitry Monakhov 	char *buf = (char *) get_zeroed_page(GFP_NOFS);
3415952fc18eSTheodore Ts'o 
3416952fc18eSTheodore Ts'o 	if (!buf)
3417952fc18eSTheodore Ts'o 		return -ENOMEM;
3418952fc18eSTheodore Ts'o 
3419952fc18eSTheodore Ts'o 	/*
3420952fc18eSTheodore Ts'o 	 * Compute the overhead (FS structures).  This is constant
3421952fc18eSTheodore Ts'o 	 * for a given filesystem unless the number of block groups
3422952fc18eSTheodore Ts'o 	 * changes so we cache the previous value until it does.
3423952fc18eSTheodore Ts'o 	 */
3424952fc18eSTheodore Ts'o 
3425952fc18eSTheodore Ts'o 	/*
3426952fc18eSTheodore Ts'o 	 * All of the blocks before first_data_block are overhead
3427952fc18eSTheodore Ts'o 	 */
3428952fc18eSTheodore Ts'o 	overhead = EXT4_B2C(sbi, le32_to_cpu(es->s_first_data_block));
3429952fc18eSTheodore Ts'o 
3430952fc18eSTheodore Ts'o 	/*
3431952fc18eSTheodore Ts'o 	 * Add the overhead found in each block group
3432952fc18eSTheodore Ts'o 	 */
3433952fc18eSTheodore Ts'o 	for (i = 0; i < ngroups; i++) {
3434952fc18eSTheodore Ts'o 		int blks;
3435952fc18eSTheodore Ts'o 
3436952fc18eSTheodore Ts'o 		blks = count_overhead(sb, i, buf);
3437952fc18eSTheodore Ts'o 		overhead += blks;
3438952fc18eSTheodore Ts'o 		if (blks)
3439952fc18eSTheodore Ts'o 			memset(buf, 0, PAGE_SIZE);
3440952fc18eSTheodore Ts'o 		cond_resched();
3441952fc18eSTheodore Ts'o 	}
34423c816dedSEric Whitney 
34433c816dedSEric Whitney 	/*
34443c816dedSEric Whitney 	 * Add the internal journal blocks whether the journal has been
34453c816dedSEric Whitney 	 * loaded or not
34463c816dedSEric Whitney 	 */
3447b003b524SEric Sandeen 	if (sbi->s_journal && !sbi->journal_bdev)
3448810da240SLukas Czerner 		overhead += EXT4_NUM_B2C(sbi, sbi->s_journal->j_maxlen);
34493c816dedSEric Whitney 	else if (ext4_has_feature_journal(sb) && !sbi->s_journal) {
34503c816dedSEric Whitney 		j_inode = ext4_get_journal_inode(sb, j_inum);
34513c816dedSEric Whitney 		if (j_inode) {
34523c816dedSEric Whitney 			j_blocks = j_inode->i_size >> sb->s_blocksize_bits;
34533c816dedSEric Whitney 			overhead += EXT4_NUM_B2C(sbi, j_blocks);
34543c816dedSEric Whitney 			iput(j_inode);
34553c816dedSEric Whitney 		} else {
34563c816dedSEric Whitney 			ext4_msg(sb, KERN_ERR, "can't get journal size");
34573c816dedSEric Whitney 		}
34583c816dedSEric Whitney 	}
3459952fc18eSTheodore Ts'o 	sbi->s_overhead = overhead;
3460952fc18eSTheodore Ts'o 	smp_wmb();
3461952fc18eSTheodore Ts'o 	free_page((unsigned long) buf);
3462952fc18eSTheodore Ts'o 	return 0;
3463952fc18eSTheodore Ts'o }
3464952fc18eSTheodore Ts'o 
3465b5799018STheodore Ts'o static void ext4_set_resv_clusters(struct super_block *sb)
346627dd4385SLukas Czerner {
346727dd4385SLukas Czerner 	ext4_fsblk_t resv_clusters;
3468b5799018STheodore Ts'o 	struct ext4_sb_info *sbi = EXT4_SB(sb);
346927dd4385SLukas Czerner 
347027dd4385SLukas Czerner 	/*
347130fac0f7SJan Kara 	 * There's no need to reserve anything when we aren't using extents.
347230fac0f7SJan Kara 	 * The space estimates are exact, there are no unwritten extents,
347330fac0f7SJan Kara 	 * hole punching doesn't need new metadata... This is needed especially
347430fac0f7SJan Kara 	 * to keep ext2/3 backward compatibility.
347530fac0f7SJan Kara 	 */
3476e2b911c5SDarrick J. Wong 	if (!ext4_has_feature_extents(sb))
3477b5799018STheodore Ts'o 		return;
347830fac0f7SJan Kara 	/*
347927dd4385SLukas Czerner 	 * By default we reserve 2% or 4096 clusters, whichever is smaller.
348027dd4385SLukas Czerner 	 * This should cover the situations where we can not afford to run
348127dd4385SLukas Czerner 	 * out of space like for example punch hole, or converting
3482556615dcSLukas Czerner 	 * unwritten extents in delalloc path. In most cases such
348327dd4385SLukas Czerner 	 * allocation would require 1, or 2 blocks, higher numbers are
348427dd4385SLukas Czerner 	 * very rare.
348527dd4385SLukas Czerner 	 */
3486b5799018STheodore Ts'o 	resv_clusters = (ext4_blocks_count(sbi->s_es) >>
3487b5799018STheodore Ts'o 			 sbi->s_cluster_bits);
348827dd4385SLukas Czerner 
348927dd4385SLukas Czerner 	do_div(resv_clusters, 50);
349027dd4385SLukas Czerner 	resv_clusters = min_t(ext4_fsblk_t, resv_clusters, 4096);
349127dd4385SLukas Czerner 
3492b5799018STheodore Ts'o 	atomic64_set(&sbi->s_resv_clusters, resv_clusters);
349327dd4385SLukas Czerner }
349427dd4385SLukas Czerner 
3495617ba13bSMingming Cao static int ext4_fill_super(struct super_block *sb, void *data, int silent)
3496ac27a0ecSDave Kleikamp {
34975e405595SDan Williams 	struct dax_device *dax_dev = fs_dax_get_by_bdev(sb->s_bdev);
3498d4c402d9SCurt Wohlgemuth 	char *orig_data = kstrdup(data, GFP_KERNEL);
3499ac27a0ecSDave Kleikamp 	struct buffer_head *bh;
3500617ba13bSMingming Cao 	struct ext4_super_block *es = NULL;
35015aee0f8aSTheodore Ts'o 	struct ext4_sb_info *sbi = kzalloc(sizeof(*sbi), GFP_KERNEL);
3502617ba13bSMingming Cao 	ext4_fsblk_t block;
3503617ba13bSMingming Cao 	ext4_fsblk_t sb_block = get_sb_block(&data);
350470bbb3e0SAndrew Morton 	ext4_fsblk_t logical_sb_block;
3505ac27a0ecSDave Kleikamp 	unsigned long offset = 0;
3506ac27a0ecSDave Kleikamp 	unsigned long journal_devnum = 0;
3507ac27a0ecSDave Kleikamp 	unsigned long def_mount_opts;
3508ac27a0ecSDave Kleikamp 	struct inode *root;
35090390131bSFrank Mayhar 	const char *descr;
3510dcc7dae3SCyrill Gorcunov 	int ret = -ENOMEM;
3511281b5995STheodore Ts'o 	int blocksize, clustersize;
35124ec11028STheodore Ts'o 	unsigned int db_count;
35134ec11028STheodore Ts'o 	unsigned int i;
3514281b5995STheodore Ts'o 	int needs_recovery, has_huge_files, has_bigalloc;
3515bd81d8eeSLaurent Vivier 	__u64 blocks_count;
351607aa2ea1SLukas Czerner 	int err = 0;
3517b3881f74STheodore Ts'o 	unsigned int journal_ioprio = DEFAULT_JOURNAL_IOPRIO;
3518bfff6873SLukas Czerner 	ext4_group_t first_not_zeroed;
3519ac27a0ecSDave Kleikamp 
35205aee0f8aSTheodore Ts'o 	if ((data && !orig_data) || !sbi)
35215aee0f8aSTheodore Ts'o 		goto out_free_base;
3522705895b6SPekka Enberg 
3523aed9eb1bSColin Ian King 	sbi->s_daxdev = dax_dev;
3524705895b6SPekka Enberg 	sbi->s_blockgroup_lock =
3525705895b6SPekka Enberg 		kzalloc(sizeof(struct blockgroup_lock), GFP_KERNEL);
35265aee0f8aSTheodore Ts'o 	if (!sbi->s_blockgroup_lock)
35275aee0f8aSTheodore Ts'o 		goto out_free_base;
35285aee0f8aSTheodore Ts'o 
3529ac27a0ecSDave Kleikamp 	sb->s_fs_info = sbi;
35302c0544b2STheodore Ts'o 	sbi->s_sb = sb;
3531240799cdSTheodore Ts'o 	sbi->s_inode_readahead_blks = EXT4_DEF_INODE_READAHEAD_BLKS;
3532d9c9bef1SMiklos Szeredi 	sbi->s_sb_block = sb_block;
3533f613dfcbSTheodore Ts'o 	if (sb->s_bdev->bd_part)
3534f613dfcbSTheodore Ts'o 		sbi->s_sectors_written_start =
3535dbae2c55SMichael Callahan 			part_stat_read(sb->s_bdev->bd_part, sectors[STAT_WRITE]);
3536ac27a0ecSDave Kleikamp 
35379f6200bbSTheodore Ts'o 	/* Cleanup superblock name */
3538ec3904dcSRasmus Villemoes 	strreplace(sb->s_id, '/', '!');
35399f6200bbSTheodore Ts'o 
354007aa2ea1SLukas Czerner 	/* -EINVAL is default */
3541dcc7dae3SCyrill Gorcunov 	ret = -EINVAL;
3542617ba13bSMingming Cao 	blocksize = sb_min_blocksize(sb, EXT4_MIN_BLOCK_SIZE);
3543ac27a0ecSDave Kleikamp 	if (!blocksize) {
3544b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "unable to set blocksize");
3545ac27a0ecSDave Kleikamp 		goto out_fail;
3546ac27a0ecSDave Kleikamp 	}
3547ac27a0ecSDave Kleikamp 
3548ac27a0ecSDave Kleikamp 	/*
3549617ba13bSMingming Cao 	 * The ext4 superblock will not be buffer aligned for other than 1kB
3550ac27a0ecSDave Kleikamp 	 * block sizes.  We need to calculate the offset from buffer start.
3551ac27a0ecSDave Kleikamp 	 */
3552617ba13bSMingming Cao 	if (blocksize != EXT4_MIN_BLOCK_SIZE) {
355370bbb3e0SAndrew Morton 		logical_sb_block = sb_block * EXT4_MIN_BLOCK_SIZE;
355470bbb3e0SAndrew Morton 		offset = do_div(logical_sb_block, blocksize);
3555ac27a0ecSDave Kleikamp 	} else {
355670bbb3e0SAndrew Morton 		logical_sb_block = sb_block;
3557ac27a0ecSDave Kleikamp 	}
3558ac27a0ecSDave Kleikamp 
3559a8ac900bSGioh Kim 	if (!(bh = sb_bread_unmovable(sb, logical_sb_block))) {
3560b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "unable to read superblock");
3561ac27a0ecSDave Kleikamp 		goto out_fail;
3562ac27a0ecSDave Kleikamp 	}
3563ac27a0ecSDave Kleikamp 	/*
3564ac27a0ecSDave Kleikamp 	 * Note: s_es must be initialized as soon as possible because
3565617ba13bSMingming Cao 	 *       some ext4 macro-instructions depend on its value
3566ac27a0ecSDave Kleikamp 	 */
35672716b802STheodore Ts'o 	es = (struct ext4_super_block *) (bh->b_data + offset);
3568ac27a0ecSDave Kleikamp 	sbi->s_es = es;
3569ac27a0ecSDave Kleikamp 	sb->s_magic = le16_to_cpu(es->s_magic);
3570617ba13bSMingming Cao 	if (sb->s_magic != EXT4_SUPER_MAGIC)
3571617ba13bSMingming Cao 		goto cantfind_ext4;
3572afc32f7eSTheodore Ts'o 	sbi->s_kbytes_written = le64_to_cpu(es->s_kbytes_written);
3573ac27a0ecSDave Kleikamp 
3574feb0ab32SDarrick J. Wong 	/* Warn if metadata_csum and gdt_csum are both set. */
3575e2b911c5SDarrick J. Wong 	if (ext4_has_feature_metadata_csum(sb) &&
3576e2b911c5SDarrick J. Wong 	    ext4_has_feature_gdt_csum(sb))
3577363307e6SJakub Wilk 		ext4_warning(sb, "metadata_csum and uninit_bg are "
3578feb0ab32SDarrick J. Wong 			     "redundant flags; please run fsck.");
3579feb0ab32SDarrick J. Wong 
3580d25425f8SDarrick J. Wong 	/* Check for a known checksum algorithm */
3581d25425f8SDarrick J. Wong 	if (!ext4_verify_csum_type(sb, es)) {
3582d25425f8SDarrick J. Wong 		ext4_msg(sb, KERN_ERR, "VFS: Found ext4 filesystem with "
3583d25425f8SDarrick J. Wong 			 "unknown checksum algorithm.");
3584d25425f8SDarrick J. Wong 		silent = 1;
3585d25425f8SDarrick J. Wong 		goto cantfind_ext4;
3586d25425f8SDarrick J. Wong 	}
3587d25425f8SDarrick J. Wong 
35880441984aSDarrick J. Wong 	/* Load the checksum driver */
35890441984aSDarrick J. Wong 	sbi->s_chksum_driver = crypto_alloc_shash("crc32c", 0, 0);
35900441984aSDarrick J. Wong 	if (IS_ERR(sbi->s_chksum_driver)) {
35910441984aSDarrick J. Wong 		ext4_msg(sb, KERN_ERR, "Cannot load crc32c driver.");
35920441984aSDarrick J. Wong 		ret = PTR_ERR(sbi->s_chksum_driver);
35930441984aSDarrick J. Wong 		sbi->s_chksum_driver = NULL;
35940441984aSDarrick J. Wong 		goto failed_mount;
35950441984aSDarrick J. Wong 	}
35960441984aSDarrick J. Wong 
3597a9c47317SDarrick J. Wong 	/* Check superblock checksum */
3598a9c47317SDarrick J. Wong 	if (!ext4_superblock_csum_verify(sb, es)) {
3599a9c47317SDarrick J. Wong 		ext4_msg(sb, KERN_ERR, "VFS: Found ext4 filesystem with "
3600a9c47317SDarrick J. Wong 			 "invalid superblock checksum.  Run e2fsck?");
3601a9c47317SDarrick J. Wong 		silent = 1;
36026a797d27SDarrick J. Wong 		ret = -EFSBADCRC;
3603a9c47317SDarrick J. Wong 		goto cantfind_ext4;
3604a9c47317SDarrick J. Wong 	}
3605a9c47317SDarrick J. Wong 
3606a9c47317SDarrick J. Wong 	/* Precompute checksum seed for all metadata */
3607e2b911c5SDarrick J. Wong 	if (ext4_has_feature_csum_seed(sb))
36088c81bd8fSDarrick J. Wong 		sbi->s_csum_seed = le32_to_cpu(es->s_checksum_seed);
3609dec214d0STahsin Erdogan 	else if (ext4_has_metadata_csum(sb) || ext4_has_feature_ea_inode(sb))
3610a9c47317SDarrick J. Wong 		sbi->s_csum_seed = ext4_chksum(sbi, ~0, es->s_uuid,
3611a9c47317SDarrick J. Wong 					       sizeof(es->s_uuid));
3612a9c47317SDarrick J. Wong 
3613ac27a0ecSDave Kleikamp 	/* Set defaults before we parse the mount options */
3614ac27a0ecSDave Kleikamp 	def_mount_opts = le32_to_cpu(es->s_default_mount_opts);
3615fd8c37ecSTheodore Ts'o 	set_opt(sb, INIT_INODE_TABLE);
3616617ba13bSMingming Cao 	if (def_mount_opts & EXT4_DEFM_DEBUG)
3617fd8c37ecSTheodore Ts'o 		set_opt(sb, DEBUG);
361887f26807STheodore Ts'o 	if (def_mount_opts & EXT4_DEFM_BSDGROUPS)
3619fd8c37ecSTheodore Ts'o 		set_opt(sb, GRPID);
3620617ba13bSMingming Cao 	if (def_mount_opts & EXT4_DEFM_UID16)
3621fd8c37ecSTheodore Ts'o 		set_opt(sb, NO_UID32);
3622ea663336SEric Sandeen 	/* xattr user namespace & acls are now defaulted on */
3623fd8c37ecSTheodore Ts'o 	set_opt(sb, XATTR_USER);
362403010a33STheodore Ts'o #ifdef CONFIG_EXT4_FS_POSIX_ACL
3625fd8c37ecSTheodore Ts'o 	set_opt(sb, POSIX_ACL);
36262e7842b8SHugh Dickins #endif
362798c1a759SDarrick J. Wong 	/* don't forget to enable journal_csum when metadata_csum is enabled. */
362898c1a759SDarrick J. Wong 	if (ext4_has_metadata_csum(sb))
362998c1a759SDarrick J. Wong 		set_opt(sb, JOURNAL_CHECKSUM);
363098c1a759SDarrick J. Wong 
3631617ba13bSMingming Cao 	if ((def_mount_opts & EXT4_DEFM_JMODE) == EXT4_DEFM_JMODE_DATA)
3632fd8c37ecSTheodore Ts'o 		set_opt(sb, JOURNAL_DATA);
3633617ba13bSMingming Cao 	else if ((def_mount_opts & EXT4_DEFM_JMODE) == EXT4_DEFM_JMODE_ORDERED)
3634fd8c37ecSTheodore Ts'o 		set_opt(sb, ORDERED_DATA);
3635617ba13bSMingming Cao 	else if ((def_mount_opts & EXT4_DEFM_JMODE) == EXT4_DEFM_JMODE_WBACK)
3636fd8c37ecSTheodore Ts'o 		set_opt(sb, WRITEBACK_DATA);
3637ac27a0ecSDave Kleikamp 
3638617ba13bSMingming Cao 	if (le16_to_cpu(sbi->s_es->s_errors) == EXT4_ERRORS_PANIC)
3639fd8c37ecSTheodore Ts'o 		set_opt(sb, ERRORS_PANIC);
3640bb4f397aSAneesh Kumar K.V 	else if (le16_to_cpu(sbi->s_es->s_errors) == EXT4_ERRORS_CONTINUE)
3641fd8c37ecSTheodore Ts'o 		set_opt(sb, ERRORS_CONT);
3642bb4f397aSAneesh Kumar K.V 	else
3643fd8c37ecSTheodore Ts'o 		set_opt(sb, ERRORS_RO);
364445f1a9c3SDarrick J. Wong 	/* block_validity enabled by default; disable with noblock_validity */
3645fd8c37ecSTheodore Ts'o 	set_opt(sb, BLOCK_VALIDITY);
36468b67f04aSTheodore Ts'o 	if (def_mount_opts & EXT4_DEFM_DISCARD)
3647fd8c37ecSTheodore Ts'o 		set_opt(sb, DISCARD);
3648ac27a0ecSDave Kleikamp 
364908cefc7aSEric W. Biederman 	sbi->s_resuid = make_kuid(&init_user_ns, le16_to_cpu(es->s_def_resuid));
365008cefc7aSEric W. Biederman 	sbi->s_resgid = make_kgid(&init_user_ns, le16_to_cpu(es->s_def_resgid));
365130773840STheodore Ts'o 	sbi->s_commit_interval = JBD2_DEFAULT_MAX_COMMIT_AGE * HZ;
365230773840STheodore Ts'o 	sbi->s_min_batch_time = EXT4_DEF_MIN_BATCH_TIME;
365330773840STheodore Ts'o 	sbi->s_max_batch_time = EXT4_DEF_MAX_BATCH_TIME;
3654ac27a0ecSDave Kleikamp 
36558b67f04aSTheodore Ts'o 	if ((def_mount_opts & EXT4_DEFM_NOBARRIER) == 0)
3656fd8c37ecSTheodore Ts'o 		set_opt(sb, BARRIER);
3657ac27a0ecSDave Kleikamp 
36581e2462f9SMingming Cao 	/*
3659dd919b98SAneesh Kumar K.V 	 * enable delayed allocation by default
3660dd919b98SAneesh Kumar K.V 	 * Use -o nodelalloc to turn it off
3661dd919b98SAneesh Kumar K.V 	 */
3662bc0b75f7STheodore Ts'o 	if (!IS_EXT3_SB(sb) && !IS_EXT2_SB(sb) &&
36638b67f04aSTheodore Ts'o 	    ((def_mount_opts & EXT4_DEFM_NODELALLOC) == 0))
3664fd8c37ecSTheodore Ts'o 		set_opt(sb, DELALLOC);
3665dd919b98SAneesh Kumar K.V 
366651ce6511SLukas Czerner 	/*
366751ce6511SLukas Czerner 	 * set default s_li_wait_mult for lazyinit, for the case there is
366851ce6511SLukas Czerner 	 * no mount option specified.
366951ce6511SLukas Czerner 	 */
367051ce6511SLukas Czerner 	sbi->s_li_wait_mult = EXT4_DEF_LI_WAIT_MULT;
367151ce6511SLukas Czerner 
36725aee0f8aSTheodore Ts'o 	if (sbi->s_es->s_mount_opts[0]) {
36735aee0f8aSTheodore Ts'o 		char *s_mount_opts = kstrndup(sbi->s_es->s_mount_opts,
36745aee0f8aSTheodore Ts'o 					      sizeof(sbi->s_es->s_mount_opts),
36755aee0f8aSTheodore Ts'o 					      GFP_KERNEL);
36765aee0f8aSTheodore Ts'o 		if (!s_mount_opts)
36775aee0f8aSTheodore Ts'o 			goto failed_mount;
36785aee0f8aSTheodore Ts'o 		if (!parse_options(s_mount_opts, sb, &journal_devnum,
36795aee0f8aSTheodore Ts'o 				   &journal_ioprio, 0)) {
36808b67f04aSTheodore Ts'o 			ext4_msg(sb, KERN_WARNING,
36818b67f04aSTheodore Ts'o 				 "failed to parse options in superblock: %s",
36825aee0f8aSTheodore Ts'o 				 s_mount_opts);
36835aee0f8aSTheodore Ts'o 		}
36845aee0f8aSTheodore Ts'o 		kfree(s_mount_opts);
36858b67f04aSTheodore Ts'o 	}
36865a916be1STheodore Ts'o 	sbi->s_def_mount_opt = sbi->s_mount_opt;
3687b3881f74STheodore Ts'o 	if (!parse_options((char *) data, sb, &journal_devnum,
3688661aa520SEric Sandeen 			   &journal_ioprio, 0))
3689ac27a0ecSDave Kleikamp 		goto failed_mount;
3690ac27a0ecSDave Kleikamp 
369156889787STheodore Ts'o 	if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_JOURNAL_DATA) {
369256889787STheodore Ts'o 		printk_once(KERN_WARNING "EXT4-fs: Warning: mounting "
369356889787STheodore Ts'o 			    "with data=journal disables delayed "
369456889787STheodore Ts'o 			    "allocation and O_DIRECT support!\n");
369556889787STheodore Ts'o 		if (test_opt2(sb, EXPLICIT_DELALLOC)) {
369656889787STheodore Ts'o 			ext4_msg(sb, KERN_ERR, "can't mount with "
369756889787STheodore Ts'o 				 "both data=journal and delalloc");
369856889787STheodore Ts'o 			goto failed_mount;
369956889787STheodore Ts'o 		}
370056889787STheodore Ts'o 		if (test_opt(sb, DIOREAD_NOLOCK)) {
370156889787STheodore Ts'o 			ext4_msg(sb, KERN_ERR, "can't mount with "
37026ae6514bSPiotr Sarna 				 "both data=journal and dioread_nolock");
370356889787STheodore Ts'o 			goto failed_mount;
370456889787STheodore Ts'o 		}
3705923ae0ffSRoss Zwisler 		if (test_opt(sb, DAX)) {
3706923ae0ffSRoss Zwisler 			ext4_msg(sb, KERN_ERR, "can't mount with "
3707923ae0ffSRoss Zwisler 				 "both data=journal and dax");
3708923ae0ffSRoss Zwisler 			goto failed_mount;
3709923ae0ffSRoss Zwisler 		}
371073b92a2aSSergey Karamov 		if (ext4_has_feature_encrypt(sb)) {
371173b92a2aSSergey Karamov 			ext4_msg(sb, KERN_WARNING,
371273b92a2aSSergey Karamov 				 "encrypted files will use data=ordered "
371373b92a2aSSergey Karamov 				 "instead of data journaling mode");
371473b92a2aSSergey Karamov 		}
371556889787STheodore Ts'o 		if (test_opt(sb, DELALLOC))
371656889787STheodore Ts'o 			clear_opt(sb, DELALLOC);
3717001e4a87STejun Heo 	} else {
3718001e4a87STejun Heo 		sb->s_iflags |= SB_I_CGROUPWB;
371956889787STheodore Ts'o 	}
372056889787STheodore Ts'o 
37211751e8a6SLinus Torvalds 	sb->s_flags = (sb->s_flags & ~SB_POSIXACL) |
37221751e8a6SLinus Torvalds 		(test_opt(sb, POSIX_ACL) ? SB_POSIXACL : 0);
3723ac27a0ecSDave Kleikamp 
3724617ba13bSMingming Cao 	if (le32_to_cpu(es->s_rev_level) == EXT4_GOOD_OLD_REV &&
3725e2b911c5SDarrick J. Wong 	    (ext4_has_compat_features(sb) ||
3726e2b911c5SDarrick J. Wong 	     ext4_has_ro_compat_features(sb) ||
3727e2b911c5SDarrick J. Wong 	     ext4_has_incompat_features(sb)))
3728b31e1552SEric Sandeen 		ext4_msg(sb, KERN_WARNING,
3729b31e1552SEric Sandeen 		       "feature flags set on rev 0 fs, "
3730b31e1552SEric Sandeen 		       "running e2fsck is recommended");
3731469108ffSTheodore Tso 
3732ed3654ebSTheodore Ts'o 	if (es->s_creator_os == cpu_to_le32(EXT4_OS_HURD)) {
3733ed3654ebSTheodore Ts'o 		set_opt2(sb, HURD_COMPAT);
3734e2b911c5SDarrick J. Wong 		if (ext4_has_feature_64bit(sb)) {
3735ed3654ebSTheodore Ts'o 			ext4_msg(sb, KERN_ERR,
3736ed3654ebSTheodore Ts'o 				 "The Hurd can't support 64-bit file systems");
3737ed3654ebSTheodore Ts'o 			goto failed_mount;
3738ed3654ebSTheodore Ts'o 		}
3739dec214d0STahsin Erdogan 
3740dec214d0STahsin Erdogan 		/*
3741dec214d0STahsin Erdogan 		 * ea_inode feature uses l_i_version field which is not
3742dec214d0STahsin Erdogan 		 * available in HURD_COMPAT mode.
3743dec214d0STahsin Erdogan 		 */
3744dec214d0STahsin Erdogan 		if (ext4_has_feature_ea_inode(sb)) {
3745dec214d0STahsin Erdogan 			ext4_msg(sb, KERN_ERR,
3746dec214d0STahsin Erdogan 				 "ea_inode feature is not supported for Hurd");
3747dec214d0STahsin Erdogan 			goto failed_mount;
3748dec214d0STahsin Erdogan 		}
3749ed3654ebSTheodore Ts'o 	}
3750ed3654ebSTheodore Ts'o 
37512035e776STheodore Ts'o 	if (IS_EXT2_SB(sb)) {
37522035e776STheodore Ts'o 		if (ext2_feature_set_ok(sb))
37532035e776STheodore Ts'o 			ext4_msg(sb, KERN_INFO, "mounting ext2 file system "
37542035e776STheodore Ts'o 				 "using the ext4 subsystem");
37552035e776STheodore Ts'o 		else {
37560d9366d6SEric Sandeen 			/*
37570d9366d6SEric Sandeen 			 * If we're probing be silent, if this looks like
37580d9366d6SEric Sandeen 			 * it's actually an ext[34] filesystem.
37590d9366d6SEric Sandeen 			 */
37600d9366d6SEric Sandeen 			if (silent && ext4_feature_set_ok(sb, sb_rdonly(sb)))
37610d9366d6SEric Sandeen 				goto failed_mount;
37622035e776STheodore Ts'o 			ext4_msg(sb, KERN_ERR, "couldn't mount as ext2 due "
37632035e776STheodore Ts'o 				 "to feature incompatibilities");
37642035e776STheodore Ts'o 			goto failed_mount;
37652035e776STheodore Ts'o 		}
37662035e776STheodore Ts'o 	}
37672035e776STheodore Ts'o 
37682035e776STheodore Ts'o 	if (IS_EXT3_SB(sb)) {
37692035e776STheodore Ts'o 		if (ext3_feature_set_ok(sb))
37702035e776STheodore Ts'o 			ext4_msg(sb, KERN_INFO, "mounting ext3 file system "
37712035e776STheodore Ts'o 				 "using the ext4 subsystem");
37722035e776STheodore Ts'o 		else {
37730d9366d6SEric Sandeen 			/*
37740d9366d6SEric Sandeen 			 * If we're probing be silent, if this looks like
37750d9366d6SEric Sandeen 			 * it's actually an ext4 filesystem.
37760d9366d6SEric Sandeen 			 */
37770d9366d6SEric Sandeen 			if (silent && ext4_feature_set_ok(sb, sb_rdonly(sb)))
37780d9366d6SEric Sandeen 				goto failed_mount;
37792035e776STheodore Ts'o 			ext4_msg(sb, KERN_ERR, "couldn't mount as ext3 due "
37802035e776STheodore Ts'o 				 "to feature incompatibilities");
37812035e776STheodore Ts'o 			goto failed_mount;
37822035e776STheodore Ts'o 		}
37832035e776STheodore Ts'o 	}
37842035e776STheodore Ts'o 
3785469108ffSTheodore Tso 	/*
3786ac27a0ecSDave Kleikamp 	 * Check feature flags regardless of the revision level, since we
3787ac27a0ecSDave Kleikamp 	 * previously didn't change the revision level when setting the flags,
3788ac27a0ecSDave Kleikamp 	 * so there is a chance incompat flags are set on a rev 0 filesystem.
3789ac27a0ecSDave Kleikamp 	 */
3790bc98a42cSDavid Howells 	if (!ext4_feature_set_ok(sb, (sb_rdonly(sb))))
3791ac27a0ecSDave Kleikamp 		goto failed_mount;
3792a13fb1a4SEric Sandeen 
3793261cb20cSJan Kara 	blocksize = BLOCK_SIZE << le32_to_cpu(es->s_log_block_size);
3794617ba13bSMingming Cao 	if (blocksize < EXT4_MIN_BLOCK_SIZE ||
3795617ba13bSMingming Cao 	    blocksize > EXT4_MAX_BLOCK_SIZE) {
3796b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR,
37978cdf3372STheodore Ts'o 		       "Unsupported filesystem blocksize %d (%d log_block_size)",
37988cdf3372STheodore Ts'o 			 blocksize, le32_to_cpu(es->s_log_block_size));
37998cdf3372STheodore Ts'o 		goto failed_mount;
38008cdf3372STheodore Ts'o 	}
38018cdf3372STheodore Ts'o 	if (le32_to_cpu(es->s_log_block_size) >
38028cdf3372STheodore Ts'o 	    (EXT4_MAX_BLOCK_LOG_SIZE - EXT4_MIN_BLOCK_LOG_SIZE)) {
38038cdf3372STheodore Ts'o 		ext4_msg(sb, KERN_ERR,
38048cdf3372STheodore Ts'o 			 "Invalid log block size: %u",
38058cdf3372STheodore Ts'o 			 le32_to_cpu(es->s_log_block_size));
3806ac27a0ecSDave Kleikamp 		goto failed_mount;
3807ac27a0ecSDave Kleikamp 	}
3808bfe0a5f4STheodore Ts'o 	if (le32_to_cpu(es->s_log_cluster_size) >
3809bfe0a5f4STheodore Ts'o 	    (EXT4_MAX_CLUSTER_LOG_SIZE - EXT4_MIN_BLOCK_LOG_SIZE)) {
3810bfe0a5f4STheodore Ts'o 		ext4_msg(sb, KERN_ERR,
3811bfe0a5f4STheodore Ts'o 			 "Invalid log cluster size: %u",
3812bfe0a5f4STheodore Ts'o 			 le32_to_cpu(es->s_log_cluster_size));
3813bfe0a5f4STheodore Ts'o 		goto failed_mount;
3814bfe0a5f4STheodore Ts'o 	}
3815ac27a0ecSDave Kleikamp 
38165b9554dcSTheodore Ts'o 	if (le16_to_cpu(sbi->s_es->s_reserved_gdt_blocks) > (blocksize / 4)) {
38175b9554dcSTheodore Ts'o 		ext4_msg(sb, KERN_ERR,
38185b9554dcSTheodore Ts'o 			 "Number of reserved GDT blocks insanely large: %d",
38195b9554dcSTheodore Ts'o 			 le16_to_cpu(sbi->s_es->s_reserved_gdt_blocks));
38205b9554dcSTheodore Ts'o 		goto failed_mount;
38215b9554dcSTheodore Ts'o 	}
38225b9554dcSTheodore Ts'o 
3823923ae0ffSRoss Zwisler 	if (sbi->s_mount_opt & EXT4_MOUNT_DAX) {
3824559db4c6SRoss Zwisler 		if (ext4_has_feature_inline_data(sb)) {
3825559db4c6SRoss Zwisler 			ext4_msg(sb, KERN_ERR, "Cannot use DAX on a filesystem"
3826559db4c6SRoss Zwisler 					" that may contain inline data");
382724f3478dSDan Williams 			sbi->s_mount_opt &= ~EXT4_MOUNT_DAX;
3828559db4c6SRoss Zwisler 		}
382980660f20SDave Jiang 		if (!bdev_dax_supported(sb->s_bdev, blocksize)) {
383024f3478dSDan Williams 			ext4_msg(sb, KERN_ERR,
383124f3478dSDan Williams 				"DAX unsupported by block device. Turning off DAX.");
383224f3478dSDan Williams 			sbi->s_mount_opt &= ~EXT4_MOUNT_DAX;
383324f3478dSDan Williams 		}
3834923ae0ffSRoss Zwisler 	}
3835923ae0ffSRoss Zwisler 
3836e2b911c5SDarrick J. Wong 	if (ext4_has_feature_encrypt(sb) && es->s_encryption_level) {
38376ddb2447STheodore Ts'o 		ext4_msg(sb, KERN_ERR, "Unsupported encryption level %d",
38386ddb2447STheodore Ts'o 			 es->s_encryption_level);
38396ddb2447STheodore Ts'o 		goto failed_mount;
38406ddb2447STheodore Ts'o 	}
38416ddb2447STheodore Ts'o 
3842ac27a0ecSDave Kleikamp 	if (sb->s_blocksize != blocksize) {
3843ce40733cSAneesh Kumar K.V 		/* Validate the filesystem blocksize */
3844ce40733cSAneesh Kumar K.V 		if (!sb_set_blocksize(sb, blocksize)) {
3845b31e1552SEric Sandeen 			ext4_msg(sb, KERN_ERR, "bad block size %d",
3846ce40733cSAneesh Kumar K.V 					blocksize);
3847ac27a0ecSDave Kleikamp 			goto failed_mount;
3848ac27a0ecSDave Kleikamp 		}
3849ac27a0ecSDave Kleikamp 
3850ac27a0ecSDave Kleikamp 		brelse(bh);
385170bbb3e0SAndrew Morton 		logical_sb_block = sb_block * EXT4_MIN_BLOCK_SIZE;
385270bbb3e0SAndrew Morton 		offset = do_div(logical_sb_block, blocksize);
3853a8ac900bSGioh Kim 		bh = sb_bread_unmovable(sb, logical_sb_block);
3854ac27a0ecSDave Kleikamp 		if (!bh) {
3855b31e1552SEric Sandeen 			ext4_msg(sb, KERN_ERR,
3856b31e1552SEric Sandeen 			       "Can't read superblock on 2nd try");
3857ac27a0ecSDave Kleikamp 			goto failed_mount;
3858ac27a0ecSDave Kleikamp 		}
38592716b802STheodore Ts'o 		es = (struct ext4_super_block *)(bh->b_data + offset);
3860ac27a0ecSDave Kleikamp 		sbi->s_es = es;
3861617ba13bSMingming Cao 		if (es->s_magic != cpu_to_le16(EXT4_SUPER_MAGIC)) {
3862b31e1552SEric Sandeen 			ext4_msg(sb, KERN_ERR,
3863b31e1552SEric Sandeen 			       "Magic mismatch, very weird!");
3864ac27a0ecSDave Kleikamp 			goto failed_mount;
3865ac27a0ecSDave Kleikamp 		}
3866ac27a0ecSDave Kleikamp 	}
3867ac27a0ecSDave Kleikamp 
3868e2b911c5SDarrick J. Wong 	has_huge_files = ext4_has_feature_huge_file(sb);
3869f287a1a5STheodore Ts'o 	sbi->s_bitmap_maxbytes = ext4_max_bitmap_size(sb->s_blocksize_bits,
3870f287a1a5STheodore Ts'o 						      has_huge_files);
3871f287a1a5STheodore Ts'o 	sb->s_maxbytes = ext4_max_size(sb->s_blocksize_bits, has_huge_files);
3872ac27a0ecSDave Kleikamp 
3873617ba13bSMingming Cao 	if (le32_to_cpu(es->s_rev_level) == EXT4_GOOD_OLD_REV) {
3874617ba13bSMingming Cao 		sbi->s_inode_size = EXT4_GOOD_OLD_INODE_SIZE;
3875617ba13bSMingming Cao 		sbi->s_first_ino = EXT4_GOOD_OLD_FIRST_INO;
3876ac27a0ecSDave Kleikamp 	} else {
3877ac27a0ecSDave Kleikamp 		sbi->s_inode_size = le16_to_cpu(es->s_inode_size);
3878ac27a0ecSDave Kleikamp 		sbi->s_first_ino = le32_to_cpu(es->s_first_ino);
3879c37e9e01STheodore Ts'o 		if (sbi->s_first_ino < EXT4_GOOD_OLD_FIRST_INO) {
3880c37e9e01STheodore Ts'o 			ext4_msg(sb, KERN_ERR, "invalid first ino: %u",
3881c37e9e01STheodore Ts'o 				 sbi->s_first_ino);
3882c37e9e01STheodore Ts'o 			goto failed_mount;
3883c37e9e01STheodore Ts'o 		}
3884617ba13bSMingming Cao 		if ((sbi->s_inode_size < EXT4_GOOD_OLD_INODE_SIZE) ||
38851330593eSVignesh Babu 		    (!is_power_of_2(sbi->s_inode_size)) ||
3886ac27a0ecSDave Kleikamp 		    (sbi->s_inode_size > blocksize)) {
3887b31e1552SEric Sandeen 			ext4_msg(sb, KERN_ERR,
3888b31e1552SEric Sandeen 			       "unsupported inode size: %d",
3889ac27a0ecSDave Kleikamp 			       sbi->s_inode_size);
3890ac27a0ecSDave Kleikamp 			goto failed_mount;
3891ac27a0ecSDave Kleikamp 		}
3892ef7f3835SKalpak Shah 		if (sbi->s_inode_size > EXT4_GOOD_OLD_INODE_SIZE)
3893ef7f3835SKalpak Shah 			sb->s_time_gran = 1 << (EXT4_EPOCH_BITS - 2);
3894ac27a0ecSDave Kleikamp 	}
38950b8e58a1SAndreas Dilger 
38960d1ee42fSAlexandre Ratchov 	sbi->s_desc_size = le16_to_cpu(es->s_desc_size);
3897e2b911c5SDarrick J. Wong 	if (ext4_has_feature_64bit(sb)) {
38988fadc143SAlexandre Ratchov 		if (sbi->s_desc_size < EXT4_MIN_DESC_SIZE_64BIT ||
38990d1ee42fSAlexandre Ratchov 		    sbi->s_desc_size > EXT4_MAX_DESC_SIZE ||
3900d8ea6cf8Svignesh babu 		    !is_power_of_2(sbi->s_desc_size)) {
3901b31e1552SEric Sandeen 			ext4_msg(sb, KERN_ERR,
3902b31e1552SEric Sandeen 			       "unsupported descriptor size %lu",
39030d1ee42fSAlexandre Ratchov 			       sbi->s_desc_size);
39040d1ee42fSAlexandre Ratchov 			goto failed_mount;
39050d1ee42fSAlexandre Ratchov 		}
39060d1ee42fSAlexandre Ratchov 	} else
39070d1ee42fSAlexandre Ratchov 		sbi->s_desc_size = EXT4_MIN_DESC_SIZE;
39080b8e58a1SAndreas Dilger 
3909ac27a0ecSDave Kleikamp 	sbi->s_blocks_per_group = le32_to_cpu(es->s_blocks_per_group);
3910ac27a0ecSDave Kleikamp 	sbi->s_inodes_per_group = le32_to_cpu(es->s_inodes_per_group);
39110b8e58a1SAndreas Dilger 
3912617ba13bSMingming Cao 	sbi->s_inodes_per_block = blocksize / EXT4_INODE_SIZE(sb);
3913ac27a0ecSDave Kleikamp 	if (sbi->s_inodes_per_block == 0)
3914617ba13bSMingming Cao 		goto cantfind_ext4;
3915cd6bb35bSTheodore Ts'o 	if (sbi->s_inodes_per_group < sbi->s_inodes_per_block ||
3916cd6bb35bSTheodore Ts'o 	    sbi->s_inodes_per_group > blocksize * 8) {
3917cd6bb35bSTheodore Ts'o 		ext4_msg(sb, KERN_ERR, "invalid inodes per group: %lu\n",
3918cd6bb35bSTheodore Ts'o 			 sbi->s_blocks_per_group);
3919cd6bb35bSTheodore Ts'o 		goto failed_mount;
3920cd6bb35bSTheodore Ts'o 	}
3921ac27a0ecSDave Kleikamp 	sbi->s_itb_per_group = sbi->s_inodes_per_group /
3922ac27a0ecSDave Kleikamp 					sbi->s_inodes_per_block;
39230d1ee42fSAlexandre Ratchov 	sbi->s_desc_per_block = blocksize / EXT4_DESC_SIZE(sb);
3924ac27a0ecSDave Kleikamp 	sbi->s_sbh = bh;
3925ac27a0ecSDave Kleikamp 	sbi->s_mount_state = le16_to_cpu(es->s_state);
3926e57aa839SFengguang Wu 	sbi->s_addr_per_block_bits = ilog2(EXT4_ADDR_PER_BLOCK(sb));
3927e57aa839SFengguang Wu 	sbi->s_desc_per_block_bits = ilog2(EXT4_DESC_PER_BLOCK(sb));
39280b8e58a1SAndreas Dilger 
3929ac27a0ecSDave Kleikamp 	for (i = 0; i < 4; i++)
3930ac27a0ecSDave Kleikamp 		sbi->s_hash_seed[i] = le32_to_cpu(es->s_hash_seed[i]);
3931ac27a0ecSDave Kleikamp 	sbi->s_def_hash_version = es->s_def_hash_version;
3932e2b911c5SDarrick J. Wong 	if (ext4_has_feature_dir_index(sb)) {
3933f99b2589STheodore Ts'o 		i = le32_to_cpu(es->s_flags);
3934f99b2589STheodore Ts'o 		if (i & EXT2_FLAGS_UNSIGNED_HASH)
3935f99b2589STheodore Ts'o 			sbi->s_hash_unsigned = 3;
3936f99b2589STheodore Ts'o 		else if ((i & EXT2_FLAGS_SIGNED_HASH) == 0) {
3937f99b2589STheodore Ts'o #ifdef __CHAR_UNSIGNED__
3938bc98a42cSDavid Howells 			if (!sb_rdonly(sb))
393923301410STheodore Ts'o 				es->s_flags |=
394023301410STheodore Ts'o 					cpu_to_le32(EXT2_FLAGS_UNSIGNED_HASH);
3941f99b2589STheodore Ts'o 			sbi->s_hash_unsigned = 3;
3942f99b2589STheodore Ts'o #else
3943bc98a42cSDavid Howells 			if (!sb_rdonly(sb))
394423301410STheodore Ts'o 				es->s_flags |=
394523301410STheodore Ts'o 					cpu_to_le32(EXT2_FLAGS_SIGNED_HASH);
3946f99b2589STheodore Ts'o #endif
3947f99b2589STheodore Ts'o 		}
394823301410STheodore Ts'o 	}
3949ac27a0ecSDave Kleikamp 
3950281b5995STheodore Ts'o 	/* Handle clustersize */
3951281b5995STheodore Ts'o 	clustersize = BLOCK_SIZE << le32_to_cpu(es->s_log_cluster_size);
3952e2b911c5SDarrick J. Wong 	has_bigalloc = ext4_has_feature_bigalloc(sb);
3953281b5995STheodore Ts'o 	if (has_bigalloc) {
3954281b5995STheodore Ts'o 		if (clustersize < blocksize) {
3955281b5995STheodore Ts'o 			ext4_msg(sb, KERN_ERR,
3956281b5995STheodore Ts'o 				 "cluster size (%d) smaller than "
3957281b5995STheodore Ts'o 				 "block size (%d)", clustersize, blocksize);
3958281b5995STheodore Ts'o 			goto failed_mount;
3959281b5995STheodore Ts'o 		}
3960281b5995STheodore Ts'o 		sbi->s_cluster_bits = le32_to_cpu(es->s_log_cluster_size) -
3961281b5995STheodore Ts'o 			le32_to_cpu(es->s_log_block_size);
3962281b5995STheodore Ts'o 		sbi->s_clusters_per_group =
3963281b5995STheodore Ts'o 			le32_to_cpu(es->s_clusters_per_group);
3964281b5995STheodore Ts'o 		if (sbi->s_clusters_per_group > blocksize * 8) {
3965281b5995STheodore Ts'o 			ext4_msg(sb, KERN_ERR,
3966281b5995STheodore Ts'o 				 "#clusters per group too big: %lu",
3967281b5995STheodore Ts'o 				 sbi->s_clusters_per_group);
3968281b5995STheodore Ts'o 			goto failed_mount;
3969281b5995STheodore Ts'o 		}
3970281b5995STheodore Ts'o 		if (sbi->s_blocks_per_group !=
3971281b5995STheodore Ts'o 		    (sbi->s_clusters_per_group * (clustersize / blocksize))) {
3972281b5995STheodore Ts'o 			ext4_msg(sb, KERN_ERR, "blocks per group (%lu) and "
3973281b5995STheodore Ts'o 				 "clusters per group (%lu) inconsistent",
3974281b5995STheodore Ts'o 				 sbi->s_blocks_per_group,
3975281b5995STheodore Ts'o 				 sbi->s_clusters_per_group);
3976281b5995STheodore Ts'o 			goto failed_mount;
3977281b5995STheodore Ts'o 		}
3978281b5995STheodore Ts'o 	} else {
3979281b5995STheodore Ts'o 		if (clustersize != blocksize) {
3980bfe0a5f4STheodore Ts'o 			ext4_msg(sb, KERN_ERR,
3981bfe0a5f4STheodore Ts'o 				 "fragment/cluster size (%d) != "
3982bfe0a5f4STheodore Ts'o 				 "block size (%d)", clustersize, blocksize);
3983bfe0a5f4STheodore Ts'o 			goto failed_mount;
3984281b5995STheodore Ts'o 		}
3985ac27a0ecSDave Kleikamp 		if (sbi->s_blocks_per_group > blocksize * 8) {
3986b31e1552SEric Sandeen 			ext4_msg(sb, KERN_ERR,
3987b31e1552SEric Sandeen 				 "#blocks per group too big: %lu",
3988ac27a0ecSDave Kleikamp 				 sbi->s_blocks_per_group);
3989ac27a0ecSDave Kleikamp 			goto failed_mount;
3990ac27a0ecSDave Kleikamp 		}
3991281b5995STheodore Ts'o 		sbi->s_clusters_per_group = sbi->s_blocks_per_group;
3992281b5995STheodore Ts'o 		sbi->s_cluster_bits = 0;
3993281b5995STheodore Ts'o 	}
3994281b5995STheodore Ts'o 	sbi->s_cluster_ratio = clustersize / blocksize;
3995281b5995STheodore Ts'o 
3996960fd856STheodore Ts'o 	/* Do we have standard group size of clustersize * 8 blocks ? */
3997960fd856STheodore Ts'o 	if (sbi->s_blocks_per_group == clustersize << 3)
3998960fd856STheodore Ts'o 		set_opt2(sb, STD_GROUP_SIZE);
3999960fd856STheodore Ts'o 
4000bf43d84bSEric Sandeen 	/*
4001bf43d84bSEric Sandeen 	 * Test whether we have more sectors than will fit in sector_t,
4002bf43d84bSEric Sandeen 	 * and whether the max offset is addressable by the page cache.
4003bf43d84bSEric Sandeen 	 */
40045a9ae68aSDarrick J. Wong 	err = generic_check_addressable(sb->s_blocksize_bits,
400530ca22c7SPatrick J. LoPresti 					ext4_blocks_count(es));
40065a9ae68aSDarrick J. Wong 	if (err) {
4007b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "filesystem"
4008bf43d84bSEric Sandeen 			 " too large to mount safely on this system");
4009ac27a0ecSDave Kleikamp 		if (sizeof(sector_t) < 8)
401090c699a9SBartlomiej Zolnierkiewicz 			ext4_msg(sb, KERN_WARNING, "CONFIG_LBDAF not enabled");
4011ac27a0ecSDave Kleikamp 		goto failed_mount;
4012ac27a0ecSDave Kleikamp 	}
4013ac27a0ecSDave Kleikamp 
4014617ba13bSMingming Cao 	if (EXT4_BLOCKS_PER_GROUP(sb) == 0)
4015617ba13bSMingming Cao 		goto cantfind_ext4;
4016e7c95593SEric Sandeen 
40170f2ddca6SFrom: Thiemo Nagel 	/* check blocks count against device size */
40180f2ddca6SFrom: Thiemo Nagel 	blocks_count = sb->s_bdev->bd_inode->i_size >> sb->s_blocksize_bits;
40190f2ddca6SFrom: Thiemo Nagel 	if (blocks_count && ext4_blocks_count(es) > blocks_count) {
4020b31e1552SEric Sandeen 		ext4_msg(sb, KERN_WARNING, "bad geometry: block count %llu "
4021b31e1552SEric Sandeen 		       "exceeds size of device (%llu blocks)",
40220f2ddca6SFrom: Thiemo Nagel 		       ext4_blocks_count(es), blocks_count);
40230f2ddca6SFrom: Thiemo Nagel 		goto failed_mount;
40240f2ddca6SFrom: Thiemo Nagel 	}
40250f2ddca6SFrom: Thiemo Nagel 
40264ec11028STheodore Ts'o 	/*
40274ec11028STheodore Ts'o 	 * It makes no sense for the first data block to be beyond the end
40284ec11028STheodore Ts'o 	 * of the filesystem.
40294ec11028STheodore Ts'o 	 */
40304ec11028STheodore Ts'o 	if (le32_to_cpu(es->s_first_data_block) >= ext4_blocks_count(es)) {
4031b31e1552SEric Sandeen 		ext4_msg(sb, KERN_WARNING, "bad geometry: first data "
4032b31e1552SEric Sandeen 			 "block %u is beyond end of filesystem (%llu)",
4033e7c95593SEric Sandeen 			 le32_to_cpu(es->s_first_data_block),
40344ec11028STheodore Ts'o 			 ext4_blocks_count(es));
4035e7c95593SEric Sandeen 		goto failed_mount;
4036e7c95593SEric Sandeen 	}
4037bfe0a5f4STheodore Ts'o 	if ((es->s_first_data_block == 0) && (es->s_log_block_size == 0) &&
4038bfe0a5f4STheodore Ts'o 	    (sbi->s_cluster_ratio == 1)) {
4039bfe0a5f4STheodore Ts'o 		ext4_msg(sb, KERN_WARNING, "bad geometry: first data "
4040bfe0a5f4STheodore Ts'o 			 "block is 0 with a 1k block and cluster size");
4041bfe0a5f4STheodore Ts'o 		goto failed_mount;
4042bfe0a5f4STheodore Ts'o 	}
4043bfe0a5f4STheodore Ts'o 
4044bd81d8eeSLaurent Vivier 	blocks_count = (ext4_blocks_count(es) -
4045bd81d8eeSLaurent Vivier 			le32_to_cpu(es->s_first_data_block) +
4046bd81d8eeSLaurent Vivier 			EXT4_BLOCKS_PER_GROUP(sb) - 1);
4047bd81d8eeSLaurent Vivier 	do_div(blocks_count, EXT4_BLOCKS_PER_GROUP(sb));
40484ec11028STheodore Ts'o 	if (blocks_count > ((uint64_t)1<<32) - EXT4_DESC_PER_BLOCK(sb)) {
4049b31e1552SEric Sandeen 		ext4_msg(sb, KERN_WARNING, "groups count too large: %u "
40504ec11028STheodore Ts'o 		       "(block count %llu, first data block %u, "
4051b31e1552SEric Sandeen 		       "blocks per group %lu)", sbi->s_groups_count,
40524ec11028STheodore Ts'o 		       ext4_blocks_count(es),
40534ec11028STheodore Ts'o 		       le32_to_cpu(es->s_first_data_block),
40544ec11028STheodore Ts'o 		       EXT4_BLOCKS_PER_GROUP(sb));
40554ec11028STheodore Ts'o 		goto failed_mount;
40564ec11028STheodore Ts'o 	}
4057bd81d8eeSLaurent Vivier 	sbi->s_groups_count = blocks_count;
4058fb0a387dSEric Sandeen 	sbi->s_blockfile_groups = min_t(ext4_group_t, sbi->s_groups_count,
4059fb0a387dSEric Sandeen 			(EXT4_MAX_BLOCK_FILE_PHYS / EXT4_BLOCKS_PER_GROUP(sb)));
4060617ba13bSMingming Cao 	db_count = (sbi->s_groups_count + EXT4_DESC_PER_BLOCK(sb) - 1) /
4061617ba13bSMingming Cao 		   EXT4_DESC_PER_BLOCK(sb);
40623a4b77cdSEryu Guan 	if (ext4_has_feature_meta_bg(sb)) {
40632ba3e6e8STheodore Ts'o 		if (le32_to_cpu(es->s_first_meta_bg) > db_count) {
40643a4b77cdSEryu Guan 			ext4_msg(sb, KERN_WARNING,
40653a4b77cdSEryu Guan 				 "first meta block group too large: %u "
40663a4b77cdSEryu Guan 				 "(group descriptor block count %u)",
40673a4b77cdSEryu Guan 				 le32_to_cpu(es->s_first_meta_bg), db_count);
40683a4b77cdSEryu Guan 			goto failed_mount;
40693a4b77cdSEryu Guan 		}
40703a4b77cdSEryu Guan 	}
4071344476e1SKees Cook 	sbi->s_group_desc = kvmalloc_array(db_count,
4072f18a5f21STheodore Ts'o 					   sizeof(struct buffer_head *),
4073ac27a0ecSDave Kleikamp 					   GFP_KERNEL);
4074ac27a0ecSDave Kleikamp 	if (sbi->s_group_desc == NULL) {
4075b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "not enough memory");
40762cde417dSTheodore Ts'o 		ret = -ENOMEM;
4077ac27a0ecSDave Kleikamp 		goto failed_mount;
4078ac27a0ecSDave Kleikamp 	}
4079bfe0a5f4STheodore Ts'o 	if (((u64)sbi->s_groups_count * sbi->s_inodes_per_group) !=
4080bfe0a5f4STheodore Ts'o 	    le32_to_cpu(es->s_inodes_count)) {
4081bfe0a5f4STheodore Ts'o 		ext4_msg(sb, KERN_ERR, "inodes count not valid: %u vs %llu",
4082bfe0a5f4STheodore Ts'o 			 le32_to_cpu(es->s_inodes_count),
4083bfe0a5f4STheodore Ts'o 			 ((u64)sbi->s_groups_count * sbi->s_inodes_per_group));
4084bfe0a5f4STheodore Ts'o 		ret = -EINVAL;
4085bfe0a5f4STheodore Ts'o 		goto failed_mount;
4086bfe0a5f4STheodore Ts'o 	}
4087ac27a0ecSDave Kleikamp 
4088705895b6SPekka Enberg 	bgl_lock_init(sbi->s_blockgroup_lock);
4089ac27a0ecSDave Kleikamp 
409085c8f176SAndrew Perepechko 	/* Pre-read the descriptors into the buffer cache */
409185c8f176SAndrew Perepechko 	for (i = 0; i < db_count; i++) {
409285c8f176SAndrew Perepechko 		block = descriptor_loc(sb, logical_sb_block, i);
409385c8f176SAndrew Perepechko 		sb_breadahead(sb, block);
409485c8f176SAndrew Perepechko 	}
409585c8f176SAndrew Perepechko 
4096ac27a0ecSDave Kleikamp 	for (i = 0; i < db_count; i++) {
409770bbb3e0SAndrew Morton 		block = descriptor_loc(sb, logical_sb_block, i);
4098a8ac900bSGioh Kim 		sbi->s_group_desc[i] = sb_bread_unmovable(sb, block);
4099ac27a0ecSDave Kleikamp 		if (!sbi->s_group_desc[i]) {
4100b31e1552SEric Sandeen 			ext4_msg(sb, KERN_ERR,
4101b31e1552SEric Sandeen 			       "can't read group descriptor %d", i);
4102ac27a0ecSDave Kleikamp 			db_count = i;
4103ac27a0ecSDave Kleikamp 			goto failed_mount2;
4104ac27a0ecSDave Kleikamp 		}
4105ac27a0ecSDave Kleikamp 	}
410644de022cSTheodore Ts'o 	sbi->s_gdb_count = db_count;
4107829fa70dSTheodore Ts'o 	if (!ext4_check_descriptors(sb, logical_sb_block, &first_not_zeroed)) {
4108b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "group descriptors corrupted!");
41096a797d27SDarrick J. Wong 		ret = -EFSCORRUPTED;
4110f9ae9cf5STheodore Ts'o 		goto failed_mount2;
4111ac27a0ecSDave Kleikamp 	}
4112772cb7c8SJose R. Santos 
4113235699a8SKees Cook 	timer_setup(&sbi->s_err_report, print_daily_error_info, 0);
411404496411STao Ma 
4115a75ae78fSDmitry Monakhov 	/* Register extent status tree shrinker */
4116eb68d0e2SZheng Liu 	if (ext4_es_register_shrinker(sbi))
4117ce7e010aSTheodore Ts'o 		goto failed_mount3;
4118ce7e010aSTheodore Ts'o 
4119c9de560dSAlex Tomas 	sbi->s_stripe = ext4_get_stripe_size(sbi);
412067a5da56SZheng Liu 	sbi->s_extent_max_zeroout_kb = 32;
4121c9de560dSAlex Tomas 
4122f9ae9cf5STheodore Ts'o 	/*
4123f9ae9cf5STheodore Ts'o 	 * set up enough so that it can read an inode
4124f9ae9cf5STheodore Ts'o 	 */
4125f9ae9cf5STheodore Ts'o 	sb->s_op = &ext4_sops;
4126617ba13bSMingming Cao 	sb->s_export_op = &ext4_export_ops;
4127617ba13bSMingming Cao 	sb->s_xattr = ext4_xattr_handlers;
4128ffcc4182SEric Biggers #ifdef CONFIG_EXT4_FS_ENCRYPTION
4129a7550b30SJaegeuk Kim 	sb->s_cop = &ext4_cryptops;
4130ffcc4182SEric Biggers #endif
4131ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
4132617ba13bSMingming Cao 	sb->dq_op = &ext4_quota_operations;
4133e2b911c5SDarrick J. Wong 	if (ext4_has_feature_quota(sb))
41341fa5efe3SJan Kara 		sb->s_qcop = &dquot_quotactl_sysfile_ops;
4135262b4662SJan Kara 	else
4136262b4662SJan Kara 		sb->s_qcop = &ext4_qctl_operations;
4137689c958cSLi Xi 	sb->s_quota_types = QTYPE_MASK_USR | QTYPE_MASK_GRP | QTYPE_MASK_PRJ;
4138ac27a0ecSDave Kleikamp #endif
413985787090SChristoph Hellwig 	memcpy(&sb->s_uuid, es->s_uuid, sizeof(es->s_uuid));
4140f2fa2ffcSAneesh Kumar K.V 
4141ac27a0ecSDave Kleikamp 	INIT_LIST_HEAD(&sbi->s_orphan); /* unlinked but open files */
41423b9d4ed2STheodore Ts'o 	mutex_init(&sbi->s_orphan_lock);
4143ac27a0ecSDave Kleikamp 
4144ac27a0ecSDave Kleikamp 	sb->s_root = NULL;
4145ac27a0ecSDave Kleikamp 
4146ac27a0ecSDave Kleikamp 	needs_recovery = (es->s_last_orphan != 0 ||
4147e2b911c5SDarrick J. Wong 			  ext4_has_feature_journal_needs_recovery(sb));
4148ac27a0ecSDave Kleikamp 
4149bc98a42cSDavid Howells 	if (ext4_has_feature_mmp(sb) && !sb_rdonly(sb))
4150c5e06d10SJohann Lombardi 		if (ext4_multi_mount_protect(sb, le64_to_cpu(es->s_mmp_block)))
415150460fe8SDarrick J. Wong 			goto failed_mount3a;
4152c5e06d10SJohann Lombardi 
4153ac27a0ecSDave Kleikamp 	/*
4154ac27a0ecSDave Kleikamp 	 * The first inode we look at is the journal inode.  Don't try
4155ac27a0ecSDave Kleikamp 	 * root first: it may be modified in the journal!
4156ac27a0ecSDave Kleikamp 	 */
4157e2b911c5SDarrick J. Wong 	if (!test_opt(sb, NOLOAD) && ext4_has_feature_journal(sb)) {
41584753d8a2STheodore Ts'o 		err = ext4_load_journal(sb, es, journal_devnum);
41594753d8a2STheodore Ts'o 		if (err)
416050460fe8SDarrick J. Wong 			goto failed_mount3a;
4161bc98a42cSDavid Howells 	} else if (test_opt(sb, NOLOAD) && !sb_rdonly(sb) &&
4162e2b911c5SDarrick J. Wong 		   ext4_has_feature_journal_needs_recovery(sb)) {
4163b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "required journal recovery "
4164b31e1552SEric Sandeen 		       "suppressed and not mounted read-only");
4165744692dcSJiaying Zhang 		goto failed_mount_wq;
4166ac27a0ecSDave Kleikamp 	} else {
41671e381f60SDmitry Monakhov 		/* Nojournal mode, all journal mount options are illegal */
41681e381f60SDmitry Monakhov 		if (test_opt2(sb, EXPLICIT_JOURNAL_CHECKSUM)) {
41691e381f60SDmitry Monakhov 			ext4_msg(sb, KERN_ERR, "can't mount with "
41701e381f60SDmitry Monakhov 				 "journal_checksum, fs mounted w/o journal");
41711e381f60SDmitry Monakhov 			goto failed_mount_wq;
41721e381f60SDmitry Monakhov 		}
41731e381f60SDmitry Monakhov 		if (test_opt(sb, JOURNAL_ASYNC_COMMIT)) {
41741e381f60SDmitry Monakhov 			ext4_msg(sb, KERN_ERR, "can't mount with "
41751e381f60SDmitry Monakhov 				 "journal_async_commit, fs mounted w/o journal");
41761e381f60SDmitry Monakhov 			goto failed_mount_wq;
41771e381f60SDmitry Monakhov 		}
41781e381f60SDmitry Monakhov 		if (sbi->s_commit_interval != JBD2_DEFAULT_MAX_COMMIT_AGE*HZ) {
41791e381f60SDmitry Monakhov 			ext4_msg(sb, KERN_ERR, "can't mount with "
41801e381f60SDmitry Monakhov 				 "commit=%lu, fs mounted w/o journal",
41811e381f60SDmitry Monakhov 				 sbi->s_commit_interval / HZ);
41821e381f60SDmitry Monakhov 			goto failed_mount_wq;
41831e381f60SDmitry Monakhov 		}
41841e381f60SDmitry Monakhov 		if (EXT4_MOUNT_DATA_FLAGS &
41851e381f60SDmitry Monakhov 		    (sbi->s_mount_opt ^ sbi->s_def_mount_opt)) {
41861e381f60SDmitry Monakhov 			ext4_msg(sb, KERN_ERR, "can't mount with "
41871e381f60SDmitry Monakhov 				 "data=, fs mounted w/o journal");
41881e381f60SDmitry Monakhov 			goto failed_mount_wq;
41891e381f60SDmitry Monakhov 		}
41901e381f60SDmitry Monakhov 		sbi->s_def_mount_opt &= EXT4_MOUNT_JOURNAL_CHECKSUM;
41911e381f60SDmitry Monakhov 		clear_opt(sb, JOURNAL_CHECKSUM);
4192fd8c37ecSTheodore Ts'o 		clear_opt(sb, DATA_FLAGS);
41930390131bSFrank Mayhar 		sbi->s_journal = NULL;
41940390131bSFrank Mayhar 		needs_recovery = 0;
41950390131bSFrank Mayhar 		goto no_journal;
4196ac27a0ecSDave Kleikamp 	}
4197ac27a0ecSDave Kleikamp 
4198e2b911c5SDarrick J. Wong 	if (ext4_has_feature_64bit(sb) &&
4199eb40a09cSJose R. Santos 	    !jbd2_journal_set_features(EXT4_SB(sb)->s_journal, 0, 0,
4200eb40a09cSJose R. Santos 				       JBD2_FEATURE_INCOMPAT_64BIT)) {
4201b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "Failed to set 64-bit journal feature");
4202744692dcSJiaying Zhang 		goto failed_mount_wq;
4203eb40a09cSJose R. Santos 	}
4204eb40a09cSJose R. Santos 
420525ed6e8aSDarrick J. Wong 	if (!set_journal_csum_feature_set(sb)) {
420625ed6e8aSDarrick J. Wong 		ext4_msg(sb, KERN_ERR, "Failed to set journal checksum "
420725ed6e8aSDarrick J. Wong 			 "feature set");
420825ed6e8aSDarrick J. Wong 		goto failed_mount_wq;
4209d4da6c9cSLinus Torvalds 	}
4210818d276cSGirish Shilamkar 
4211ac27a0ecSDave Kleikamp 	/* We have now updated the journal if required, so we can
4212ac27a0ecSDave Kleikamp 	 * validate the data journaling mode. */
4213ac27a0ecSDave Kleikamp 	switch (test_opt(sb, DATA_FLAGS)) {
4214ac27a0ecSDave Kleikamp 	case 0:
4215ac27a0ecSDave Kleikamp 		/* No mode set, assume a default based on the journal
421663f57933SAndrew Morton 		 * capabilities: ORDERED_DATA if the journal can
421763f57933SAndrew Morton 		 * cope, else JOURNAL_DATA
421863f57933SAndrew Morton 		 */
4219dab291afSMingming Cao 		if (jbd2_journal_check_available_features
422027f394a7STyson Nottingham 		    (sbi->s_journal, 0, 0, JBD2_FEATURE_INCOMPAT_REVOKE)) {
4221fd8c37ecSTheodore Ts'o 			set_opt(sb, ORDERED_DATA);
422227f394a7STyson Nottingham 			sbi->s_def_mount_opt |= EXT4_MOUNT_ORDERED_DATA;
422327f394a7STyson Nottingham 		} else {
4224fd8c37ecSTheodore Ts'o 			set_opt(sb, JOURNAL_DATA);
422527f394a7STyson Nottingham 			sbi->s_def_mount_opt |= EXT4_MOUNT_JOURNAL_DATA;
422627f394a7STyson Nottingham 		}
4227ac27a0ecSDave Kleikamp 		break;
4228ac27a0ecSDave Kleikamp 
4229617ba13bSMingming Cao 	case EXT4_MOUNT_ORDERED_DATA:
4230617ba13bSMingming Cao 	case EXT4_MOUNT_WRITEBACK_DATA:
4231dab291afSMingming Cao 		if (!jbd2_journal_check_available_features
4232dab291afSMingming Cao 		    (sbi->s_journal, 0, 0, JBD2_FEATURE_INCOMPAT_REVOKE)) {
4233b31e1552SEric Sandeen 			ext4_msg(sb, KERN_ERR, "Journal does not support "
4234b31e1552SEric Sandeen 			       "requested data journaling mode");
4235744692dcSJiaying Zhang 			goto failed_mount_wq;
4236ac27a0ecSDave Kleikamp 		}
4237ac27a0ecSDave Kleikamp 	default:
4238ac27a0ecSDave Kleikamp 		break;
4239ac27a0ecSDave Kleikamp 	}
4240ab04df78SJan Kara 
4241ab04df78SJan Kara 	if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_ORDERED_DATA &&
4242ab04df78SJan Kara 	    test_opt(sb, JOURNAL_ASYNC_COMMIT)) {
4243ab04df78SJan Kara 		ext4_msg(sb, KERN_ERR, "can't mount with "
4244ab04df78SJan Kara 			"journal_async_commit in data=ordered mode");
4245ab04df78SJan Kara 		goto failed_mount_wq;
4246ab04df78SJan Kara 	}
4247ab04df78SJan Kara 
4248b3881f74STheodore Ts'o 	set_task_ioprio(sbi->s_journal->j_task, journal_ioprio);
4249ac27a0ecSDave Kleikamp 
425018aadd47SBobi Jam 	sbi->s_journal->j_commit_callback = ext4_journal_commit_callback;
425118aadd47SBobi Jam 
4252ce7e010aSTheodore Ts'o no_journal:
4253cdb7ee4cSTahsin Erdogan 	if (!test_opt(sb, NO_MBCACHE)) {
425447387409STahsin Erdogan 		sbi->s_ea_block_cache = ext4_xattr_create_cache();
425547387409STahsin Erdogan 		if (!sbi->s_ea_block_cache) {
4256cdb7ee4cSTahsin Erdogan 			ext4_msg(sb, KERN_ERR,
4257cdb7ee4cSTahsin Erdogan 				 "Failed to create ea_block_cache");
42589c191f70ST Makphaibulchoke 			goto failed_mount_wq;
42599c191f70ST Makphaibulchoke 		}
42609c191f70ST Makphaibulchoke 
4261dec214d0STahsin Erdogan 		if (ext4_has_feature_ea_inode(sb)) {
4262dec214d0STahsin Erdogan 			sbi->s_ea_inode_cache = ext4_xattr_create_cache();
4263dec214d0STahsin Erdogan 			if (!sbi->s_ea_inode_cache) {
4264dec214d0STahsin Erdogan 				ext4_msg(sb, KERN_ERR,
4265dec214d0STahsin Erdogan 					 "Failed to create ea_inode_cache");
4266dec214d0STahsin Erdogan 				goto failed_mount_wq;
4267dec214d0STahsin Erdogan 			}
4268dec214d0STahsin Erdogan 		}
4269cdb7ee4cSTahsin Erdogan 	}
4270dec214d0STahsin Erdogan 
4271e2b911c5SDarrick J. Wong 	if ((DUMMY_ENCRYPTION_ENABLED(sbi) || ext4_has_feature_encrypt(sb)) &&
427209cbfeafSKirill A. Shutemov 	    (blocksize != PAGE_SIZE)) {
42731cb767cdSTheodore Ts'o 		ext4_msg(sb, KERN_ERR,
42741cb767cdSTheodore Ts'o 			 "Unsupported blocksize for fs encryption");
42751cb767cdSTheodore Ts'o 		goto failed_mount_wq;
42761cb767cdSTheodore Ts'o 	}
42771cb767cdSTheodore Ts'o 
4278bc98a42cSDavid Howells 	if (DUMMY_ENCRYPTION_ENABLED(sbi) && !sb_rdonly(sb) &&
4279e2b911c5SDarrick J. Wong 	    !ext4_has_feature_encrypt(sb)) {
4280e2b911c5SDarrick J. Wong 		ext4_set_feature_encrypt(sb);
42816ddb2447STheodore Ts'o 		ext4_commit_super(sb, 1);
42826ddb2447STheodore Ts'o 	}
42836ddb2447STheodore Ts'o 
4284fd89d5f2STejun Heo 	/*
4285952fc18eSTheodore Ts'o 	 * Get the # of file system overhead blocks from the
4286952fc18eSTheodore Ts'o 	 * superblock if present.
4287952fc18eSTheodore Ts'o 	 */
4288952fc18eSTheodore Ts'o 	if (es->s_overhead_clusters)
4289952fc18eSTheodore Ts'o 		sbi->s_overhead = le32_to_cpu(es->s_overhead_clusters);
4290952fc18eSTheodore Ts'o 	else {
429107aa2ea1SLukas Czerner 		err = ext4_calculate_overhead(sb);
429207aa2ea1SLukas Czerner 		if (err)
4293952fc18eSTheodore Ts'o 			goto failed_mount_wq;
4294952fc18eSTheodore Ts'o 	}
4295952fc18eSTheodore Ts'o 
4296952fc18eSTheodore Ts'o 	/*
4297fd89d5f2STejun Heo 	 * The maximum number of concurrent works can be high and
4298fd89d5f2STejun Heo 	 * concurrency isn't really necessary.  Limit it to 1.
4299fd89d5f2STejun Heo 	 */
43002e8fa54eSJan Kara 	EXT4_SB(sb)->rsv_conversion_wq =
43012e8fa54eSJan Kara 		alloc_workqueue("ext4-rsv-conversion", WQ_MEM_RECLAIM | WQ_UNBOUND, 1);
43022e8fa54eSJan Kara 	if (!EXT4_SB(sb)->rsv_conversion_wq) {
43032e8fa54eSJan Kara 		printk(KERN_ERR "EXT4-fs: failed to create workqueue\n");
430407aa2ea1SLukas Czerner 		ret = -ENOMEM;
43052e8fa54eSJan Kara 		goto failed_mount4;
43062e8fa54eSJan Kara 	}
43072e8fa54eSJan Kara 
4308ac27a0ecSDave Kleikamp 	/*
4309dab291afSMingming Cao 	 * The jbd2_journal_load will have done any necessary log recovery,
4310ac27a0ecSDave Kleikamp 	 * so we can safely mount the rest of the filesystem now.
4311ac27a0ecSDave Kleikamp 	 */
4312ac27a0ecSDave Kleikamp 
43131d1fe1eeSDavid Howells 	root = ext4_iget(sb, EXT4_ROOT_INO);
43141d1fe1eeSDavid Howells 	if (IS_ERR(root)) {
4315b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "get root inode failed");
43161d1fe1eeSDavid Howells 		ret = PTR_ERR(root);
431732a9bb57SManish Katiyar 		root = NULL;
4318ac27a0ecSDave Kleikamp 		goto failed_mount4;
4319ac27a0ecSDave Kleikamp 	}
4320ac27a0ecSDave Kleikamp 	if (!S_ISDIR(root->i_mode) || !root->i_blocks || !root->i_size) {
4321b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "corrupt root inode, run e2fsck");
432294bf608aSAl Viro 		iput(root);
4323ac27a0ecSDave Kleikamp 		goto failed_mount4;
4324ac27a0ecSDave Kleikamp 	}
432548fde701SAl Viro 	sb->s_root = d_make_root(root);
43261d1fe1eeSDavid Howells 	if (!sb->s_root) {
4327b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "get root dentry failed");
43281d1fe1eeSDavid Howells 		ret = -ENOMEM;
43291d1fe1eeSDavid Howells 		goto failed_mount4;
43301d1fe1eeSDavid Howells 	}
4331ac27a0ecSDave Kleikamp 
4332c89128a0SJaegeuk Kim 	ret = ext4_setup_super(sb, es, sb_rdonly(sb));
4333c89128a0SJaegeuk Kim 	if (ret == -EROFS) {
43341751e8a6SLinus Torvalds 		sb->s_flags |= SB_RDONLY;
4335c89128a0SJaegeuk Kim 		ret = 0;
4336c89128a0SJaegeuk Kim 	} else if (ret)
4337c89128a0SJaegeuk Kim 		goto failed_mount4a;
4338ef7f3835SKalpak Shah 
4339ef7f3835SKalpak Shah 	/* determine the minimum size of new large inodes, if present */
4340670e9875STheodore Ts'o 	if (sbi->s_inode_size > EXT4_GOOD_OLD_INODE_SIZE &&
4341670e9875STheodore Ts'o 	    sbi->s_want_extra_isize == 0) {
4342ef7f3835SKalpak Shah 		sbi->s_want_extra_isize = sizeof(struct ext4_inode) -
4343ef7f3835SKalpak Shah 						     EXT4_GOOD_OLD_INODE_SIZE;
4344e2b911c5SDarrick J. Wong 		if (ext4_has_feature_extra_isize(sb)) {
4345ef7f3835SKalpak Shah 			if (sbi->s_want_extra_isize <
4346ef7f3835SKalpak Shah 			    le16_to_cpu(es->s_want_extra_isize))
4347ef7f3835SKalpak Shah 				sbi->s_want_extra_isize =
4348ef7f3835SKalpak Shah 					le16_to_cpu(es->s_want_extra_isize);
4349ef7f3835SKalpak Shah 			if (sbi->s_want_extra_isize <
4350ef7f3835SKalpak Shah 			    le16_to_cpu(es->s_min_extra_isize))
4351ef7f3835SKalpak Shah 				sbi->s_want_extra_isize =
4352ef7f3835SKalpak Shah 					le16_to_cpu(es->s_min_extra_isize);
4353ef7f3835SKalpak Shah 		}
4354ef7f3835SKalpak Shah 	}
4355ef7f3835SKalpak Shah 	/* Check if enough inode space is available */
4356ef7f3835SKalpak Shah 	if (EXT4_GOOD_OLD_INODE_SIZE + sbi->s_want_extra_isize >
4357ef7f3835SKalpak Shah 							sbi->s_inode_size) {
4358ef7f3835SKalpak Shah 		sbi->s_want_extra_isize = sizeof(struct ext4_inode) -
4359ef7f3835SKalpak Shah 						       EXT4_GOOD_OLD_INODE_SIZE;
4360b31e1552SEric Sandeen 		ext4_msg(sb, KERN_INFO, "required extra inode space not"
4361b31e1552SEric Sandeen 			 "available");
4362ef7f3835SKalpak Shah 	}
4363ef7f3835SKalpak Shah 
4364b5799018STheodore Ts'o 	ext4_set_resv_clusters(sb);
436527dd4385SLukas Czerner 
43666fd058f7STheodore Ts'o 	err = ext4_setup_system_zone(sb);
43676fd058f7STheodore Ts'o 	if (err) {
4368b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "failed to initialize system "
4369fbe845ddSCurt Wohlgemuth 			 "zone (%d)", err);
4370f9ae9cf5STheodore Ts'o 		goto failed_mount4a;
4371f9ae9cf5STheodore Ts'o 	}
4372f9ae9cf5STheodore Ts'o 
4373f9ae9cf5STheodore Ts'o 	ext4_ext_init(sb);
4374f9ae9cf5STheodore Ts'o 	err = ext4_mb_init(sb);
4375f9ae9cf5STheodore Ts'o 	if (err) {
4376f9ae9cf5STheodore Ts'o 		ext4_msg(sb, KERN_ERR, "failed to initialize mballoc (%d)",
4377f9ae9cf5STheodore Ts'o 			 err);
4378dcf2d804STao Ma 		goto failed_mount5;
4379c2774d84SAneesh Kumar K.V 	}
4380c2774d84SAneesh Kumar K.V 
4381d5e03cbbSTheodore Ts'o 	block = ext4_count_free_clusters(sb);
4382d5e03cbbSTheodore Ts'o 	ext4_free_blocks_count_set(sbi->s_es,
4383d5e03cbbSTheodore Ts'o 				   EXT4_C2B(sbi, block));
43844274f516STheodore Ts'o 	ext4_superblock_csum_set(sb);
4385908c7f19STejun Heo 	err = percpu_counter_init(&sbi->s_freeclusters_counter, block,
4386908c7f19STejun Heo 				  GFP_KERNEL);
4387d5e03cbbSTheodore Ts'o 	if (!err) {
4388d5e03cbbSTheodore Ts'o 		unsigned long freei = ext4_count_free_inodes(sb);
4389d5e03cbbSTheodore Ts'o 		sbi->s_es->s_free_inodes_count = cpu_to_le32(freei);
43904274f516STheodore Ts'o 		ext4_superblock_csum_set(sb);
4391908c7f19STejun Heo 		err = percpu_counter_init(&sbi->s_freeinodes_counter, freei,
4392908c7f19STejun Heo 					  GFP_KERNEL);
4393d5e03cbbSTheodore Ts'o 	}
4394d5e03cbbSTheodore Ts'o 	if (!err)
4395d5e03cbbSTheodore Ts'o 		err = percpu_counter_init(&sbi->s_dirs_counter,
4396908c7f19STejun Heo 					  ext4_count_dirs(sb), GFP_KERNEL);
4397d5e03cbbSTheodore Ts'o 	if (!err)
4398908c7f19STejun Heo 		err = percpu_counter_init(&sbi->s_dirtyclusters_counter, 0,
4399908c7f19STejun Heo 					  GFP_KERNEL);
4400c8585c6fSDaeho Jeong 	if (!err)
4401c8585c6fSDaeho Jeong 		err = percpu_init_rwsem(&sbi->s_journal_flag_rwsem);
4402c8585c6fSDaeho Jeong 
4403d5e03cbbSTheodore Ts'o 	if (err) {
4404d5e03cbbSTheodore Ts'o 		ext4_msg(sb, KERN_ERR, "insufficient memory");
4405d5e03cbbSTheodore Ts'o 		goto failed_mount6;
4406d5e03cbbSTheodore Ts'o 	}
4407d5e03cbbSTheodore Ts'o 
4408e2b911c5SDarrick J. Wong 	if (ext4_has_feature_flex_bg(sb))
4409d5e03cbbSTheodore Ts'o 		if (!ext4_fill_flex_info(sb)) {
4410d5e03cbbSTheodore Ts'o 			ext4_msg(sb, KERN_ERR,
4411d5e03cbbSTheodore Ts'o 			       "unable to initialize "
4412d5e03cbbSTheodore Ts'o 			       "flex_bg meta info!");
4413d5e03cbbSTheodore Ts'o 			goto failed_mount6;
4414d5e03cbbSTheodore Ts'o 		}
4415d5e03cbbSTheodore Ts'o 
4416bfff6873SLukas Czerner 	err = ext4_register_li_request(sb, first_not_zeroed);
4417bfff6873SLukas Czerner 	if (err)
4418dcf2d804STao Ma 		goto failed_mount6;
4419bfff6873SLukas Czerner 
4420b5799018STheodore Ts'o 	err = ext4_register_sysfs(sb);
4421dcf2d804STao Ma 	if (err)
4422dcf2d804STao Ma 		goto failed_mount7;
44233197ebdbSTheodore Ts'o 
44249b2ff357SJan Kara #ifdef CONFIG_QUOTA
44259b2ff357SJan Kara 	/* Enable quota usage during mount. */
4426bc98a42cSDavid Howells 	if (ext4_has_feature_quota(sb) && !sb_rdonly(sb)) {
44279b2ff357SJan Kara 		err = ext4_enable_quotas(sb);
44289b2ff357SJan Kara 		if (err)
44299b2ff357SJan Kara 			goto failed_mount8;
44309b2ff357SJan Kara 	}
44319b2ff357SJan Kara #endif  /* CONFIG_QUOTA */
44329b2ff357SJan Kara 
4433617ba13bSMingming Cao 	EXT4_SB(sb)->s_mount_state |= EXT4_ORPHAN_FS;
4434617ba13bSMingming Cao 	ext4_orphan_cleanup(sb, es);
4435617ba13bSMingming Cao 	EXT4_SB(sb)->s_mount_state &= ~EXT4_ORPHAN_FS;
44360390131bSFrank Mayhar 	if (needs_recovery) {
4437b31e1552SEric Sandeen 		ext4_msg(sb, KERN_INFO, "recovery complete");
4438617ba13bSMingming Cao 		ext4_mark_recovery_complete(sb, es);
44390390131bSFrank Mayhar 	}
44400390131bSFrank Mayhar 	if (EXT4_SB(sb)->s_journal) {
44410390131bSFrank Mayhar 		if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_JOURNAL_DATA)
44420390131bSFrank Mayhar 			descr = " journalled data mode";
44430390131bSFrank Mayhar 		else if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_ORDERED_DATA)
44440390131bSFrank Mayhar 			descr = " ordered data mode";
44450390131bSFrank Mayhar 		else
44460390131bSFrank Mayhar 			descr = " writeback data mode";
44470390131bSFrank Mayhar 	} else
44480390131bSFrank Mayhar 		descr = "out journal";
44490390131bSFrank Mayhar 
445079add3a3SLukas Czerner 	if (test_opt(sb, DISCARD)) {
445179add3a3SLukas Czerner 		struct request_queue *q = bdev_get_queue(sb->s_bdev);
445279add3a3SLukas Czerner 		if (!blk_queue_discard(q))
445379add3a3SLukas Czerner 			ext4_msg(sb, KERN_WARNING,
445479add3a3SLukas Czerner 				 "mounting with \"discard\" option, but "
445579add3a3SLukas Czerner 				 "the device does not support discard");
445679add3a3SLukas Czerner 	}
445779add3a3SLukas Czerner 
4458e294a537STheodore Ts'o 	if (___ratelimit(&ext4_mount_msg_ratelimit, "EXT4-fs mount"))
4459d4c402d9SCurt Wohlgemuth 		ext4_msg(sb, KERN_INFO, "mounted filesystem with%s. "
44605aee0f8aSTheodore Ts'o 			 "Opts: %.*s%s%s", descr,
44615aee0f8aSTheodore Ts'o 			 (int) sizeof(sbi->s_es->s_mount_opts),
44625aee0f8aSTheodore Ts'o 			 sbi->s_es->s_mount_opts,
44638b67f04aSTheodore Ts'o 			 *sbi->s_es->s_mount_opts ? "; " : "", orig_data);
4464ac27a0ecSDave Kleikamp 
446566e61a9eSTheodore Ts'o 	if (es->s_error_count)
446666e61a9eSTheodore Ts'o 		mod_timer(&sbi->s_err_report, jiffies + 300*HZ); /* 5 minutes */
4467ac27a0ecSDave Kleikamp 
4468efbed4dcSTheodore Ts'o 	/* Enable message ratelimiting. Default is 10 messages per 5 secs. */
4469efbed4dcSTheodore Ts'o 	ratelimit_state_init(&sbi->s_err_ratelimit_state, 5 * HZ, 10);
4470efbed4dcSTheodore Ts'o 	ratelimit_state_init(&sbi->s_warning_ratelimit_state, 5 * HZ, 10);
4471efbed4dcSTheodore Ts'o 	ratelimit_state_init(&sbi->s_msg_ratelimit_state, 5 * HZ, 10);
4472efbed4dcSTheodore Ts'o 
4473d4c402d9SCurt Wohlgemuth 	kfree(orig_data);
4474ac27a0ecSDave Kleikamp 	return 0;
4475ac27a0ecSDave Kleikamp 
4476617ba13bSMingming Cao cantfind_ext4:
4477ac27a0ecSDave Kleikamp 	if (!silent)
4478b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "VFS: Can't find ext4 filesystem");
4479ac27a0ecSDave Kleikamp 	goto failed_mount;
4480ac27a0ecSDave Kleikamp 
448172ba7450STheodore Ts'o #ifdef CONFIG_QUOTA
448272ba7450STheodore Ts'o failed_mount8:
4483ebd173beSTheodore Ts'o 	ext4_unregister_sysfs(sb);
448472ba7450STheodore Ts'o #endif
4485dcf2d804STao Ma failed_mount7:
4486dcf2d804STao Ma 	ext4_unregister_li_request(sb);
4487dcf2d804STao Ma failed_mount6:
4488f9ae9cf5STheodore Ts'o 	ext4_mb_release(sb);
4489d5e03cbbSTheodore Ts'o 	if (sbi->s_flex_groups)
4490b93b41d4SAl Viro 		kvfree(sbi->s_flex_groups);
4491d5e03cbbSTheodore Ts'o 	percpu_counter_destroy(&sbi->s_freeclusters_counter);
4492d5e03cbbSTheodore Ts'o 	percpu_counter_destroy(&sbi->s_freeinodes_counter);
4493d5e03cbbSTheodore Ts'o 	percpu_counter_destroy(&sbi->s_dirs_counter);
4494d5e03cbbSTheodore Ts'o 	percpu_counter_destroy(&sbi->s_dirtyclusters_counter);
449500764937SAzat Khuzhin failed_mount5:
4496f9ae9cf5STheodore Ts'o 	ext4_ext_release(sb);
4497f9ae9cf5STheodore Ts'o 	ext4_release_system_zone(sb);
4498f9ae9cf5STheodore Ts'o failed_mount4a:
449994bf608aSAl Viro 	dput(sb->s_root);
450032a9bb57SManish Katiyar 	sb->s_root = NULL;
450194bf608aSAl Viro failed_mount4:
4502b31e1552SEric Sandeen 	ext4_msg(sb, KERN_ERR, "mount failed");
45032e8fa54eSJan Kara 	if (EXT4_SB(sb)->rsv_conversion_wq)
45042e8fa54eSJan Kara 		destroy_workqueue(EXT4_SB(sb)->rsv_conversion_wq);
45054c0425ffSMingming Cao failed_mount_wq:
4506dec214d0STahsin Erdogan 	if (sbi->s_ea_inode_cache) {
4507dec214d0STahsin Erdogan 		ext4_xattr_destroy_cache(sbi->s_ea_inode_cache);
4508dec214d0STahsin Erdogan 		sbi->s_ea_inode_cache = NULL;
4509dec214d0STahsin Erdogan 	}
451047387409STahsin Erdogan 	if (sbi->s_ea_block_cache) {
451147387409STahsin Erdogan 		ext4_xattr_destroy_cache(sbi->s_ea_block_cache);
451247387409STahsin Erdogan 		sbi->s_ea_block_cache = NULL;
451382939d79SJan Kara 	}
45140390131bSFrank Mayhar 	if (sbi->s_journal) {
4515dab291afSMingming Cao 		jbd2_journal_destroy(sbi->s_journal);
451647b4a50bSJan Kara 		sbi->s_journal = NULL;
45170390131bSFrank Mayhar 	}
451850460fe8SDarrick J. Wong failed_mount3a:
4519d3922a77SZheng Liu 	ext4_es_unregister_shrinker(sbi);
4520eb68d0e2SZheng Liu failed_mount3:
45219105bb14SAl Viro 	del_timer_sync(&sbi->s_err_report);
4522c5e06d10SJohann Lombardi 	if (sbi->s_mmp_tsk)
4523c5e06d10SJohann Lombardi 		kthread_stop(sbi->s_mmp_tsk);
4524ac27a0ecSDave Kleikamp failed_mount2:
4525ac27a0ecSDave Kleikamp 	for (i = 0; i < db_count; i++)
4526ac27a0ecSDave Kleikamp 		brelse(sbi->s_group_desc[i]);
4527b93b41d4SAl Viro 	kvfree(sbi->s_group_desc);
4528ac27a0ecSDave Kleikamp failed_mount:
45290441984aSDarrick J. Wong 	if (sbi->s_chksum_driver)
45300441984aSDarrick J. Wong 		crypto_free_shash(sbi->s_chksum_driver);
4531ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
4532a2d4a646SJan Kara 	for (i = 0; i < EXT4_MAXQUOTAS; i++)
4533ac27a0ecSDave Kleikamp 		kfree(sbi->s_qf_names[i]);
4534ac27a0ecSDave Kleikamp #endif
4535617ba13bSMingming Cao 	ext4_blkdev_remove(sbi);
4536ac27a0ecSDave Kleikamp 	brelse(bh);
4537ac27a0ecSDave Kleikamp out_fail:
4538ac27a0ecSDave Kleikamp 	sb->s_fs_info = NULL;
4539f6830165SManish Katiyar 	kfree(sbi->s_blockgroup_lock);
45405aee0f8aSTheodore Ts'o out_free_base:
4541ac27a0ecSDave Kleikamp 	kfree(sbi);
4542d4c402d9SCurt Wohlgemuth 	kfree(orig_data);
45435e405595SDan Williams 	fs_put_dax(dax_dev);
454407aa2ea1SLukas Czerner 	return err ? err : ret;
4545ac27a0ecSDave Kleikamp }
4546ac27a0ecSDave Kleikamp 
4547ac27a0ecSDave Kleikamp /*
4548ac27a0ecSDave Kleikamp  * Setup any per-fs journal parameters now.  We'll do this both on
4549ac27a0ecSDave Kleikamp  * initial mount, once the journal has been initialised but before we've
4550ac27a0ecSDave Kleikamp  * done any recovery; and again on any subsequent remount.
4551ac27a0ecSDave Kleikamp  */
4552617ba13bSMingming Cao static void ext4_init_journal_params(struct super_block *sb, journal_t *journal)
4553ac27a0ecSDave Kleikamp {
4554617ba13bSMingming Cao 	struct ext4_sb_info *sbi = EXT4_SB(sb);
4555ac27a0ecSDave Kleikamp 
4556ac27a0ecSDave Kleikamp 	journal->j_commit_interval = sbi->s_commit_interval;
455730773840STheodore Ts'o 	journal->j_min_batch_time = sbi->s_min_batch_time;
455830773840STheodore Ts'o 	journal->j_max_batch_time = sbi->s_max_batch_time;
4559ac27a0ecSDave Kleikamp 
4560a931da6aSTheodore Ts'o 	write_lock(&journal->j_state_lock);
4561ac27a0ecSDave Kleikamp 	if (test_opt(sb, BARRIER))
4562dab291afSMingming Cao 		journal->j_flags |= JBD2_BARRIER;
4563ac27a0ecSDave Kleikamp 	else
4564dab291afSMingming Cao 		journal->j_flags &= ~JBD2_BARRIER;
45655bf5683aSHidehiro Kawai 	if (test_opt(sb, DATA_ERR_ABORT))
45665bf5683aSHidehiro Kawai 		journal->j_flags |= JBD2_ABORT_ON_SYNCDATA_ERR;
45675bf5683aSHidehiro Kawai 	else
45685bf5683aSHidehiro Kawai 		journal->j_flags &= ~JBD2_ABORT_ON_SYNCDATA_ERR;
4569a931da6aSTheodore Ts'o 	write_unlock(&journal->j_state_lock);
4570ac27a0ecSDave Kleikamp }
4571ac27a0ecSDave Kleikamp 
4572c6cb7e77SEric Whitney static struct inode *ext4_get_journal_inode(struct super_block *sb,
4573ac27a0ecSDave Kleikamp 					     unsigned int journal_inum)
4574ac27a0ecSDave Kleikamp {
4575ac27a0ecSDave Kleikamp 	struct inode *journal_inode;
4576ac27a0ecSDave Kleikamp 
4577c6cb7e77SEric Whitney 	/*
4578c6cb7e77SEric Whitney 	 * Test for the existence of a valid inode on disk.  Bad things
4579c6cb7e77SEric Whitney 	 * happen if we iget() an unused inode, as the subsequent iput()
4580c6cb7e77SEric Whitney 	 * will try to delete it.
4581c6cb7e77SEric Whitney 	 */
45821d1fe1eeSDavid Howells 	journal_inode = ext4_iget(sb, journal_inum);
45831d1fe1eeSDavid Howells 	if (IS_ERR(journal_inode)) {
4584b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "no journal found");
4585ac27a0ecSDave Kleikamp 		return NULL;
4586ac27a0ecSDave Kleikamp 	}
4587ac27a0ecSDave Kleikamp 	if (!journal_inode->i_nlink) {
4588ac27a0ecSDave Kleikamp 		make_bad_inode(journal_inode);
4589ac27a0ecSDave Kleikamp 		iput(journal_inode);
4590b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "journal inode is deleted");
4591ac27a0ecSDave Kleikamp 		return NULL;
4592ac27a0ecSDave Kleikamp 	}
4593ac27a0ecSDave Kleikamp 
4594e5f8eab8STheodore Ts'o 	jbd_debug(2, "Journal inode found at %p: %lld bytes\n",
4595ac27a0ecSDave Kleikamp 		  journal_inode, journal_inode->i_size);
45961d1fe1eeSDavid Howells 	if (!S_ISREG(journal_inode->i_mode)) {
4597b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "invalid journal inode");
4598ac27a0ecSDave Kleikamp 		iput(journal_inode);
4599ac27a0ecSDave Kleikamp 		return NULL;
4600ac27a0ecSDave Kleikamp 	}
4601c6cb7e77SEric Whitney 	return journal_inode;
4602c6cb7e77SEric Whitney }
4603c6cb7e77SEric Whitney 
4604c6cb7e77SEric Whitney static journal_t *ext4_get_journal(struct super_block *sb,
4605c6cb7e77SEric Whitney 				   unsigned int journal_inum)
4606c6cb7e77SEric Whitney {
4607c6cb7e77SEric Whitney 	struct inode *journal_inode;
4608c6cb7e77SEric Whitney 	journal_t *journal;
4609c6cb7e77SEric Whitney 
4610c6cb7e77SEric Whitney 	BUG_ON(!ext4_has_feature_journal(sb));
4611c6cb7e77SEric Whitney 
4612c6cb7e77SEric Whitney 	journal_inode = ext4_get_journal_inode(sb, journal_inum);
4613c6cb7e77SEric Whitney 	if (!journal_inode)
4614c6cb7e77SEric Whitney 		return NULL;
4615ac27a0ecSDave Kleikamp 
4616dab291afSMingming Cao 	journal = jbd2_journal_init_inode(journal_inode);
4617ac27a0ecSDave Kleikamp 	if (!journal) {
4618b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "Could not load journal inode");
4619ac27a0ecSDave Kleikamp 		iput(journal_inode);
4620ac27a0ecSDave Kleikamp 		return NULL;
4621ac27a0ecSDave Kleikamp 	}
4622ac27a0ecSDave Kleikamp 	journal->j_private = sb;
4623617ba13bSMingming Cao 	ext4_init_journal_params(sb, journal);
4624ac27a0ecSDave Kleikamp 	return journal;
4625ac27a0ecSDave Kleikamp }
4626ac27a0ecSDave Kleikamp 
4627617ba13bSMingming Cao static journal_t *ext4_get_dev_journal(struct super_block *sb,
4628ac27a0ecSDave Kleikamp 				       dev_t j_dev)
4629ac27a0ecSDave Kleikamp {
4630ac27a0ecSDave Kleikamp 	struct buffer_head *bh;
4631ac27a0ecSDave Kleikamp 	journal_t *journal;
4632617ba13bSMingming Cao 	ext4_fsblk_t start;
4633617ba13bSMingming Cao 	ext4_fsblk_t len;
4634ac27a0ecSDave Kleikamp 	int hblock, blocksize;
4635617ba13bSMingming Cao 	ext4_fsblk_t sb_block;
4636ac27a0ecSDave Kleikamp 	unsigned long offset;
4637617ba13bSMingming Cao 	struct ext4_super_block *es;
4638ac27a0ecSDave Kleikamp 	struct block_device *bdev;
4639ac27a0ecSDave Kleikamp 
4640e2b911c5SDarrick J. Wong 	BUG_ON(!ext4_has_feature_journal(sb));
46410390131bSFrank Mayhar 
4642b31e1552SEric Sandeen 	bdev = ext4_blkdev_get(j_dev, sb);
4643ac27a0ecSDave Kleikamp 	if (bdev == NULL)
4644ac27a0ecSDave Kleikamp 		return NULL;
4645ac27a0ecSDave Kleikamp 
4646ac27a0ecSDave Kleikamp 	blocksize = sb->s_blocksize;
4647e1defc4fSMartin K. Petersen 	hblock = bdev_logical_block_size(bdev);
4648ac27a0ecSDave Kleikamp 	if (blocksize < hblock) {
4649b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR,
4650b31e1552SEric Sandeen 			"blocksize too small for journal device");
4651ac27a0ecSDave Kleikamp 		goto out_bdev;
4652ac27a0ecSDave Kleikamp 	}
4653ac27a0ecSDave Kleikamp 
4654617ba13bSMingming Cao 	sb_block = EXT4_MIN_BLOCK_SIZE / blocksize;
4655617ba13bSMingming Cao 	offset = EXT4_MIN_BLOCK_SIZE % blocksize;
4656ac27a0ecSDave Kleikamp 	set_blocksize(bdev, blocksize);
4657ac27a0ecSDave Kleikamp 	if (!(bh = __bread(bdev, sb_block, blocksize))) {
4658b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "couldn't read superblock of "
4659b31e1552SEric Sandeen 		       "external journal");
4660ac27a0ecSDave Kleikamp 		goto out_bdev;
4661ac27a0ecSDave Kleikamp 	}
4662ac27a0ecSDave Kleikamp 
46632716b802STheodore Ts'o 	es = (struct ext4_super_block *) (bh->b_data + offset);
4664617ba13bSMingming Cao 	if ((le16_to_cpu(es->s_magic) != EXT4_SUPER_MAGIC) ||
4665ac27a0ecSDave Kleikamp 	    !(le32_to_cpu(es->s_feature_incompat) &
4666617ba13bSMingming Cao 	      EXT4_FEATURE_INCOMPAT_JOURNAL_DEV)) {
4667b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "external journal has "
4668b31e1552SEric Sandeen 					"bad superblock");
4669ac27a0ecSDave Kleikamp 		brelse(bh);
4670ac27a0ecSDave Kleikamp 		goto out_bdev;
4671ac27a0ecSDave Kleikamp 	}
4672ac27a0ecSDave Kleikamp 
4673df4763beSDarrick J. Wong 	if ((le32_to_cpu(es->s_feature_ro_compat) &
4674df4763beSDarrick J. Wong 	     EXT4_FEATURE_RO_COMPAT_METADATA_CSUM) &&
4675df4763beSDarrick J. Wong 	    es->s_checksum != ext4_superblock_csum(sb, es)) {
4676df4763beSDarrick J. Wong 		ext4_msg(sb, KERN_ERR, "external journal has "
4677df4763beSDarrick J. Wong 				       "corrupt superblock");
4678df4763beSDarrick J. Wong 		brelse(bh);
4679df4763beSDarrick J. Wong 		goto out_bdev;
4680df4763beSDarrick J. Wong 	}
4681df4763beSDarrick J. Wong 
4682617ba13bSMingming Cao 	if (memcmp(EXT4_SB(sb)->s_es->s_journal_uuid, es->s_uuid, 16)) {
4683b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "journal UUID does not match");
4684ac27a0ecSDave Kleikamp 		brelse(bh);
4685ac27a0ecSDave Kleikamp 		goto out_bdev;
4686ac27a0ecSDave Kleikamp 	}
4687ac27a0ecSDave Kleikamp 
4688bd81d8eeSLaurent Vivier 	len = ext4_blocks_count(es);
4689ac27a0ecSDave Kleikamp 	start = sb_block + 1;
4690ac27a0ecSDave Kleikamp 	brelse(bh);	/* we're done with the superblock */
4691ac27a0ecSDave Kleikamp 
4692dab291afSMingming Cao 	journal = jbd2_journal_init_dev(bdev, sb->s_bdev,
4693ac27a0ecSDave Kleikamp 					start, len, blocksize);
4694ac27a0ecSDave Kleikamp 	if (!journal) {
4695b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "failed to create device journal");
4696ac27a0ecSDave Kleikamp 		goto out_bdev;
4697ac27a0ecSDave Kleikamp 	}
4698ac27a0ecSDave Kleikamp 	journal->j_private = sb;
4699dfec8a14SMike Christie 	ll_rw_block(REQ_OP_READ, REQ_META | REQ_PRIO, 1, &journal->j_sb_buffer);
4700ac27a0ecSDave Kleikamp 	wait_on_buffer(journal->j_sb_buffer);
4701ac27a0ecSDave Kleikamp 	if (!buffer_uptodate(journal->j_sb_buffer)) {
4702b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "I/O error on journal device");
4703ac27a0ecSDave Kleikamp 		goto out_journal;
4704ac27a0ecSDave Kleikamp 	}
4705ac27a0ecSDave Kleikamp 	if (be32_to_cpu(journal->j_superblock->s_nr_users) != 1) {
4706b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "External journal has more than one "
4707b31e1552SEric Sandeen 					"user (unsupported) - %d",
4708ac27a0ecSDave Kleikamp 			be32_to_cpu(journal->j_superblock->s_nr_users));
4709ac27a0ecSDave Kleikamp 		goto out_journal;
4710ac27a0ecSDave Kleikamp 	}
4711617ba13bSMingming Cao 	EXT4_SB(sb)->journal_bdev = bdev;
4712617ba13bSMingming Cao 	ext4_init_journal_params(sb, journal);
4713ac27a0ecSDave Kleikamp 	return journal;
47140b8e58a1SAndreas Dilger 
4715ac27a0ecSDave Kleikamp out_journal:
4716dab291afSMingming Cao 	jbd2_journal_destroy(journal);
4717ac27a0ecSDave Kleikamp out_bdev:
4718617ba13bSMingming Cao 	ext4_blkdev_put(bdev);
4719ac27a0ecSDave Kleikamp 	return NULL;
4720ac27a0ecSDave Kleikamp }
4721ac27a0ecSDave Kleikamp 
4722617ba13bSMingming Cao static int ext4_load_journal(struct super_block *sb,
4723617ba13bSMingming Cao 			     struct ext4_super_block *es,
4724ac27a0ecSDave Kleikamp 			     unsigned long journal_devnum)
4725ac27a0ecSDave Kleikamp {
4726ac27a0ecSDave Kleikamp 	journal_t *journal;
4727ac27a0ecSDave Kleikamp 	unsigned int journal_inum = le32_to_cpu(es->s_journal_inum);
4728ac27a0ecSDave Kleikamp 	dev_t journal_dev;
4729ac27a0ecSDave Kleikamp 	int err = 0;
4730ac27a0ecSDave Kleikamp 	int really_read_only;
4731ac27a0ecSDave Kleikamp 
4732e2b911c5SDarrick J. Wong 	BUG_ON(!ext4_has_feature_journal(sb));
47330390131bSFrank Mayhar 
4734ac27a0ecSDave Kleikamp 	if (journal_devnum &&
4735ac27a0ecSDave Kleikamp 	    journal_devnum != le32_to_cpu(es->s_journal_dev)) {
4736b31e1552SEric Sandeen 		ext4_msg(sb, KERN_INFO, "external journal device major/minor "
4737b31e1552SEric Sandeen 			"numbers have changed");
4738ac27a0ecSDave Kleikamp 		journal_dev = new_decode_dev(journal_devnum);
4739ac27a0ecSDave Kleikamp 	} else
4740ac27a0ecSDave Kleikamp 		journal_dev = new_decode_dev(le32_to_cpu(es->s_journal_dev));
4741ac27a0ecSDave Kleikamp 
4742ac27a0ecSDave Kleikamp 	really_read_only = bdev_read_only(sb->s_bdev);
4743ac27a0ecSDave Kleikamp 
4744ac27a0ecSDave Kleikamp 	/*
4745ac27a0ecSDave Kleikamp 	 * Are we loading a blank journal or performing recovery after a
4746ac27a0ecSDave Kleikamp 	 * crash?  For recovery, we need to check in advance whether we
4747ac27a0ecSDave Kleikamp 	 * can get read-write access to the device.
4748ac27a0ecSDave Kleikamp 	 */
4749e2b911c5SDarrick J. Wong 	if (ext4_has_feature_journal_needs_recovery(sb)) {
4750bc98a42cSDavid Howells 		if (sb_rdonly(sb)) {
4751b31e1552SEric Sandeen 			ext4_msg(sb, KERN_INFO, "INFO: recovery "
4752b31e1552SEric Sandeen 					"required on readonly filesystem");
4753ac27a0ecSDave Kleikamp 			if (really_read_only) {
4754b31e1552SEric Sandeen 				ext4_msg(sb, KERN_ERR, "write access "
4755d98bf8cdSSimon Ruderich 					"unavailable, cannot proceed "
4756d98bf8cdSSimon Ruderich 					"(try mounting with noload)");
4757ac27a0ecSDave Kleikamp 				return -EROFS;
4758ac27a0ecSDave Kleikamp 			}
4759b31e1552SEric Sandeen 			ext4_msg(sb, KERN_INFO, "write access will "
4760b31e1552SEric Sandeen 			       "be enabled during recovery");
4761ac27a0ecSDave Kleikamp 		}
4762ac27a0ecSDave Kleikamp 	}
4763ac27a0ecSDave Kleikamp 
4764ac27a0ecSDave Kleikamp 	if (journal_inum && journal_dev) {
4765b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "filesystem has both journal "
4766b31e1552SEric Sandeen 		       "and inode journals!");
4767ac27a0ecSDave Kleikamp 		return -EINVAL;
4768ac27a0ecSDave Kleikamp 	}
4769ac27a0ecSDave Kleikamp 
4770ac27a0ecSDave Kleikamp 	if (journal_inum) {
4771617ba13bSMingming Cao 		if (!(journal = ext4_get_journal(sb, journal_inum)))
4772ac27a0ecSDave Kleikamp 			return -EINVAL;
4773ac27a0ecSDave Kleikamp 	} else {
4774617ba13bSMingming Cao 		if (!(journal = ext4_get_dev_journal(sb, journal_dev)))
4775ac27a0ecSDave Kleikamp 			return -EINVAL;
4776ac27a0ecSDave Kleikamp 	}
4777ac27a0ecSDave Kleikamp 
477890576c0bSTheodore Ts'o 	if (!(journal->j_flags & JBD2_BARRIER))
4779b31e1552SEric Sandeen 		ext4_msg(sb, KERN_INFO, "barriers disabled");
47804776004fSTheodore Ts'o 
4781e2b911c5SDarrick J. Wong 	if (!ext4_has_feature_journal_needs_recovery(sb))
4782dab291afSMingming Cao 		err = jbd2_journal_wipe(journal, !really_read_only);
47831c13d5c0STheodore Ts'o 	if (!err) {
47841c13d5c0STheodore Ts'o 		char *save = kmalloc(EXT4_S_ERR_LEN, GFP_KERNEL);
47851c13d5c0STheodore Ts'o 		if (save)
47861c13d5c0STheodore Ts'o 			memcpy(save, ((char *) es) +
47871c13d5c0STheodore Ts'o 			       EXT4_S_ERR_START, EXT4_S_ERR_LEN);
4788dab291afSMingming Cao 		err = jbd2_journal_load(journal);
47891c13d5c0STheodore Ts'o 		if (save)
47901c13d5c0STheodore Ts'o 			memcpy(((char *) es) + EXT4_S_ERR_START,
47911c13d5c0STheodore Ts'o 			       save, EXT4_S_ERR_LEN);
47921c13d5c0STheodore Ts'o 		kfree(save);
47931c13d5c0STheodore Ts'o 	}
4794ac27a0ecSDave Kleikamp 
4795ac27a0ecSDave Kleikamp 	if (err) {
4796b31e1552SEric Sandeen 		ext4_msg(sb, KERN_ERR, "error loading journal");
4797dab291afSMingming Cao 		jbd2_journal_destroy(journal);
4798ac27a0ecSDave Kleikamp 		return err;
4799ac27a0ecSDave Kleikamp 	}
4800ac27a0ecSDave Kleikamp 
4801617ba13bSMingming Cao 	EXT4_SB(sb)->s_journal = journal;
4802617ba13bSMingming Cao 	ext4_clear_journal_err(sb, es);
4803ac27a0ecSDave Kleikamp 
4804c41303ceSMaciej Żenczykowski 	if (!really_read_only && journal_devnum &&
4805ac27a0ecSDave Kleikamp 	    journal_devnum != le32_to_cpu(es->s_journal_dev)) {
4806ac27a0ecSDave Kleikamp 		es->s_journal_dev = cpu_to_le32(journal_devnum);
4807ac27a0ecSDave Kleikamp 
4808ac27a0ecSDave Kleikamp 		/* Make sure we flush the recovery flag to disk. */
4809e2d67052STheodore Ts'o 		ext4_commit_super(sb, 1);
4810ac27a0ecSDave Kleikamp 	}
4811ac27a0ecSDave Kleikamp 
4812ac27a0ecSDave Kleikamp 	return 0;
4813ac27a0ecSDave Kleikamp }
4814ac27a0ecSDave Kleikamp 
4815e2d67052STheodore Ts'o static int ext4_commit_super(struct super_block *sb, int sync)
4816ac27a0ecSDave Kleikamp {
4817e2d67052STheodore Ts'o 	struct ext4_super_block *es = EXT4_SB(sb)->s_es;
4818617ba13bSMingming Cao 	struct buffer_head *sbh = EXT4_SB(sb)->s_sbh;
4819c4be0c1dSTakashi Sato 	int error = 0;
4820ac27a0ecSDave Kleikamp 
4821bdfe0cbdSTheodore Ts'o 	if (!sbh || block_device_ejected(sb))
4822c4be0c1dSTakashi Sato 		return error;
4823a17712c8SJon Derrick 
4824a17712c8SJon Derrick 	/*
4825a17712c8SJon Derrick 	 * The superblock bh should be mapped, but it might not be if the
4826a17712c8SJon Derrick 	 * device was hot-removed. Not much we can do but fail the I/O.
4827a17712c8SJon Derrick 	 */
4828a17712c8SJon Derrick 	if (!buffer_mapped(sbh))
4829a17712c8SJon Derrick 		return error;
4830a17712c8SJon Derrick 
483171290b36STheodore Ts'o 	/*
483271290b36STheodore Ts'o 	 * If the file system is mounted read-only, don't update the
483371290b36STheodore Ts'o 	 * superblock write time.  This avoids updating the superblock
483471290b36STheodore Ts'o 	 * write time when we are mounting the root file system
483571290b36STheodore Ts'o 	 * read/only but we need to replay the journal; at that point,
483671290b36STheodore Ts'o 	 * for people who are east of GMT and who make their clock
483771290b36STheodore Ts'o 	 * tick in localtime for Windows bug-for-bug compatibility,
483871290b36STheodore Ts'o 	 * the clock is set in the future, and this will cause e2fsck
483971290b36STheodore Ts'o 	 * to complain and force a full file system check.
484071290b36STheodore Ts'o 	 */
48411751e8a6SLinus Torvalds 	if (!(sb->s_flags & SB_RDONLY))
48426a0678a7SArnd Bergmann 		ext4_update_tstamp(es, s_wtime);
4843f613dfcbSTheodore Ts'o 	if (sb->s_bdev->bd_part)
4844afc32f7eSTheodore Ts'o 		es->s_kbytes_written =
4845afc32f7eSTheodore Ts'o 			cpu_to_le64(EXT4_SB(sb)->s_kbytes_written +
4846dbae2c55SMichael Callahan 			    ((part_stat_read(sb->s_bdev->bd_part,
4847dbae2c55SMichael Callahan 					     sectors[STAT_WRITE]) -
4848afc32f7eSTheodore Ts'o 			      EXT4_SB(sb)->s_sectors_written_start) >> 1));
4849f613dfcbSTheodore Ts'o 	else
4850f613dfcbSTheodore Ts'o 		es->s_kbytes_written =
4851f613dfcbSTheodore Ts'o 			cpu_to_le64(EXT4_SB(sb)->s_kbytes_written);
4852d5e03cbbSTheodore Ts'o 	if (percpu_counter_initialized(&EXT4_SB(sb)->s_freeclusters_counter))
485357042651STheodore Ts'o 		ext4_free_blocks_count_set(es,
485457042651STheodore Ts'o 			EXT4_C2B(EXT4_SB(sb), percpu_counter_sum_positive(
485557042651STheodore Ts'o 				&EXT4_SB(sb)->s_freeclusters_counter)));
4856d5e03cbbSTheodore Ts'o 	if (percpu_counter_initialized(&EXT4_SB(sb)->s_freeinodes_counter))
48577f93cff9STheodore Ts'o 		es->s_free_inodes_count =
48587f93cff9STheodore Ts'o 			cpu_to_le32(percpu_counter_sum_positive(
48595d1b1b3fSAneesh Kumar K.V 				&EXT4_SB(sb)->s_freeinodes_counter));
4860ac27a0ecSDave Kleikamp 	BUFFER_TRACE(sbh, "marking dirty");
486106db49e6STheodore Ts'o 	ext4_superblock_csum_set(sb);
48621566a48aSTheodore Ts'o 	if (sync)
48634743f839SPranay Kr. Srivastava 		lock_buffer(sbh);
48644743f839SPranay Kr. Srivastava 	if (buffer_write_io_error(sbh)) {
48654743f839SPranay Kr. Srivastava 		/*
48664743f839SPranay Kr. Srivastava 		 * Oh, dear.  A previous attempt to write the
48674743f839SPranay Kr. Srivastava 		 * superblock failed.  This could happen because the
48684743f839SPranay Kr. Srivastava 		 * USB device was yanked out.  Or it could happen to
48694743f839SPranay Kr. Srivastava 		 * be a transient write error and maybe the block will
48704743f839SPranay Kr. Srivastava 		 * be remapped.  Nothing we can do but to retry the
48714743f839SPranay Kr. Srivastava 		 * write and hope for the best.
48724743f839SPranay Kr. Srivastava 		 */
48734743f839SPranay Kr. Srivastava 		ext4_msg(sb, KERN_ERR, "previous I/O error to "
48744743f839SPranay Kr. Srivastava 		       "superblock detected");
48754743f839SPranay Kr. Srivastava 		clear_buffer_write_io_error(sbh);
48764743f839SPranay Kr. Srivastava 		set_buffer_uptodate(sbh);
48774743f839SPranay Kr. Srivastava 	}
4878ac27a0ecSDave Kleikamp 	mark_buffer_dirty(sbh);
4879914258bfSTheodore Ts'o 	if (sync) {
48801566a48aSTheodore Ts'o 		unlock_buffer(sbh);
4881564bc402SDaeho Jeong 		error = __sync_dirty_buffer(sbh,
488200473374SJan Kara 			REQ_SYNC | (test_opt(sb, BARRIER) ? REQ_FUA : 0));
4883c89128a0SJaegeuk Kim 		if (buffer_write_io_error(sbh)) {
4884b31e1552SEric Sandeen 			ext4_msg(sb, KERN_ERR, "I/O error while writing "
4885b31e1552SEric Sandeen 			       "superblock");
4886914258bfSTheodore Ts'o 			clear_buffer_write_io_error(sbh);
4887914258bfSTheodore Ts'o 			set_buffer_uptodate(sbh);
4888914258bfSTheodore Ts'o 		}
4889914258bfSTheodore Ts'o 	}
4890c4be0c1dSTakashi Sato 	return error;
4891ac27a0ecSDave Kleikamp }
4892ac27a0ecSDave Kleikamp 
4893ac27a0ecSDave Kleikamp /*
4894ac27a0ecSDave Kleikamp  * Have we just finished recovery?  If so, and if we are mounting (or
4895ac27a0ecSDave Kleikamp  * remounting) the filesystem readonly, then we will end up with a
4896ac27a0ecSDave Kleikamp  * consistent fs on disk.  Record that fact.
4897ac27a0ecSDave Kleikamp  */
4898617ba13bSMingming Cao static void ext4_mark_recovery_complete(struct super_block *sb,
4899617ba13bSMingming Cao 					struct ext4_super_block *es)
4900ac27a0ecSDave Kleikamp {
4901617ba13bSMingming Cao 	journal_t *journal = EXT4_SB(sb)->s_journal;
4902ac27a0ecSDave Kleikamp 
4903e2b911c5SDarrick J. Wong 	if (!ext4_has_feature_journal(sb)) {
49040390131bSFrank Mayhar 		BUG_ON(journal != NULL);
49050390131bSFrank Mayhar 		return;
49060390131bSFrank Mayhar 	}
4907dab291afSMingming Cao 	jbd2_journal_lock_updates(journal);
49087ffe1ea8SHidehiro Kawai 	if (jbd2_journal_flush(journal) < 0)
49097ffe1ea8SHidehiro Kawai 		goto out;
49107ffe1ea8SHidehiro Kawai 
4911bc98a42cSDavid Howells 	if (ext4_has_feature_journal_needs_recovery(sb) && sb_rdonly(sb)) {
4912e2b911c5SDarrick J. Wong 		ext4_clear_feature_journal_needs_recovery(sb);
4913e2d67052STheodore Ts'o 		ext4_commit_super(sb, 1);
4914ac27a0ecSDave Kleikamp 	}
49157ffe1ea8SHidehiro Kawai 
49167ffe1ea8SHidehiro Kawai out:
4917dab291afSMingming Cao 	jbd2_journal_unlock_updates(journal);
4918ac27a0ecSDave Kleikamp }
4919ac27a0ecSDave Kleikamp 
4920ac27a0ecSDave Kleikamp /*
4921ac27a0ecSDave Kleikamp  * If we are mounting (or read-write remounting) a filesystem whose journal
4922ac27a0ecSDave Kleikamp  * has recorded an error from a previous lifetime, move that error to the
4923ac27a0ecSDave Kleikamp  * main filesystem now.
4924ac27a0ecSDave Kleikamp  */
4925617ba13bSMingming Cao static void ext4_clear_journal_err(struct super_block *sb,
4926617ba13bSMingming Cao 				   struct ext4_super_block *es)
4927ac27a0ecSDave Kleikamp {
4928ac27a0ecSDave Kleikamp 	journal_t *journal;
4929ac27a0ecSDave Kleikamp 	int j_errno;
4930ac27a0ecSDave Kleikamp 	const char *errstr;
4931ac27a0ecSDave Kleikamp 
4932e2b911c5SDarrick J. Wong 	BUG_ON(!ext4_has_feature_journal(sb));
49330390131bSFrank Mayhar 
4934617ba13bSMingming Cao 	journal = EXT4_SB(sb)->s_journal;
4935ac27a0ecSDave Kleikamp 
4936ac27a0ecSDave Kleikamp 	/*
4937ac27a0ecSDave Kleikamp 	 * Now check for any error status which may have been recorded in the
4938617ba13bSMingming Cao 	 * journal by a prior ext4_error() or ext4_abort()
4939ac27a0ecSDave Kleikamp 	 */
4940ac27a0ecSDave Kleikamp 
4941dab291afSMingming Cao 	j_errno = jbd2_journal_errno(journal);
4942ac27a0ecSDave Kleikamp 	if (j_errno) {
4943ac27a0ecSDave Kleikamp 		char nbuf[16];
4944ac27a0ecSDave Kleikamp 
4945617ba13bSMingming Cao 		errstr = ext4_decode_error(sb, j_errno, nbuf);
494612062dddSEric Sandeen 		ext4_warning(sb, "Filesystem error recorded "
4947ac27a0ecSDave Kleikamp 			     "from previous mount: %s", errstr);
494812062dddSEric Sandeen 		ext4_warning(sb, "Marking fs in need of filesystem check.");
4949ac27a0ecSDave Kleikamp 
4950617ba13bSMingming Cao 		EXT4_SB(sb)->s_mount_state |= EXT4_ERROR_FS;
4951617ba13bSMingming Cao 		es->s_state |= cpu_to_le16(EXT4_ERROR_FS);
4952e2d67052STheodore Ts'o 		ext4_commit_super(sb, 1);
4953ac27a0ecSDave Kleikamp 
4954dab291afSMingming Cao 		jbd2_journal_clear_err(journal);
4955d796c52eSTheodore Ts'o 		jbd2_journal_update_sb_errno(journal);
4956ac27a0ecSDave Kleikamp 	}
4957ac27a0ecSDave Kleikamp }
4958ac27a0ecSDave Kleikamp 
4959ac27a0ecSDave Kleikamp /*
4960ac27a0ecSDave Kleikamp  * Force the running and committing transactions to commit,
4961ac27a0ecSDave Kleikamp  * and wait on the commit.
4962ac27a0ecSDave Kleikamp  */
4963617ba13bSMingming Cao int ext4_force_commit(struct super_block *sb)
4964ac27a0ecSDave Kleikamp {
4965ac27a0ecSDave Kleikamp 	journal_t *journal;
4966ac27a0ecSDave Kleikamp 
4967bc98a42cSDavid Howells 	if (sb_rdonly(sb))
4968ac27a0ecSDave Kleikamp 		return 0;
4969ac27a0ecSDave Kleikamp 
4970617ba13bSMingming Cao 	journal = EXT4_SB(sb)->s_journal;
4971b1deefc9SGuo Chao 	return ext4_journal_force_commit(journal);
4972ac27a0ecSDave Kleikamp }
4973ac27a0ecSDave Kleikamp 
4974617ba13bSMingming Cao static int ext4_sync_fs(struct super_block *sb, int wait)
4975ac27a0ecSDave Kleikamp {
497614ce0cb4STheodore Ts'o 	int ret = 0;
49779eddacf9SJan Kara 	tid_t target;
497806a407f1SDmitry Monakhov 	bool needs_barrier = false;
49798d5d02e6SMingming Cao 	struct ext4_sb_info *sbi = EXT4_SB(sb);
4980ac27a0ecSDave Kleikamp 
498149598e04SJun Piao 	if (unlikely(ext4_forced_shutdown(sbi)))
49820db1ff22STheodore Ts'o 		return 0;
49830db1ff22STheodore Ts'o 
49849bffad1eSTheodore Ts'o 	trace_ext4_sync_fs(sb, wait);
49852e8fa54eSJan Kara 	flush_workqueue(sbi->rsv_conversion_wq);
4986a1177825SJan Kara 	/*
4987a1177825SJan Kara 	 * Writeback quota in non-journalled quota case - journalled quota has
4988a1177825SJan Kara 	 * no dirty dquots
4989a1177825SJan Kara 	 */
4990a1177825SJan Kara 	dquot_writeback_dquots(sb, -1);
499106a407f1SDmitry Monakhov 	/*
499206a407f1SDmitry Monakhov 	 * Data writeback is possible w/o journal transaction, so barrier must
499306a407f1SDmitry Monakhov 	 * being sent at the end of the function. But we can skip it if
499406a407f1SDmitry Monakhov 	 * transaction_commit will do it for us.
499506a407f1SDmitry Monakhov 	 */
4996bda32530STheodore Ts'o 	if (sbi->s_journal) {
499706a407f1SDmitry Monakhov 		target = jbd2_get_latest_transaction(sbi->s_journal);
499806a407f1SDmitry Monakhov 		if (wait && sbi->s_journal->j_flags & JBD2_BARRIER &&
499906a407f1SDmitry Monakhov 		    !jbd2_trans_will_send_data_barrier(sbi->s_journal, target))
500006a407f1SDmitry Monakhov 			needs_barrier = true;
500106a407f1SDmitry Monakhov 
50028d5d02e6SMingming Cao 		if (jbd2_journal_start_commit(sbi->s_journal, &target)) {
5003ac27a0ecSDave Kleikamp 			if (wait)
5004bda32530STheodore Ts'o 				ret = jbd2_log_wait_commit(sbi->s_journal,
5005bda32530STheodore Ts'o 							   target);
50060390131bSFrank Mayhar 		}
5007bda32530STheodore Ts'o 	} else if (wait && test_opt(sb, BARRIER))
5008bda32530STheodore Ts'o 		needs_barrier = true;
500906a407f1SDmitry Monakhov 	if (needs_barrier) {
501006a407f1SDmitry Monakhov 		int err;
501106a407f1SDmitry Monakhov 		err = blkdev_issue_flush(sb->s_bdev, GFP_KERNEL, NULL);
501206a407f1SDmitry Monakhov 		if (!ret)
501306a407f1SDmitry Monakhov 			ret = err;
501406a407f1SDmitry Monakhov 	}
501506a407f1SDmitry Monakhov 
501606a407f1SDmitry Monakhov 	return ret;
501706a407f1SDmitry Monakhov }
501806a407f1SDmitry Monakhov 
5019ac27a0ecSDave Kleikamp /*
5020ac27a0ecSDave Kleikamp  * LVM calls this function before a (read-only) snapshot is created.  This
5021ac27a0ecSDave Kleikamp  * gives us a chance to flush the journal completely and mark the fs clean.
5022be4f27d3SYongqiang Yang  *
5023be4f27d3SYongqiang Yang  * Note that only this function cannot bring a filesystem to be in a clean
50248e8ad8a5SJan Kara  * state independently. It relies on upper layer to stop all data & metadata
50258e8ad8a5SJan Kara  * modifications.
5026ac27a0ecSDave Kleikamp  */
5027c4be0c1dSTakashi Sato static int ext4_freeze(struct super_block *sb)
5028ac27a0ecSDave Kleikamp {
5029c4be0c1dSTakashi Sato 	int error = 0;
5030c4be0c1dSTakashi Sato 	journal_t *journal;
5031ac27a0ecSDave Kleikamp 
5032bc98a42cSDavid Howells 	if (sb_rdonly(sb))
50339ca92389STheodore Ts'o 		return 0;
50349ca92389STheodore Ts'o 
5035c4be0c1dSTakashi Sato 	journal = EXT4_SB(sb)->s_journal;
5036ac27a0ecSDave Kleikamp 
5037bb044576STheodore Ts'o 	if (journal) {
5038ac27a0ecSDave Kleikamp 		/* Now we set up the journal barrier. */
5039dab291afSMingming Cao 		jbd2_journal_lock_updates(journal);
50407ffe1ea8SHidehiro Kawai 
50417ffe1ea8SHidehiro Kawai 		/*
5042bb044576STheodore Ts'o 		 * Don't clear the needs_recovery flag if we failed to
5043bb044576STheodore Ts'o 		 * flush the journal.
50447ffe1ea8SHidehiro Kawai 		 */
5045c4be0c1dSTakashi Sato 		error = jbd2_journal_flush(journal);
50466b0310fbSEric Sandeen 		if (error < 0)
50476b0310fbSEric Sandeen 			goto out;
5048ac27a0ecSDave Kleikamp 
5049ac27a0ecSDave Kleikamp 		/* Journal blocked and flushed, clear needs_recovery flag. */
5050e2b911c5SDarrick J. Wong 		ext4_clear_feature_journal_needs_recovery(sb);
5051c642dc9eSEric Sandeen 	}
5052c642dc9eSEric Sandeen 
5053e2d67052STheodore Ts'o 	error = ext4_commit_super(sb, 1);
50546b0310fbSEric Sandeen out:
5055bb044576STheodore Ts'o 	if (journal)
50568e8ad8a5SJan Kara 		/* we rely on upper layer to stop further updates */
5057bb044576STheodore Ts'o 		jbd2_journal_unlock_updates(journal);
50586b0310fbSEric Sandeen 	return error;
5059ac27a0ecSDave Kleikamp }
5060ac27a0ecSDave Kleikamp 
5061ac27a0ecSDave Kleikamp /*
5062ac27a0ecSDave Kleikamp  * Called by LVM after the snapshot is done.  We need to reset the RECOVER
5063ac27a0ecSDave Kleikamp  * flag here, even though the filesystem is not technically dirty yet.
5064ac27a0ecSDave Kleikamp  */
5065c4be0c1dSTakashi Sato static int ext4_unfreeze(struct super_block *sb)
5066ac27a0ecSDave Kleikamp {
5067bc98a42cSDavid Howells 	if (sb_rdonly(sb) || ext4_forced_shutdown(EXT4_SB(sb)))
50689ca92389STheodore Ts'o 		return 0;
50699ca92389STheodore Ts'o 
5070c642dc9eSEric Sandeen 	if (EXT4_SB(sb)->s_journal) {
50719ca92389STheodore Ts'o 		/* Reset the needs_recovery flag before the fs is unlocked. */
5072e2b911c5SDarrick J. Wong 		ext4_set_feature_journal_needs_recovery(sb);
5073c642dc9eSEric Sandeen 	}
5074c642dc9eSEric Sandeen 
5075e2d67052STheodore Ts'o 	ext4_commit_super(sb, 1);
5076c4be0c1dSTakashi Sato 	return 0;
5077ac27a0ecSDave Kleikamp }
5078ac27a0ecSDave Kleikamp 
5079673c6100STheodore Ts'o /*
5080673c6100STheodore Ts'o  * Structure to save mount options for ext4_remount's benefit
5081673c6100STheodore Ts'o  */
5082673c6100STheodore Ts'o struct ext4_mount_options {
5083673c6100STheodore Ts'o 	unsigned long s_mount_opt;
5084a2595b8aSTheodore Ts'o 	unsigned long s_mount_opt2;
508508cefc7aSEric W. Biederman 	kuid_t s_resuid;
508608cefc7aSEric W. Biederman 	kgid_t s_resgid;
5087673c6100STheodore Ts'o 	unsigned long s_commit_interval;
5088673c6100STheodore Ts'o 	u32 s_min_batch_time, s_max_batch_time;
5089673c6100STheodore Ts'o #ifdef CONFIG_QUOTA
5090673c6100STheodore Ts'o 	int s_jquota_fmt;
5091a2d4a646SJan Kara 	char *s_qf_names[EXT4_MAXQUOTAS];
5092673c6100STheodore Ts'o #endif
5093673c6100STheodore Ts'o };
5094673c6100STheodore Ts'o 
5095617ba13bSMingming Cao static int ext4_remount(struct super_block *sb, int *flags, char *data)
5096ac27a0ecSDave Kleikamp {
5097617ba13bSMingming Cao 	struct ext4_super_block *es;
5098617ba13bSMingming Cao 	struct ext4_sb_info *sbi = EXT4_SB(sb);
5099ac27a0ecSDave Kleikamp 	unsigned long old_sb_flags;
5100617ba13bSMingming Cao 	struct ext4_mount_options old_opts;
5101c79d967dSChristoph Hellwig 	int enable_quota = 0;
51028a266467STheodore Ts'o 	ext4_group_t g;
5103b3881f74STheodore Ts'o 	unsigned int journal_ioprio = DEFAULT_JOURNAL_IOPRIO;
5104c5e06d10SJohann Lombardi 	int err = 0;
5105ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
510603dafb5fSChen Gang 	int i, j;
5107ac27a0ecSDave Kleikamp #endif
5108d4c402d9SCurt Wohlgemuth 	char *orig_data = kstrdup(data, GFP_KERNEL);
5109ac27a0ecSDave Kleikamp 
511021ac738eSChengguang Xu 	if (data && !orig_data)
511121ac738eSChengguang Xu 		return -ENOMEM;
511221ac738eSChengguang Xu 
5113ac27a0ecSDave Kleikamp 	/* Store the original options */
5114ac27a0ecSDave Kleikamp 	old_sb_flags = sb->s_flags;
5115ac27a0ecSDave Kleikamp 	old_opts.s_mount_opt = sbi->s_mount_opt;
5116a2595b8aSTheodore Ts'o 	old_opts.s_mount_opt2 = sbi->s_mount_opt2;
5117ac27a0ecSDave Kleikamp 	old_opts.s_resuid = sbi->s_resuid;
5118ac27a0ecSDave Kleikamp 	old_opts.s_resgid = sbi->s_resgid;
5119ac27a0ecSDave Kleikamp 	old_opts.s_commit_interval = sbi->s_commit_interval;
512030773840STheodore Ts'o 	old_opts.s_min_batch_time = sbi->s_min_batch_time;
512130773840STheodore Ts'o 	old_opts.s_max_batch_time = sbi->s_max_batch_time;
5122ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
5123ac27a0ecSDave Kleikamp 	old_opts.s_jquota_fmt = sbi->s_jquota_fmt;
5124a2d4a646SJan Kara 	for (i = 0; i < EXT4_MAXQUOTAS; i++)
512503dafb5fSChen Gang 		if (sbi->s_qf_names[i]) {
512603dafb5fSChen Gang 			old_opts.s_qf_names[i] = kstrdup(sbi->s_qf_names[i],
512703dafb5fSChen Gang 							 GFP_KERNEL);
512803dafb5fSChen Gang 			if (!old_opts.s_qf_names[i]) {
512903dafb5fSChen Gang 				for (j = 0; j < i; j++)
513003dafb5fSChen Gang 					kfree(old_opts.s_qf_names[j]);
51313e36a163SWei Yongjun 				kfree(orig_data);
513203dafb5fSChen Gang 				return -ENOMEM;
513303dafb5fSChen Gang 			}
513403dafb5fSChen Gang 		} else
513503dafb5fSChen Gang 			old_opts.s_qf_names[i] = NULL;
5136ac27a0ecSDave Kleikamp #endif
5137b3881f74STheodore Ts'o 	if (sbi->s_journal && sbi->s_journal->j_task->io_context)
5138b3881f74STheodore Ts'o 		journal_ioprio = sbi->s_journal->j_task->io_context->ioprio;
5139ac27a0ecSDave Kleikamp 
5140661aa520SEric Sandeen 	if (!parse_options(data, sb, NULL, &journal_ioprio, 1)) {
5141ac27a0ecSDave Kleikamp 		err = -EINVAL;
5142ac27a0ecSDave Kleikamp 		goto restore_opts;
5143ac27a0ecSDave Kleikamp 	}
5144ac27a0ecSDave Kleikamp 
51456b992ff2SDarrick J. Wong 	if ((old_opts.s_mount_opt & EXT4_MOUNT_JOURNAL_CHECKSUM) ^
51466b992ff2SDarrick J. Wong 	    test_opt(sb, JOURNAL_CHECKSUM)) {
51476b992ff2SDarrick J. Wong 		ext4_msg(sb, KERN_ERR, "changing journal_checksum "
51482d5b86e0SEric Sandeen 			 "during remount not supported; ignoring");
51492d5b86e0SEric Sandeen 		sbi->s_mount_opt ^= EXT4_MOUNT_JOURNAL_CHECKSUM;
5150c6d3d56dSDarrick J. Wong 	}
5151c6d3d56dSDarrick J. Wong 
51526ae6514bSPiotr Sarna 	if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_JOURNAL_DATA) {
51536ae6514bSPiotr Sarna 		if (test_opt2(sb, EXPLICIT_DELALLOC)) {
51546ae6514bSPiotr Sarna 			ext4_msg(sb, KERN_ERR, "can't mount with "
51556ae6514bSPiotr Sarna 				 "both data=journal and delalloc");
51566ae6514bSPiotr Sarna 			err = -EINVAL;
51576ae6514bSPiotr Sarna 			goto restore_opts;
51586ae6514bSPiotr Sarna 		}
51596ae6514bSPiotr Sarna 		if (test_opt(sb, DIOREAD_NOLOCK)) {
51606ae6514bSPiotr Sarna 			ext4_msg(sb, KERN_ERR, "can't mount with "
51616ae6514bSPiotr Sarna 				 "both data=journal and dioread_nolock");
51626ae6514bSPiotr Sarna 			err = -EINVAL;
51636ae6514bSPiotr Sarna 			goto restore_opts;
51646ae6514bSPiotr Sarna 		}
5165923ae0ffSRoss Zwisler 		if (test_opt(sb, DAX)) {
5166923ae0ffSRoss Zwisler 			ext4_msg(sb, KERN_ERR, "can't mount with "
5167923ae0ffSRoss Zwisler 				 "both data=journal and dax");
5168923ae0ffSRoss Zwisler 			err = -EINVAL;
5169923ae0ffSRoss Zwisler 			goto restore_opts;
5170923ae0ffSRoss Zwisler 		}
5171ab04df78SJan Kara 	} else if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_ORDERED_DATA) {
5172ab04df78SJan Kara 		if (test_opt(sb, JOURNAL_ASYNC_COMMIT)) {
5173ab04df78SJan Kara 			ext4_msg(sb, KERN_ERR, "can't mount with "
5174ab04df78SJan Kara 				"journal_async_commit in data=ordered mode");
5175ab04df78SJan Kara 			err = -EINVAL;
5176ab04df78SJan Kara 			goto restore_opts;
5177ab04df78SJan Kara 		}
5178923ae0ffSRoss Zwisler 	}
5179923ae0ffSRoss Zwisler 
5180cdb7ee4cSTahsin Erdogan 	if ((sbi->s_mount_opt ^ old_opts.s_mount_opt) & EXT4_MOUNT_NO_MBCACHE) {
5181cdb7ee4cSTahsin Erdogan 		ext4_msg(sb, KERN_ERR, "can't enable nombcache during remount");
5182cdb7ee4cSTahsin Erdogan 		err = -EINVAL;
5183cdb7ee4cSTahsin Erdogan 		goto restore_opts;
5184cdb7ee4cSTahsin Erdogan 	}
5185cdb7ee4cSTahsin Erdogan 
5186923ae0ffSRoss Zwisler 	if ((sbi->s_mount_opt ^ old_opts.s_mount_opt) & EXT4_MOUNT_DAX) {
5187923ae0ffSRoss Zwisler 		ext4_msg(sb, KERN_WARNING, "warning: refusing change of "
5188923ae0ffSRoss Zwisler 			"dax flag with busy inodes while remounting");
5189923ae0ffSRoss Zwisler 		sbi->s_mount_opt ^= EXT4_MOUNT_DAX;
51906ae6514bSPiotr Sarna 	}
51916ae6514bSPiotr Sarna 
51924ab2f15bSTheodore Ts'o 	if (sbi->s_mount_flags & EXT4_MF_FS_ABORTED)
5193c67d859eSTheodore Ts'o 		ext4_abort(sb, "Abort forced by user");
5194ac27a0ecSDave Kleikamp 
51951751e8a6SLinus Torvalds 	sb->s_flags = (sb->s_flags & ~SB_POSIXACL) |
51961751e8a6SLinus Torvalds 		(test_opt(sb, POSIX_ACL) ? SB_POSIXACL : 0);
5197ac27a0ecSDave Kleikamp 
5198ac27a0ecSDave Kleikamp 	es = sbi->s_es;
5199ac27a0ecSDave Kleikamp 
5200b3881f74STheodore Ts'o 	if (sbi->s_journal) {
5201617ba13bSMingming Cao 		ext4_init_journal_params(sb, sbi->s_journal);
5202b3881f74STheodore Ts'o 		set_task_ioprio(sbi->s_journal->j_task, journal_ioprio);
5203b3881f74STheodore Ts'o 	}
5204ac27a0ecSDave Kleikamp 
52051751e8a6SLinus Torvalds 	if (*flags & SB_LAZYTIME)
52061751e8a6SLinus Torvalds 		sb->s_flags |= SB_LAZYTIME;
5207a2fd66d0STheodore Ts'o 
52081751e8a6SLinus Torvalds 	if ((bool)(*flags & SB_RDONLY) != sb_rdonly(sb)) {
52094ab2f15bSTheodore Ts'o 		if (sbi->s_mount_flags & EXT4_MF_FS_ABORTED) {
5210ac27a0ecSDave Kleikamp 			err = -EROFS;
5211ac27a0ecSDave Kleikamp 			goto restore_opts;
5212ac27a0ecSDave Kleikamp 		}
5213ac27a0ecSDave Kleikamp 
52141751e8a6SLinus Torvalds 		if (*flags & SB_RDONLY) {
521538c03b34STheodore Ts'o 			err = sync_filesystem(sb);
521638c03b34STheodore Ts'o 			if (err < 0)
521738c03b34STheodore Ts'o 				goto restore_opts;
52180f0dd62fSChristoph Hellwig 			err = dquot_suspend(sb, -1);
52190f0dd62fSChristoph Hellwig 			if (err < 0)
5220c79d967dSChristoph Hellwig 				goto restore_opts;
5221c79d967dSChristoph Hellwig 
5222ac27a0ecSDave Kleikamp 			/*
5223ac27a0ecSDave Kleikamp 			 * First of all, the unconditional stuff we have to do
5224ac27a0ecSDave Kleikamp 			 * to disable replay of the journal when we next remount
5225ac27a0ecSDave Kleikamp 			 */
52261751e8a6SLinus Torvalds 			sb->s_flags |= SB_RDONLY;
5227ac27a0ecSDave Kleikamp 
5228ac27a0ecSDave Kleikamp 			/*
5229ac27a0ecSDave Kleikamp 			 * OK, test if we are remounting a valid rw partition
5230ac27a0ecSDave Kleikamp 			 * readonly, and if so set the rdonly flag and then
5231ac27a0ecSDave Kleikamp 			 * mark the partition as valid again.
5232ac27a0ecSDave Kleikamp 			 */
5233617ba13bSMingming Cao 			if (!(es->s_state & cpu_to_le16(EXT4_VALID_FS)) &&
5234617ba13bSMingming Cao 			    (sbi->s_mount_state & EXT4_VALID_FS))
5235ac27a0ecSDave Kleikamp 				es->s_state = cpu_to_le16(sbi->s_mount_state);
5236ac27a0ecSDave Kleikamp 
5237a63c9eb2STheodore Ts'o 			if (sbi->s_journal)
5238617ba13bSMingming Cao 				ext4_mark_recovery_complete(sb, es);
52392dca60d9STheodore Ts'o 			if (sbi->s_mmp_tsk)
52402dca60d9STheodore Ts'o 				kthread_stop(sbi->s_mmp_tsk);
5241ac27a0ecSDave Kleikamp 		} else {
5242a13fb1a4SEric Sandeen 			/* Make sure we can mount this feature set readwrite */
5243e2b911c5SDarrick J. Wong 			if (ext4_has_feature_readonly(sb) ||
52442cb5cc8bSDarrick J. Wong 			    !ext4_feature_set_ok(sb, 0)) {
5245ac27a0ecSDave Kleikamp 				err = -EROFS;
5246ac27a0ecSDave Kleikamp 				goto restore_opts;
5247ac27a0ecSDave Kleikamp 			}
5248ead6596bSEric Sandeen 			/*
52498a266467STheodore Ts'o 			 * Make sure the group descriptor checksums
52500b8e58a1SAndreas Dilger 			 * are sane.  If they aren't, refuse to remount r/w.
52518a266467STheodore Ts'o 			 */
52528a266467STheodore Ts'o 			for (g = 0; g < sbi->s_groups_count; g++) {
52538a266467STheodore Ts'o 				struct ext4_group_desc *gdp =
52548a266467STheodore Ts'o 					ext4_get_group_desc(sb, g, NULL);
52558a266467STheodore Ts'o 
5256feb0ab32SDarrick J. Wong 				if (!ext4_group_desc_csum_verify(sb, g, gdp)) {
5257b31e1552SEric Sandeen 					ext4_msg(sb, KERN_ERR,
5258b31e1552SEric Sandeen 	       "ext4_remount: Checksum for group %u failed (%u!=%u)",
5259e2b911c5SDarrick J. Wong 		g, le16_to_cpu(ext4_group_desc_csum(sb, g, gdp)),
52608a266467STheodore Ts'o 					       le16_to_cpu(gdp->bg_checksum));
52616a797d27SDarrick J. Wong 					err = -EFSBADCRC;
52628a266467STheodore Ts'o 					goto restore_opts;
52638a266467STheodore Ts'o 				}
52648a266467STheodore Ts'o 			}
52658a266467STheodore Ts'o 
52668a266467STheodore Ts'o 			/*
5267ead6596bSEric Sandeen 			 * If we have an unprocessed orphan list hanging
5268ead6596bSEric Sandeen 			 * around from a previously readonly bdev mount,
5269ead6596bSEric Sandeen 			 * require a full umount/remount for now.
5270ead6596bSEric Sandeen 			 */
5271ead6596bSEric Sandeen 			if (es->s_last_orphan) {
5272b31e1552SEric Sandeen 				ext4_msg(sb, KERN_WARNING, "Couldn't "
5273ead6596bSEric Sandeen 				       "remount RDWR because of unprocessed "
5274ead6596bSEric Sandeen 				       "orphan inode list.  Please "
5275b31e1552SEric Sandeen 				       "umount/remount instead");
5276ead6596bSEric Sandeen 				err = -EINVAL;
5277ead6596bSEric Sandeen 				goto restore_opts;
5278ead6596bSEric Sandeen 			}
5279ead6596bSEric Sandeen 
5280ac27a0ecSDave Kleikamp 			/*
5281ac27a0ecSDave Kleikamp 			 * Mounting a RDONLY partition read-write, so reread
5282ac27a0ecSDave Kleikamp 			 * and store the current valid flag.  (It may have
5283ac27a0ecSDave Kleikamp 			 * been changed by e2fsck since we originally mounted
5284ac27a0ecSDave Kleikamp 			 * the partition.)
5285ac27a0ecSDave Kleikamp 			 */
52860390131bSFrank Mayhar 			if (sbi->s_journal)
5287617ba13bSMingming Cao 				ext4_clear_journal_err(sb, es);
5288ac27a0ecSDave Kleikamp 			sbi->s_mount_state = le16_to_cpu(es->s_state);
5289c89128a0SJaegeuk Kim 
5290c89128a0SJaegeuk Kim 			err = ext4_setup_super(sb, es, 0);
5291c89128a0SJaegeuk Kim 			if (err)
5292c89128a0SJaegeuk Kim 				goto restore_opts;
5293c89128a0SJaegeuk Kim 
52941751e8a6SLinus Torvalds 			sb->s_flags &= ~SB_RDONLY;
5295e2b911c5SDarrick J. Wong 			if (ext4_has_feature_mmp(sb))
5296c5e06d10SJohann Lombardi 				if (ext4_multi_mount_protect(sb,
5297c5e06d10SJohann Lombardi 						le64_to_cpu(es->s_mmp_block))) {
5298c5e06d10SJohann Lombardi 					err = -EROFS;
5299c5e06d10SJohann Lombardi 					goto restore_opts;
5300c5e06d10SJohann Lombardi 				}
5301c79d967dSChristoph Hellwig 			enable_quota = 1;
5302ac27a0ecSDave Kleikamp 		}
5303ac27a0ecSDave Kleikamp 	}
5304bfff6873SLukas Czerner 
5305bfff6873SLukas Czerner 	/*
5306bfff6873SLukas Czerner 	 * Reinitialize lazy itable initialization thread based on
5307bfff6873SLukas Czerner 	 * current settings
5308bfff6873SLukas Czerner 	 */
5309bc98a42cSDavid Howells 	if (sb_rdonly(sb) || !test_opt(sb, INIT_INODE_TABLE))
5310bfff6873SLukas Czerner 		ext4_unregister_li_request(sb);
5311bfff6873SLukas Czerner 	else {
5312bfff6873SLukas Czerner 		ext4_group_t first_not_zeroed;
5313bfff6873SLukas Czerner 		first_not_zeroed = ext4_has_uninit_itable(sb);
5314bfff6873SLukas Czerner 		ext4_register_li_request(sb, first_not_zeroed);
5315bfff6873SLukas Czerner 	}
5316bfff6873SLukas Czerner 
53176fd058f7STheodore Ts'o 	ext4_setup_system_zone(sb);
5318c89128a0SJaegeuk Kim 	if (sbi->s_journal == NULL && !(old_sb_flags & SB_RDONLY)) {
5319c89128a0SJaegeuk Kim 		err = ext4_commit_super(sb, 1);
5320c89128a0SJaegeuk Kim 		if (err)
5321c89128a0SJaegeuk Kim 			goto restore_opts;
5322c89128a0SJaegeuk Kim 	}
53230390131bSFrank Mayhar 
5324ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
5325ac27a0ecSDave Kleikamp 	/* Release old quota file names */
5326a2d4a646SJan Kara 	for (i = 0; i < EXT4_MAXQUOTAS; i++)
5327ac27a0ecSDave Kleikamp 		kfree(old_opts.s_qf_names[i]);
53287c319d32SAditya Kali 	if (enable_quota) {
53297c319d32SAditya Kali 		if (sb_any_quota_suspended(sb))
53300f0dd62fSChristoph Hellwig 			dquot_resume(sb, -1);
5331e2b911c5SDarrick J. Wong 		else if (ext4_has_feature_quota(sb)) {
53327c319d32SAditya Kali 			err = ext4_enable_quotas(sb);
533307724f98STheodore Ts'o 			if (err)
53347c319d32SAditya Kali 				goto restore_opts;
53357c319d32SAditya Kali 		}
53367c319d32SAditya Kali 	}
53377c319d32SAditya Kali #endif
5338d4c402d9SCurt Wohlgemuth 
53391751e8a6SLinus Torvalds 	*flags = (*flags & ~SB_LAZYTIME) | (sb->s_flags & SB_LAZYTIME);
5340d4c402d9SCurt Wohlgemuth 	ext4_msg(sb, KERN_INFO, "re-mounted. Opts: %s", orig_data);
5341d4c402d9SCurt Wohlgemuth 	kfree(orig_data);
5342ac27a0ecSDave Kleikamp 	return 0;
53430b8e58a1SAndreas Dilger 
5344ac27a0ecSDave Kleikamp restore_opts:
5345ac27a0ecSDave Kleikamp 	sb->s_flags = old_sb_flags;
5346ac27a0ecSDave Kleikamp 	sbi->s_mount_opt = old_opts.s_mount_opt;
5347a2595b8aSTheodore Ts'o 	sbi->s_mount_opt2 = old_opts.s_mount_opt2;
5348ac27a0ecSDave Kleikamp 	sbi->s_resuid = old_opts.s_resuid;
5349ac27a0ecSDave Kleikamp 	sbi->s_resgid = old_opts.s_resgid;
5350ac27a0ecSDave Kleikamp 	sbi->s_commit_interval = old_opts.s_commit_interval;
535130773840STheodore Ts'o 	sbi->s_min_batch_time = old_opts.s_min_batch_time;
535230773840STheodore Ts'o 	sbi->s_max_batch_time = old_opts.s_max_batch_time;
5353ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
5354ac27a0ecSDave Kleikamp 	sbi->s_jquota_fmt = old_opts.s_jquota_fmt;
5355a2d4a646SJan Kara 	for (i = 0; i < EXT4_MAXQUOTAS; i++) {
5356ac27a0ecSDave Kleikamp 		kfree(sbi->s_qf_names[i]);
5357ac27a0ecSDave Kleikamp 		sbi->s_qf_names[i] = old_opts.s_qf_names[i];
5358ac27a0ecSDave Kleikamp 	}
5359ac27a0ecSDave Kleikamp #endif
5360d4c402d9SCurt Wohlgemuth 	kfree(orig_data);
5361ac27a0ecSDave Kleikamp 	return err;
5362ac27a0ecSDave Kleikamp }
5363ac27a0ecSDave Kleikamp 
5364689c958cSLi Xi #ifdef CONFIG_QUOTA
5365689c958cSLi Xi static int ext4_statfs_project(struct super_block *sb,
5366689c958cSLi Xi 			       kprojid_t projid, struct kstatfs *buf)
5367689c958cSLi Xi {
5368689c958cSLi Xi 	struct kqid qid;
5369689c958cSLi Xi 	struct dquot *dquot;
5370689c958cSLi Xi 	u64 limit;
5371689c958cSLi Xi 	u64 curblock;
5372689c958cSLi Xi 
5373689c958cSLi Xi 	qid = make_kqid_projid(projid);
5374689c958cSLi Xi 	dquot = dqget(sb, qid);
5375689c958cSLi Xi 	if (IS_ERR(dquot))
5376689c958cSLi Xi 		return PTR_ERR(dquot);
53777b9ca4c6SJan Kara 	spin_lock(&dquot->dq_dqb_lock);
5378689c958cSLi Xi 
5379689c958cSLi Xi 	limit = (dquot->dq_dqb.dqb_bsoftlimit ?
5380689c958cSLi Xi 		 dquot->dq_dqb.dqb_bsoftlimit :
5381689c958cSLi Xi 		 dquot->dq_dqb.dqb_bhardlimit) >> sb->s_blocksize_bits;
5382689c958cSLi Xi 	if (limit && buf->f_blocks > limit) {
5383f06925c7SKonstantin Khlebnikov 		curblock = (dquot->dq_dqb.dqb_curspace +
5384f06925c7SKonstantin Khlebnikov 			    dquot->dq_dqb.dqb_rsvspace) >> sb->s_blocksize_bits;
5385689c958cSLi Xi 		buf->f_blocks = limit;
5386689c958cSLi Xi 		buf->f_bfree = buf->f_bavail =
5387689c958cSLi Xi 			(buf->f_blocks > curblock) ?
5388689c958cSLi Xi 			 (buf->f_blocks - curblock) : 0;
5389689c958cSLi Xi 	}
5390689c958cSLi Xi 
5391689c958cSLi Xi 	limit = dquot->dq_dqb.dqb_isoftlimit ?
5392689c958cSLi Xi 		dquot->dq_dqb.dqb_isoftlimit :
5393689c958cSLi Xi 		dquot->dq_dqb.dqb_ihardlimit;
5394689c958cSLi Xi 	if (limit && buf->f_files > limit) {
5395689c958cSLi Xi 		buf->f_files = limit;
5396689c958cSLi Xi 		buf->f_ffree =
5397689c958cSLi Xi 			(buf->f_files > dquot->dq_dqb.dqb_curinodes) ?
5398689c958cSLi Xi 			 (buf->f_files - dquot->dq_dqb.dqb_curinodes) : 0;
5399689c958cSLi Xi 	}
5400689c958cSLi Xi 
54017b9ca4c6SJan Kara 	spin_unlock(&dquot->dq_dqb_lock);
5402689c958cSLi Xi 	dqput(dquot);
5403689c958cSLi Xi 	return 0;
5404689c958cSLi Xi }
5405689c958cSLi Xi #endif
5406689c958cSLi Xi 
5407617ba13bSMingming Cao static int ext4_statfs(struct dentry *dentry, struct kstatfs *buf)
5408ac27a0ecSDave Kleikamp {
5409ac27a0ecSDave Kleikamp 	struct super_block *sb = dentry->d_sb;
5410617ba13bSMingming Cao 	struct ext4_sb_info *sbi = EXT4_SB(sb);
5411617ba13bSMingming Cao 	struct ext4_super_block *es = sbi->s_es;
541227dd4385SLukas Czerner 	ext4_fsblk_t overhead = 0, resv_blocks;
5413960cc398SPekka Enberg 	u64 fsid;
5414d02a9391SKazuya Mio 	s64 bfree;
541527dd4385SLukas Czerner 	resv_blocks = EXT4_C2B(sbi, atomic64_read(&sbi->s_resv_clusters));
5416ac27a0ecSDave Kleikamp 
5417952fc18eSTheodore Ts'o 	if (!test_opt(sb, MINIX_DF))
5418952fc18eSTheodore Ts'o 		overhead = sbi->s_overhead;
5419ac27a0ecSDave Kleikamp 
5420617ba13bSMingming Cao 	buf->f_type = EXT4_SUPER_MAGIC;
5421ac27a0ecSDave Kleikamp 	buf->f_bsize = sb->s_blocksize;
5422b72f78cbSEric Sandeen 	buf->f_blocks = ext4_blocks_count(es) - EXT4_C2B(sbi, overhead);
542357042651STheodore Ts'o 	bfree = percpu_counter_sum_positive(&sbi->s_freeclusters_counter) -
542457042651STheodore Ts'o 		percpu_counter_sum_positive(&sbi->s_dirtyclusters_counter);
5425d02a9391SKazuya Mio 	/* prevent underflow in case that few free space is available */
542657042651STheodore Ts'o 	buf->f_bfree = EXT4_C2B(sbi, max_t(s64, bfree, 0));
542727dd4385SLukas Czerner 	buf->f_bavail = buf->f_bfree -
542827dd4385SLukas Czerner 			(ext4_r_blocks_count(es) + resv_blocks);
542927dd4385SLukas Czerner 	if (buf->f_bfree < (ext4_r_blocks_count(es) + resv_blocks))
5430ac27a0ecSDave Kleikamp 		buf->f_bavail = 0;
5431ac27a0ecSDave Kleikamp 	buf->f_files = le32_to_cpu(es->s_inodes_count);
543252d9f3b4SPeter Zijlstra 	buf->f_ffree = percpu_counter_sum_positive(&sbi->s_freeinodes_counter);
5433617ba13bSMingming Cao 	buf->f_namelen = EXT4_NAME_LEN;
5434960cc398SPekka Enberg 	fsid = le64_to_cpup((void *)es->s_uuid) ^
5435960cc398SPekka Enberg 	       le64_to_cpup((void *)es->s_uuid + sizeof(u64));
5436960cc398SPekka Enberg 	buf->f_fsid.val[0] = fsid & 0xFFFFFFFFUL;
5437960cc398SPekka Enberg 	buf->f_fsid.val[1] = (fsid >> 32) & 0xFFFFFFFFUL;
54380b8e58a1SAndreas Dilger 
5439689c958cSLi Xi #ifdef CONFIG_QUOTA
5440689c958cSLi Xi 	if (ext4_test_inode_flag(dentry->d_inode, EXT4_INODE_PROJINHERIT) &&
5441689c958cSLi Xi 	    sb_has_quota_limits_enabled(sb, PRJQUOTA))
5442689c958cSLi Xi 		ext4_statfs_project(sb, EXT4_I(dentry->d_inode)->i_projid, buf);
5443689c958cSLi Xi #endif
5444ac27a0ecSDave Kleikamp 	return 0;
5445ac27a0ecSDave Kleikamp }
5446ac27a0ecSDave Kleikamp 
5447ac27a0ecSDave Kleikamp 
5448ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA
5449ac27a0ecSDave Kleikamp 
5450bc8230eeSJan Kara /*
5451bc8230eeSJan Kara  * Helper functions so that transaction is started before we acquire dqio_sem
5452bc8230eeSJan Kara  * to keep correct lock ordering of transaction > dqio_sem
5453bc8230eeSJan Kara  */
5454ac27a0ecSDave Kleikamp static inline struct inode *dquot_to_inode(struct dquot *dquot)
5455ac27a0ecSDave Kleikamp {
54564c376dcaSEric W. Biederman 	return sb_dqopt(dquot->dq_sb)->files[dquot->dq_id.type];
5457ac27a0ecSDave Kleikamp }
5458ac27a0ecSDave Kleikamp 
5459617ba13bSMingming Cao static int ext4_write_dquot(struct dquot *dquot)
5460ac27a0ecSDave Kleikamp {
5461ac27a0ecSDave Kleikamp 	int ret, err;
5462ac27a0ecSDave Kleikamp 	handle_t *handle;
5463ac27a0ecSDave Kleikamp 	struct inode *inode;
5464ac27a0ecSDave Kleikamp 
5465ac27a0ecSDave Kleikamp 	inode = dquot_to_inode(dquot);
54669924a92aSTheodore Ts'o 	handle = ext4_journal_start(inode, EXT4_HT_QUOTA,
5467617ba13bSMingming Cao 				    EXT4_QUOTA_TRANS_BLOCKS(dquot->dq_sb));
5468ac27a0ecSDave Kleikamp 	if (IS_ERR(handle))
5469ac27a0ecSDave Kleikamp 		return PTR_ERR(handle);
5470ac27a0ecSDave Kleikamp 	ret = dquot_commit(dquot);
5471617ba13bSMingming Cao 	err = ext4_journal_stop(handle);
5472ac27a0ecSDave Kleikamp 	if (!ret)
5473ac27a0ecSDave Kleikamp 		ret = err;
5474ac27a0ecSDave Kleikamp 	return ret;
5475ac27a0ecSDave Kleikamp }
5476ac27a0ecSDave Kleikamp 
5477617ba13bSMingming Cao static int ext4_acquire_dquot(struct dquot *dquot)
5478ac27a0ecSDave Kleikamp {
5479ac27a0ecSDave Kleikamp 	int ret, err;
5480ac27a0ecSDave Kleikamp 	handle_t *handle;
5481ac27a0ecSDave Kleikamp 
54829924a92aSTheodore Ts'o 	handle = ext4_journal_start(dquot_to_inode(dquot), EXT4_HT_QUOTA,
5483617ba13bSMingming Cao 				    EXT4_QUOTA_INIT_BLOCKS(dquot->dq_sb));
5484ac27a0ecSDave Kleikamp 	if (IS_ERR(handle))
5485ac27a0ecSDave Kleikamp 		return PTR_ERR(handle);
5486ac27a0ecSDave Kleikamp 	ret = dquot_acquire(dquot);
5487617ba13bSMingming Cao 	err = ext4_journal_stop(handle);
5488ac27a0ecSDave Kleikamp 	if (!ret)
5489ac27a0ecSDave Kleikamp 		ret = err;
5490ac27a0ecSDave Kleikamp 	return ret;
5491ac27a0ecSDave Kleikamp }
5492ac27a0ecSDave Kleikamp 
5493617ba13bSMingming Cao static int ext4_release_dquot(struct dquot *dquot)
5494ac27a0ecSDave Kleikamp {
5495ac27a0ecSDave Kleikamp 	int ret, err;
5496ac27a0ecSDave Kleikamp 	handle_t *handle;
5497ac27a0ecSDave Kleikamp 
54989924a92aSTheodore Ts'o 	handle = ext4_journal_start(dquot_to_inode(dquot), EXT4_HT_QUOTA,
5499617ba13bSMingming Cao 				    EXT4_QUOTA_DEL_BLOCKS(dquot->dq_sb));
55009c3013e9SJan Kara 	if (IS_ERR(handle)) {
55019c3013e9SJan Kara 		/* Release dquot anyway to avoid endless cycle in dqput() */
55029c3013e9SJan Kara 		dquot_release(dquot);
5503ac27a0ecSDave Kleikamp 		return PTR_ERR(handle);
55049c3013e9SJan Kara 	}
5505ac27a0ecSDave Kleikamp 	ret = dquot_release(dquot);
5506617ba13bSMingming Cao 	err = ext4_journal_stop(handle);
5507ac27a0ecSDave Kleikamp 	if (!ret)
5508ac27a0ecSDave Kleikamp 		ret = err;
5509ac27a0ecSDave Kleikamp 	return ret;
5510ac27a0ecSDave Kleikamp }
5511ac27a0ecSDave Kleikamp 
5512617ba13bSMingming Cao static int ext4_mark_dquot_dirty(struct dquot *dquot)
5513ac27a0ecSDave Kleikamp {
5514262b4662SJan Kara 	struct super_block *sb = dquot->dq_sb;
5515262b4662SJan Kara 	struct ext4_sb_info *sbi = EXT4_SB(sb);
5516262b4662SJan Kara 
55172c8be6b2SJan Kara 	/* Are we journaling quotas? */
5518e2b911c5SDarrick J. Wong 	if (ext4_has_feature_quota(sb) ||
5519262b4662SJan Kara 	    sbi->s_qf_names[USRQUOTA] || sbi->s_qf_names[GRPQUOTA]) {
5520ac27a0ecSDave Kleikamp 		dquot_mark_dquot_dirty(dquot);
5521617ba13bSMingming Cao 		return ext4_write_dquot(dquot);
5522ac27a0ecSDave Kleikamp 	} else {
5523ac27a0ecSDave Kleikamp 		return dquot_mark_dquot_dirty(dquot);
5524ac27a0ecSDave Kleikamp 	}
5525ac27a0ecSDave Kleikamp }
5526ac27a0ecSDave Kleikamp 
5527617ba13bSMingming Cao static int ext4_write_info(struct super_block *sb, int type)
5528ac27a0ecSDave Kleikamp {
5529ac27a0ecSDave Kleikamp 	int ret, err;
5530ac27a0ecSDave Kleikamp 	handle_t *handle;
5531ac27a0ecSDave Kleikamp 
5532ac27a0ecSDave Kleikamp 	/* Data block + inode block */
55332b0143b5SDavid Howells 	handle = ext4_journal_start(d_inode(sb->s_root), EXT4_HT_QUOTA, 2);
5534ac27a0ecSDave Kleikamp 	if (IS_ERR(handle))
5535ac27a0ecSDave Kleikamp 		return PTR_ERR(handle);
5536ac27a0ecSDave Kleikamp 	ret = dquot_commit_info(sb, type);
5537617ba13bSMingming Cao 	err = ext4_journal_stop(handle);
5538ac27a0ecSDave Kleikamp 	if (!ret)
5539ac27a0ecSDave Kleikamp 		ret = err;
5540ac27a0ecSDave Kleikamp 	return ret;
5541ac27a0ecSDave Kleikamp }
5542ac27a0ecSDave Kleikamp 
5543ac27a0ecSDave Kleikamp /*
5544ac27a0ecSDave Kleikamp  * Turn on quotas during mount time - we need to find
5545ac27a0ecSDave Kleikamp  * the quota file and such...
5546ac27a0ecSDave Kleikamp  */
5547617ba13bSMingming Cao static int ext4_quota_on_mount(struct super_block *sb, int type)
5548ac27a0ecSDave Kleikamp {
5549287a8095SChristoph Hellwig 	return dquot_quota_on_mount(sb, EXT4_SB(sb)->s_qf_names[type],
5550617ba13bSMingming Cao 					EXT4_SB(sb)->s_jquota_fmt, type);
5551ac27a0ecSDave Kleikamp }
5552ac27a0ecSDave Kleikamp 
5553daf647d2STheodore Ts'o static void lockdep_set_quota_inode(struct inode *inode, int subclass)
5554daf647d2STheodore Ts'o {
5555daf647d2STheodore Ts'o 	struct ext4_inode_info *ei = EXT4_I(inode);
5556daf647d2STheodore Ts'o 
5557daf647d2STheodore Ts'o 	/* The first argument of lockdep_set_subclass has to be
5558daf647d2STheodore Ts'o 	 * *exactly* the same as the argument to init_rwsem() --- in
5559daf647d2STheodore Ts'o 	 * this case, in init_once() --- or lockdep gets unhappy
5560daf647d2STheodore Ts'o 	 * because the name of the lock is set using the
5561daf647d2STheodore Ts'o 	 * stringification of the argument to init_rwsem().
5562daf647d2STheodore Ts'o 	 */
5563daf647d2STheodore Ts'o 	(void) ei;	/* shut up clang warning if !CONFIG_LOCKDEP */
5564daf647d2STheodore Ts'o 	lockdep_set_subclass(&ei->i_data_sem, subclass);
5565daf647d2STheodore Ts'o }
5566daf647d2STheodore Ts'o 
5567ac27a0ecSDave Kleikamp /*
5568ac27a0ecSDave Kleikamp  * Standard function to be called on quota_on
5569ac27a0ecSDave Kleikamp  */
5570617ba13bSMingming Cao static int ext4_quota_on(struct super_block *sb, int type, int format_id,
55718c54ca9cSAl Viro 			 const struct path *path)
5572ac27a0ecSDave Kleikamp {
5573ac27a0ecSDave Kleikamp 	int err;
5574ac27a0ecSDave Kleikamp 
5575ac27a0ecSDave Kleikamp 	if (!test_opt(sb, QUOTA))
5576ac27a0ecSDave Kleikamp 		return -EINVAL;
55770623543bSJan Kara 
5578ac27a0ecSDave Kleikamp 	/* Quotafile not on the same filesystem? */
5579d8c9584eSAl Viro 	if (path->dentry->d_sb != sb)
5580ac27a0ecSDave Kleikamp 		return -EXDEV;
55810623543bSJan Kara 	/* Journaling quota? */
55820623543bSJan Kara 	if (EXT4_SB(sb)->s_qf_names[type]) {
55832b2d6d01STheodore Ts'o 		/* Quotafile not in fs root? */
5584f00c9e44SJan Kara 		if (path->dentry->d_parent != sb->s_root)
5585b31e1552SEric Sandeen 			ext4_msg(sb, KERN_WARNING,
5586b31e1552SEric Sandeen 				"Quota file not on filesystem root. "
5587b31e1552SEric Sandeen 				"Journaled quota will not work");
558891389240SJan Kara 		sb_dqopt(sb)->flags |= DQUOT_NOLIST_DIRTY;
558991389240SJan Kara 	} else {
559091389240SJan Kara 		/*
559191389240SJan Kara 		 * Clear the flag just in case mount options changed since
559291389240SJan Kara 		 * last time.
559391389240SJan Kara 		 */
559491389240SJan Kara 		sb_dqopt(sb)->flags &= ~DQUOT_NOLIST_DIRTY;
55950623543bSJan Kara 	}
55960623543bSJan Kara 
55970623543bSJan Kara 	/*
55980623543bSJan Kara 	 * When we journal data on quota file, we have to flush journal to see
55990623543bSJan Kara 	 * all updates to the file when we bypass pagecache...
56000623543bSJan Kara 	 */
56010390131bSFrank Mayhar 	if (EXT4_SB(sb)->s_journal &&
56022b0143b5SDavid Howells 	    ext4_should_journal_data(d_inode(path->dentry))) {
56030623543bSJan Kara 		/*
56040623543bSJan Kara 		 * We don't need to lock updates but journal_flush() could
56050623543bSJan Kara 		 * otherwise be livelocked...
56060623543bSJan Kara 		 */
56070623543bSJan Kara 		jbd2_journal_lock_updates(EXT4_SB(sb)->s_journal);
56087ffe1ea8SHidehiro Kawai 		err = jbd2_journal_flush(EXT4_SB(sb)->s_journal);
56090623543bSJan Kara 		jbd2_journal_unlock_updates(EXT4_SB(sb)->s_journal);
5610f00c9e44SJan Kara 		if (err)
56117ffe1ea8SHidehiro Kawai 			return err;
56127ffe1ea8SHidehiro Kawai 	}
5613957153fcSJan Kara 
5614daf647d2STheodore Ts'o 	lockdep_set_quota_inode(path->dentry->d_inode, I_DATA_SEM_QUOTA);
5615daf647d2STheodore Ts'o 	err = dquot_quota_on(sb, type, format_id, path);
5616957153fcSJan Kara 	if (err) {
5617daf647d2STheodore Ts'o 		lockdep_set_quota_inode(path->dentry->d_inode,
5618daf647d2STheodore Ts'o 					     I_DATA_SEM_NORMAL);
5619957153fcSJan Kara 	} else {
5620957153fcSJan Kara 		struct inode *inode = d_inode(path->dentry);
5621957153fcSJan Kara 		handle_t *handle;
5622957153fcSJan Kara 
562361a92987SJan Kara 		/*
562461a92987SJan Kara 		 * Set inode flags to prevent userspace from messing with quota
562561a92987SJan Kara 		 * files. If this fails, we return success anyway since quotas
562661a92987SJan Kara 		 * are already enabled and this is not a hard failure.
562761a92987SJan Kara 		 */
5628957153fcSJan Kara 		inode_lock(inode);
5629957153fcSJan Kara 		handle = ext4_journal_start(inode, EXT4_HT_QUOTA, 1);
5630957153fcSJan Kara 		if (IS_ERR(handle))
5631957153fcSJan Kara 			goto unlock_inode;
5632957153fcSJan Kara 		EXT4_I(inode)->i_flags |= EXT4_NOATIME_FL | EXT4_IMMUTABLE_FL;
5633957153fcSJan Kara 		inode_set_flags(inode, S_NOATIME | S_IMMUTABLE,
5634957153fcSJan Kara 				S_NOATIME | S_IMMUTABLE);
5635957153fcSJan Kara 		ext4_mark_inode_dirty(handle, inode);
5636957153fcSJan Kara 		ext4_journal_stop(handle);
5637957153fcSJan Kara 	unlock_inode:
5638957153fcSJan Kara 		inode_unlock(inode);
5639957153fcSJan Kara 	}
5640daf647d2STheodore Ts'o 	return err;
5641ac27a0ecSDave Kleikamp }
5642ac27a0ecSDave Kleikamp 
56437c319d32SAditya Kali static int ext4_quota_enable(struct super_block *sb, int type, int format_id,
56447c319d32SAditya Kali 			     unsigned int flags)
56457c319d32SAditya Kali {
56467c319d32SAditya Kali 	int err;
56477c319d32SAditya Kali 	struct inode *qf_inode;
5648a2d4a646SJan Kara 	unsigned long qf_inums[EXT4_MAXQUOTAS] = {
56497c319d32SAditya Kali 		le32_to_cpu(EXT4_SB(sb)->s_es->s_usr_quota_inum),
5650689c958cSLi Xi 		le32_to_cpu(EXT4_SB(sb)->s_es->s_grp_quota_inum),
5651689c958cSLi Xi 		le32_to_cpu(EXT4_SB(sb)->s_es->s_prj_quota_inum)
56527c319d32SAditya Kali 	};
56537c319d32SAditya Kali 
5654e2b911c5SDarrick J. Wong 	BUG_ON(!ext4_has_feature_quota(sb));
56557c319d32SAditya Kali 
56567c319d32SAditya Kali 	if (!qf_inums[type])
56577c319d32SAditya Kali 		return -EPERM;
56587c319d32SAditya Kali 
56597c319d32SAditya Kali 	qf_inode = ext4_iget(sb, qf_inums[type]);
56607c319d32SAditya Kali 	if (IS_ERR(qf_inode)) {
56617c319d32SAditya Kali 		ext4_error(sb, "Bad quota inode # %lu", qf_inums[type]);
56627c319d32SAditya Kali 		return PTR_ERR(qf_inode);
56637c319d32SAditya Kali 	}
56647c319d32SAditya Kali 
5665bcb13850SJan Kara 	/* Don't account quota for quota files to avoid recursion */
5666bcb13850SJan Kara 	qf_inode->i_flags |= S_NOQUOTA;
5667daf647d2STheodore Ts'o 	lockdep_set_quota_inode(qf_inode, I_DATA_SEM_QUOTA);
56687c319d32SAditya Kali 	err = dquot_enable(qf_inode, type, format_id, flags);
56697c319d32SAditya Kali 	iput(qf_inode);
5670daf647d2STheodore Ts'o 	if (err)
5671daf647d2STheodore Ts'o 		lockdep_set_quota_inode(qf_inode, I_DATA_SEM_NORMAL);
56727c319d32SAditya Kali 
56737c319d32SAditya Kali 	return err;
56747c319d32SAditya Kali }
56757c319d32SAditya Kali 
56767c319d32SAditya Kali /* Enable usage tracking for all quota types. */
56777c319d32SAditya Kali static int ext4_enable_quotas(struct super_block *sb)
56787c319d32SAditya Kali {
56797c319d32SAditya Kali 	int type, err = 0;
5680a2d4a646SJan Kara 	unsigned long qf_inums[EXT4_MAXQUOTAS] = {
56817c319d32SAditya Kali 		le32_to_cpu(EXT4_SB(sb)->s_es->s_usr_quota_inum),
5682689c958cSLi Xi 		le32_to_cpu(EXT4_SB(sb)->s_es->s_grp_quota_inum),
5683689c958cSLi Xi 		le32_to_cpu(EXT4_SB(sb)->s_es->s_prj_quota_inum)
56847c319d32SAditya Kali 	};
568549da9392SJan Kara 	bool quota_mopt[EXT4_MAXQUOTAS] = {
568649da9392SJan Kara 		test_opt(sb, USRQUOTA),
568749da9392SJan Kara 		test_opt(sb, GRPQUOTA),
568849da9392SJan Kara 		test_opt(sb, PRJQUOTA),
568949da9392SJan Kara 	};
56907c319d32SAditya Kali 
569191389240SJan Kara 	sb_dqopt(sb)->flags |= DQUOT_QUOTA_SYS_FILE | DQUOT_NOLIST_DIRTY;
5692a2d4a646SJan Kara 	for (type = 0; type < EXT4_MAXQUOTAS; type++) {
56937c319d32SAditya Kali 		if (qf_inums[type]) {
56947c319d32SAditya Kali 			err = ext4_quota_enable(sb, type, QFMT_VFS_V1,
569549da9392SJan Kara 				DQUOT_USAGE_ENABLED |
569649da9392SJan Kara 				(quota_mopt[type] ? DQUOT_LIMITS_ENABLED : 0));
56977c319d32SAditya Kali 			if (err) {
56987c319d32SAditya Kali 				ext4_warning(sb,
569972ba7450STheodore Ts'o 					"Failed to enable quota tracking "
570072ba7450STheodore Ts'o 					"(type=%d, err=%d). Please run "
570172ba7450STheodore Ts'o 					"e2fsck to fix.", type, err);
57027f144fd0SJunichi Uekawa 				for (type--; type >= 0; type--)
57037f144fd0SJunichi Uekawa 					dquot_quota_off(sb, type);
57047f144fd0SJunichi Uekawa 
57057c319d32SAditya Kali 				return err;
57067c319d32SAditya Kali 			}
57077c319d32SAditya Kali 		}
57087c319d32SAditya Kali 	}
57097c319d32SAditya Kali 	return 0;
57107c319d32SAditya Kali }
57117c319d32SAditya Kali 
5712ca0e05e4SDmitry Monakhov static int ext4_quota_off(struct super_block *sb, int type)
5713ca0e05e4SDmitry Monakhov {
571421f97697SJan Kara 	struct inode *inode = sb_dqopt(sb)->files[type];
571521f97697SJan Kara 	handle_t *handle;
5716957153fcSJan Kara 	int err;
571721f97697SJan Kara 
571887009d86SDmitry Monakhov 	/* Force all delayed allocation blocks to be allocated.
571987009d86SDmitry Monakhov 	 * Caller already holds s_umount sem */
572087009d86SDmitry Monakhov 	if (test_opt(sb, DELALLOC))
5721ca0e05e4SDmitry Monakhov 		sync_filesystem(sb);
5722ca0e05e4SDmitry Monakhov 
5723957153fcSJan Kara 	if (!inode || !igrab(inode))
57240b268590SAmir Goldstein 		goto out;
57250b268590SAmir Goldstein 
5726957153fcSJan Kara 	err = dquot_quota_off(sb, type);
5727964edf66SJan Kara 	if (err || ext4_has_feature_quota(sb))
5728957153fcSJan Kara 		goto out_put;
5729957153fcSJan Kara 
5730957153fcSJan Kara 	inode_lock(inode);
573161a92987SJan Kara 	/*
573261a92987SJan Kara 	 * Update modification times of quota files when userspace can
573361a92987SJan Kara 	 * start looking at them. If we fail, we return success anyway since
573461a92987SJan Kara 	 * this is not a hard failure and quotas are already disabled.
573561a92987SJan Kara 	 */
57369924a92aSTheodore Ts'o 	handle = ext4_journal_start(inode, EXT4_HT_QUOTA, 1);
573721f97697SJan Kara 	if (IS_ERR(handle))
5738957153fcSJan Kara 		goto out_unlock;
5739957153fcSJan Kara 	EXT4_I(inode)->i_flags &= ~(EXT4_NOATIME_FL | EXT4_IMMUTABLE_FL);
5740957153fcSJan Kara 	inode_set_flags(inode, 0, S_NOATIME | S_IMMUTABLE);
5741eeca7ea1SDeepa Dinamani 	inode->i_mtime = inode->i_ctime = current_time(inode);
574221f97697SJan Kara 	ext4_mark_inode_dirty(handle, inode);
574321f97697SJan Kara 	ext4_journal_stop(handle);
5744957153fcSJan Kara out_unlock:
5745957153fcSJan Kara 	inode_unlock(inode);
5746957153fcSJan Kara out_put:
5747964edf66SJan Kara 	lockdep_set_quota_inode(inode, I_DATA_SEM_NORMAL);
5748957153fcSJan Kara 	iput(inode);
5749957153fcSJan Kara 	return err;
575021f97697SJan Kara out:
5751ca0e05e4SDmitry Monakhov 	return dquot_quota_off(sb, type);
5752ca0e05e4SDmitry Monakhov }
5753ca0e05e4SDmitry Monakhov 
5754ac27a0ecSDave Kleikamp /* Read data from quotafile - avoid pagecache and such because we cannot afford
5755ac27a0ecSDave Kleikamp  * acquiring the locks... As quota files are never truncated and quota code
5756ac27a0ecSDave Kleikamp  * itself serializes the operations (and no one else should touch the files)
5757ac27a0ecSDave Kleikamp  * we don't have to be afraid of races */
5758617ba13bSMingming Cao static ssize_t ext4_quota_read(struct super_block *sb, int type, char *data,
5759ac27a0ecSDave Kleikamp 			       size_t len, loff_t off)
5760ac27a0ecSDave Kleikamp {
5761ac27a0ecSDave Kleikamp 	struct inode *inode = sb_dqopt(sb)->files[type];
5762725d26d3SAneesh Kumar K.V 	ext4_lblk_t blk = off >> EXT4_BLOCK_SIZE_BITS(sb);
5763ac27a0ecSDave Kleikamp 	int offset = off & (sb->s_blocksize - 1);
5764ac27a0ecSDave Kleikamp 	int tocopy;
5765ac27a0ecSDave Kleikamp 	size_t toread;
5766ac27a0ecSDave Kleikamp 	struct buffer_head *bh;
5767ac27a0ecSDave Kleikamp 	loff_t i_size = i_size_read(inode);
5768ac27a0ecSDave Kleikamp 
5769ac27a0ecSDave Kleikamp 	if (off > i_size)
5770ac27a0ecSDave Kleikamp 		return 0;
5771ac27a0ecSDave Kleikamp 	if (off+len > i_size)
5772ac27a0ecSDave Kleikamp 		len = i_size-off;
5773ac27a0ecSDave Kleikamp 	toread = len;
5774ac27a0ecSDave Kleikamp 	while (toread > 0) {
5775ac27a0ecSDave Kleikamp 		tocopy = sb->s_blocksize - offset < toread ?
5776ac27a0ecSDave Kleikamp 				sb->s_blocksize - offset : toread;
57771c215028STheodore Ts'o 		bh = ext4_bread(NULL, inode, blk, 0);
57781c215028STheodore Ts'o 		if (IS_ERR(bh))
57791c215028STheodore Ts'o 			return PTR_ERR(bh);
5780ac27a0ecSDave Kleikamp 		if (!bh)	/* A hole? */
5781ac27a0ecSDave Kleikamp 			memset(data, 0, tocopy);
5782ac27a0ecSDave Kleikamp 		else
5783ac27a0ecSDave Kleikamp 			memcpy(data, bh->b_data+offset, tocopy);
5784ac27a0ecSDave Kleikamp 		brelse(bh);
5785ac27a0ecSDave Kleikamp 		offset = 0;
5786ac27a0ecSDave Kleikamp 		toread -= tocopy;
5787ac27a0ecSDave Kleikamp 		data += tocopy;
5788ac27a0ecSDave Kleikamp 		blk++;
5789ac27a0ecSDave Kleikamp 	}
5790ac27a0ecSDave Kleikamp 	return len;
5791ac27a0ecSDave Kleikamp }
5792ac27a0ecSDave Kleikamp 
5793ac27a0ecSDave Kleikamp /* Write to quotafile (we know the transaction is already started and has
5794ac27a0ecSDave Kleikamp  * enough credits) */
5795617ba13bSMingming Cao static ssize_t ext4_quota_write(struct super_block *sb, int type,
5796ac27a0ecSDave Kleikamp 				const char *data, size_t len, loff_t off)
5797ac27a0ecSDave Kleikamp {
5798ac27a0ecSDave Kleikamp 	struct inode *inode = sb_dqopt(sb)->files[type];
5799725d26d3SAneesh Kumar K.V 	ext4_lblk_t blk = off >> EXT4_BLOCK_SIZE_BITS(sb);
58001c215028STheodore Ts'o 	int err, offset = off & (sb->s_blocksize - 1);
5801c5e298aeSTheodore Ts'o 	int retries = 0;
5802ac27a0ecSDave Kleikamp 	struct buffer_head *bh;
5803ac27a0ecSDave Kleikamp 	handle_t *handle = journal_current_handle();
5804ac27a0ecSDave Kleikamp 
58050390131bSFrank Mayhar 	if (EXT4_SB(sb)->s_journal && !handle) {
5806b31e1552SEric Sandeen 		ext4_msg(sb, KERN_WARNING, "Quota write (off=%llu, len=%llu)"
5807b31e1552SEric Sandeen 			" cancelled because transaction is not started",
58089c3013e9SJan Kara 			(unsigned long long)off, (unsigned long long)len);
58099c3013e9SJan Kara 		return -EIO;
58109c3013e9SJan Kara 	}
581167eeb568SDmitry Monakhov 	/*
581267eeb568SDmitry Monakhov 	 * Since we account only one data block in transaction credits,
581367eeb568SDmitry Monakhov 	 * then it is impossible to cross a block boundary.
581467eeb568SDmitry Monakhov 	 */
581567eeb568SDmitry Monakhov 	if (sb->s_blocksize - offset < len) {
581667eeb568SDmitry Monakhov 		ext4_msg(sb, KERN_WARNING, "Quota write (off=%llu, len=%llu)"
581767eeb568SDmitry Monakhov 			" cancelled because not block aligned",
581867eeb568SDmitry Monakhov 			(unsigned long long)off, (unsigned long long)len);
581967eeb568SDmitry Monakhov 		return -EIO;
582067eeb568SDmitry Monakhov 	}
582167eeb568SDmitry Monakhov 
5822c5e298aeSTheodore Ts'o 	do {
5823c5e298aeSTheodore Ts'o 		bh = ext4_bread(handle, inode, blk,
5824c5e298aeSTheodore Ts'o 				EXT4_GET_BLOCKS_CREATE |
5825c5e298aeSTheodore Ts'o 				EXT4_GET_BLOCKS_METADATA_NOFAIL);
5826c5e298aeSTheodore Ts'o 	} while (IS_ERR(bh) && (PTR_ERR(bh) == -ENOSPC) &&
5827c5e298aeSTheodore Ts'o 		 ext4_should_retry_alloc(inode->i_sb, &retries));
58281c215028STheodore Ts'o 	if (IS_ERR(bh))
58291c215028STheodore Ts'o 		return PTR_ERR(bh);
5830ac27a0ecSDave Kleikamp 	if (!bh)
5831ac27a0ecSDave Kleikamp 		goto out;
58325d601255Sliang xie 	BUFFER_TRACE(bh, "get write access");
5833617ba13bSMingming Cao 	err = ext4_journal_get_write_access(handle, bh);
5834ac27a0ecSDave Kleikamp 	if (err) {
5835ac27a0ecSDave Kleikamp 		brelse(bh);
58361c215028STheodore Ts'o 		return err;
5837ac27a0ecSDave Kleikamp 	}
5838ac27a0ecSDave Kleikamp 	lock_buffer(bh);
583967eeb568SDmitry Monakhov 	memcpy(bh->b_data+offset, data, len);
5840ac27a0ecSDave Kleikamp 	flush_dcache_page(bh->b_page);
5841ac27a0ecSDave Kleikamp 	unlock_buffer(bh);
58420390131bSFrank Mayhar 	err = ext4_handle_dirty_metadata(handle, NULL, bh);
5843ac27a0ecSDave Kleikamp 	brelse(bh);
5844ac27a0ecSDave Kleikamp out:
584567eeb568SDmitry Monakhov 	if (inode->i_size < off + len) {
584667eeb568SDmitry Monakhov 		i_size_write(inode, off + len);
5847617ba13bSMingming Cao 		EXT4_I(inode)->i_disksize = inode->i_size;
5848617ba13bSMingming Cao 		ext4_mark_inode_dirty(handle, inode);
584921f97697SJan Kara 	}
585067eeb568SDmitry Monakhov 	return len;
5851ac27a0ecSDave Kleikamp }
5852ac27a0ecSDave Kleikamp 
58538f0e8746STheodore Ts'o static int ext4_get_next_id(struct super_block *sb, struct kqid *qid)
58548f0e8746STheodore Ts'o {
58558f0e8746STheodore Ts'o 	const struct quota_format_ops	*ops;
58568f0e8746STheodore Ts'o 
58578f0e8746STheodore Ts'o 	if (!sb_has_quota_loaded(sb, qid->type))
58588f0e8746STheodore Ts'o 		return -ESRCH;
58598f0e8746STheodore Ts'o 	ops = sb_dqopt(sb)->ops[qid->type];
58608f0e8746STheodore Ts'o 	if (!ops || !ops->get_next_id)
58618f0e8746STheodore Ts'o 		return -ENOSYS;
58628f0e8746STheodore Ts'o 	return dquot_get_next_id(sb, qid);
58638f0e8746STheodore Ts'o }
5864ac27a0ecSDave Kleikamp #endif
5865ac27a0ecSDave Kleikamp 
5866152a0836SAl Viro static struct dentry *ext4_mount(struct file_system_type *fs_type, int flags,
5867152a0836SAl Viro 		       const char *dev_name, void *data)
5868ac27a0ecSDave Kleikamp {
5869152a0836SAl Viro 	return mount_bdev(fs_type, flags, dev_name, data, ext4_fill_super);
5870ac27a0ecSDave Kleikamp }
5871ac27a0ecSDave Kleikamp 
5872c290ea01SJan Kara #if !defined(CONFIG_EXT2_FS) && !defined(CONFIG_EXT2_FS_MODULE) && defined(CONFIG_EXT4_USE_FOR_EXT2)
587324b58424STheodore Ts'o static inline void register_as_ext2(void)
587424b58424STheodore Ts'o {
587524b58424STheodore Ts'o 	int err = register_filesystem(&ext2_fs_type);
587624b58424STheodore Ts'o 	if (err)
587724b58424STheodore Ts'o 		printk(KERN_WARNING
587824b58424STheodore Ts'o 		       "EXT4-fs: Unable to register as ext2 (%d)\n", err);
587924b58424STheodore Ts'o }
588024b58424STheodore Ts'o 
588124b58424STheodore Ts'o static inline void unregister_as_ext2(void)
588224b58424STheodore Ts'o {
588324b58424STheodore Ts'o 	unregister_filesystem(&ext2_fs_type);
588424b58424STheodore Ts'o }
58852035e776STheodore Ts'o 
/*
 * Decide whether @sb carries only features acceptable for an ext2 mount.
 *
 * Returns 0 when unknown incompat features are present.  Otherwise returns 1
 * for a read-only superblock, and for a writable one returns 1 only when no
 * unknown ro_compat features are present.
 */
static inline int ext2_feature_set_ok(struct super_block *sb)
{
	if (ext4_has_unknown_ext2_incompat_features(sb))
		return 0;

	/* ro_compat features are only consulted when not read-only. */
	return sb_rdonly(sb) ||
	       !ext4_has_unknown_ext2_ro_compat_features(sb);
}
589624b58424STheodore Ts'o #else
/*
 * Stubs for the #else branch of the ext2 conditional above: registration
 * does nothing and no feature set is ever accepted as ext2.
 */
static inline void register_as_ext2(void)
{
}

static inline void unregister_as_ext2(void)
{
}

static inline int ext2_feature_set_ok(struct super_block *sb)
{
	return 0;
}
590024b58424STheodore Ts'o #endif
590124b58424STheodore Ts'o 
590224b58424STheodore Ts'o static inline void register_as_ext3(void)
590324b58424STheodore Ts'o {
590424b58424STheodore Ts'o 	int err = register_filesystem(&ext3_fs_type);
590524b58424STheodore Ts'o 	if (err)
590624b58424STheodore Ts'o 		printk(KERN_WARNING
590724b58424STheodore Ts'o 		       "EXT4-fs: Unable to register as ext3 (%d)\n", err);
590824b58424STheodore Ts'o }
590924b58424STheodore Ts'o 
591024b58424STheodore Ts'o static inline void unregister_as_ext3(void)
591124b58424STheodore Ts'o {
591224b58424STheodore Ts'o 	unregister_filesystem(&ext3_fs_type);
591324b58424STheodore Ts'o }
59142035e776STheodore Ts'o 
/*
 * Decide whether @sb carries only features acceptable for an ext3 mount.
 *
 * Returns 0 when unknown incompat features are present or when the journal
 * feature is missing.  Otherwise returns 1 for a read-only superblock, and
 * for a writable one returns 1 only when no unknown ro_compat features are
 * present.
 */
static inline int ext3_feature_set_ok(struct super_block *sb)
{
	if (ext4_has_unknown_ext3_incompat_features(sb) ||
	    !ext4_has_feature_journal(sb))
		return 0;

	/* ro_compat features are only consulted when not read-only. */
	return sb_rdonly(sb) ||
	       !ext4_has_unknown_ext3_ro_compat_features(sb);
}
592724b58424STheodore Ts'o 
592803010a33STheodore Ts'o static struct file_system_type ext4_fs_type = {
5929ac27a0ecSDave Kleikamp 	.owner		= THIS_MODULE,
593003010a33STheodore Ts'o 	.name		= "ext4",
5931152a0836SAl Viro 	.mount		= ext4_mount,
5932ac27a0ecSDave Kleikamp 	.kill_sb	= kill_block_super,
5933ac27a0ecSDave Kleikamp 	.fs_flags	= FS_REQUIRES_DEV,
5934ac27a0ecSDave Kleikamp };
59357f78e035SEric W. Biederman MODULE_ALIAS_FS("ext4");
5936ac27a0ecSDave Kleikamp 
5937e9e3bcecSEric Sandeen /* Shared across all ext4 file systems */
5938e9e3bcecSEric Sandeen wait_queue_head_t ext4__ioend_wq[EXT4_WQ_HASH_SZ];
5939e9e3bcecSEric Sandeen 
59405dabfc78STheodore Ts'o static int __init ext4_init_fs(void)
5941ac27a0ecSDave Kleikamp {
5942e9e3bcecSEric Sandeen 	int i, err;
5943c9de560dSAlex Tomas 
5944e294a537STheodore Ts'o 	ratelimit_state_init(&ext4_mount_msg_ratelimit, 30 * HZ, 64);
594507c0c5d8SAl Viro 	ext4_li_info = NULL;
594607c0c5d8SAl Viro 	mutex_init(&ext4_li_mtx);
594707c0c5d8SAl Viro 
59489a4c8019SCarlos Maiolino 	/* Build-time check for flags consistency */
594912e9b892SDmitry Monakhov 	ext4_check_flag_values();
5950e9e3bcecSEric Sandeen 
5951e142d052SJan Kara 	for (i = 0; i < EXT4_WQ_HASH_SZ; i++)
5952e9e3bcecSEric Sandeen 		init_waitqueue_head(&ext4__ioend_wq[i]);
5953e9e3bcecSEric Sandeen 
595451865fdaSZheng Liu 	err = ext4_init_es();
59556fd058f7STheodore Ts'o 	if (err)
59566fd058f7STheodore Ts'o 		return err;
595751865fdaSZheng Liu 
5958*1dc0aa46SEric Whitney 	err = ext4_init_pending();
5959*1dc0aa46SEric Whitney 	if (err)
5960*1dc0aa46SEric Whitney 		goto out6;
5961*1dc0aa46SEric Whitney 
596251865fdaSZheng Liu 	err = ext4_init_pageio();
596351865fdaSZheng Liu 	if (err)
5964b5799018STheodore Ts'o 		goto out5;
596551865fdaSZheng Liu 
59665dabfc78STheodore Ts'o 	err = ext4_init_system_zone();
5967bd2d0210STheodore Ts'o 	if (err)
5968b5799018STheodore Ts'o 		goto out4;
5969857ac889SLukas Czerner 
5970b5799018STheodore Ts'o 	err = ext4_init_sysfs();
5971dd68314cSTheodore Ts'o 	if (err)
5972b5799018STheodore Ts'o 		goto out3;
5973857ac889SLukas Czerner 
59745dabfc78STheodore Ts'o 	err = ext4_init_mballoc();
5975ac27a0ecSDave Kleikamp 	if (err)
5976c9de560dSAlex Tomas 		goto out2;
5977ac27a0ecSDave Kleikamp 	err = init_inodecache();
5978ac27a0ecSDave Kleikamp 	if (err)
5979ac27a0ecSDave Kleikamp 		goto out1;
598024b58424STheodore Ts'o 	register_as_ext3();
59812035e776STheodore Ts'o 	register_as_ext2();
598203010a33STheodore Ts'o 	err = register_filesystem(&ext4_fs_type);
5983ac27a0ecSDave Kleikamp 	if (err)
5984ac27a0ecSDave Kleikamp 		goto out;
5985bfff6873SLukas Czerner 
5986ac27a0ecSDave Kleikamp 	return 0;
5987ac27a0ecSDave Kleikamp out:
598824b58424STheodore Ts'o 	unregister_as_ext2();
598924b58424STheodore Ts'o 	unregister_as_ext3();
5990ac27a0ecSDave Kleikamp 	destroy_inodecache();
5991ac27a0ecSDave Kleikamp out1:
59925dabfc78STheodore Ts'o 	ext4_exit_mballoc();
59939c191f70ST Makphaibulchoke out2:
5994b5799018STheodore Ts'o 	ext4_exit_sysfs();
5995b5799018STheodore Ts'o out3:
5996dd68314cSTheodore Ts'o 	ext4_exit_system_zone();
5997b5799018STheodore Ts'o out4:
59985dabfc78STheodore Ts'o 	ext4_exit_pageio();
5999b5799018STheodore Ts'o out5:
6000*1dc0aa46SEric Whitney 	ext4_exit_pending();
6001*1dc0aa46SEric Whitney out6:
600251865fdaSZheng Liu 	ext4_exit_es();
600351865fdaSZheng Liu 
6004ac27a0ecSDave Kleikamp 	return err;
6005ac27a0ecSDave Kleikamp }
6006ac27a0ecSDave Kleikamp 
60075dabfc78STheodore Ts'o static void __exit ext4_exit_fs(void)
6008ac27a0ecSDave Kleikamp {
6009bfff6873SLukas Czerner 	ext4_destroy_lazyinit_thread();
601024b58424STheodore Ts'o 	unregister_as_ext2();
601124b58424STheodore Ts'o 	unregister_as_ext3();
601203010a33STheodore Ts'o 	unregister_filesystem(&ext4_fs_type);
6013ac27a0ecSDave Kleikamp 	destroy_inodecache();
60145dabfc78STheodore Ts'o 	ext4_exit_mballoc();
6015b5799018STheodore Ts'o 	ext4_exit_sysfs();
60165dabfc78STheodore Ts'o 	ext4_exit_system_zone();
60175dabfc78STheodore Ts'o 	ext4_exit_pageio();
6018dd12ed14SEric Sandeen 	ext4_exit_es();
6019*1dc0aa46SEric Whitney 	ext4_exit_pending();
6020ac27a0ecSDave Kleikamp }
6021ac27a0ecSDave Kleikamp 
6022ac27a0ecSDave Kleikamp MODULE_AUTHOR("Remy Card, Stephen Tweedie, Andrew Morton, Andreas Dilger, Theodore Ts'o and others");
602383982b6fSTheodore Ts'o MODULE_DESCRIPTION("Fourth Extended Filesystem");
6024ac27a0ecSDave Kleikamp MODULE_LICENSE("GPL");
60257ef79ad5STheodore Ts'o MODULE_SOFTDEP("pre: crc32c");
60265dabfc78STheodore Ts'o module_init(ext4_init_fs)
60275dabfc78STheodore Ts'o module_exit(ext4_exit_fs)
6028