1f5166768STheodore Ts'o // SPDX-License-Identifier: GPL-2.0 2ac27a0ecSDave Kleikamp /* 3617ba13bSMingming Cao * linux/fs/ext4/super.c 4ac27a0ecSDave Kleikamp * 5ac27a0ecSDave Kleikamp * Copyright (C) 1992, 1993, 1994, 1995 6ac27a0ecSDave Kleikamp * Remy Card (card@masi.ibp.fr) 7ac27a0ecSDave Kleikamp * Laboratoire MASI - Institut Blaise Pascal 8ac27a0ecSDave Kleikamp * Universite Pierre et Marie Curie (Paris VI) 9ac27a0ecSDave Kleikamp * 10ac27a0ecSDave Kleikamp * from 11ac27a0ecSDave Kleikamp * 12ac27a0ecSDave Kleikamp * linux/fs/minix/inode.c 13ac27a0ecSDave Kleikamp * 14ac27a0ecSDave Kleikamp * Copyright (C) 1991, 1992 Linus Torvalds 15ac27a0ecSDave Kleikamp * 16ac27a0ecSDave Kleikamp * Big-endian to little-endian byte-swapping/bitmaps by 17ac27a0ecSDave Kleikamp * David S. Miller (davem@caip.rutgers.edu), 1995 18ac27a0ecSDave Kleikamp */ 19ac27a0ecSDave Kleikamp 20ac27a0ecSDave Kleikamp #include <linux/module.h> 21ac27a0ecSDave Kleikamp #include <linux/string.h> 22ac27a0ecSDave Kleikamp #include <linux/fs.h> 23ac27a0ecSDave Kleikamp #include <linux/time.h> 24c5ca7c76STheodore Ts'o #include <linux/vmalloc.h> 25ac27a0ecSDave Kleikamp #include <linux/slab.h> 26ac27a0ecSDave Kleikamp #include <linux/init.h> 27ac27a0ecSDave Kleikamp #include <linux/blkdev.h> 2866114cadSTejun Heo #include <linux/backing-dev.h> 29ac27a0ecSDave Kleikamp #include <linux/parser.h> 30ac27a0ecSDave Kleikamp #include <linux/buffer_head.h> 31a5694255SChristoph Hellwig #include <linux/exportfs.h> 32ac27a0ecSDave Kleikamp #include <linux/vfs.h> 33ac27a0ecSDave Kleikamp #include <linux/random.h> 34ac27a0ecSDave Kleikamp #include <linux/mount.h> 35ac27a0ecSDave Kleikamp #include <linux/namei.h> 36ac27a0ecSDave Kleikamp #include <linux/quotaops.h> 37ac27a0ecSDave Kleikamp #include <linux/seq_file.h> 383197ebdbSTheodore Ts'o #include <linux/ctype.h> 391330593eSVignesh Babu #include <linux/log2.h> 40717d50e4SAndreas Dilger #include <linux/crc16.h> 41ef510424SDan Williams #include <linux/dax.h> 427abc52c2SDan Magenheimer #include <linux/cleancache.h> 437c0f6ba6SLinus Torvalds #include <linux/uaccess.h> 44ee73f9a5SJeff Layton #include <linux/iversion.h> 45c83ad55eSGabriel Krisman Bertazi #include <linux/unicode.h> 46ac27a0ecSDave Kleikamp 47bfff6873SLukas Czerner #include <linux/kthread.h> 48bfff6873SLukas Czerner #include <linux/freezer.h> 49bfff6873SLukas Czerner 503dcf5451SChristoph Hellwig #include "ext4.h" 514a092d73STheodore Ts'o #include "ext4_extents.h" /* Needed for trace points definition */ 523dcf5451SChristoph Hellwig #include "ext4_jbd2.h" 53ac27a0ecSDave Kleikamp #include "xattr.h" 54ac27a0ecSDave Kleikamp #include "acl.h" 553661d286STheodore Ts'o #include "mballoc.h" 560c9ec4beSDarrick J. Wong #include "fsmap.h" 57ac27a0ecSDave Kleikamp 589bffad1eSTheodore Ts'o #define CREATE_TRACE_POINTS 599bffad1eSTheodore Ts'o #include <trace/events/ext4.h> 609bffad1eSTheodore Ts'o 610b75a840SLukas Czerner static struct ext4_lazy_init *ext4_li_info; 620b75a840SLukas Czerner static struct mutex ext4_li_mtx; 63e294a537STheodore Ts'o static struct ratelimit_state ext4_mount_msg_ratelimit; 649f6200bbSTheodore Ts'o 65617ba13bSMingming Cao static int ext4_load_journal(struct super_block *, struct ext4_super_block *, 66ac27a0ecSDave Kleikamp unsigned long journal_devnum); 672adf6da8STheodore Ts'o static int ext4_show_options(struct seq_file *seq, struct dentry *root); 68e2d67052STheodore Ts'o static int ext4_commit_super(struct super_block *sb, int sync); 69617ba13bSMingming Cao static void ext4_mark_recovery_complete(struct super_block *sb, 70617ba13bSMingming Cao struct ext4_super_block *es); 71617ba13bSMingming Cao static void ext4_clear_journal_err(struct super_block *sb, 72617ba13bSMingming Cao struct ext4_super_block *es); 73617ba13bSMingming Cao static int ext4_sync_fs(struct super_block *sb, int wait); 74617ba13bSMingming Cao static int ext4_remount(struct super_block *sb, int *flags, char *data); 75617ba13bSMingming Cao static int ext4_statfs(struct dentry *dentry, struct kstatfs *buf); 76c4be0c1dSTakashi Sato static int ext4_unfreeze(struct super_block *sb); 77c4be0c1dSTakashi Sato static int ext4_freeze(struct super_block *sb); 78152a0836SAl Viro static struct dentry *ext4_mount(struct file_system_type *fs_type, int flags, 79152a0836SAl Viro const char *dev_name, void *data); 802035e776STheodore Ts'o static inline int ext2_feature_set_ok(struct super_block *sb); 812035e776STheodore Ts'o static inline int ext3_feature_set_ok(struct super_block *sb); 82d39195c3SAmir Goldstein static int ext4_feature_set_ok(struct super_block *sb, int readonly); 83bfff6873SLukas Czerner static void ext4_destroy_lazyinit_thread(void); 84bfff6873SLukas Czerner static void ext4_unregister_li_request(struct super_block *sb); 858f1f7453SEric Sandeen static void ext4_clear_request_list(void); 86c6cb7e77SEric Whitney static struct inode *ext4_get_journal_inode(struct super_block *sb, 87c6cb7e77SEric Whitney unsigned int journal_inum); 88ac27a0ecSDave Kleikamp 89e74031fdSJan Kara /* 90e74031fdSJan Kara * Lock ordering 91e74031fdSJan Kara * 92e74031fdSJan Kara * Note the difference between i_mmap_sem (EXT4_I(inode)->i_mmap_sem) and 93e74031fdSJan Kara * i_mmap_rwsem (inode->i_mmap_rwsem)! 94e74031fdSJan Kara * 95e74031fdSJan Kara * page fault path: 96e74031fdSJan Kara * mmap_sem -> sb_start_pagefault -> i_mmap_sem (r) -> transaction start -> 97e74031fdSJan Kara * page lock -> i_data_sem (rw) 98e74031fdSJan Kara * 99e74031fdSJan Kara * buffered write path: 100e74031fdSJan Kara * sb_start_write -> i_mutex -> mmap_sem 101e74031fdSJan Kara * sb_start_write -> i_mutex -> transaction start -> page lock -> 102e74031fdSJan Kara * i_data_sem (rw) 103e74031fdSJan Kara * 104e74031fdSJan Kara * truncate: 1051d39834fSNikolay Borisov * sb_start_write -> i_mutex -> i_mmap_sem (w) -> i_mmap_rwsem (w) -> page lock 1061d39834fSNikolay Borisov * sb_start_write -> i_mutex -> i_mmap_sem (w) -> transaction start -> 1071d39834fSNikolay Borisov * i_data_sem (rw) 108e74031fdSJan Kara * 109e74031fdSJan Kara * direct IO: 1101d39834fSNikolay Borisov * sb_start_write -> i_mutex -> mmap_sem 1111d39834fSNikolay Borisov * sb_start_write -> i_mutex -> transaction start -> i_data_sem (rw) 112e74031fdSJan Kara * 113e74031fdSJan Kara * writepages: 114e74031fdSJan Kara * transaction start -> page lock(s) -> i_data_sem (rw) 115e74031fdSJan Kara */ 116e74031fdSJan Kara 117c290ea01SJan Kara #if !defined(CONFIG_EXT2_FS) && !defined(CONFIG_EXT2_FS_MODULE) && defined(CONFIG_EXT4_USE_FOR_EXT2) 1182035e776STheodore Ts'o static struct file_system_type ext2_fs_type = { 1192035e776STheodore Ts'o .owner = THIS_MODULE, 1202035e776STheodore Ts'o .name = "ext2", 1212035e776STheodore Ts'o .mount = ext4_mount, 1222035e776STheodore Ts'o .kill_sb = kill_block_super, 1232035e776STheodore Ts'o .fs_flags = FS_REQUIRES_DEV, 1242035e776STheodore Ts'o }; 1257f78e035SEric W. Biederman MODULE_ALIAS_FS("ext2"); 126fa7614ddSEric W. Biederman MODULE_ALIAS("ext2"); 1272035e776STheodore Ts'o #define IS_EXT2_SB(sb) ((sb)->s_bdev->bd_holder == &ext2_fs_type) 1282035e776STheodore Ts'o #else 1292035e776STheodore Ts'o #define IS_EXT2_SB(sb) (0) 1302035e776STheodore Ts'o #endif 1312035e776STheodore Ts'o 1322035e776STheodore Ts'o 133ba69f9abSJan Kara static struct file_system_type ext3_fs_type = { 134ba69f9abSJan Kara .owner = THIS_MODULE, 135ba69f9abSJan Kara .name = "ext3", 136152a0836SAl Viro .mount = ext4_mount, 137ba69f9abSJan Kara .kill_sb = kill_block_super, 138ba69f9abSJan Kara .fs_flags = FS_REQUIRES_DEV, 139ba69f9abSJan Kara }; 1407f78e035SEric W. Biederman MODULE_ALIAS_FS("ext3"); 141fa7614ddSEric W. Biederman MODULE_ALIAS("ext3"); 142ba69f9abSJan Kara #define IS_EXT3_SB(sb) ((sb)->s_bdev->bd_holder == &ext3_fs_type) 143bd81d8eeSLaurent Vivier 144fb265c9cSTheodore Ts'o /* 145fb265c9cSTheodore Ts'o * This works like sb_bread() except it uses ERR_PTR for error 146fb265c9cSTheodore Ts'o * returns. Currently with sb_bread it's impossible to distinguish 147fb265c9cSTheodore Ts'o * between ENOMEM and EIO situations (since both result in a NULL 148fb265c9cSTheodore Ts'o * return. 149fb265c9cSTheodore Ts'o */ 150fb265c9cSTheodore Ts'o struct buffer_head * 151fb265c9cSTheodore Ts'o ext4_sb_bread(struct super_block *sb, sector_t block, int op_flags) 152fb265c9cSTheodore Ts'o { 153fb265c9cSTheodore Ts'o struct buffer_head *bh = sb_getblk(sb, block); 154fb265c9cSTheodore Ts'o 155fb265c9cSTheodore Ts'o if (bh == NULL) 156fb265c9cSTheodore Ts'o return ERR_PTR(-ENOMEM); 157cf2834a5STheodore Ts'o if (ext4_buffer_uptodate(bh)) 158fb265c9cSTheodore Ts'o return bh; 159fb265c9cSTheodore Ts'o ll_rw_block(REQ_OP_READ, REQ_META | op_flags, 1, &bh); 160fb265c9cSTheodore Ts'o wait_on_buffer(bh); 161fb265c9cSTheodore Ts'o if (buffer_uptodate(bh)) 162fb265c9cSTheodore Ts'o return bh; 163fb265c9cSTheodore Ts'o put_bh(bh); 164fb265c9cSTheodore Ts'o return ERR_PTR(-EIO); 165fb265c9cSTheodore Ts'o } 166fb265c9cSTheodore Ts'o 167d25425f8SDarrick J. Wong static int ext4_verify_csum_type(struct super_block *sb, 168d25425f8SDarrick J. Wong struct ext4_super_block *es) 169d25425f8SDarrick J. Wong { 170e2b911c5SDarrick J. Wong if (!ext4_has_feature_metadata_csum(sb)) 171d25425f8SDarrick J. Wong return 1; 172d25425f8SDarrick J. Wong 173d25425f8SDarrick J. Wong return es->s_checksum_type == EXT4_CRC32C_CHKSUM; 174d25425f8SDarrick J. Wong } 175d25425f8SDarrick J. Wong 176a9c47317SDarrick J. Wong static __le32 ext4_superblock_csum(struct super_block *sb, 177a9c47317SDarrick J. Wong struct ext4_super_block *es) 178a9c47317SDarrick J. Wong { 179a9c47317SDarrick J. Wong struct ext4_sb_info *sbi = EXT4_SB(sb); 180a9c47317SDarrick J. Wong int offset = offsetof(struct ext4_super_block, s_checksum); 181a9c47317SDarrick J. Wong __u32 csum; 182a9c47317SDarrick J. Wong 183a9c47317SDarrick J. Wong csum = ext4_chksum(sbi, ~0, (char *)es, offset); 184a9c47317SDarrick J. Wong 185a9c47317SDarrick J. Wong return cpu_to_le32(csum); 186a9c47317SDarrick J. Wong } 187a9c47317SDarrick J. Wong 188c197855eSStephen Hemminger static int ext4_superblock_csum_verify(struct super_block *sb, 189a9c47317SDarrick J. Wong struct ext4_super_block *es) 190a9c47317SDarrick J. Wong { 1919aa5d32bSDmitry Monakhov if (!ext4_has_metadata_csum(sb)) 192a9c47317SDarrick J. Wong return 1; 193a9c47317SDarrick J. Wong 194a9c47317SDarrick J. Wong return es->s_checksum == ext4_superblock_csum(sb, es); 195a9c47317SDarrick J. Wong } 196a9c47317SDarrick J. Wong 19706db49e6STheodore Ts'o void ext4_superblock_csum_set(struct super_block *sb) 198a9c47317SDarrick J. Wong { 19906db49e6STheodore Ts'o struct ext4_super_block *es = EXT4_SB(sb)->s_es; 20006db49e6STheodore Ts'o 2019aa5d32bSDmitry Monakhov if (!ext4_has_metadata_csum(sb)) 202a9c47317SDarrick J. Wong return; 203a9c47317SDarrick J. Wong 204a9c47317SDarrick J. Wong es->s_checksum = ext4_superblock_csum(sb, es); 205a9c47317SDarrick J. Wong } 206a9c47317SDarrick J. Wong 2079933fc0aSTheodore Ts'o void *ext4_kvmalloc(size_t size, gfp_t flags) 2089933fc0aSTheodore Ts'o { 2099933fc0aSTheodore Ts'o void *ret; 2109933fc0aSTheodore Ts'o 2118be04b93SJoe Perches ret = kmalloc(size, flags | __GFP_NOWARN); 2129933fc0aSTheodore Ts'o if (!ret) 2139933fc0aSTheodore Ts'o ret = __vmalloc(size, flags, PAGE_KERNEL); 2149933fc0aSTheodore Ts'o return ret; 2159933fc0aSTheodore Ts'o } 2169933fc0aSTheodore Ts'o 2179933fc0aSTheodore Ts'o void *ext4_kvzalloc(size_t size, gfp_t flags) 2189933fc0aSTheodore Ts'o { 2199933fc0aSTheodore Ts'o void *ret; 2209933fc0aSTheodore Ts'o 2218be04b93SJoe Perches ret = kzalloc(size, flags | __GFP_NOWARN); 2229933fc0aSTheodore Ts'o if (!ret) 2239933fc0aSTheodore Ts'o ret = __vmalloc(size, flags | __GFP_ZERO, PAGE_KERNEL); 2249933fc0aSTheodore Ts'o return ret; 2259933fc0aSTheodore Ts'o } 2269933fc0aSTheodore Ts'o 2278fadc143SAlexandre Ratchov ext4_fsblk_t ext4_block_bitmap(struct super_block *sb, 2288fadc143SAlexandre Ratchov struct ext4_group_desc *bg) 229bd81d8eeSLaurent Vivier { 2303a14589cSAneesh Kumar K.V return le32_to_cpu(bg->bg_block_bitmap_lo) | 2318fadc143SAlexandre Ratchov (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT ? 2328fadc143SAlexandre Ratchov (ext4_fsblk_t)le32_to_cpu(bg->bg_block_bitmap_hi) << 32 : 0); 233bd81d8eeSLaurent Vivier } 234bd81d8eeSLaurent Vivier 2358fadc143SAlexandre Ratchov ext4_fsblk_t ext4_inode_bitmap(struct super_block *sb, 2368fadc143SAlexandre Ratchov struct ext4_group_desc *bg) 237bd81d8eeSLaurent Vivier { 2385272f837SAneesh Kumar K.V return le32_to_cpu(bg->bg_inode_bitmap_lo) | 2398fadc143SAlexandre Ratchov (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT ? 2408fadc143SAlexandre Ratchov (ext4_fsblk_t)le32_to_cpu(bg->bg_inode_bitmap_hi) << 32 : 0); 241bd81d8eeSLaurent Vivier } 242bd81d8eeSLaurent Vivier 2438fadc143SAlexandre Ratchov ext4_fsblk_t ext4_inode_table(struct super_block *sb, 2448fadc143SAlexandre Ratchov struct ext4_group_desc *bg) 245bd81d8eeSLaurent Vivier { 2465272f837SAneesh Kumar K.V return le32_to_cpu(bg->bg_inode_table_lo) | 2478fadc143SAlexandre Ratchov (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT ? 2488fadc143SAlexandre Ratchov (ext4_fsblk_t)le32_to_cpu(bg->bg_inode_table_hi) << 32 : 0); 249bd81d8eeSLaurent Vivier } 250bd81d8eeSLaurent Vivier 251021b65bbSTheodore Ts'o __u32 ext4_free_group_clusters(struct super_block *sb, 252560671a0SAneesh Kumar K.V struct ext4_group_desc *bg) 253560671a0SAneesh Kumar K.V { 254560671a0SAneesh Kumar K.V return le16_to_cpu(bg->bg_free_blocks_count_lo) | 255560671a0SAneesh Kumar K.V (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT ? 256560671a0SAneesh Kumar K.V (__u32)le16_to_cpu(bg->bg_free_blocks_count_hi) << 16 : 0); 257560671a0SAneesh Kumar K.V } 258560671a0SAneesh Kumar K.V 259560671a0SAneesh Kumar K.V __u32 ext4_free_inodes_count(struct super_block *sb, 260560671a0SAneesh Kumar K.V struct ext4_group_desc *bg) 261560671a0SAneesh Kumar K.V { 262560671a0SAneesh Kumar K.V return le16_to_cpu(bg->bg_free_inodes_count_lo) | 263560671a0SAneesh Kumar K.V (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT ? 264560671a0SAneesh Kumar K.V (__u32)le16_to_cpu(bg->bg_free_inodes_count_hi) << 16 : 0); 265560671a0SAneesh Kumar K.V } 266560671a0SAneesh Kumar K.V 267560671a0SAneesh Kumar K.V __u32 ext4_used_dirs_count(struct super_block *sb, 268560671a0SAneesh Kumar K.V struct ext4_group_desc *bg) 269560671a0SAneesh Kumar K.V { 270560671a0SAneesh Kumar K.V return le16_to_cpu(bg->bg_used_dirs_count_lo) | 271560671a0SAneesh Kumar K.V (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT ? 272560671a0SAneesh Kumar K.V (__u32)le16_to_cpu(bg->bg_used_dirs_count_hi) << 16 : 0); 273560671a0SAneesh Kumar K.V } 274560671a0SAneesh Kumar K.V 275560671a0SAneesh Kumar K.V __u32 ext4_itable_unused_count(struct super_block *sb, 276560671a0SAneesh Kumar K.V struct ext4_group_desc *bg) 277560671a0SAneesh Kumar K.V { 278560671a0SAneesh Kumar K.V return le16_to_cpu(bg->bg_itable_unused_lo) | 279560671a0SAneesh Kumar K.V (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT ? 280560671a0SAneesh Kumar K.V (__u32)le16_to_cpu(bg->bg_itable_unused_hi) << 16 : 0); 281560671a0SAneesh Kumar K.V } 282560671a0SAneesh Kumar K.V 2838fadc143SAlexandre Ratchov void ext4_block_bitmap_set(struct super_block *sb, 2848fadc143SAlexandre Ratchov struct ext4_group_desc *bg, ext4_fsblk_t blk) 285bd81d8eeSLaurent Vivier { 2863a14589cSAneesh Kumar K.V bg->bg_block_bitmap_lo = cpu_to_le32((u32)blk); 2878fadc143SAlexandre Ratchov if (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT) 2888fadc143SAlexandre Ratchov bg->bg_block_bitmap_hi = cpu_to_le32(blk >> 32); 289bd81d8eeSLaurent Vivier } 290bd81d8eeSLaurent Vivier 2918fadc143SAlexandre Ratchov void ext4_inode_bitmap_set(struct super_block *sb, 2928fadc143SAlexandre Ratchov struct ext4_group_desc *bg, ext4_fsblk_t blk) 293bd81d8eeSLaurent Vivier { 2945272f837SAneesh Kumar K.V bg->bg_inode_bitmap_lo = cpu_to_le32((u32)blk); 2958fadc143SAlexandre Ratchov if (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT) 2968fadc143SAlexandre Ratchov bg->bg_inode_bitmap_hi = cpu_to_le32(blk >> 32); 297bd81d8eeSLaurent Vivier } 298bd81d8eeSLaurent Vivier 2998fadc143SAlexandre Ratchov void ext4_inode_table_set(struct super_block *sb, 3008fadc143SAlexandre Ratchov struct ext4_group_desc *bg, ext4_fsblk_t blk) 301bd81d8eeSLaurent Vivier { 3025272f837SAneesh Kumar K.V bg->bg_inode_table_lo = cpu_to_le32((u32)blk); 3038fadc143SAlexandre Ratchov if (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT) 3048fadc143SAlexandre Ratchov bg->bg_inode_table_hi = cpu_to_le32(blk >> 32); 305bd81d8eeSLaurent Vivier } 306bd81d8eeSLaurent Vivier 307021b65bbSTheodore Ts'o void ext4_free_group_clusters_set(struct super_block *sb, 308560671a0SAneesh Kumar K.V struct ext4_group_desc *bg, __u32 count) 309560671a0SAneesh Kumar K.V { 310560671a0SAneesh Kumar K.V bg->bg_free_blocks_count_lo = cpu_to_le16((__u16)count); 311560671a0SAneesh Kumar K.V if (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT) 312560671a0SAneesh Kumar K.V bg->bg_free_blocks_count_hi = cpu_to_le16(count >> 16); 313560671a0SAneesh Kumar K.V } 314560671a0SAneesh Kumar K.V 315560671a0SAneesh Kumar K.V void ext4_free_inodes_set(struct super_block *sb, 316560671a0SAneesh Kumar K.V struct ext4_group_desc *bg, __u32 count) 317560671a0SAneesh Kumar K.V { 318560671a0SAneesh Kumar K.V bg->bg_free_inodes_count_lo = cpu_to_le16((__u16)count); 319560671a0SAneesh Kumar K.V if (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT) 320560671a0SAneesh Kumar K.V bg->bg_free_inodes_count_hi = cpu_to_le16(count >> 16); 321560671a0SAneesh Kumar K.V } 322560671a0SAneesh Kumar K.V 323560671a0SAneesh Kumar K.V void ext4_used_dirs_set(struct super_block *sb, 324560671a0SAneesh Kumar K.V struct ext4_group_desc *bg, __u32 count) 325560671a0SAneesh Kumar K.V { 326560671a0SAneesh Kumar K.V bg->bg_used_dirs_count_lo = cpu_to_le16((__u16)count); 327560671a0SAneesh Kumar K.V if (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT) 328560671a0SAneesh Kumar K.V bg->bg_used_dirs_count_hi = cpu_to_le16(count >> 16); 329560671a0SAneesh Kumar K.V } 330560671a0SAneesh Kumar K.V 331560671a0SAneesh Kumar K.V void ext4_itable_unused_set(struct super_block *sb, 332560671a0SAneesh Kumar K.V struct ext4_group_desc *bg, __u32 count) 333560671a0SAneesh Kumar K.V { 334560671a0SAneesh Kumar K.V bg->bg_itable_unused_lo = cpu_to_le16((__u16)count); 335560671a0SAneesh Kumar K.V if (EXT4_DESC_SIZE(sb) >= EXT4_MIN_DESC_SIZE_64BIT) 336560671a0SAneesh Kumar K.V bg->bg_itable_unused_hi = cpu_to_le16(count >> 16); 337560671a0SAneesh Kumar K.V } 338560671a0SAneesh Kumar K.V 3396a0678a7SArnd Bergmann static void __ext4_update_tstamp(__le32 *lo, __u8 *hi) 3406a0678a7SArnd Bergmann { 3416a0678a7SArnd Bergmann time64_t now = ktime_get_real_seconds(); 3426a0678a7SArnd Bergmann 3436a0678a7SArnd Bergmann now = clamp_val(now, 0, (1ull << 40) - 1); 3446a0678a7SArnd Bergmann 3456a0678a7SArnd Bergmann *lo = cpu_to_le32(lower_32_bits(now)); 3466a0678a7SArnd Bergmann *hi = upper_32_bits(now); 3476a0678a7SArnd Bergmann } 3486a0678a7SArnd Bergmann 3496a0678a7SArnd Bergmann static time64_t __ext4_get_tstamp(__le32 *lo, __u8 *hi) 3506a0678a7SArnd Bergmann { 3516a0678a7SArnd Bergmann return ((time64_t)(*hi) << 32) + le32_to_cpu(*lo); 3526a0678a7SArnd Bergmann } 3536a0678a7SArnd Bergmann #define ext4_update_tstamp(es, tstamp) \ 3546a0678a7SArnd Bergmann __ext4_update_tstamp(&(es)->tstamp, &(es)->tstamp ## _hi) 3556a0678a7SArnd Bergmann #define ext4_get_tstamp(es, tstamp) \ 3566a0678a7SArnd Bergmann __ext4_get_tstamp(&(es)->tstamp, &(es)->tstamp ## _hi) 357d3d1faf6SCurt Wohlgemuth 3581c13d5c0STheodore Ts'o static void __save_error_info(struct super_block *sb, const char *func, 3591c13d5c0STheodore Ts'o unsigned int line) 3601c13d5c0STheodore Ts'o { 3611c13d5c0STheodore Ts'o struct ext4_super_block *es = EXT4_SB(sb)->s_es; 3621c13d5c0STheodore Ts'o 3631c13d5c0STheodore Ts'o EXT4_SB(sb)->s_mount_state |= EXT4_ERROR_FS; 3641b46617bSTheodore Ts'o if (bdev_read_only(sb->s_bdev)) 3651b46617bSTheodore Ts'o return; 3661c13d5c0STheodore Ts'o es->s_state |= cpu_to_le16(EXT4_ERROR_FS); 3676a0678a7SArnd Bergmann ext4_update_tstamp(es, s_last_error_time); 3681c13d5c0STheodore Ts'o strncpy(es->s_last_error_func, func, sizeof(es->s_last_error_func)); 3691c13d5c0STheodore Ts'o es->s_last_error_line = cpu_to_le32(line); 370*878520acSTheodore Ts'o if (es->s_last_error_errcode == 0) 371*878520acSTheodore Ts'o es->s_last_error_errcode = EXT4_ERR_EFSCORRUPTED; 3721c13d5c0STheodore Ts'o if (!es->s_first_error_time) { 3731c13d5c0STheodore Ts'o es->s_first_error_time = es->s_last_error_time; 3746a0678a7SArnd Bergmann es->s_first_error_time_hi = es->s_last_error_time_hi; 3751c13d5c0STheodore Ts'o strncpy(es->s_first_error_func, func, 3761c13d5c0STheodore Ts'o sizeof(es->s_first_error_func)); 3771c13d5c0STheodore Ts'o es->s_first_error_line = cpu_to_le32(line); 3781c13d5c0STheodore Ts'o es->s_first_error_ino = es->s_last_error_ino; 3791c13d5c0STheodore Ts'o es->s_first_error_block = es->s_last_error_block; 380*878520acSTheodore Ts'o es->s_first_error_errcode = es->s_last_error_errcode; 3811c13d5c0STheodore Ts'o } 38266e61a9eSTheodore Ts'o /* 38366e61a9eSTheodore Ts'o * Start the daily error reporting function if it hasn't been 38466e61a9eSTheodore Ts'o * started already 38566e61a9eSTheodore Ts'o */ 38666e61a9eSTheodore Ts'o if (!es->s_error_count) 38766e61a9eSTheodore Ts'o mod_timer(&EXT4_SB(sb)->s_err_report, jiffies + 24*60*60*HZ); 388ba39ebb6SWei Yongjun le32_add_cpu(&es->s_error_count, 1); 3891c13d5c0STheodore Ts'o } 3901c13d5c0STheodore Ts'o 3911c13d5c0STheodore Ts'o static void save_error_info(struct super_block *sb, const char *func, 3921c13d5c0STheodore Ts'o unsigned int line) 3931c13d5c0STheodore Ts'o { 3941c13d5c0STheodore Ts'o __save_error_info(sb, func, line); 3951c13d5c0STheodore Ts'o ext4_commit_super(sb, 1); 3961c13d5c0STheodore Ts'o } 3971c13d5c0STheodore Ts'o 398bdfe0cbdSTheodore Ts'o /* 399bdfe0cbdSTheodore Ts'o * The del_gendisk() function uninitializes the disk-specific data 400bdfe0cbdSTheodore Ts'o * structures, including the bdi structure, without telling anyone 401bdfe0cbdSTheodore Ts'o * else. Once this happens, any attempt to call mark_buffer_dirty() 402bdfe0cbdSTheodore Ts'o * (for example, by ext4_commit_super), will cause a kernel OOPS. 403bdfe0cbdSTheodore Ts'o * This is a kludge to prevent these oops until we can put in a proper 404bdfe0cbdSTheodore Ts'o * hook in del_gendisk() to inform the VFS and file system layers. 405bdfe0cbdSTheodore Ts'o */ 406bdfe0cbdSTheodore Ts'o static int block_device_ejected(struct super_block *sb) 407bdfe0cbdSTheodore Ts'o { 408bdfe0cbdSTheodore Ts'o struct inode *bd_inode = sb->s_bdev->bd_inode; 409bdfe0cbdSTheodore Ts'o struct backing_dev_info *bdi = inode_to_bdi(bd_inode); 410bdfe0cbdSTheodore Ts'o 411bdfe0cbdSTheodore Ts'o return bdi->dev == NULL; 412bdfe0cbdSTheodore Ts'o } 413bdfe0cbdSTheodore Ts'o 41418aadd47SBobi Jam static void ext4_journal_commit_callback(journal_t *journal, transaction_t *txn) 41518aadd47SBobi Jam { 41618aadd47SBobi Jam struct super_block *sb = journal->j_private; 41718aadd47SBobi Jam struct ext4_sb_info *sbi = EXT4_SB(sb); 41818aadd47SBobi Jam int error = is_journal_aborted(journal); 4195d3ee208SDmitry Monakhov struct ext4_journal_cb_entry *jce; 42018aadd47SBobi Jam 4215d3ee208SDmitry Monakhov BUG_ON(txn->t_state == T_FINISHED); 422a0154344SDaeho Jeong 423a0154344SDaeho Jeong ext4_process_freed_data(sb, txn->t_tid); 424a0154344SDaeho Jeong 42518aadd47SBobi Jam spin_lock(&sbi->s_md_lock); 4265d3ee208SDmitry Monakhov while (!list_empty(&txn->t_private_list)) { 4275d3ee208SDmitry Monakhov jce = list_entry(txn->t_private_list.next, 4285d3ee208SDmitry Monakhov struct ext4_journal_cb_entry, jce_list); 42918aadd47SBobi Jam list_del_init(&jce->jce_list); 43018aadd47SBobi Jam spin_unlock(&sbi->s_md_lock); 43118aadd47SBobi Jam jce->jce_func(sb, jce, error); 43218aadd47SBobi Jam spin_lock(&sbi->s_md_lock); 43318aadd47SBobi Jam } 43418aadd47SBobi Jam spin_unlock(&sbi->s_md_lock); 43518aadd47SBobi Jam } 4361c13d5c0STheodore Ts'o 4371dc1097fSJan Kara static bool system_going_down(void) 4381dc1097fSJan Kara { 4391dc1097fSJan Kara return system_state == SYSTEM_HALT || system_state == SYSTEM_POWER_OFF 4401dc1097fSJan Kara || system_state == SYSTEM_RESTART; 4411dc1097fSJan Kara } 4421dc1097fSJan Kara 443ac27a0ecSDave Kleikamp /* Deal with the reporting of failure conditions on a filesystem such as 444ac27a0ecSDave Kleikamp * inconsistencies detected or read IO failures. 445ac27a0ecSDave Kleikamp * 446ac27a0ecSDave Kleikamp * On ext2, we can store the error state of the filesystem in the 447617ba13bSMingming Cao * superblock. That is not possible on ext4, because we may have other 448ac27a0ecSDave Kleikamp * write ordering constraints on the superblock which prevent us from 449ac27a0ecSDave Kleikamp * writing it out straight away; and given that the journal is about to 450ac27a0ecSDave Kleikamp * be aborted, we can't rely on the current, or future, transactions to 451ac27a0ecSDave Kleikamp * write out the superblock safely. 452ac27a0ecSDave Kleikamp * 453dab291afSMingming Cao * We'll just use the jbd2_journal_abort() error code to record an error in 454d6b198bcSThadeu Lima de Souza Cascardo * the journal instead. On recovery, the journal will complain about 455ac27a0ecSDave Kleikamp * that error until we've noted it down and cleared it. 456ac27a0ecSDave Kleikamp */ 457ac27a0ecSDave Kleikamp 458617ba13bSMingming Cao static void ext4_handle_error(struct super_block *sb) 459ac27a0ecSDave Kleikamp { 460327eaf73STheodore Ts'o if (test_opt(sb, WARN_ON_ERROR)) 461327eaf73STheodore Ts'o WARN_ON_ONCE(1); 462327eaf73STheodore Ts'o 463bc98a42cSDavid Howells if (sb_rdonly(sb)) 464ac27a0ecSDave Kleikamp return; 465ac27a0ecSDave Kleikamp 466ac27a0ecSDave Kleikamp if (!test_opt(sb, ERRORS_CONT)) { 467617ba13bSMingming Cao journal_t *journal = EXT4_SB(sb)->s_journal; 468ac27a0ecSDave Kleikamp 4694ab2f15bSTheodore Ts'o EXT4_SB(sb)->s_mount_flags |= EXT4_MF_FS_ABORTED; 470ac27a0ecSDave Kleikamp if (journal) 471dab291afSMingming Cao jbd2_journal_abort(journal, -EIO); 472ac27a0ecSDave Kleikamp } 4731dc1097fSJan Kara /* 4741dc1097fSJan Kara * We force ERRORS_RO behavior when system is rebooting. Otherwise we 4751dc1097fSJan Kara * could panic during 'reboot -f' as the underlying device got already 4761dc1097fSJan Kara * disabled. 4771dc1097fSJan Kara */ 4781dc1097fSJan Kara if (test_opt(sb, ERRORS_RO) || system_going_down()) { 479b31e1552SEric Sandeen ext4_msg(sb, KERN_CRIT, "Remounting filesystem read-only"); 4804418e141SDmitry Monakhov /* 4814418e141SDmitry Monakhov * Make sure updated value of ->s_mount_flags will be visible 4824418e141SDmitry Monakhov * before ->s_flags update 4834418e141SDmitry Monakhov */ 4844418e141SDmitry Monakhov smp_wmb(); 4851751e8a6SLinus Torvalds sb->s_flags |= SB_RDONLY; 4861dc1097fSJan Kara } else if (test_opt(sb, ERRORS_PANIC)) { 4874327ba52SDaeho Jeong if (EXT4_SB(sb)->s_journal && 4884327ba52SDaeho Jeong !(EXT4_SB(sb)->s_journal->j_flags & JBD2_REC_ERR)) 4894327ba52SDaeho Jeong return; 490617ba13bSMingming Cao panic("EXT4-fs (device %s): panic forced after error\n", 491ac27a0ecSDave Kleikamp sb->s_id); 492ac27a0ecSDave Kleikamp } 4934327ba52SDaeho Jeong } 494ac27a0ecSDave Kleikamp 495efbed4dcSTheodore Ts'o #define ext4_error_ratelimit(sb) \ 496efbed4dcSTheodore Ts'o ___ratelimit(&(EXT4_SB(sb)->s_err_ratelimit_state), \ 497efbed4dcSTheodore Ts'o "EXT4-fs error") 498efbed4dcSTheodore Ts'o 49912062dddSEric Sandeen void __ext4_error(struct super_block *sb, const char *function, 500c398eda0STheodore Ts'o unsigned int line, const char *fmt, ...) 501ac27a0ecSDave Kleikamp { 5020ff2ea7dSJoe Perches struct va_format vaf; 503ac27a0ecSDave Kleikamp va_list args; 504ac27a0ecSDave Kleikamp 5050db1ff22STheodore Ts'o if (unlikely(ext4_forced_shutdown(EXT4_SB(sb)))) 5060db1ff22STheodore Ts'o return; 5070db1ff22STheodore Ts'o 508ccf0f32aSTheodore Ts'o trace_ext4_error(sb, function, line); 509efbed4dcSTheodore Ts'o if (ext4_error_ratelimit(sb)) { 510ac27a0ecSDave Kleikamp va_start(args, fmt); 5110ff2ea7dSJoe Perches vaf.fmt = fmt; 5120ff2ea7dSJoe Perches vaf.va = &args; 513efbed4dcSTheodore Ts'o printk(KERN_CRIT 514efbed4dcSTheodore Ts'o "EXT4-fs error (device %s): %s:%d: comm %s: %pV\n", 5150ff2ea7dSJoe Perches sb->s_id, function, line, current->comm, &vaf); 516ac27a0ecSDave Kleikamp va_end(args); 517efbed4dcSTheodore Ts'o } 518f3fc0210STheodore Ts'o save_error_info(sb, function, line); 519617ba13bSMingming Cao ext4_handle_error(sb); 520ac27a0ecSDave Kleikamp } 521ac27a0ecSDave Kleikamp 522e7c96e8eSJoe Perches void __ext4_error_inode(struct inode *inode, const char *function, 523c398eda0STheodore Ts'o unsigned int line, ext4_fsblk_t block, 524273df556SFrank Mayhar const char *fmt, ...) 525273df556SFrank Mayhar { 526273df556SFrank Mayhar va_list args; 527f7c21177STheodore Ts'o struct va_format vaf; 5281c13d5c0STheodore Ts'o struct ext4_super_block *es = EXT4_SB(inode->i_sb)->s_es; 529273df556SFrank Mayhar 5300db1ff22STheodore Ts'o if (unlikely(ext4_forced_shutdown(EXT4_SB(inode->i_sb)))) 5310db1ff22STheodore Ts'o return; 5320db1ff22STheodore Ts'o 533ccf0f32aSTheodore Ts'o trace_ext4_error(inode->i_sb, function, line); 5341c13d5c0STheodore Ts'o es->s_last_error_ino = cpu_to_le32(inode->i_ino); 5351c13d5c0STheodore Ts'o es->s_last_error_block = cpu_to_le64(block); 536efbed4dcSTheodore Ts'o if (ext4_error_ratelimit(inode->i_sb)) { 537273df556SFrank Mayhar va_start(args, fmt); 538f7c21177STheodore Ts'o vaf.fmt = fmt; 539f7c21177STheodore Ts'o vaf.va = &args; 540c398eda0STheodore Ts'o if (block) 541d9ee81daSJoe Perches printk(KERN_CRIT "EXT4-fs error (device %s): %s:%d: " 542d9ee81daSJoe Perches "inode #%lu: block %llu: comm %s: %pV\n", 543d9ee81daSJoe Perches inode->i_sb->s_id, function, line, inode->i_ino, 544d9ee81daSJoe Perches block, current->comm, &vaf); 545d9ee81daSJoe Perches else 546d9ee81daSJoe Perches printk(KERN_CRIT "EXT4-fs error (device %s): %s:%d: " 547d9ee81daSJoe Perches "inode #%lu: comm %s: %pV\n", 548d9ee81daSJoe Perches inode->i_sb->s_id, function, line, inode->i_ino, 549d9ee81daSJoe Perches current->comm, &vaf); 550273df556SFrank Mayhar va_end(args); 551efbed4dcSTheodore Ts'o } 552efbed4dcSTheodore Ts'o save_error_info(inode->i_sb, function, line); 553273df556SFrank Mayhar ext4_handle_error(inode->i_sb); 554273df556SFrank Mayhar } 555273df556SFrank Mayhar 556e7c96e8eSJoe Perches void __ext4_error_file(struct file *file, const char *function, 557f7c21177STheodore Ts'o unsigned int line, ext4_fsblk_t block, 558f7c21177STheodore Ts'o const char *fmt, ...) 559273df556SFrank Mayhar { 560273df556SFrank Mayhar va_list args; 561f7c21177STheodore Ts'o struct va_format vaf; 5621c13d5c0STheodore Ts'o struct ext4_super_block *es; 563496ad9aaSAl Viro struct inode *inode = file_inode(file); 564273df556SFrank Mayhar char pathname[80], *path; 565273df556SFrank Mayhar 5660db1ff22STheodore Ts'o if (unlikely(ext4_forced_shutdown(EXT4_SB(inode->i_sb)))) 5670db1ff22STheodore Ts'o return; 5680db1ff22STheodore Ts'o 569ccf0f32aSTheodore Ts'o trace_ext4_error(inode->i_sb, function, line); 5701c13d5c0STheodore Ts'o es = EXT4_SB(inode->i_sb)->s_es; 5711c13d5c0STheodore Ts'o es->s_last_error_ino = cpu_to_le32(inode->i_ino); 572efbed4dcSTheodore Ts'o if (ext4_error_ratelimit(inode->i_sb)) { 5739bf39ab2SMiklos Szeredi path = file_path(file, pathname, sizeof(pathname)); 574f9a62d09SDan Carpenter if (IS_ERR(path)) 575273df556SFrank Mayhar path = "(unknown)"; 576f7c21177STheodore Ts'o va_start(args, fmt); 577f7c21177STheodore Ts'o vaf.fmt = fmt; 578f7c21177STheodore Ts'o vaf.va = &args; 579d9ee81daSJoe Perches if (block) 580d9ee81daSJoe Perches printk(KERN_CRIT 581d9ee81daSJoe Perches "EXT4-fs error (device %s): %s:%d: inode #%lu: " 582d9ee81daSJoe Perches "block %llu: comm %s: path %s: %pV\n", 583d9ee81daSJoe Perches inode->i_sb->s_id, function, line, inode->i_ino, 584d9ee81daSJoe Perches block, current->comm, path, &vaf); 585d9ee81daSJoe Perches else 586d9ee81daSJoe Perches printk(KERN_CRIT 587d9ee81daSJoe Perches "EXT4-fs error (device %s): %s:%d: inode #%lu: " 588d9ee81daSJoe Perches "comm %s: path %s: %pV\n", 589d9ee81daSJoe Perches inode->i_sb->s_id, function, line, inode->i_ino, 590d9ee81daSJoe Perches current->comm, path, &vaf); 591273df556SFrank Mayhar va_end(args); 592efbed4dcSTheodore Ts'o } 593efbed4dcSTheodore Ts'o save_error_info(inode->i_sb, function, line); 594273df556SFrank Mayhar ext4_handle_error(inode->i_sb); 595273df556SFrank Mayhar } 596273df556SFrank Mayhar 597722887ddSTheodore Ts'o const char *ext4_decode_error(struct super_block *sb, int errno, 598ac27a0ecSDave Kleikamp char nbuf[16]) 599ac27a0ecSDave Kleikamp { 600ac27a0ecSDave Kleikamp char *errstr = NULL; 601ac27a0ecSDave Kleikamp 602ac27a0ecSDave Kleikamp switch (errno) { 6036a797d27SDarrick J. Wong case -EFSCORRUPTED: 6046a797d27SDarrick J. Wong errstr = "Corrupt filesystem"; 6056a797d27SDarrick J. Wong break; 6066a797d27SDarrick J. Wong case -EFSBADCRC: 6076a797d27SDarrick J. Wong errstr = "Filesystem failed CRC"; 6086a797d27SDarrick J. Wong break; 609ac27a0ecSDave Kleikamp case -EIO: 610ac27a0ecSDave Kleikamp errstr = "IO failure"; 611ac27a0ecSDave Kleikamp break; 612ac27a0ecSDave Kleikamp case -ENOMEM: 613ac27a0ecSDave Kleikamp errstr = "Out of memory"; 614ac27a0ecSDave Kleikamp break; 615ac27a0ecSDave Kleikamp case -EROFS: 61678f1ddbbSTheodore Ts'o if (!sb || (EXT4_SB(sb)->s_journal && 61778f1ddbbSTheodore Ts'o EXT4_SB(sb)->s_journal->j_flags & JBD2_ABORT)) 618ac27a0ecSDave Kleikamp errstr = "Journal has aborted"; 619ac27a0ecSDave Kleikamp else 620ac27a0ecSDave Kleikamp errstr = "Readonly filesystem"; 621ac27a0ecSDave Kleikamp break; 622ac27a0ecSDave Kleikamp default: 623ac27a0ecSDave Kleikamp /* If the caller passed in an extra buffer for unknown 624ac27a0ecSDave Kleikamp * errors, textualise them now. Else we just return 625ac27a0ecSDave Kleikamp * NULL. */ 626ac27a0ecSDave Kleikamp if (nbuf) { 627ac27a0ecSDave Kleikamp /* Check for truncated error codes... */ 628ac27a0ecSDave Kleikamp if (snprintf(nbuf, 16, "error %d", -errno) >= 0) 629ac27a0ecSDave Kleikamp errstr = nbuf; 630ac27a0ecSDave Kleikamp } 631ac27a0ecSDave Kleikamp break; 632ac27a0ecSDave Kleikamp } 633ac27a0ecSDave Kleikamp 634ac27a0ecSDave Kleikamp return errstr; 635ac27a0ecSDave Kleikamp } 636ac27a0ecSDave Kleikamp 637*878520acSTheodore Ts'o void ext4_set_errno(struct super_block *sb, int err) 638*878520acSTheodore Ts'o { 639*878520acSTheodore Ts'o if (err < 0) 640*878520acSTheodore Ts'o err = -err; 641*878520acSTheodore Ts'o 642*878520acSTheodore Ts'o switch (err) { 643*878520acSTheodore Ts'o case EIO: 644*878520acSTheodore Ts'o err = EXT4_ERR_EIO; 645*878520acSTheodore Ts'o break; 646*878520acSTheodore Ts'o case ENOMEM: 647*878520acSTheodore Ts'o err = EXT4_ERR_ENOMEM; 648*878520acSTheodore Ts'o break; 649*878520acSTheodore Ts'o case EFSBADCRC: 650*878520acSTheodore Ts'o err = EXT4_ERR_EFSBADCRC; 651*878520acSTheodore Ts'o break; 652*878520acSTheodore Ts'o case EFSCORRUPTED: 653*878520acSTheodore Ts'o err = EXT4_ERR_EFSCORRUPTED; 654*878520acSTheodore Ts'o break; 655*878520acSTheodore Ts'o case ENOSPC: 656*878520acSTheodore Ts'o err = EXT4_ERR_ENOSPC; 657*878520acSTheodore Ts'o break; 658*878520acSTheodore Ts'o case ENOKEY: 659*878520acSTheodore Ts'o err = EXT4_ERR_ENOKEY; 660*878520acSTheodore Ts'o break; 661*878520acSTheodore Ts'o case EROFS: 662*878520acSTheodore Ts'o err = EXT4_ERR_EROFS; 663*878520acSTheodore Ts'o break; 664*878520acSTheodore Ts'o case EFBIG: 665*878520acSTheodore Ts'o err = EXT4_ERR_EFBIG; 666*878520acSTheodore Ts'o break; 667*878520acSTheodore Ts'o case EEXIST: 668*878520acSTheodore Ts'o err = EXT4_ERR_EEXIST; 669*878520acSTheodore Ts'o break; 670*878520acSTheodore Ts'o case ERANGE: 671*878520acSTheodore Ts'o err = EXT4_ERR_ERANGE; 672*878520acSTheodore Ts'o break; 673*878520acSTheodore Ts'o case EOVERFLOW: 674*878520acSTheodore Ts'o err = EXT4_ERR_EOVERFLOW; 675*878520acSTheodore Ts'o break; 676*878520acSTheodore Ts'o case EBUSY: 677*878520acSTheodore Ts'o err = EXT4_ERR_EBUSY; 678*878520acSTheodore Ts'o break; 679*878520acSTheodore Ts'o case ENOTDIR: 680*878520acSTheodore Ts'o err = EXT4_ERR_ENOTDIR; 681*878520acSTheodore Ts'o break; 682*878520acSTheodore Ts'o case ENOTEMPTY: 683*878520acSTheodore Ts'o err = EXT4_ERR_ENOTEMPTY; 684*878520acSTheodore Ts'o break; 685*878520acSTheodore Ts'o case ESHUTDOWN: 686*878520acSTheodore Ts'o err = EXT4_ERR_ESHUTDOWN; 687*878520acSTheodore Ts'o break; 688*878520acSTheodore Ts'o case EFAULT: 689*878520acSTheodore Ts'o err = EXT4_ERR_EFAULT; 690*878520acSTheodore Ts'o break; 691*878520acSTheodore Ts'o default: 692*878520acSTheodore Ts'o err = EXT4_ERR_UNKNOWN; 693*878520acSTheodore Ts'o } 694*878520acSTheodore Ts'o EXT4_SB(sb)->s_es->s_last_error_errcode = err; 695*878520acSTheodore Ts'o } 696*878520acSTheodore Ts'o 697617ba13bSMingming Cao /* __ext4_std_error decodes expected errors from journaling functions 698ac27a0ecSDave Kleikamp * automatically and invokes the appropriate error response. */ 699ac27a0ecSDave Kleikamp 700c398eda0STheodore Ts'o void __ext4_std_error(struct super_block *sb, const char *function, 701c398eda0STheodore Ts'o unsigned int line, int errno) 702ac27a0ecSDave Kleikamp { 703ac27a0ecSDave Kleikamp char nbuf[16]; 704ac27a0ecSDave Kleikamp const char *errstr; 705ac27a0ecSDave Kleikamp 7060db1ff22STheodore Ts'o if (unlikely(ext4_forced_shutdown(EXT4_SB(sb)))) 7070db1ff22STheodore Ts'o return; 7080db1ff22STheodore Ts'o 709ac27a0ecSDave Kleikamp /* Special case: if the error is EROFS, and we're not already 710ac27a0ecSDave Kleikamp * inside a transaction, then there's really no point in logging 711ac27a0ecSDave Kleikamp * an error. */ 712bc98a42cSDavid Howells if (errno == -EROFS && journal_current_handle() == NULL && sb_rdonly(sb)) 713ac27a0ecSDave Kleikamp return; 714ac27a0ecSDave Kleikamp 715efbed4dcSTheodore Ts'o if (ext4_error_ratelimit(sb)) { 716617ba13bSMingming Cao errstr = ext4_decode_error(sb, errno, nbuf); 717c398eda0STheodore Ts'o printk(KERN_CRIT "EXT4-fs error (device %s) in %s:%d: %s\n", 718c398eda0STheodore Ts'o sb->s_id, function, line, errstr); 719efbed4dcSTheodore Ts'o } 720ac27a0ecSDave Kleikamp 721*878520acSTheodore Ts'o ext4_set_errno(sb, -errno); 722efbed4dcSTheodore Ts'o save_error_info(sb, function, line); 723617ba13bSMingming Cao ext4_handle_error(sb); 724ac27a0ecSDave Kleikamp } 725ac27a0ecSDave Kleikamp 726ac27a0ecSDave Kleikamp /* 727617ba13bSMingming Cao * ext4_abort is a much stronger failure handler than ext4_error. The 728ac27a0ecSDave Kleikamp * abort function may be used to deal with unrecoverable failures such 729ac27a0ecSDave Kleikamp * as journal IO errors or ENOMEM at a critical moment in log management. 730ac27a0ecSDave Kleikamp * 731ac27a0ecSDave Kleikamp * We unconditionally force the filesystem into an ABORT|READONLY state, 732ac27a0ecSDave Kleikamp * unless the error response on the fs has been set to panic in which 733ac27a0ecSDave Kleikamp * case we take the easy way out and panic immediately. 734ac27a0ecSDave Kleikamp */ 735ac27a0ecSDave Kleikamp 736c67d859eSTheodore Ts'o void __ext4_abort(struct super_block *sb, const char *function, 737c398eda0STheodore Ts'o unsigned int line, const char *fmt, ...) 738ac27a0ecSDave Kleikamp { 739651e1c3bSJoe Perches struct va_format vaf; 740ac27a0ecSDave Kleikamp va_list args; 741ac27a0ecSDave Kleikamp 7420db1ff22STheodore Ts'o if (unlikely(ext4_forced_shutdown(EXT4_SB(sb)))) 7430db1ff22STheodore Ts'o return; 7440db1ff22STheodore Ts'o 7451c13d5c0STheodore Ts'o save_error_info(sb, function, line); 746ac27a0ecSDave Kleikamp va_start(args, fmt); 747651e1c3bSJoe Perches vaf.fmt = fmt; 748651e1c3bSJoe Perches vaf.va = &args; 749651e1c3bSJoe Perches printk(KERN_CRIT "EXT4-fs error (device %s): %s:%d: %pV\n", 750651e1c3bSJoe Perches sb->s_id, function, line, &vaf); 751ac27a0ecSDave Kleikamp va_end(args); 752ac27a0ecSDave Kleikamp 753bc98a42cSDavid Howells if (sb_rdonly(sb) == 0) { 754b31e1552SEric Sandeen ext4_msg(sb, KERN_CRIT, "Remounting filesystem read-only"); 7554ab2f15bSTheodore Ts'o EXT4_SB(sb)->s_mount_flags |= EXT4_MF_FS_ABORTED; 7564418e141SDmitry Monakhov /* 7574418e141SDmitry Monakhov * Make sure updated value of ->s_mount_flags will be visible 7584418e141SDmitry Monakhov * before ->s_flags update 7594418e141SDmitry Monakhov */ 7604418e141SDmitry Monakhov smp_wmb(); 7611751e8a6SLinus Torvalds sb->s_flags |= SB_RDONLY; 762ef2cabf7SHidehiro Kawai if (EXT4_SB(sb)->s_journal) 763dab291afSMingming Cao jbd2_journal_abort(EXT4_SB(sb)->s_journal, -EIO); 7641c13d5c0STheodore Ts'o save_error_info(sb, function, line); 7651c13d5c0STheodore Ts'o } 7662c1d0e36SJan Kara if (test_opt(sb, ERRORS_PANIC) && !system_going_down()) { 7674327ba52SDaeho Jeong if (EXT4_SB(sb)->s_journal && 7684327ba52SDaeho Jeong !(EXT4_SB(sb)->s_journal->j_flags & JBD2_REC_ERR)) 7694327ba52SDaeho Jeong return; 7701c13d5c0STheodore Ts'o panic("EXT4-fs panic from previous error\n"); 771ac27a0ecSDave Kleikamp } 7724327ba52SDaeho Jeong } 773ac27a0ecSDave Kleikamp 774e7c96e8eSJoe Perches void __ext4_msg(struct super_block *sb, 775e7c96e8eSJoe Perches const char *prefix, const char *fmt, ...) 776b31e1552SEric Sandeen { 7770ff2ea7dSJoe Perches struct va_format vaf; 778b31e1552SEric Sandeen va_list args; 779b31e1552SEric Sandeen 780efbed4dcSTheodore Ts'o if (!___ratelimit(&(EXT4_SB(sb)->s_msg_ratelimit_state), "EXT4-fs")) 781efbed4dcSTheodore Ts'o return; 782efbed4dcSTheodore Ts'o 783b31e1552SEric Sandeen va_start(args, fmt); 7840ff2ea7dSJoe Perches vaf.fmt = fmt; 7850ff2ea7dSJoe Perches vaf.va = &args; 7860ff2ea7dSJoe Perches printk("%sEXT4-fs (%s): %pV\n", prefix, sb->s_id, &vaf); 787b31e1552SEric Sandeen va_end(args); 788b31e1552SEric Sandeen } 789b31e1552SEric Sandeen 790b03a2f7eSAndreas Dilger #define ext4_warning_ratelimit(sb) \ 791b03a2f7eSAndreas Dilger ___ratelimit(&(EXT4_SB(sb)->s_warning_ratelimit_state), \ 792b03a2f7eSAndreas Dilger "EXT4-fs warning") 793b03a2f7eSAndreas Dilger 79412062dddSEric Sandeen void __ext4_warning(struct super_block *sb, const char *function, 795c398eda0STheodore Ts'o unsigned int line, const char *fmt, ...) 796ac27a0ecSDave Kleikamp { 7970ff2ea7dSJoe Perches struct va_format vaf; 798ac27a0ecSDave Kleikamp va_list args; 799ac27a0ecSDave Kleikamp 800b03a2f7eSAndreas Dilger if (!ext4_warning_ratelimit(sb)) 801efbed4dcSTheodore Ts'o return; 802efbed4dcSTheodore Ts'o 803ac27a0ecSDave Kleikamp va_start(args, fmt); 8040ff2ea7dSJoe Perches vaf.fmt = fmt; 8050ff2ea7dSJoe Perches vaf.va = &args; 8060ff2ea7dSJoe Perches printk(KERN_WARNING "EXT4-fs warning (device %s): %s:%d: %pV\n", 8070ff2ea7dSJoe Perches sb->s_id, function, line, &vaf); 808ac27a0ecSDave Kleikamp va_end(args); 809ac27a0ecSDave Kleikamp } 810ac27a0ecSDave Kleikamp 811b03a2f7eSAndreas Dilger void __ext4_warning_inode(const struct inode *inode, const char *function, 812b03a2f7eSAndreas Dilger unsigned int line, const char *fmt, ...) 813b03a2f7eSAndreas Dilger { 814b03a2f7eSAndreas Dilger struct va_format vaf; 815b03a2f7eSAndreas Dilger va_list args; 816b03a2f7eSAndreas Dilger 817b03a2f7eSAndreas Dilger if (!ext4_warning_ratelimit(inode->i_sb)) 818b03a2f7eSAndreas Dilger return; 819b03a2f7eSAndreas Dilger 820b03a2f7eSAndreas Dilger va_start(args, fmt); 821b03a2f7eSAndreas Dilger vaf.fmt = fmt; 822b03a2f7eSAndreas Dilger vaf.va = &args; 823b03a2f7eSAndreas Dilger printk(KERN_WARNING "EXT4-fs warning (device %s): %s:%d: " 824b03a2f7eSAndreas Dilger "inode #%lu: comm %s: %pV\n", inode->i_sb->s_id, 825b03a2f7eSAndreas Dilger function, line, inode->i_ino, current->comm, &vaf); 826b03a2f7eSAndreas Dilger va_end(args); 827b03a2f7eSAndreas Dilger } 828b03a2f7eSAndreas Dilger 829e29136f8STheodore Ts'o void __ext4_grp_locked_error(const char *function, unsigned int line, 830e29136f8STheodore Ts'o struct super_block *sb, ext4_group_t grp, 831e29136f8STheodore Ts'o unsigned long ino, ext4_fsblk_t block, 832e29136f8STheodore Ts'o const char *fmt, ...) 8335d1b1b3fSAneesh Kumar K.V __releases(bitlock) 8345d1b1b3fSAneesh Kumar K.V __acquires(bitlock) 8355d1b1b3fSAneesh Kumar K.V { 8360ff2ea7dSJoe Perches struct va_format vaf; 8375d1b1b3fSAneesh Kumar K.V va_list args; 8385d1b1b3fSAneesh Kumar K.V struct ext4_super_block *es = EXT4_SB(sb)->s_es; 8395d1b1b3fSAneesh Kumar K.V 8400db1ff22STheodore Ts'o if (unlikely(ext4_forced_shutdown(EXT4_SB(sb)))) 8410db1ff22STheodore Ts'o return; 8420db1ff22STheodore Ts'o 843ccf0f32aSTheodore Ts'o trace_ext4_error(sb, function, line); 8441c13d5c0STheodore Ts'o es->s_last_error_ino = cpu_to_le32(ino); 8451c13d5c0STheodore Ts'o es->s_last_error_block = cpu_to_le64(block); 8461c13d5c0STheodore Ts'o __save_error_info(sb, function, line); 8470ff2ea7dSJoe Perches 848efbed4dcSTheodore Ts'o if (ext4_error_ratelimit(sb)) { 8495d1b1b3fSAneesh Kumar K.V va_start(args, fmt); 8500ff2ea7dSJoe Perches vaf.fmt = fmt; 8510ff2ea7dSJoe Perches vaf.va = &args; 85221149d61SRobin Dong printk(KERN_CRIT "EXT4-fs error (device %s): %s:%d: group %u, ", 853e29136f8STheodore Ts'o sb->s_id, function, line, grp); 854e29136f8STheodore Ts'o if (ino) 8550ff2ea7dSJoe Perches printk(KERN_CONT "inode %lu: ", ino); 856e29136f8STheodore Ts'o if (block) 857efbed4dcSTheodore Ts'o printk(KERN_CONT "block %llu:", 858efbed4dcSTheodore Ts'o (unsigned long long) block); 8590ff2ea7dSJoe Perches printk(KERN_CONT "%pV\n", &vaf); 8605d1b1b3fSAneesh Kumar K.V va_end(args); 861efbed4dcSTheodore Ts'o } 8625d1b1b3fSAneesh Kumar K.V 863327eaf73STheodore Ts'o if (test_opt(sb, WARN_ON_ERROR)) 864327eaf73STheodore Ts'o WARN_ON_ONCE(1); 865327eaf73STheodore Ts'o 8665d1b1b3fSAneesh Kumar K.V if (test_opt(sb, ERRORS_CONT)) { 867e2d67052STheodore Ts'o ext4_commit_super(sb, 0); 8685d1b1b3fSAneesh Kumar K.V return; 8695d1b1b3fSAneesh Kumar K.V } 8701c13d5c0STheodore Ts'o 8715d1b1b3fSAneesh Kumar K.V ext4_unlock_group(sb, grp); 87206f29cc8SZhouyi Zhou ext4_commit_super(sb, 1); 8735d1b1b3fSAneesh Kumar K.V ext4_handle_error(sb); 8745d1b1b3fSAneesh Kumar K.V /* 8755d1b1b3fSAneesh Kumar K.V * We only get here in the ERRORS_RO case; relocking the group 8765d1b1b3fSAneesh Kumar K.V * may be dangerous, but nothing bad will happen since the 8775d1b1b3fSAneesh Kumar K.V * filesystem will have already been marked read/only and the 8785d1b1b3fSAneesh Kumar K.V * journal has been aborted. We return 1 as a hint to callers 8795d1b1b3fSAneesh Kumar K.V * who might what to use the return value from 88025985edcSLucas De Marchi * ext4_grp_locked_error() to distinguish between the 8815d1b1b3fSAneesh Kumar K.V * ERRORS_CONT and ERRORS_RO case, and perhaps return more 8825d1b1b3fSAneesh Kumar K.V * aggressively from the ext4 function in question, with a 8835d1b1b3fSAneesh Kumar K.V * more appropriate error code. 8845d1b1b3fSAneesh Kumar K.V */ 8855d1b1b3fSAneesh Kumar K.V ext4_lock_group(sb, grp); 8865d1b1b3fSAneesh Kumar K.V return; 8875d1b1b3fSAneesh Kumar K.V } 8885d1b1b3fSAneesh Kumar K.V 889db79e6d1SWang Shilong void ext4_mark_group_bitmap_corrupted(struct super_block *sb, 890db79e6d1SWang Shilong ext4_group_t group, 891db79e6d1SWang Shilong unsigned int flags) 892db79e6d1SWang Shilong { 893db79e6d1SWang Shilong struct ext4_sb_info *sbi = EXT4_SB(sb); 894db79e6d1SWang Shilong struct ext4_group_info *grp = ext4_get_group_info(sb, group); 895db79e6d1SWang Shilong struct ext4_group_desc *gdp = ext4_get_group_desc(sb, group, NULL); 8969af0b3d1SWang Shilong int ret; 897db79e6d1SWang Shilong 8989af0b3d1SWang Shilong if (flags & EXT4_GROUP_INFO_BBITMAP_CORRUPT) { 8999af0b3d1SWang Shilong ret = ext4_test_and_set_bit(EXT4_GROUP_INFO_BBITMAP_CORRUPT_BIT, 9009af0b3d1SWang Shilong &grp->bb_state); 9019af0b3d1SWang Shilong if (!ret) 902db79e6d1SWang Shilong percpu_counter_sub(&sbi->s_freeclusters_counter, 903db79e6d1SWang Shilong grp->bb_free); 904db79e6d1SWang Shilong } 905db79e6d1SWang Shilong 9069af0b3d1SWang Shilong if (flags & EXT4_GROUP_INFO_IBITMAP_CORRUPT) { 9079af0b3d1SWang Shilong ret = ext4_test_and_set_bit(EXT4_GROUP_INFO_IBITMAP_CORRUPT_BIT, 9089af0b3d1SWang Shilong &grp->bb_state); 9099af0b3d1SWang Shilong if (!ret && gdp) { 910db79e6d1SWang Shilong int count; 911db79e6d1SWang Shilong 912db79e6d1SWang Shilong count = ext4_free_inodes_count(sb, gdp); 913db79e6d1SWang Shilong percpu_counter_sub(&sbi->s_freeinodes_counter, 914db79e6d1SWang Shilong count); 915db79e6d1SWang Shilong } 916db79e6d1SWang Shilong } 917db79e6d1SWang Shilong } 918db79e6d1SWang Shilong 919617ba13bSMingming Cao void ext4_update_dynamic_rev(struct super_block *sb) 920ac27a0ecSDave Kleikamp { 921617ba13bSMingming Cao struct ext4_super_block *es = EXT4_SB(sb)->s_es; 922ac27a0ecSDave Kleikamp 923617ba13bSMingming Cao if (le32_to_cpu(es->s_rev_level) > EXT4_GOOD_OLD_REV) 924ac27a0ecSDave Kleikamp return; 925ac27a0ecSDave Kleikamp 92612062dddSEric Sandeen ext4_warning(sb, 927ac27a0ecSDave Kleikamp "updating to rev %d because of new feature flag, " 928ac27a0ecSDave Kleikamp "running e2fsck is recommended", 929617ba13bSMingming Cao EXT4_DYNAMIC_REV); 930ac27a0ecSDave Kleikamp 931617ba13bSMingming Cao es->s_first_ino = cpu_to_le32(EXT4_GOOD_OLD_FIRST_INO); 932617ba13bSMingming Cao es->s_inode_size = cpu_to_le16(EXT4_GOOD_OLD_INODE_SIZE); 933617ba13bSMingming Cao es->s_rev_level = cpu_to_le32(EXT4_DYNAMIC_REV); 934ac27a0ecSDave Kleikamp /* leave es->s_feature_*compat flags alone */ 935ac27a0ecSDave Kleikamp /* es->s_uuid will be set by e2fsck if empty */ 936ac27a0ecSDave Kleikamp 937ac27a0ecSDave Kleikamp /* 938ac27a0ecSDave Kleikamp * The rest of the superblock fields should be zero, and if not it 939ac27a0ecSDave Kleikamp * means they are likely already in use, so leave them alone. We 940ac27a0ecSDave Kleikamp * can leave it up to e2fsck to clean up any inconsistencies there. 941ac27a0ecSDave Kleikamp */ 942ac27a0ecSDave Kleikamp } 943ac27a0ecSDave Kleikamp 944ac27a0ecSDave Kleikamp /* 945ac27a0ecSDave Kleikamp * Open the external journal device 946ac27a0ecSDave Kleikamp */ 947b31e1552SEric Sandeen static struct block_device *ext4_blkdev_get(dev_t dev, struct super_block *sb) 948ac27a0ecSDave Kleikamp { 949ac27a0ecSDave Kleikamp struct block_device *bdev; 950ac27a0ecSDave Kleikamp char b[BDEVNAME_SIZE]; 951ac27a0ecSDave Kleikamp 952d4d77629STejun Heo bdev = blkdev_get_by_dev(dev, FMODE_READ|FMODE_WRITE|FMODE_EXCL, sb); 953ac27a0ecSDave Kleikamp if (IS_ERR(bdev)) 954ac27a0ecSDave Kleikamp goto fail; 955ac27a0ecSDave Kleikamp return bdev; 956ac27a0ecSDave Kleikamp 957ac27a0ecSDave Kleikamp fail: 958b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "failed to open journal device %s: %ld", 959ac27a0ecSDave Kleikamp __bdevname(dev, b), PTR_ERR(bdev)); 960ac27a0ecSDave Kleikamp return NULL; 961ac27a0ecSDave Kleikamp } 962ac27a0ecSDave Kleikamp 963ac27a0ecSDave Kleikamp /* 964ac27a0ecSDave Kleikamp * Release the journal device 965ac27a0ecSDave Kleikamp */ 9664385bab1SAl Viro static void ext4_blkdev_put(struct block_device *bdev) 967ac27a0ecSDave Kleikamp { 9684385bab1SAl Viro blkdev_put(bdev, FMODE_READ|FMODE_WRITE|FMODE_EXCL); 969ac27a0ecSDave Kleikamp } 970ac27a0ecSDave Kleikamp 9714385bab1SAl Viro static void ext4_blkdev_remove(struct ext4_sb_info *sbi) 972ac27a0ecSDave Kleikamp { 973ac27a0ecSDave Kleikamp struct block_device *bdev; 974ac27a0ecSDave Kleikamp bdev = sbi->journal_bdev; 975ac27a0ecSDave Kleikamp if (bdev) { 9764385bab1SAl Viro ext4_blkdev_put(bdev); 977ac27a0ecSDave Kleikamp sbi->journal_bdev = NULL; 978ac27a0ecSDave Kleikamp } 979ac27a0ecSDave Kleikamp } 980ac27a0ecSDave Kleikamp 981ac27a0ecSDave Kleikamp static inline struct inode *orphan_list_entry(struct list_head *l) 982ac27a0ecSDave Kleikamp { 983617ba13bSMingming Cao return &list_entry(l, struct ext4_inode_info, i_orphan)->vfs_inode; 984ac27a0ecSDave Kleikamp } 985ac27a0ecSDave Kleikamp 986617ba13bSMingming Cao static void dump_orphan_list(struct super_block *sb, struct ext4_sb_info *sbi) 987ac27a0ecSDave Kleikamp { 988ac27a0ecSDave Kleikamp struct list_head *l; 989ac27a0ecSDave Kleikamp 990b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "sb orphan head is %d", 991ac27a0ecSDave Kleikamp le32_to_cpu(sbi->s_es->s_last_orphan)); 992ac27a0ecSDave Kleikamp 993ac27a0ecSDave Kleikamp printk(KERN_ERR "sb_info orphan list:\n"); 994ac27a0ecSDave Kleikamp list_for_each(l, &sbi->s_orphan) { 995ac27a0ecSDave Kleikamp struct inode *inode = orphan_list_entry(l); 996ac27a0ecSDave Kleikamp printk(KERN_ERR " " 997ac27a0ecSDave Kleikamp "inode %s:%lu at %p: mode %o, nlink %d, next %d\n", 998ac27a0ecSDave Kleikamp inode->i_sb->s_id, inode->i_ino, inode, 999ac27a0ecSDave Kleikamp inode->i_mode, inode->i_nlink, 1000ac27a0ecSDave Kleikamp NEXT_ORPHAN(inode)); 1001ac27a0ecSDave Kleikamp } 1002ac27a0ecSDave Kleikamp } 1003ac27a0ecSDave Kleikamp 1004957153fcSJan Kara #ifdef CONFIG_QUOTA 1005957153fcSJan Kara static int ext4_quota_off(struct super_block *sb, int type); 1006957153fcSJan Kara 1007957153fcSJan Kara static inline void ext4_quota_off_umount(struct super_block *sb) 1008957153fcSJan Kara { 1009957153fcSJan Kara int type; 1010957153fcSJan Kara 1011957153fcSJan Kara /* Use our quota_off function to clear inode flags etc. */ 1012957153fcSJan Kara for (type = 0; type < EXT4_MAXQUOTAS; type++) 1013957153fcSJan Kara ext4_quota_off(sb, type); 1014957153fcSJan Kara } 101533458eabSTheodore Ts'o 101633458eabSTheodore Ts'o /* 101733458eabSTheodore Ts'o * This is a helper function which is used in the mount/remount 101833458eabSTheodore Ts'o * codepaths (which holds s_umount) to fetch the quota file name. 101933458eabSTheodore Ts'o */ 102033458eabSTheodore Ts'o static inline char *get_qf_name(struct super_block *sb, 102133458eabSTheodore Ts'o struct ext4_sb_info *sbi, 102233458eabSTheodore Ts'o int type) 102333458eabSTheodore Ts'o { 102433458eabSTheodore Ts'o return rcu_dereference_protected(sbi->s_qf_names[type], 102533458eabSTheodore Ts'o lockdep_is_held(&sb->s_umount)); 102633458eabSTheodore Ts'o } 1027957153fcSJan Kara #else 1028957153fcSJan Kara static inline void ext4_quota_off_umount(struct super_block *sb) 1029957153fcSJan Kara { 1030957153fcSJan Kara } 1031957153fcSJan Kara #endif 1032957153fcSJan Kara 1033617ba13bSMingming Cao static void ext4_put_super(struct super_block *sb) 1034ac27a0ecSDave Kleikamp { 1035617ba13bSMingming Cao struct ext4_sb_info *sbi = EXT4_SB(sb); 1036617ba13bSMingming Cao struct ext4_super_block *es = sbi->s_es; 103797abd7d4STheodore Ts'o int aborted = 0; 1038ef2cabf7SHidehiro Kawai int i, err; 1039ac27a0ecSDave Kleikamp 1040857ac889SLukas Czerner ext4_unregister_li_request(sb); 1041957153fcSJan Kara ext4_quota_off_umount(sb); 1042e0ccfd95SChristoph Hellwig 10432e8fa54eSJan Kara destroy_workqueue(sbi->rsv_conversion_wq); 10444c0425ffSMingming Cao 10450390131bSFrank Mayhar if (sbi->s_journal) { 104697abd7d4STheodore Ts'o aborted = is_journal_aborted(sbi->s_journal); 1047ef2cabf7SHidehiro Kawai err = jbd2_journal_destroy(sbi->s_journal); 104847b4a50bSJan Kara sbi->s_journal = NULL; 1049*878520acSTheodore Ts'o if ((err < 0) && !aborted) { 1050*878520acSTheodore Ts'o ext4_set_errno(sb, -err); 1051c67d859eSTheodore Ts'o ext4_abort(sb, "Couldn't clean up the journal"); 10520390131bSFrank Mayhar } 1053*878520acSTheodore Ts'o } 1054d4edac31SJosef Bacik 1055ebd173beSTheodore Ts'o ext4_unregister_sysfs(sb); 1056d3922a77SZheng Liu ext4_es_unregister_shrinker(sbi); 10579105bb14SAl Viro del_timer_sync(&sbi->s_err_report); 1058d4edac31SJosef Bacik ext4_release_system_zone(sb); 1059d4edac31SJosef Bacik ext4_mb_release(sb); 1060d4edac31SJosef Bacik ext4_ext_release(sb); 1061d4edac31SJosef Bacik 1062bc98a42cSDavid Howells if (!sb_rdonly(sb) && !aborted) { 1063e2b911c5SDarrick J. Wong ext4_clear_feature_journal_needs_recovery(sb); 1064ac27a0ecSDave Kleikamp es->s_state = cpu_to_le16(sbi->s_mount_state); 1065ac27a0ecSDave Kleikamp } 1066bc98a42cSDavid Howells if (!sb_rdonly(sb)) 1067a8e25a83SArtem Bityutskiy ext4_commit_super(sb, 1); 1068a8e25a83SArtem Bityutskiy 1069ac27a0ecSDave Kleikamp for (i = 0; i < sbi->s_gdb_count; i++) 1070ac27a0ecSDave Kleikamp brelse(sbi->s_group_desc[i]); 1071b93b41d4SAl Viro kvfree(sbi->s_group_desc); 1072b93b41d4SAl Viro kvfree(sbi->s_flex_groups); 107357042651STheodore Ts'o percpu_counter_destroy(&sbi->s_freeclusters_counter); 1074ac27a0ecSDave Kleikamp percpu_counter_destroy(&sbi->s_freeinodes_counter); 1075ac27a0ecSDave Kleikamp percpu_counter_destroy(&sbi->s_dirs_counter); 107657042651STheodore Ts'o percpu_counter_destroy(&sbi->s_dirtyclusters_counter); 1077c8585c6fSDaeho Jeong percpu_free_rwsem(&sbi->s_journal_flag_rwsem); 1078ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA 1079a2d4a646SJan Kara for (i = 0; i < EXT4_MAXQUOTAS; i++) 108033458eabSTheodore Ts'o kfree(get_qf_name(sb, sbi, i)); 1081ac27a0ecSDave Kleikamp #endif 1082ac27a0ecSDave Kleikamp 1083ac27a0ecSDave Kleikamp /* Debugging code just in case the in-memory inode orphan list 1084ac27a0ecSDave Kleikamp * isn't empty. The on-disk one can be non-empty if we've 1085ac27a0ecSDave Kleikamp * detected an error and taken the fs readonly, but the 1086ac27a0ecSDave Kleikamp * in-memory list had better be clean by this point. */ 1087ac27a0ecSDave Kleikamp if (!list_empty(&sbi->s_orphan)) 1088ac27a0ecSDave Kleikamp dump_orphan_list(sb, sbi); 1089ac27a0ecSDave Kleikamp J_ASSERT(list_empty(&sbi->s_orphan)); 1090ac27a0ecSDave Kleikamp 109189d96a6fSTheodore Ts'o sync_blockdev(sb->s_bdev); 1092f98393a6SPeter Zijlstra invalidate_bdev(sb->s_bdev); 1093ac27a0ecSDave Kleikamp if (sbi->journal_bdev && sbi->journal_bdev != sb->s_bdev) { 1094ac27a0ecSDave Kleikamp /* 1095ac27a0ecSDave Kleikamp * Invalidate the journal device's buffers. We don't want them 1096ac27a0ecSDave Kleikamp * floating about in memory - the physical journal device may 1097ac27a0ecSDave Kleikamp * hotswapped, and it breaks the `ro-after' testing code. 1098ac27a0ecSDave Kleikamp */ 1099ac27a0ecSDave Kleikamp sync_blockdev(sbi->journal_bdev); 1100f98393a6SPeter Zijlstra invalidate_bdev(sbi->journal_bdev); 1101617ba13bSMingming Cao ext4_blkdev_remove(sbi); 1102ac27a0ecSDave Kleikamp } 110350c15df6SChengguang Xu 1104dec214d0STahsin Erdogan ext4_xattr_destroy_cache(sbi->s_ea_inode_cache); 1105dec214d0STahsin Erdogan sbi->s_ea_inode_cache = NULL; 110650c15df6SChengguang Xu 110747387409STahsin Erdogan ext4_xattr_destroy_cache(sbi->s_ea_block_cache); 110847387409STahsin Erdogan sbi->s_ea_block_cache = NULL; 110950c15df6SChengguang Xu 1110c5e06d10SJohann Lombardi if (sbi->s_mmp_tsk) 1111c5e06d10SJohann Lombardi kthread_stop(sbi->s_mmp_tsk); 11129060dd2cSEric Sandeen brelse(sbi->s_sbh); 1113ac27a0ecSDave Kleikamp sb->s_fs_info = NULL; 11143197ebdbSTheodore Ts'o /* 11153197ebdbSTheodore Ts'o * Now that we are completely done shutting down the 11163197ebdbSTheodore Ts'o * superblock, we need to actually destroy the kobject. 11173197ebdbSTheodore Ts'o */ 11183197ebdbSTheodore Ts'o kobject_put(&sbi->s_kobj); 11193197ebdbSTheodore Ts'o wait_for_completion(&sbi->s_kobj_unregister); 11200441984aSDarrick J. Wong if (sbi->s_chksum_driver) 11210441984aSDarrick J. Wong crypto_free_shash(sbi->s_chksum_driver); 1122705895b6SPekka Enberg kfree(sbi->s_blockgroup_lock); 11235e405595SDan Williams fs_put_dax(sbi->s_daxdev); 1124c83ad55eSGabriel Krisman Bertazi #ifdef CONFIG_UNICODE 1125c83ad55eSGabriel Krisman Bertazi utf8_unload(sbi->s_encoding); 1126c83ad55eSGabriel Krisman Bertazi #endif 1127ac27a0ecSDave Kleikamp kfree(sbi); 1128ac27a0ecSDave Kleikamp } 1129ac27a0ecSDave Kleikamp 1130e18b890bSChristoph Lameter static struct kmem_cache *ext4_inode_cachep; 1131ac27a0ecSDave Kleikamp 1132ac27a0ecSDave Kleikamp /* 1133ac27a0ecSDave Kleikamp * Called inside transaction, so use GFP_NOFS 1134ac27a0ecSDave Kleikamp */ 1135617ba13bSMingming Cao static struct inode *ext4_alloc_inode(struct super_block *sb) 1136ac27a0ecSDave Kleikamp { 1137617ba13bSMingming Cao struct ext4_inode_info *ei; 1138ac27a0ecSDave Kleikamp 1139e6b4f8daSChristoph Lameter ei = kmem_cache_alloc(ext4_inode_cachep, GFP_NOFS); 1140ac27a0ecSDave Kleikamp if (!ei) 1141ac27a0ecSDave Kleikamp return NULL; 11420b8e58a1SAndreas Dilger 1143ee73f9a5SJeff Layton inode_set_iversion(&ei->vfs_inode, 1); 1144202ee5dfSTheodore Ts'o spin_lock_init(&ei->i_raw_lock); 1145c9de560dSAlex Tomas INIT_LIST_HEAD(&ei->i_prealloc_list); 1146c9de560dSAlex Tomas spin_lock_init(&ei->i_prealloc_lock); 11479a26b661SZheng Liu ext4_es_init_tree(&ei->i_es_tree); 11489a26b661SZheng Liu rwlock_init(&ei->i_es_lock); 1149edaa53caSZheng Liu INIT_LIST_HEAD(&ei->i_es_list); 1150eb68d0e2SZheng Liu ei->i_es_all_nr = 0; 1151edaa53caSZheng Liu ei->i_es_shk_nr = 0; 1152dd475925SJan Kara ei->i_es_shrink_lblk = 0; 1153d2a17637SMingming Cao ei->i_reserved_data_blocks = 0; 11549d0be502STheodore Ts'o ei->i_da_metadata_calc_len = 0; 11557e731bc9STheodore Ts'o ei->i_da_metadata_calc_last_lblock = 0; 1156d2a17637SMingming Cao spin_lock_init(&(ei->i_block_reservation_lock)); 11571dc0aa46SEric Whitney ext4_init_pending_tree(&ei->i_pending_tree); 1158a9e7f447SDmitry Monakhov #ifdef CONFIG_QUOTA 1159a9e7f447SDmitry Monakhov ei->i_reserved_quota = 0; 116096c7e0d9SJan Kara memset(&ei->i_dquot, 0, sizeof(ei->i_dquot)); 1161a9e7f447SDmitry Monakhov #endif 11628aefcd55STheodore Ts'o ei->jinode = NULL; 11632e8fa54eSJan Kara INIT_LIST_HEAD(&ei->i_rsv_conversion_list); 1164744692dcSJiaying Zhang spin_lock_init(&ei->i_completed_io_lock); 1165b436b9beSJan Kara ei->i_sync_tid = 0; 1166b436b9beSJan Kara ei->i_datasync_tid = 0; 1167e27f41e1SDmitry Monakhov atomic_set(&ei->i_unwritten, 0); 11682e8fa54eSJan Kara INIT_WORK(&ei->i_rsv_conversion_work, ext4_end_io_rsv_work); 1169ac27a0ecSDave Kleikamp return &ei->vfs_inode; 1170ac27a0ecSDave Kleikamp } 1171ac27a0ecSDave Kleikamp 11727ff9c073STheodore Ts'o static int ext4_drop_inode(struct inode *inode) 11737ff9c073STheodore Ts'o { 11747ff9c073STheodore Ts'o int drop = generic_drop_inode(inode); 11757ff9c073STheodore Ts'o 117629b3692eSEric Biggers if (!drop) 117729b3692eSEric Biggers drop = fscrypt_drop_inode(inode); 117829b3692eSEric Biggers 11797ff9c073STheodore Ts'o trace_ext4_drop_inode(inode, drop); 11807ff9c073STheodore Ts'o return drop; 11817ff9c073STheodore Ts'o } 11827ff9c073STheodore Ts'o 118394053139SAl Viro static void ext4_free_in_core_inode(struct inode *inode) 1184fa0d7e3dSNick Piggin { 11852c58d548SEric Biggers fscrypt_free_inode(inode); 1186fa0d7e3dSNick Piggin kmem_cache_free(ext4_inode_cachep, EXT4_I(inode)); 1187fa0d7e3dSNick Piggin } 1188fa0d7e3dSNick Piggin 1189617ba13bSMingming Cao static void ext4_destroy_inode(struct inode *inode) 1190ac27a0ecSDave Kleikamp { 11919f7dd93dSVasily Averin if (!list_empty(&(EXT4_I(inode)->i_orphan))) { 1192b31e1552SEric Sandeen ext4_msg(inode->i_sb, KERN_ERR, 1193b31e1552SEric Sandeen "Inode %lu (%p): orphan list check failed!", 1194b31e1552SEric Sandeen inode->i_ino, EXT4_I(inode)); 11959f7dd93dSVasily Averin print_hex_dump(KERN_INFO, "", DUMP_PREFIX_ADDRESS, 16, 4, 11969f7dd93dSVasily Averin EXT4_I(inode), sizeof(struct ext4_inode_info), 11979f7dd93dSVasily Averin true); 11989f7dd93dSVasily Averin dump_stack(); 11999f7dd93dSVasily Averin } 1200ac27a0ecSDave Kleikamp } 1201ac27a0ecSDave Kleikamp 120251cc5068SAlexey Dobriyan static void init_once(void *foo) 1203ac27a0ecSDave Kleikamp { 1204617ba13bSMingming Cao struct ext4_inode_info *ei = (struct ext4_inode_info *) foo; 1205ac27a0ecSDave Kleikamp 1206ac27a0ecSDave Kleikamp INIT_LIST_HEAD(&ei->i_orphan); 1207ac27a0ecSDave Kleikamp init_rwsem(&ei->xattr_sem); 12080e855ac8SAneesh Kumar K.V init_rwsem(&ei->i_data_sem); 1209ea3d7209SJan Kara init_rwsem(&ei->i_mmap_sem); 1210ac27a0ecSDave Kleikamp inode_init_once(&ei->vfs_inode); 1211ac27a0ecSDave Kleikamp } 1212ac27a0ecSDave Kleikamp 1213e67bc2b3SFabian Frederick static int __init init_inodecache(void) 1214ac27a0ecSDave Kleikamp { 1215f8dd7c70SDavid Windsor ext4_inode_cachep = kmem_cache_create_usercopy("ext4_inode_cache", 1216f8dd7c70SDavid Windsor sizeof(struct ext4_inode_info), 0, 1217f8dd7c70SDavid Windsor (SLAB_RECLAIM_ACCOUNT|SLAB_MEM_SPREAD| 1218f8dd7c70SDavid Windsor SLAB_ACCOUNT), 1219f8dd7c70SDavid Windsor offsetof(struct ext4_inode_info, i_data), 1220f8dd7c70SDavid Windsor sizeof_field(struct ext4_inode_info, i_data), 122120c2df83SPaul Mundt init_once); 1222617ba13bSMingming Cao if (ext4_inode_cachep == NULL) 1223ac27a0ecSDave Kleikamp return -ENOMEM; 1224ac27a0ecSDave Kleikamp return 0; 1225ac27a0ecSDave Kleikamp } 1226ac27a0ecSDave Kleikamp 1227ac27a0ecSDave Kleikamp static void destroy_inodecache(void) 1228ac27a0ecSDave Kleikamp { 12298c0a8537SKirill A. Shutemov /* 12308c0a8537SKirill A. Shutemov * Make sure all delayed rcu free inodes are flushed before we 12318c0a8537SKirill A. Shutemov * destroy cache. 12328c0a8537SKirill A. Shutemov */ 12338c0a8537SKirill A. Shutemov rcu_barrier(); 1234617ba13bSMingming Cao kmem_cache_destroy(ext4_inode_cachep); 1235ac27a0ecSDave Kleikamp } 1236ac27a0ecSDave Kleikamp 12370930fcc1SAl Viro void ext4_clear_inode(struct inode *inode) 1238ac27a0ecSDave Kleikamp { 12390930fcc1SAl Viro invalidate_inode_buffers(inode); 1240dbd5768fSJan Kara clear_inode(inode); 1241c2ea3fdeSTheodore Ts'o ext4_discard_preallocations(inode); 124251865fdaSZheng Liu ext4_es_remove_extent(inode, 0, EXT_MAX_BLOCKS); 1243f4c2d372SJan Kara dquot_drop(inode); 12448aefcd55STheodore Ts'o if (EXT4_I(inode)->jinode) { 12458aefcd55STheodore Ts'o jbd2_journal_release_jbd_inode(EXT4_JOURNAL(inode), 12468aefcd55STheodore Ts'o EXT4_I(inode)->jinode); 12478aefcd55STheodore Ts'o jbd2_free_inode(EXT4_I(inode)->jinode); 12488aefcd55STheodore Ts'o EXT4_I(inode)->jinode = NULL; 12498aefcd55STheodore Ts'o } 12503d204e24SEric Biggers fscrypt_put_encryption_info(inode); 1251c93d8f88SEric Biggers fsverity_cleanup_inode(inode); 1252ac27a0ecSDave Kleikamp } 1253ac27a0ecSDave Kleikamp 12541b961ac0SChristoph Hellwig static struct inode *ext4_nfs_get_inode(struct super_block *sb, 12551b961ac0SChristoph Hellwig u64 ino, u32 generation) 1256ac27a0ecSDave Kleikamp { 1257ac27a0ecSDave Kleikamp struct inode *inode; 1258ac27a0ecSDave Kleikamp 12598a363970STheodore Ts'o /* 1260ac27a0ecSDave Kleikamp * Currently we don't know the generation for parent directory, so 1261ac27a0ecSDave Kleikamp * a generation of 0 means "accept any" 1262ac27a0ecSDave Kleikamp */ 12638a363970STheodore Ts'o inode = ext4_iget(sb, ino, EXT4_IGET_HANDLE); 12641d1fe1eeSDavid Howells if (IS_ERR(inode)) 12651d1fe1eeSDavid Howells return ERR_CAST(inode); 12661d1fe1eeSDavid Howells if (generation && inode->i_generation != generation) { 1267ac27a0ecSDave Kleikamp iput(inode); 1268ac27a0ecSDave Kleikamp return ERR_PTR(-ESTALE); 1269ac27a0ecSDave Kleikamp } 12701b961ac0SChristoph Hellwig 12711b961ac0SChristoph Hellwig return inode; 1272ac27a0ecSDave Kleikamp } 12731b961ac0SChristoph Hellwig 12741b961ac0SChristoph Hellwig static struct dentry *ext4_fh_to_dentry(struct super_block *sb, struct fid *fid, 12751b961ac0SChristoph Hellwig int fh_len, int fh_type) 12761b961ac0SChristoph Hellwig { 12771b961ac0SChristoph Hellwig return generic_fh_to_dentry(sb, fid, fh_len, fh_type, 12781b961ac0SChristoph Hellwig ext4_nfs_get_inode); 12791b961ac0SChristoph Hellwig } 12801b961ac0SChristoph Hellwig 12811b961ac0SChristoph Hellwig static struct dentry *ext4_fh_to_parent(struct super_block *sb, struct fid *fid, 12821b961ac0SChristoph Hellwig int fh_len, int fh_type) 12831b961ac0SChristoph Hellwig { 12841b961ac0SChristoph Hellwig return generic_fh_to_parent(sb, fid, fh_len, fh_type, 12851b961ac0SChristoph Hellwig ext4_nfs_get_inode); 1286ac27a0ecSDave Kleikamp } 1287ac27a0ecSDave Kleikamp 1288fde87268STheodore Ts'o static int ext4_nfs_commit_metadata(struct inode *inode) 1289fde87268STheodore Ts'o { 1290fde87268STheodore Ts'o struct writeback_control wbc = { 1291fde87268STheodore Ts'o .sync_mode = WB_SYNC_ALL 1292fde87268STheodore Ts'o }; 1293fde87268STheodore Ts'o 1294fde87268STheodore Ts'o trace_ext4_nfs_commit_metadata(inode); 1295fde87268STheodore Ts'o return ext4_write_inode(inode, &wbc); 1296fde87268STheodore Ts'o } 1297fde87268STheodore Ts'o 1298c39a7f84SToshiyuki Okajima /* 1299c39a7f84SToshiyuki Okajima * Try to release metadata pages (indirect blocks, directories) which are 1300c39a7f84SToshiyuki Okajima * mapped via the block device. Since these pages could have journal heads 1301c39a7f84SToshiyuki Okajima * which would prevent try_to_free_buffers() from freeing them, we must use 1302c39a7f84SToshiyuki Okajima * jbd2 layer's try_to_free_buffers() function to release them. 1303c39a7f84SToshiyuki Okajima */ 13040b8e58a1SAndreas Dilger static int bdev_try_to_free_page(struct super_block *sb, struct page *page, 13050b8e58a1SAndreas Dilger gfp_t wait) 1306c39a7f84SToshiyuki Okajima { 1307c39a7f84SToshiyuki Okajima journal_t *journal = EXT4_SB(sb)->s_journal; 1308c39a7f84SToshiyuki Okajima 1309c39a7f84SToshiyuki Okajima WARN_ON(PageChecked(page)); 1310c39a7f84SToshiyuki Okajima if (!page_has_buffers(page)) 1311c39a7f84SToshiyuki Okajima return 0; 1312c39a7f84SToshiyuki Okajima if (journal) 1313c39a7f84SToshiyuki Okajima return jbd2_journal_try_to_free_buffers(journal, page, 1314d0164adcSMel Gorman wait & ~__GFP_DIRECT_RECLAIM); 1315c39a7f84SToshiyuki Okajima return try_to_free_buffers(page); 1316c39a7f84SToshiyuki Okajima } 1317c39a7f84SToshiyuki Okajima 1318643fa961SChandan Rajendra #ifdef CONFIG_FS_ENCRYPTION 1319a7550b30SJaegeuk Kim static int ext4_get_context(struct inode *inode, void *ctx, size_t len) 1320a7550b30SJaegeuk Kim { 1321a7550b30SJaegeuk Kim return ext4_xattr_get(inode, EXT4_XATTR_INDEX_ENCRYPTION, 1322a7550b30SJaegeuk Kim EXT4_XATTR_NAME_ENCRYPTION_CONTEXT, ctx, len); 1323a7550b30SJaegeuk Kim } 1324a7550b30SJaegeuk Kim 1325a7550b30SJaegeuk Kim static int ext4_set_context(struct inode *inode, const void *ctx, size_t len, 1326a7550b30SJaegeuk Kim void *fs_data) 1327a7550b30SJaegeuk Kim { 13282f8f5e76SEric Biggers handle_t *handle = fs_data; 1329c1a5d5f6STahsin Erdogan int res, res2, credits, retries = 0; 1330a7550b30SJaegeuk Kim 13319ce0151aSEric Biggers /* 13329ce0151aSEric Biggers * Encrypting the root directory is not allowed because e2fsck expects 13339ce0151aSEric Biggers * lost+found to exist and be unencrypted, and encrypting the root 13349ce0151aSEric Biggers * directory would imply encrypting the lost+found directory as well as 13359ce0151aSEric Biggers * the filename "lost+found" itself. 13369ce0151aSEric Biggers */ 13379ce0151aSEric Biggers if (inode->i_ino == EXT4_ROOT_INO) 13389ce0151aSEric Biggers return -EPERM; 1339a7550b30SJaegeuk Kim 13407d3e06a8SRoss Zwisler if (WARN_ON_ONCE(IS_DAX(inode) && i_size_read(inode))) 13417d3e06a8SRoss Zwisler return -EINVAL; 13427d3e06a8SRoss Zwisler 134394840e3cSEric Biggers res = ext4_convert_inline_data(inode); 134494840e3cSEric Biggers if (res) 134594840e3cSEric Biggers return res; 134694840e3cSEric Biggers 13472f8f5e76SEric Biggers /* 13482f8f5e76SEric Biggers * If a journal handle was specified, then the encryption context is 13492f8f5e76SEric Biggers * being set on a new inode via inheritance and is part of a larger 13502f8f5e76SEric Biggers * transaction to create the inode. Otherwise the encryption context is 13512f8f5e76SEric Biggers * being set on an existing inode in its own transaction. Only in the 13522f8f5e76SEric Biggers * latter case should the "retry on ENOSPC" logic be used. 13532f8f5e76SEric Biggers */ 13542f8f5e76SEric Biggers 13552f8f5e76SEric Biggers if (handle) { 13562f8f5e76SEric Biggers res = ext4_xattr_set_handle(handle, inode, 13572f8f5e76SEric Biggers EXT4_XATTR_INDEX_ENCRYPTION, 13582f8f5e76SEric Biggers EXT4_XATTR_NAME_ENCRYPTION_CONTEXT, 13592f8f5e76SEric Biggers ctx, len, 0); 1360a7550b30SJaegeuk Kim if (!res) { 1361a7550b30SJaegeuk Kim ext4_set_inode_flag(inode, EXT4_INODE_ENCRYPT); 1362a7550b30SJaegeuk Kim ext4_clear_inode_state(inode, 1363a7550b30SJaegeuk Kim EXT4_STATE_MAY_INLINE_DATA); 1364a3caa24bSJan Kara /* 13652ee6a576SEric Biggers * Update inode->i_flags - S_ENCRYPTED will be enabled, 13662ee6a576SEric Biggers * S_DAX may be disabled 1367a3caa24bSJan Kara */ 1368a3caa24bSJan Kara ext4_set_inode_flags(inode); 1369a7550b30SJaegeuk Kim } 1370a7550b30SJaegeuk Kim return res; 1371a7550b30SJaegeuk Kim } 1372a7550b30SJaegeuk Kim 1373b8cb5a54STahsin Erdogan res = dquot_initialize(inode); 1374b8cb5a54STahsin Erdogan if (res) 1375b8cb5a54STahsin Erdogan return res; 13762f8f5e76SEric Biggers retry: 1377af65207cSTahsin Erdogan res = ext4_xattr_set_credits(inode, len, false /* is_create */, 1378af65207cSTahsin Erdogan &credits); 1379dec214d0STahsin Erdogan if (res) 1380dec214d0STahsin Erdogan return res; 1381dec214d0STahsin Erdogan 1382c1a5d5f6STahsin Erdogan handle = ext4_journal_start(inode, EXT4_HT_MISC, credits); 1383a7550b30SJaegeuk Kim if (IS_ERR(handle)) 1384a7550b30SJaegeuk Kim return PTR_ERR(handle); 1385a7550b30SJaegeuk Kim 13862f8f5e76SEric Biggers res = ext4_xattr_set_handle(handle, inode, EXT4_XATTR_INDEX_ENCRYPTION, 13872f8f5e76SEric Biggers EXT4_XATTR_NAME_ENCRYPTION_CONTEXT, 13882f8f5e76SEric Biggers ctx, len, 0); 1389a7550b30SJaegeuk Kim if (!res) { 1390a7550b30SJaegeuk Kim ext4_set_inode_flag(inode, EXT4_INODE_ENCRYPT); 13912ee6a576SEric Biggers /* 13922ee6a576SEric Biggers * Update inode->i_flags - S_ENCRYPTED will be enabled, 13932ee6a576SEric Biggers * S_DAX may be disabled 13942ee6a576SEric Biggers */ 1395a3caa24bSJan Kara ext4_set_inode_flags(inode); 1396a7550b30SJaegeuk Kim res = ext4_mark_inode_dirty(handle, inode); 1397a7550b30SJaegeuk Kim if (res) 1398a7550b30SJaegeuk Kim EXT4_ERROR_INODE(inode, "Failed to mark inode dirty"); 1399a7550b30SJaegeuk Kim } 1400a7550b30SJaegeuk Kim res2 = ext4_journal_stop(handle); 14012f8f5e76SEric Biggers 14022f8f5e76SEric Biggers if (res == -ENOSPC && ext4_should_retry_alloc(inode->i_sb, &retries)) 14032f8f5e76SEric Biggers goto retry; 1404a7550b30SJaegeuk Kim if (!res) 1405a7550b30SJaegeuk Kim res = res2; 1406a7550b30SJaegeuk Kim return res; 1407a7550b30SJaegeuk Kim } 1408a7550b30SJaegeuk Kim 1409c250b7ddSEric Biggers static bool ext4_dummy_context(struct inode *inode) 1410a7550b30SJaegeuk Kim { 1411a7550b30SJaegeuk Kim return DUMMY_ENCRYPTION_ENABLED(EXT4_SB(inode->i_sb)); 1412a7550b30SJaegeuk Kim } 1413a7550b30SJaegeuk Kim 1414b925acb8SEric Biggers static bool ext4_has_stable_inodes(struct super_block *sb) 1415b925acb8SEric Biggers { 1416b925acb8SEric Biggers return ext4_has_feature_stable_inodes(sb); 1417b925acb8SEric Biggers } 1418b925acb8SEric Biggers 1419b925acb8SEric Biggers static void ext4_get_ino_and_lblk_bits(struct super_block *sb, 1420b925acb8SEric Biggers int *ino_bits_ret, int *lblk_bits_ret) 1421b925acb8SEric Biggers { 1422b925acb8SEric Biggers *ino_bits_ret = 8 * sizeof(EXT4_SB(sb)->s_es->s_inodes_count); 1423b925acb8SEric Biggers *lblk_bits_ret = 8 * sizeof(ext4_lblk_t); 1424b925acb8SEric Biggers } 1425b925acb8SEric Biggers 14266f69f0edSEric Biggers static const struct fscrypt_operations ext4_cryptops = { 1427a5d431efSEric Biggers .key_prefix = "ext4:", 1428a7550b30SJaegeuk Kim .get_context = ext4_get_context, 1429a7550b30SJaegeuk Kim .set_context = ext4_set_context, 1430a7550b30SJaegeuk Kim .dummy_context = ext4_dummy_context, 1431a7550b30SJaegeuk Kim .empty_dir = ext4_empty_dir, 1432e12ee683SEric Biggers .max_namelen = EXT4_NAME_LEN, 1433b925acb8SEric Biggers .has_stable_inodes = ext4_has_stable_inodes, 1434b925acb8SEric Biggers .get_ino_and_lblk_bits = ext4_get_ino_and_lblk_bits, 1435a7550b30SJaegeuk Kim }; 1436a7550b30SJaegeuk Kim #endif 1437a7550b30SJaegeuk Kim 1438ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA 1439d6006186SEric Biggers static const char * const quotatypes[] = INITQFNAMES; 1440689c958cSLi Xi #define QTYPE2NAME(t) (quotatypes[t]) 1441ac27a0ecSDave Kleikamp 1442617ba13bSMingming Cao static int ext4_write_dquot(struct dquot *dquot); 1443617ba13bSMingming Cao static int ext4_acquire_dquot(struct dquot *dquot); 1444617ba13bSMingming Cao static int ext4_release_dquot(struct dquot *dquot); 1445617ba13bSMingming Cao static int ext4_mark_dquot_dirty(struct dquot *dquot); 1446617ba13bSMingming Cao static int ext4_write_info(struct super_block *sb, int type); 14476f28e087SJan Kara static int ext4_quota_on(struct super_block *sb, int type, int format_id, 14488c54ca9cSAl Viro const struct path *path); 1449617ba13bSMingming Cao static int ext4_quota_on_mount(struct super_block *sb, int type); 1450617ba13bSMingming Cao static ssize_t ext4_quota_read(struct super_block *sb, int type, char *data, 1451ac27a0ecSDave Kleikamp size_t len, loff_t off); 1452617ba13bSMingming Cao static ssize_t ext4_quota_write(struct super_block *sb, int type, 1453ac27a0ecSDave Kleikamp const char *data, size_t len, loff_t off); 14547c319d32SAditya Kali static int ext4_quota_enable(struct super_block *sb, int type, int format_id, 14557c319d32SAditya Kali unsigned int flags); 14567c319d32SAditya Kali static int ext4_enable_quotas(struct super_block *sb); 1457ac27a0ecSDave Kleikamp 145896c7e0d9SJan Kara static struct dquot **ext4_get_dquots(struct inode *inode) 145996c7e0d9SJan Kara { 146096c7e0d9SJan Kara return EXT4_I(inode)->i_dquot; 146196c7e0d9SJan Kara } 146296c7e0d9SJan Kara 146361e225dcSAlexey Dobriyan static const struct dquot_operations ext4_quota_operations = { 146460e58e0fSMingming Cao .get_reserved_space = ext4_get_reserved_space, 1465617ba13bSMingming Cao .write_dquot = ext4_write_dquot, 1466617ba13bSMingming Cao .acquire_dquot = ext4_acquire_dquot, 1467617ba13bSMingming Cao .release_dquot = ext4_release_dquot, 1468617ba13bSMingming Cao .mark_dirty = ext4_mark_dquot_dirty, 1469a5b5ee32SJan Kara .write_info = ext4_write_info, 1470a5b5ee32SJan Kara .alloc_dquot = dquot_alloc, 1471a5b5ee32SJan Kara .destroy_dquot = dquot_destroy, 1472040cb378SLi Xi .get_projid = ext4_get_projid, 14737a9ca53aSTahsin Erdogan .get_inode_usage = ext4_get_inode_usage, 1474ebc11f7bSChengguang Xu .get_next_id = dquot_get_next_id, 1475ac27a0ecSDave Kleikamp }; 1476ac27a0ecSDave Kleikamp 14770d54b217SAlexey Dobriyan static const struct quotactl_ops ext4_qctl_operations = { 1478617ba13bSMingming Cao .quota_on = ext4_quota_on, 1479ca0e05e4SDmitry Monakhov .quota_off = ext4_quota_off, 1480287a8095SChristoph Hellwig .quota_sync = dquot_quota_sync, 14810a240339SJan Kara .get_state = dquot_get_state, 1482287a8095SChristoph Hellwig .set_info = dquot_set_dqinfo, 1483287a8095SChristoph Hellwig .get_dqblk = dquot_get_dqblk, 14846332b9b5SEric Sandeen .set_dqblk = dquot_set_dqblk, 14856332b9b5SEric Sandeen .get_nextdqblk = dquot_get_next_dqblk, 1486ac27a0ecSDave Kleikamp }; 1487ac27a0ecSDave Kleikamp #endif 1488ac27a0ecSDave Kleikamp 1489ee9b6d61SJosef 'Jeff' Sipek static const struct super_operations ext4_sops = { 1490617ba13bSMingming Cao .alloc_inode = ext4_alloc_inode, 149194053139SAl Viro .free_inode = ext4_free_in_core_inode, 1492617ba13bSMingming Cao .destroy_inode = ext4_destroy_inode, 1493617ba13bSMingming Cao .write_inode = ext4_write_inode, 1494617ba13bSMingming Cao .dirty_inode = ext4_dirty_inode, 14957ff9c073STheodore Ts'o .drop_inode = ext4_drop_inode, 14960930fcc1SAl Viro .evict_inode = ext4_evict_inode, 1497617ba13bSMingming Cao .put_super = ext4_put_super, 1498617ba13bSMingming Cao .sync_fs = ext4_sync_fs, 1499c4be0c1dSTakashi Sato .freeze_fs = ext4_freeze, 1500c4be0c1dSTakashi Sato .unfreeze_fs = ext4_unfreeze, 1501617ba13bSMingming Cao .statfs = ext4_statfs, 1502617ba13bSMingming Cao .remount_fs = ext4_remount, 1503617ba13bSMingming Cao .show_options = ext4_show_options, 1504ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA 1505617ba13bSMingming Cao .quota_read = ext4_quota_read, 1506617ba13bSMingming Cao .quota_write = ext4_quota_write, 150796c7e0d9SJan Kara .get_dquots = ext4_get_dquots, 1508ac27a0ecSDave Kleikamp #endif 1509c39a7f84SToshiyuki Okajima .bdev_try_to_free_page = bdev_try_to_free_page, 1510ac27a0ecSDave Kleikamp }; 1511ac27a0ecSDave Kleikamp 151239655164SChristoph Hellwig static const struct export_operations ext4_export_ops = { 15131b961ac0SChristoph Hellwig .fh_to_dentry = ext4_fh_to_dentry, 15141b961ac0SChristoph Hellwig .fh_to_parent = ext4_fh_to_parent, 1515617ba13bSMingming Cao .get_parent = ext4_get_parent, 1516fde87268STheodore Ts'o .commit_metadata = ext4_nfs_commit_metadata, 1517ac27a0ecSDave Kleikamp }; 1518ac27a0ecSDave Kleikamp 1519ac27a0ecSDave Kleikamp enum { 1520ac27a0ecSDave Kleikamp Opt_bsd_df, Opt_minix_df, Opt_grpid, Opt_nogrpid, 1521ac27a0ecSDave Kleikamp Opt_resgid, Opt_resuid, Opt_sb, Opt_err_cont, Opt_err_panic, Opt_err_ro, 152272578c33STheodore Ts'o Opt_nouid32, Opt_debug, Opt_removed, 1523ac27a0ecSDave Kleikamp Opt_user_xattr, Opt_nouser_xattr, Opt_acl, Opt_noacl, 152472578c33STheodore Ts'o Opt_auto_da_alloc, Opt_noauto_da_alloc, Opt_noload, 1525ad4eec61SEric Sandeen Opt_commit, Opt_min_batch_time, Opt_max_batch_time, Opt_journal_dev, 1526ad4eec61SEric Sandeen Opt_journal_path, Opt_journal_checksum, Opt_journal_async_commit, 1527ac27a0ecSDave Kleikamp Opt_abort, Opt_data_journal, Opt_data_ordered, Opt_data_writeback, 15286ddb2447STheodore Ts'o Opt_data_err_abort, Opt_data_err_ignore, Opt_test_dummy_encryption, 1529ac27a0ecSDave Kleikamp Opt_usrjquota, Opt_grpjquota, Opt_offusrjquota, Opt_offgrpjquota, 15305a20bdfcSJan Kara Opt_jqfmt_vfsold, Opt_jqfmt_vfsv0, Opt_jqfmt_vfsv1, Opt_quota, 1531ee4a3fcdSTheodore Ts'o Opt_noquota, Opt_barrier, Opt_nobarrier, Opt_err, 153249da9392SJan Kara Opt_usrquota, Opt_grpquota, Opt_prjquota, Opt_i_version, Opt_dax, 1533327eaf73STheodore Ts'o Opt_stripe, Opt_delalloc, Opt_nodelalloc, Opt_warn_on_error, 1534327eaf73STheodore Ts'o Opt_nowarn_on_error, Opt_mblk_io_submit, 1535670e9875STheodore Ts'o Opt_lazytime, Opt_nolazytime, Opt_debug_want_extra_isize, 15361449032bSTheodore Ts'o Opt_nomblk_io_submit, Opt_block_validity, Opt_noblock_validity, 15375328e635SEric Sandeen Opt_inode_readahead_blks, Opt_journal_ioprio, 1538744692dcSJiaying Zhang Opt_dioread_nolock, Opt_dioread_lock, 1539fc6cb1cdSTheodore Ts'o Opt_discard, Opt_nodiscard, Opt_init_itable, Opt_noinit_itable, 1540cdb7ee4cSTahsin Erdogan Opt_max_dir_size_kb, Opt_nojournal_checksum, Opt_nombcache, 1541ac27a0ecSDave Kleikamp }; 1542ac27a0ecSDave Kleikamp 1543a447c093SSteven Whitehouse static const match_table_t tokens = { 1544ac27a0ecSDave Kleikamp {Opt_bsd_df, "bsddf"}, 1545ac27a0ecSDave Kleikamp {Opt_minix_df, "minixdf"}, 1546ac27a0ecSDave Kleikamp {Opt_grpid, "grpid"}, 1547ac27a0ecSDave Kleikamp {Opt_grpid, "bsdgroups"}, 1548ac27a0ecSDave Kleikamp {Opt_nogrpid, "nogrpid"}, 1549ac27a0ecSDave Kleikamp {Opt_nogrpid, "sysvgroups"}, 1550ac27a0ecSDave Kleikamp {Opt_resgid, "resgid=%u"}, 1551ac27a0ecSDave Kleikamp {Opt_resuid, "resuid=%u"}, 1552ac27a0ecSDave Kleikamp {Opt_sb, "sb=%u"}, 1553ac27a0ecSDave Kleikamp {Opt_err_cont, "errors=continue"}, 1554ac27a0ecSDave Kleikamp {Opt_err_panic, "errors=panic"}, 1555ac27a0ecSDave Kleikamp {Opt_err_ro, "errors=remount-ro"}, 1556ac27a0ecSDave Kleikamp {Opt_nouid32, "nouid32"}, 1557ac27a0ecSDave Kleikamp {Opt_debug, "debug"}, 155872578c33STheodore Ts'o {Opt_removed, "oldalloc"}, 155972578c33STheodore Ts'o {Opt_removed, "orlov"}, 1560ac27a0ecSDave Kleikamp {Opt_user_xattr, "user_xattr"}, 1561ac27a0ecSDave Kleikamp {Opt_nouser_xattr, "nouser_xattr"}, 1562ac27a0ecSDave Kleikamp {Opt_acl, "acl"}, 1563ac27a0ecSDave Kleikamp {Opt_noacl, "noacl"}, 1564e3bb52aeSEric Sandeen {Opt_noload, "norecovery"}, 15655a916be1STheodore Ts'o {Opt_noload, "noload"}, 156672578c33STheodore Ts'o {Opt_removed, "nobh"}, 156772578c33STheodore Ts'o {Opt_removed, "bh"}, 1568ac27a0ecSDave Kleikamp {Opt_commit, "commit=%u"}, 156930773840STheodore Ts'o {Opt_min_batch_time, "min_batch_time=%u"}, 157030773840STheodore Ts'o {Opt_max_batch_time, "max_batch_time=%u"}, 1571ac27a0ecSDave Kleikamp {Opt_journal_dev, "journal_dev=%u"}, 1572ad4eec61SEric Sandeen {Opt_journal_path, "journal_path=%s"}, 1573818d276cSGirish Shilamkar {Opt_journal_checksum, "journal_checksum"}, 1574c6d3d56dSDarrick J. Wong {Opt_nojournal_checksum, "nojournal_checksum"}, 1575818d276cSGirish Shilamkar {Opt_journal_async_commit, "journal_async_commit"}, 1576ac27a0ecSDave Kleikamp {Opt_abort, "abort"}, 1577ac27a0ecSDave Kleikamp {Opt_data_journal, "data=journal"}, 1578ac27a0ecSDave Kleikamp {Opt_data_ordered, "data=ordered"}, 1579ac27a0ecSDave Kleikamp {Opt_data_writeback, "data=writeback"}, 15805bf5683aSHidehiro Kawai {Opt_data_err_abort, "data_err=abort"}, 15815bf5683aSHidehiro Kawai {Opt_data_err_ignore, "data_err=ignore"}, 1582ac27a0ecSDave Kleikamp {Opt_offusrjquota, "usrjquota="}, 1583ac27a0ecSDave Kleikamp {Opt_usrjquota, "usrjquota=%s"}, 1584ac27a0ecSDave Kleikamp {Opt_offgrpjquota, "grpjquota="}, 1585ac27a0ecSDave Kleikamp {Opt_grpjquota, "grpjquota=%s"}, 1586ac27a0ecSDave Kleikamp {Opt_jqfmt_vfsold, "jqfmt=vfsold"}, 1587ac27a0ecSDave Kleikamp {Opt_jqfmt_vfsv0, "jqfmt=vfsv0"}, 15885a20bdfcSJan Kara {Opt_jqfmt_vfsv1, "jqfmt=vfsv1"}, 1589ac27a0ecSDave Kleikamp {Opt_grpquota, "grpquota"}, 1590ac27a0ecSDave Kleikamp {Opt_noquota, "noquota"}, 1591ac27a0ecSDave Kleikamp {Opt_quota, "quota"}, 1592ac27a0ecSDave Kleikamp {Opt_usrquota, "usrquota"}, 159349da9392SJan Kara {Opt_prjquota, "prjquota"}, 1594ac27a0ecSDave Kleikamp {Opt_barrier, "barrier=%u"}, 159506705bffSTheodore Ts'o {Opt_barrier, "barrier"}, 159606705bffSTheodore Ts'o {Opt_nobarrier, "nobarrier"}, 159725ec56b5SJean Noel Cordenner {Opt_i_version, "i_version"}, 1598923ae0ffSRoss Zwisler {Opt_dax, "dax"}, 1599c9de560dSAlex Tomas {Opt_stripe, "stripe=%u"}, 160064769240SAlex Tomas {Opt_delalloc, "delalloc"}, 1601327eaf73STheodore Ts'o {Opt_warn_on_error, "warn_on_error"}, 1602327eaf73STheodore Ts'o {Opt_nowarn_on_error, "nowarn_on_error"}, 1603a26f4992STheodore Ts'o {Opt_lazytime, "lazytime"}, 1604a26f4992STheodore Ts'o {Opt_nolazytime, "nolazytime"}, 1605670e9875STheodore Ts'o {Opt_debug_want_extra_isize, "debug_want_extra_isize=%u"}, 1606dd919b98SAneesh Kumar K.V {Opt_nodelalloc, "nodelalloc"}, 160736ade451SJan Kara {Opt_removed, "mblk_io_submit"}, 160836ade451SJan Kara {Opt_removed, "nomblk_io_submit"}, 16096fd058f7STheodore Ts'o {Opt_block_validity, "block_validity"}, 16106fd058f7STheodore Ts'o {Opt_noblock_validity, "noblock_validity"}, 1611240799cdSTheodore Ts'o {Opt_inode_readahead_blks, "inode_readahead_blks=%u"}, 1612b3881f74STheodore Ts'o {Opt_journal_ioprio, "journal_ioprio=%u"}, 1613afd4672dSTheodore Ts'o {Opt_auto_da_alloc, "auto_da_alloc=%u"}, 161406705bffSTheodore Ts'o {Opt_auto_da_alloc, "auto_da_alloc"}, 161506705bffSTheodore Ts'o {Opt_noauto_da_alloc, "noauto_da_alloc"}, 1616744692dcSJiaying Zhang {Opt_dioread_nolock, "dioread_nolock"}, 1617744692dcSJiaying Zhang {Opt_dioread_lock, "dioread_lock"}, 16185328e635SEric Sandeen {Opt_discard, "discard"}, 16195328e635SEric Sandeen {Opt_nodiscard, "nodiscard"}, 1620fc6cb1cdSTheodore Ts'o {Opt_init_itable, "init_itable=%u"}, 1621fc6cb1cdSTheodore Ts'o {Opt_init_itable, "init_itable"}, 1622fc6cb1cdSTheodore Ts'o {Opt_noinit_itable, "noinit_itable"}, 1623df981d03STheodore Ts'o {Opt_max_dir_size_kb, "max_dir_size_kb=%u"}, 16246ddb2447STheodore Ts'o {Opt_test_dummy_encryption, "test_dummy_encryption"}, 1625cdb7ee4cSTahsin Erdogan {Opt_nombcache, "nombcache"}, 1626cdb7ee4cSTahsin Erdogan {Opt_nombcache, "no_mbcache"}, /* for backward compatibility */ 1627c7198b9cSTheodore Ts'o {Opt_removed, "check=none"}, /* mount option from ext2/3 */ 1628c7198b9cSTheodore Ts'o {Opt_removed, "nocheck"}, /* mount option from ext2/3 */ 1629c7198b9cSTheodore Ts'o {Opt_removed, "reservation"}, /* mount option from ext2/3 */ 1630c7198b9cSTheodore Ts'o {Opt_removed, "noreservation"}, /* mount option from ext2/3 */ 1631c7198b9cSTheodore Ts'o {Opt_removed, "journal=%u"}, /* mount option from ext2/3 */ 1632f3f12faaSJosef Bacik {Opt_err, NULL}, 1633ac27a0ecSDave Kleikamp }; 1634ac27a0ecSDave Kleikamp 1635617ba13bSMingming Cao static ext4_fsblk_t get_sb_block(void **data) 1636ac27a0ecSDave Kleikamp { 1637617ba13bSMingming Cao ext4_fsblk_t sb_block; 1638ac27a0ecSDave Kleikamp char *options = (char *) *data; 1639ac27a0ecSDave Kleikamp 1640ac27a0ecSDave Kleikamp if (!options || strncmp(options, "sb=", 3) != 0) 1641ac27a0ecSDave Kleikamp return 1; /* Default location */ 16420b8e58a1SAndreas Dilger 1643ac27a0ecSDave Kleikamp options += 3; 16440b8e58a1SAndreas Dilger /* TODO: use simple_strtoll with >32bit ext4 */ 1645ac27a0ecSDave Kleikamp sb_block = simple_strtoul(options, &options, 0); 1646ac27a0ecSDave Kleikamp if (*options && *options != ',') { 16474776004fSTheodore Ts'o printk(KERN_ERR "EXT4-fs: Invalid sb specification: %s\n", 1648ac27a0ecSDave Kleikamp (char *) *data); 1649ac27a0ecSDave Kleikamp return 1; 1650ac27a0ecSDave Kleikamp } 1651ac27a0ecSDave Kleikamp if (*options == ',') 1652ac27a0ecSDave Kleikamp options++; 1653ac27a0ecSDave Kleikamp *data = (void *) options; 16540b8e58a1SAndreas Dilger 1655ac27a0ecSDave Kleikamp return sb_block; 1656ac27a0ecSDave Kleikamp } 1657ac27a0ecSDave Kleikamp 1658b3881f74STheodore Ts'o #define DEFAULT_JOURNAL_IOPRIO (IOPRIO_PRIO_VALUE(IOPRIO_CLASS_BE, 3)) 1659d6006186SEric Biggers static const char deprecated_msg[] = 1660d6006186SEric Biggers "Mount option \"%s\" will be removed by %s\n" 1661437ca0fdSDmitry Monakhov "Contact linux-ext4@vger.kernel.org if you think we should keep it.\n"; 1662b3881f74STheodore Ts'o 166356c50f11SDmitry Monakhov #ifdef CONFIG_QUOTA 166456c50f11SDmitry Monakhov static int set_qf_name(struct super_block *sb, int qtype, substring_t *args) 166556c50f11SDmitry Monakhov { 166656c50f11SDmitry Monakhov struct ext4_sb_info *sbi = EXT4_SB(sb); 166733458eabSTheodore Ts'o char *qname, *old_qname = get_qf_name(sb, sbi, qtype); 166803dafb5fSChen Gang int ret = -1; 166956c50f11SDmitry Monakhov 167033458eabSTheodore Ts'o if (sb_any_quota_loaded(sb) && !old_qname) { 167156c50f11SDmitry Monakhov ext4_msg(sb, KERN_ERR, 167256c50f11SDmitry Monakhov "Cannot change journaled " 167356c50f11SDmitry Monakhov "quota options when quota turned on"); 167457f73c2cSTheodore Ts'o return -1; 167556c50f11SDmitry Monakhov } 1676e2b911c5SDarrick J. Wong if (ext4_has_feature_quota(sb)) { 1677c325a67cSTheodore Ts'o ext4_msg(sb, KERN_INFO, "Journaled quota options " 1678c325a67cSTheodore Ts'o "ignored when QUOTA feature is enabled"); 1679c325a67cSTheodore Ts'o return 1; 1680262b4662SJan Kara } 168156c50f11SDmitry Monakhov qname = match_strdup(args); 168256c50f11SDmitry Monakhov if (!qname) { 168356c50f11SDmitry Monakhov ext4_msg(sb, KERN_ERR, 168456c50f11SDmitry Monakhov "Not enough memory for storing quotafile name"); 168557f73c2cSTheodore Ts'o return -1; 168656c50f11SDmitry Monakhov } 168733458eabSTheodore Ts'o if (old_qname) { 168833458eabSTheodore Ts'o if (strcmp(old_qname, qname) == 0) 168903dafb5fSChen Gang ret = 1; 169003dafb5fSChen Gang else 169156c50f11SDmitry Monakhov ext4_msg(sb, KERN_ERR, 169203dafb5fSChen Gang "%s quota file already specified", 169303dafb5fSChen Gang QTYPE2NAME(qtype)); 169403dafb5fSChen Gang goto errout; 169556c50f11SDmitry Monakhov } 169603dafb5fSChen Gang if (strchr(qname, '/')) { 169756c50f11SDmitry Monakhov ext4_msg(sb, KERN_ERR, 169856c50f11SDmitry Monakhov "quotafile must be on filesystem root"); 169903dafb5fSChen Gang goto errout; 170056c50f11SDmitry Monakhov } 170133458eabSTheodore Ts'o rcu_assign_pointer(sbi->s_qf_names[qtype], qname); 1702fd8c37ecSTheodore Ts'o set_opt(sb, QUOTA); 170356c50f11SDmitry Monakhov return 1; 170403dafb5fSChen Gang errout: 170503dafb5fSChen Gang kfree(qname); 170603dafb5fSChen Gang return ret; 170756c50f11SDmitry Monakhov } 170856c50f11SDmitry Monakhov 170956c50f11SDmitry Monakhov static int clear_qf_name(struct super_block *sb, int qtype) 171056c50f11SDmitry Monakhov { 171156c50f11SDmitry Monakhov 171256c50f11SDmitry Monakhov struct ext4_sb_info *sbi = EXT4_SB(sb); 171333458eabSTheodore Ts'o char *old_qname = get_qf_name(sb, sbi, qtype); 171456c50f11SDmitry Monakhov 171533458eabSTheodore Ts'o if (sb_any_quota_loaded(sb) && old_qname) { 171656c50f11SDmitry Monakhov ext4_msg(sb, KERN_ERR, "Cannot change journaled quota options" 171756c50f11SDmitry Monakhov " when quota turned on"); 171857f73c2cSTheodore Ts'o return -1; 171956c50f11SDmitry Monakhov } 172033458eabSTheodore Ts'o rcu_assign_pointer(sbi->s_qf_names[qtype], NULL); 172133458eabSTheodore Ts'o synchronize_rcu(); 172233458eabSTheodore Ts'o kfree(old_qname); 172356c50f11SDmitry Monakhov return 1; 172456c50f11SDmitry Monakhov } 172556c50f11SDmitry Monakhov #endif 172656c50f11SDmitry Monakhov 172726092bf5STheodore Ts'o #define MOPT_SET 0x0001 172826092bf5STheodore Ts'o #define MOPT_CLEAR 0x0002 172926092bf5STheodore Ts'o #define MOPT_NOSUPPORT 0x0004 173026092bf5STheodore Ts'o #define MOPT_EXPLICIT 0x0008 173126092bf5STheodore Ts'o #define MOPT_CLEAR_ERR 0x0010 173226092bf5STheodore Ts'o #define MOPT_GTE0 0x0020 173326092bf5STheodore Ts'o #ifdef CONFIG_QUOTA 173426092bf5STheodore Ts'o #define MOPT_Q 0 173526092bf5STheodore Ts'o #define MOPT_QFMT 0x0040 173626092bf5STheodore Ts'o #else 173726092bf5STheodore Ts'o #define MOPT_Q MOPT_NOSUPPORT 173826092bf5STheodore Ts'o #define MOPT_QFMT MOPT_NOSUPPORT 173926092bf5STheodore Ts'o #endif 174026092bf5STheodore Ts'o #define MOPT_DATAJ 0x0080 17418dc0aa8cSTheodore Ts'o #define MOPT_NO_EXT2 0x0100 17428dc0aa8cSTheodore Ts'o #define MOPT_NO_EXT3 0x0200 17438dc0aa8cSTheodore Ts'o #define MOPT_EXT4_ONLY (MOPT_NO_EXT2 | MOPT_NO_EXT3) 1744ad4eec61SEric Sandeen #define MOPT_STRING 0x0400 174526092bf5STheodore Ts'o 174626092bf5STheodore Ts'o static const struct mount_opts { 174726092bf5STheodore Ts'o int token; 174826092bf5STheodore Ts'o int mount_opt; 174926092bf5STheodore Ts'o int flags; 175026092bf5STheodore Ts'o } ext4_mount_opts[] = { 175126092bf5STheodore Ts'o {Opt_minix_df, EXT4_MOUNT_MINIX_DF, MOPT_SET}, 175226092bf5STheodore Ts'o {Opt_bsd_df, EXT4_MOUNT_MINIX_DF, MOPT_CLEAR}, 175326092bf5STheodore Ts'o {Opt_grpid, EXT4_MOUNT_GRPID, MOPT_SET}, 175426092bf5STheodore Ts'o {Opt_nogrpid, EXT4_MOUNT_GRPID, MOPT_CLEAR}, 175526092bf5STheodore Ts'o {Opt_block_validity, EXT4_MOUNT_BLOCK_VALIDITY, MOPT_SET}, 175626092bf5STheodore Ts'o {Opt_noblock_validity, EXT4_MOUNT_BLOCK_VALIDITY, MOPT_CLEAR}, 17578dc0aa8cSTheodore Ts'o {Opt_dioread_nolock, EXT4_MOUNT_DIOREAD_NOLOCK, 17588dc0aa8cSTheodore Ts'o MOPT_EXT4_ONLY | MOPT_SET}, 17598dc0aa8cSTheodore Ts'o {Opt_dioread_lock, EXT4_MOUNT_DIOREAD_NOLOCK, 17608dc0aa8cSTheodore Ts'o MOPT_EXT4_ONLY | MOPT_CLEAR}, 176126092bf5STheodore Ts'o {Opt_discard, EXT4_MOUNT_DISCARD, MOPT_SET}, 176226092bf5STheodore Ts'o {Opt_nodiscard, EXT4_MOUNT_DISCARD, MOPT_CLEAR}, 17638dc0aa8cSTheodore Ts'o {Opt_delalloc, EXT4_MOUNT_DELALLOC, 17648dc0aa8cSTheodore Ts'o MOPT_EXT4_ONLY | MOPT_SET | MOPT_EXPLICIT}, 17658dc0aa8cSTheodore Ts'o {Opt_nodelalloc, EXT4_MOUNT_DELALLOC, 176659d9fa5cSTheodore Ts'o MOPT_EXT4_ONLY | MOPT_CLEAR}, 1767327eaf73STheodore Ts'o {Opt_warn_on_error, EXT4_MOUNT_WARN_ON_ERROR, MOPT_SET}, 1768327eaf73STheodore Ts'o {Opt_nowarn_on_error, EXT4_MOUNT_WARN_ON_ERROR, MOPT_CLEAR}, 1769c6d3d56dSDarrick J. Wong {Opt_nojournal_checksum, EXT4_MOUNT_JOURNAL_CHECKSUM, 1770c6d3d56dSDarrick J. Wong MOPT_EXT4_ONLY | MOPT_CLEAR}, 17718dc0aa8cSTheodore Ts'o {Opt_journal_checksum, EXT4_MOUNT_JOURNAL_CHECKSUM, 17721e381f60SDmitry Monakhov MOPT_EXT4_ONLY | MOPT_SET | MOPT_EXPLICIT}, 177326092bf5STheodore Ts'o {Opt_journal_async_commit, (EXT4_MOUNT_JOURNAL_ASYNC_COMMIT | 17748dc0aa8cSTheodore Ts'o EXT4_MOUNT_JOURNAL_CHECKSUM), 17751e381f60SDmitry Monakhov MOPT_EXT4_ONLY | MOPT_SET | MOPT_EXPLICIT}, 17768dc0aa8cSTheodore Ts'o {Opt_noload, EXT4_MOUNT_NOLOAD, MOPT_NO_EXT2 | MOPT_SET}, 177726092bf5STheodore Ts'o {Opt_err_panic, EXT4_MOUNT_ERRORS_PANIC, MOPT_SET | MOPT_CLEAR_ERR}, 177826092bf5STheodore Ts'o {Opt_err_ro, EXT4_MOUNT_ERRORS_RO, MOPT_SET | MOPT_CLEAR_ERR}, 177926092bf5STheodore Ts'o {Opt_err_cont, EXT4_MOUNT_ERRORS_CONT, MOPT_SET | MOPT_CLEAR_ERR}, 17808dc0aa8cSTheodore Ts'o {Opt_data_err_abort, EXT4_MOUNT_DATA_ERR_ABORT, 17817915a861SAles Novak MOPT_NO_EXT2}, 17828dc0aa8cSTheodore Ts'o {Opt_data_err_ignore, EXT4_MOUNT_DATA_ERR_ABORT, 17837915a861SAles Novak MOPT_NO_EXT2}, 178426092bf5STheodore Ts'o {Opt_barrier, EXT4_MOUNT_BARRIER, MOPT_SET}, 178526092bf5STheodore Ts'o {Opt_nobarrier, EXT4_MOUNT_BARRIER, MOPT_CLEAR}, 178626092bf5STheodore Ts'o {Opt_noauto_da_alloc, EXT4_MOUNT_NO_AUTO_DA_ALLOC, MOPT_SET}, 178726092bf5STheodore Ts'o {Opt_auto_da_alloc, EXT4_MOUNT_NO_AUTO_DA_ALLOC, MOPT_CLEAR}, 178826092bf5STheodore Ts'o {Opt_noinit_itable, EXT4_MOUNT_INIT_INODE_TABLE, MOPT_CLEAR}, 178926092bf5STheodore Ts'o {Opt_commit, 0, MOPT_GTE0}, 179026092bf5STheodore Ts'o {Opt_max_batch_time, 0, MOPT_GTE0}, 179126092bf5STheodore Ts'o {Opt_min_batch_time, 0, MOPT_GTE0}, 179226092bf5STheodore Ts'o {Opt_inode_readahead_blks, 0, MOPT_GTE0}, 179326092bf5STheodore Ts'o {Opt_init_itable, 0, MOPT_GTE0}, 1794923ae0ffSRoss Zwisler {Opt_dax, EXT4_MOUNT_DAX, MOPT_SET}, 179526092bf5STheodore Ts'o {Opt_stripe, 0, MOPT_GTE0}, 17960efb3b23SJan Kara {Opt_resuid, 0, MOPT_GTE0}, 17970efb3b23SJan Kara {Opt_resgid, 0, MOPT_GTE0}, 17985ba92bcfSCarlos Maiolino {Opt_journal_dev, 0, MOPT_NO_EXT2 | MOPT_GTE0}, 17995ba92bcfSCarlos Maiolino {Opt_journal_path, 0, MOPT_NO_EXT2 | MOPT_STRING}, 18005ba92bcfSCarlos Maiolino {Opt_journal_ioprio, 0, MOPT_NO_EXT2 | MOPT_GTE0}, 18018dc0aa8cSTheodore Ts'o {Opt_data_journal, EXT4_MOUNT_JOURNAL_DATA, MOPT_NO_EXT2 | MOPT_DATAJ}, 18028dc0aa8cSTheodore Ts'o {Opt_data_ordered, EXT4_MOUNT_ORDERED_DATA, MOPT_NO_EXT2 | MOPT_DATAJ}, 18038dc0aa8cSTheodore Ts'o {Opt_data_writeback, EXT4_MOUNT_WRITEBACK_DATA, 18048dc0aa8cSTheodore Ts'o MOPT_NO_EXT2 | MOPT_DATAJ}, 180526092bf5STheodore Ts'o {Opt_user_xattr, EXT4_MOUNT_XATTR_USER, MOPT_SET}, 180626092bf5STheodore Ts'o {Opt_nouser_xattr, EXT4_MOUNT_XATTR_USER, MOPT_CLEAR}, 180726092bf5STheodore Ts'o #ifdef CONFIG_EXT4_FS_POSIX_ACL 180826092bf5STheodore Ts'o {Opt_acl, EXT4_MOUNT_POSIX_ACL, MOPT_SET}, 180926092bf5STheodore Ts'o {Opt_noacl, EXT4_MOUNT_POSIX_ACL, MOPT_CLEAR}, 181026092bf5STheodore Ts'o #else 181126092bf5STheodore Ts'o {Opt_acl, 0, MOPT_NOSUPPORT}, 181226092bf5STheodore Ts'o {Opt_noacl, 0, MOPT_NOSUPPORT}, 181326092bf5STheodore Ts'o #endif 181426092bf5STheodore Ts'o {Opt_nouid32, EXT4_MOUNT_NO_UID32, MOPT_SET}, 181526092bf5STheodore Ts'o {Opt_debug, EXT4_MOUNT_DEBUG, MOPT_SET}, 1816670e9875STheodore Ts'o {Opt_debug_want_extra_isize, 0, MOPT_GTE0}, 181726092bf5STheodore Ts'o {Opt_quota, EXT4_MOUNT_QUOTA | EXT4_MOUNT_USRQUOTA, MOPT_SET | MOPT_Q}, 181826092bf5STheodore Ts'o {Opt_usrquota, EXT4_MOUNT_QUOTA | EXT4_MOUNT_USRQUOTA, 181926092bf5STheodore Ts'o MOPT_SET | MOPT_Q}, 182026092bf5STheodore Ts'o {Opt_grpquota, EXT4_MOUNT_QUOTA | EXT4_MOUNT_GRPQUOTA, 182126092bf5STheodore Ts'o MOPT_SET | MOPT_Q}, 182249da9392SJan Kara {Opt_prjquota, EXT4_MOUNT_QUOTA | EXT4_MOUNT_PRJQUOTA, 182349da9392SJan Kara MOPT_SET | MOPT_Q}, 182426092bf5STheodore Ts'o {Opt_noquota, (EXT4_MOUNT_QUOTA | EXT4_MOUNT_USRQUOTA | 182549da9392SJan Kara EXT4_MOUNT_GRPQUOTA | EXT4_MOUNT_PRJQUOTA), 182649da9392SJan Kara MOPT_CLEAR | MOPT_Q}, 182726092bf5STheodore Ts'o {Opt_usrjquota, 0, MOPT_Q}, 182826092bf5STheodore Ts'o {Opt_grpjquota, 0, MOPT_Q}, 182926092bf5STheodore Ts'o {Opt_offusrjquota, 0, MOPT_Q}, 183026092bf5STheodore Ts'o {Opt_offgrpjquota, 0, MOPT_Q}, 183126092bf5STheodore Ts'o {Opt_jqfmt_vfsold, QFMT_VFS_OLD, MOPT_QFMT}, 183226092bf5STheodore Ts'o {Opt_jqfmt_vfsv0, QFMT_VFS_V0, MOPT_QFMT}, 183326092bf5STheodore Ts'o {Opt_jqfmt_vfsv1, QFMT_VFS_V1, MOPT_QFMT}, 1834df981d03STheodore Ts'o {Opt_max_dir_size_kb, 0, MOPT_GTE0}, 18356ddb2447STheodore Ts'o {Opt_test_dummy_encryption, 0, MOPT_GTE0}, 1836cdb7ee4cSTahsin Erdogan {Opt_nombcache, EXT4_MOUNT_NO_MBCACHE, MOPT_SET}, 183726092bf5STheodore Ts'o {Opt_err, 0, 0} 183826092bf5STheodore Ts'o }; 183926092bf5STheodore Ts'o 1840c83ad55eSGabriel Krisman Bertazi #ifdef CONFIG_UNICODE 1841c83ad55eSGabriel Krisman Bertazi static const struct ext4_sb_encodings { 1842c83ad55eSGabriel Krisman Bertazi __u16 magic; 1843c83ad55eSGabriel Krisman Bertazi char *name; 1844c83ad55eSGabriel Krisman Bertazi char *version; 1845c83ad55eSGabriel Krisman Bertazi } ext4_sb_encoding_map[] = { 1846c83ad55eSGabriel Krisman Bertazi {EXT4_ENC_UTF8_12_1, "utf8", "12.1.0"}, 1847c83ad55eSGabriel Krisman Bertazi }; 1848c83ad55eSGabriel Krisman Bertazi 1849c83ad55eSGabriel Krisman Bertazi static int ext4_sb_read_encoding(const struct ext4_super_block *es, 1850c83ad55eSGabriel Krisman Bertazi const struct ext4_sb_encodings **encoding, 1851c83ad55eSGabriel Krisman Bertazi __u16 *flags) 1852c83ad55eSGabriel Krisman Bertazi { 1853c83ad55eSGabriel Krisman Bertazi __u16 magic = le16_to_cpu(es->s_encoding); 1854c83ad55eSGabriel Krisman Bertazi int i; 1855c83ad55eSGabriel Krisman Bertazi 1856c83ad55eSGabriel Krisman Bertazi for (i = 0; i < ARRAY_SIZE(ext4_sb_encoding_map); i++) 1857c83ad55eSGabriel Krisman Bertazi if (magic == ext4_sb_encoding_map[i].magic) 1858c83ad55eSGabriel Krisman Bertazi break; 1859c83ad55eSGabriel Krisman Bertazi 1860c83ad55eSGabriel Krisman Bertazi if (i >= ARRAY_SIZE(ext4_sb_encoding_map)) 1861c83ad55eSGabriel Krisman Bertazi return -EINVAL; 1862c83ad55eSGabriel Krisman Bertazi 1863c83ad55eSGabriel Krisman Bertazi *encoding = &ext4_sb_encoding_map[i]; 1864c83ad55eSGabriel Krisman Bertazi *flags = le16_to_cpu(es->s_encoding_flags); 1865c83ad55eSGabriel Krisman Bertazi 1866c83ad55eSGabriel Krisman Bertazi return 0; 1867c83ad55eSGabriel Krisman Bertazi } 1868c83ad55eSGabriel Krisman Bertazi #endif 1869c83ad55eSGabriel Krisman Bertazi 187026092bf5STheodore Ts'o static int handle_mount_opt(struct super_block *sb, char *opt, int token, 187126092bf5STheodore Ts'o substring_t *args, unsigned long *journal_devnum, 187226092bf5STheodore Ts'o unsigned int *journal_ioprio, int is_remount) 187326092bf5STheodore Ts'o { 187426092bf5STheodore Ts'o struct ext4_sb_info *sbi = EXT4_SB(sb); 187526092bf5STheodore Ts'o const struct mount_opts *m; 187608cefc7aSEric W. Biederman kuid_t uid; 187708cefc7aSEric W. Biederman kgid_t gid; 187826092bf5STheodore Ts'o int arg = 0; 187926092bf5STheodore Ts'o 188057f73c2cSTheodore Ts'o #ifdef CONFIG_QUOTA 188157f73c2cSTheodore Ts'o if (token == Opt_usrjquota) 188257f73c2cSTheodore Ts'o return set_qf_name(sb, USRQUOTA, &args[0]); 188357f73c2cSTheodore Ts'o else if (token == Opt_grpjquota) 188457f73c2cSTheodore Ts'o return set_qf_name(sb, GRPQUOTA, &args[0]); 188557f73c2cSTheodore Ts'o else if (token == Opt_offusrjquota) 188657f73c2cSTheodore Ts'o return clear_qf_name(sb, USRQUOTA); 188757f73c2cSTheodore Ts'o else if (token == Opt_offgrpjquota) 188857f73c2cSTheodore Ts'o return clear_qf_name(sb, GRPQUOTA); 188957f73c2cSTheodore Ts'o #endif 189026092bf5STheodore Ts'o switch (token) { 1891f7048605STheodore Ts'o case Opt_noacl: 1892f7048605STheodore Ts'o case Opt_nouser_xattr: 1893f7048605STheodore Ts'o ext4_msg(sb, KERN_WARNING, deprecated_msg, opt, "3.5"); 1894f7048605STheodore Ts'o break; 189526092bf5STheodore Ts'o case Opt_sb: 189626092bf5STheodore Ts'o return 1; /* handled by get_sb_block() */ 189726092bf5STheodore Ts'o case Opt_removed: 18985f3633e3SJan Kara ext4_msg(sb, KERN_WARNING, "Ignoring removed %s option", opt); 189926092bf5STheodore Ts'o return 1; 190026092bf5STheodore Ts'o case Opt_abort: 190126092bf5STheodore Ts'o sbi->s_mount_flags |= EXT4_MF_FS_ABORTED; 190226092bf5STheodore Ts'o return 1; 190326092bf5STheodore Ts'o case Opt_i_version: 1904357fdad0SMatthew Garrett sb->s_flags |= SB_I_VERSION; 190526092bf5STheodore Ts'o return 1; 1906a26f4992STheodore Ts'o case Opt_lazytime: 19071751e8a6SLinus Torvalds sb->s_flags |= SB_LAZYTIME; 1908a26f4992STheodore Ts'o return 1; 1909a26f4992STheodore Ts'o case Opt_nolazytime: 19101751e8a6SLinus Torvalds sb->s_flags &= ~SB_LAZYTIME; 1911a26f4992STheodore Ts'o return 1; 191226092bf5STheodore Ts'o } 191326092bf5STheodore Ts'o 19145f3633e3SJan Kara for (m = ext4_mount_opts; m->token != Opt_err; m++) 19155f3633e3SJan Kara if (token == m->token) 19165f3633e3SJan Kara break; 19175f3633e3SJan Kara 19185f3633e3SJan Kara if (m->token == Opt_err) { 19195f3633e3SJan Kara ext4_msg(sb, KERN_ERR, "Unrecognized mount option \"%s\" " 19205f3633e3SJan Kara "or missing value", opt); 19215f3633e3SJan Kara return -1; 19225f3633e3SJan Kara } 19235f3633e3SJan Kara 19248dc0aa8cSTheodore Ts'o if ((m->flags & MOPT_NO_EXT2) && IS_EXT2_SB(sb)) { 19258dc0aa8cSTheodore Ts'o ext4_msg(sb, KERN_ERR, 19268dc0aa8cSTheodore Ts'o "Mount option \"%s\" incompatible with ext2", opt); 19278dc0aa8cSTheodore Ts'o return -1; 19288dc0aa8cSTheodore Ts'o } 19298dc0aa8cSTheodore Ts'o if ((m->flags & MOPT_NO_EXT3) && IS_EXT3_SB(sb)) { 19308dc0aa8cSTheodore Ts'o ext4_msg(sb, KERN_ERR, 19318dc0aa8cSTheodore Ts'o "Mount option \"%s\" incompatible with ext3", opt); 19328dc0aa8cSTheodore Ts'o return -1; 19338dc0aa8cSTheodore Ts'o } 19348dc0aa8cSTheodore Ts'o 1935ad4eec61SEric Sandeen if (args->from && !(m->flags & MOPT_STRING) && match_int(args, &arg)) 19360efb3b23SJan Kara return -1; 193726092bf5STheodore Ts'o if (args->from && (m->flags & MOPT_GTE0) && (arg < 0)) 193826092bf5STheodore Ts'o return -1; 1939c93cf2d7SDmitry Monakhov if (m->flags & MOPT_EXPLICIT) { 1940c93cf2d7SDmitry Monakhov if (m->mount_opt & EXT4_MOUNT_DELALLOC) { 194126092bf5STheodore Ts'o set_opt2(sb, EXPLICIT_DELALLOC); 19421e381f60SDmitry Monakhov } else if (m->mount_opt & EXT4_MOUNT_JOURNAL_CHECKSUM) { 19431e381f60SDmitry Monakhov set_opt2(sb, EXPLICIT_JOURNAL_CHECKSUM); 1944c93cf2d7SDmitry Monakhov } else 1945c93cf2d7SDmitry Monakhov return -1; 1946c93cf2d7SDmitry Monakhov } 194726092bf5STheodore Ts'o if (m->flags & MOPT_CLEAR_ERR) 194826092bf5STheodore Ts'o clear_opt(sb, ERRORS_MASK); 194926092bf5STheodore Ts'o if (token == Opt_noquota && sb_any_quota_loaded(sb)) { 195026092bf5STheodore Ts'o ext4_msg(sb, KERN_ERR, "Cannot change quota " 195126092bf5STheodore Ts'o "options when quota turned on"); 195226092bf5STheodore Ts'o return -1; 195326092bf5STheodore Ts'o } 195426092bf5STheodore Ts'o 195526092bf5STheodore Ts'o if (m->flags & MOPT_NOSUPPORT) { 195626092bf5STheodore Ts'o ext4_msg(sb, KERN_ERR, "%s option not supported", opt); 195726092bf5STheodore Ts'o } else if (token == Opt_commit) { 195826092bf5STheodore Ts'o if (arg == 0) 195926092bf5STheodore Ts'o arg = JBD2_DEFAULT_MAX_COMMIT_AGE; 19609ba55543Szhangyi (F) else if (arg > INT_MAX / HZ) { 19619ba55543Szhangyi (F) ext4_msg(sb, KERN_ERR, 19629ba55543Szhangyi (F) "Invalid commit interval %d, " 19639ba55543Szhangyi (F) "must be smaller than %d", 19649ba55543Szhangyi (F) arg, INT_MAX / HZ); 19659ba55543Szhangyi (F) return -1; 19669ba55543Szhangyi (F) } 196726092bf5STheodore Ts'o sbi->s_commit_interval = HZ * arg; 1968670e9875STheodore Ts'o } else if (token == Opt_debug_want_extra_isize) { 19699803387cSTheodore Ts'o if ((arg & 1) || 19709803387cSTheodore Ts'o (arg < 4) || 19719803387cSTheodore Ts'o (arg > (sbi->s_inode_size - EXT4_GOOD_OLD_INODE_SIZE))) { 19729803387cSTheodore Ts'o ext4_msg(sb, KERN_ERR, 19739803387cSTheodore Ts'o "Invalid want_extra_isize %d", arg); 19749803387cSTheodore Ts'o return -1; 19759803387cSTheodore Ts'o } 1976670e9875STheodore Ts'o sbi->s_want_extra_isize = arg; 197726092bf5STheodore Ts'o } else if (token == Opt_max_batch_time) { 197826092bf5STheodore Ts'o sbi->s_max_batch_time = arg; 197926092bf5STheodore Ts'o } else if (token == Opt_min_batch_time) { 198026092bf5STheodore Ts'o sbi->s_min_batch_time = arg; 198126092bf5STheodore Ts'o } else if (token == Opt_inode_readahead_blks) { 1982e33e60eaSJan Kara if (arg && (arg > (1 << 30) || !is_power_of_2(arg))) { 1983e33e60eaSJan Kara ext4_msg(sb, KERN_ERR, 1984e33e60eaSJan Kara "EXT4-fs: inode_readahead_blks must be " 1985e33e60eaSJan Kara "0 or a power of 2 smaller than 2^31"); 198626092bf5STheodore Ts'o return -1; 198726092bf5STheodore Ts'o } 198826092bf5STheodore Ts'o sbi->s_inode_readahead_blks = arg; 198926092bf5STheodore Ts'o } else if (token == Opt_init_itable) { 199026092bf5STheodore Ts'o set_opt(sb, INIT_INODE_TABLE); 199126092bf5STheodore Ts'o if (!args->from) 199226092bf5STheodore Ts'o arg = EXT4_DEF_LI_WAIT_MULT; 199326092bf5STheodore Ts'o sbi->s_li_wait_mult = arg; 1994df981d03STheodore Ts'o } else if (token == Opt_max_dir_size_kb) { 1995df981d03STheodore Ts'o sbi->s_max_dir_size_kb = arg; 199626092bf5STheodore Ts'o } else if (token == Opt_stripe) { 199726092bf5STheodore Ts'o sbi->s_stripe = arg; 19980efb3b23SJan Kara } else if (token == Opt_resuid) { 19990efb3b23SJan Kara uid = make_kuid(current_user_ns(), arg); 20000efb3b23SJan Kara if (!uid_valid(uid)) { 20015f3633e3SJan Kara ext4_msg(sb, KERN_ERR, "Invalid uid value %d", arg); 20020efb3b23SJan Kara return -1; 20030efb3b23SJan Kara } 20040efb3b23SJan Kara sbi->s_resuid = uid; 20050efb3b23SJan Kara } else if (token == Opt_resgid) { 20060efb3b23SJan Kara gid = make_kgid(current_user_ns(), arg); 20070efb3b23SJan Kara if (!gid_valid(gid)) { 20085f3633e3SJan Kara ext4_msg(sb, KERN_ERR, "Invalid gid value %d", arg); 20090efb3b23SJan Kara return -1; 20100efb3b23SJan Kara } 20110efb3b23SJan Kara sbi->s_resgid = gid; 20120efb3b23SJan Kara } else if (token == Opt_journal_dev) { 20130efb3b23SJan Kara if (is_remount) { 20140efb3b23SJan Kara ext4_msg(sb, KERN_ERR, 20150efb3b23SJan Kara "Cannot specify journal on remount"); 20160efb3b23SJan Kara return -1; 20170efb3b23SJan Kara } 20180efb3b23SJan Kara *journal_devnum = arg; 2019ad4eec61SEric Sandeen } else if (token == Opt_journal_path) { 2020ad4eec61SEric Sandeen char *journal_path; 2021ad4eec61SEric Sandeen struct inode *journal_inode; 2022ad4eec61SEric Sandeen struct path path; 2023ad4eec61SEric Sandeen int error; 2024ad4eec61SEric Sandeen 2025ad4eec61SEric Sandeen if (is_remount) { 2026ad4eec61SEric Sandeen ext4_msg(sb, KERN_ERR, 2027ad4eec61SEric Sandeen "Cannot specify journal on remount"); 2028ad4eec61SEric Sandeen return -1; 2029ad4eec61SEric Sandeen } 2030ad4eec61SEric Sandeen journal_path = match_strdup(&args[0]); 2031ad4eec61SEric Sandeen if (!journal_path) { 2032ad4eec61SEric Sandeen ext4_msg(sb, KERN_ERR, "error: could not dup " 2033ad4eec61SEric Sandeen "journal device string"); 2034ad4eec61SEric Sandeen return -1; 2035ad4eec61SEric Sandeen } 2036ad4eec61SEric Sandeen 2037ad4eec61SEric Sandeen error = kern_path(journal_path, LOOKUP_FOLLOW, &path); 2038ad4eec61SEric Sandeen if (error) { 2039ad4eec61SEric Sandeen ext4_msg(sb, KERN_ERR, "error: could not find " 2040ad4eec61SEric Sandeen "journal device path: error %d", error); 2041ad4eec61SEric Sandeen kfree(journal_path); 2042ad4eec61SEric Sandeen return -1; 2043ad4eec61SEric Sandeen } 2044ad4eec61SEric Sandeen 20452b0143b5SDavid Howells journal_inode = d_inode(path.dentry); 2046ad4eec61SEric Sandeen if (!S_ISBLK(journal_inode->i_mode)) { 2047ad4eec61SEric Sandeen ext4_msg(sb, KERN_ERR, "error: journal path %s " 2048ad4eec61SEric Sandeen "is not a block device", journal_path); 2049ad4eec61SEric Sandeen path_put(&path); 2050ad4eec61SEric Sandeen kfree(journal_path); 2051ad4eec61SEric Sandeen return -1; 2052ad4eec61SEric Sandeen } 2053ad4eec61SEric Sandeen 2054ad4eec61SEric Sandeen *journal_devnum = new_encode_dev(journal_inode->i_rdev); 2055ad4eec61SEric Sandeen path_put(&path); 2056ad4eec61SEric Sandeen kfree(journal_path); 20570efb3b23SJan Kara } else if (token == Opt_journal_ioprio) { 20580efb3b23SJan Kara if (arg > 7) { 20595f3633e3SJan Kara ext4_msg(sb, KERN_ERR, "Invalid journal IO priority" 20600efb3b23SJan Kara " (must be 0-7)"); 20610efb3b23SJan Kara return -1; 20620efb3b23SJan Kara } 20630efb3b23SJan Kara *journal_ioprio = 20640efb3b23SJan Kara IOPRIO_PRIO_VALUE(IOPRIO_CLASS_BE, arg); 20656ddb2447STheodore Ts'o } else if (token == Opt_test_dummy_encryption) { 2066643fa961SChandan Rajendra #ifdef CONFIG_FS_ENCRYPTION 20676ddb2447STheodore Ts'o sbi->s_mount_flags |= EXT4_MF_TEST_DUMMY_ENCRYPTION; 20686ddb2447STheodore Ts'o ext4_msg(sb, KERN_WARNING, 20696ddb2447STheodore Ts'o "Test dummy encryption mode enabled"); 20706ddb2447STheodore Ts'o #else 20716ddb2447STheodore Ts'o ext4_msg(sb, KERN_WARNING, 20726ddb2447STheodore Ts'o "Test dummy encryption mount option ignored"); 20736ddb2447STheodore Ts'o #endif 207426092bf5STheodore Ts'o } else if (m->flags & MOPT_DATAJ) { 207526092bf5STheodore Ts'o if (is_remount) { 207626092bf5STheodore Ts'o if (!sbi->s_journal) 207726092bf5STheodore Ts'o ext4_msg(sb, KERN_WARNING, "Remounting file system with no journal so ignoring journalled data option"); 20785f3633e3SJan Kara else if (test_opt(sb, DATA_FLAGS) != m->mount_opt) { 207926092bf5STheodore Ts'o ext4_msg(sb, KERN_ERR, 208026092bf5STheodore Ts'o "Cannot change data mode on remount"); 208126092bf5STheodore Ts'o return -1; 208226092bf5STheodore Ts'o } 208326092bf5STheodore Ts'o } else { 208426092bf5STheodore Ts'o clear_opt(sb, DATA_FLAGS); 208526092bf5STheodore Ts'o sbi->s_mount_opt |= m->mount_opt; 208626092bf5STheodore Ts'o } 208726092bf5STheodore Ts'o #ifdef CONFIG_QUOTA 208826092bf5STheodore Ts'o } else if (m->flags & MOPT_QFMT) { 208926092bf5STheodore Ts'o if (sb_any_quota_loaded(sb) && 209026092bf5STheodore Ts'o sbi->s_jquota_fmt != m->mount_opt) { 20915f3633e3SJan Kara ext4_msg(sb, KERN_ERR, "Cannot change journaled " 20925f3633e3SJan Kara "quota options when quota turned on"); 209326092bf5STheodore Ts'o return -1; 209426092bf5STheodore Ts'o } 2095e2b911c5SDarrick J. Wong if (ext4_has_feature_quota(sb)) { 2096c325a67cSTheodore Ts'o ext4_msg(sb, KERN_INFO, 2097c325a67cSTheodore Ts'o "Quota format mount options ignored " 2098262b4662SJan Kara "when QUOTA feature is enabled"); 2099c325a67cSTheodore Ts'o return 1; 2100262b4662SJan Kara } 210126092bf5STheodore Ts'o sbi->s_jquota_fmt = m->mount_opt; 210226092bf5STheodore Ts'o #endif 2103923ae0ffSRoss Zwisler } else if (token == Opt_dax) { 2104ef83b6e8SDan Williams #ifdef CONFIG_FS_DAX 2105ef83b6e8SDan Williams ext4_msg(sb, KERN_WARNING, 2106ef83b6e8SDan Williams "DAX enabled. Warning: EXPERIMENTAL, use at your own risk"); 2107ef83b6e8SDan Williams sbi->s_mount_opt |= m->mount_opt; 2108ef83b6e8SDan Williams #else 2109923ae0ffSRoss Zwisler ext4_msg(sb, KERN_INFO, "dax option not supported"); 2110923ae0ffSRoss Zwisler return -1; 2111923ae0ffSRoss Zwisler #endif 21127915a861SAles Novak } else if (token == Opt_data_err_abort) { 21137915a861SAles Novak sbi->s_mount_opt |= m->mount_opt; 21147915a861SAles Novak } else if (token == Opt_data_err_ignore) { 21157915a861SAles Novak sbi->s_mount_opt &= ~m->mount_opt; 211626092bf5STheodore Ts'o } else { 211726092bf5STheodore Ts'o if (!args->from) 211826092bf5STheodore Ts'o arg = 1; 211926092bf5STheodore Ts'o if (m->flags & MOPT_CLEAR) 212026092bf5STheodore Ts'o arg = !arg; 212126092bf5STheodore Ts'o else if (unlikely(!(m->flags & MOPT_SET))) { 212226092bf5STheodore Ts'o ext4_msg(sb, KERN_WARNING, 212326092bf5STheodore Ts'o "buggy handling of option %s", opt); 212426092bf5STheodore Ts'o WARN_ON(1); 212526092bf5STheodore Ts'o return -1; 212626092bf5STheodore Ts'o } 212726092bf5STheodore Ts'o if (arg != 0) 212826092bf5STheodore Ts'o sbi->s_mount_opt |= m->mount_opt; 212926092bf5STheodore Ts'o else 213026092bf5STheodore Ts'o sbi->s_mount_opt &= ~m->mount_opt; 213126092bf5STheodore Ts'o } 213226092bf5STheodore Ts'o return 1; 213326092bf5STheodore Ts'o } 213426092bf5STheodore Ts'o 2135ac27a0ecSDave Kleikamp static int parse_options(char *options, struct super_block *sb, 2136c3191067STheodore Ts'o unsigned long *journal_devnum, 2137b3881f74STheodore Ts'o unsigned int *journal_ioprio, 2138661aa520SEric Sandeen int is_remount) 2139ac27a0ecSDave Kleikamp { 21401e1a76edSOlof Johansson struct ext4_sb_info __maybe_unused *sbi = EXT4_SB(sb); 214133458eabSTheodore Ts'o char *p, __maybe_unused *usr_qf_name, __maybe_unused *grp_qf_name; 2142ac27a0ecSDave Kleikamp substring_t args[MAX_OPT_ARGS]; 214326092bf5STheodore Ts'o int token; 2144ac27a0ecSDave Kleikamp 2145ac27a0ecSDave Kleikamp if (!options) 2146ac27a0ecSDave Kleikamp return 1; 2147ac27a0ecSDave Kleikamp 2148ac27a0ecSDave Kleikamp while ((p = strsep(&options, ",")) != NULL) { 2149ac27a0ecSDave Kleikamp if (!*p) 2150ac27a0ecSDave Kleikamp continue; 215115121c18SEric Sandeen /* 215215121c18SEric Sandeen * Initialize args struct so we know whether arg was 215315121c18SEric Sandeen * found; some options take optional arguments. 215415121c18SEric Sandeen */ 2155caecd0afSSachin Kamat args[0].to = args[0].from = NULL; 2156ac27a0ecSDave Kleikamp token = match_token(p, tokens, args); 215726092bf5STheodore Ts'o if (handle_mount_opt(sb, p, token, args, journal_devnum, 215826092bf5STheodore Ts'o journal_ioprio, is_remount) < 0) 2159ac27a0ecSDave Kleikamp return 0; 2160ac27a0ecSDave Kleikamp } 2161ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA 216249da9392SJan Kara /* 216349da9392SJan Kara * We do the test below only for project quotas. 'usrquota' and 216449da9392SJan Kara * 'grpquota' mount options are allowed even without quota feature 216549da9392SJan Kara * to support legacy quotas in quota files. 216649da9392SJan Kara */ 216749da9392SJan Kara if (test_opt(sb, PRJQUOTA) && !ext4_has_feature_project(sb)) { 216849da9392SJan Kara ext4_msg(sb, KERN_ERR, "Project quota feature not enabled. " 216949da9392SJan Kara "Cannot enable project quota enforcement."); 217049da9392SJan Kara return 0; 217149da9392SJan Kara } 217233458eabSTheodore Ts'o usr_qf_name = get_qf_name(sb, sbi, USRQUOTA); 217333458eabSTheodore Ts'o grp_qf_name = get_qf_name(sb, sbi, GRPQUOTA); 217433458eabSTheodore Ts'o if (usr_qf_name || grp_qf_name) { 217533458eabSTheodore Ts'o if (test_opt(sb, USRQUOTA) && usr_qf_name) 2176fd8c37ecSTheodore Ts'o clear_opt(sb, USRQUOTA); 2177ac27a0ecSDave Kleikamp 217833458eabSTheodore Ts'o if (test_opt(sb, GRPQUOTA) && grp_qf_name) 2179fd8c37ecSTheodore Ts'o clear_opt(sb, GRPQUOTA); 2180ac27a0ecSDave Kleikamp 218156c50f11SDmitry Monakhov if (test_opt(sb, GRPQUOTA) || test_opt(sb, USRQUOTA)) { 2182b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "old and new quota " 2183b31e1552SEric Sandeen "format mixing"); 2184ac27a0ecSDave Kleikamp return 0; 2185ac27a0ecSDave Kleikamp } 2186ac27a0ecSDave Kleikamp 2187ac27a0ecSDave Kleikamp if (!sbi->s_jquota_fmt) { 2188b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "journaled quota format " 2189b31e1552SEric Sandeen "not specified"); 2190ac27a0ecSDave Kleikamp return 0; 2191ac27a0ecSDave Kleikamp } 2192ac27a0ecSDave Kleikamp } 2193ac27a0ecSDave Kleikamp #endif 2194ac27a0ecSDave Kleikamp return 1; 2195ac27a0ecSDave Kleikamp } 2196ac27a0ecSDave Kleikamp 21972adf6da8STheodore Ts'o static inline void ext4_show_quota_options(struct seq_file *seq, 21982adf6da8STheodore Ts'o struct super_block *sb) 21992adf6da8STheodore Ts'o { 22002adf6da8STheodore Ts'o #if defined(CONFIG_QUOTA) 22012adf6da8STheodore Ts'o struct ext4_sb_info *sbi = EXT4_SB(sb); 220233458eabSTheodore Ts'o char *usr_qf_name, *grp_qf_name; 22032adf6da8STheodore Ts'o 22042adf6da8STheodore Ts'o if (sbi->s_jquota_fmt) { 22052adf6da8STheodore Ts'o char *fmtname = ""; 22062adf6da8STheodore Ts'o 22072adf6da8STheodore Ts'o switch (sbi->s_jquota_fmt) { 22082adf6da8STheodore Ts'o case QFMT_VFS_OLD: 22092adf6da8STheodore Ts'o fmtname = "vfsold"; 22102adf6da8STheodore Ts'o break; 22112adf6da8STheodore Ts'o case QFMT_VFS_V0: 22122adf6da8STheodore Ts'o fmtname = "vfsv0"; 22132adf6da8STheodore Ts'o break; 22142adf6da8STheodore Ts'o case QFMT_VFS_V1: 22152adf6da8STheodore Ts'o fmtname = "vfsv1"; 22162adf6da8STheodore Ts'o break; 22172adf6da8STheodore Ts'o } 22182adf6da8STheodore Ts'o seq_printf(seq, ",jqfmt=%s", fmtname); 22192adf6da8STheodore Ts'o } 22202adf6da8STheodore Ts'o 222133458eabSTheodore Ts'o rcu_read_lock(); 222233458eabSTheodore Ts'o usr_qf_name = rcu_dereference(sbi->s_qf_names[USRQUOTA]); 222333458eabSTheodore Ts'o grp_qf_name = rcu_dereference(sbi->s_qf_names[GRPQUOTA]); 222433458eabSTheodore Ts'o if (usr_qf_name) 222533458eabSTheodore Ts'o seq_show_option(seq, "usrjquota", usr_qf_name); 222633458eabSTheodore Ts'o if (grp_qf_name) 222733458eabSTheodore Ts'o seq_show_option(seq, "grpjquota", grp_qf_name); 222833458eabSTheodore Ts'o rcu_read_unlock(); 22292adf6da8STheodore Ts'o #endif 22302adf6da8STheodore Ts'o } 22312adf6da8STheodore Ts'o 22325a916be1STheodore Ts'o static const char *token2str(int token) 22335a916be1STheodore Ts'o { 223450df9fd5SHerton Ronaldo Krzesinski const struct match_token *t; 22355a916be1STheodore Ts'o 22365a916be1STheodore Ts'o for (t = tokens; t->token != Opt_err; t++) 22375a916be1STheodore Ts'o if (t->token == token && !strchr(t->pattern, '=')) 22385a916be1STheodore Ts'o break; 22395a916be1STheodore Ts'o return t->pattern; 22405a916be1STheodore Ts'o } 22415a916be1STheodore Ts'o 22422adf6da8STheodore Ts'o /* 22432adf6da8STheodore Ts'o * Show an option if 22442adf6da8STheodore Ts'o * - it's set to a non-default value OR 22452adf6da8STheodore Ts'o * - if the per-sb default is different from the global default 22462adf6da8STheodore Ts'o */ 224766acdcf4STheodore Ts'o static int _ext4_show_options(struct seq_file *seq, struct super_block *sb, 224866acdcf4STheodore Ts'o int nodefs) 22492adf6da8STheodore Ts'o { 22502adf6da8STheodore Ts'o struct ext4_sb_info *sbi = EXT4_SB(sb); 22512adf6da8STheodore Ts'o struct ext4_super_block *es = sbi->s_es; 225268afa7e0STyson Nottingham int def_errors, def_mount_opt = sbi->s_def_mount_opt; 22535a916be1STheodore Ts'o const struct mount_opts *m; 225466acdcf4STheodore Ts'o char sep = nodefs ? '\n' : ','; 22552adf6da8STheodore Ts'o 225666acdcf4STheodore Ts'o #define SEQ_OPTS_PUTS(str) seq_printf(seq, "%c" str, sep) 225766acdcf4STheodore Ts'o #define SEQ_OPTS_PRINT(str, arg) seq_printf(seq, "%c" str, sep, arg) 22582adf6da8STheodore Ts'o 22592adf6da8STheodore Ts'o if (sbi->s_sb_block != 1) 22605a916be1STheodore Ts'o SEQ_OPTS_PRINT("sb=%llu", sbi->s_sb_block); 22615a916be1STheodore Ts'o 22625a916be1STheodore Ts'o for (m = ext4_mount_opts; m->token != Opt_err; m++) { 22635a916be1STheodore Ts'o int want_set = m->flags & MOPT_SET; 22645a916be1STheodore Ts'o if (((m->flags & (MOPT_SET|MOPT_CLEAR)) == 0) || 22655a916be1STheodore Ts'o (m->flags & MOPT_CLEAR_ERR)) 22665a916be1STheodore Ts'o continue; 226768afa7e0STyson Nottingham if (!nodefs && !(m->mount_opt & (sbi->s_mount_opt ^ def_mount_opt))) 22685a916be1STheodore Ts'o continue; /* skip if same as the default */ 22695a916be1STheodore Ts'o if ((want_set && 22705a916be1STheodore Ts'o (sbi->s_mount_opt & m->mount_opt) != m->mount_opt) || 22715a916be1STheodore Ts'o (!want_set && (sbi->s_mount_opt & m->mount_opt))) 22725a916be1STheodore Ts'o continue; /* select Opt_noFoo vs Opt_Foo */ 22735a916be1STheodore Ts'o SEQ_OPTS_PRINT("%s", token2str(m->token)); 22745a916be1STheodore Ts'o } 22755a916be1STheodore Ts'o 227608cefc7aSEric W. Biederman if (nodefs || !uid_eq(sbi->s_resuid, make_kuid(&init_user_ns, EXT4_DEF_RESUID)) || 22775a916be1STheodore Ts'o le16_to_cpu(es->s_def_resuid) != EXT4_DEF_RESUID) 227808cefc7aSEric W. Biederman SEQ_OPTS_PRINT("resuid=%u", 227908cefc7aSEric W. Biederman from_kuid_munged(&init_user_ns, sbi->s_resuid)); 228008cefc7aSEric W. Biederman if (nodefs || !gid_eq(sbi->s_resgid, make_kgid(&init_user_ns, EXT4_DEF_RESGID)) || 22815a916be1STheodore Ts'o le16_to_cpu(es->s_def_resgid) != EXT4_DEF_RESGID) 228208cefc7aSEric W. Biederman SEQ_OPTS_PRINT("resgid=%u", 228308cefc7aSEric W. Biederman from_kgid_munged(&init_user_ns, sbi->s_resgid)); 228466acdcf4STheodore Ts'o def_errors = nodefs ? -1 : le16_to_cpu(es->s_errors); 22855a916be1STheodore Ts'o if (test_opt(sb, ERRORS_RO) && def_errors != EXT4_ERRORS_RO) 22865a916be1STheodore Ts'o SEQ_OPTS_PUTS("errors=remount-ro"); 22872adf6da8STheodore Ts'o if (test_opt(sb, ERRORS_CONT) && def_errors != EXT4_ERRORS_CONTINUE) 22885a916be1STheodore Ts'o SEQ_OPTS_PUTS("errors=continue"); 22892adf6da8STheodore Ts'o if (test_opt(sb, ERRORS_PANIC) && def_errors != EXT4_ERRORS_PANIC) 22905a916be1STheodore Ts'o SEQ_OPTS_PUTS("errors=panic"); 229166acdcf4STheodore Ts'o if (nodefs || sbi->s_commit_interval != JBD2_DEFAULT_MAX_COMMIT_AGE*HZ) 22925a916be1STheodore Ts'o SEQ_OPTS_PRINT("commit=%lu", sbi->s_commit_interval / HZ); 229366acdcf4STheodore Ts'o if (nodefs || sbi->s_min_batch_time != EXT4_DEF_MIN_BATCH_TIME) 22945a916be1STheodore Ts'o SEQ_OPTS_PRINT("min_batch_time=%u", sbi->s_min_batch_time); 229566acdcf4STheodore Ts'o if (nodefs || sbi->s_max_batch_time != EXT4_DEF_MAX_BATCH_TIME) 22965a916be1STheodore Ts'o SEQ_OPTS_PRINT("max_batch_time=%u", sbi->s_max_batch_time); 2297357fdad0SMatthew Garrett if (sb->s_flags & SB_I_VERSION) 22985a916be1STheodore Ts'o SEQ_OPTS_PUTS("i_version"); 229966acdcf4STheodore Ts'o if (nodefs || sbi->s_stripe) 23005a916be1STheodore Ts'o SEQ_OPTS_PRINT("stripe=%lu", sbi->s_stripe); 230168afa7e0STyson Nottingham if (nodefs || EXT4_MOUNT_DATA_FLAGS & 230268afa7e0STyson Nottingham (sbi->s_mount_opt ^ def_mount_opt)) { 23032adf6da8STheodore Ts'o if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_JOURNAL_DATA) 23045a916be1STheodore Ts'o SEQ_OPTS_PUTS("data=journal"); 23052adf6da8STheodore Ts'o else if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_ORDERED_DATA) 23065a916be1STheodore Ts'o SEQ_OPTS_PUTS("data=ordered"); 23072adf6da8STheodore Ts'o else if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_WRITEBACK_DATA) 23085a916be1STheodore Ts'o SEQ_OPTS_PUTS("data=writeback"); 23095a916be1STheodore Ts'o } 231066acdcf4STheodore Ts'o if (nodefs || 231166acdcf4STheodore Ts'o sbi->s_inode_readahead_blks != EXT4_DEF_INODE_READAHEAD_BLKS) 23125a916be1STheodore Ts'o SEQ_OPTS_PRINT("inode_readahead_blks=%u", 23132adf6da8STheodore Ts'o sbi->s_inode_readahead_blks); 23142adf6da8STheodore Ts'o 2315ceec0376STyson Nottingham if (test_opt(sb, INIT_INODE_TABLE) && (nodefs || 231666acdcf4STheodore Ts'o (sbi->s_li_wait_mult != EXT4_DEF_LI_WAIT_MULT))) 23175a916be1STheodore Ts'o SEQ_OPTS_PRINT("init_itable=%u", sbi->s_li_wait_mult); 2318df981d03STheodore Ts'o if (nodefs || sbi->s_max_dir_size_kb) 2319df981d03STheodore Ts'o SEQ_OPTS_PRINT("max_dir_size_kb=%u", sbi->s_max_dir_size_kb); 23207915a861SAles Novak if (test_opt(sb, DATA_ERR_ABORT)) 23217915a861SAles Novak SEQ_OPTS_PUTS("data_err=abort"); 2322338affb5SEric Biggers if (DUMMY_ENCRYPTION_ENABLED(sbi)) 2323338affb5SEric Biggers SEQ_OPTS_PUTS("test_dummy_encryption"); 23242adf6da8STheodore Ts'o 23252adf6da8STheodore Ts'o ext4_show_quota_options(seq, sb); 23262adf6da8STheodore Ts'o return 0; 23272adf6da8STheodore Ts'o } 23282adf6da8STheodore Ts'o 232966acdcf4STheodore Ts'o static int ext4_show_options(struct seq_file *seq, struct dentry *root) 233066acdcf4STheodore Ts'o { 233166acdcf4STheodore Ts'o return _ext4_show_options(seq, root->d_sb, 0); 233266acdcf4STheodore Ts'o } 233366acdcf4STheodore Ts'o 2334ebd173beSTheodore Ts'o int ext4_seq_options_show(struct seq_file *seq, void *offset) 233566acdcf4STheodore Ts'o { 233666acdcf4STheodore Ts'o struct super_block *sb = seq->private; 233766acdcf4STheodore Ts'o int rc; 233866acdcf4STheodore Ts'o 2339bc98a42cSDavid Howells seq_puts(seq, sb_rdonly(sb) ? "ro" : "rw"); 234066acdcf4STheodore Ts'o rc = _ext4_show_options(seq, sb, 1); 234166acdcf4STheodore Ts'o seq_puts(seq, "\n"); 234266acdcf4STheodore Ts'o return rc; 234366acdcf4STheodore Ts'o } 234466acdcf4STheodore Ts'o 2345617ba13bSMingming Cao static int ext4_setup_super(struct super_block *sb, struct ext4_super_block *es, 2346ac27a0ecSDave Kleikamp int read_only) 2347ac27a0ecSDave Kleikamp { 2348617ba13bSMingming Cao struct ext4_sb_info *sbi = EXT4_SB(sb); 2349c89128a0SJaegeuk Kim int err = 0; 2350ac27a0ecSDave Kleikamp 2351617ba13bSMingming Cao if (le32_to_cpu(es->s_rev_level) > EXT4_MAX_SUPP_REV) { 2352b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "revision level too high, " 2353b31e1552SEric Sandeen "forcing read-only mode"); 2354c89128a0SJaegeuk Kim err = -EROFS; 2355ac27a0ecSDave Kleikamp } 2356ac27a0ecSDave Kleikamp if (read_only) 2357281b5995STheodore Ts'o goto done; 2358617ba13bSMingming Cao if (!(sbi->s_mount_state & EXT4_VALID_FS)) 2359b31e1552SEric Sandeen ext4_msg(sb, KERN_WARNING, "warning: mounting unchecked fs, " 2360b31e1552SEric Sandeen "running e2fsck is recommended"); 2361c8b459f4SLukas Czerner else if (sbi->s_mount_state & EXT4_ERROR_FS) 2362b31e1552SEric Sandeen ext4_msg(sb, KERN_WARNING, 2363b31e1552SEric Sandeen "warning: mounting fs with errors, " 2364b31e1552SEric Sandeen "running e2fsck is recommended"); 2365ed3ce80aSTao Ma else if ((__s16) le16_to_cpu(es->s_max_mnt_count) > 0 && 2366ac27a0ecSDave Kleikamp le16_to_cpu(es->s_mnt_count) >= 2367ac27a0ecSDave Kleikamp (unsigned short) (__s16) le16_to_cpu(es->s_max_mnt_count)) 2368b31e1552SEric Sandeen ext4_msg(sb, KERN_WARNING, 2369b31e1552SEric Sandeen "warning: maximal mount count reached, " 2370b31e1552SEric Sandeen "running e2fsck is recommended"); 2371ac27a0ecSDave Kleikamp else if (le32_to_cpu(es->s_checkinterval) && 23726a0678a7SArnd Bergmann (ext4_get_tstamp(es, s_lastcheck) + 23736a0678a7SArnd Bergmann le32_to_cpu(es->s_checkinterval) <= ktime_get_real_seconds())) 2374b31e1552SEric Sandeen ext4_msg(sb, KERN_WARNING, 2375b31e1552SEric Sandeen "warning: checktime reached, " 2376b31e1552SEric Sandeen "running e2fsck is recommended"); 23770390131bSFrank Mayhar if (!sbi->s_journal) 2378216c34b2SMarcin Slusarz es->s_state &= cpu_to_le16(~EXT4_VALID_FS); 2379ac27a0ecSDave Kleikamp if (!(__s16) le16_to_cpu(es->s_max_mnt_count)) 2380617ba13bSMingming Cao es->s_max_mnt_count = cpu_to_le16(EXT4_DFL_MAX_MNT_COUNT); 2381e8546d06SMarcin Slusarz le16_add_cpu(&es->s_mnt_count, 1); 23826a0678a7SArnd Bergmann ext4_update_tstamp(es, s_mtime); 23830390131bSFrank Mayhar if (sbi->s_journal) 2384e2b911c5SDarrick J. Wong ext4_set_feature_journal_needs_recovery(sb); 2385ac27a0ecSDave Kleikamp 2386c89128a0SJaegeuk Kim err = ext4_commit_super(sb, 1); 2387281b5995STheodore Ts'o done: 2388ac27a0ecSDave Kleikamp if (test_opt(sb, DEBUG)) 2389a9df9a49STheodore Ts'o printk(KERN_INFO "[EXT4 FS bs=%lu, gc=%u, " 2390a2595b8aSTheodore Ts'o "bpg=%lu, ipg=%lu, mo=%04x, mo2=%04x]\n", 2391ac27a0ecSDave Kleikamp sb->s_blocksize, 2392ac27a0ecSDave Kleikamp sbi->s_groups_count, 2393617ba13bSMingming Cao EXT4_BLOCKS_PER_GROUP(sb), 2394617ba13bSMingming Cao EXT4_INODES_PER_GROUP(sb), 2395a2595b8aSTheodore Ts'o sbi->s_mount_opt, sbi->s_mount_opt2); 2396ac27a0ecSDave Kleikamp 23977abc52c2SDan Magenheimer cleancache_init_fs(sb); 2398c89128a0SJaegeuk Kim return err; 2399ac27a0ecSDave Kleikamp } 2400ac27a0ecSDave Kleikamp 2401117fff10STheodore Ts'o int ext4_alloc_flex_bg_array(struct super_block *sb, ext4_group_t ngroup) 2402117fff10STheodore Ts'o { 2403117fff10STheodore Ts'o struct ext4_sb_info *sbi = EXT4_SB(sb); 2404117fff10STheodore Ts'o struct flex_groups *new_groups; 2405117fff10STheodore Ts'o int size; 2406117fff10STheodore Ts'o 2407117fff10STheodore Ts'o if (!sbi->s_log_groups_per_flex) 2408117fff10STheodore Ts'o return 0; 2409117fff10STheodore Ts'o 2410117fff10STheodore Ts'o size = ext4_flex_group(sbi, ngroup - 1) + 1; 2411117fff10STheodore Ts'o if (size <= sbi->s_flex_groups_allocated) 2412117fff10STheodore Ts'o return 0; 2413117fff10STheodore Ts'o 2414117fff10STheodore Ts'o size = roundup_pow_of_two(size * sizeof(struct flex_groups)); 2415a7c3e901SMichal Hocko new_groups = kvzalloc(size, GFP_KERNEL); 2416117fff10STheodore Ts'o if (!new_groups) { 2417117fff10STheodore Ts'o ext4_msg(sb, KERN_ERR, "not enough memory for %d flex groups", 2418117fff10STheodore Ts'o size / (int) sizeof(struct flex_groups)); 2419117fff10STheodore Ts'o return -ENOMEM; 2420117fff10STheodore Ts'o } 2421117fff10STheodore Ts'o 2422117fff10STheodore Ts'o if (sbi->s_flex_groups) { 2423117fff10STheodore Ts'o memcpy(new_groups, sbi->s_flex_groups, 2424117fff10STheodore Ts'o (sbi->s_flex_groups_allocated * 2425117fff10STheodore Ts'o sizeof(struct flex_groups))); 2426b93b41d4SAl Viro kvfree(sbi->s_flex_groups); 2427117fff10STheodore Ts'o } 2428117fff10STheodore Ts'o sbi->s_flex_groups = new_groups; 2429117fff10STheodore Ts'o sbi->s_flex_groups_allocated = size / sizeof(struct flex_groups); 2430117fff10STheodore Ts'o return 0; 2431117fff10STheodore Ts'o } 2432117fff10STheodore Ts'o 2433772cb7c8SJose R. Santos static int ext4_fill_flex_info(struct super_block *sb) 2434772cb7c8SJose R. Santos { 2435772cb7c8SJose R. Santos struct ext4_sb_info *sbi = EXT4_SB(sb); 2436772cb7c8SJose R. Santos struct ext4_group_desc *gdp = NULL; 2437772cb7c8SJose R. Santos ext4_group_t flex_group; 2438117fff10STheodore Ts'o int i, err; 2439772cb7c8SJose R. Santos 2440503358aeSTheodore Ts'o sbi->s_log_groups_per_flex = sbi->s_es->s_log_groups_per_flex; 2441d50f2ab6SXi Wang if (sbi->s_log_groups_per_flex < 1 || sbi->s_log_groups_per_flex > 31) { 2442772cb7c8SJose R. Santos sbi->s_log_groups_per_flex = 0; 2443772cb7c8SJose R. Santos return 1; 2444772cb7c8SJose R. Santos } 2445772cb7c8SJose R. Santos 2446117fff10STheodore Ts'o err = ext4_alloc_flex_bg_array(sb, sbi->s_groups_count); 2447117fff10STheodore Ts'o if (err) 2448772cb7c8SJose R. Santos goto failed; 2449772cb7c8SJose R. Santos 2450772cb7c8SJose R. Santos for (i = 0; i < sbi->s_groups_count; i++) { 245188b6edd1STheodore Ts'o gdp = ext4_get_group_desc(sb, i, NULL); 2452772cb7c8SJose R. Santos 2453772cb7c8SJose R. Santos flex_group = ext4_flex_group(sbi, i); 24547ad9bb65STheodore Ts'o atomic_add(ext4_free_inodes_count(sb, gdp), 24557ad9bb65STheodore Ts'o &sbi->s_flex_groups[flex_group].free_inodes); 245690ba983fSTheodore Ts'o atomic64_add(ext4_free_group_clusters(sb, gdp), 245724aaa8efSTheodore Ts'o &sbi->s_flex_groups[flex_group].free_clusters); 24587ad9bb65STheodore Ts'o atomic_add(ext4_used_dirs_count(sb, gdp), 24597ad9bb65STheodore Ts'o &sbi->s_flex_groups[flex_group].used_dirs); 2460772cb7c8SJose R. Santos } 2461772cb7c8SJose R. Santos 2462772cb7c8SJose R. Santos return 1; 2463772cb7c8SJose R. Santos failed: 2464772cb7c8SJose R. Santos return 0; 2465772cb7c8SJose R. Santos } 2466772cb7c8SJose R. Santos 2467e2b911c5SDarrick J. Wong static __le16 ext4_group_desc_csum(struct super_block *sb, __u32 block_group, 2468717d50e4SAndreas Dilger struct ext4_group_desc *gdp) 2469717d50e4SAndreas Dilger { 2470b47820edSDaeho Jeong int offset = offsetof(struct ext4_group_desc, bg_checksum); 2471717d50e4SAndreas Dilger __u16 crc = 0; 2472717d50e4SAndreas Dilger __le32 le_group = cpu_to_le32(block_group); 2473e2b911c5SDarrick J. Wong struct ext4_sb_info *sbi = EXT4_SB(sb); 2474717d50e4SAndreas Dilger 24759aa5d32bSDmitry Monakhov if (ext4_has_metadata_csum(sbi->s_sb)) { 2476feb0ab32SDarrick J. Wong /* Use new metadata_csum algorithm */ 2477feb0ab32SDarrick J. Wong __u32 csum32; 2478b47820edSDaeho Jeong __u16 dummy_csum = 0; 2479feb0ab32SDarrick J. Wong 2480feb0ab32SDarrick J. Wong csum32 = ext4_chksum(sbi, sbi->s_csum_seed, (__u8 *)&le_group, 2481feb0ab32SDarrick J. Wong sizeof(le_group)); 2482b47820edSDaeho Jeong csum32 = ext4_chksum(sbi, csum32, (__u8 *)gdp, offset); 2483b47820edSDaeho Jeong csum32 = ext4_chksum(sbi, csum32, (__u8 *)&dummy_csum, 2484b47820edSDaeho Jeong sizeof(dummy_csum)); 2485b47820edSDaeho Jeong offset += sizeof(dummy_csum); 2486b47820edSDaeho Jeong if (offset < sbi->s_desc_size) 2487b47820edSDaeho Jeong csum32 = ext4_chksum(sbi, csum32, (__u8 *)gdp + offset, 2488b47820edSDaeho Jeong sbi->s_desc_size - offset); 2489feb0ab32SDarrick J. Wong 2490feb0ab32SDarrick J. Wong crc = csum32 & 0xFFFF; 2491feb0ab32SDarrick J. Wong goto out; 2492feb0ab32SDarrick J. Wong } 2493feb0ab32SDarrick J. Wong 2494feb0ab32SDarrick J. Wong /* old crc16 code */ 2495e2b911c5SDarrick J. Wong if (!ext4_has_feature_gdt_csum(sb)) 2496813d32f9SDarrick J. Wong return 0; 2497813d32f9SDarrick J. Wong 2498717d50e4SAndreas Dilger crc = crc16(~0, sbi->s_es->s_uuid, sizeof(sbi->s_es->s_uuid)); 2499717d50e4SAndreas Dilger crc = crc16(crc, (__u8 *)&le_group, sizeof(le_group)); 2500717d50e4SAndreas Dilger crc = crc16(crc, (__u8 *)gdp, offset); 2501717d50e4SAndreas Dilger offset += sizeof(gdp->bg_checksum); /* skip checksum */ 2502717d50e4SAndreas Dilger /* for checksum of struct ext4_group_desc do the rest...*/ 2503e2b911c5SDarrick J. Wong if (ext4_has_feature_64bit(sb) && 2504717d50e4SAndreas Dilger offset < le16_to_cpu(sbi->s_es->s_desc_size)) 2505717d50e4SAndreas Dilger crc = crc16(crc, (__u8 *)gdp + offset, 2506717d50e4SAndreas Dilger le16_to_cpu(sbi->s_es->s_desc_size) - 2507717d50e4SAndreas Dilger offset); 2508717d50e4SAndreas Dilger 2509feb0ab32SDarrick J. Wong out: 2510717d50e4SAndreas Dilger return cpu_to_le16(crc); 2511717d50e4SAndreas Dilger } 2512717d50e4SAndreas Dilger 2513feb0ab32SDarrick J. Wong int ext4_group_desc_csum_verify(struct super_block *sb, __u32 block_group, 2514717d50e4SAndreas Dilger struct ext4_group_desc *gdp) 2515717d50e4SAndreas Dilger { 2516feb0ab32SDarrick J. Wong if (ext4_has_group_desc_csum(sb) && 2517e2b911c5SDarrick J. Wong (gdp->bg_checksum != ext4_group_desc_csum(sb, block_group, gdp))) 2518717d50e4SAndreas Dilger return 0; 2519717d50e4SAndreas Dilger 2520717d50e4SAndreas Dilger return 1; 2521717d50e4SAndreas Dilger } 2522717d50e4SAndreas Dilger 2523feb0ab32SDarrick J. Wong void ext4_group_desc_csum_set(struct super_block *sb, __u32 block_group, 2524feb0ab32SDarrick J. Wong struct ext4_group_desc *gdp) 2525feb0ab32SDarrick J. Wong { 2526feb0ab32SDarrick J. Wong if (!ext4_has_group_desc_csum(sb)) 2527feb0ab32SDarrick J. Wong return; 2528e2b911c5SDarrick J. Wong gdp->bg_checksum = ext4_group_desc_csum(sb, block_group, gdp); 2529feb0ab32SDarrick J. Wong } 2530feb0ab32SDarrick J. Wong 2531ac27a0ecSDave Kleikamp /* Called at mount-time, super-block is locked */ 2532bfff6873SLukas Czerner static int ext4_check_descriptors(struct super_block *sb, 2533829fa70dSTheodore Ts'o ext4_fsblk_t sb_block, 2534bfff6873SLukas Czerner ext4_group_t *first_not_zeroed) 2535ac27a0ecSDave Kleikamp { 2536617ba13bSMingming Cao struct ext4_sb_info *sbi = EXT4_SB(sb); 2537617ba13bSMingming Cao ext4_fsblk_t first_block = le32_to_cpu(sbi->s_es->s_first_data_block); 2538617ba13bSMingming Cao ext4_fsblk_t last_block; 253944de022cSTheodore Ts'o ext4_fsblk_t last_bg_block = sb_block + ext4_bg_num_gdb(sb, 0); 2540bd81d8eeSLaurent Vivier ext4_fsblk_t block_bitmap; 2541bd81d8eeSLaurent Vivier ext4_fsblk_t inode_bitmap; 2542bd81d8eeSLaurent Vivier ext4_fsblk_t inode_table; 2543ce421581SJose R. Santos int flexbg_flag = 0; 2544bfff6873SLukas Czerner ext4_group_t i, grp = sbi->s_groups_count; 2545ac27a0ecSDave Kleikamp 2546e2b911c5SDarrick J. Wong if (ext4_has_feature_flex_bg(sb)) 2547ce421581SJose R. Santos flexbg_flag = 1; 2548ce421581SJose R. Santos 2549617ba13bSMingming Cao ext4_debug("Checking group descriptors"); 2550ac27a0ecSDave Kleikamp 2551197cd65aSAkinobu Mita for (i = 0; i < sbi->s_groups_count; i++) { 2552197cd65aSAkinobu Mita struct ext4_group_desc *gdp = ext4_get_group_desc(sb, i, NULL); 2553197cd65aSAkinobu Mita 2554ce421581SJose R. Santos if (i == sbi->s_groups_count - 1 || flexbg_flag) 2555bd81d8eeSLaurent Vivier last_block = ext4_blocks_count(sbi->s_es) - 1; 2556ac27a0ecSDave Kleikamp else 2557ac27a0ecSDave Kleikamp last_block = first_block + 2558617ba13bSMingming Cao (EXT4_BLOCKS_PER_GROUP(sb) - 1); 2559ac27a0ecSDave Kleikamp 2560bfff6873SLukas Czerner if ((grp == sbi->s_groups_count) && 2561bfff6873SLukas Czerner !(gdp->bg_flags & cpu_to_le16(EXT4_BG_INODE_ZEROED))) 2562bfff6873SLukas Czerner grp = i; 2563bfff6873SLukas Czerner 25648fadc143SAlexandre Ratchov block_bitmap = ext4_block_bitmap(sb, gdp); 2565829fa70dSTheodore Ts'o if (block_bitmap == sb_block) { 2566829fa70dSTheodore Ts'o ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: " 2567829fa70dSTheodore Ts'o "Block bitmap for group %u overlaps " 2568829fa70dSTheodore Ts'o "superblock", i); 256918db4b4eSTheodore Ts'o if (!sb_rdonly(sb)) 257018db4b4eSTheodore Ts'o return 0; 2571829fa70dSTheodore Ts'o } 257277260807STheodore Ts'o if (block_bitmap >= sb_block + 1 && 257377260807STheodore Ts'o block_bitmap <= last_bg_block) { 257477260807STheodore Ts'o ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: " 257577260807STheodore Ts'o "Block bitmap for group %u overlaps " 257677260807STheodore Ts'o "block group descriptors", i); 257777260807STheodore Ts'o if (!sb_rdonly(sb)) 257877260807STheodore Ts'o return 0; 257977260807STheodore Ts'o } 25802b2d6d01STheodore Ts'o if (block_bitmap < first_block || block_bitmap > last_block) { 2581b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: " 2582a9df9a49STheodore Ts'o "Block bitmap for group %u not in group " 2583b31e1552SEric Sandeen "(block %llu)!", i, block_bitmap); 2584ac27a0ecSDave Kleikamp return 0; 2585ac27a0ecSDave Kleikamp } 25868fadc143SAlexandre Ratchov inode_bitmap = ext4_inode_bitmap(sb, gdp); 2587829fa70dSTheodore Ts'o if (inode_bitmap == sb_block) { 2588829fa70dSTheodore Ts'o ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: " 2589829fa70dSTheodore Ts'o "Inode bitmap for group %u overlaps " 2590829fa70dSTheodore Ts'o "superblock", i); 259118db4b4eSTheodore Ts'o if (!sb_rdonly(sb)) 259218db4b4eSTheodore Ts'o return 0; 2593829fa70dSTheodore Ts'o } 259477260807STheodore Ts'o if (inode_bitmap >= sb_block + 1 && 259577260807STheodore Ts'o inode_bitmap <= last_bg_block) { 259677260807STheodore Ts'o ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: " 259777260807STheodore Ts'o "Inode bitmap for group %u overlaps " 259877260807STheodore Ts'o "block group descriptors", i); 259977260807STheodore Ts'o if (!sb_rdonly(sb)) 260077260807STheodore Ts'o return 0; 260177260807STheodore Ts'o } 26022b2d6d01STheodore Ts'o if (inode_bitmap < first_block || inode_bitmap > last_block) { 2603b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: " 2604a9df9a49STheodore Ts'o "Inode bitmap for group %u not in group " 2605b31e1552SEric Sandeen "(block %llu)!", i, inode_bitmap); 2606ac27a0ecSDave Kleikamp return 0; 2607ac27a0ecSDave Kleikamp } 26088fadc143SAlexandre Ratchov inode_table = ext4_inode_table(sb, gdp); 2609829fa70dSTheodore Ts'o if (inode_table == sb_block) { 2610829fa70dSTheodore Ts'o ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: " 2611829fa70dSTheodore Ts'o "Inode table for group %u overlaps " 2612829fa70dSTheodore Ts'o "superblock", i); 261318db4b4eSTheodore Ts'o if (!sb_rdonly(sb)) 261418db4b4eSTheodore Ts'o return 0; 2615829fa70dSTheodore Ts'o } 261677260807STheodore Ts'o if (inode_table >= sb_block + 1 && 261777260807STheodore Ts'o inode_table <= last_bg_block) { 261877260807STheodore Ts'o ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: " 261977260807STheodore Ts'o "Inode table for group %u overlaps " 262077260807STheodore Ts'o "block group descriptors", i); 262177260807STheodore Ts'o if (!sb_rdonly(sb)) 262277260807STheodore Ts'o return 0; 262377260807STheodore Ts'o } 2624bd81d8eeSLaurent Vivier if (inode_table < first_block || 26252b2d6d01STheodore Ts'o inode_table + sbi->s_itb_per_group - 1 > last_block) { 2626b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: " 2627a9df9a49STheodore Ts'o "Inode table for group %u not in group " 2628b31e1552SEric Sandeen "(block %llu)!", i, inode_table); 2629ac27a0ecSDave Kleikamp return 0; 2630ac27a0ecSDave Kleikamp } 2631955ce5f5SAneesh Kumar K.V ext4_lock_group(sb, i); 2632feb0ab32SDarrick J. Wong if (!ext4_group_desc_csum_verify(sb, i, gdp)) { 2633b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "ext4_check_descriptors: " 2634b31e1552SEric Sandeen "Checksum for group %u failed (%u!=%u)", 2635e2b911c5SDarrick J. Wong i, le16_to_cpu(ext4_group_desc_csum(sb, i, 2636fd2d4291SAvantika Mathur gdp)), le16_to_cpu(gdp->bg_checksum)); 2637bc98a42cSDavid Howells if (!sb_rdonly(sb)) { 2638955ce5f5SAneesh Kumar K.V ext4_unlock_group(sb, i); 2639717d50e4SAndreas Dilger return 0; 2640717d50e4SAndreas Dilger } 26417ee1ec4cSLi Zefan } 2642955ce5f5SAneesh Kumar K.V ext4_unlock_group(sb, i); 2643ce421581SJose R. Santos if (!flexbg_flag) 2644617ba13bSMingming Cao first_block += EXT4_BLOCKS_PER_GROUP(sb); 2645ac27a0ecSDave Kleikamp } 2646bfff6873SLukas Czerner if (NULL != first_not_zeroed) 2647bfff6873SLukas Czerner *first_not_zeroed = grp; 2648ac27a0ecSDave Kleikamp return 1; 2649ac27a0ecSDave Kleikamp } 2650ac27a0ecSDave Kleikamp 2651617ba13bSMingming Cao /* ext4_orphan_cleanup() walks a singly-linked list of inodes (starting at 2652ac27a0ecSDave Kleikamp * the superblock) which were deleted from all directories, but held open by 2653ac27a0ecSDave Kleikamp * a process at the time of a crash. We walk the list and try to delete these 2654ac27a0ecSDave Kleikamp * inodes at recovery time (only with a read-write filesystem). 2655ac27a0ecSDave Kleikamp * 2656ac27a0ecSDave Kleikamp * In order to keep the orphan inode chain consistent during traversal (in 2657ac27a0ecSDave Kleikamp * case of crash during recovery), we link each inode into the superblock 2658ac27a0ecSDave Kleikamp * orphan list_head and handle it the same way as an inode deletion during 2659ac27a0ecSDave Kleikamp * normal operation (which journals the operations for us). 2660ac27a0ecSDave Kleikamp * 2661ac27a0ecSDave Kleikamp * We only do an iget() and an iput() on each inode, which is very safe if we 2662ac27a0ecSDave Kleikamp * accidentally point at an in-use or already deleted inode. The worst that 2663ac27a0ecSDave Kleikamp * can happen in this case is that we get a "bit already cleared" message from 2664617ba13bSMingming Cao * ext4_free_inode(). The only reason we would point at a wrong inode is if 2665ac27a0ecSDave Kleikamp * e2fsck was run on this filesystem, and it must have already done the orphan 2666ac27a0ecSDave Kleikamp * inode cleanup for us, so we can safely abort without any further action. 2667ac27a0ecSDave Kleikamp */ 2668617ba13bSMingming Cao static void ext4_orphan_cleanup(struct super_block *sb, 2669617ba13bSMingming Cao struct ext4_super_block *es) 2670ac27a0ecSDave Kleikamp { 2671ac27a0ecSDave Kleikamp unsigned int s_flags = sb->s_flags; 26722c98eb5eSTheodore Ts'o int ret, nr_orphans = 0, nr_truncates = 0; 2673ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA 267495f1fda4Szhangyi (F) int quota_update = 0; 2675ac27a0ecSDave Kleikamp int i; 2676ac27a0ecSDave Kleikamp #endif 2677ac27a0ecSDave Kleikamp if (!es->s_last_orphan) { 2678ac27a0ecSDave Kleikamp jbd_debug(4, "no orphan inodes to clean up\n"); 2679ac27a0ecSDave Kleikamp return; 2680ac27a0ecSDave Kleikamp } 2681ac27a0ecSDave Kleikamp 2682a8f48a95SEric Sandeen if (bdev_read_only(sb->s_bdev)) { 2683b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "write access " 2684b31e1552SEric Sandeen "unavailable, skipping orphan cleanup"); 2685a8f48a95SEric Sandeen return; 2686a8f48a95SEric Sandeen } 2687a8f48a95SEric Sandeen 2688d39195c3SAmir Goldstein /* Check if feature set would not allow a r/w mount */ 2689d39195c3SAmir Goldstein if (!ext4_feature_set_ok(sb, 0)) { 2690d39195c3SAmir Goldstein ext4_msg(sb, KERN_INFO, "Skipping orphan cleanup due to " 2691d39195c3SAmir Goldstein "unknown ROCOMPAT features"); 2692d39195c3SAmir Goldstein return; 2693d39195c3SAmir Goldstein } 2694d39195c3SAmir Goldstein 2695617ba13bSMingming Cao if (EXT4_SB(sb)->s_mount_state & EXT4_ERROR_FS) { 2696c25f9bc6SEric Sandeen /* don't clear list on RO mount w/ errors */ 26971751e8a6SLinus Torvalds if (es->s_last_orphan && !(s_flags & SB_RDONLY)) { 269884474976SDmitry Monakhov ext4_msg(sb, KERN_INFO, "Errors on filesystem, " 2699ac27a0ecSDave Kleikamp "clearing orphan list.\n"); 2700ac27a0ecSDave Kleikamp es->s_last_orphan = 0; 2701c25f9bc6SEric Sandeen } 2702ac27a0ecSDave Kleikamp jbd_debug(1, "Skipping orphan recovery on fs with errors.\n"); 2703ac27a0ecSDave Kleikamp return; 2704ac27a0ecSDave Kleikamp } 2705ac27a0ecSDave Kleikamp 27061751e8a6SLinus Torvalds if (s_flags & SB_RDONLY) { 2707b31e1552SEric Sandeen ext4_msg(sb, KERN_INFO, "orphan cleanup on readonly fs"); 27081751e8a6SLinus Torvalds sb->s_flags &= ~SB_RDONLY; 2709ac27a0ecSDave Kleikamp } 2710ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA 2711ac27a0ecSDave Kleikamp /* Needed for iput() to work correctly and not trash data */ 27121751e8a6SLinus Torvalds sb->s_flags |= SB_ACTIVE; 271395f1fda4Szhangyi (F) 271495f1fda4Szhangyi (F) /* 271595f1fda4Szhangyi (F) * Turn on quotas which were not enabled for read-only mounts if 271695f1fda4Szhangyi (F) * filesystem has quota feature, so that they are updated correctly. 271795f1fda4Szhangyi (F) */ 27181751e8a6SLinus Torvalds if (ext4_has_feature_quota(sb) && (s_flags & SB_RDONLY)) { 271995f1fda4Szhangyi (F) int ret = ext4_enable_quotas(sb); 272095f1fda4Szhangyi (F) 272195f1fda4Szhangyi (F) if (!ret) 272295f1fda4Szhangyi (F) quota_update = 1; 272395f1fda4Szhangyi (F) else 272495f1fda4Szhangyi (F) ext4_msg(sb, KERN_ERR, 272595f1fda4Szhangyi (F) "Cannot turn on quotas: error %d", ret); 272695f1fda4Szhangyi (F) } 272795f1fda4Szhangyi (F) 272895f1fda4Szhangyi (F) /* Turn on journaled quotas used for old sytle */ 2729a2d4a646SJan Kara for (i = 0; i < EXT4_MAXQUOTAS; i++) { 2730617ba13bSMingming Cao if (EXT4_SB(sb)->s_qf_names[i]) { 2731617ba13bSMingming Cao int ret = ext4_quota_on_mount(sb, i); 273295f1fda4Szhangyi (F) 273395f1fda4Szhangyi (F) if (!ret) 273495f1fda4Szhangyi (F) quota_update = 1; 273595f1fda4Szhangyi (F) else 2736b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, 2737b31e1552SEric Sandeen "Cannot turn on journaled " 273895f1fda4Szhangyi (F) "quota: type %d: error %d", i, ret); 2739ac27a0ecSDave Kleikamp } 2740ac27a0ecSDave Kleikamp } 2741ac27a0ecSDave Kleikamp #endif 2742ac27a0ecSDave Kleikamp 2743ac27a0ecSDave Kleikamp while (es->s_last_orphan) { 2744ac27a0ecSDave Kleikamp struct inode *inode; 2745ac27a0ecSDave Kleikamp 2746c65d5c6cSVegard Nossum /* 2747c65d5c6cSVegard Nossum * We may have encountered an error during cleanup; if 2748c65d5c6cSVegard Nossum * so, skip the rest. 2749c65d5c6cSVegard Nossum */ 2750c65d5c6cSVegard Nossum if (EXT4_SB(sb)->s_mount_state & EXT4_ERROR_FS) { 2751c65d5c6cSVegard Nossum jbd_debug(1, "Skipping orphan recovery on fs with errors.\n"); 2752c65d5c6cSVegard Nossum es->s_last_orphan = 0; 2753c65d5c6cSVegard Nossum break; 2754c65d5c6cSVegard Nossum } 2755c65d5c6cSVegard Nossum 275697bd42b9SJosef Bacik inode = ext4_orphan_get(sb, le32_to_cpu(es->s_last_orphan)); 275797bd42b9SJosef Bacik if (IS_ERR(inode)) { 2758ac27a0ecSDave Kleikamp es->s_last_orphan = 0; 2759ac27a0ecSDave Kleikamp break; 2760ac27a0ecSDave Kleikamp } 2761ac27a0ecSDave Kleikamp 2762617ba13bSMingming Cao list_add(&EXT4_I(inode)->i_orphan, &EXT4_SB(sb)->s_orphan); 2763871a2931SChristoph Hellwig dquot_initialize(inode); 2764ac27a0ecSDave Kleikamp if (inode->i_nlink) { 2765566370a2SPaul Taysom if (test_opt(sb, DEBUG)) 2766b31e1552SEric Sandeen ext4_msg(sb, KERN_DEBUG, 2767b31e1552SEric Sandeen "%s: truncating inode %lu to %lld bytes", 276846e665e9SHarvey Harrison __func__, inode->i_ino, inode->i_size); 2769e5f8eab8STheodore Ts'o jbd_debug(2, "truncating inode %lu to %lld bytes\n", 2770ac27a0ecSDave Kleikamp inode->i_ino, inode->i_size); 27715955102cSAl Viro inode_lock(inode); 277255f252c9SLukas Czerner truncate_inode_pages(inode->i_mapping, inode->i_size); 27732c98eb5eSTheodore Ts'o ret = ext4_truncate(inode); 27742c98eb5eSTheodore Ts'o if (ret) 27752c98eb5eSTheodore Ts'o ext4_std_error(inode->i_sb, ret); 27765955102cSAl Viro inode_unlock(inode); 2777ac27a0ecSDave Kleikamp nr_truncates++; 2778ac27a0ecSDave Kleikamp } else { 2779566370a2SPaul Taysom if (test_opt(sb, DEBUG)) 2780b31e1552SEric Sandeen ext4_msg(sb, KERN_DEBUG, 2781b31e1552SEric Sandeen "%s: deleting unreferenced inode %lu", 278246e665e9SHarvey Harrison __func__, inode->i_ino); 2783ac27a0ecSDave Kleikamp jbd_debug(2, "deleting unreferenced inode %lu\n", 2784ac27a0ecSDave Kleikamp inode->i_ino); 2785ac27a0ecSDave Kleikamp nr_orphans++; 2786ac27a0ecSDave Kleikamp } 2787ac27a0ecSDave Kleikamp iput(inode); /* The delete magic happens here! */ 2788ac27a0ecSDave Kleikamp } 2789ac27a0ecSDave Kleikamp 2790ac27a0ecSDave Kleikamp #define PLURAL(x) (x), ((x) == 1) ? "" : "s" 2791ac27a0ecSDave Kleikamp 2792ac27a0ecSDave Kleikamp if (nr_orphans) 2793b31e1552SEric Sandeen ext4_msg(sb, KERN_INFO, "%d orphan inode%s deleted", 2794b31e1552SEric Sandeen PLURAL(nr_orphans)); 2795ac27a0ecSDave Kleikamp if (nr_truncates) 2796b31e1552SEric Sandeen ext4_msg(sb, KERN_INFO, "%d truncate%s cleaned up", 2797b31e1552SEric Sandeen PLURAL(nr_truncates)); 2798ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA 279995f1fda4Szhangyi (F) /* Turn off quotas if they were enabled for orphan cleanup */ 280095f1fda4Szhangyi (F) if (quota_update) { 2801a2d4a646SJan Kara for (i = 0; i < EXT4_MAXQUOTAS; i++) { 280295f1fda4Szhangyi (F) if (sb_dqopt(sb)->files[i]) 2803287a8095SChristoph Hellwig dquot_quota_off(sb, i); 2804ac27a0ecSDave Kleikamp } 280595f1fda4Szhangyi (F) } 2806ac27a0ecSDave Kleikamp #endif 28071751e8a6SLinus Torvalds sb->s_flags = s_flags; /* Restore SB_RDONLY status */ 2808ac27a0ecSDave Kleikamp } 28090b8e58a1SAndreas Dilger 2810cd2291a4SEric Sandeen /* 2811cd2291a4SEric Sandeen * Maximal extent format file size. 2812cd2291a4SEric Sandeen * Resulting logical blkno at s_maxbytes must fit in our on-disk 2813cd2291a4SEric Sandeen * extent format containers, within a sector_t, and within i_blocks 2814cd2291a4SEric Sandeen * in the vfs. ext4 inode has 48 bits of i_block in fsblock units, 2815cd2291a4SEric Sandeen * so that won't be a limiting factor. 2816cd2291a4SEric Sandeen * 2817f17722f9SLukas Czerner * However there is other limiting factor. We do store extents in the form 2818f17722f9SLukas Czerner * of starting block and length, hence the resulting length of the extent 2819f17722f9SLukas Czerner * covering maximum file size must fit into on-disk format containers as 2820f17722f9SLukas Czerner * well. Given that length is always by 1 unit bigger than max unit (because 2821f17722f9SLukas Czerner * we count 0 as well) we have to lower the s_maxbytes by one fs block. 2822f17722f9SLukas Czerner * 2823cd2291a4SEric Sandeen * Note, this does *not* consider any metadata overhead for vfs i_blocks. 2824cd2291a4SEric Sandeen */ 2825f287a1a5STheodore Ts'o static loff_t ext4_max_size(int blkbits, int has_huge_files) 2826cd2291a4SEric Sandeen { 2827cd2291a4SEric Sandeen loff_t res; 2828cd2291a4SEric Sandeen loff_t upper_limit = MAX_LFS_FILESIZE; 2829cd2291a4SEric Sandeen 283072deb455SChristoph Hellwig BUILD_BUG_ON(sizeof(blkcnt_t) < sizeof(u64)); 283172deb455SChristoph Hellwig 283272deb455SChristoph Hellwig if (!has_huge_files) { 2833cd2291a4SEric Sandeen upper_limit = (1LL << 32) - 1; 2834cd2291a4SEric Sandeen 2835cd2291a4SEric Sandeen /* total blocks in file system block size */ 2836cd2291a4SEric Sandeen upper_limit >>= (blkbits - 9); 2837cd2291a4SEric Sandeen upper_limit <<= blkbits; 2838cd2291a4SEric Sandeen } 2839cd2291a4SEric Sandeen 2840f17722f9SLukas Czerner /* 2841f17722f9SLukas Czerner * 32-bit extent-start container, ee_block. We lower the maxbytes 2842f17722f9SLukas Czerner * by one fs block, so ee_len can cover the extent of maximum file 2843f17722f9SLukas Czerner * size 2844f17722f9SLukas Czerner */ 2845f17722f9SLukas Czerner res = (1LL << 32) - 1; 2846cd2291a4SEric Sandeen res <<= blkbits; 2847cd2291a4SEric Sandeen 2848cd2291a4SEric Sandeen /* Sanity check against vm- & vfs- imposed limits */ 2849cd2291a4SEric Sandeen if (res > upper_limit) 2850cd2291a4SEric Sandeen res = upper_limit; 2851cd2291a4SEric Sandeen 2852cd2291a4SEric Sandeen return res; 2853cd2291a4SEric Sandeen } 2854ac27a0ecSDave Kleikamp 2855ac27a0ecSDave Kleikamp /* 2856cd2291a4SEric Sandeen * Maximal bitmap file size. There is a direct, and {,double-,triple-}indirect 28570fc1b451SAneesh Kumar K.V * block limit, and also a limit of (2^48 - 1) 512-byte sectors in i_blocks. 28580fc1b451SAneesh Kumar K.V * We need to be 1 filesystem block less than the 2^48 sector limit. 2859ac27a0ecSDave Kleikamp */ 2860f287a1a5STheodore Ts'o static loff_t ext4_max_bitmap_size(int bits, int has_huge_files) 2861ac27a0ecSDave Kleikamp { 2862617ba13bSMingming Cao loff_t res = EXT4_NDIR_BLOCKS; 28630fc1b451SAneesh Kumar K.V int meta_blocks; 28640fc1b451SAneesh Kumar K.V loff_t upper_limit; 28650b8e58a1SAndreas Dilger /* This is calculated to be the largest file size for a dense, block 28660b8e58a1SAndreas Dilger * mapped file such that the file's total number of 512-byte sectors, 28670b8e58a1SAndreas Dilger * including data and all indirect blocks, does not exceed (2^48 - 1). 28680b8e58a1SAndreas Dilger * 28690b8e58a1SAndreas Dilger * __u32 i_blocks_lo and _u16 i_blocks_high represent the total 28700b8e58a1SAndreas Dilger * number of 512-byte sectors of the file. 28710fc1b451SAneesh Kumar K.V */ 28720fc1b451SAneesh Kumar K.V 287372deb455SChristoph Hellwig if (!has_huge_files) { 28740fc1b451SAneesh Kumar K.V /* 287572deb455SChristoph Hellwig * !has_huge_files or implies that the inode i_block field 287672deb455SChristoph Hellwig * represents total file blocks in 2^32 512-byte sectors == 287772deb455SChristoph Hellwig * size of vfs inode i_blocks * 8 28780fc1b451SAneesh Kumar K.V */ 28790fc1b451SAneesh Kumar K.V upper_limit = (1LL << 32) - 1; 28800fc1b451SAneesh Kumar K.V 28810fc1b451SAneesh Kumar K.V /* total blocks in file system block size */ 28820fc1b451SAneesh Kumar K.V upper_limit >>= (bits - 9); 28830fc1b451SAneesh Kumar K.V 28840fc1b451SAneesh Kumar K.V } else { 28858180a562SAneesh Kumar K.V /* 28868180a562SAneesh Kumar K.V * We use 48 bit ext4_inode i_blocks 28878180a562SAneesh Kumar K.V * With EXT4_HUGE_FILE_FL set the i_blocks 28888180a562SAneesh Kumar K.V * represent total number of blocks in 28898180a562SAneesh Kumar K.V * file system block size 28908180a562SAneesh Kumar K.V */ 28910fc1b451SAneesh Kumar K.V upper_limit = (1LL << 48) - 1; 28920fc1b451SAneesh Kumar K.V 28930fc1b451SAneesh Kumar K.V } 28940fc1b451SAneesh Kumar K.V 28950fc1b451SAneesh Kumar K.V /* indirect blocks */ 28960fc1b451SAneesh Kumar K.V meta_blocks = 1; 28970fc1b451SAneesh Kumar K.V /* double indirect blocks */ 28980fc1b451SAneesh Kumar K.V meta_blocks += 1 + (1LL << (bits-2)); 28990fc1b451SAneesh Kumar K.V /* tripple indirect blocks */ 29000fc1b451SAneesh Kumar K.V meta_blocks += 1 + (1LL << (bits-2)) + (1LL << (2*(bits-2))); 29010fc1b451SAneesh Kumar K.V 29020fc1b451SAneesh Kumar K.V upper_limit -= meta_blocks; 29030fc1b451SAneesh Kumar K.V upper_limit <<= bits; 2904ac27a0ecSDave Kleikamp 2905ac27a0ecSDave Kleikamp res += 1LL << (bits-2); 2906ac27a0ecSDave Kleikamp res += 1LL << (2*(bits-2)); 2907ac27a0ecSDave Kleikamp res += 1LL << (3*(bits-2)); 2908ac27a0ecSDave Kleikamp res <<= bits; 2909ac27a0ecSDave Kleikamp if (res > upper_limit) 2910ac27a0ecSDave Kleikamp res = upper_limit; 29110fc1b451SAneesh Kumar K.V 29120fc1b451SAneesh Kumar K.V if (res > MAX_LFS_FILESIZE) 29130fc1b451SAneesh Kumar K.V res = MAX_LFS_FILESIZE; 29140fc1b451SAneesh Kumar K.V 2915ac27a0ecSDave Kleikamp return res; 2916ac27a0ecSDave Kleikamp } 2917ac27a0ecSDave Kleikamp 2918617ba13bSMingming Cao static ext4_fsblk_t descriptor_loc(struct super_block *sb, 291970bbb3e0SAndrew Morton ext4_fsblk_t logical_sb_block, int nr) 2920ac27a0ecSDave Kleikamp { 2921617ba13bSMingming Cao struct ext4_sb_info *sbi = EXT4_SB(sb); 2922fd2d4291SAvantika Mathur ext4_group_t bg, first_meta_bg; 2923ac27a0ecSDave Kleikamp int has_super = 0; 2924ac27a0ecSDave Kleikamp 2925ac27a0ecSDave Kleikamp first_meta_bg = le32_to_cpu(sbi->s_es->s_first_meta_bg); 2926ac27a0ecSDave Kleikamp 2927e2b911c5SDarrick J. Wong if (!ext4_has_feature_meta_bg(sb) || nr < first_meta_bg) 292870bbb3e0SAndrew Morton return logical_sb_block + nr + 1; 2929ac27a0ecSDave Kleikamp bg = sbi->s_desc_per_block * nr; 2930617ba13bSMingming Cao if (ext4_bg_has_super(sb, bg)) 2931ac27a0ecSDave Kleikamp has_super = 1; 29320b8e58a1SAndreas Dilger 2933bd63f6b0SDarrick J. Wong /* 2934bd63f6b0SDarrick J. Wong * If we have a meta_bg fs with 1k blocks, group 0's GDT is at 2935bd63f6b0SDarrick J. Wong * block 2, not 1. If s_first_data_block == 0 (bigalloc is enabled 2936bd63f6b0SDarrick J. Wong * on modern mke2fs or blksize > 1k on older mke2fs) then we must 2937bd63f6b0SDarrick J. Wong * compensate. 2938bd63f6b0SDarrick J. Wong */ 2939bd63f6b0SDarrick J. Wong if (sb->s_blocksize == 1024 && nr == 0 && 294049598e04SJun Piao le32_to_cpu(sbi->s_es->s_first_data_block) == 0) 2941bd63f6b0SDarrick J. Wong has_super++; 2942bd63f6b0SDarrick J. Wong 2943617ba13bSMingming Cao return (has_super + ext4_group_first_block_no(sb, bg)); 2944ac27a0ecSDave Kleikamp } 2945ac27a0ecSDave Kleikamp 2946c9de560dSAlex Tomas /** 2947c9de560dSAlex Tomas * ext4_get_stripe_size: Get the stripe size. 2948c9de560dSAlex Tomas * @sbi: In memory super block info 2949c9de560dSAlex Tomas * 2950c9de560dSAlex Tomas * If we have specified it via mount option, then 2951c9de560dSAlex Tomas * use the mount option value. If the value specified at mount time is 2952c9de560dSAlex Tomas * greater than the blocks per group use the super block value. 2953c9de560dSAlex Tomas * If the super block value is greater than blocks per group return 0. 2954c9de560dSAlex Tomas * Allocator needs it be less than blocks per group. 2955c9de560dSAlex Tomas * 2956c9de560dSAlex Tomas */ 2957c9de560dSAlex Tomas static unsigned long ext4_get_stripe_size(struct ext4_sb_info *sbi) 2958c9de560dSAlex Tomas { 2959c9de560dSAlex Tomas unsigned long stride = le16_to_cpu(sbi->s_es->s_raid_stride); 2960c9de560dSAlex Tomas unsigned long stripe_width = 2961c9de560dSAlex Tomas le32_to_cpu(sbi->s_es->s_raid_stripe_width); 29623eb08658SDan Ehrenberg int ret; 2963c9de560dSAlex Tomas 2964c9de560dSAlex Tomas if (sbi->s_stripe && sbi->s_stripe <= sbi->s_blocks_per_group) 29653eb08658SDan Ehrenberg ret = sbi->s_stripe; 29665469d7c3SJan Kara else if (stripe_width && stripe_width <= sbi->s_blocks_per_group) 29673eb08658SDan Ehrenberg ret = stripe_width; 29685469d7c3SJan Kara else if (stride && stride <= sbi->s_blocks_per_group) 29693eb08658SDan Ehrenberg ret = stride; 29703eb08658SDan Ehrenberg else 29713eb08658SDan Ehrenberg ret = 0; 2972c9de560dSAlex Tomas 29733eb08658SDan Ehrenberg /* 29743eb08658SDan Ehrenberg * If the stripe width is 1, this makes no sense and 29753eb08658SDan Ehrenberg * we set it to 0 to turn off stripe handling code. 29763eb08658SDan Ehrenberg */ 29773eb08658SDan Ehrenberg if (ret <= 1) 29783eb08658SDan Ehrenberg ret = 0; 2979c9de560dSAlex Tomas 29803eb08658SDan Ehrenberg return ret; 2981c9de560dSAlex Tomas } 2982ac27a0ecSDave Kleikamp 2983a13fb1a4SEric Sandeen /* 2984a13fb1a4SEric Sandeen * Check whether this filesystem can be mounted based on 2985a13fb1a4SEric Sandeen * the features present and the RDONLY/RDWR mount requested. 2986a13fb1a4SEric Sandeen * Returns 1 if this filesystem can be mounted as requested, 2987a13fb1a4SEric Sandeen * 0 if it cannot be. 2988a13fb1a4SEric Sandeen */ 2989a13fb1a4SEric Sandeen static int ext4_feature_set_ok(struct super_block *sb, int readonly) 2990a13fb1a4SEric Sandeen { 2991e2b911c5SDarrick J. Wong if (ext4_has_unknown_ext4_incompat_features(sb)) { 2992a13fb1a4SEric Sandeen ext4_msg(sb, KERN_ERR, 2993a13fb1a4SEric Sandeen "Couldn't mount because of " 2994a13fb1a4SEric Sandeen "unsupported optional features (%x)", 2995a13fb1a4SEric Sandeen (le32_to_cpu(EXT4_SB(sb)->s_es->s_feature_incompat) & 2996a13fb1a4SEric Sandeen ~EXT4_FEATURE_INCOMPAT_SUPP)); 2997a13fb1a4SEric Sandeen return 0; 2998a13fb1a4SEric Sandeen } 2999a13fb1a4SEric Sandeen 3000c83ad55eSGabriel Krisman Bertazi #ifndef CONFIG_UNICODE 3001c83ad55eSGabriel Krisman Bertazi if (ext4_has_feature_casefold(sb)) { 3002c83ad55eSGabriel Krisman Bertazi ext4_msg(sb, KERN_ERR, 3003c83ad55eSGabriel Krisman Bertazi "Filesystem with casefold feature cannot be " 3004c83ad55eSGabriel Krisman Bertazi "mounted without CONFIG_UNICODE"); 3005c83ad55eSGabriel Krisman Bertazi return 0; 3006c83ad55eSGabriel Krisman Bertazi } 3007c83ad55eSGabriel Krisman Bertazi #endif 3008c83ad55eSGabriel Krisman Bertazi 3009a13fb1a4SEric Sandeen if (readonly) 3010a13fb1a4SEric Sandeen return 1; 3011a13fb1a4SEric Sandeen 3012e2b911c5SDarrick J. Wong if (ext4_has_feature_readonly(sb)) { 30132cb5cc8bSDarrick J. Wong ext4_msg(sb, KERN_INFO, "filesystem is read-only"); 30141751e8a6SLinus Torvalds sb->s_flags |= SB_RDONLY; 30152cb5cc8bSDarrick J. Wong return 1; 30162cb5cc8bSDarrick J. Wong } 30172cb5cc8bSDarrick J. Wong 3018a13fb1a4SEric Sandeen /* Check that feature set is OK for a read-write mount */ 3019e2b911c5SDarrick J. Wong if (ext4_has_unknown_ext4_ro_compat_features(sb)) { 3020a13fb1a4SEric Sandeen ext4_msg(sb, KERN_ERR, "couldn't mount RDWR because of " 3021a13fb1a4SEric Sandeen "unsupported optional features (%x)", 3022a13fb1a4SEric Sandeen (le32_to_cpu(EXT4_SB(sb)->s_es->s_feature_ro_compat) & 3023a13fb1a4SEric Sandeen ~EXT4_FEATURE_RO_COMPAT_SUPP)); 3024a13fb1a4SEric Sandeen return 0; 3025a13fb1a4SEric Sandeen } 3026e2b911c5SDarrick J. Wong if (ext4_has_feature_bigalloc(sb) && !ext4_has_feature_extents(sb)) { 3027bab08ab9STheodore Ts'o ext4_msg(sb, KERN_ERR, 3028bab08ab9STheodore Ts'o "Can't support bigalloc feature without " 3029bab08ab9STheodore Ts'o "extents feature\n"); 3030bab08ab9STheodore Ts'o return 0; 3031bab08ab9STheodore Ts'o } 30327c319d32SAditya Kali 30337c319d32SAditya Kali #ifndef CONFIG_QUOTA 3034e2b911c5SDarrick J. Wong if (ext4_has_feature_quota(sb) && !readonly) { 30357c319d32SAditya Kali ext4_msg(sb, KERN_ERR, 30367c319d32SAditya Kali "Filesystem with quota feature cannot be mounted RDWR " 30377c319d32SAditya Kali "without CONFIG_QUOTA"); 30387c319d32SAditya Kali return 0; 30397c319d32SAditya Kali } 3040689c958cSLi Xi if (ext4_has_feature_project(sb) && !readonly) { 3041689c958cSLi Xi ext4_msg(sb, KERN_ERR, 3042689c958cSLi Xi "Filesystem with project quota feature cannot be mounted RDWR " 3043689c958cSLi Xi "without CONFIG_QUOTA"); 3044689c958cSLi Xi return 0; 3045689c958cSLi Xi } 30467c319d32SAditya Kali #endif /* CONFIG_QUOTA */ 3047a13fb1a4SEric Sandeen return 1; 3048a13fb1a4SEric Sandeen } 3049a13fb1a4SEric Sandeen 305066e61a9eSTheodore Ts'o /* 305166e61a9eSTheodore Ts'o * This function is called once a day if we have errors logged 305266e61a9eSTheodore Ts'o * on the file system 305366e61a9eSTheodore Ts'o */ 3054235699a8SKees Cook static void print_daily_error_info(struct timer_list *t) 305566e61a9eSTheodore Ts'o { 3056235699a8SKees Cook struct ext4_sb_info *sbi = from_timer(sbi, t, s_err_report); 3057235699a8SKees Cook struct super_block *sb = sbi->s_sb; 3058235699a8SKees Cook struct ext4_super_block *es = sbi->s_es; 305966e61a9eSTheodore Ts'o 306066e61a9eSTheodore Ts'o if (es->s_error_count) 3061ae0f78deSTheodore Ts'o /* fsck newer than v1.41.13 is needed to clean this condition. */ 3062ae0f78deSTheodore Ts'o ext4_msg(sb, KERN_NOTICE, "error count since last fsck: %u", 306366e61a9eSTheodore Ts'o le32_to_cpu(es->s_error_count)); 306466e61a9eSTheodore Ts'o if (es->s_first_error_time) { 30656a0678a7SArnd Bergmann printk(KERN_NOTICE "EXT4-fs (%s): initial error at time %llu: %.*s:%d", 30666a0678a7SArnd Bergmann sb->s_id, 30676a0678a7SArnd Bergmann ext4_get_tstamp(es, s_first_error_time), 306866e61a9eSTheodore Ts'o (int) sizeof(es->s_first_error_func), 306966e61a9eSTheodore Ts'o es->s_first_error_func, 307066e61a9eSTheodore Ts'o le32_to_cpu(es->s_first_error_line)); 307166e61a9eSTheodore Ts'o if (es->s_first_error_ino) 3072651e1c3bSJoe Perches printk(KERN_CONT ": inode %u", 307366e61a9eSTheodore Ts'o le32_to_cpu(es->s_first_error_ino)); 307466e61a9eSTheodore Ts'o if (es->s_first_error_block) 3075651e1c3bSJoe Perches printk(KERN_CONT ": block %llu", (unsigned long long) 307666e61a9eSTheodore Ts'o le64_to_cpu(es->s_first_error_block)); 3077651e1c3bSJoe Perches printk(KERN_CONT "\n"); 307866e61a9eSTheodore Ts'o } 307966e61a9eSTheodore Ts'o if (es->s_last_error_time) { 30806a0678a7SArnd Bergmann printk(KERN_NOTICE "EXT4-fs (%s): last error at time %llu: %.*s:%d", 30816a0678a7SArnd Bergmann sb->s_id, 30826a0678a7SArnd Bergmann ext4_get_tstamp(es, s_last_error_time), 308366e61a9eSTheodore Ts'o (int) sizeof(es->s_last_error_func), 308466e61a9eSTheodore Ts'o es->s_last_error_func, 308566e61a9eSTheodore Ts'o le32_to_cpu(es->s_last_error_line)); 308666e61a9eSTheodore Ts'o if (es->s_last_error_ino) 3087651e1c3bSJoe Perches printk(KERN_CONT ": inode %u", 308866e61a9eSTheodore Ts'o le32_to_cpu(es->s_last_error_ino)); 308966e61a9eSTheodore Ts'o if (es->s_last_error_block) 3090651e1c3bSJoe Perches printk(KERN_CONT ": block %llu", (unsigned long long) 309166e61a9eSTheodore Ts'o le64_to_cpu(es->s_last_error_block)); 3092651e1c3bSJoe Perches printk(KERN_CONT "\n"); 309366e61a9eSTheodore Ts'o } 309466e61a9eSTheodore Ts'o mod_timer(&sbi->s_err_report, jiffies + 24*60*60*HZ); /* Once a day */ 309566e61a9eSTheodore Ts'o } 309666e61a9eSTheodore Ts'o 3097bfff6873SLukas Czerner /* Find next suitable group and run ext4_init_inode_table */ 3098bfff6873SLukas Czerner static int ext4_run_li_request(struct ext4_li_request *elr) 3099bfff6873SLukas Czerner { 3100bfff6873SLukas Czerner struct ext4_group_desc *gdp = NULL; 3101bfff6873SLukas Czerner ext4_group_t group, ngroups; 3102bfff6873SLukas Czerner struct super_block *sb; 3103bfff6873SLukas Czerner unsigned long timeout = 0; 3104bfff6873SLukas Czerner int ret = 0; 3105bfff6873SLukas Czerner 3106bfff6873SLukas Czerner sb = elr->lr_super; 3107bfff6873SLukas Czerner ngroups = EXT4_SB(sb)->s_groups_count; 3108bfff6873SLukas Czerner 3109bfff6873SLukas Czerner for (group = elr->lr_next_group; group < ngroups; group++) { 3110bfff6873SLukas Czerner gdp = ext4_get_group_desc(sb, group, NULL); 3111bfff6873SLukas Czerner if (!gdp) { 3112bfff6873SLukas Czerner ret = 1; 3113bfff6873SLukas Czerner break; 3114bfff6873SLukas Czerner } 3115bfff6873SLukas Czerner 3116bfff6873SLukas Czerner if (!(gdp->bg_flags & cpu_to_le16(EXT4_BG_INODE_ZEROED))) 3117bfff6873SLukas Czerner break; 3118bfff6873SLukas Czerner } 3119bfff6873SLukas Czerner 31207f511862STheodore Ts'o if (group >= ngroups) 3121bfff6873SLukas Czerner ret = 1; 3122bfff6873SLukas Czerner 3123bfff6873SLukas Czerner if (!ret) { 3124bfff6873SLukas Czerner timeout = jiffies; 3125bfff6873SLukas Czerner ret = ext4_init_inode_table(sb, group, 3126bfff6873SLukas Czerner elr->lr_timeout ? 0 : 1); 3127bfff6873SLukas Czerner if (elr->lr_timeout == 0) { 312851ce6511SLukas Czerner timeout = (jiffies - timeout) * 312951ce6511SLukas Czerner elr->lr_sbi->s_li_wait_mult; 3130bfff6873SLukas Czerner elr->lr_timeout = timeout; 3131bfff6873SLukas Czerner } 3132bfff6873SLukas Czerner elr->lr_next_sched = jiffies + elr->lr_timeout; 3133bfff6873SLukas Czerner elr->lr_next_group = group + 1; 3134bfff6873SLukas Czerner } 3135bfff6873SLukas Czerner return ret; 3136bfff6873SLukas Czerner } 3137bfff6873SLukas Czerner 3138bfff6873SLukas Czerner /* 3139bfff6873SLukas Czerner * Remove lr_request from the list_request and free the 31404ed5c033SLukas Czerner * request structure. Should be called with li_list_mtx held 3141bfff6873SLukas Czerner */ 3142bfff6873SLukas Czerner static void ext4_remove_li_request(struct ext4_li_request *elr) 3143bfff6873SLukas Czerner { 3144bfff6873SLukas Czerner struct ext4_sb_info *sbi; 3145bfff6873SLukas Czerner 3146bfff6873SLukas Czerner if (!elr) 3147bfff6873SLukas Czerner return; 3148bfff6873SLukas Czerner 3149bfff6873SLukas Czerner sbi = elr->lr_sbi; 3150bfff6873SLukas Czerner 3151bfff6873SLukas Czerner list_del(&elr->lr_request); 3152bfff6873SLukas Czerner sbi->s_li_request = NULL; 3153bfff6873SLukas Czerner kfree(elr); 3154bfff6873SLukas Czerner } 3155bfff6873SLukas Czerner 3156bfff6873SLukas Czerner static void ext4_unregister_li_request(struct super_block *sb) 3157bfff6873SLukas Czerner { 31581bb933fbSLukas Czerner mutex_lock(&ext4_li_mtx); 31591bb933fbSLukas Czerner if (!ext4_li_info) { 31601bb933fbSLukas Czerner mutex_unlock(&ext4_li_mtx); 3161bfff6873SLukas Czerner return; 31621bb933fbSLukas Czerner } 3163bfff6873SLukas Czerner 3164bfff6873SLukas Czerner mutex_lock(&ext4_li_info->li_list_mtx); 31651bb933fbSLukas Czerner ext4_remove_li_request(EXT4_SB(sb)->s_li_request); 3166bfff6873SLukas Czerner mutex_unlock(&ext4_li_info->li_list_mtx); 31671bb933fbSLukas Czerner mutex_unlock(&ext4_li_mtx); 3168bfff6873SLukas Czerner } 3169bfff6873SLukas Czerner 31708f1f7453SEric Sandeen static struct task_struct *ext4_lazyinit_task; 31718f1f7453SEric Sandeen 3172bfff6873SLukas Czerner /* 3173bfff6873SLukas Czerner * This is the function where ext4lazyinit thread lives. It walks 3174bfff6873SLukas Czerner * through the request list searching for next scheduled filesystem. 3175bfff6873SLukas Czerner * When such a fs is found, run the lazy initialization request 3176bfff6873SLukas Czerner * (ext4_rn_li_request) and keep track of the time spend in this 3177bfff6873SLukas Czerner * function. Based on that time we compute next schedule time of 3178bfff6873SLukas Czerner * the request. When walking through the list is complete, compute 3179bfff6873SLukas Czerner * next waking time and put itself into sleep. 3180bfff6873SLukas Czerner */ 3181bfff6873SLukas Czerner static int ext4_lazyinit_thread(void *arg) 3182bfff6873SLukas Czerner { 3183bfff6873SLukas Czerner struct ext4_lazy_init *eli = (struct ext4_lazy_init *)arg; 3184bfff6873SLukas Czerner struct list_head *pos, *n; 3185bfff6873SLukas Czerner struct ext4_li_request *elr; 31864ed5c033SLukas Czerner unsigned long next_wakeup, cur; 3187bfff6873SLukas Czerner 3188bfff6873SLukas Czerner BUG_ON(NULL == eli); 3189bfff6873SLukas Czerner 3190bfff6873SLukas Czerner cont_thread: 3191bfff6873SLukas Czerner while (true) { 3192bfff6873SLukas Czerner next_wakeup = MAX_JIFFY_OFFSET; 3193bfff6873SLukas Czerner 3194bfff6873SLukas Czerner mutex_lock(&eli->li_list_mtx); 3195bfff6873SLukas Czerner if (list_empty(&eli->li_request_list)) { 3196bfff6873SLukas Czerner mutex_unlock(&eli->li_list_mtx); 3197bfff6873SLukas Czerner goto exit_thread; 3198bfff6873SLukas Czerner } 3199bfff6873SLukas Czerner list_for_each_safe(pos, n, &eli->li_request_list) { 3200e22834f0SDmitry Monakhov int err = 0; 3201e22834f0SDmitry Monakhov int progress = 0; 3202bfff6873SLukas Czerner elr = list_entry(pos, struct ext4_li_request, 3203bfff6873SLukas Czerner lr_request); 3204bfff6873SLukas Czerner 3205e22834f0SDmitry Monakhov if (time_before(jiffies, elr->lr_next_sched)) { 3206e22834f0SDmitry Monakhov if (time_before(elr->lr_next_sched, next_wakeup)) 3207e22834f0SDmitry Monakhov next_wakeup = elr->lr_next_sched; 3208e22834f0SDmitry Monakhov continue; 3209e22834f0SDmitry Monakhov } 3210e22834f0SDmitry Monakhov if (down_read_trylock(&elr->lr_super->s_umount)) { 3211e22834f0SDmitry Monakhov if (sb_start_write_trylock(elr->lr_super)) { 3212e22834f0SDmitry Monakhov progress = 1; 3213e22834f0SDmitry Monakhov /* 3214e22834f0SDmitry Monakhov * We hold sb->s_umount, sb can not 3215e22834f0SDmitry Monakhov * be removed from the list, it is 3216e22834f0SDmitry Monakhov * now safe to drop li_list_mtx 3217e22834f0SDmitry Monakhov */ 3218e22834f0SDmitry Monakhov mutex_unlock(&eli->li_list_mtx); 3219e22834f0SDmitry Monakhov err = ext4_run_li_request(elr); 3220e22834f0SDmitry Monakhov sb_end_write(elr->lr_super); 3221e22834f0SDmitry Monakhov mutex_lock(&eli->li_list_mtx); 3222e22834f0SDmitry Monakhov n = pos->next; 3223e22834f0SDmitry Monakhov } 3224e22834f0SDmitry Monakhov up_read((&elr->lr_super->s_umount)); 3225e22834f0SDmitry Monakhov } 3226b2c78cd0STheodore Ts'o /* error, remove the lazy_init job */ 3227e22834f0SDmitry Monakhov if (err) { 3228bfff6873SLukas Czerner ext4_remove_li_request(elr); 3229bfff6873SLukas Czerner continue; 3230bfff6873SLukas Czerner } 3231e22834f0SDmitry Monakhov if (!progress) { 3232e22834f0SDmitry Monakhov elr->lr_next_sched = jiffies + 3233e22834f0SDmitry Monakhov (prandom_u32() 3234e22834f0SDmitry Monakhov % (EXT4_DEF_LI_MAX_START_DELAY * HZ)); 3235b2c78cd0STheodore Ts'o } 3236bfff6873SLukas Czerner if (time_before(elr->lr_next_sched, next_wakeup)) 3237bfff6873SLukas Czerner next_wakeup = elr->lr_next_sched; 3238bfff6873SLukas Czerner } 3239bfff6873SLukas Czerner mutex_unlock(&eli->li_list_mtx); 3240bfff6873SLukas Czerner 3241a0acae0eSTejun Heo try_to_freeze(); 3242bfff6873SLukas Czerner 32434ed5c033SLukas Czerner cur = jiffies; 32444ed5c033SLukas Czerner if ((time_after_eq(cur, next_wakeup)) || 3245f4245bd4SLukas Czerner (MAX_JIFFY_OFFSET == next_wakeup)) { 3246bfff6873SLukas Czerner cond_resched(); 3247bfff6873SLukas Czerner continue; 3248bfff6873SLukas Czerner } 3249bfff6873SLukas Czerner 32504ed5c033SLukas Czerner schedule_timeout_interruptible(next_wakeup - cur); 32514ed5c033SLukas Czerner 32528f1f7453SEric Sandeen if (kthread_should_stop()) { 32538f1f7453SEric Sandeen ext4_clear_request_list(); 32548f1f7453SEric Sandeen goto exit_thread; 32558f1f7453SEric Sandeen } 3256bfff6873SLukas Czerner } 3257bfff6873SLukas Czerner 3258bfff6873SLukas Czerner exit_thread: 3259bfff6873SLukas Czerner /* 3260bfff6873SLukas Czerner * It looks like the request list is empty, but we need 3261bfff6873SLukas Czerner * to check it under the li_list_mtx lock, to prevent any 3262bfff6873SLukas Czerner * additions into it, and of course we should lock ext4_li_mtx 3263bfff6873SLukas Czerner * to atomically free the list and ext4_li_info, because at 3264bfff6873SLukas Czerner * this point another ext4 filesystem could be registering 3265bfff6873SLukas Czerner * new one. 3266bfff6873SLukas Czerner */ 3267bfff6873SLukas Czerner mutex_lock(&ext4_li_mtx); 3268bfff6873SLukas Czerner mutex_lock(&eli->li_list_mtx); 3269bfff6873SLukas Czerner if (!list_empty(&eli->li_request_list)) { 3270bfff6873SLukas Czerner mutex_unlock(&eli->li_list_mtx); 3271bfff6873SLukas Czerner mutex_unlock(&ext4_li_mtx); 3272bfff6873SLukas Czerner goto cont_thread; 3273bfff6873SLukas Czerner } 3274bfff6873SLukas Czerner mutex_unlock(&eli->li_list_mtx); 3275bfff6873SLukas Czerner kfree(ext4_li_info); 3276bfff6873SLukas Czerner ext4_li_info = NULL; 3277bfff6873SLukas Czerner mutex_unlock(&ext4_li_mtx); 3278bfff6873SLukas Czerner 3279bfff6873SLukas Czerner return 0; 3280bfff6873SLukas Czerner } 3281bfff6873SLukas Czerner 3282bfff6873SLukas Czerner static void ext4_clear_request_list(void) 3283bfff6873SLukas Czerner { 3284bfff6873SLukas Czerner struct list_head *pos, *n; 3285bfff6873SLukas Czerner struct ext4_li_request *elr; 3286bfff6873SLukas Czerner 3287bfff6873SLukas Czerner mutex_lock(&ext4_li_info->li_list_mtx); 3288bfff6873SLukas Czerner list_for_each_safe(pos, n, &ext4_li_info->li_request_list) { 3289bfff6873SLukas Czerner elr = list_entry(pos, struct ext4_li_request, 3290bfff6873SLukas Czerner lr_request); 3291bfff6873SLukas Czerner ext4_remove_li_request(elr); 3292bfff6873SLukas Czerner } 3293bfff6873SLukas Czerner mutex_unlock(&ext4_li_info->li_list_mtx); 3294bfff6873SLukas Czerner } 3295bfff6873SLukas Czerner 3296bfff6873SLukas Czerner static int ext4_run_lazyinit_thread(void) 3297bfff6873SLukas Czerner { 32988f1f7453SEric Sandeen ext4_lazyinit_task = kthread_run(ext4_lazyinit_thread, 32998f1f7453SEric Sandeen ext4_li_info, "ext4lazyinit"); 33008f1f7453SEric Sandeen if (IS_ERR(ext4_lazyinit_task)) { 33018f1f7453SEric Sandeen int err = PTR_ERR(ext4_lazyinit_task); 3302bfff6873SLukas Czerner ext4_clear_request_list(); 3303bfff6873SLukas Czerner kfree(ext4_li_info); 3304bfff6873SLukas Czerner ext4_li_info = NULL; 330592b97816STheodore Ts'o printk(KERN_CRIT "EXT4-fs: error %d creating inode table " 3306bfff6873SLukas Czerner "initialization thread\n", 3307bfff6873SLukas Czerner err); 3308bfff6873SLukas Czerner return err; 3309bfff6873SLukas Czerner } 3310bfff6873SLukas Czerner ext4_li_info->li_state |= EXT4_LAZYINIT_RUNNING; 3311bfff6873SLukas Czerner return 0; 3312bfff6873SLukas Czerner } 3313bfff6873SLukas Czerner 3314bfff6873SLukas Czerner /* 3315bfff6873SLukas Czerner * Check whether it make sense to run itable init. thread or not. 3316bfff6873SLukas Czerner * If there is at least one uninitialized inode table, return 3317bfff6873SLukas Czerner * corresponding group number, else the loop goes through all 3318bfff6873SLukas Czerner * groups and return total number of groups. 3319bfff6873SLukas Czerner */ 3320bfff6873SLukas Czerner static ext4_group_t ext4_has_uninit_itable(struct super_block *sb) 3321bfff6873SLukas Czerner { 3322bfff6873SLukas Czerner ext4_group_t group, ngroups = EXT4_SB(sb)->s_groups_count; 3323bfff6873SLukas Czerner struct ext4_group_desc *gdp = NULL; 3324bfff6873SLukas Czerner 33258844618dSTheodore Ts'o if (!ext4_has_group_desc_csum(sb)) 33268844618dSTheodore Ts'o return ngroups; 33278844618dSTheodore Ts'o 3328bfff6873SLukas Czerner for (group = 0; group < ngroups; group++) { 3329bfff6873SLukas Czerner gdp = ext4_get_group_desc(sb, group, NULL); 3330bfff6873SLukas Czerner if (!gdp) 3331bfff6873SLukas Czerner continue; 3332bfff6873SLukas Czerner 333350122847STheodore Ts'o if (!(gdp->bg_flags & cpu_to_le16(EXT4_BG_INODE_ZEROED))) 3334bfff6873SLukas Czerner break; 3335bfff6873SLukas Czerner } 3336bfff6873SLukas Czerner 3337bfff6873SLukas Czerner return group; 3338bfff6873SLukas Czerner } 3339bfff6873SLukas Czerner 3340bfff6873SLukas Czerner static int ext4_li_info_new(void) 3341bfff6873SLukas Czerner { 3342bfff6873SLukas Czerner struct ext4_lazy_init *eli = NULL; 3343bfff6873SLukas Czerner 3344bfff6873SLukas Czerner eli = kzalloc(sizeof(*eli), GFP_KERNEL); 3345bfff6873SLukas Czerner if (!eli) 3346bfff6873SLukas Czerner return -ENOMEM; 3347bfff6873SLukas Czerner 3348bfff6873SLukas Czerner INIT_LIST_HEAD(&eli->li_request_list); 3349bfff6873SLukas Czerner mutex_init(&eli->li_list_mtx); 3350bfff6873SLukas Czerner 3351bfff6873SLukas Czerner eli->li_state |= EXT4_LAZYINIT_QUIT; 3352bfff6873SLukas Czerner 3353bfff6873SLukas Czerner ext4_li_info = eli; 3354bfff6873SLukas Czerner 3355bfff6873SLukas Czerner return 0; 3356bfff6873SLukas Czerner } 3357bfff6873SLukas Czerner 3358bfff6873SLukas Czerner static struct ext4_li_request *ext4_li_request_new(struct super_block *sb, 3359bfff6873SLukas Czerner ext4_group_t start) 3360bfff6873SLukas Czerner { 3361bfff6873SLukas Czerner struct ext4_sb_info *sbi = EXT4_SB(sb); 3362bfff6873SLukas Czerner struct ext4_li_request *elr; 3363bfff6873SLukas Czerner 3364bfff6873SLukas Czerner elr = kzalloc(sizeof(*elr), GFP_KERNEL); 3365bfff6873SLukas Czerner if (!elr) 3366bfff6873SLukas Czerner return NULL; 3367bfff6873SLukas Czerner 3368bfff6873SLukas Czerner elr->lr_super = sb; 3369bfff6873SLukas Czerner elr->lr_sbi = sbi; 3370bfff6873SLukas Czerner elr->lr_next_group = start; 3371bfff6873SLukas Czerner 3372bfff6873SLukas Czerner /* 3373bfff6873SLukas Czerner * Randomize first schedule time of the request to 3374bfff6873SLukas Czerner * spread the inode table initialization requests 3375bfff6873SLukas Czerner * better. 3376bfff6873SLukas Czerner */ 3377dd1f723bSTheodore Ts'o elr->lr_next_sched = jiffies + (prandom_u32() % 3378dd1f723bSTheodore Ts'o (EXT4_DEF_LI_MAX_START_DELAY * HZ)); 3379bfff6873SLukas Czerner return elr; 3380bfff6873SLukas Czerner } 3381bfff6873SLukas Czerner 33827f511862STheodore Ts'o int ext4_register_li_request(struct super_block *sb, 3383bfff6873SLukas Czerner ext4_group_t first_not_zeroed) 3384bfff6873SLukas Czerner { 3385bfff6873SLukas Czerner struct ext4_sb_info *sbi = EXT4_SB(sb); 33867f511862STheodore Ts'o struct ext4_li_request *elr = NULL; 338749598e04SJun Piao ext4_group_t ngroups = sbi->s_groups_count; 33886c5a6cb9SAndrew Morton int ret = 0; 3389bfff6873SLukas Czerner 33907f511862STheodore Ts'o mutex_lock(&ext4_li_mtx); 339151ce6511SLukas Czerner if (sbi->s_li_request != NULL) { 339251ce6511SLukas Czerner /* 339351ce6511SLukas Czerner * Reset timeout so it can be computed again, because 339451ce6511SLukas Czerner * s_li_wait_mult might have changed. 339551ce6511SLukas Czerner */ 339651ce6511SLukas Czerner sbi->s_li_request->lr_timeout = 0; 33977f511862STheodore Ts'o goto out; 339851ce6511SLukas Czerner } 3399bfff6873SLukas Czerner 3400bc98a42cSDavid Howells if (first_not_zeroed == ngroups || sb_rdonly(sb) || 340155ff3840STao Ma !test_opt(sb, INIT_INODE_TABLE)) 34027f511862STheodore Ts'o goto out; 3403bfff6873SLukas Czerner 3404bfff6873SLukas Czerner elr = ext4_li_request_new(sb, first_not_zeroed); 34057f511862STheodore Ts'o if (!elr) { 34067f511862STheodore Ts'o ret = -ENOMEM; 34077f511862STheodore Ts'o goto out; 34087f511862STheodore Ts'o } 3409bfff6873SLukas Czerner 3410bfff6873SLukas Czerner if (NULL == ext4_li_info) { 3411bfff6873SLukas Czerner ret = ext4_li_info_new(); 3412bfff6873SLukas Czerner if (ret) 3413bfff6873SLukas Czerner goto out; 3414bfff6873SLukas Czerner } 3415bfff6873SLukas Czerner 3416bfff6873SLukas Czerner mutex_lock(&ext4_li_info->li_list_mtx); 3417bfff6873SLukas Czerner list_add(&elr->lr_request, &ext4_li_info->li_request_list); 3418bfff6873SLukas Czerner mutex_unlock(&ext4_li_info->li_list_mtx); 3419bfff6873SLukas Czerner 3420bfff6873SLukas Czerner sbi->s_li_request = elr; 342146e4690bSTao Ma /* 342246e4690bSTao Ma * set elr to NULL here since it has been inserted to 342346e4690bSTao Ma * the request_list and the removal and free of it is 342446e4690bSTao Ma * handled by ext4_clear_request_list from now on. 342546e4690bSTao Ma */ 342646e4690bSTao Ma elr = NULL; 3427bfff6873SLukas Czerner 3428bfff6873SLukas Czerner if (!(ext4_li_info->li_state & EXT4_LAZYINIT_RUNNING)) { 3429bfff6873SLukas Czerner ret = ext4_run_lazyinit_thread(); 3430bfff6873SLukas Czerner if (ret) 3431bfff6873SLukas Czerner goto out; 3432bfff6873SLukas Czerner } 3433bfff6873SLukas Czerner out: 3434bfff6873SLukas Czerner mutex_unlock(&ext4_li_mtx); 3435beed5ecbSNicolas Kaiser if (ret) 3436bfff6873SLukas Czerner kfree(elr); 3437bfff6873SLukas Czerner return ret; 3438bfff6873SLukas Czerner } 3439bfff6873SLukas Czerner 3440bfff6873SLukas Czerner /* 3441bfff6873SLukas Czerner * We do not need to lock anything since this is called on 3442bfff6873SLukas Czerner * module unload. 3443bfff6873SLukas Czerner */ 3444bfff6873SLukas Czerner static void ext4_destroy_lazyinit_thread(void) 3445bfff6873SLukas Czerner { 3446bfff6873SLukas Czerner /* 3447bfff6873SLukas Czerner * If thread exited earlier 3448bfff6873SLukas Czerner * there's nothing to be done. 3449bfff6873SLukas Czerner */ 34508f1f7453SEric Sandeen if (!ext4_li_info || !ext4_lazyinit_task) 3451bfff6873SLukas Czerner return; 3452bfff6873SLukas Czerner 34538f1f7453SEric Sandeen kthread_stop(ext4_lazyinit_task); 3454bfff6873SLukas Czerner } 3455bfff6873SLukas Czerner 345625ed6e8aSDarrick J. Wong static int set_journal_csum_feature_set(struct super_block *sb) 345725ed6e8aSDarrick J. Wong { 345825ed6e8aSDarrick J. Wong int ret = 1; 345925ed6e8aSDarrick J. Wong int compat, incompat; 346025ed6e8aSDarrick J. Wong struct ext4_sb_info *sbi = EXT4_SB(sb); 346125ed6e8aSDarrick J. Wong 34629aa5d32bSDmitry Monakhov if (ext4_has_metadata_csum(sb)) { 3463db9ee220SDarrick J. Wong /* journal checksum v3 */ 346425ed6e8aSDarrick J. Wong compat = 0; 3465db9ee220SDarrick J. Wong incompat = JBD2_FEATURE_INCOMPAT_CSUM_V3; 346625ed6e8aSDarrick J. Wong } else { 346725ed6e8aSDarrick J. Wong /* journal checksum v1 */ 346825ed6e8aSDarrick J. Wong compat = JBD2_FEATURE_COMPAT_CHECKSUM; 346925ed6e8aSDarrick J. Wong incompat = 0; 347025ed6e8aSDarrick J. Wong } 347125ed6e8aSDarrick J. Wong 3472feb8c6d3SDarrick J. Wong jbd2_journal_clear_features(sbi->s_journal, 3473feb8c6d3SDarrick J. Wong JBD2_FEATURE_COMPAT_CHECKSUM, 0, 3474feb8c6d3SDarrick J. Wong JBD2_FEATURE_INCOMPAT_CSUM_V3 | 3475feb8c6d3SDarrick J. Wong JBD2_FEATURE_INCOMPAT_CSUM_V2); 347625ed6e8aSDarrick J. Wong if (test_opt(sb, JOURNAL_ASYNC_COMMIT)) { 347725ed6e8aSDarrick J. Wong ret = jbd2_journal_set_features(sbi->s_journal, 347825ed6e8aSDarrick J. Wong compat, 0, 347925ed6e8aSDarrick J. Wong JBD2_FEATURE_INCOMPAT_ASYNC_COMMIT | 348025ed6e8aSDarrick J. Wong incompat); 348125ed6e8aSDarrick J. Wong } else if (test_opt(sb, JOURNAL_CHECKSUM)) { 348225ed6e8aSDarrick J. Wong ret = jbd2_journal_set_features(sbi->s_journal, 348325ed6e8aSDarrick J. Wong compat, 0, 348425ed6e8aSDarrick J. Wong incompat); 348525ed6e8aSDarrick J. Wong jbd2_journal_clear_features(sbi->s_journal, 0, 0, 348625ed6e8aSDarrick J. Wong JBD2_FEATURE_INCOMPAT_ASYNC_COMMIT); 348725ed6e8aSDarrick J. Wong } else { 3488feb8c6d3SDarrick J. Wong jbd2_journal_clear_features(sbi->s_journal, 0, 0, 3489feb8c6d3SDarrick J. Wong JBD2_FEATURE_INCOMPAT_ASYNC_COMMIT); 349025ed6e8aSDarrick J. Wong } 349125ed6e8aSDarrick J. Wong 349225ed6e8aSDarrick J. Wong return ret; 349325ed6e8aSDarrick J. Wong } 349425ed6e8aSDarrick J. Wong 3495952fc18eSTheodore Ts'o /* 3496952fc18eSTheodore Ts'o * Note: calculating the overhead so we can be compatible with 3497952fc18eSTheodore Ts'o * historical BSD practice is quite difficult in the face of 3498952fc18eSTheodore Ts'o * clusters/bigalloc. This is because multiple metadata blocks from 3499952fc18eSTheodore Ts'o * different block group can end up in the same allocation cluster. 3500952fc18eSTheodore Ts'o * Calculating the exact overhead in the face of clustered allocation 3501952fc18eSTheodore Ts'o * requires either O(all block bitmaps) in memory or O(number of block 3502952fc18eSTheodore Ts'o * groups**2) in time. We will still calculate the superblock for 3503952fc18eSTheodore Ts'o * older file systems --- and if we come across with a bigalloc file 3504952fc18eSTheodore Ts'o * system with zero in s_overhead_clusters the estimate will be close to 3505952fc18eSTheodore Ts'o * correct especially for very large cluster sizes --- but for newer 3506952fc18eSTheodore Ts'o * file systems, it's better to calculate this figure once at mkfs 3507952fc18eSTheodore Ts'o * time, and store it in the superblock. If the superblock value is 3508952fc18eSTheodore Ts'o * present (even for non-bigalloc file systems), we will use it. 3509952fc18eSTheodore Ts'o */ 3510952fc18eSTheodore Ts'o static int count_overhead(struct super_block *sb, ext4_group_t grp, 3511952fc18eSTheodore Ts'o char *buf) 3512952fc18eSTheodore Ts'o { 3513952fc18eSTheodore Ts'o struct ext4_sb_info *sbi = EXT4_SB(sb); 3514952fc18eSTheodore Ts'o struct ext4_group_desc *gdp; 3515952fc18eSTheodore Ts'o ext4_fsblk_t first_block, last_block, b; 3516952fc18eSTheodore Ts'o ext4_group_t i, ngroups = ext4_get_groups_count(sb); 3517952fc18eSTheodore Ts'o int s, j, count = 0; 3518952fc18eSTheodore Ts'o 3519e2b911c5SDarrick J. Wong if (!ext4_has_feature_bigalloc(sb)) 35200548bbb8STheodore Ts'o return (ext4_bg_has_super(sb, grp) + ext4_bg_num_gdb(sb, grp) + 35210548bbb8STheodore Ts'o sbi->s_itb_per_group + 2); 35220548bbb8STheodore Ts'o 3523952fc18eSTheodore Ts'o first_block = le32_to_cpu(sbi->s_es->s_first_data_block) + 3524952fc18eSTheodore Ts'o (grp * EXT4_BLOCKS_PER_GROUP(sb)); 3525952fc18eSTheodore Ts'o last_block = first_block + EXT4_BLOCKS_PER_GROUP(sb) - 1; 3526952fc18eSTheodore Ts'o for (i = 0; i < ngroups; i++) { 3527952fc18eSTheodore Ts'o gdp = ext4_get_group_desc(sb, i, NULL); 3528952fc18eSTheodore Ts'o b = ext4_block_bitmap(sb, gdp); 3529952fc18eSTheodore Ts'o if (b >= first_block && b <= last_block) { 3530952fc18eSTheodore Ts'o ext4_set_bit(EXT4_B2C(sbi, b - first_block), buf); 3531952fc18eSTheodore Ts'o count++; 3532952fc18eSTheodore Ts'o } 3533952fc18eSTheodore Ts'o b = ext4_inode_bitmap(sb, gdp); 3534952fc18eSTheodore Ts'o if (b >= first_block && b <= last_block) { 3535952fc18eSTheodore Ts'o ext4_set_bit(EXT4_B2C(sbi, b - first_block), buf); 3536952fc18eSTheodore Ts'o count++; 3537952fc18eSTheodore Ts'o } 3538952fc18eSTheodore Ts'o b = ext4_inode_table(sb, gdp); 3539952fc18eSTheodore Ts'o if (b >= first_block && b + sbi->s_itb_per_group <= last_block) 3540952fc18eSTheodore Ts'o for (j = 0; j < sbi->s_itb_per_group; j++, b++) { 3541952fc18eSTheodore Ts'o int c = EXT4_B2C(sbi, b - first_block); 3542952fc18eSTheodore Ts'o ext4_set_bit(c, buf); 3543952fc18eSTheodore Ts'o count++; 3544952fc18eSTheodore Ts'o } 3545952fc18eSTheodore Ts'o if (i != grp) 3546952fc18eSTheodore Ts'o continue; 3547952fc18eSTheodore Ts'o s = 0; 3548952fc18eSTheodore Ts'o if (ext4_bg_has_super(sb, grp)) { 3549952fc18eSTheodore Ts'o ext4_set_bit(s++, buf); 3550952fc18eSTheodore Ts'o count++; 3551952fc18eSTheodore Ts'o } 3552c48ae41bSTheodore Ts'o j = ext4_bg_num_gdb(sb, grp); 3553c48ae41bSTheodore Ts'o if (s + j > EXT4_BLOCKS_PER_GROUP(sb)) { 3554c48ae41bSTheodore Ts'o ext4_error(sb, "Invalid number of block group " 3555c48ae41bSTheodore Ts'o "descriptor blocks: %d", j); 3556c48ae41bSTheodore Ts'o j = EXT4_BLOCKS_PER_GROUP(sb) - s; 3557952fc18eSTheodore Ts'o } 3558c48ae41bSTheodore Ts'o count += j; 3559c48ae41bSTheodore Ts'o for (; j > 0; j--) 3560c48ae41bSTheodore Ts'o ext4_set_bit(EXT4_B2C(sbi, s++), buf); 3561952fc18eSTheodore Ts'o } 3562952fc18eSTheodore Ts'o if (!count) 3563952fc18eSTheodore Ts'o return 0; 3564952fc18eSTheodore Ts'o return EXT4_CLUSTERS_PER_GROUP(sb) - 3565952fc18eSTheodore Ts'o ext4_count_free(buf, EXT4_CLUSTERS_PER_GROUP(sb) / 8); 3566952fc18eSTheodore Ts'o } 3567952fc18eSTheodore Ts'o 3568952fc18eSTheodore Ts'o /* 3569952fc18eSTheodore Ts'o * Compute the overhead and stash it in sbi->s_overhead 3570952fc18eSTheodore Ts'o */ 3571952fc18eSTheodore Ts'o int ext4_calculate_overhead(struct super_block *sb) 3572952fc18eSTheodore Ts'o { 3573952fc18eSTheodore Ts'o struct ext4_sb_info *sbi = EXT4_SB(sb); 3574952fc18eSTheodore Ts'o struct ext4_super_block *es = sbi->s_es; 35753c816dedSEric Whitney struct inode *j_inode; 35763c816dedSEric Whitney unsigned int j_blocks, j_inum = le32_to_cpu(es->s_journal_inum); 3577952fc18eSTheodore Ts'o ext4_group_t i, ngroups = ext4_get_groups_count(sb); 3578952fc18eSTheodore Ts'o ext4_fsblk_t overhead = 0; 35794fdb5543SDmitry Monakhov char *buf = (char *) get_zeroed_page(GFP_NOFS); 3580952fc18eSTheodore Ts'o 3581952fc18eSTheodore Ts'o if (!buf) 3582952fc18eSTheodore Ts'o return -ENOMEM; 3583952fc18eSTheodore Ts'o 3584952fc18eSTheodore Ts'o /* 3585952fc18eSTheodore Ts'o * Compute the overhead (FS structures). This is constant 3586952fc18eSTheodore Ts'o * for a given filesystem unless the number of block groups 3587952fc18eSTheodore Ts'o * changes so we cache the previous value until it does. 3588952fc18eSTheodore Ts'o */ 3589952fc18eSTheodore Ts'o 3590952fc18eSTheodore Ts'o /* 3591952fc18eSTheodore Ts'o * All of the blocks before first_data_block are overhead 3592952fc18eSTheodore Ts'o */ 3593952fc18eSTheodore Ts'o overhead = EXT4_B2C(sbi, le32_to_cpu(es->s_first_data_block)); 3594952fc18eSTheodore Ts'o 3595952fc18eSTheodore Ts'o /* 3596952fc18eSTheodore Ts'o * Add the overhead found in each block group 3597952fc18eSTheodore Ts'o */ 3598952fc18eSTheodore Ts'o for (i = 0; i < ngroups; i++) { 3599952fc18eSTheodore Ts'o int blks; 3600952fc18eSTheodore Ts'o 3601952fc18eSTheodore Ts'o blks = count_overhead(sb, i, buf); 3602952fc18eSTheodore Ts'o overhead += blks; 3603952fc18eSTheodore Ts'o if (blks) 3604952fc18eSTheodore Ts'o memset(buf, 0, PAGE_SIZE); 3605952fc18eSTheodore Ts'o cond_resched(); 3606952fc18eSTheodore Ts'o } 36073c816dedSEric Whitney 36083c816dedSEric Whitney /* 36093c816dedSEric Whitney * Add the internal journal blocks whether the journal has been 36103c816dedSEric Whitney * loaded or not 36113c816dedSEric Whitney */ 3612b003b524SEric Sandeen if (sbi->s_journal && !sbi->journal_bdev) 3613810da240SLukas Czerner overhead += EXT4_NUM_B2C(sbi, sbi->s_journal->j_maxlen); 36143c816dedSEric Whitney else if (ext4_has_feature_journal(sb) && !sbi->s_journal) { 36153c816dedSEric Whitney j_inode = ext4_get_journal_inode(sb, j_inum); 36163c816dedSEric Whitney if (j_inode) { 36173c816dedSEric Whitney j_blocks = j_inode->i_size >> sb->s_blocksize_bits; 36183c816dedSEric Whitney overhead += EXT4_NUM_B2C(sbi, j_blocks); 36193c816dedSEric Whitney iput(j_inode); 36203c816dedSEric Whitney } else { 36213c816dedSEric Whitney ext4_msg(sb, KERN_ERR, "can't get journal size"); 36223c816dedSEric Whitney } 36233c816dedSEric Whitney } 3624952fc18eSTheodore Ts'o sbi->s_overhead = overhead; 3625952fc18eSTheodore Ts'o smp_wmb(); 3626952fc18eSTheodore Ts'o free_page((unsigned long) buf); 3627952fc18eSTheodore Ts'o return 0; 3628952fc18eSTheodore Ts'o } 3629952fc18eSTheodore Ts'o 3630b5799018STheodore Ts'o static void ext4_set_resv_clusters(struct super_block *sb) 363127dd4385SLukas Czerner { 363227dd4385SLukas Czerner ext4_fsblk_t resv_clusters; 3633b5799018STheodore Ts'o struct ext4_sb_info *sbi = EXT4_SB(sb); 363427dd4385SLukas Czerner 363527dd4385SLukas Czerner /* 363630fac0f7SJan Kara * There's no need to reserve anything when we aren't using extents. 363730fac0f7SJan Kara * The space estimates are exact, there are no unwritten extents, 363830fac0f7SJan Kara * hole punching doesn't need new metadata... This is needed especially 363930fac0f7SJan Kara * to keep ext2/3 backward compatibility. 364030fac0f7SJan Kara */ 3641e2b911c5SDarrick J. Wong if (!ext4_has_feature_extents(sb)) 3642b5799018STheodore Ts'o return; 364330fac0f7SJan Kara /* 364427dd4385SLukas Czerner * By default we reserve 2% or 4096 clusters, whichever is smaller. 364527dd4385SLukas Czerner * This should cover the situations where we can not afford to run 364627dd4385SLukas Czerner * out of space like for example punch hole, or converting 3647556615dcSLukas Czerner * unwritten extents in delalloc path. In most cases such 364827dd4385SLukas Czerner * allocation would require 1, or 2 blocks, higher numbers are 364927dd4385SLukas Czerner * very rare. 365027dd4385SLukas Czerner */ 3651b5799018STheodore Ts'o resv_clusters = (ext4_blocks_count(sbi->s_es) >> 3652b5799018STheodore Ts'o sbi->s_cluster_bits); 365327dd4385SLukas Czerner 365427dd4385SLukas Czerner do_div(resv_clusters, 50); 365527dd4385SLukas Czerner resv_clusters = min_t(ext4_fsblk_t, resv_clusters, 4096); 365627dd4385SLukas Czerner 3657b5799018STheodore Ts'o atomic64_set(&sbi->s_resv_clusters, resv_clusters); 365827dd4385SLukas Czerner } 365927dd4385SLukas Czerner 3660617ba13bSMingming Cao static int ext4_fill_super(struct super_block *sb, void *data, int silent) 3661ac27a0ecSDave Kleikamp { 36625e405595SDan Williams struct dax_device *dax_dev = fs_dax_get_by_bdev(sb->s_bdev); 3663d4c402d9SCurt Wohlgemuth char *orig_data = kstrdup(data, GFP_KERNEL); 3664ac27a0ecSDave Kleikamp struct buffer_head *bh; 3665617ba13bSMingming Cao struct ext4_super_block *es = NULL; 36665aee0f8aSTheodore Ts'o struct ext4_sb_info *sbi = kzalloc(sizeof(*sbi), GFP_KERNEL); 3667617ba13bSMingming Cao ext4_fsblk_t block; 3668617ba13bSMingming Cao ext4_fsblk_t sb_block = get_sb_block(&data); 366970bbb3e0SAndrew Morton ext4_fsblk_t logical_sb_block; 3670ac27a0ecSDave Kleikamp unsigned long offset = 0; 3671ac27a0ecSDave Kleikamp unsigned long journal_devnum = 0; 3672ac27a0ecSDave Kleikamp unsigned long def_mount_opts; 3673ac27a0ecSDave Kleikamp struct inode *root; 36740390131bSFrank Mayhar const char *descr; 3675dcc7dae3SCyrill Gorcunov int ret = -ENOMEM; 3676281b5995STheodore Ts'o int blocksize, clustersize; 36774ec11028STheodore Ts'o unsigned int db_count; 36784ec11028STheodore Ts'o unsigned int i; 3679281b5995STheodore Ts'o int needs_recovery, has_huge_files, has_bigalloc; 3680bd81d8eeSLaurent Vivier __u64 blocks_count; 368107aa2ea1SLukas Czerner int err = 0; 3682b3881f74STheodore Ts'o unsigned int journal_ioprio = DEFAULT_JOURNAL_IOPRIO; 3683bfff6873SLukas Czerner ext4_group_t first_not_zeroed; 3684ac27a0ecSDave Kleikamp 36855aee0f8aSTheodore Ts'o if ((data && !orig_data) || !sbi) 36865aee0f8aSTheodore Ts'o goto out_free_base; 3687705895b6SPekka Enberg 3688aed9eb1bSColin Ian King sbi->s_daxdev = dax_dev; 3689705895b6SPekka Enberg sbi->s_blockgroup_lock = 3690705895b6SPekka Enberg kzalloc(sizeof(struct blockgroup_lock), GFP_KERNEL); 36915aee0f8aSTheodore Ts'o if (!sbi->s_blockgroup_lock) 36925aee0f8aSTheodore Ts'o goto out_free_base; 36935aee0f8aSTheodore Ts'o 3694ac27a0ecSDave Kleikamp sb->s_fs_info = sbi; 36952c0544b2STheodore Ts'o sbi->s_sb = sb; 3696240799cdSTheodore Ts'o sbi->s_inode_readahead_blks = EXT4_DEF_INODE_READAHEAD_BLKS; 3697d9c9bef1SMiklos Szeredi sbi->s_sb_block = sb_block; 3698f613dfcbSTheodore Ts'o if (sb->s_bdev->bd_part) 3699f613dfcbSTheodore Ts'o sbi->s_sectors_written_start = 3700dbae2c55SMichael Callahan part_stat_read(sb->s_bdev->bd_part, sectors[STAT_WRITE]); 3701ac27a0ecSDave Kleikamp 37029f6200bbSTheodore Ts'o /* Cleanup superblock name */ 3703ec3904dcSRasmus Villemoes strreplace(sb->s_id, '/', '!'); 37049f6200bbSTheodore Ts'o 370507aa2ea1SLukas Czerner /* -EINVAL is default */ 3706dcc7dae3SCyrill Gorcunov ret = -EINVAL; 3707617ba13bSMingming Cao blocksize = sb_min_blocksize(sb, EXT4_MIN_BLOCK_SIZE); 3708ac27a0ecSDave Kleikamp if (!blocksize) { 3709b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "unable to set blocksize"); 3710ac27a0ecSDave Kleikamp goto out_fail; 3711ac27a0ecSDave Kleikamp } 3712ac27a0ecSDave Kleikamp 3713ac27a0ecSDave Kleikamp /* 3714617ba13bSMingming Cao * The ext4 superblock will not be buffer aligned for other than 1kB 3715ac27a0ecSDave Kleikamp * block sizes. We need to calculate the offset from buffer start. 3716ac27a0ecSDave Kleikamp */ 3717617ba13bSMingming Cao if (blocksize != EXT4_MIN_BLOCK_SIZE) { 371870bbb3e0SAndrew Morton logical_sb_block = sb_block * EXT4_MIN_BLOCK_SIZE; 371970bbb3e0SAndrew Morton offset = do_div(logical_sb_block, blocksize); 3720ac27a0ecSDave Kleikamp } else { 372170bbb3e0SAndrew Morton logical_sb_block = sb_block; 3722ac27a0ecSDave Kleikamp } 3723ac27a0ecSDave Kleikamp 3724a8ac900bSGioh Kim if (!(bh = sb_bread_unmovable(sb, logical_sb_block))) { 3725b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "unable to read superblock"); 3726ac27a0ecSDave Kleikamp goto out_fail; 3727ac27a0ecSDave Kleikamp } 3728ac27a0ecSDave Kleikamp /* 3729ac27a0ecSDave Kleikamp * Note: s_es must be initialized as soon as possible because 3730617ba13bSMingming Cao * some ext4 macro-instructions depend on its value 3731ac27a0ecSDave Kleikamp */ 37322716b802STheodore Ts'o es = (struct ext4_super_block *) (bh->b_data + offset); 3733ac27a0ecSDave Kleikamp sbi->s_es = es; 3734ac27a0ecSDave Kleikamp sb->s_magic = le16_to_cpu(es->s_magic); 3735617ba13bSMingming Cao if (sb->s_magic != EXT4_SUPER_MAGIC) 3736617ba13bSMingming Cao goto cantfind_ext4; 3737afc32f7eSTheodore Ts'o sbi->s_kbytes_written = le64_to_cpu(es->s_kbytes_written); 3738ac27a0ecSDave Kleikamp 3739feb0ab32SDarrick J. Wong /* Warn if metadata_csum and gdt_csum are both set. */ 3740e2b911c5SDarrick J. Wong if (ext4_has_feature_metadata_csum(sb) && 3741e2b911c5SDarrick J. Wong ext4_has_feature_gdt_csum(sb)) 3742363307e6SJakub Wilk ext4_warning(sb, "metadata_csum and uninit_bg are " 3743feb0ab32SDarrick J. Wong "redundant flags; please run fsck."); 3744feb0ab32SDarrick J. Wong 3745d25425f8SDarrick J. Wong /* Check for a known checksum algorithm */ 3746d25425f8SDarrick J. Wong if (!ext4_verify_csum_type(sb, es)) { 3747d25425f8SDarrick J. Wong ext4_msg(sb, KERN_ERR, "VFS: Found ext4 filesystem with " 3748d25425f8SDarrick J. Wong "unknown checksum algorithm."); 3749d25425f8SDarrick J. Wong silent = 1; 3750d25425f8SDarrick J. Wong goto cantfind_ext4; 3751d25425f8SDarrick J. Wong } 3752d25425f8SDarrick J. Wong 37530441984aSDarrick J. Wong /* Load the checksum driver */ 37540441984aSDarrick J. Wong sbi->s_chksum_driver = crypto_alloc_shash("crc32c", 0, 0); 37550441984aSDarrick J. Wong if (IS_ERR(sbi->s_chksum_driver)) { 37560441984aSDarrick J. Wong ext4_msg(sb, KERN_ERR, "Cannot load crc32c driver."); 37570441984aSDarrick J. Wong ret = PTR_ERR(sbi->s_chksum_driver); 37580441984aSDarrick J. Wong sbi->s_chksum_driver = NULL; 37590441984aSDarrick J. Wong goto failed_mount; 37600441984aSDarrick J. Wong } 37610441984aSDarrick J. Wong 3762a9c47317SDarrick J. Wong /* Check superblock checksum */ 3763a9c47317SDarrick J. Wong if (!ext4_superblock_csum_verify(sb, es)) { 3764a9c47317SDarrick J. Wong ext4_msg(sb, KERN_ERR, "VFS: Found ext4 filesystem with " 3765a9c47317SDarrick J. Wong "invalid superblock checksum. Run e2fsck?"); 3766a9c47317SDarrick J. Wong silent = 1; 37676a797d27SDarrick J. Wong ret = -EFSBADCRC; 3768a9c47317SDarrick J. Wong goto cantfind_ext4; 3769a9c47317SDarrick J. Wong } 3770a9c47317SDarrick J. Wong 3771a9c47317SDarrick J. Wong /* Precompute checksum seed for all metadata */ 3772e2b911c5SDarrick J. Wong if (ext4_has_feature_csum_seed(sb)) 37738c81bd8fSDarrick J. Wong sbi->s_csum_seed = le32_to_cpu(es->s_checksum_seed); 3774dec214d0STahsin Erdogan else if (ext4_has_metadata_csum(sb) || ext4_has_feature_ea_inode(sb)) 3775a9c47317SDarrick J. Wong sbi->s_csum_seed = ext4_chksum(sbi, ~0, es->s_uuid, 3776a9c47317SDarrick J. Wong sizeof(es->s_uuid)); 3777a9c47317SDarrick J. Wong 3778ac27a0ecSDave Kleikamp /* Set defaults before we parse the mount options */ 3779ac27a0ecSDave Kleikamp def_mount_opts = le32_to_cpu(es->s_default_mount_opts); 3780fd8c37ecSTheodore Ts'o set_opt(sb, INIT_INODE_TABLE); 3781617ba13bSMingming Cao if (def_mount_opts & EXT4_DEFM_DEBUG) 3782fd8c37ecSTheodore Ts'o set_opt(sb, DEBUG); 378387f26807STheodore Ts'o if (def_mount_opts & EXT4_DEFM_BSDGROUPS) 3784fd8c37ecSTheodore Ts'o set_opt(sb, GRPID); 3785617ba13bSMingming Cao if (def_mount_opts & EXT4_DEFM_UID16) 3786fd8c37ecSTheodore Ts'o set_opt(sb, NO_UID32); 3787ea663336SEric Sandeen /* xattr user namespace & acls are now defaulted on */ 3788fd8c37ecSTheodore Ts'o set_opt(sb, XATTR_USER); 378903010a33STheodore Ts'o #ifdef CONFIG_EXT4_FS_POSIX_ACL 3790fd8c37ecSTheodore Ts'o set_opt(sb, POSIX_ACL); 37912e7842b8SHugh Dickins #endif 379298c1a759SDarrick J. Wong /* don't forget to enable journal_csum when metadata_csum is enabled. */ 379398c1a759SDarrick J. Wong if (ext4_has_metadata_csum(sb)) 379498c1a759SDarrick J. Wong set_opt(sb, JOURNAL_CHECKSUM); 379598c1a759SDarrick J. Wong 3796617ba13bSMingming Cao if ((def_mount_opts & EXT4_DEFM_JMODE) == EXT4_DEFM_JMODE_DATA) 3797fd8c37ecSTheodore Ts'o set_opt(sb, JOURNAL_DATA); 3798617ba13bSMingming Cao else if ((def_mount_opts & EXT4_DEFM_JMODE) == EXT4_DEFM_JMODE_ORDERED) 3799fd8c37ecSTheodore Ts'o set_opt(sb, ORDERED_DATA); 3800617ba13bSMingming Cao else if ((def_mount_opts & EXT4_DEFM_JMODE) == EXT4_DEFM_JMODE_WBACK) 3801fd8c37ecSTheodore Ts'o set_opt(sb, WRITEBACK_DATA); 3802ac27a0ecSDave Kleikamp 3803617ba13bSMingming Cao if (le16_to_cpu(sbi->s_es->s_errors) == EXT4_ERRORS_PANIC) 3804fd8c37ecSTheodore Ts'o set_opt(sb, ERRORS_PANIC); 3805bb4f397aSAneesh Kumar K.V else if (le16_to_cpu(sbi->s_es->s_errors) == EXT4_ERRORS_CONTINUE) 3806fd8c37ecSTheodore Ts'o set_opt(sb, ERRORS_CONT); 3807bb4f397aSAneesh Kumar K.V else 3808fd8c37ecSTheodore Ts'o set_opt(sb, ERRORS_RO); 380945f1a9c3SDarrick J. Wong /* block_validity enabled by default; disable with noblock_validity */ 3810fd8c37ecSTheodore Ts'o set_opt(sb, BLOCK_VALIDITY); 38118b67f04aSTheodore Ts'o if (def_mount_opts & EXT4_DEFM_DISCARD) 3812fd8c37ecSTheodore Ts'o set_opt(sb, DISCARD); 3813ac27a0ecSDave Kleikamp 381408cefc7aSEric W. Biederman sbi->s_resuid = make_kuid(&init_user_ns, le16_to_cpu(es->s_def_resuid)); 381508cefc7aSEric W. Biederman sbi->s_resgid = make_kgid(&init_user_ns, le16_to_cpu(es->s_def_resgid)); 381630773840STheodore Ts'o sbi->s_commit_interval = JBD2_DEFAULT_MAX_COMMIT_AGE * HZ; 381730773840STheodore Ts'o sbi->s_min_batch_time = EXT4_DEF_MIN_BATCH_TIME; 381830773840STheodore Ts'o sbi->s_max_batch_time = EXT4_DEF_MAX_BATCH_TIME; 3819ac27a0ecSDave Kleikamp 38208b67f04aSTheodore Ts'o if ((def_mount_opts & EXT4_DEFM_NOBARRIER) == 0) 3821fd8c37ecSTheodore Ts'o set_opt(sb, BARRIER); 3822ac27a0ecSDave Kleikamp 38231e2462f9SMingming Cao /* 3824dd919b98SAneesh Kumar K.V * enable delayed allocation by default 3825dd919b98SAneesh Kumar K.V * Use -o nodelalloc to turn it off 3826dd919b98SAneesh Kumar K.V */ 3827bc0b75f7STheodore Ts'o if (!IS_EXT3_SB(sb) && !IS_EXT2_SB(sb) && 38288b67f04aSTheodore Ts'o ((def_mount_opts & EXT4_DEFM_NODELALLOC) == 0)) 3829fd8c37ecSTheodore Ts'o set_opt(sb, DELALLOC); 3830dd919b98SAneesh Kumar K.V 383151ce6511SLukas Czerner /* 383251ce6511SLukas Czerner * set default s_li_wait_mult for lazyinit, for the case there is 383351ce6511SLukas Czerner * no mount option specified. 383451ce6511SLukas Czerner */ 383551ce6511SLukas Czerner sbi->s_li_wait_mult = EXT4_DEF_LI_WAIT_MULT; 383651ce6511SLukas Czerner 38379803387cSTheodore Ts'o if (le32_to_cpu(es->s_rev_level) == EXT4_GOOD_OLD_REV) { 38389803387cSTheodore Ts'o sbi->s_inode_size = EXT4_GOOD_OLD_INODE_SIZE; 38399803387cSTheodore Ts'o sbi->s_first_ino = EXT4_GOOD_OLD_FIRST_INO; 38409803387cSTheodore Ts'o } else { 38419803387cSTheodore Ts'o sbi->s_inode_size = le16_to_cpu(es->s_inode_size); 38429803387cSTheodore Ts'o sbi->s_first_ino = le32_to_cpu(es->s_first_ino); 38439803387cSTheodore Ts'o if (sbi->s_first_ino < EXT4_GOOD_OLD_FIRST_INO) { 38449803387cSTheodore Ts'o ext4_msg(sb, KERN_ERR, "invalid first ino: %u", 38459803387cSTheodore Ts'o sbi->s_first_ino); 38469803387cSTheodore Ts'o goto failed_mount; 38479803387cSTheodore Ts'o } 38489803387cSTheodore Ts'o if ((sbi->s_inode_size < EXT4_GOOD_OLD_INODE_SIZE) || 38499803387cSTheodore Ts'o (!is_power_of_2(sbi->s_inode_size)) || 38509803387cSTheodore Ts'o (sbi->s_inode_size > blocksize)) { 38519803387cSTheodore Ts'o ext4_msg(sb, KERN_ERR, 38529803387cSTheodore Ts'o "unsupported inode size: %d", 38539803387cSTheodore Ts'o sbi->s_inode_size); 38549803387cSTheodore Ts'o goto failed_mount; 38559803387cSTheodore Ts'o } 38569803387cSTheodore Ts'o /* 38579803387cSTheodore Ts'o * i_atime_extra is the last extra field available for 38589803387cSTheodore Ts'o * [acm]times in struct ext4_inode. Checking for that 38599803387cSTheodore Ts'o * field should suffice to ensure we have extra space 38609803387cSTheodore Ts'o * for all three. 38619803387cSTheodore Ts'o */ 38629803387cSTheodore Ts'o if (sbi->s_inode_size >= offsetof(struct ext4_inode, i_atime_extra) + 38639803387cSTheodore Ts'o sizeof(((struct ext4_inode *)0)->i_atime_extra)) { 38649803387cSTheodore Ts'o sb->s_time_gran = 1; 38659803387cSTheodore Ts'o sb->s_time_max = EXT4_EXTRA_TIMESTAMP_MAX; 38669803387cSTheodore Ts'o } else { 38679803387cSTheodore Ts'o sb->s_time_gran = NSEC_PER_SEC; 38689803387cSTheodore Ts'o sb->s_time_max = EXT4_NON_EXTRA_TIMESTAMP_MAX; 38699803387cSTheodore Ts'o } 38709803387cSTheodore Ts'o sb->s_time_min = EXT4_TIMESTAMP_MIN; 38719803387cSTheodore Ts'o } 38729803387cSTheodore Ts'o if (sbi->s_inode_size > EXT4_GOOD_OLD_INODE_SIZE) { 38739803387cSTheodore Ts'o sbi->s_want_extra_isize = sizeof(struct ext4_inode) - 38749803387cSTheodore Ts'o EXT4_GOOD_OLD_INODE_SIZE; 38759803387cSTheodore Ts'o if (ext4_has_feature_extra_isize(sb)) { 38769803387cSTheodore Ts'o unsigned v, max = (sbi->s_inode_size - 38779803387cSTheodore Ts'o EXT4_GOOD_OLD_INODE_SIZE); 38789803387cSTheodore Ts'o 38799803387cSTheodore Ts'o v = le16_to_cpu(es->s_want_extra_isize); 38809803387cSTheodore Ts'o if (v > max) { 38819803387cSTheodore Ts'o ext4_msg(sb, KERN_ERR, 38829803387cSTheodore Ts'o "bad s_want_extra_isize: %d", v); 38839803387cSTheodore Ts'o goto failed_mount; 38849803387cSTheodore Ts'o } 38859803387cSTheodore Ts'o if (sbi->s_want_extra_isize < v) 38869803387cSTheodore Ts'o sbi->s_want_extra_isize = v; 38879803387cSTheodore Ts'o 38889803387cSTheodore Ts'o v = le16_to_cpu(es->s_min_extra_isize); 38899803387cSTheodore Ts'o if (v > max) { 38909803387cSTheodore Ts'o ext4_msg(sb, KERN_ERR, 38919803387cSTheodore Ts'o "bad s_min_extra_isize: %d", v); 38929803387cSTheodore Ts'o goto failed_mount; 38939803387cSTheodore Ts'o } 38949803387cSTheodore Ts'o if (sbi->s_want_extra_isize < v) 38959803387cSTheodore Ts'o sbi->s_want_extra_isize = v; 38969803387cSTheodore Ts'o } 38979803387cSTheodore Ts'o } 38989803387cSTheodore Ts'o 38995aee0f8aSTheodore Ts'o if (sbi->s_es->s_mount_opts[0]) { 39005aee0f8aSTheodore Ts'o char *s_mount_opts = kstrndup(sbi->s_es->s_mount_opts, 39015aee0f8aSTheodore Ts'o sizeof(sbi->s_es->s_mount_opts), 39025aee0f8aSTheodore Ts'o GFP_KERNEL); 39035aee0f8aSTheodore Ts'o if (!s_mount_opts) 39045aee0f8aSTheodore Ts'o goto failed_mount; 39055aee0f8aSTheodore Ts'o if (!parse_options(s_mount_opts, sb, &journal_devnum, 39065aee0f8aSTheodore Ts'o &journal_ioprio, 0)) { 39078b67f04aSTheodore Ts'o ext4_msg(sb, KERN_WARNING, 39088b67f04aSTheodore Ts'o "failed to parse options in superblock: %s", 39095aee0f8aSTheodore Ts'o s_mount_opts); 39105aee0f8aSTheodore Ts'o } 39115aee0f8aSTheodore Ts'o kfree(s_mount_opts); 39128b67f04aSTheodore Ts'o } 39135a916be1STheodore Ts'o sbi->s_def_mount_opt = sbi->s_mount_opt; 3914b3881f74STheodore Ts'o if (!parse_options((char *) data, sb, &journal_devnum, 3915661aa520SEric Sandeen &journal_ioprio, 0)) 3916ac27a0ecSDave Kleikamp goto failed_mount; 3917ac27a0ecSDave Kleikamp 3918c83ad55eSGabriel Krisman Bertazi #ifdef CONFIG_UNICODE 3919c83ad55eSGabriel Krisman Bertazi if (ext4_has_feature_casefold(sb) && !sbi->s_encoding) { 3920c83ad55eSGabriel Krisman Bertazi const struct ext4_sb_encodings *encoding_info; 3921c83ad55eSGabriel Krisman Bertazi struct unicode_map *encoding; 3922c83ad55eSGabriel Krisman Bertazi __u16 encoding_flags; 3923c83ad55eSGabriel Krisman Bertazi 3924c83ad55eSGabriel Krisman Bertazi if (ext4_has_feature_encrypt(sb)) { 3925c83ad55eSGabriel Krisman Bertazi ext4_msg(sb, KERN_ERR, 3926c83ad55eSGabriel Krisman Bertazi "Can't mount with encoding and encryption"); 3927c83ad55eSGabriel Krisman Bertazi goto failed_mount; 3928c83ad55eSGabriel Krisman Bertazi } 3929c83ad55eSGabriel Krisman Bertazi 3930c83ad55eSGabriel Krisman Bertazi if (ext4_sb_read_encoding(es, &encoding_info, 3931c83ad55eSGabriel Krisman Bertazi &encoding_flags)) { 3932c83ad55eSGabriel Krisman Bertazi ext4_msg(sb, KERN_ERR, 3933c83ad55eSGabriel Krisman Bertazi "Encoding requested by superblock is unknown"); 3934c83ad55eSGabriel Krisman Bertazi goto failed_mount; 3935c83ad55eSGabriel Krisman Bertazi } 3936c83ad55eSGabriel Krisman Bertazi 3937c83ad55eSGabriel Krisman Bertazi encoding = utf8_load(encoding_info->version); 3938c83ad55eSGabriel Krisman Bertazi if (IS_ERR(encoding)) { 3939c83ad55eSGabriel Krisman Bertazi ext4_msg(sb, KERN_ERR, 3940c83ad55eSGabriel Krisman Bertazi "can't mount with superblock charset: %s-%s " 3941c83ad55eSGabriel Krisman Bertazi "not supported by the kernel. flags: 0x%x.", 3942c83ad55eSGabriel Krisman Bertazi encoding_info->name, encoding_info->version, 3943c83ad55eSGabriel Krisman Bertazi encoding_flags); 3944c83ad55eSGabriel Krisman Bertazi goto failed_mount; 3945c83ad55eSGabriel Krisman Bertazi } 3946c83ad55eSGabriel Krisman Bertazi ext4_msg(sb, KERN_INFO,"Using encoding defined by superblock: " 3947c83ad55eSGabriel Krisman Bertazi "%s-%s with flags 0x%hx", encoding_info->name, 3948c83ad55eSGabriel Krisman Bertazi encoding_info->version?:"\b", encoding_flags); 3949c83ad55eSGabriel Krisman Bertazi 3950c83ad55eSGabriel Krisman Bertazi sbi->s_encoding = encoding; 3951c83ad55eSGabriel Krisman Bertazi sbi->s_encoding_flags = encoding_flags; 3952c83ad55eSGabriel Krisman Bertazi } 3953c83ad55eSGabriel Krisman Bertazi #endif 3954c83ad55eSGabriel Krisman Bertazi 395556889787STheodore Ts'o if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_JOURNAL_DATA) { 395656889787STheodore Ts'o printk_once(KERN_WARNING "EXT4-fs: Warning: mounting " 395756889787STheodore Ts'o "with data=journal disables delayed " 395856889787STheodore Ts'o "allocation and O_DIRECT support!\n"); 395956889787STheodore Ts'o if (test_opt2(sb, EXPLICIT_DELALLOC)) { 396056889787STheodore Ts'o ext4_msg(sb, KERN_ERR, "can't mount with " 396156889787STheodore Ts'o "both data=journal and delalloc"); 396256889787STheodore Ts'o goto failed_mount; 396356889787STheodore Ts'o } 396456889787STheodore Ts'o if (test_opt(sb, DIOREAD_NOLOCK)) { 396556889787STheodore Ts'o ext4_msg(sb, KERN_ERR, "can't mount with " 39666ae6514bSPiotr Sarna "both data=journal and dioread_nolock"); 396756889787STheodore Ts'o goto failed_mount; 396856889787STheodore Ts'o } 3969923ae0ffSRoss Zwisler if (test_opt(sb, DAX)) { 3970923ae0ffSRoss Zwisler ext4_msg(sb, KERN_ERR, "can't mount with " 3971923ae0ffSRoss Zwisler "both data=journal and dax"); 3972923ae0ffSRoss Zwisler goto failed_mount; 3973923ae0ffSRoss Zwisler } 397473b92a2aSSergey Karamov if (ext4_has_feature_encrypt(sb)) { 397573b92a2aSSergey Karamov ext4_msg(sb, KERN_WARNING, 397673b92a2aSSergey Karamov "encrypted files will use data=ordered " 397773b92a2aSSergey Karamov "instead of data journaling mode"); 397873b92a2aSSergey Karamov } 397956889787STheodore Ts'o if (test_opt(sb, DELALLOC)) 398056889787STheodore Ts'o clear_opt(sb, DELALLOC); 3981001e4a87STejun Heo } else { 3982001e4a87STejun Heo sb->s_iflags |= SB_I_CGROUPWB; 398356889787STheodore Ts'o } 398456889787STheodore Ts'o 39851751e8a6SLinus Torvalds sb->s_flags = (sb->s_flags & ~SB_POSIXACL) | 39861751e8a6SLinus Torvalds (test_opt(sb, POSIX_ACL) ? SB_POSIXACL : 0); 3987ac27a0ecSDave Kleikamp 3988617ba13bSMingming Cao if (le32_to_cpu(es->s_rev_level) == EXT4_GOOD_OLD_REV && 3989e2b911c5SDarrick J. Wong (ext4_has_compat_features(sb) || 3990e2b911c5SDarrick J. Wong ext4_has_ro_compat_features(sb) || 3991e2b911c5SDarrick J. Wong ext4_has_incompat_features(sb))) 3992b31e1552SEric Sandeen ext4_msg(sb, KERN_WARNING, 3993b31e1552SEric Sandeen "feature flags set on rev 0 fs, " 3994b31e1552SEric Sandeen "running e2fsck is recommended"); 3995469108ffSTheodore Tso 3996ed3654ebSTheodore Ts'o if (es->s_creator_os == cpu_to_le32(EXT4_OS_HURD)) { 3997ed3654ebSTheodore Ts'o set_opt2(sb, HURD_COMPAT); 3998e2b911c5SDarrick J. Wong if (ext4_has_feature_64bit(sb)) { 3999ed3654ebSTheodore Ts'o ext4_msg(sb, KERN_ERR, 4000ed3654ebSTheodore Ts'o "The Hurd can't support 64-bit file systems"); 4001ed3654ebSTheodore Ts'o goto failed_mount; 4002ed3654ebSTheodore Ts'o } 4003dec214d0STahsin Erdogan 4004dec214d0STahsin Erdogan /* 4005dec214d0STahsin Erdogan * ea_inode feature uses l_i_version field which is not 4006dec214d0STahsin Erdogan * available in HURD_COMPAT mode. 4007dec214d0STahsin Erdogan */ 4008dec214d0STahsin Erdogan if (ext4_has_feature_ea_inode(sb)) { 4009dec214d0STahsin Erdogan ext4_msg(sb, KERN_ERR, 4010dec214d0STahsin Erdogan "ea_inode feature is not supported for Hurd"); 4011dec214d0STahsin Erdogan goto failed_mount; 4012dec214d0STahsin Erdogan } 4013ed3654ebSTheodore Ts'o } 4014ed3654ebSTheodore Ts'o 40152035e776STheodore Ts'o if (IS_EXT2_SB(sb)) { 40162035e776STheodore Ts'o if (ext2_feature_set_ok(sb)) 40172035e776STheodore Ts'o ext4_msg(sb, KERN_INFO, "mounting ext2 file system " 40182035e776STheodore Ts'o "using the ext4 subsystem"); 40192035e776STheodore Ts'o else { 40200d9366d6SEric Sandeen /* 40210d9366d6SEric Sandeen * If we're probing be silent, if this looks like 40220d9366d6SEric Sandeen * it's actually an ext[34] filesystem. 40230d9366d6SEric Sandeen */ 40240d9366d6SEric Sandeen if (silent && ext4_feature_set_ok(sb, sb_rdonly(sb))) 40250d9366d6SEric Sandeen goto failed_mount; 40262035e776STheodore Ts'o ext4_msg(sb, KERN_ERR, "couldn't mount as ext2 due " 40272035e776STheodore Ts'o "to feature incompatibilities"); 40282035e776STheodore Ts'o goto failed_mount; 40292035e776STheodore Ts'o } 40302035e776STheodore Ts'o } 40312035e776STheodore Ts'o 40322035e776STheodore Ts'o if (IS_EXT3_SB(sb)) { 40332035e776STheodore Ts'o if (ext3_feature_set_ok(sb)) 40342035e776STheodore Ts'o ext4_msg(sb, KERN_INFO, "mounting ext3 file system " 40352035e776STheodore Ts'o "using the ext4 subsystem"); 40362035e776STheodore Ts'o else { 40370d9366d6SEric Sandeen /* 40380d9366d6SEric Sandeen * If we're probing be silent, if this looks like 40390d9366d6SEric Sandeen * it's actually an ext4 filesystem. 40400d9366d6SEric Sandeen */ 40410d9366d6SEric Sandeen if (silent && ext4_feature_set_ok(sb, sb_rdonly(sb))) 40420d9366d6SEric Sandeen goto failed_mount; 40432035e776STheodore Ts'o ext4_msg(sb, KERN_ERR, "couldn't mount as ext3 due " 40442035e776STheodore Ts'o "to feature incompatibilities"); 40452035e776STheodore Ts'o goto failed_mount; 40462035e776STheodore Ts'o } 40472035e776STheodore Ts'o } 40482035e776STheodore Ts'o 4049469108ffSTheodore Tso /* 4050ac27a0ecSDave Kleikamp * Check feature flags regardless of the revision level, since we 4051ac27a0ecSDave Kleikamp * previously didn't change the revision level when setting the flags, 4052ac27a0ecSDave Kleikamp * so there is a chance incompat flags are set on a rev 0 filesystem. 4053ac27a0ecSDave Kleikamp */ 4054bc98a42cSDavid Howells if (!ext4_feature_set_ok(sb, (sb_rdonly(sb)))) 4055ac27a0ecSDave Kleikamp goto failed_mount; 4056a13fb1a4SEric Sandeen 4057261cb20cSJan Kara blocksize = BLOCK_SIZE << le32_to_cpu(es->s_log_block_size); 4058617ba13bSMingming Cao if (blocksize < EXT4_MIN_BLOCK_SIZE || 4059617ba13bSMingming Cao blocksize > EXT4_MAX_BLOCK_SIZE) { 4060b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, 40618cdf3372STheodore Ts'o "Unsupported filesystem blocksize %d (%d log_block_size)", 40628cdf3372STheodore Ts'o blocksize, le32_to_cpu(es->s_log_block_size)); 40638cdf3372STheodore Ts'o goto failed_mount; 40648cdf3372STheodore Ts'o } 40658cdf3372STheodore Ts'o if (le32_to_cpu(es->s_log_block_size) > 40668cdf3372STheodore Ts'o (EXT4_MAX_BLOCK_LOG_SIZE - EXT4_MIN_BLOCK_LOG_SIZE)) { 40678cdf3372STheodore Ts'o ext4_msg(sb, KERN_ERR, 40688cdf3372STheodore Ts'o "Invalid log block size: %u", 40698cdf3372STheodore Ts'o le32_to_cpu(es->s_log_block_size)); 4070ac27a0ecSDave Kleikamp goto failed_mount; 4071ac27a0ecSDave Kleikamp } 4072bfe0a5f4STheodore Ts'o if (le32_to_cpu(es->s_log_cluster_size) > 4073bfe0a5f4STheodore Ts'o (EXT4_MAX_CLUSTER_LOG_SIZE - EXT4_MIN_BLOCK_LOG_SIZE)) { 4074bfe0a5f4STheodore Ts'o ext4_msg(sb, KERN_ERR, 4075bfe0a5f4STheodore Ts'o "Invalid log cluster size: %u", 4076bfe0a5f4STheodore Ts'o le32_to_cpu(es->s_log_cluster_size)); 4077bfe0a5f4STheodore Ts'o goto failed_mount; 4078bfe0a5f4STheodore Ts'o } 4079ac27a0ecSDave Kleikamp 40805b9554dcSTheodore Ts'o if (le16_to_cpu(sbi->s_es->s_reserved_gdt_blocks) > (blocksize / 4)) { 40815b9554dcSTheodore Ts'o ext4_msg(sb, KERN_ERR, 40825b9554dcSTheodore Ts'o "Number of reserved GDT blocks insanely large: %d", 40835b9554dcSTheodore Ts'o le16_to_cpu(sbi->s_es->s_reserved_gdt_blocks)); 40845b9554dcSTheodore Ts'o goto failed_mount; 40855b9554dcSTheodore Ts'o } 40865b9554dcSTheodore Ts'o 4087923ae0ffSRoss Zwisler if (sbi->s_mount_opt & EXT4_MOUNT_DAX) { 4088559db4c6SRoss Zwisler if (ext4_has_feature_inline_data(sb)) { 4089559db4c6SRoss Zwisler ext4_msg(sb, KERN_ERR, "Cannot use DAX on a filesystem" 4090559db4c6SRoss Zwisler " that may contain inline data"); 4091361d24d4SEric Sandeen goto failed_mount; 4092559db4c6SRoss Zwisler } 409380660f20SDave Jiang if (!bdev_dax_supported(sb->s_bdev, blocksize)) { 409424f3478dSDan Williams ext4_msg(sb, KERN_ERR, 4095361d24d4SEric Sandeen "DAX unsupported by block device."); 4096361d24d4SEric Sandeen goto failed_mount; 409724f3478dSDan Williams } 4098923ae0ffSRoss Zwisler } 4099923ae0ffSRoss Zwisler 4100e2b911c5SDarrick J. Wong if (ext4_has_feature_encrypt(sb) && es->s_encryption_level) { 41016ddb2447STheodore Ts'o ext4_msg(sb, KERN_ERR, "Unsupported encryption level %d", 41026ddb2447STheodore Ts'o es->s_encryption_level); 41036ddb2447STheodore Ts'o goto failed_mount; 41046ddb2447STheodore Ts'o } 41056ddb2447STheodore Ts'o 4106ac27a0ecSDave Kleikamp if (sb->s_blocksize != blocksize) { 4107ce40733cSAneesh Kumar K.V /* Validate the filesystem blocksize */ 4108ce40733cSAneesh Kumar K.V if (!sb_set_blocksize(sb, blocksize)) { 4109b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "bad block size %d", 4110ce40733cSAneesh Kumar K.V blocksize); 4111ac27a0ecSDave Kleikamp goto failed_mount; 4112ac27a0ecSDave Kleikamp } 4113ac27a0ecSDave Kleikamp 4114ac27a0ecSDave Kleikamp brelse(bh); 411570bbb3e0SAndrew Morton logical_sb_block = sb_block * EXT4_MIN_BLOCK_SIZE; 411670bbb3e0SAndrew Morton offset = do_div(logical_sb_block, blocksize); 4117a8ac900bSGioh Kim bh = sb_bread_unmovable(sb, logical_sb_block); 4118ac27a0ecSDave Kleikamp if (!bh) { 4119b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, 4120b31e1552SEric Sandeen "Can't read superblock on 2nd try"); 4121ac27a0ecSDave Kleikamp goto failed_mount; 4122ac27a0ecSDave Kleikamp } 41232716b802STheodore Ts'o es = (struct ext4_super_block *)(bh->b_data + offset); 4124ac27a0ecSDave Kleikamp sbi->s_es = es; 4125617ba13bSMingming Cao if (es->s_magic != cpu_to_le16(EXT4_SUPER_MAGIC)) { 4126b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, 4127b31e1552SEric Sandeen "Magic mismatch, very weird!"); 4128ac27a0ecSDave Kleikamp goto failed_mount; 4129ac27a0ecSDave Kleikamp } 4130ac27a0ecSDave Kleikamp } 4131ac27a0ecSDave Kleikamp 4132e2b911c5SDarrick J. Wong has_huge_files = ext4_has_feature_huge_file(sb); 4133f287a1a5STheodore Ts'o sbi->s_bitmap_maxbytes = ext4_max_bitmap_size(sb->s_blocksize_bits, 4134f287a1a5STheodore Ts'o has_huge_files); 4135f287a1a5STheodore Ts'o sb->s_maxbytes = ext4_max_size(sb->s_blocksize_bits, has_huge_files); 4136ac27a0ecSDave Kleikamp 41370d1ee42fSAlexandre Ratchov sbi->s_desc_size = le16_to_cpu(es->s_desc_size); 4138e2b911c5SDarrick J. Wong if (ext4_has_feature_64bit(sb)) { 41398fadc143SAlexandre Ratchov if (sbi->s_desc_size < EXT4_MIN_DESC_SIZE_64BIT || 41400d1ee42fSAlexandre Ratchov sbi->s_desc_size > EXT4_MAX_DESC_SIZE || 4141d8ea6cf8Svignesh babu !is_power_of_2(sbi->s_desc_size)) { 4142b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, 4143b31e1552SEric Sandeen "unsupported descriptor size %lu", 41440d1ee42fSAlexandre Ratchov sbi->s_desc_size); 41450d1ee42fSAlexandre Ratchov goto failed_mount; 41460d1ee42fSAlexandre Ratchov } 41470d1ee42fSAlexandre Ratchov } else 41480d1ee42fSAlexandre Ratchov sbi->s_desc_size = EXT4_MIN_DESC_SIZE; 41490b8e58a1SAndreas Dilger 4150ac27a0ecSDave Kleikamp sbi->s_blocks_per_group = le32_to_cpu(es->s_blocks_per_group); 4151ac27a0ecSDave Kleikamp sbi->s_inodes_per_group = le32_to_cpu(es->s_inodes_per_group); 41520b8e58a1SAndreas Dilger 4153617ba13bSMingming Cao sbi->s_inodes_per_block = blocksize / EXT4_INODE_SIZE(sb); 4154ac27a0ecSDave Kleikamp if (sbi->s_inodes_per_block == 0) 4155617ba13bSMingming Cao goto cantfind_ext4; 4156cd6bb35bSTheodore Ts'o if (sbi->s_inodes_per_group < sbi->s_inodes_per_block || 4157cd6bb35bSTheodore Ts'o sbi->s_inodes_per_group > blocksize * 8) { 4158cd6bb35bSTheodore Ts'o ext4_msg(sb, KERN_ERR, "invalid inodes per group: %lu\n", 4159cd6bb35bSTheodore Ts'o sbi->s_blocks_per_group); 4160cd6bb35bSTheodore Ts'o goto failed_mount; 4161cd6bb35bSTheodore Ts'o } 4162ac27a0ecSDave Kleikamp sbi->s_itb_per_group = sbi->s_inodes_per_group / 4163ac27a0ecSDave Kleikamp sbi->s_inodes_per_block; 41640d1ee42fSAlexandre Ratchov sbi->s_desc_per_block = blocksize / EXT4_DESC_SIZE(sb); 4165ac27a0ecSDave Kleikamp sbi->s_sbh = bh; 4166ac27a0ecSDave Kleikamp sbi->s_mount_state = le16_to_cpu(es->s_state); 4167e57aa839SFengguang Wu sbi->s_addr_per_block_bits = ilog2(EXT4_ADDR_PER_BLOCK(sb)); 4168e57aa839SFengguang Wu sbi->s_desc_per_block_bits = ilog2(EXT4_DESC_PER_BLOCK(sb)); 41690b8e58a1SAndreas Dilger 4170ac27a0ecSDave Kleikamp for (i = 0; i < 4; i++) 4171ac27a0ecSDave Kleikamp sbi->s_hash_seed[i] = le32_to_cpu(es->s_hash_seed[i]); 4172ac27a0ecSDave Kleikamp sbi->s_def_hash_version = es->s_def_hash_version; 4173e2b911c5SDarrick J. Wong if (ext4_has_feature_dir_index(sb)) { 4174f99b2589STheodore Ts'o i = le32_to_cpu(es->s_flags); 4175f99b2589STheodore Ts'o if (i & EXT2_FLAGS_UNSIGNED_HASH) 4176f99b2589STheodore Ts'o sbi->s_hash_unsigned = 3; 4177f99b2589STheodore Ts'o else if ((i & EXT2_FLAGS_SIGNED_HASH) == 0) { 4178f99b2589STheodore Ts'o #ifdef __CHAR_UNSIGNED__ 4179bc98a42cSDavid Howells if (!sb_rdonly(sb)) 418023301410STheodore Ts'o es->s_flags |= 418123301410STheodore Ts'o cpu_to_le32(EXT2_FLAGS_UNSIGNED_HASH); 4182f99b2589STheodore Ts'o sbi->s_hash_unsigned = 3; 4183f99b2589STheodore Ts'o #else 4184bc98a42cSDavid Howells if (!sb_rdonly(sb)) 418523301410STheodore Ts'o es->s_flags |= 418623301410STheodore Ts'o cpu_to_le32(EXT2_FLAGS_SIGNED_HASH); 4187f99b2589STheodore Ts'o #endif 4188f99b2589STheodore Ts'o } 418923301410STheodore Ts'o } 4190ac27a0ecSDave Kleikamp 4191281b5995STheodore Ts'o /* Handle clustersize */ 4192281b5995STheodore Ts'o clustersize = BLOCK_SIZE << le32_to_cpu(es->s_log_cluster_size); 4193e2b911c5SDarrick J. Wong has_bigalloc = ext4_has_feature_bigalloc(sb); 4194281b5995STheodore Ts'o if (has_bigalloc) { 4195281b5995STheodore Ts'o if (clustersize < blocksize) { 4196281b5995STheodore Ts'o ext4_msg(sb, KERN_ERR, 4197281b5995STheodore Ts'o "cluster size (%d) smaller than " 4198281b5995STheodore Ts'o "block size (%d)", clustersize, blocksize); 4199281b5995STheodore Ts'o goto failed_mount; 4200281b5995STheodore Ts'o } 4201281b5995STheodore Ts'o sbi->s_cluster_bits = le32_to_cpu(es->s_log_cluster_size) - 4202281b5995STheodore Ts'o le32_to_cpu(es->s_log_block_size); 4203281b5995STheodore Ts'o sbi->s_clusters_per_group = 4204281b5995STheodore Ts'o le32_to_cpu(es->s_clusters_per_group); 4205281b5995STheodore Ts'o if (sbi->s_clusters_per_group > blocksize * 8) { 4206281b5995STheodore Ts'o ext4_msg(sb, KERN_ERR, 4207281b5995STheodore Ts'o "#clusters per group too big: %lu", 4208281b5995STheodore Ts'o sbi->s_clusters_per_group); 4209281b5995STheodore Ts'o goto failed_mount; 4210281b5995STheodore Ts'o } 4211281b5995STheodore Ts'o if (sbi->s_blocks_per_group != 4212281b5995STheodore Ts'o (sbi->s_clusters_per_group * (clustersize / blocksize))) { 4213281b5995STheodore Ts'o ext4_msg(sb, KERN_ERR, "blocks per group (%lu) and " 4214281b5995STheodore Ts'o "clusters per group (%lu) inconsistent", 4215281b5995STheodore Ts'o sbi->s_blocks_per_group, 4216281b5995STheodore Ts'o sbi->s_clusters_per_group); 4217281b5995STheodore Ts'o goto failed_mount; 4218281b5995STheodore Ts'o } 4219281b5995STheodore Ts'o } else { 4220281b5995STheodore Ts'o if (clustersize != blocksize) { 4221bfe0a5f4STheodore Ts'o ext4_msg(sb, KERN_ERR, 4222bfe0a5f4STheodore Ts'o "fragment/cluster size (%d) != " 4223bfe0a5f4STheodore Ts'o "block size (%d)", clustersize, blocksize); 4224bfe0a5f4STheodore Ts'o goto failed_mount; 4225281b5995STheodore Ts'o } 4226ac27a0ecSDave Kleikamp if (sbi->s_blocks_per_group > blocksize * 8) { 4227b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, 4228b31e1552SEric Sandeen "#blocks per group too big: %lu", 4229ac27a0ecSDave Kleikamp sbi->s_blocks_per_group); 4230ac27a0ecSDave Kleikamp goto failed_mount; 4231ac27a0ecSDave Kleikamp } 4232281b5995STheodore Ts'o sbi->s_clusters_per_group = sbi->s_blocks_per_group; 4233281b5995STheodore Ts'o sbi->s_cluster_bits = 0; 4234281b5995STheodore Ts'o } 4235281b5995STheodore Ts'o sbi->s_cluster_ratio = clustersize / blocksize; 4236281b5995STheodore Ts'o 4237960fd856STheodore Ts'o /* Do we have standard group size of clustersize * 8 blocks ? */ 4238960fd856STheodore Ts'o if (sbi->s_blocks_per_group == clustersize << 3) 4239960fd856STheodore Ts'o set_opt2(sb, STD_GROUP_SIZE); 4240960fd856STheodore Ts'o 4241bf43d84bSEric Sandeen /* 4242bf43d84bSEric Sandeen * Test whether we have more sectors than will fit in sector_t, 4243bf43d84bSEric Sandeen * and whether the max offset is addressable by the page cache. 4244bf43d84bSEric Sandeen */ 42455a9ae68aSDarrick J. Wong err = generic_check_addressable(sb->s_blocksize_bits, 424630ca22c7SPatrick J. LoPresti ext4_blocks_count(es)); 42475a9ae68aSDarrick J. Wong if (err) { 4248b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "filesystem" 4249bf43d84bSEric Sandeen " too large to mount safely on this system"); 4250ac27a0ecSDave Kleikamp goto failed_mount; 4251ac27a0ecSDave Kleikamp } 4252ac27a0ecSDave Kleikamp 4253617ba13bSMingming Cao if (EXT4_BLOCKS_PER_GROUP(sb) == 0) 4254617ba13bSMingming Cao goto cantfind_ext4; 4255e7c95593SEric Sandeen 42560f2ddca6SFrom: Thiemo Nagel /* check blocks count against device size */ 42570f2ddca6SFrom: Thiemo Nagel blocks_count = sb->s_bdev->bd_inode->i_size >> sb->s_blocksize_bits; 42580f2ddca6SFrom: Thiemo Nagel if (blocks_count && ext4_blocks_count(es) > blocks_count) { 4259b31e1552SEric Sandeen ext4_msg(sb, KERN_WARNING, "bad geometry: block count %llu " 4260b31e1552SEric Sandeen "exceeds size of device (%llu blocks)", 42610f2ddca6SFrom: Thiemo Nagel ext4_blocks_count(es), blocks_count); 42620f2ddca6SFrom: Thiemo Nagel goto failed_mount; 42630f2ddca6SFrom: Thiemo Nagel } 42640f2ddca6SFrom: Thiemo Nagel 42654ec11028STheodore Ts'o /* 42664ec11028STheodore Ts'o * It makes no sense for the first data block to be beyond the end 42674ec11028STheodore Ts'o * of the filesystem. 42684ec11028STheodore Ts'o */ 42694ec11028STheodore Ts'o if (le32_to_cpu(es->s_first_data_block) >= ext4_blocks_count(es)) { 4270b31e1552SEric Sandeen ext4_msg(sb, KERN_WARNING, "bad geometry: first data " 4271b31e1552SEric Sandeen "block %u is beyond end of filesystem (%llu)", 4272e7c95593SEric Sandeen le32_to_cpu(es->s_first_data_block), 42734ec11028STheodore Ts'o ext4_blocks_count(es)); 4274e7c95593SEric Sandeen goto failed_mount; 4275e7c95593SEric Sandeen } 4276bfe0a5f4STheodore Ts'o if ((es->s_first_data_block == 0) && (es->s_log_block_size == 0) && 4277bfe0a5f4STheodore Ts'o (sbi->s_cluster_ratio == 1)) { 4278bfe0a5f4STheodore Ts'o ext4_msg(sb, KERN_WARNING, "bad geometry: first data " 4279bfe0a5f4STheodore Ts'o "block is 0 with a 1k block and cluster size"); 4280bfe0a5f4STheodore Ts'o goto failed_mount; 4281bfe0a5f4STheodore Ts'o } 4282bfe0a5f4STheodore Ts'o 4283bd81d8eeSLaurent Vivier blocks_count = (ext4_blocks_count(es) - 4284bd81d8eeSLaurent Vivier le32_to_cpu(es->s_first_data_block) + 4285bd81d8eeSLaurent Vivier EXT4_BLOCKS_PER_GROUP(sb) - 1); 4286bd81d8eeSLaurent Vivier do_div(blocks_count, EXT4_BLOCKS_PER_GROUP(sb)); 42874ec11028STheodore Ts'o if (blocks_count > ((uint64_t)1<<32) - EXT4_DESC_PER_BLOCK(sb)) { 4288b31e1552SEric Sandeen ext4_msg(sb, KERN_WARNING, "groups count too large: %u " 42894ec11028STheodore Ts'o "(block count %llu, first data block %u, " 4290b31e1552SEric Sandeen "blocks per group %lu)", sbi->s_groups_count, 42914ec11028STheodore Ts'o ext4_blocks_count(es), 42924ec11028STheodore Ts'o le32_to_cpu(es->s_first_data_block), 42934ec11028STheodore Ts'o EXT4_BLOCKS_PER_GROUP(sb)); 42944ec11028STheodore Ts'o goto failed_mount; 42954ec11028STheodore Ts'o } 4296bd81d8eeSLaurent Vivier sbi->s_groups_count = blocks_count; 4297fb0a387dSEric Sandeen sbi->s_blockfile_groups = min_t(ext4_group_t, sbi->s_groups_count, 4298fb0a387dSEric Sandeen (EXT4_MAX_BLOCK_FILE_PHYS / EXT4_BLOCKS_PER_GROUP(sb))); 42999e463084STheodore Ts'o if (((u64)sbi->s_groups_count * sbi->s_inodes_per_group) != 43009e463084STheodore Ts'o le32_to_cpu(es->s_inodes_count)) { 43019e463084STheodore Ts'o ext4_msg(sb, KERN_ERR, "inodes count not valid: %u vs %llu", 43029e463084STheodore Ts'o le32_to_cpu(es->s_inodes_count), 43039e463084STheodore Ts'o ((u64)sbi->s_groups_count * sbi->s_inodes_per_group)); 43049e463084STheodore Ts'o ret = -EINVAL; 43059e463084STheodore Ts'o goto failed_mount; 43069e463084STheodore Ts'o } 4307617ba13bSMingming Cao db_count = (sbi->s_groups_count + EXT4_DESC_PER_BLOCK(sb) - 1) / 4308617ba13bSMingming Cao EXT4_DESC_PER_BLOCK(sb); 43093a4b77cdSEryu Guan if (ext4_has_feature_meta_bg(sb)) { 43102ba3e6e8STheodore Ts'o if (le32_to_cpu(es->s_first_meta_bg) > db_count) { 43113a4b77cdSEryu Guan ext4_msg(sb, KERN_WARNING, 43123a4b77cdSEryu Guan "first meta block group too large: %u " 43133a4b77cdSEryu Guan "(group descriptor block count %u)", 43143a4b77cdSEryu Guan le32_to_cpu(es->s_first_meta_bg), db_count); 43153a4b77cdSEryu Guan goto failed_mount; 43163a4b77cdSEryu Guan } 43173a4b77cdSEryu Guan } 4318344476e1SKees Cook sbi->s_group_desc = kvmalloc_array(db_count, 4319f18a5f21STheodore Ts'o sizeof(struct buffer_head *), 4320ac27a0ecSDave Kleikamp GFP_KERNEL); 4321ac27a0ecSDave Kleikamp if (sbi->s_group_desc == NULL) { 4322b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "not enough memory"); 43232cde417dSTheodore Ts'o ret = -ENOMEM; 4324ac27a0ecSDave Kleikamp goto failed_mount; 4325ac27a0ecSDave Kleikamp } 4326ac27a0ecSDave Kleikamp 4327705895b6SPekka Enberg bgl_lock_init(sbi->s_blockgroup_lock); 4328ac27a0ecSDave Kleikamp 432985c8f176SAndrew Perepechko /* Pre-read the descriptors into the buffer cache */ 433085c8f176SAndrew Perepechko for (i = 0; i < db_count; i++) { 433185c8f176SAndrew Perepechko block = descriptor_loc(sb, logical_sb_block, i); 433285c8f176SAndrew Perepechko sb_breadahead(sb, block); 433385c8f176SAndrew Perepechko } 433485c8f176SAndrew Perepechko 4335ac27a0ecSDave Kleikamp for (i = 0; i < db_count; i++) { 433670bbb3e0SAndrew Morton block = descriptor_loc(sb, logical_sb_block, i); 4337a8ac900bSGioh Kim sbi->s_group_desc[i] = sb_bread_unmovable(sb, block); 4338ac27a0ecSDave Kleikamp if (!sbi->s_group_desc[i]) { 4339b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, 4340b31e1552SEric Sandeen "can't read group descriptor %d", i); 4341ac27a0ecSDave Kleikamp db_count = i; 4342ac27a0ecSDave Kleikamp goto failed_mount2; 4343ac27a0ecSDave Kleikamp } 4344ac27a0ecSDave Kleikamp } 434544de022cSTheodore Ts'o sbi->s_gdb_count = db_count; 4346829fa70dSTheodore Ts'o if (!ext4_check_descriptors(sb, logical_sb_block, &first_not_zeroed)) { 4347b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "group descriptors corrupted!"); 43486a797d27SDarrick J. Wong ret = -EFSCORRUPTED; 4349f9ae9cf5STheodore Ts'o goto failed_mount2; 4350ac27a0ecSDave Kleikamp } 4351772cb7c8SJose R. Santos 4352235699a8SKees Cook timer_setup(&sbi->s_err_report, print_daily_error_info, 0); 435304496411STao Ma 4354a75ae78fSDmitry Monakhov /* Register extent status tree shrinker */ 4355eb68d0e2SZheng Liu if (ext4_es_register_shrinker(sbi)) 4356ce7e010aSTheodore Ts'o goto failed_mount3; 4357ce7e010aSTheodore Ts'o 4358c9de560dSAlex Tomas sbi->s_stripe = ext4_get_stripe_size(sbi); 435967a5da56SZheng Liu sbi->s_extent_max_zeroout_kb = 32; 4360c9de560dSAlex Tomas 4361f9ae9cf5STheodore Ts'o /* 4362f9ae9cf5STheodore Ts'o * set up enough so that it can read an inode 4363f9ae9cf5STheodore Ts'o */ 4364f9ae9cf5STheodore Ts'o sb->s_op = &ext4_sops; 4365617ba13bSMingming Cao sb->s_export_op = &ext4_export_ops; 4366617ba13bSMingming Cao sb->s_xattr = ext4_xattr_handlers; 4367643fa961SChandan Rajendra #ifdef CONFIG_FS_ENCRYPTION 4368a7550b30SJaegeuk Kim sb->s_cop = &ext4_cryptops; 4369ffcc4182SEric Biggers #endif 4370c93d8f88SEric Biggers #ifdef CONFIG_FS_VERITY 4371c93d8f88SEric Biggers sb->s_vop = &ext4_verityops; 4372c93d8f88SEric Biggers #endif 4373ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA 4374617ba13bSMingming Cao sb->dq_op = &ext4_quota_operations; 4375e2b911c5SDarrick J. Wong if (ext4_has_feature_quota(sb)) 43761fa5efe3SJan Kara sb->s_qcop = &dquot_quotactl_sysfile_ops; 4377262b4662SJan Kara else 4378262b4662SJan Kara sb->s_qcop = &ext4_qctl_operations; 4379689c958cSLi Xi sb->s_quota_types = QTYPE_MASK_USR | QTYPE_MASK_GRP | QTYPE_MASK_PRJ; 4380ac27a0ecSDave Kleikamp #endif 438185787090SChristoph Hellwig memcpy(&sb->s_uuid, es->s_uuid, sizeof(es->s_uuid)); 4382f2fa2ffcSAneesh Kumar K.V 4383ac27a0ecSDave Kleikamp INIT_LIST_HEAD(&sbi->s_orphan); /* unlinked but open files */ 43843b9d4ed2STheodore Ts'o mutex_init(&sbi->s_orphan_lock); 4385ac27a0ecSDave Kleikamp 4386ac27a0ecSDave Kleikamp sb->s_root = NULL; 4387ac27a0ecSDave Kleikamp 4388ac27a0ecSDave Kleikamp needs_recovery = (es->s_last_orphan != 0 || 4389e2b911c5SDarrick J. Wong ext4_has_feature_journal_needs_recovery(sb)); 4390ac27a0ecSDave Kleikamp 4391bc98a42cSDavid Howells if (ext4_has_feature_mmp(sb) && !sb_rdonly(sb)) 4392c5e06d10SJohann Lombardi if (ext4_multi_mount_protect(sb, le64_to_cpu(es->s_mmp_block))) 439350460fe8SDarrick J. Wong goto failed_mount3a; 4394c5e06d10SJohann Lombardi 4395ac27a0ecSDave Kleikamp /* 4396ac27a0ecSDave Kleikamp * The first inode we look at is the journal inode. Don't try 4397ac27a0ecSDave Kleikamp * root first: it may be modified in the journal! 4398ac27a0ecSDave Kleikamp */ 4399e2b911c5SDarrick J. Wong if (!test_opt(sb, NOLOAD) && ext4_has_feature_journal(sb)) { 44004753d8a2STheodore Ts'o err = ext4_load_journal(sb, es, journal_devnum); 44014753d8a2STheodore Ts'o if (err) 440250460fe8SDarrick J. Wong goto failed_mount3a; 4403bc98a42cSDavid Howells } else if (test_opt(sb, NOLOAD) && !sb_rdonly(sb) && 4404e2b911c5SDarrick J. Wong ext4_has_feature_journal_needs_recovery(sb)) { 4405b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "required journal recovery " 4406b31e1552SEric Sandeen "suppressed and not mounted read-only"); 4407744692dcSJiaying Zhang goto failed_mount_wq; 4408ac27a0ecSDave Kleikamp } else { 44091e381f60SDmitry Monakhov /* Nojournal mode, all journal mount options are illegal */ 44101e381f60SDmitry Monakhov if (test_opt2(sb, EXPLICIT_JOURNAL_CHECKSUM)) { 44111e381f60SDmitry Monakhov ext4_msg(sb, KERN_ERR, "can't mount with " 44121e381f60SDmitry Monakhov "journal_checksum, fs mounted w/o journal"); 44131e381f60SDmitry Monakhov goto failed_mount_wq; 44141e381f60SDmitry Monakhov } 44151e381f60SDmitry Monakhov if (test_opt(sb, JOURNAL_ASYNC_COMMIT)) { 44161e381f60SDmitry Monakhov ext4_msg(sb, KERN_ERR, "can't mount with " 44171e381f60SDmitry Monakhov "journal_async_commit, fs mounted w/o journal"); 44181e381f60SDmitry Monakhov goto failed_mount_wq; 44191e381f60SDmitry Monakhov } 44201e381f60SDmitry Monakhov if (sbi->s_commit_interval != JBD2_DEFAULT_MAX_COMMIT_AGE*HZ) { 44211e381f60SDmitry Monakhov ext4_msg(sb, KERN_ERR, "can't mount with " 44221e381f60SDmitry Monakhov "commit=%lu, fs mounted w/o journal", 44231e381f60SDmitry Monakhov sbi->s_commit_interval / HZ); 44241e381f60SDmitry Monakhov goto failed_mount_wq; 44251e381f60SDmitry Monakhov } 44261e381f60SDmitry Monakhov if (EXT4_MOUNT_DATA_FLAGS & 44271e381f60SDmitry Monakhov (sbi->s_mount_opt ^ sbi->s_def_mount_opt)) { 44281e381f60SDmitry Monakhov ext4_msg(sb, KERN_ERR, "can't mount with " 44291e381f60SDmitry Monakhov "data=, fs mounted w/o journal"); 44301e381f60SDmitry Monakhov goto failed_mount_wq; 44311e381f60SDmitry Monakhov } 443250b29d8fSDebabrata Banerjee sbi->s_def_mount_opt &= ~EXT4_MOUNT_JOURNAL_CHECKSUM; 44331e381f60SDmitry Monakhov clear_opt(sb, JOURNAL_CHECKSUM); 4434fd8c37ecSTheodore Ts'o clear_opt(sb, DATA_FLAGS); 44350390131bSFrank Mayhar sbi->s_journal = NULL; 44360390131bSFrank Mayhar needs_recovery = 0; 44370390131bSFrank Mayhar goto no_journal; 4438ac27a0ecSDave Kleikamp } 4439ac27a0ecSDave Kleikamp 4440e2b911c5SDarrick J. Wong if (ext4_has_feature_64bit(sb) && 4441eb40a09cSJose R. Santos !jbd2_journal_set_features(EXT4_SB(sb)->s_journal, 0, 0, 4442eb40a09cSJose R. Santos JBD2_FEATURE_INCOMPAT_64BIT)) { 4443b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "Failed to set 64-bit journal feature"); 4444744692dcSJiaying Zhang goto failed_mount_wq; 4445eb40a09cSJose R. Santos } 4446eb40a09cSJose R. Santos 444725ed6e8aSDarrick J. Wong if (!set_journal_csum_feature_set(sb)) { 444825ed6e8aSDarrick J. Wong ext4_msg(sb, KERN_ERR, "Failed to set journal checksum " 444925ed6e8aSDarrick J. Wong "feature set"); 445025ed6e8aSDarrick J. Wong goto failed_mount_wq; 4451d4da6c9cSLinus Torvalds } 4452818d276cSGirish Shilamkar 4453ac27a0ecSDave Kleikamp /* We have now updated the journal if required, so we can 4454ac27a0ecSDave Kleikamp * validate the data journaling mode. */ 4455ac27a0ecSDave Kleikamp switch (test_opt(sb, DATA_FLAGS)) { 4456ac27a0ecSDave Kleikamp case 0: 4457ac27a0ecSDave Kleikamp /* No mode set, assume a default based on the journal 445863f57933SAndrew Morton * capabilities: ORDERED_DATA if the journal can 445963f57933SAndrew Morton * cope, else JOURNAL_DATA 446063f57933SAndrew Morton */ 4461dab291afSMingming Cao if (jbd2_journal_check_available_features 446227f394a7STyson Nottingham (sbi->s_journal, 0, 0, JBD2_FEATURE_INCOMPAT_REVOKE)) { 4463fd8c37ecSTheodore Ts'o set_opt(sb, ORDERED_DATA); 446427f394a7STyson Nottingham sbi->s_def_mount_opt |= EXT4_MOUNT_ORDERED_DATA; 446527f394a7STyson Nottingham } else { 4466fd8c37ecSTheodore Ts'o set_opt(sb, JOURNAL_DATA); 446727f394a7STyson Nottingham sbi->s_def_mount_opt |= EXT4_MOUNT_JOURNAL_DATA; 446827f394a7STyson Nottingham } 4469ac27a0ecSDave Kleikamp break; 4470ac27a0ecSDave Kleikamp 4471617ba13bSMingming Cao case EXT4_MOUNT_ORDERED_DATA: 4472617ba13bSMingming Cao case EXT4_MOUNT_WRITEBACK_DATA: 4473dab291afSMingming Cao if (!jbd2_journal_check_available_features 4474dab291afSMingming Cao (sbi->s_journal, 0, 0, JBD2_FEATURE_INCOMPAT_REVOKE)) { 4475b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "Journal does not support " 4476b31e1552SEric Sandeen "requested data journaling mode"); 4477744692dcSJiaying Zhang goto failed_mount_wq; 4478ac27a0ecSDave Kleikamp } 4479ac27a0ecSDave Kleikamp default: 4480ac27a0ecSDave Kleikamp break; 4481ac27a0ecSDave Kleikamp } 4482ab04df78SJan Kara 4483ab04df78SJan Kara if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_ORDERED_DATA && 4484ab04df78SJan Kara test_opt(sb, JOURNAL_ASYNC_COMMIT)) { 4485ab04df78SJan Kara ext4_msg(sb, KERN_ERR, "can't mount with " 4486ab04df78SJan Kara "journal_async_commit in data=ordered mode"); 4487ab04df78SJan Kara goto failed_mount_wq; 4488ab04df78SJan Kara } 4489ab04df78SJan Kara 4490b3881f74STheodore Ts'o set_task_ioprio(sbi->s_journal->j_task, journal_ioprio); 4491ac27a0ecSDave Kleikamp 449218aadd47SBobi Jam sbi->s_journal->j_commit_callback = ext4_journal_commit_callback; 449318aadd47SBobi Jam 4494ce7e010aSTheodore Ts'o no_journal: 4495cdb7ee4cSTahsin Erdogan if (!test_opt(sb, NO_MBCACHE)) { 449647387409STahsin Erdogan sbi->s_ea_block_cache = ext4_xattr_create_cache(); 449747387409STahsin Erdogan if (!sbi->s_ea_block_cache) { 4498cdb7ee4cSTahsin Erdogan ext4_msg(sb, KERN_ERR, 4499cdb7ee4cSTahsin Erdogan "Failed to create ea_block_cache"); 45009c191f70ST Makphaibulchoke goto failed_mount_wq; 45019c191f70ST Makphaibulchoke } 45029c191f70ST Makphaibulchoke 4503dec214d0STahsin Erdogan if (ext4_has_feature_ea_inode(sb)) { 4504dec214d0STahsin Erdogan sbi->s_ea_inode_cache = ext4_xattr_create_cache(); 4505dec214d0STahsin Erdogan if (!sbi->s_ea_inode_cache) { 4506dec214d0STahsin Erdogan ext4_msg(sb, KERN_ERR, 4507dec214d0STahsin Erdogan "Failed to create ea_inode_cache"); 4508dec214d0STahsin Erdogan goto failed_mount_wq; 4509dec214d0STahsin Erdogan } 4510dec214d0STahsin Erdogan } 4511cdb7ee4cSTahsin Erdogan } 4512dec214d0STahsin Erdogan 4513c93d8f88SEric Biggers if (ext4_has_feature_verity(sb) && blocksize != PAGE_SIZE) { 4514c93d8f88SEric Biggers ext4_msg(sb, KERN_ERR, "Unsupported blocksize for fs-verity"); 4515c93d8f88SEric Biggers goto failed_mount_wq; 4516c93d8f88SEric Biggers } 4517c93d8f88SEric Biggers 4518bc98a42cSDavid Howells if (DUMMY_ENCRYPTION_ENABLED(sbi) && !sb_rdonly(sb) && 4519e2b911c5SDarrick J. Wong !ext4_has_feature_encrypt(sb)) { 4520e2b911c5SDarrick J. Wong ext4_set_feature_encrypt(sb); 45216ddb2447STheodore Ts'o ext4_commit_super(sb, 1); 45226ddb2447STheodore Ts'o } 45236ddb2447STheodore Ts'o 4524fd89d5f2STejun Heo /* 4525952fc18eSTheodore Ts'o * Get the # of file system overhead blocks from the 4526952fc18eSTheodore Ts'o * superblock if present. 4527952fc18eSTheodore Ts'o */ 4528952fc18eSTheodore Ts'o if (es->s_overhead_clusters) 4529952fc18eSTheodore Ts'o sbi->s_overhead = le32_to_cpu(es->s_overhead_clusters); 4530952fc18eSTheodore Ts'o else { 453107aa2ea1SLukas Czerner err = ext4_calculate_overhead(sb); 453207aa2ea1SLukas Czerner if (err) 4533952fc18eSTheodore Ts'o goto failed_mount_wq; 4534952fc18eSTheodore Ts'o } 4535952fc18eSTheodore Ts'o 4536952fc18eSTheodore Ts'o /* 4537fd89d5f2STejun Heo * The maximum number of concurrent works can be high and 4538fd89d5f2STejun Heo * concurrency isn't really necessary. Limit it to 1. 4539fd89d5f2STejun Heo */ 45402e8fa54eSJan Kara EXT4_SB(sb)->rsv_conversion_wq = 45412e8fa54eSJan Kara alloc_workqueue("ext4-rsv-conversion", WQ_MEM_RECLAIM | WQ_UNBOUND, 1); 45422e8fa54eSJan Kara if (!EXT4_SB(sb)->rsv_conversion_wq) { 45432e8fa54eSJan Kara printk(KERN_ERR "EXT4-fs: failed to create workqueue\n"); 454407aa2ea1SLukas Czerner ret = -ENOMEM; 45452e8fa54eSJan Kara goto failed_mount4; 45462e8fa54eSJan Kara } 45472e8fa54eSJan Kara 4548ac27a0ecSDave Kleikamp /* 4549dab291afSMingming Cao * The jbd2_journal_load will have done any necessary log recovery, 4550ac27a0ecSDave Kleikamp * so we can safely mount the rest of the filesystem now. 4551ac27a0ecSDave Kleikamp */ 4552ac27a0ecSDave Kleikamp 45538a363970STheodore Ts'o root = ext4_iget(sb, EXT4_ROOT_INO, EXT4_IGET_SPECIAL); 45541d1fe1eeSDavid Howells if (IS_ERR(root)) { 4555b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "get root inode failed"); 45561d1fe1eeSDavid Howells ret = PTR_ERR(root); 455732a9bb57SManish Katiyar root = NULL; 4558ac27a0ecSDave Kleikamp goto failed_mount4; 4559ac27a0ecSDave Kleikamp } 4560ac27a0ecSDave Kleikamp if (!S_ISDIR(root->i_mode) || !root->i_blocks || !root->i_size) { 4561b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "corrupt root inode, run e2fsck"); 456294bf608aSAl Viro iput(root); 4563ac27a0ecSDave Kleikamp goto failed_mount4; 4564ac27a0ecSDave Kleikamp } 4565b886ee3eSGabriel Krisman Bertazi 4566b886ee3eSGabriel Krisman Bertazi #ifdef CONFIG_UNICODE 4567b886ee3eSGabriel Krisman Bertazi if (sbi->s_encoding) 4568b886ee3eSGabriel Krisman Bertazi sb->s_d_op = &ext4_dentry_ops; 4569b886ee3eSGabriel Krisman Bertazi #endif 4570b886ee3eSGabriel Krisman Bertazi 457148fde701SAl Viro sb->s_root = d_make_root(root); 45721d1fe1eeSDavid Howells if (!sb->s_root) { 4573b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "get root dentry failed"); 45741d1fe1eeSDavid Howells ret = -ENOMEM; 45751d1fe1eeSDavid Howells goto failed_mount4; 45761d1fe1eeSDavid Howells } 4577ac27a0ecSDave Kleikamp 4578c89128a0SJaegeuk Kim ret = ext4_setup_super(sb, es, sb_rdonly(sb)); 4579c89128a0SJaegeuk Kim if (ret == -EROFS) { 45801751e8a6SLinus Torvalds sb->s_flags |= SB_RDONLY; 4581c89128a0SJaegeuk Kim ret = 0; 4582c89128a0SJaegeuk Kim } else if (ret) 4583c89128a0SJaegeuk Kim goto failed_mount4a; 4584ef7f3835SKalpak Shah 4585b5799018STheodore Ts'o ext4_set_resv_clusters(sb); 458627dd4385SLukas Czerner 45876fd058f7STheodore Ts'o err = ext4_setup_system_zone(sb); 45886fd058f7STheodore Ts'o if (err) { 4589b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "failed to initialize system " 4590fbe845ddSCurt Wohlgemuth "zone (%d)", err); 4591f9ae9cf5STheodore Ts'o goto failed_mount4a; 4592f9ae9cf5STheodore Ts'o } 4593f9ae9cf5STheodore Ts'o 4594f9ae9cf5STheodore Ts'o ext4_ext_init(sb); 4595f9ae9cf5STheodore Ts'o err = ext4_mb_init(sb); 4596f9ae9cf5STheodore Ts'o if (err) { 4597f9ae9cf5STheodore Ts'o ext4_msg(sb, KERN_ERR, "failed to initialize mballoc (%d)", 4598f9ae9cf5STheodore Ts'o err); 4599dcf2d804STao Ma goto failed_mount5; 4600c2774d84SAneesh Kumar K.V } 4601c2774d84SAneesh Kumar K.V 4602d5e03cbbSTheodore Ts'o block = ext4_count_free_clusters(sb); 4603d5e03cbbSTheodore Ts'o ext4_free_blocks_count_set(sbi->s_es, 4604d5e03cbbSTheodore Ts'o EXT4_C2B(sbi, block)); 46054274f516STheodore Ts'o ext4_superblock_csum_set(sb); 4606908c7f19STejun Heo err = percpu_counter_init(&sbi->s_freeclusters_counter, block, 4607908c7f19STejun Heo GFP_KERNEL); 4608d5e03cbbSTheodore Ts'o if (!err) { 4609d5e03cbbSTheodore Ts'o unsigned long freei = ext4_count_free_inodes(sb); 4610d5e03cbbSTheodore Ts'o sbi->s_es->s_free_inodes_count = cpu_to_le32(freei); 46114274f516STheodore Ts'o ext4_superblock_csum_set(sb); 4612908c7f19STejun Heo err = percpu_counter_init(&sbi->s_freeinodes_counter, freei, 4613908c7f19STejun Heo GFP_KERNEL); 4614d5e03cbbSTheodore Ts'o } 4615d5e03cbbSTheodore Ts'o if (!err) 4616d5e03cbbSTheodore Ts'o err = percpu_counter_init(&sbi->s_dirs_counter, 4617908c7f19STejun Heo ext4_count_dirs(sb), GFP_KERNEL); 4618d5e03cbbSTheodore Ts'o if (!err) 4619908c7f19STejun Heo err = percpu_counter_init(&sbi->s_dirtyclusters_counter, 0, 4620908c7f19STejun Heo GFP_KERNEL); 4621c8585c6fSDaeho Jeong if (!err) 4622c8585c6fSDaeho Jeong err = percpu_init_rwsem(&sbi->s_journal_flag_rwsem); 4623c8585c6fSDaeho Jeong 4624d5e03cbbSTheodore Ts'o if (err) { 4625d5e03cbbSTheodore Ts'o ext4_msg(sb, KERN_ERR, "insufficient memory"); 4626d5e03cbbSTheodore Ts'o goto failed_mount6; 4627d5e03cbbSTheodore Ts'o } 4628d5e03cbbSTheodore Ts'o 4629e2b911c5SDarrick J. Wong if (ext4_has_feature_flex_bg(sb)) 4630d5e03cbbSTheodore Ts'o if (!ext4_fill_flex_info(sb)) { 4631d5e03cbbSTheodore Ts'o ext4_msg(sb, KERN_ERR, 4632d5e03cbbSTheodore Ts'o "unable to initialize " 4633d5e03cbbSTheodore Ts'o "flex_bg meta info!"); 4634d5e03cbbSTheodore Ts'o goto failed_mount6; 4635d5e03cbbSTheodore Ts'o } 4636d5e03cbbSTheodore Ts'o 4637bfff6873SLukas Czerner err = ext4_register_li_request(sb, first_not_zeroed); 4638bfff6873SLukas Czerner if (err) 4639dcf2d804STao Ma goto failed_mount6; 4640bfff6873SLukas Czerner 4641b5799018STheodore Ts'o err = ext4_register_sysfs(sb); 4642dcf2d804STao Ma if (err) 4643dcf2d804STao Ma goto failed_mount7; 46443197ebdbSTheodore Ts'o 46459b2ff357SJan Kara #ifdef CONFIG_QUOTA 46469b2ff357SJan Kara /* Enable quota usage during mount. */ 4647bc98a42cSDavid Howells if (ext4_has_feature_quota(sb) && !sb_rdonly(sb)) { 46489b2ff357SJan Kara err = ext4_enable_quotas(sb); 46499b2ff357SJan Kara if (err) 46509b2ff357SJan Kara goto failed_mount8; 46519b2ff357SJan Kara } 46529b2ff357SJan Kara #endif /* CONFIG_QUOTA */ 46539b2ff357SJan Kara 4654617ba13bSMingming Cao EXT4_SB(sb)->s_mount_state |= EXT4_ORPHAN_FS; 4655617ba13bSMingming Cao ext4_orphan_cleanup(sb, es); 4656617ba13bSMingming Cao EXT4_SB(sb)->s_mount_state &= ~EXT4_ORPHAN_FS; 46570390131bSFrank Mayhar if (needs_recovery) { 4658b31e1552SEric Sandeen ext4_msg(sb, KERN_INFO, "recovery complete"); 4659617ba13bSMingming Cao ext4_mark_recovery_complete(sb, es); 46600390131bSFrank Mayhar } 46610390131bSFrank Mayhar if (EXT4_SB(sb)->s_journal) { 46620390131bSFrank Mayhar if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_JOURNAL_DATA) 46630390131bSFrank Mayhar descr = " journalled data mode"; 46640390131bSFrank Mayhar else if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_ORDERED_DATA) 46650390131bSFrank Mayhar descr = " ordered data mode"; 46660390131bSFrank Mayhar else 46670390131bSFrank Mayhar descr = " writeback data mode"; 46680390131bSFrank Mayhar } else 46690390131bSFrank Mayhar descr = "out journal"; 46700390131bSFrank Mayhar 467179add3a3SLukas Czerner if (test_opt(sb, DISCARD)) { 467279add3a3SLukas Czerner struct request_queue *q = bdev_get_queue(sb->s_bdev); 467379add3a3SLukas Czerner if (!blk_queue_discard(q)) 467479add3a3SLukas Czerner ext4_msg(sb, KERN_WARNING, 467579add3a3SLukas Czerner "mounting with \"discard\" option, but " 467679add3a3SLukas Czerner "the device does not support discard"); 467779add3a3SLukas Czerner } 467879add3a3SLukas Czerner 4679e294a537STheodore Ts'o if (___ratelimit(&ext4_mount_msg_ratelimit, "EXT4-fs mount")) 4680d4c402d9SCurt Wohlgemuth ext4_msg(sb, KERN_INFO, "mounted filesystem with%s. " 46815aee0f8aSTheodore Ts'o "Opts: %.*s%s%s", descr, 46825aee0f8aSTheodore Ts'o (int) sizeof(sbi->s_es->s_mount_opts), 46835aee0f8aSTheodore Ts'o sbi->s_es->s_mount_opts, 46848b67f04aSTheodore Ts'o *sbi->s_es->s_mount_opts ? "; " : "", orig_data); 4685ac27a0ecSDave Kleikamp 468666e61a9eSTheodore Ts'o if (es->s_error_count) 468766e61a9eSTheodore Ts'o mod_timer(&sbi->s_err_report, jiffies + 300*HZ); /* 5 minutes */ 4688ac27a0ecSDave Kleikamp 4689efbed4dcSTheodore Ts'o /* Enable message ratelimiting. Default is 10 messages per 5 secs. */ 4690efbed4dcSTheodore Ts'o ratelimit_state_init(&sbi->s_err_ratelimit_state, 5 * HZ, 10); 4691efbed4dcSTheodore Ts'o ratelimit_state_init(&sbi->s_warning_ratelimit_state, 5 * HZ, 10); 4692efbed4dcSTheodore Ts'o ratelimit_state_init(&sbi->s_msg_ratelimit_state, 5 * HZ, 10); 4693efbed4dcSTheodore Ts'o 4694d4c402d9SCurt Wohlgemuth kfree(orig_data); 4695ac27a0ecSDave Kleikamp return 0; 4696ac27a0ecSDave Kleikamp 4697617ba13bSMingming Cao cantfind_ext4: 4698ac27a0ecSDave Kleikamp if (!silent) 4699b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "VFS: Can't find ext4 filesystem"); 4700ac27a0ecSDave Kleikamp goto failed_mount; 4701ac27a0ecSDave Kleikamp 470272ba7450STheodore Ts'o #ifdef CONFIG_QUOTA 470372ba7450STheodore Ts'o failed_mount8: 4704ebd173beSTheodore Ts'o ext4_unregister_sysfs(sb); 470572ba7450STheodore Ts'o #endif 4706dcf2d804STao Ma failed_mount7: 4707dcf2d804STao Ma ext4_unregister_li_request(sb); 4708dcf2d804STao Ma failed_mount6: 4709f9ae9cf5STheodore Ts'o ext4_mb_release(sb); 4710d5e03cbbSTheodore Ts'o if (sbi->s_flex_groups) 4711b93b41d4SAl Viro kvfree(sbi->s_flex_groups); 4712d5e03cbbSTheodore Ts'o percpu_counter_destroy(&sbi->s_freeclusters_counter); 4713d5e03cbbSTheodore Ts'o percpu_counter_destroy(&sbi->s_freeinodes_counter); 4714d5e03cbbSTheodore Ts'o percpu_counter_destroy(&sbi->s_dirs_counter); 4715d5e03cbbSTheodore Ts'o percpu_counter_destroy(&sbi->s_dirtyclusters_counter); 4716af18e35bSVasily Averin percpu_free_rwsem(&sbi->s_journal_flag_rwsem); 471700764937SAzat Khuzhin failed_mount5: 4718f9ae9cf5STheodore Ts'o ext4_ext_release(sb); 4719f9ae9cf5STheodore Ts'o ext4_release_system_zone(sb); 4720f9ae9cf5STheodore Ts'o failed_mount4a: 472194bf608aSAl Viro dput(sb->s_root); 472232a9bb57SManish Katiyar sb->s_root = NULL; 472394bf608aSAl Viro failed_mount4: 4724b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "mount failed"); 47252e8fa54eSJan Kara if (EXT4_SB(sb)->rsv_conversion_wq) 47262e8fa54eSJan Kara destroy_workqueue(EXT4_SB(sb)->rsv_conversion_wq); 47274c0425ffSMingming Cao failed_mount_wq: 4728dec214d0STahsin Erdogan ext4_xattr_destroy_cache(sbi->s_ea_inode_cache); 4729dec214d0STahsin Erdogan sbi->s_ea_inode_cache = NULL; 473050c15df6SChengguang Xu 473147387409STahsin Erdogan ext4_xattr_destroy_cache(sbi->s_ea_block_cache); 473247387409STahsin Erdogan sbi->s_ea_block_cache = NULL; 473350c15df6SChengguang Xu 47340390131bSFrank Mayhar if (sbi->s_journal) { 4735dab291afSMingming Cao jbd2_journal_destroy(sbi->s_journal); 473647b4a50bSJan Kara sbi->s_journal = NULL; 47370390131bSFrank Mayhar } 473850460fe8SDarrick J. Wong failed_mount3a: 4739d3922a77SZheng Liu ext4_es_unregister_shrinker(sbi); 4740eb68d0e2SZheng Liu failed_mount3: 47419105bb14SAl Viro del_timer_sync(&sbi->s_err_report); 4742c5e06d10SJohann Lombardi if (sbi->s_mmp_tsk) 4743c5e06d10SJohann Lombardi kthread_stop(sbi->s_mmp_tsk); 4744ac27a0ecSDave Kleikamp failed_mount2: 4745ac27a0ecSDave Kleikamp for (i = 0; i < db_count; i++) 4746ac27a0ecSDave Kleikamp brelse(sbi->s_group_desc[i]); 4747b93b41d4SAl Viro kvfree(sbi->s_group_desc); 4748ac27a0ecSDave Kleikamp failed_mount: 47490441984aSDarrick J. Wong if (sbi->s_chksum_driver) 47500441984aSDarrick J. Wong crypto_free_shash(sbi->s_chksum_driver); 4751c83ad55eSGabriel Krisman Bertazi 4752c83ad55eSGabriel Krisman Bertazi #ifdef CONFIG_UNICODE 4753c83ad55eSGabriel Krisman Bertazi utf8_unload(sbi->s_encoding); 4754c83ad55eSGabriel Krisman Bertazi #endif 4755c83ad55eSGabriel Krisman Bertazi 4756ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA 4757a2d4a646SJan Kara for (i = 0; i < EXT4_MAXQUOTAS; i++) 47580ba33facSTheodore Ts'o kfree(get_qf_name(sb, sbi, i)); 4759ac27a0ecSDave Kleikamp #endif 4760617ba13bSMingming Cao ext4_blkdev_remove(sbi); 4761ac27a0ecSDave Kleikamp brelse(bh); 4762ac27a0ecSDave Kleikamp out_fail: 4763ac27a0ecSDave Kleikamp sb->s_fs_info = NULL; 4764f6830165SManish Katiyar kfree(sbi->s_blockgroup_lock); 47655aee0f8aSTheodore Ts'o out_free_base: 4766ac27a0ecSDave Kleikamp kfree(sbi); 4767d4c402d9SCurt Wohlgemuth kfree(orig_data); 47685e405595SDan Williams fs_put_dax(dax_dev); 476907aa2ea1SLukas Czerner return err ? err : ret; 4770ac27a0ecSDave Kleikamp } 4771ac27a0ecSDave Kleikamp 4772ac27a0ecSDave Kleikamp /* 4773ac27a0ecSDave Kleikamp * Setup any per-fs journal parameters now. We'll do this both on 4774ac27a0ecSDave Kleikamp * initial mount, once the journal has been initialised but before we've 4775ac27a0ecSDave Kleikamp * done any recovery; and again on any subsequent remount. 4776ac27a0ecSDave Kleikamp */ 4777617ba13bSMingming Cao static void ext4_init_journal_params(struct super_block *sb, journal_t *journal) 4778ac27a0ecSDave Kleikamp { 4779617ba13bSMingming Cao struct ext4_sb_info *sbi = EXT4_SB(sb); 4780ac27a0ecSDave Kleikamp 4781ac27a0ecSDave Kleikamp journal->j_commit_interval = sbi->s_commit_interval; 478230773840STheodore Ts'o journal->j_min_batch_time = sbi->s_min_batch_time; 478330773840STheodore Ts'o journal->j_max_batch_time = sbi->s_max_batch_time; 4784ac27a0ecSDave Kleikamp 4785a931da6aSTheodore Ts'o write_lock(&journal->j_state_lock); 4786ac27a0ecSDave Kleikamp if (test_opt(sb, BARRIER)) 4787dab291afSMingming Cao journal->j_flags |= JBD2_BARRIER; 4788ac27a0ecSDave Kleikamp else 4789dab291afSMingming Cao journal->j_flags &= ~JBD2_BARRIER; 47905bf5683aSHidehiro Kawai if (test_opt(sb, DATA_ERR_ABORT)) 47915bf5683aSHidehiro Kawai journal->j_flags |= JBD2_ABORT_ON_SYNCDATA_ERR; 47925bf5683aSHidehiro Kawai else 47935bf5683aSHidehiro Kawai journal->j_flags &= ~JBD2_ABORT_ON_SYNCDATA_ERR; 4794a931da6aSTheodore Ts'o write_unlock(&journal->j_state_lock); 4795ac27a0ecSDave Kleikamp } 4796ac27a0ecSDave Kleikamp 4797c6cb7e77SEric Whitney static struct inode *ext4_get_journal_inode(struct super_block *sb, 4798ac27a0ecSDave Kleikamp unsigned int journal_inum) 4799ac27a0ecSDave Kleikamp { 4800ac27a0ecSDave Kleikamp struct inode *journal_inode; 4801ac27a0ecSDave Kleikamp 4802c6cb7e77SEric Whitney /* 4803c6cb7e77SEric Whitney * Test for the existence of a valid inode on disk. Bad things 4804c6cb7e77SEric Whitney * happen if we iget() an unused inode, as the subsequent iput() 4805c6cb7e77SEric Whitney * will try to delete it. 4806c6cb7e77SEric Whitney */ 48078a363970STheodore Ts'o journal_inode = ext4_iget(sb, journal_inum, EXT4_IGET_SPECIAL); 48081d1fe1eeSDavid Howells if (IS_ERR(journal_inode)) { 4809b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "no journal found"); 4810ac27a0ecSDave Kleikamp return NULL; 4811ac27a0ecSDave Kleikamp } 4812ac27a0ecSDave Kleikamp if (!journal_inode->i_nlink) { 4813ac27a0ecSDave Kleikamp make_bad_inode(journal_inode); 4814ac27a0ecSDave Kleikamp iput(journal_inode); 4815b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "journal inode is deleted"); 4816ac27a0ecSDave Kleikamp return NULL; 4817ac27a0ecSDave Kleikamp } 4818ac27a0ecSDave Kleikamp 4819e5f8eab8STheodore Ts'o jbd_debug(2, "Journal inode found at %p: %lld bytes\n", 4820ac27a0ecSDave Kleikamp journal_inode, journal_inode->i_size); 48211d1fe1eeSDavid Howells if (!S_ISREG(journal_inode->i_mode)) { 4822b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "invalid journal inode"); 4823ac27a0ecSDave Kleikamp iput(journal_inode); 4824ac27a0ecSDave Kleikamp return NULL; 4825ac27a0ecSDave Kleikamp } 4826c6cb7e77SEric Whitney return journal_inode; 4827c6cb7e77SEric Whitney } 4828c6cb7e77SEric Whitney 4829c6cb7e77SEric Whitney static journal_t *ext4_get_journal(struct super_block *sb, 4830c6cb7e77SEric Whitney unsigned int journal_inum) 4831c6cb7e77SEric Whitney { 4832c6cb7e77SEric Whitney struct inode *journal_inode; 4833c6cb7e77SEric Whitney journal_t *journal; 4834c6cb7e77SEric Whitney 4835c6cb7e77SEric Whitney BUG_ON(!ext4_has_feature_journal(sb)); 4836c6cb7e77SEric Whitney 4837c6cb7e77SEric Whitney journal_inode = ext4_get_journal_inode(sb, journal_inum); 4838c6cb7e77SEric Whitney if (!journal_inode) 4839c6cb7e77SEric Whitney return NULL; 4840ac27a0ecSDave Kleikamp 4841dab291afSMingming Cao journal = jbd2_journal_init_inode(journal_inode); 4842ac27a0ecSDave Kleikamp if (!journal) { 4843b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "Could not load journal inode"); 4844ac27a0ecSDave Kleikamp iput(journal_inode); 4845ac27a0ecSDave Kleikamp return NULL; 4846ac27a0ecSDave Kleikamp } 4847ac27a0ecSDave Kleikamp journal->j_private = sb; 4848617ba13bSMingming Cao ext4_init_journal_params(sb, journal); 4849ac27a0ecSDave Kleikamp return journal; 4850ac27a0ecSDave Kleikamp } 4851ac27a0ecSDave Kleikamp 4852617ba13bSMingming Cao static journal_t *ext4_get_dev_journal(struct super_block *sb, 4853ac27a0ecSDave Kleikamp dev_t j_dev) 4854ac27a0ecSDave Kleikamp { 4855ac27a0ecSDave Kleikamp struct buffer_head *bh; 4856ac27a0ecSDave Kleikamp journal_t *journal; 4857617ba13bSMingming Cao ext4_fsblk_t start; 4858617ba13bSMingming Cao ext4_fsblk_t len; 4859ac27a0ecSDave Kleikamp int hblock, blocksize; 4860617ba13bSMingming Cao ext4_fsblk_t sb_block; 4861ac27a0ecSDave Kleikamp unsigned long offset; 4862617ba13bSMingming Cao struct ext4_super_block *es; 4863ac27a0ecSDave Kleikamp struct block_device *bdev; 4864ac27a0ecSDave Kleikamp 4865e2b911c5SDarrick J. Wong BUG_ON(!ext4_has_feature_journal(sb)); 48660390131bSFrank Mayhar 4867b31e1552SEric Sandeen bdev = ext4_blkdev_get(j_dev, sb); 4868ac27a0ecSDave Kleikamp if (bdev == NULL) 4869ac27a0ecSDave Kleikamp return NULL; 4870ac27a0ecSDave Kleikamp 4871ac27a0ecSDave Kleikamp blocksize = sb->s_blocksize; 4872e1defc4fSMartin K. Petersen hblock = bdev_logical_block_size(bdev); 4873ac27a0ecSDave Kleikamp if (blocksize < hblock) { 4874b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, 4875b31e1552SEric Sandeen "blocksize too small for journal device"); 4876ac27a0ecSDave Kleikamp goto out_bdev; 4877ac27a0ecSDave Kleikamp } 4878ac27a0ecSDave Kleikamp 4879617ba13bSMingming Cao sb_block = EXT4_MIN_BLOCK_SIZE / blocksize; 4880617ba13bSMingming Cao offset = EXT4_MIN_BLOCK_SIZE % blocksize; 4881ac27a0ecSDave Kleikamp set_blocksize(bdev, blocksize); 4882ac27a0ecSDave Kleikamp if (!(bh = __bread(bdev, sb_block, blocksize))) { 4883b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "couldn't read superblock of " 4884b31e1552SEric Sandeen "external journal"); 4885ac27a0ecSDave Kleikamp goto out_bdev; 4886ac27a0ecSDave Kleikamp } 4887ac27a0ecSDave Kleikamp 48882716b802STheodore Ts'o es = (struct ext4_super_block *) (bh->b_data + offset); 4889617ba13bSMingming Cao if ((le16_to_cpu(es->s_magic) != EXT4_SUPER_MAGIC) || 4890ac27a0ecSDave Kleikamp !(le32_to_cpu(es->s_feature_incompat) & 4891617ba13bSMingming Cao EXT4_FEATURE_INCOMPAT_JOURNAL_DEV)) { 4892b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "external journal has " 4893b31e1552SEric Sandeen "bad superblock"); 4894ac27a0ecSDave Kleikamp brelse(bh); 4895ac27a0ecSDave Kleikamp goto out_bdev; 4896ac27a0ecSDave Kleikamp } 4897ac27a0ecSDave Kleikamp 4898df4763beSDarrick J. Wong if ((le32_to_cpu(es->s_feature_ro_compat) & 4899df4763beSDarrick J. Wong EXT4_FEATURE_RO_COMPAT_METADATA_CSUM) && 4900df4763beSDarrick J. Wong es->s_checksum != ext4_superblock_csum(sb, es)) { 4901df4763beSDarrick J. Wong ext4_msg(sb, KERN_ERR, "external journal has " 4902df4763beSDarrick J. Wong "corrupt superblock"); 4903df4763beSDarrick J. Wong brelse(bh); 4904df4763beSDarrick J. Wong goto out_bdev; 4905df4763beSDarrick J. Wong } 4906df4763beSDarrick J. Wong 4907617ba13bSMingming Cao if (memcmp(EXT4_SB(sb)->s_es->s_journal_uuid, es->s_uuid, 16)) { 4908b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "journal UUID does not match"); 4909ac27a0ecSDave Kleikamp brelse(bh); 4910ac27a0ecSDave Kleikamp goto out_bdev; 4911ac27a0ecSDave Kleikamp } 4912ac27a0ecSDave Kleikamp 4913bd81d8eeSLaurent Vivier len = ext4_blocks_count(es); 4914ac27a0ecSDave Kleikamp start = sb_block + 1; 4915ac27a0ecSDave Kleikamp brelse(bh); /* we're done with the superblock */ 4916ac27a0ecSDave Kleikamp 4917dab291afSMingming Cao journal = jbd2_journal_init_dev(bdev, sb->s_bdev, 4918ac27a0ecSDave Kleikamp start, len, blocksize); 4919ac27a0ecSDave Kleikamp if (!journal) { 4920b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "failed to create device journal"); 4921ac27a0ecSDave Kleikamp goto out_bdev; 4922ac27a0ecSDave Kleikamp } 4923ac27a0ecSDave Kleikamp journal->j_private = sb; 4924dfec8a14SMike Christie ll_rw_block(REQ_OP_READ, REQ_META | REQ_PRIO, 1, &journal->j_sb_buffer); 4925ac27a0ecSDave Kleikamp wait_on_buffer(journal->j_sb_buffer); 4926ac27a0ecSDave Kleikamp if (!buffer_uptodate(journal->j_sb_buffer)) { 4927b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "I/O error on journal device"); 4928ac27a0ecSDave Kleikamp goto out_journal; 4929ac27a0ecSDave Kleikamp } 4930ac27a0ecSDave Kleikamp if (be32_to_cpu(journal->j_superblock->s_nr_users) != 1) { 4931b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "External journal has more than one " 4932b31e1552SEric Sandeen "user (unsupported) - %d", 4933ac27a0ecSDave Kleikamp be32_to_cpu(journal->j_superblock->s_nr_users)); 4934ac27a0ecSDave Kleikamp goto out_journal; 4935ac27a0ecSDave Kleikamp } 4936617ba13bSMingming Cao EXT4_SB(sb)->journal_bdev = bdev; 4937617ba13bSMingming Cao ext4_init_journal_params(sb, journal); 4938ac27a0ecSDave Kleikamp return journal; 49390b8e58a1SAndreas Dilger 4940ac27a0ecSDave Kleikamp out_journal: 4941dab291afSMingming Cao jbd2_journal_destroy(journal); 4942ac27a0ecSDave Kleikamp out_bdev: 4943617ba13bSMingming Cao ext4_blkdev_put(bdev); 4944ac27a0ecSDave Kleikamp return NULL; 4945ac27a0ecSDave Kleikamp } 4946ac27a0ecSDave Kleikamp 4947617ba13bSMingming Cao static int ext4_load_journal(struct super_block *sb, 4948617ba13bSMingming Cao struct ext4_super_block *es, 4949ac27a0ecSDave Kleikamp unsigned long journal_devnum) 4950ac27a0ecSDave Kleikamp { 4951ac27a0ecSDave Kleikamp journal_t *journal; 4952ac27a0ecSDave Kleikamp unsigned int journal_inum = le32_to_cpu(es->s_journal_inum); 4953ac27a0ecSDave Kleikamp dev_t journal_dev; 4954ac27a0ecSDave Kleikamp int err = 0; 4955ac27a0ecSDave Kleikamp int really_read_only; 4956ac27a0ecSDave Kleikamp 4957e2b911c5SDarrick J. Wong BUG_ON(!ext4_has_feature_journal(sb)); 49580390131bSFrank Mayhar 4959ac27a0ecSDave Kleikamp if (journal_devnum && 4960ac27a0ecSDave Kleikamp journal_devnum != le32_to_cpu(es->s_journal_dev)) { 4961b31e1552SEric Sandeen ext4_msg(sb, KERN_INFO, "external journal device major/minor " 4962b31e1552SEric Sandeen "numbers have changed"); 4963ac27a0ecSDave Kleikamp journal_dev = new_decode_dev(journal_devnum); 4964ac27a0ecSDave Kleikamp } else 4965ac27a0ecSDave Kleikamp journal_dev = new_decode_dev(le32_to_cpu(es->s_journal_dev)); 4966ac27a0ecSDave Kleikamp 4967ac27a0ecSDave Kleikamp really_read_only = bdev_read_only(sb->s_bdev); 4968ac27a0ecSDave Kleikamp 4969ac27a0ecSDave Kleikamp /* 4970ac27a0ecSDave Kleikamp * Are we loading a blank journal or performing recovery after a 4971ac27a0ecSDave Kleikamp * crash? For recovery, we need to check in advance whether we 4972ac27a0ecSDave Kleikamp * can get read-write access to the device. 4973ac27a0ecSDave Kleikamp */ 4974e2b911c5SDarrick J. Wong if (ext4_has_feature_journal_needs_recovery(sb)) { 4975bc98a42cSDavid Howells if (sb_rdonly(sb)) { 4976b31e1552SEric Sandeen ext4_msg(sb, KERN_INFO, "INFO: recovery " 4977b31e1552SEric Sandeen "required on readonly filesystem"); 4978ac27a0ecSDave Kleikamp if (really_read_only) { 4979b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "write access " 4980d98bf8cdSSimon Ruderich "unavailable, cannot proceed " 4981d98bf8cdSSimon Ruderich "(try mounting with noload)"); 4982ac27a0ecSDave Kleikamp return -EROFS; 4983ac27a0ecSDave Kleikamp } 4984b31e1552SEric Sandeen ext4_msg(sb, KERN_INFO, "write access will " 4985b31e1552SEric Sandeen "be enabled during recovery"); 4986ac27a0ecSDave Kleikamp } 4987ac27a0ecSDave Kleikamp } 4988ac27a0ecSDave Kleikamp 4989ac27a0ecSDave Kleikamp if (journal_inum && journal_dev) { 4990b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "filesystem has both journal " 4991b31e1552SEric Sandeen "and inode journals!"); 4992ac27a0ecSDave Kleikamp return -EINVAL; 4993ac27a0ecSDave Kleikamp } 4994ac27a0ecSDave Kleikamp 4995ac27a0ecSDave Kleikamp if (journal_inum) { 4996617ba13bSMingming Cao if (!(journal = ext4_get_journal(sb, journal_inum))) 4997ac27a0ecSDave Kleikamp return -EINVAL; 4998ac27a0ecSDave Kleikamp } else { 4999617ba13bSMingming Cao if (!(journal = ext4_get_dev_journal(sb, journal_dev))) 5000ac27a0ecSDave Kleikamp return -EINVAL; 5001ac27a0ecSDave Kleikamp } 5002ac27a0ecSDave Kleikamp 500390576c0bSTheodore Ts'o if (!(journal->j_flags & JBD2_BARRIER)) 5004b31e1552SEric Sandeen ext4_msg(sb, KERN_INFO, "barriers disabled"); 50054776004fSTheodore Ts'o 5006e2b911c5SDarrick J. Wong if (!ext4_has_feature_journal_needs_recovery(sb)) 5007dab291afSMingming Cao err = jbd2_journal_wipe(journal, !really_read_only); 50081c13d5c0STheodore Ts'o if (!err) { 50091c13d5c0STheodore Ts'o char *save = kmalloc(EXT4_S_ERR_LEN, GFP_KERNEL); 50101c13d5c0STheodore Ts'o if (save) 50111c13d5c0STheodore Ts'o memcpy(save, ((char *) es) + 50121c13d5c0STheodore Ts'o EXT4_S_ERR_START, EXT4_S_ERR_LEN); 5013dab291afSMingming Cao err = jbd2_journal_load(journal); 50141c13d5c0STheodore Ts'o if (save) 50151c13d5c0STheodore Ts'o memcpy(((char *) es) + EXT4_S_ERR_START, 50161c13d5c0STheodore Ts'o save, EXT4_S_ERR_LEN); 50171c13d5c0STheodore Ts'o kfree(save); 50181c13d5c0STheodore Ts'o } 5019ac27a0ecSDave Kleikamp 5020ac27a0ecSDave Kleikamp if (err) { 5021b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "error loading journal"); 5022dab291afSMingming Cao jbd2_journal_destroy(journal); 5023ac27a0ecSDave Kleikamp return err; 5024ac27a0ecSDave Kleikamp } 5025ac27a0ecSDave Kleikamp 5026617ba13bSMingming Cao EXT4_SB(sb)->s_journal = journal; 5027617ba13bSMingming Cao ext4_clear_journal_err(sb, es); 5028ac27a0ecSDave Kleikamp 5029c41303ceSMaciej Żenczykowski if (!really_read_only && journal_devnum && 5030ac27a0ecSDave Kleikamp journal_devnum != le32_to_cpu(es->s_journal_dev)) { 5031ac27a0ecSDave Kleikamp es->s_journal_dev = cpu_to_le32(journal_devnum); 5032ac27a0ecSDave Kleikamp 5033ac27a0ecSDave Kleikamp /* Make sure we flush the recovery flag to disk. */ 5034e2d67052STheodore Ts'o ext4_commit_super(sb, 1); 5035ac27a0ecSDave Kleikamp } 5036ac27a0ecSDave Kleikamp 5037ac27a0ecSDave Kleikamp return 0; 5038ac27a0ecSDave Kleikamp } 5039ac27a0ecSDave Kleikamp 5040e2d67052STheodore Ts'o static int ext4_commit_super(struct super_block *sb, int sync) 5041ac27a0ecSDave Kleikamp { 5042e2d67052STheodore Ts'o struct ext4_super_block *es = EXT4_SB(sb)->s_es; 5043617ba13bSMingming Cao struct buffer_head *sbh = EXT4_SB(sb)->s_sbh; 5044c4be0c1dSTakashi Sato int error = 0; 5045ac27a0ecSDave Kleikamp 5046bdfe0cbdSTheodore Ts'o if (!sbh || block_device_ejected(sb)) 5047c4be0c1dSTakashi Sato return error; 5048a17712c8SJon Derrick 5049a17712c8SJon Derrick /* 5050a17712c8SJon Derrick * The superblock bh should be mapped, but it might not be if the 5051a17712c8SJon Derrick * device was hot-removed. Not much we can do but fail the I/O. 5052a17712c8SJon Derrick */ 5053a17712c8SJon Derrick if (!buffer_mapped(sbh)) 5054a17712c8SJon Derrick return error; 5055a17712c8SJon Derrick 505671290b36STheodore Ts'o /* 505771290b36STheodore Ts'o * If the file system is mounted read-only, don't update the 505871290b36STheodore Ts'o * superblock write time. This avoids updating the superblock 505971290b36STheodore Ts'o * write time when we are mounting the root file system 506071290b36STheodore Ts'o * read/only but we need to replay the journal; at that point, 506171290b36STheodore Ts'o * for people who are east of GMT and who make their clock 506271290b36STheodore Ts'o * tick in localtime for Windows bug-for-bug compatibility, 506371290b36STheodore Ts'o * the clock is set in the future, and this will cause e2fsck 506471290b36STheodore Ts'o * to complain and force a full file system check. 506571290b36STheodore Ts'o */ 50661751e8a6SLinus Torvalds if (!(sb->s_flags & SB_RDONLY)) 50676a0678a7SArnd Bergmann ext4_update_tstamp(es, s_wtime); 5068f613dfcbSTheodore Ts'o if (sb->s_bdev->bd_part) 5069afc32f7eSTheodore Ts'o es->s_kbytes_written = 5070afc32f7eSTheodore Ts'o cpu_to_le64(EXT4_SB(sb)->s_kbytes_written + 5071dbae2c55SMichael Callahan ((part_stat_read(sb->s_bdev->bd_part, 5072dbae2c55SMichael Callahan sectors[STAT_WRITE]) - 5073afc32f7eSTheodore Ts'o EXT4_SB(sb)->s_sectors_written_start) >> 1)); 5074f613dfcbSTheodore Ts'o else 5075f613dfcbSTheodore Ts'o es->s_kbytes_written = 5076f613dfcbSTheodore Ts'o cpu_to_le64(EXT4_SB(sb)->s_kbytes_written); 5077d5e03cbbSTheodore Ts'o if (percpu_counter_initialized(&EXT4_SB(sb)->s_freeclusters_counter)) 507857042651STheodore Ts'o ext4_free_blocks_count_set(es, 507957042651STheodore Ts'o EXT4_C2B(EXT4_SB(sb), percpu_counter_sum_positive( 508057042651STheodore Ts'o &EXT4_SB(sb)->s_freeclusters_counter))); 5081d5e03cbbSTheodore Ts'o if (percpu_counter_initialized(&EXT4_SB(sb)->s_freeinodes_counter)) 50827f93cff9STheodore Ts'o es->s_free_inodes_count = 50837f93cff9STheodore Ts'o cpu_to_le32(percpu_counter_sum_positive( 50845d1b1b3fSAneesh Kumar K.V &EXT4_SB(sb)->s_freeinodes_counter)); 5085ac27a0ecSDave Kleikamp BUFFER_TRACE(sbh, "marking dirty"); 508606db49e6STheodore Ts'o ext4_superblock_csum_set(sb); 50871566a48aSTheodore Ts'o if (sync) 50884743f839SPranay Kr. Srivastava lock_buffer(sbh); 5089e8680786STheodore Ts'o if (buffer_write_io_error(sbh) || !buffer_uptodate(sbh)) { 50904743f839SPranay Kr. Srivastava /* 50914743f839SPranay Kr. Srivastava * Oh, dear. A previous attempt to write the 50924743f839SPranay Kr. Srivastava * superblock failed. This could happen because the 50934743f839SPranay Kr. Srivastava * USB device was yanked out. Or it could happen to 50944743f839SPranay Kr. Srivastava * be a transient write error and maybe the block will 50954743f839SPranay Kr. Srivastava * be remapped. Nothing we can do but to retry the 50964743f839SPranay Kr. Srivastava * write and hope for the best. 50974743f839SPranay Kr. Srivastava */ 50984743f839SPranay Kr. Srivastava ext4_msg(sb, KERN_ERR, "previous I/O error to " 50994743f839SPranay Kr. Srivastava "superblock detected"); 51004743f839SPranay Kr. Srivastava clear_buffer_write_io_error(sbh); 51014743f839SPranay Kr. Srivastava set_buffer_uptodate(sbh); 51024743f839SPranay Kr. Srivastava } 5103ac27a0ecSDave Kleikamp mark_buffer_dirty(sbh); 5104914258bfSTheodore Ts'o if (sync) { 51051566a48aSTheodore Ts'o unlock_buffer(sbh); 5106564bc402SDaeho Jeong error = __sync_dirty_buffer(sbh, 510700473374SJan Kara REQ_SYNC | (test_opt(sb, BARRIER) ? REQ_FUA : 0)); 5108c89128a0SJaegeuk Kim if (buffer_write_io_error(sbh)) { 5109b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, "I/O error while writing " 5110b31e1552SEric Sandeen "superblock"); 5111914258bfSTheodore Ts'o clear_buffer_write_io_error(sbh); 5112914258bfSTheodore Ts'o set_buffer_uptodate(sbh); 5113914258bfSTheodore Ts'o } 5114914258bfSTheodore Ts'o } 5115c4be0c1dSTakashi Sato return error; 5116ac27a0ecSDave Kleikamp } 5117ac27a0ecSDave Kleikamp 5118ac27a0ecSDave Kleikamp /* 5119ac27a0ecSDave Kleikamp * Have we just finished recovery? If so, and if we are mounting (or 5120ac27a0ecSDave Kleikamp * remounting) the filesystem readonly, then we will end up with a 5121ac27a0ecSDave Kleikamp * consistent fs on disk. Record that fact. 5122ac27a0ecSDave Kleikamp */ 5123617ba13bSMingming Cao static void ext4_mark_recovery_complete(struct super_block *sb, 5124617ba13bSMingming Cao struct ext4_super_block *es) 5125ac27a0ecSDave Kleikamp { 5126617ba13bSMingming Cao journal_t *journal = EXT4_SB(sb)->s_journal; 5127ac27a0ecSDave Kleikamp 5128e2b911c5SDarrick J. Wong if (!ext4_has_feature_journal(sb)) { 51290390131bSFrank Mayhar BUG_ON(journal != NULL); 51300390131bSFrank Mayhar return; 51310390131bSFrank Mayhar } 5132dab291afSMingming Cao jbd2_journal_lock_updates(journal); 51337ffe1ea8SHidehiro Kawai if (jbd2_journal_flush(journal) < 0) 51347ffe1ea8SHidehiro Kawai goto out; 51357ffe1ea8SHidehiro Kawai 5136bc98a42cSDavid Howells if (ext4_has_feature_journal_needs_recovery(sb) && sb_rdonly(sb)) { 5137e2b911c5SDarrick J. Wong ext4_clear_feature_journal_needs_recovery(sb); 5138e2d67052STheodore Ts'o ext4_commit_super(sb, 1); 5139ac27a0ecSDave Kleikamp } 51407ffe1ea8SHidehiro Kawai 51417ffe1ea8SHidehiro Kawai out: 5142dab291afSMingming Cao jbd2_journal_unlock_updates(journal); 5143ac27a0ecSDave Kleikamp } 5144ac27a0ecSDave Kleikamp 5145ac27a0ecSDave Kleikamp /* 5146ac27a0ecSDave Kleikamp * If we are mounting (or read-write remounting) a filesystem whose journal 5147ac27a0ecSDave Kleikamp * has recorded an error from a previous lifetime, move that error to the 5148ac27a0ecSDave Kleikamp * main filesystem now. 5149ac27a0ecSDave Kleikamp */ 5150617ba13bSMingming Cao static void ext4_clear_journal_err(struct super_block *sb, 5151617ba13bSMingming Cao struct ext4_super_block *es) 5152ac27a0ecSDave Kleikamp { 5153ac27a0ecSDave Kleikamp journal_t *journal; 5154ac27a0ecSDave Kleikamp int j_errno; 5155ac27a0ecSDave Kleikamp const char *errstr; 5156ac27a0ecSDave Kleikamp 5157e2b911c5SDarrick J. Wong BUG_ON(!ext4_has_feature_journal(sb)); 51580390131bSFrank Mayhar 5159617ba13bSMingming Cao journal = EXT4_SB(sb)->s_journal; 5160ac27a0ecSDave Kleikamp 5161ac27a0ecSDave Kleikamp /* 5162ac27a0ecSDave Kleikamp * Now check for any error status which may have been recorded in the 5163617ba13bSMingming Cao * journal by a prior ext4_error() or ext4_abort() 5164ac27a0ecSDave Kleikamp */ 5165ac27a0ecSDave Kleikamp 5166dab291afSMingming Cao j_errno = jbd2_journal_errno(journal); 5167ac27a0ecSDave Kleikamp if (j_errno) { 5168ac27a0ecSDave Kleikamp char nbuf[16]; 5169ac27a0ecSDave Kleikamp 5170617ba13bSMingming Cao errstr = ext4_decode_error(sb, j_errno, nbuf); 517112062dddSEric Sandeen ext4_warning(sb, "Filesystem error recorded " 5172ac27a0ecSDave Kleikamp "from previous mount: %s", errstr); 517312062dddSEric Sandeen ext4_warning(sb, "Marking fs in need of filesystem check."); 5174ac27a0ecSDave Kleikamp 5175617ba13bSMingming Cao EXT4_SB(sb)->s_mount_state |= EXT4_ERROR_FS; 5176617ba13bSMingming Cao es->s_state |= cpu_to_le16(EXT4_ERROR_FS); 5177e2d67052STheodore Ts'o ext4_commit_super(sb, 1); 5178ac27a0ecSDave Kleikamp 5179dab291afSMingming Cao jbd2_journal_clear_err(journal); 5180d796c52eSTheodore Ts'o jbd2_journal_update_sb_errno(journal); 5181ac27a0ecSDave Kleikamp } 5182ac27a0ecSDave Kleikamp } 5183ac27a0ecSDave Kleikamp 5184ac27a0ecSDave Kleikamp /* 5185ac27a0ecSDave Kleikamp * Force the running and committing transactions to commit, 5186ac27a0ecSDave Kleikamp * and wait on the commit. 5187ac27a0ecSDave Kleikamp */ 5188617ba13bSMingming Cao int ext4_force_commit(struct super_block *sb) 5189ac27a0ecSDave Kleikamp { 5190ac27a0ecSDave Kleikamp journal_t *journal; 5191ac27a0ecSDave Kleikamp 5192bc98a42cSDavid Howells if (sb_rdonly(sb)) 5193ac27a0ecSDave Kleikamp return 0; 5194ac27a0ecSDave Kleikamp 5195617ba13bSMingming Cao journal = EXT4_SB(sb)->s_journal; 5196b1deefc9SGuo Chao return ext4_journal_force_commit(journal); 5197ac27a0ecSDave Kleikamp } 5198ac27a0ecSDave Kleikamp 5199617ba13bSMingming Cao static int ext4_sync_fs(struct super_block *sb, int wait) 5200ac27a0ecSDave Kleikamp { 520114ce0cb4STheodore Ts'o int ret = 0; 52029eddacf9SJan Kara tid_t target; 520306a407f1SDmitry Monakhov bool needs_barrier = false; 52048d5d02e6SMingming Cao struct ext4_sb_info *sbi = EXT4_SB(sb); 5205ac27a0ecSDave Kleikamp 520649598e04SJun Piao if (unlikely(ext4_forced_shutdown(sbi))) 52070db1ff22STheodore Ts'o return 0; 52080db1ff22STheodore Ts'o 52099bffad1eSTheodore Ts'o trace_ext4_sync_fs(sb, wait); 52102e8fa54eSJan Kara flush_workqueue(sbi->rsv_conversion_wq); 5211a1177825SJan Kara /* 5212a1177825SJan Kara * Writeback quota in non-journalled quota case - journalled quota has 5213a1177825SJan Kara * no dirty dquots 5214a1177825SJan Kara */ 5215a1177825SJan Kara dquot_writeback_dquots(sb, -1); 521606a407f1SDmitry Monakhov /* 521706a407f1SDmitry Monakhov * Data writeback is possible w/o journal transaction, so barrier must 521806a407f1SDmitry Monakhov * being sent at the end of the function. But we can skip it if 521906a407f1SDmitry Monakhov * transaction_commit will do it for us. 522006a407f1SDmitry Monakhov */ 5221bda32530STheodore Ts'o if (sbi->s_journal) { 522206a407f1SDmitry Monakhov target = jbd2_get_latest_transaction(sbi->s_journal); 522306a407f1SDmitry Monakhov if (wait && sbi->s_journal->j_flags & JBD2_BARRIER && 522406a407f1SDmitry Monakhov !jbd2_trans_will_send_data_barrier(sbi->s_journal, target)) 522506a407f1SDmitry Monakhov needs_barrier = true; 522606a407f1SDmitry Monakhov 52278d5d02e6SMingming Cao if (jbd2_journal_start_commit(sbi->s_journal, &target)) { 5228ac27a0ecSDave Kleikamp if (wait) 5229bda32530STheodore Ts'o ret = jbd2_log_wait_commit(sbi->s_journal, 5230bda32530STheodore Ts'o target); 52310390131bSFrank Mayhar } 5232bda32530STheodore Ts'o } else if (wait && test_opt(sb, BARRIER)) 5233bda32530STheodore Ts'o needs_barrier = true; 523406a407f1SDmitry Monakhov if (needs_barrier) { 523506a407f1SDmitry Monakhov int err; 523606a407f1SDmitry Monakhov err = blkdev_issue_flush(sb->s_bdev, GFP_KERNEL, NULL); 523706a407f1SDmitry Monakhov if (!ret) 523806a407f1SDmitry Monakhov ret = err; 523906a407f1SDmitry Monakhov } 524006a407f1SDmitry Monakhov 524106a407f1SDmitry Monakhov return ret; 524206a407f1SDmitry Monakhov } 524306a407f1SDmitry Monakhov 5244ac27a0ecSDave Kleikamp /* 5245ac27a0ecSDave Kleikamp * LVM calls this function before a (read-only) snapshot is created. This 5246ac27a0ecSDave Kleikamp * gives us a chance to flush the journal completely and mark the fs clean. 5247be4f27d3SYongqiang Yang * 5248be4f27d3SYongqiang Yang * Note that only this function cannot bring a filesystem to be in a clean 52498e8ad8a5SJan Kara * state independently. It relies on upper layer to stop all data & metadata 52508e8ad8a5SJan Kara * modifications. 5251ac27a0ecSDave Kleikamp */ 5252c4be0c1dSTakashi Sato static int ext4_freeze(struct super_block *sb) 5253ac27a0ecSDave Kleikamp { 5254c4be0c1dSTakashi Sato int error = 0; 5255c4be0c1dSTakashi Sato journal_t *journal; 5256ac27a0ecSDave Kleikamp 5257bc98a42cSDavid Howells if (sb_rdonly(sb)) 52589ca92389STheodore Ts'o return 0; 52599ca92389STheodore Ts'o 5260c4be0c1dSTakashi Sato journal = EXT4_SB(sb)->s_journal; 5261ac27a0ecSDave Kleikamp 5262bb044576STheodore Ts'o if (journal) { 5263ac27a0ecSDave Kleikamp /* Now we set up the journal barrier. */ 5264dab291afSMingming Cao jbd2_journal_lock_updates(journal); 52657ffe1ea8SHidehiro Kawai 52667ffe1ea8SHidehiro Kawai /* 5267bb044576STheodore Ts'o * Don't clear the needs_recovery flag if we failed to 5268bb044576STheodore Ts'o * flush the journal. 52697ffe1ea8SHidehiro Kawai */ 5270c4be0c1dSTakashi Sato error = jbd2_journal_flush(journal); 52716b0310fbSEric Sandeen if (error < 0) 52726b0310fbSEric Sandeen goto out; 5273ac27a0ecSDave Kleikamp 5274ac27a0ecSDave Kleikamp /* Journal blocked and flushed, clear needs_recovery flag. */ 5275e2b911c5SDarrick J. Wong ext4_clear_feature_journal_needs_recovery(sb); 5276c642dc9eSEric Sandeen } 5277c642dc9eSEric Sandeen 5278e2d67052STheodore Ts'o error = ext4_commit_super(sb, 1); 52796b0310fbSEric Sandeen out: 5280bb044576STheodore Ts'o if (journal) 52818e8ad8a5SJan Kara /* we rely on upper layer to stop further updates */ 5282bb044576STheodore Ts'o jbd2_journal_unlock_updates(journal); 52836b0310fbSEric Sandeen return error; 5284ac27a0ecSDave Kleikamp } 5285ac27a0ecSDave Kleikamp 5286ac27a0ecSDave Kleikamp /* 5287ac27a0ecSDave Kleikamp * Called by LVM after the snapshot is done. We need to reset the RECOVER 5288ac27a0ecSDave Kleikamp * flag here, even though the filesystem is not technically dirty yet. 5289ac27a0ecSDave Kleikamp */ 5290c4be0c1dSTakashi Sato static int ext4_unfreeze(struct super_block *sb) 5291ac27a0ecSDave Kleikamp { 5292bc98a42cSDavid Howells if (sb_rdonly(sb) || ext4_forced_shutdown(EXT4_SB(sb))) 52939ca92389STheodore Ts'o return 0; 52949ca92389STheodore Ts'o 5295c642dc9eSEric Sandeen if (EXT4_SB(sb)->s_journal) { 52969ca92389STheodore Ts'o /* Reset the needs_recovery flag before the fs is unlocked. */ 5297e2b911c5SDarrick J. Wong ext4_set_feature_journal_needs_recovery(sb); 5298c642dc9eSEric Sandeen } 5299c642dc9eSEric Sandeen 5300e2d67052STheodore Ts'o ext4_commit_super(sb, 1); 5301c4be0c1dSTakashi Sato return 0; 5302ac27a0ecSDave Kleikamp } 5303ac27a0ecSDave Kleikamp 5304673c6100STheodore Ts'o /* 5305673c6100STheodore Ts'o * Structure to save mount options for ext4_remount's benefit 5306673c6100STheodore Ts'o */ 5307673c6100STheodore Ts'o struct ext4_mount_options { 5308673c6100STheodore Ts'o unsigned long s_mount_opt; 5309a2595b8aSTheodore Ts'o unsigned long s_mount_opt2; 531008cefc7aSEric W. Biederman kuid_t s_resuid; 531108cefc7aSEric W. Biederman kgid_t s_resgid; 5312673c6100STheodore Ts'o unsigned long s_commit_interval; 5313673c6100STheodore Ts'o u32 s_min_batch_time, s_max_batch_time; 5314673c6100STheodore Ts'o #ifdef CONFIG_QUOTA 5315673c6100STheodore Ts'o int s_jquota_fmt; 5316a2d4a646SJan Kara char *s_qf_names[EXT4_MAXQUOTAS]; 5317673c6100STheodore Ts'o #endif 5318673c6100STheodore Ts'o }; 5319673c6100STheodore Ts'o 5320617ba13bSMingming Cao static int ext4_remount(struct super_block *sb, int *flags, char *data) 5321ac27a0ecSDave Kleikamp { 5322617ba13bSMingming Cao struct ext4_super_block *es; 5323617ba13bSMingming Cao struct ext4_sb_info *sbi = EXT4_SB(sb); 5324ac27a0ecSDave Kleikamp unsigned long old_sb_flags; 5325617ba13bSMingming Cao struct ext4_mount_options old_opts; 5326c79d967dSChristoph Hellwig int enable_quota = 0; 53278a266467STheodore Ts'o ext4_group_t g; 5328b3881f74STheodore Ts'o unsigned int journal_ioprio = DEFAULT_JOURNAL_IOPRIO; 5329c5e06d10SJohann Lombardi int err = 0; 5330ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA 533103dafb5fSChen Gang int i, j; 533233458eabSTheodore Ts'o char *to_free[EXT4_MAXQUOTAS]; 5333ac27a0ecSDave Kleikamp #endif 5334d4c402d9SCurt Wohlgemuth char *orig_data = kstrdup(data, GFP_KERNEL); 5335ac27a0ecSDave Kleikamp 533621ac738eSChengguang Xu if (data && !orig_data) 533721ac738eSChengguang Xu return -ENOMEM; 533821ac738eSChengguang Xu 5339ac27a0ecSDave Kleikamp /* Store the original options */ 5340ac27a0ecSDave Kleikamp old_sb_flags = sb->s_flags; 5341ac27a0ecSDave Kleikamp old_opts.s_mount_opt = sbi->s_mount_opt; 5342a2595b8aSTheodore Ts'o old_opts.s_mount_opt2 = sbi->s_mount_opt2; 5343ac27a0ecSDave Kleikamp old_opts.s_resuid = sbi->s_resuid; 5344ac27a0ecSDave Kleikamp old_opts.s_resgid = sbi->s_resgid; 5345ac27a0ecSDave Kleikamp old_opts.s_commit_interval = sbi->s_commit_interval; 534630773840STheodore Ts'o old_opts.s_min_batch_time = sbi->s_min_batch_time; 534730773840STheodore Ts'o old_opts.s_max_batch_time = sbi->s_max_batch_time; 5348ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA 5349ac27a0ecSDave Kleikamp old_opts.s_jquota_fmt = sbi->s_jquota_fmt; 5350a2d4a646SJan Kara for (i = 0; i < EXT4_MAXQUOTAS; i++) 535103dafb5fSChen Gang if (sbi->s_qf_names[i]) { 535233458eabSTheodore Ts'o char *qf_name = get_qf_name(sb, sbi, i); 535333458eabSTheodore Ts'o 535433458eabSTheodore Ts'o old_opts.s_qf_names[i] = kstrdup(qf_name, GFP_KERNEL); 535503dafb5fSChen Gang if (!old_opts.s_qf_names[i]) { 535603dafb5fSChen Gang for (j = 0; j < i; j++) 535703dafb5fSChen Gang kfree(old_opts.s_qf_names[j]); 53583e36a163SWei Yongjun kfree(orig_data); 535903dafb5fSChen Gang return -ENOMEM; 536003dafb5fSChen Gang } 536103dafb5fSChen Gang } else 536203dafb5fSChen Gang old_opts.s_qf_names[i] = NULL; 5363ac27a0ecSDave Kleikamp #endif 5364b3881f74STheodore Ts'o if (sbi->s_journal && sbi->s_journal->j_task->io_context) 5365b3881f74STheodore Ts'o journal_ioprio = sbi->s_journal->j_task->io_context->ioprio; 5366ac27a0ecSDave Kleikamp 5367661aa520SEric Sandeen if (!parse_options(data, sb, NULL, &journal_ioprio, 1)) { 5368ac27a0ecSDave Kleikamp err = -EINVAL; 5369ac27a0ecSDave Kleikamp goto restore_opts; 5370ac27a0ecSDave Kleikamp } 5371ac27a0ecSDave Kleikamp 53726b992ff2SDarrick J. Wong if ((old_opts.s_mount_opt & EXT4_MOUNT_JOURNAL_CHECKSUM) ^ 53736b992ff2SDarrick J. Wong test_opt(sb, JOURNAL_CHECKSUM)) { 53746b992ff2SDarrick J. Wong ext4_msg(sb, KERN_ERR, "changing journal_checksum " 53752d5b86e0SEric Sandeen "during remount not supported; ignoring"); 53762d5b86e0SEric Sandeen sbi->s_mount_opt ^= EXT4_MOUNT_JOURNAL_CHECKSUM; 5377c6d3d56dSDarrick J. Wong } 5378c6d3d56dSDarrick J. Wong 53796ae6514bSPiotr Sarna if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_JOURNAL_DATA) { 53806ae6514bSPiotr Sarna if (test_opt2(sb, EXPLICIT_DELALLOC)) { 53816ae6514bSPiotr Sarna ext4_msg(sb, KERN_ERR, "can't mount with " 53826ae6514bSPiotr Sarna "both data=journal and delalloc"); 53836ae6514bSPiotr Sarna err = -EINVAL; 53846ae6514bSPiotr Sarna goto restore_opts; 53856ae6514bSPiotr Sarna } 53866ae6514bSPiotr Sarna if (test_opt(sb, DIOREAD_NOLOCK)) { 53876ae6514bSPiotr Sarna ext4_msg(sb, KERN_ERR, "can't mount with " 53886ae6514bSPiotr Sarna "both data=journal and dioread_nolock"); 53896ae6514bSPiotr Sarna err = -EINVAL; 53906ae6514bSPiotr Sarna goto restore_opts; 53916ae6514bSPiotr Sarna } 5392923ae0ffSRoss Zwisler if (test_opt(sb, DAX)) { 5393923ae0ffSRoss Zwisler ext4_msg(sb, KERN_ERR, "can't mount with " 5394923ae0ffSRoss Zwisler "both data=journal and dax"); 5395923ae0ffSRoss Zwisler err = -EINVAL; 5396923ae0ffSRoss Zwisler goto restore_opts; 5397923ae0ffSRoss Zwisler } 5398ab04df78SJan Kara } else if (test_opt(sb, DATA_FLAGS) == EXT4_MOUNT_ORDERED_DATA) { 5399ab04df78SJan Kara if (test_opt(sb, JOURNAL_ASYNC_COMMIT)) { 5400ab04df78SJan Kara ext4_msg(sb, KERN_ERR, "can't mount with " 5401ab04df78SJan Kara "journal_async_commit in data=ordered mode"); 5402ab04df78SJan Kara err = -EINVAL; 5403ab04df78SJan Kara goto restore_opts; 5404ab04df78SJan Kara } 5405923ae0ffSRoss Zwisler } 5406923ae0ffSRoss Zwisler 5407cdb7ee4cSTahsin Erdogan if ((sbi->s_mount_opt ^ old_opts.s_mount_opt) & EXT4_MOUNT_NO_MBCACHE) { 5408cdb7ee4cSTahsin Erdogan ext4_msg(sb, KERN_ERR, "can't enable nombcache during remount"); 5409cdb7ee4cSTahsin Erdogan err = -EINVAL; 5410cdb7ee4cSTahsin Erdogan goto restore_opts; 5411cdb7ee4cSTahsin Erdogan } 5412cdb7ee4cSTahsin Erdogan 5413923ae0ffSRoss Zwisler if ((sbi->s_mount_opt ^ old_opts.s_mount_opt) & EXT4_MOUNT_DAX) { 5414923ae0ffSRoss Zwisler ext4_msg(sb, KERN_WARNING, "warning: refusing change of " 5415923ae0ffSRoss Zwisler "dax flag with busy inodes while remounting"); 5416923ae0ffSRoss Zwisler sbi->s_mount_opt ^= EXT4_MOUNT_DAX; 54176ae6514bSPiotr Sarna } 54186ae6514bSPiotr Sarna 54194ab2f15bSTheodore Ts'o if (sbi->s_mount_flags & EXT4_MF_FS_ABORTED) 5420c67d859eSTheodore Ts'o ext4_abort(sb, "Abort forced by user"); 5421ac27a0ecSDave Kleikamp 54221751e8a6SLinus Torvalds sb->s_flags = (sb->s_flags & ~SB_POSIXACL) | 54231751e8a6SLinus Torvalds (test_opt(sb, POSIX_ACL) ? SB_POSIXACL : 0); 5424ac27a0ecSDave Kleikamp 5425ac27a0ecSDave Kleikamp es = sbi->s_es; 5426ac27a0ecSDave Kleikamp 5427b3881f74STheodore Ts'o if (sbi->s_journal) { 5428617ba13bSMingming Cao ext4_init_journal_params(sb, sbi->s_journal); 5429b3881f74STheodore Ts'o set_task_ioprio(sbi->s_journal->j_task, journal_ioprio); 5430b3881f74STheodore Ts'o } 5431ac27a0ecSDave Kleikamp 54321751e8a6SLinus Torvalds if (*flags & SB_LAZYTIME) 54331751e8a6SLinus Torvalds sb->s_flags |= SB_LAZYTIME; 5434a2fd66d0STheodore Ts'o 54351751e8a6SLinus Torvalds if ((bool)(*flags & SB_RDONLY) != sb_rdonly(sb)) { 54364ab2f15bSTheodore Ts'o if (sbi->s_mount_flags & EXT4_MF_FS_ABORTED) { 5437ac27a0ecSDave Kleikamp err = -EROFS; 5438ac27a0ecSDave Kleikamp goto restore_opts; 5439ac27a0ecSDave Kleikamp } 5440ac27a0ecSDave Kleikamp 54411751e8a6SLinus Torvalds if (*flags & SB_RDONLY) { 544238c03b34STheodore Ts'o err = sync_filesystem(sb); 544338c03b34STheodore Ts'o if (err < 0) 544438c03b34STheodore Ts'o goto restore_opts; 54450f0dd62fSChristoph Hellwig err = dquot_suspend(sb, -1); 54460f0dd62fSChristoph Hellwig if (err < 0) 5447c79d967dSChristoph Hellwig goto restore_opts; 5448c79d967dSChristoph Hellwig 5449ac27a0ecSDave Kleikamp /* 5450ac27a0ecSDave Kleikamp * First of all, the unconditional stuff we have to do 5451ac27a0ecSDave Kleikamp * to disable replay of the journal when we next remount 5452ac27a0ecSDave Kleikamp */ 54531751e8a6SLinus Torvalds sb->s_flags |= SB_RDONLY; 5454ac27a0ecSDave Kleikamp 5455ac27a0ecSDave Kleikamp /* 5456ac27a0ecSDave Kleikamp * OK, test if we are remounting a valid rw partition 5457ac27a0ecSDave Kleikamp * readonly, and if so set the rdonly flag and then 5458ac27a0ecSDave Kleikamp * mark the partition as valid again. 5459ac27a0ecSDave Kleikamp */ 5460617ba13bSMingming Cao if (!(es->s_state & cpu_to_le16(EXT4_VALID_FS)) && 5461617ba13bSMingming Cao (sbi->s_mount_state & EXT4_VALID_FS)) 5462ac27a0ecSDave Kleikamp es->s_state = cpu_to_le16(sbi->s_mount_state); 5463ac27a0ecSDave Kleikamp 5464a63c9eb2STheodore Ts'o if (sbi->s_journal) 5465617ba13bSMingming Cao ext4_mark_recovery_complete(sb, es); 54662dca60d9STheodore Ts'o if (sbi->s_mmp_tsk) 54672dca60d9STheodore Ts'o kthread_stop(sbi->s_mmp_tsk); 5468ac27a0ecSDave Kleikamp } else { 5469a13fb1a4SEric Sandeen /* Make sure we can mount this feature set readwrite */ 5470e2b911c5SDarrick J. Wong if (ext4_has_feature_readonly(sb) || 54712cb5cc8bSDarrick J. Wong !ext4_feature_set_ok(sb, 0)) { 5472ac27a0ecSDave Kleikamp err = -EROFS; 5473ac27a0ecSDave Kleikamp goto restore_opts; 5474ac27a0ecSDave Kleikamp } 5475ead6596bSEric Sandeen /* 54768a266467STheodore Ts'o * Make sure the group descriptor checksums 54770b8e58a1SAndreas Dilger * are sane. If they aren't, refuse to remount r/w. 54788a266467STheodore Ts'o */ 54798a266467STheodore Ts'o for (g = 0; g < sbi->s_groups_count; g++) { 54808a266467STheodore Ts'o struct ext4_group_desc *gdp = 54818a266467STheodore Ts'o ext4_get_group_desc(sb, g, NULL); 54828a266467STheodore Ts'o 5483feb0ab32SDarrick J. Wong if (!ext4_group_desc_csum_verify(sb, g, gdp)) { 5484b31e1552SEric Sandeen ext4_msg(sb, KERN_ERR, 5485b31e1552SEric Sandeen "ext4_remount: Checksum for group %u failed (%u!=%u)", 5486e2b911c5SDarrick J. Wong g, le16_to_cpu(ext4_group_desc_csum(sb, g, gdp)), 54878a266467STheodore Ts'o le16_to_cpu(gdp->bg_checksum)); 54886a797d27SDarrick J. Wong err = -EFSBADCRC; 54898a266467STheodore Ts'o goto restore_opts; 54908a266467STheodore Ts'o } 54918a266467STheodore Ts'o } 54928a266467STheodore Ts'o 54938a266467STheodore Ts'o /* 5494ead6596bSEric Sandeen * If we have an unprocessed orphan list hanging 5495ead6596bSEric Sandeen * around from a previously readonly bdev mount, 5496ead6596bSEric Sandeen * require a full umount/remount for now. 5497ead6596bSEric Sandeen */ 5498ead6596bSEric Sandeen if (es->s_last_orphan) { 5499b31e1552SEric Sandeen ext4_msg(sb, KERN_WARNING, "Couldn't " 5500ead6596bSEric Sandeen "remount RDWR because of unprocessed " 5501ead6596bSEric Sandeen "orphan inode list. Please " 5502b31e1552SEric Sandeen "umount/remount instead"); 5503ead6596bSEric Sandeen err = -EINVAL; 5504ead6596bSEric Sandeen goto restore_opts; 5505ead6596bSEric Sandeen } 5506ead6596bSEric Sandeen 5507ac27a0ecSDave Kleikamp /* 5508ac27a0ecSDave Kleikamp * Mounting a RDONLY partition read-write, so reread 5509ac27a0ecSDave Kleikamp * and store the current valid flag. (It may have 5510ac27a0ecSDave Kleikamp * been changed by e2fsck since we originally mounted 5511ac27a0ecSDave Kleikamp * the partition.) 5512ac27a0ecSDave Kleikamp */ 55130390131bSFrank Mayhar if (sbi->s_journal) 5514617ba13bSMingming Cao ext4_clear_journal_err(sb, es); 5515ac27a0ecSDave Kleikamp sbi->s_mount_state = le16_to_cpu(es->s_state); 5516c89128a0SJaegeuk Kim 5517c89128a0SJaegeuk Kim err = ext4_setup_super(sb, es, 0); 5518c89128a0SJaegeuk Kim if (err) 5519c89128a0SJaegeuk Kim goto restore_opts; 5520c89128a0SJaegeuk Kim 55211751e8a6SLinus Torvalds sb->s_flags &= ~SB_RDONLY; 5522e2b911c5SDarrick J. Wong if (ext4_has_feature_mmp(sb)) 5523c5e06d10SJohann Lombardi if (ext4_multi_mount_protect(sb, 5524c5e06d10SJohann Lombardi le64_to_cpu(es->s_mmp_block))) { 5525c5e06d10SJohann Lombardi err = -EROFS; 5526c5e06d10SJohann Lombardi goto restore_opts; 5527c5e06d10SJohann Lombardi } 5528c79d967dSChristoph Hellwig enable_quota = 1; 5529ac27a0ecSDave Kleikamp } 5530ac27a0ecSDave Kleikamp } 5531bfff6873SLukas Czerner 5532bfff6873SLukas Czerner /* 5533bfff6873SLukas Czerner * Reinitialize lazy itable initialization thread based on 5534bfff6873SLukas Czerner * current settings 5535bfff6873SLukas Czerner */ 5536bc98a42cSDavid Howells if (sb_rdonly(sb) || !test_opt(sb, INIT_INODE_TABLE)) 5537bfff6873SLukas Czerner ext4_unregister_li_request(sb); 5538bfff6873SLukas Czerner else { 5539bfff6873SLukas Czerner ext4_group_t first_not_zeroed; 5540bfff6873SLukas Czerner first_not_zeroed = ext4_has_uninit_itable(sb); 5541bfff6873SLukas Czerner ext4_register_li_request(sb, first_not_zeroed); 5542bfff6873SLukas Czerner } 5543bfff6873SLukas Czerner 55446fd058f7STheodore Ts'o ext4_setup_system_zone(sb); 5545c89128a0SJaegeuk Kim if (sbi->s_journal == NULL && !(old_sb_flags & SB_RDONLY)) { 5546c89128a0SJaegeuk Kim err = ext4_commit_super(sb, 1); 5547c89128a0SJaegeuk Kim if (err) 5548c89128a0SJaegeuk Kim goto restore_opts; 5549c89128a0SJaegeuk Kim } 55500390131bSFrank Mayhar 5551ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA 5552ac27a0ecSDave Kleikamp /* Release old quota file names */ 5553a2d4a646SJan Kara for (i = 0; i < EXT4_MAXQUOTAS; i++) 5554ac27a0ecSDave Kleikamp kfree(old_opts.s_qf_names[i]); 55557c319d32SAditya Kali if (enable_quota) { 55567c319d32SAditya Kali if (sb_any_quota_suspended(sb)) 55570f0dd62fSChristoph Hellwig dquot_resume(sb, -1); 5558e2b911c5SDarrick J. Wong else if (ext4_has_feature_quota(sb)) { 55597c319d32SAditya Kali err = ext4_enable_quotas(sb); 556007724f98STheodore Ts'o if (err) 55617c319d32SAditya Kali goto restore_opts; 55627c319d32SAditya Kali } 55637c319d32SAditya Kali } 55647c319d32SAditya Kali #endif 5565d4c402d9SCurt Wohlgemuth 55661751e8a6SLinus Torvalds *flags = (*flags & ~SB_LAZYTIME) | (sb->s_flags & SB_LAZYTIME); 5567d4c402d9SCurt Wohlgemuth ext4_msg(sb, KERN_INFO, "re-mounted. Opts: %s", orig_data); 5568d4c402d9SCurt Wohlgemuth kfree(orig_data); 5569ac27a0ecSDave Kleikamp return 0; 55700b8e58a1SAndreas Dilger 5571ac27a0ecSDave Kleikamp restore_opts: 5572ac27a0ecSDave Kleikamp sb->s_flags = old_sb_flags; 5573ac27a0ecSDave Kleikamp sbi->s_mount_opt = old_opts.s_mount_opt; 5574a2595b8aSTheodore Ts'o sbi->s_mount_opt2 = old_opts.s_mount_opt2; 5575ac27a0ecSDave Kleikamp sbi->s_resuid = old_opts.s_resuid; 5576ac27a0ecSDave Kleikamp sbi->s_resgid = old_opts.s_resgid; 5577ac27a0ecSDave Kleikamp sbi->s_commit_interval = old_opts.s_commit_interval; 557830773840STheodore Ts'o sbi->s_min_batch_time = old_opts.s_min_batch_time; 557930773840STheodore Ts'o sbi->s_max_batch_time = old_opts.s_max_batch_time; 5580ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA 5581ac27a0ecSDave Kleikamp sbi->s_jquota_fmt = old_opts.s_jquota_fmt; 5582a2d4a646SJan Kara for (i = 0; i < EXT4_MAXQUOTAS; i++) { 558333458eabSTheodore Ts'o to_free[i] = get_qf_name(sb, sbi, i); 558433458eabSTheodore Ts'o rcu_assign_pointer(sbi->s_qf_names[i], old_opts.s_qf_names[i]); 5585ac27a0ecSDave Kleikamp } 558633458eabSTheodore Ts'o synchronize_rcu(); 558733458eabSTheodore Ts'o for (i = 0; i < EXT4_MAXQUOTAS; i++) 558833458eabSTheodore Ts'o kfree(to_free[i]); 5589ac27a0ecSDave Kleikamp #endif 5590d4c402d9SCurt Wohlgemuth kfree(orig_data); 5591ac27a0ecSDave Kleikamp return err; 5592ac27a0ecSDave Kleikamp } 5593ac27a0ecSDave Kleikamp 5594689c958cSLi Xi #ifdef CONFIG_QUOTA 5595689c958cSLi Xi static int ext4_statfs_project(struct super_block *sb, 5596689c958cSLi Xi kprojid_t projid, struct kstatfs *buf) 5597689c958cSLi Xi { 5598689c958cSLi Xi struct kqid qid; 5599689c958cSLi Xi struct dquot *dquot; 5600689c958cSLi Xi u64 limit; 5601689c958cSLi Xi u64 curblock; 5602689c958cSLi Xi 5603689c958cSLi Xi qid = make_kqid_projid(projid); 5604689c958cSLi Xi dquot = dqget(sb, qid); 5605689c958cSLi Xi if (IS_ERR(dquot)) 5606689c958cSLi Xi return PTR_ERR(dquot); 56077b9ca4c6SJan Kara spin_lock(&dquot->dq_dqb_lock); 5608689c958cSLi Xi 5609689c958cSLi Xi limit = (dquot->dq_dqb.dqb_bsoftlimit ? 5610689c958cSLi Xi dquot->dq_dqb.dqb_bsoftlimit : 5611689c958cSLi Xi dquot->dq_dqb.dqb_bhardlimit) >> sb->s_blocksize_bits; 5612689c958cSLi Xi if (limit && buf->f_blocks > limit) { 5613f06925c7SKonstantin Khlebnikov curblock = (dquot->dq_dqb.dqb_curspace + 5614f06925c7SKonstantin Khlebnikov dquot->dq_dqb.dqb_rsvspace) >> sb->s_blocksize_bits; 5615689c958cSLi Xi buf->f_blocks = limit; 5616689c958cSLi Xi buf->f_bfree = buf->f_bavail = 5617689c958cSLi Xi (buf->f_blocks > curblock) ? 5618689c958cSLi Xi (buf->f_blocks - curblock) : 0; 5619689c958cSLi Xi } 5620689c958cSLi Xi 5621689c958cSLi Xi limit = dquot->dq_dqb.dqb_isoftlimit ? 5622689c958cSLi Xi dquot->dq_dqb.dqb_isoftlimit : 5623689c958cSLi Xi dquot->dq_dqb.dqb_ihardlimit; 5624689c958cSLi Xi if (limit && buf->f_files > limit) { 5625689c958cSLi Xi buf->f_files = limit; 5626689c958cSLi Xi buf->f_ffree = 5627689c958cSLi Xi (buf->f_files > dquot->dq_dqb.dqb_curinodes) ? 5628689c958cSLi Xi (buf->f_files - dquot->dq_dqb.dqb_curinodes) : 0; 5629689c958cSLi Xi } 5630689c958cSLi Xi 56317b9ca4c6SJan Kara spin_unlock(&dquot->dq_dqb_lock); 5632689c958cSLi Xi dqput(dquot); 5633689c958cSLi Xi return 0; 5634689c958cSLi Xi } 5635689c958cSLi Xi #endif 5636689c958cSLi Xi 5637617ba13bSMingming Cao static int ext4_statfs(struct dentry *dentry, struct kstatfs *buf) 5638ac27a0ecSDave Kleikamp { 5639ac27a0ecSDave Kleikamp struct super_block *sb = dentry->d_sb; 5640617ba13bSMingming Cao struct ext4_sb_info *sbi = EXT4_SB(sb); 5641617ba13bSMingming Cao struct ext4_super_block *es = sbi->s_es; 564227dd4385SLukas Czerner ext4_fsblk_t overhead = 0, resv_blocks; 5643960cc398SPekka Enberg u64 fsid; 5644d02a9391SKazuya Mio s64 bfree; 564527dd4385SLukas Czerner resv_blocks = EXT4_C2B(sbi, atomic64_read(&sbi->s_resv_clusters)); 5646ac27a0ecSDave Kleikamp 5647952fc18eSTheodore Ts'o if (!test_opt(sb, MINIX_DF)) 5648952fc18eSTheodore Ts'o overhead = sbi->s_overhead; 5649ac27a0ecSDave Kleikamp 5650617ba13bSMingming Cao buf->f_type = EXT4_SUPER_MAGIC; 5651ac27a0ecSDave Kleikamp buf->f_bsize = sb->s_blocksize; 5652b72f78cbSEric Sandeen buf->f_blocks = ext4_blocks_count(es) - EXT4_C2B(sbi, overhead); 565357042651STheodore Ts'o bfree = percpu_counter_sum_positive(&sbi->s_freeclusters_counter) - 565457042651STheodore Ts'o percpu_counter_sum_positive(&sbi->s_dirtyclusters_counter); 5655d02a9391SKazuya Mio /* prevent underflow in case that few free space is available */ 565657042651STheodore Ts'o buf->f_bfree = EXT4_C2B(sbi, max_t(s64, bfree, 0)); 565727dd4385SLukas Czerner buf->f_bavail = buf->f_bfree - 565827dd4385SLukas Czerner (ext4_r_blocks_count(es) + resv_blocks); 565927dd4385SLukas Czerner if (buf->f_bfree < (ext4_r_blocks_count(es) + resv_blocks)) 5660ac27a0ecSDave Kleikamp buf->f_bavail = 0; 5661ac27a0ecSDave Kleikamp buf->f_files = le32_to_cpu(es->s_inodes_count); 566252d9f3b4SPeter Zijlstra buf->f_ffree = percpu_counter_sum_positive(&sbi->s_freeinodes_counter); 5663617ba13bSMingming Cao buf->f_namelen = EXT4_NAME_LEN; 5664960cc398SPekka Enberg fsid = le64_to_cpup((void *)es->s_uuid) ^ 5665960cc398SPekka Enberg le64_to_cpup((void *)es->s_uuid + sizeof(u64)); 5666960cc398SPekka Enberg buf->f_fsid.val[0] = fsid & 0xFFFFFFFFUL; 5667960cc398SPekka Enberg buf->f_fsid.val[1] = (fsid >> 32) & 0xFFFFFFFFUL; 56680b8e58a1SAndreas Dilger 5669689c958cSLi Xi #ifdef CONFIG_QUOTA 5670689c958cSLi Xi if (ext4_test_inode_flag(dentry->d_inode, EXT4_INODE_PROJINHERIT) && 5671689c958cSLi Xi sb_has_quota_limits_enabled(sb, PRJQUOTA)) 5672689c958cSLi Xi ext4_statfs_project(sb, EXT4_I(dentry->d_inode)->i_projid, buf); 5673689c958cSLi Xi #endif 5674ac27a0ecSDave Kleikamp return 0; 5675ac27a0ecSDave Kleikamp } 5676ac27a0ecSDave Kleikamp 5677ac27a0ecSDave Kleikamp 5678ac27a0ecSDave Kleikamp #ifdef CONFIG_QUOTA 5679ac27a0ecSDave Kleikamp 5680bc8230eeSJan Kara /* 5681bc8230eeSJan Kara * Helper functions so that transaction is started before we acquire dqio_sem 5682bc8230eeSJan Kara * to keep correct lock ordering of transaction > dqio_sem 5683bc8230eeSJan Kara */ 5684ac27a0ecSDave Kleikamp static inline struct inode *dquot_to_inode(struct dquot *dquot) 5685ac27a0ecSDave Kleikamp { 56864c376dcaSEric W. Biederman return sb_dqopt(dquot->dq_sb)->files[dquot->dq_id.type]; 5687ac27a0ecSDave Kleikamp } 5688ac27a0ecSDave Kleikamp 5689617ba13bSMingming Cao static int ext4_write_dquot(struct dquot *dquot) 5690ac27a0ecSDave Kleikamp { 5691ac27a0ecSDave Kleikamp int ret, err; 5692ac27a0ecSDave Kleikamp handle_t *handle; 5693ac27a0ecSDave Kleikamp struct inode *inode; 5694ac27a0ecSDave Kleikamp 5695ac27a0ecSDave Kleikamp inode = dquot_to_inode(dquot); 56969924a92aSTheodore Ts'o handle = ext4_journal_start(inode, EXT4_HT_QUOTA, 5697617ba13bSMingming Cao EXT4_QUOTA_TRANS_BLOCKS(dquot->dq_sb)); 5698ac27a0ecSDave Kleikamp if (IS_ERR(handle)) 5699ac27a0ecSDave Kleikamp return PTR_ERR(handle); 5700ac27a0ecSDave Kleikamp ret = dquot_commit(dquot); 5701617ba13bSMingming Cao err = ext4_journal_stop(handle); 5702ac27a0ecSDave Kleikamp if (!ret) 5703ac27a0ecSDave Kleikamp ret = err; 5704ac27a0ecSDave Kleikamp return ret; 5705ac27a0ecSDave Kleikamp } 5706ac27a0ecSDave Kleikamp 5707617ba13bSMingming Cao static int ext4_acquire_dquot(struct dquot *dquot) 5708ac27a0ecSDave Kleikamp { 5709ac27a0ecSDave Kleikamp int ret, err; 5710ac27a0ecSDave Kleikamp handle_t *handle; 5711ac27a0ecSDave Kleikamp 57129924a92aSTheodore Ts'o handle = ext4_journal_start(dquot_to_inode(dquot), EXT4_HT_QUOTA, 5713617ba13bSMingming Cao EXT4_QUOTA_INIT_BLOCKS(dquot->dq_sb)); 5714ac27a0ecSDave Kleikamp if (IS_ERR(handle)) 5715ac27a0ecSDave Kleikamp return PTR_ERR(handle); 5716ac27a0ecSDave Kleikamp ret = dquot_acquire(dquot); 5717617ba13bSMingming Cao err = ext4_journal_stop(handle); 5718ac27a0ecSDave Kleikamp if (!ret) 5719ac27a0ecSDave Kleikamp ret = err; 5720ac27a0ecSDave Kleikamp return ret; 5721ac27a0ecSDave Kleikamp } 5722ac27a0ecSDave Kleikamp 5723617ba13bSMingming Cao static int ext4_release_dquot(struct dquot *dquot) 5724ac27a0ecSDave Kleikamp { 5725ac27a0ecSDave Kleikamp int ret, err; 5726ac27a0ecSDave Kleikamp handle_t *handle; 5727ac27a0ecSDave Kleikamp 57289924a92aSTheodore Ts'o handle = ext4_journal_start(dquot_to_inode(dquot), EXT4_HT_QUOTA, 5729617ba13bSMingming Cao EXT4_QUOTA_DEL_BLOCKS(dquot->dq_sb)); 57309c3013e9SJan Kara if (IS_ERR(handle)) { 57319c3013e9SJan Kara /* Release dquot anyway to avoid endless cycle in dqput() */ 57329c3013e9SJan Kara dquot_release(dquot); 5733ac27a0ecSDave Kleikamp return PTR_ERR(handle); 57349c3013e9SJan Kara } 5735ac27a0ecSDave Kleikamp ret = dquot_release(dquot); 5736617ba13bSMingming Cao err = ext4_journal_stop(handle); 5737ac27a0ecSDave Kleikamp if (!ret) 5738ac27a0ecSDave Kleikamp ret = err; 5739ac27a0ecSDave Kleikamp return ret; 5740ac27a0ecSDave Kleikamp } 5741ac27a0ecSDave Kleikamp 5742617ba13bSMingming Cao static int ext4_mark_dquot_dirty(struct dquot *dquot) 5743ac27a0ecSDave Kleikamp { 5744262b4662SJan Kara struct super_block *sb = dquot->dq_sb; 5745262b4662SJan Kara struct ext4_sb_info *sbi = EXT4_SB(sb); 5746262b4662SJan Kara 57472c8be6b2SJan Kara /* Are we journaling quotas? */ 5748e2b911c5SDarrick J. Wong if (ext4_has_feature_quota(sb) || 5749262b4662SJan Kara sbi->s_qf_names[USRQUOTA] || sbi->s_qf_names[GRPQUOTA]) { 5750ac27a0ecSDave Kleikamp dquot_mark_dquot_dirty(dquot); 5751617ba13bSMingming Cao return ext4_write_dquot(dquot); 5752ac27a0ecSDave Kleikamp } else { 5753ac27a0ecSDave Kleikamp return dquot_mark_dquot_dirty(dquot); 5754ac27a0ecSDave Kleikamp } 5755ac27a0ecSDave Kleikamp } 5756ac27a0ecSDave Kleikamp 5757617ba13bSMingming Cao static int ext4_write_info(struct super_block *sb, int type) 5758ac27a0ecSDave Kleikamp { 5759ac27a0ecSDave Kleikamp int ret, err; 5760ac27a0ecSDave Kleikamp handle_t *handle; 5761ac27a0ecSDave Kleikamp 5762ac27a0ecSDave Kleikamp /* Data block + inode block */ 57632b0143b5SDavid Howells handle = ext4_journal_start(d_inode(sb->s_root), EXT4_HT_QUOTA, 2); 5764ac27a0ecSDave Kleikamp if (IS_ERR(handle)) 5765ac27a0ecSDave Kleikamp return PTR_ERR(handle); 5766ac27a0ecSDave Kleikamp ret = dquot_commit_info(sb, type); 5767617ba13bSMingming Cao err = ext4_journal_stop(handle); 5768ac27a0ecSDave Kleikamp if (!ret) 5769ac27a0ecSDave Kleikamp ret = err; 5770ac27a0ecSDave Kleikamp return ret; 5771ac27a0ecSDave Kleikamp } 5772ac27a0ecSDave Kleikamp 5773ac27a0ecSDave Kleikamp /* 5774ac27a0ecSDave Kleikamp * Turn on quotas during mount time - we need to find 5775ac27a0ecSDave Kleikamp * the quota file and such... 5776ac27a0ecSDave Kleikamp */ 5777617ba13bSMingming Cao static int ext4_quota_on_mount(struct super_block *sb, int type) 5778ac27a0ecSDave Kleikamp { 577933458eabSTheodore Ts'o return dquot_quota_on_mount(sb, get_qf_name(sb, EXT4_SB(sb), type), 5780617ba13bSMingming Cao EXT4_SB(sb)->s_jquota_fmt, type); 5781ac27a0ecSDave Kleikamp } 5782ac27a0ecSDave Kleikamp 5783daf647d2STheodore Ts'o static void lockdep_set_quota_inode(struct inode *inode, int subclass) 5784daf647d2STheodore Ts'o { 5785daf647d2STheodore Ts'o struct ext4_inode_info *ei = EXT4_I(inode); 5786daf647d2STheodore Ts'o 5787daf647d2STheodore Ts'o /* The first argument of lockdep_set_subclass has to be 5788daf647d2STheodore Ts'o * *exactly* the same as the argument to init_rwsem() --- in 5789daf647d2STheodore Ts'o * this case, in init_once() --- or lockdep gets unhappy 5790daf647d2STheodore Ts'o * because the name of the lock is set using the 5791daf647d2STheodore Ts'o * stringification of the argument to init_rwsem(). 5792daf647d2STheodore Ts'o */ 5793daf647d2STheodore Ts'o (void) ei; /* shut up clang warning if !CONFIG_LOCKDEP */ 5794daf647d2STheodore Ts'o lockdep_set_subclass(&ei->i_data_sem, subclass); 5795daf647d2STheodore Ts'o } 5796daf647d2STheodore Ts'o 5797ac27a0ecSDave Kleikamp /* 5798ac27a0ecSDave Kleikamp * Standard function to be called on quota_on 5799ac27a0ecSDave Kleikamp */ 5800617ba13bSMingming Cao static int ext4_quota_on(struct super_block *sb, int type, int format_id, 58018c54ca9cSAl Viro const struct path *path) 5802ac27a0ecSDave Kleikamp { 5803ac27a0ecSDave Kleikamp int err; 5804ac27a0ecSDave Kleikamp 5805ac27a0ecSDave Kleikamp if (!test_opt(sb, QUOTA)) 5806ac27a0ecSDave Kleikamp return -EINVAL; 58070623543bSJan Kara 5808ac27a0ecSDave Kleikamp /* Quotafile not on the same filesystem? */ 5809d8c9584eSAl Viro if (path->dentry->d_sb != sb) 5810ac27a0ecSDave Kleikamp return -EXDEV; 58110623543bSJan Kara /* Journaling quota? */ 58120623543bSJan Kara if (EXT4_SB(sb)->s_qf_names[type]) { 58132b2d6d01STheodore Ts'o /* Quotafile not in fs root? */ 5814f00c9e44SJan Kara if (path->dentry->d_parent != sb->s_root) 5815b31e1552SEric Sandeen ext4_msg(sb, KERN_WARNING, 5816b31e1552SEric Sandeen "Quota file not on filesystem root. " 5817b31e1552SEric Sandeen "Journaled quota will not work"); 581891389240SJan Kara sb_dqopt(sb)->flags |= DQUOT_NOLIST_DIRTY; 581991389240SJan Kara } else { 582091389240SJan Kara /* 582191389240SJan Kara * Clear the flag just in case mount options changed since 582291389240SJan Kara * last time. 582391389240SJan Kara */ 582491389240SJan Kara sb_dqopt(sb)->flags &= ~DQUOT_NOLIST_DIRTY; 58250623543bSJan Kara } 58260623543bSJan Kara 58270623543bSJan Kara /* 58280623543bSJan Kara * When we journal data on quota file, we have to flush journal to see 58290623543bSJan Kara * all updates to the file when we bypass pagecache... 58300623543bSJan Kara */ 58310390131bSFrank Mayhar if (EXT4_SB(sb)->s_journal && 58322b0143b5SDavid Howells ext4_should_journal_data(d_inode(path->dentry))) { 58330623543bSJan Kara /* 58340623543bSJan Kara * We don't need to lock updates but journal_flush() could 58350623543bSJan Kara * otherwise be livelocked... 58360623543bSJan Kara */ 58370623543bSJan Kara jbd2_journal_lock_updates(EXT4_SB(sb)->s_journal); 58387ffe1ea8SHidehiro Kawai err = jbd2_journal_flush(EXT4_SB(sb)->s_journal); 58390623543bSJan Kara jbd2_journal_unlock_updates(EXT4_SB(sb)->s_journal); 5840f00c9e44SJan Kara if (err) 58417ffe1ea8SHidehiro Kawai return err; 58427ffe1ea8SHidehiro Kawai } 5843957153fcSJan Kara 5844daf647d2STheodore Ts'o lockdep_set_quota_inode(path->dentry->d_inode, I_DATA_SEM_QUOTA); 5845daf647d2STheodore Ts'o err = dquot_quota_on(sb, type, format_id, path); 5846957153fcSJan Kara if (err) { 5847daf647d2STheodore Ts'o lockdep_set_quota_inode(path->dentry->d_inode, 5848daf647d2STheodore Ts'o I_DATA_SEM_NORMAL); 5849957153fcSJan Kara } else { 5850957153fcSJan Kara struct inode *inode = d_inode(path->dentry); 5851957153fcSJan Kara handle_t *handle; 5852957153fcSJan Kara 585361a92987SJan Kara /* 585461a92987SJan Kara * Set inode flags to prevent userspace from messing with quota 585561a92987SJan Kara * files. If this fails, we return success anyway since quotas 585661a92987SJan Kara * are already enabled and this is not a hard failure. 585761a92987SJan Kara */ 5858957153fcSJan Kara inode_lock(inode); 5859957153fcSJan Kara handle = ext4_journal_start(inode, EXT4_HT_QUOTA, 1); 5860957153fcSJan Kara if (IS_ERR(handle)) 5861957153fcSJan Kara goto unlock_inode; 5862957153fcSJan Kara EXT4_I(inode)->i_flags |= EXT4_NOATIME_FL | EXT4_IMMUTABLE_FL; 5863957153fcSJan Kara inode_set_flags(inode, S_NOATIME | S_IMMUTABLE, 5864957153fcSJan Kara S_NOATIME | S_IMMUTABLE); 5865957153fcSJan Kara ext4_mark_inode_dirty(handle, inode); 5866957153fcSJan Kara ext4_journal_stop(handle); 5867957153fcSJan Kara unlock_inode: 5868957153fcSJan Kara inode_unlock(inode); 5869957153fcSJan Kara } 5870daf647d2STheodore Ts'o return err; 5871ac27a0ecSDave Kleikamp } 5872ac27a0ecSDave Kleikamp 58737c319d32SAditya Kali static int ext4_quota_enable(struct super_block *sb, int type, int format_id, 58747c319d32SAditya Kali unsigned int flags) 58757c319d32SAditya Kali { 58767c319d32SAditya Kali int err; 58777c319d32SAditya Kali struct inode *qf_inode; 5878a2d4a646SJan Kara unsigned long qf_inums[EXT4_MAXQUOTAS] = { 58797c319d32SAditya Kali le32_to_cpu(EXT4_SB(sb)->s_es->s_usr_quota_inum), 5880689c958cSLi Xi le32_to_cpu(EXT4_SB(sb)->s_es->s_grp_quota_inum), 5881689c958cSLi Xi le32_to_cpu(EXT4_SB(sb)->s_es->s_prj_quota_inum) 58827c319d32SAditya Kali }; 58837c319d32SAditya Kali 5884e2b911c5SDarrick J. Wong BUG_ON(!ext4_has_feature_quota(sb)); 58857c319d32SAditya Kali 58867c319d32SAditya Kali if (!qf_inums[type]) 58877c319d32SAditya Kali return -EPERM; 58887c319d32SAditya Kali 58898a363970STheodore Ts'o qf_inode = ext4_iget(sb, qf_inums[type], EXT4_IGET_SPECIAL); 58907c319d32SAditya Kali if (IS_ERR(qf_inode)) { 58917c319d32SAditya Kali ext4_error(sb, "Bad quota inode # %lu", qf_inums[type]); 58927c319d32SAditya Kali return PTR_ERR(qf_inode); 58937c319d32SAditya Kali } 58947c319d32SAditya Kali 5895bcb13850SJan Kara /* Don't account quota for quota files to avoid recursion */ 5896bcb13850SJan Kara qf_inode->i_flags |= S_NOQUOTA; 5897daf647d2STheodore Ts'o lockdep_set_quota_inode(qf_inode, I_DATA_SEM_QUOTA); 58987212b95eSJan Kara err = dquot_load_quota_inode(qf_inode, type, format_id, flags); 5899daf647d2STheodore Ts'o if (err) 5900daf647d2STheodore Ts'o lockdep_set_quota_inode(qf_inode, I_DATA_SEM_NORMAL); 590161157b24SPan Bian iput(qf_inode); 59027c319d32SAditya Kali 59037c319d32SAditya Kali return err; 59047c319d32SAditya Kali } 59057c319d32SAditya Kali 59067c319d32SAditya Kali /* Enable usage tracking for all quota types. */ 59077c319d32SAditya Kali static int ext4_enable_quotas(struct super_block *sb) 59087c319d32SAditya Kali { 59097c319d32SAditya Kali int type, err = 0; 5910a2d4a646SJan Kara unsigned long qf_inums[EXT4_MAXQUOTAS] = { 59117c319d32SAditya Kali le32_to_cpu(EXT4_SB(sb)->s_es->s_usr_quota_inum), 5912689c958cSLi Xi le32_to_cpu(EXT4_SB(sb)->s_es->s_grp_quota_inum), 5913689c958cSLi Xi le32_to_cpu(EXT4_SB(sb)->s_es->s_prj_quota_inum) 59147c319d32SAditya Kali }; 591549da9392SJan Kara bool quota_mopt[EXT4_MAXQUOTAS] = { 591649da9392SJan Kara test_opt(sb, USRQUOTA), 591749da9392SJan Kara test_opt(sb, GRPQUOTA), 591849da9392SJan Kara test_opt(sb, PRJQUOTA), 591949da9392SJan Kara }; 59207c319d32SAditya Kali 592191389240SJan Kara sb_dqopt(sb)->flags |= DQUOT_QUOTA_SYS_FILE | DQUOT_NOLIST_DIRTY; 5922a2d4a646SJan Kara for (type = 0; type < EXT4_MAXQUOTAS; type++) { 59237c319d32SAditya Kali if (qf_inums[type]) { 59247c319d32SAditya Kali err = ext4_quota_enable(sb, type, QFMT_VFS_V1, 592549da9392SJan Kara DQUOT_USAGE_ENABLED | 592649da9392SJan Kara (quota_mopt[type] ? DQUOT_LIMITS_ENABLED : 0)); 59277c319d32SAditya Kali if (err) { 59287c319d32SAditya Kali ext4_warning(sb, 592972ba7450STheodore Ts'o "Failed to enable quota tracking " 593072ba7450STheodore Ts'o "(type=%d, err=%d). Please run " 593172ba7450STheodore Ts'o "e2fsck to fix.", type, err); 59327f144fd0SJunichi Uekawa for (type--; type >= 0; type--) 59337f144fd0SJunichi Uekawa dquot_quota_off(sb, type); 59347f144fd0SJunichi Uekawa 59357c319d32SAditya Kali return err; 59367c319d32SAditya Kali } 59377c319d32SAditya Kali } 59387c319d32SAditya Kali } 59397c319d32SAditya Kali return 0; 59407c319d32SAditya Kali } 59417c319d32SAditya Kali 5942ca0e05e4SDmitry Monakhov static int ext4_quota_off(struct super_block *sb, int type) 5943ca0e05e4SDmitry Monakhov { 594421f97697SJan Kara struct inode *inode = sb_dqopt(sb)->files[type]; 594521f97697SJan Kara handle_t *handle; 5946957153fcSJan Kara int err; 594721f97697SJan Kara 594887009d86SDmitry Monakhov /* Force all delayed allocation blocks to be allocated. 594987009d86SDmitry Monakhov * Caller already holds s_umount sem */ 595087009d86SDmitry Monakhov if (test_opt(sb, DELALLOC)) 5951ca0e05e4SDmitry Monakhov sync_filesystem(sb); 5952ca0e05e4SDmitry Monakhov 5953957153fcSJan Kara if (!inode || !igrab(inode)) 59540b268590SAmir Goldstein goto out; 59550b268590SAmir Goldstein 5956957153fcSJan Kara err = dquot_quota_off(sb, type); 5957964edf66SJan Kara if (err || ext4_has_feature_quota(sb)) 5958957153fcSJan Kara goto out_put; 5959957153fcSJan Kara 5960957153fcSJan Kara inode_lock(inode); 596161a92987SJan Kara /* 596261a92987SJan Kara * Update modification times of quota files when userspace can 596361a92987SJan Kara * start looking at them. If we fail, we return success anyway since 596461a92987SJan Kara * this is not a hard failure and quotas are already disabled. 596561a92987SJan Kara */ 59669924a92aSTheodore Ts'o handle = ext4_journal_start(inode, EXT4_HT_QUOTA, 1); 596721f97697SJan Kara if (IS_ERR(handle)) 5968957153fcSJan Kara goto out_unlock; 5969957153fcSJan Kara EXT4_I(inode)->i_flags &= ~(EXT4_NOATIME_FL | EXT4_IMMUTABLE_FL); 5970957153fcSJan Kara inode_set_flags(inode, 0, S_NOATIME | S_IMMUTABLE); 5971eeca7ea1SDeepa Dinamani inode->i_mtime = inode->i_ctime = current_time(inode); 597221f97697SJan Kara ext4_mark_inode_dirty(handle, inode); 597321f97697SJan Kara ext4_journal_stop(handle); 5974957153fcSJan Kara out_unlock: 5975957153fcSJan Kara inode_unlock(inode); 5976957153fcSJan Kara out_put: 5977964edf66SJan Kara lockdep_set_quota_inode(inode, I_DATA_SEM_NORMAL); 5978957153fcSJan Kara iput(inode); 5979957153fcSJan Kara return err; 598021f97697SJan Kara out: 5981ca0e05e4SDmitry Monakhov return dquot_quota_off(sb, type); 5982ca0e05e4SDmitry Monakhov } 5983ca0e05e4SDmitry Monakhov 5984ac27a0ecSDave Kleikamp /* Read data from quotafile - avoid pagecache and such because we cannot afford 5985ac27a0ecSDave Kleikamp * acquiring the locks... As quota files are never truncated and quota code 5986ac27a0ecSDave Kleikamp * itself serializes the operations (and no one else should touch the files) 5987ac27a0ecSDave Kleikamp * we don't have to be afraid of races */ 5988617ba13bSMingming Cao static ssize_t ext4_quota_read(struct super_block *sb, int type, char *data, 5989ac27a0ecSDave Kleikamp size_t len, loff_t off) 5990ac27a0ecSDave Kleikamp { 5991ac27a0ecSDave Kleikamp struct inode *inode = sb_dqopt(sb)->files[type]; 5992725d26d3SAneesh Kumar K.V ext4_lblk_t blk = off >> EXT4_BLOCK_SIZE_BITS(sb); 5993ac27a0ecSDave Kleikamp int offset = off & (sb->s_blocksize - 1); 5994ac27a0ecSDave Kleikamp int tocopy; 5995ac27a0ecSDave Kleikamp size_t toread; 5996ac27a0ecSDave Kleikamp struct buffer_head *bh; 5997ac27a0ecSDave Kleikamp loff_t i_size = i_size_read(inode); 5998ac27a0ecSDave Kleikamp 5999ac27a0ecSDave Kleikamp if (off > i_size) 6000ac27a0ecSDave Kleikamp return 0; 6001ac27a0ecSDave Kleikamp if (off+len > i_size) 6002ac27a0ecSDave Kleikamp len = i_size-off; 6003ac27a0ecSDave Kleikamp toread = len; 6004ac27a0ecSDave Kleikamp while (toread > 0) { 6005ac27a0ecSDave Kleikamp tocopy = sb->s_blocksize - offset < toread ? 6006ac27a0ecSDave Kleikamp sb->s_blocksize - offset : toread; 60071c215028STheodore Ts'o bh = ext4_bread(NULL, inode, blk, 0); 60081c215028STheodore Ts'o if (IS_ERR(bh)) 60091c215028STheodore Ts'o return PTR_ERR(bh); 6010ac27a0ecSDave Kleikamp if (!bh) /* A hole? */ 6011ac27a0ecSDave Kleikamp memset(data, 0, tocopy); 6012ac27a0ecSDave Kleikamp else 6013ac27a0ecSDave Kleikamp memcpy(data, bh->b_data+offset, tocopy); 6014ac27a0ecSDave Kleikamp brelse(bh); 6015ac27a0ecSDave Kleikamp offset = 0; 6016ac27a0ecSDave Kleikamp toread -= tocopy; 6017ac27a0ecSDave Kleikamp data += tocopy; 6018ac27a0ecSDave Kleikamp blk++; 6019ac27a0ecSDave Kleikamp } 6020ac27a0ecSDave Kleikamp return len; 6021ac27a0ecSDave Kleikamp } 6022ac27a0ecSDave Kleikamp 6023ac27a0ecSDave Kleikamp /* Write to quotafile (we know the transaction is already started and has 6024ac27a0ecSDave Kleikamp * enough credits) */ 6025617ba13bSMingming Cao static ssize_t ext4_quota_write(struct super_block *sb, int type, 6026ac27a0ecSDave Kleikamp const char *data, size_t len, loff_t off) 6027ac27a0ecSDave Kleikamp { 6028ac27a0ecSDave Kleikamp struct inode *inode = sb_dqopt(sb)->files[type]; 6029725d26d3SAneesh Kumar K.V ext4_lblk_t blk = off >> EXT4_BLOCK_SIZE_BITS(sb); 60301c215028STheodore Ts'o int err, offset = off & (sb->s_blocksize - 1); 6031c5e298aeSTheodore Ts'o int retries = 0; 6032ac27a0ecSDave Kleikamp struct buffer_head *bh; 6033ac27a0ecSDave Kleikamp handle_t *handle = journal_current_handle(); 6034ac27a0ecSDave Kleikamp 60350390131bSFrank Mayhar if (EXT4_SB(sb)->s_journal && !handle) { 6036b31e1552SEric Sandeen ext4_msg(sb, KERN_WARNING, "Quota write (off=%llu, len=%llu)" 6037b31e1552SEric Sandeen " cancelled because transaction is not started", 60389c3013e9SJan Kara (unsigned long long)off, (unsigned long long)len); 60399c3013e9SJan Kara return -EIO; 60409c3013e9SJan Kara } 604167eeb568SDmitry Monakhov /* 604267eeb568SDmitry Monakhov * Since we account only one data block in transaction credits, 604367eeb568SDmitry Monakhov * then it is impossible to cross a block boundary. 604467eeb568SDmitry Monakhov */ 604567eeb568SDmitry Monakhov if (sb->s_blocksize - offset < len) { 604667eeb568SDmitry Monakhov ext4_msg(sb, KERN_WARNING, "Quota write (off=%llu, len=%llu)" 604767eeb568SDmitry Monakhov " cancelled because not block aligned", 604867eeb568SDmitry Monakhov (unsigned long long)off, (unsigned long long)len); 604967eeb568SDmitry Monakhov return -EIO; 605067eeb568SDmitry Monakhov } 605167eeb568SDmitry Monakhov 6052c5e298aeSTheodore Ts'o do { 6053c5e298aeSTheodore Ts'o bh = ext4_bread(handle, inode, blk, 6054c5e298aeSTheodore Ts'o EXT4_GET_BLOCKS_CREATE | 6055c5e298aeSTheodore Ts'o EXT4_GET_BLOCKS_METADATA_NOFAIL); 6056c5e298aeSTheodore Ts'o } while (IS_ERR(bh) && (PTR_ERR(bh) == -ENOSPC) && 6057c5e298aeSTheodore Ts'o ext4_should_retry_alloc(inode->i_sb, &retries)); 60581c215028STheodore Ts'o if (IS_ERR(bh)) 60591c215028STheodore Ts'o return PTR_ERR(bh); 6060ac27a0ecSDave Kleikamp if (!bh) 6061ac27a0ecSDave Kleikamp goto out; 60625d601255Sliang xie BUFFER_TRACE(bh, "get write access"); 6063617ba13bSMingming Cao err = ext4_journal_get_write_access(handle, bh); 6064ac27a0ecSDave Kleikamp if (err) { 6065ac27a0ecSDave Kleikamp brelse(bh); 60661c215028STheodore Ts'o return err; 6067ac27a0ecSDave Kleikamp } 6068ac27a0ecSDave Kleikamp lock_buffer(bh); 606967eeb568SDmitry Monakhov memcpy(bh->b_data+offset, data, len); 6070ac27a0ecSDave Kleikamp flush_dcache_page(bh->b_page); 6071ac27a0ecSDave Kleikamp unlock_buffer(bh); 60720390131bSFrank Mayhar err = ext4_handle_dirty_metadata(handle, NULL, bh); 6073ac27a0ecSDave Kleikamp brelse(bh); 6074ac27a0ecSDave Kleikamp out: 607567eeb568SDmitry Monakhov if (inode->i_size < off + len) { 607667eeb568SDmitry Monakhov i_size_write(inode, off + len); 6077617ba13bSMingming Cao EXT4_I(inode)->i_disksize = inode->i_size; 6078617ba13bSMingming Cao ext4_mark_inode_dirty(handle, inode); 607921f97697SJan Kara } 608067eeb568SDmitry Monakhov return len; 6081ac27a0ecSDave Kleikamp } 6082ac27a0ecSDave Kleikamp #endif 6083ac27a0ecSDave Kleikamp 6084152a0836SAl Viro static struct dentry *ext4_mount(struct file_system_type *fs_type, int flags, 6085152a0836SAl Viro const char *dev_name, void *data) 6086ac27a0ecSDave Kleikamp { 6087152a0836SAl Viro return mount_bdev(fs_type, flags, dev_name, data, ext4_fill_super); 6088ac27a0ecSDave Kleikamp } 6089ac27a0ecSDave Kleikamp 6090c290ea01SJan Kara #if !defined(CONFIG_EXT2_FS) && !defined(CONFIG_EXT2_FS_MODULE) && defined(CONFIG_EXT4_USE_FOR_EXT2) 609124b58424STheodore Ts'o static inline void register_as_ext2(void) 609224b58424STheodore Ts'o { 609324b58424STheodore Ts'o int err = register_filesystem(&ext2_fs_type); 609424b58424STheodore Ts'o if (err) 609524b58424STheodore Ts'o printk(KERN_WARNING 609624b58424STheodore Ts'o "EXT4-fs: Unable to register as ext2 (%d)\n", err); 609724b58424STheodore Ts'o } 609824b58424STheodore Ts'o 609924b58424STheodore Ts'o static inline void unregister_as_ext2(void) 610024b58424STheodore Ts'o { 610124b58424STheodore Ts'o unregister_filesystem(&ext2_fs_type); 610224b58424STheodore Ts'o } 61032035e776STheodore Ts'o 61042035e776STheodore Ts'o static inline int ext2_feature_set_ok(struct super_block *sb) 61052035e776STheodore Ts'o { 6106e2b911c5SDarrick J. Wong if (ext4_has_unknown_ext2_incompat_features(sb)) 61072035e776STheodore Ts'o return 0; 6108bc98a42cSDavid Howells if (sb_rdonly(sb)) 61092035e776STheodore Ts'o return 1; 6110e2b911c5SDarrick J. Wong if (ext4_has_unknown_ext2_ro_compat_features(sb)) 61112035e776STheodore Ts'o return 0; 61122035e776STheodore Ts'o return 1; 61132035e776STheodore Ts'o } 611424b58424STheodore Ts'o #else 611524b58424STheodore Ts'o static inline void register_as_ext2(void) { } 611624b58424STheodore Ts'o static inline void unregister_as_ext2(void) { } 61172035e776STheodore Ts'o static inline int ext2_feature_set_ok(struct super_block *sb) { return 0; } 611824b58424STheodore Ts'o #endif 611924b58424STheodore Ts'o 612024b58424STheodore Ts'o static inline void register_as_ext3(void) 612124b58424STheodore Ts'o { 612224b58424STheodore Ts'o int err = register_filesystem(&ext3_fs_type); 612324b58424STheodore Ts'o if (err) 612424b58424STheodore Ts'o printk(KERN_WARNING 612524b58424STheodore Ts'o "EXT4-fs: Unable to register as ext3 (%d)\n", err); 612624b58424STheodore Ts'o } 612724b58424STheodore Ts'o 612824b58424STheodore Ts'o static inline void unregister_as_ext3(void) 612924b58424STheodore Ts'o { 613024b58424STheodore Ts'o unregister_filesystem(&ext3_fs_type); 613124b58424STheodore Ts'o } 61322035e776STheodore Ts'o 61332035e776STheodore Ts'o static inline int ext3_feature_set_ok(struct super_block *sb) 61342035e776STheodore Ts'o { 6135e2b911c5SDarrick J. Wong if (ext4_has_unknown_ext3_incompat_features(sb)) 61362035e776STheodore Ts'o return 0; 6137e2b911c5SDarrick J. Wong if (!ext4_has_feature_journal(sb)) 61382035e776STheodore Ts'o return 0; 6139bc98a42cSDavid Howells if (sb_rdonly(sb)) 61402035e776STheodore Ts'o return 1; 6141e2b911c5SDarrick J. Wong if (ext4_has_unknown_ext3_ro_compat_features(sb)) 61422035e776STheodore Ts'o return 0; 61432035e776STheodore Ts'o return 1; 61442035e776STheodore Ts'o } 614524b58424STheodore Ts'o 614603010a33STheodore Ts'o static struct file_system_type ext4_fs_type = { 6147ac27a0ecSDave Kleikamp .owner = THIS_MODULE, 614803010a33STheodore Ts'o .name = "ext4", 6149152a0836SAl Viro .mount = ext4_mount, 6150ac27a0ecSDave Kleikamp .kill_sb = kill_block_super, 6151ac27a0ecSDave Kleikamp .fs_flags = FS_REQUIRES_DEV, 6152ac27a0ecSDave Kleikamp }; 61537f78e035SEric W. Biederman MODULE_ALIAS_FS("ext4"); 6154ac27a0ecSDave Kleikamp 6155e9e3bcecSEric Sandeen /* Shared across all ext4 file systems */ 6156e9e3bcecSEric Sandeen wait_queue_head_t ext4__ioend_wq[EXT4_WQ_HASH_SZ]; 6157e9e3bcecSEric Sandeen 61585dabfc78STheodore Ts'o static int __init ext4_init_fs(void) 6159ac27a0ecSDave Kleikamp { 6160e9e3bcecSEric Sandeen int i, err; 6161c9de560dSAlex Tomas 6162e294a537STheodore Ts'o ratelimit_state_init(&ext4_mount_msg_ratelimit, 30 * HZ, 64); 616307c0c5d8SAl Viro ext4_li_info = NULL; 616407c0c5d8SAl Viro mutex_init(&ext4_li_mtx); 616507c0c5d8SAl Viro 61669a4c8019SCarlos Maiolino /* Build-time check for flags consistency */ 616712e9b892SDmitry Monakhov ext4_check_flag_values(); 6168e9e3bcecSEric Sandeen 6169e142d052SJan Kara for (i = 0; i < EXT4_WQ_HASH_SZ; i++) 6170e9e3bcecSEric Sandeen init_waitqueue_head(&ext4__ioend_wq[i]); 6171e9e3bcecSEric Sandeen 617251865fdaSZheng Liu err = ext4_init_es(); 61736fd058f7STheodore Ts'o if (err) 61746fd058f7STheodore Ts'o return err; 617551865fdaSZheng Liu 61761dc0aa46SEric Whitney err = ext4_init_pending(); 61771dc0aa46SEric Whitney if (err) 617822cfe4b4SEric Biggers goto out7; 617922cfe4b4SEric Biggers 618022cfe4b4SEric Biggers err = ext4_init_post_read_processing(); 618122cfe4b4SEric Biggers if (err) 61821dc0aa46SEric Whitney goto out6; 61831dc0aa46SEric Whitney 618451865fdaSZheng Liu err = ext4_init_pageio(); 618551865fdaSZheng Liu if (err) 6186b5799018STheodore Ts'o goto out5; 618751865fdaSZheng Liu 61885dabfc78STheodore Ts'o err = ext4_init_system_zone(); 6189bd2d0210STheodore Ts'o if (err) 6190b5799018STheodore Ts'o goto out4; 6191857ac889SLukas Czerner 6192b5799018STheodore Ts'o err = ext4_init_sysfs(); 6193dd68314cSTheodore Ts'o if (err) 6194b5799018STheodore Ts'o goto out3; 6195857ac889SLukas Czerner 61965dabfc78STheodore Ts'o err = ext4_init_mballoc(); 6197ac27a0ecSDave Kleikamp if (err) 6198c9de560dSAlex Tomas goto out2; 6199ac27a0ecSDave Kleikamp err = init_inodecache(); 6200ac27a0ecSDave Kleikamp if (err) 6201ac27a0ecSDave Kleikamp goto out1; 620224b58424STheodore Ts'o register_as_ext3(); 62032035e776STheodore Ts'o register_as_ext2(); 620403010a33STheodore Ts'o err = register_filesystem(&ext4_fs_type); 6205ac27a0ecSDave Kleikamp if (err) 6206ac27a0ecSDave Kleikamp goto out; 6207bfff6873SLukas Czerner 6208ac27a0ecSDave Kleikamp return 0; 6209ac27a0ecSDave Kleikamp out: 621024b58424STheodore Ts'o unregister_as_ext2(); 621124b58424STheodore Ts'o unregister_as_ext3(); 6212ac27a0ecSDave Kleikamp destroy_inodecache(); 6213ac27a0ecSDave Kleikamp out1: 62145dabfc78STheodore Ts'o ext4_exit_mballoc(); 62159c191f70ST Makphaibulchoke out2: 6216b5799018STheodore Ts'o ext4_exit_sysfs(); 6217b5799018STheodore Ts'o out3: 6218dd68314cSTheodore Ts'o ext4_exit_system_zone(); 6219b5799018STheodore Ts'o out4: 62205dabfc78STheodore Ts'o ext4_exit_pageio(); 6221b5799018STheodore Ts'o out5: 622222cfe4b4SEric Biggers ext4_exit_post_read_processing(); 62231dc0aa46SEric Whitney out6: 622422cfe4b4SEric Biggers ext4_exit_pending(); 622522cfe4b4SEric Biggers out7: 622651865fdaSZheng Liu ext4_exit_es(); 622751865fdaSZheng Liu 6228ac27a0ecSDave Kleikamp return err; 6229ac27a0ecSDave Kleikamp } 6230ac27a0ecSDave Kleikamp 62315dabfc78STheodore Ts'o static void __exit ext4_exit_fs(void) 6232ac27a0ecSDave Kleikamp { 6233bfff6873SLukas Czerner ext4_destroy_lazyinit_thread(); 623424b58424STheodore Ts'o unregister_as_ext2(); 623524b58424STheodore Ts'o unregister_as_ext3(); 623603010a33STheodore Ts'o unregister_filesystem(&ext4_fs_type); 6237ac27a0ecSDave Kleikamp destroy_inodecache(); 62385dabfc78STheodore Ts'o ext4_exit_mballoc(); 6239b5799018STheodore Ts'o ext4_exit_sysfs(); 62405dabfc78STheodore Ts'o ext4_exit_system_zone(); 62415dabfc78STheodore Ts'o ext4_exit_pageio(); 624222cfe4b4SEric Biggers ext4_exit_post_read_processing(); 6243dd12ed14SEric Sandeen ext4_exit_es(); 62441dc0aa46SEric Whitney ext4_exit_pending(); 6245ac27a0ecSDave Kleikamp } 6246ac27a0ecSDave Kleikamp 6247ac27a0ecSDave Kleikamp MODULE_AUTHOR("Remy Card, Stephen Tweedie, Andrew Morton, Andreas Dilger, Theodore Ts'o and others"); 624883982b6fSTheodore Ts'o MODULE_DESCRIPTION("Fourth Extended Filesystem"); 6249ac27a0ecSDave Kleikamp MODULE_LICENSE("GPL"); 62507ef79ad5STheodore Ts'o MODULE_SOFTDEP("pre: crc32c"); 62515dabfc78STheodore Ts'o module_init(ext4_init_fs) 62525dabfc78STheodore Ts'o module_exit(ext4_exit_fs) 6253