11da177e4SLinus Torvalds /* 27b718769SNathan Scott * Copyright (c) 2000-2002,2005 Silicon Graphics, Inc. 37b718769SNathan Scott * All Rights Reserved. 41da177e4SLinus Torvalds * 57b718769SNathan Scott * This program is free software; you can redistribute it and/or 67b718769SNathan Scott * modify it under the terms of the GNU General Public License as 71da177e4SLinus Torvalds * published by the Free Software Foundation. 81da177e4SLinus Torvalds * 97b718769SNathan Scott * This program is distributed in the hope that it would be useful, 107b718769SNathan Scott * but WITHOUT ANY WARRANTY; without even the implied warranty of 117b718769SNathan Scott * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 127b718769SNathan Scott * GNU General Public License for more details. 131da177e4SLinus Torvalds * 147b718769SNathan Scott * You should have received a copy of the GNU General Public License 157b718769SNathan Scott * along with this program; if not, write the Free Software Foundation, 167b718769SNathan Scott * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA 171da177e4SLinus Torvalds */ 181da177e4SLinus Torvalds #include "xfs.h" 19a844f451SNathan Scott #include "xfs_fs.h" 201da177e4SLinus Torvalds #include "xfs_types.h" 21a844f451SNathan Scott #include "xfs_bit.h" 221da177e4SLinus Torvalds #include "xfs_log.h" 23a844f451SNathan Scott #include "xfs_inum.h" 241da177e4SLinus Torvalds #include "xfs_trans.h" 251da177e4SLinus Torvalds #include "xfs_sb.h" 261da177e4SLinus Torvalds #include "xfs_ag.h" 27a844f451SNathan Scott #include "xfs_dir2.h" 281da177e4SLinus Torvalds #include "xfs_dmapi.h" 291da177e4SLinus Torvalds #include "xfs_mount.h" 30a844f451SNathan Scott #include "xfs_bmap_btree.h" 31a844f451SNathan Scott #include "xfs_alloc_btree.h" 32a844f451SNathan Scott #include "xfs_ialloc_btree.h" 33a844f451SNathan Scott #include "xfs_dir2_sf.h" 34a844f451SNathan Scott #include "xfs_attr_sf.h" 35a844f451SNathan Scott #include "xfs_dinode.h" 36a844f451SNathan Scott #include "xfs_inode.h" 37a844f451SNathan Scott #include "xfs_buf_item.h" 381da177e4SLinus Torvalds #include "xfs_trans_priv.h" 391da177e4SLinus Torvalds #include "xfs_error.h" 401da177e4SLinus Torvalds #include "xfs_rw.h" 410b1b213fSChristoph Hellwig #include "xfs_trace.h" 421da177e4SLinus Torvalds 431da177e4SLinus Torvalds 441da177e4SLinus Torvalds STATIC xfs_buf_t *xfs_trans_buf_item_match(xfs_trans_t *, xfs_buftarg_t *, 451da177e4SLinus Torvalds xfs_daddr_t, int); 461da177e4SLinus Torvalds STATIC xfs_buf_t *xfs_trans_buf_item_match_all(xfs_trans_t *, xfs_buftarg_t *, 471da177e4SLinus Torvalds xfs_daddr_t, int); 481da177e4SLinus Torvalds 49d7e84f41SChristoph Hellwig /* 50d7e84f41SChristoph Hellwig * Add the locked buffer to the transaction. 51d7e84f41SChristoph Hellwig * 52d7e84f41SChristoph Hellwig * The buffer must be locked, and it cannot be associated with any 53d7e84f41SChristoph Hellwig * transaction. 54d7e84f41SChristoph Hellwig * 55d7e84f41SChristoph Hellwig * If the buffer does not yet have a buf log item associated with it, 56d7e84f41SChristoph Hellwig * then allocate one for it. Then add the buf item to the transaction. 57d7e84f41SChristoph Hellwig */ 58d7e84f41SChristoph Hellwig STATIC void 59d7e84f41SChristoph Hellwig _xfs_trans_bjoin( 60d7e84f41SChristoph Hellwig struct xfs_trans *tp, 61d7e84f41SChristoph Hellwig struct xfs_buf *bp, 62d7e84f41SChristoph Hellwig int reset_recur) 63d7e84f41SChristoph Hellwig { 64d7e84f41SChristoph Hellwig struct xfs_buf_log_item *bip; 65d7e84f41SChristoph Hellwig 66d7e84f41SChristoph Hellwig ASSERT(XFS_BUF_ISBUSY(bp)); 67d7e84f41SChristoph Hellwig ASSERT(XFS_BUF_FSPRIVATE2(bp, void *) == NULL); 68d7e84f41SChristoph Hellwig 69d7e84f41SChristoph Hellwig /* 70d7e84f41SChristoph Hellwig * The xfs_buf_log_item pointer is stored in b_fsprivate. If 71d7e84f41SChristoph Hellwig * it doesn't have one yet, then allocate one and initialize it. 72d7e84f41SChristoph Hellwig * The checks to see if one is there are in xfs_buf_item_init(). 73d7e84f41SChristoph Hellwig */ 74d7e84f41SChristoph Hellwig xfs_buf_item_init(bp, tp->t_mountp); 75d7e84f41SChristoph Hellwig bip = XFS_BUF_FSPRIVATE(bp, xfs_buf_log_item_t *); 76d7e84f41SChristoph Hellwig ASSERT(!(bip->bli_flags & XFS_BLI_STALE)); 77d7e84f41SChristoph Hellwig ASSERT(!(bip->bli_format.blf_flags & XFS_BLI_CANCEL)); 78d7e84f41SChristoph Hellwig ASSERT(!(bip->bli_flags & XFS_BLI_LOGGED)); 79d7e84f41SChristoph Hellwig if (reset_recur) 80d7e84f41SChristoph Hellwig bip->bli_recur = 0; 81d7e84f41SChristoph Hellwig 82d7e84f41SChristoph Hellwig /* 83d7e84f41SChristoph Hellwig * Take a reference for this transaction on the buf item. 84d7e84f41SChristoph Hellwig */ 85d7e84f41SChristoph Hellwig atomic_inc(&bip->bli_refcount); 86d7e84f41SChristoph Hellwig 87d7e84f41SChristoph Hellwig /* 88d7e84f41SChristoph Hellwig * Get a log_item_desc to point at the new item. 89d7e84f41SChristoph Hellwig */ 90d7e84f41SChristoph Hellwig (void) xfs_trans_add_item(tp, (xfs_log_item_t *)bip); 91d7e84f41SChristoph Hellwig 92d7e84f41SChristoph Hellwig /* 93d7e84f41SChristoph Hellwig * Initialize b_fsprivate2 so we can find it with incore_match() 94d7e84f41SChristoph Hellwig * in xfs_trans_get_buf() and friends above. 95d7e84f41SChristoph Hellwig */ 96d7e84f41SChristoph Hellwig XFS_BUF_SET_FSPRIVATE2(bp, tp); 97d7e84f41SChristoph Hellwig 98d7e84f41SChristoph Hellwig } 99d7e84f41SChristoph Hellwig 100d7e84f41SChristoph Hellwig void 101d7e84f41SChristoph Hellwig xfs_trans_bjoin( 102d7e84f41SChristoph Hellwig struct xfs_trans *tp, 103d7e84f41SChristoph Hellwig struct xfs_buf *bp) 104d7e84f41SChristoph Hellwig { 105d7e84f41SChristoph Hellwig _xfs_trans_bjoin(tp, bp, 0); 106d7e84f41SChristoph Hellwig trace_xfs_trans_bjoin(bp->b_fspriv); 107d7e84f41SChristoph Hellwig } 1081da177e4SLinus Torvalds 1091da177e4SLinus Torvalds /* 1101da177e4SLinus Torvalds * Get and lock the buffer for the caller if it is not already 1111da177e4SLinus Torvalds * locked within the given transaction. If it is already locked 1121da177e4SLinus Torvalds * within the transaction, just increment its lock recursion count 1131da177e4SLinus Torvalds * and return a pointer to it. 1141da177e4SLinus Torvalds * 1151da177e4SLinus Torvalds * Use the fast path function xfs_trans_buf_item_match() or the buffer 1161da177e4SLinus Torvalds * cache routine incore_match() to find the buffer 1171da177e4SLinus Torvalds * if it is already owned by this transaction. 1181da177e4SLinus Torvalds * 1191da177e4SLinus Torvalds * If we don't already own the buffer, use get_buf() to get it. 1201da177e4SLinus Torvalds * If it doesn't yet have an associated xfs_buf_log_item structure, 1211da177e4SLinus Torvalds * then allocate one and add the item to this transaction. 1221da177e4SLinus Torvalds * 1231da177e4SLinus Torvalds * If the transaction pointer is NULL, make this just a normal 1241da177e4SLinus Torvalds * get_buf() call. 1251da177e4SLinus Torvalds */ 1261da177e4SLinus Torvalds xfs_buf_t * 1271da177e4SLinus Torvalds xfs_trans_get_buf(xfs_trans_t *tp, 1281da177e4SLinus Torvalds xfs_buftarg_t *target_dev, 1291da177e4SLinus Torvalds xfs_daddr_t blkno, 1301da177e4SLinus Torvalds int len, 1311da177e4SLinus Torvalds uint flags) 1321da177e4SLinus Torvalds { 1331da177e4SLinus Torvalds xfs_buf_t *bp; 1341da177e4SLinus Torvalds xfs_buf_log_item_t *bip; 1351da177e4SLinus Torvalds 1361da177e4SLinus Torvalds if (flags == 0) 1370cadda1cSChristoph Hellwig flags = XBF_LOCK | XBF_MAPPED; 1381da177e4SLinus Torvalds 1391da177e4SLinus Torvalds /* 1401da177e4SLinus Torvalds * Default to a normal get_buf() call if the tp is NULL. 1411da177e4SLinus Torvalds */ 1426ad112bfSChristoph Hellwig if (tp == NULL) 1430cadda1cSChristoph Hellwig return xfs_buf_get(target_dev, blkno, len, 1440cadda1cSChristoph Hellwig flags | XBF_DONT_BLOCK); 1451da177e4SLinus Torvalds 1461da177e4SLinus Torvalds /* 1471da177e4SLinus Torvalds * If we find the buffer in the cache with this transaction 1481da177e4SLinus Torvalds * pointer in its b_fsprivate2 field, then we know we already 1491da177e4SLinus Torvalds * have it locked. In this case we just increment the lock 1501da177e4SLinus Torvalds * recursion count and return the buffer to the caller. 1511da177e4SLinus Torvalds */ 1521da177e4SLinus Torvalds if (tp->t_items.lic_next == NULL) { 1531da177e4SLinus Torvalds bp = xfs_trans_buf_item_match(tp, target_dev, blkno, len); 1541da177e4SLinus Torvalds } else { 1551da177e4SLinus Torvalds bp = xfs_trans_buf_item_match_all(tp, target_dev, blkno, len); 1561da177e4SLinus Torvalds } 1571da177e4SLinus Torvalds if (bp != NULL) { 1581da177e4SLinus Torvalds ASSERT(XFS_BUF_VALUSEMA(bp) <= 0); 1590b1b213fSChristoph Hellwig if (XFS_FORCED_SHUTDOWN(tp->t_mountp)) 1601da177e4SLinus Torvalds XFS_BUF_SUPER_STALE(bp); 1610b1b213fSChristoph Hellwig 1621da177e4SLinus Torvalds /* 1631da177e4SLinus Torvalds * If the buffer is stale then it was binval'ed 1641da177e4SLinus Torvalds * since last read. This doesn't matter since the 1651da177e4SLinus Torvalds * caller isn't allowed to use the data anyway. 1661da177e4SLinus Torvalds */ 1670b1b213fSChristoph Hellwig else if (XFS_BUF_ISSTALE(bp)) 1681da177e4SLinus Torvalds ASSERT(!XFS_BUF_ISDELAYWRITE(bp)); 1690b1b213fSChristoph Hellwig 1701da177e4SLinus Torvalds ASSERT(XFS_BUF_FSPRIVATE2(bp, xfs_trans_t *) == tp); 1711da177e4SLinus Torvalds bip = XFS_BUF_FSPRIVATE(bp, xfs_buf_log_item_t *); 1721da177e4SLinus Torvalds ASSERT(bip != NULL); 1731da177e4SLinus Torvalds ASSERT(atomic_read(&bip->bli_refcount) > 0); 1741da177e4SLinus Torvalds bip->bli_recur++; 1750b1b213fSChristoph Hellwig trace_xfs_trans_get_buf_recur(bip); 1761da177e4SLinus Torvalds return (bp); 1771da177e4SLinus Torvalds } 1781da177e4SLinus Torvalds 1791da177e4SLinus Torvalds /* 1800cadda1cSChristoph Hellwig * We always specify the XBF_DONT_BLOCK flag within a transaction 1810cadda1cSChristoph Hellwig * so that get_buf does not try to push out a delayed write buffer 1821da177e4SLinus Torvalds * which might cause another transaction to take place (if the 1831da177e4SLinus Torvalds * buffer was delayed alloc). Such recursive transactions can 1841da177e4SLinus Torvalds * easily deadlock with our current transaction as well as cause 1851da177e4SLinus Torvalds * us to run out of stack space. 1861da177e4SLinus Torvalds */ 1870cadda1cSChristoph Hellwig bp = xfs_buf_get(target_dev, blkno, len, flags | XBF_DONT_BLOCK); 1881da177e4SLinus Torvalds if (bp == NULL) { 1891da177e4SLinus Torvalds return NULL; 1901da177e4SLinus Torvalds } 1911da177e4SLinus Torvalds 1921da177e4SLinus Torvalds ASSERT(!XFS_BUF_GETERROR(bp)); 1931da177e4SLinus Torvalds 194d7e84f41SChristoph Hellwig _xfs_trans_bjoin(tp, bp, 1); 195d7e84f41SChristoph Hellwig trace_xfs_trans_get_buf(bp->b_fspriv); 1961da177e4SLinus Torvalds return (bp); 1971da177e4SLinus Torvalds } 1981da177e4SLinus Torvalds 1991da177e4SLinus Torvalds /* 2001da177e4SLinus Torvalds * Get and lock the superblock buffer of this file system for the 2011da177e4SLinus Torvalds * given transaction. 2021da177e4SLinus Torvalds * 2031da177e4SLinus Torvalds * We don't need to use incore_match() here, because the superblock 2041da177e4SLinus Torvalds * buffer is a private buffer which we keep a pointer to in the 2051da177e4SLinus Torvalds * mount structure. 2061da177e4SLinus Torvalds */ 2071da177e4SLinus Torvalds xfs_buf_t * 2081da177e4SLinus Torvalds xfs_trans_getsb(xfs_trans_t *tp, 2091da177e4SLinus Torvalds struct xfs_mount *mp, 2101da177e4SLinus Torvalds int flags) 2111da177e4SLinus Torvalds { 2121da177e4SLinus Torvalds xfs_buf_t *bp; 2131da177e4SLinus Torvalds xfs_buf_log_item_t *bip; 2141da177e4SLinus Torvalds 2151da177e4SLinus Torvalds /* 2161da177e4SLinus Torvalds * Default to just trying to lock the superblock buffer 2171da177e4SLinus Torvalds * if tp is NULL. 2181da177e4SLinus Torvalds */ 2191da177e4SLinus Torvalds if (tp == NULL) { 2201da177e4SLinus Torvalds return (xfs_getsb(mp, flags)); 2211da177e4SLinus Torvalds } 2221da177e4SLinus Torvalds 2231da177e4SLinus Torvalds /* 2241da177e4SLinus Torvalds * If the superblock buffer already has this transaction 2251da177e4SLinus Torvalds * pointer in its b_fsprivate2 field, then we know we already 2261da177e4SLinus Torvalds * have it locked. In this case we just increment the lock 2271da177e4SLinus Torvalds * recursion count and return the buffer to the caller. 2281da177e4SLinus Torvalds */ 2291da177e4SLinus Torvalds bp = mp->m_sb_bp; 2301da177e4SLinus Torvalds if (XFS_BUF_FSPRIVATE2(bp, xfs_trans_t *) == tp) { 2311da177e4SLinus Torvalds bip = XFS_BUF_FSPRIVATE(bp, xfs_buf_log_item_t*); 2321da177e4SLinus Torvalds ASSERT(bip != NULL); 2331da177e4SLinus Torvalds ASSERT(atomic_read(&bip->bli_refcount) > 0); 2341da177e4SLinus Torvalds bip->bli_recur++; 2350b1b213fSChristoph Hellwig trace_xfs_trans_getsb_recur(bip); 2361da177e4SLinus Torvalds return (bp); 2371da177e4SLinus Torvalds } 2381da177e4SLinus Torvalds 2391da177e4SLinus Torvalds bp = xfs_getsb(mp, flags); 240d7e84f41SChristoph Hellwig if (bp == NULL) 2411da177e4SLinus Torvalds return NULL; 2421da177e4SLinus Torvalds 243d7e84f41SChristoph Hellwig _xfs_trans_bjoin(tp, bp, 1); 244d7e84f41SChristoph Hellwig trace_xfs_trans_getsb(bp->b_fspriv); 2451da177e4SLinus Torvalds return (bp); 2461da177e4SLinus Torvalds } 2471da177e4SLinus Torvalds 2481da177e4SLinus Torvalds #ifdef DEBUG 2491da177e4SLinus Torvalds xfs_buftarg_t *xfs_error_target; 2501da177e4SLinus Torvalds int xfs_do_error; 2511da177e4SLinus Torvalds int xfs_req_num; 2521da177e4SLinus Torvalds int xfs_error_mod = 33; 2531da177e4SLinus Torvalds #endif 2541da177e4SLinus Torvalds 2551da177e4SLinus Torvalds /* 2561da177e4SLinus Torvalds * Get and lock the buffer for the caller if it is not already 2571da177e4SLinus Torvalds * locked within the given transaction. If it has not yet been 2581da177e4SLinus Torvalds * read in, read it from disk. If it is already locked 2591da177e4SLinus Torvalds * within the transaction and already read in, just increment its 2601da177e4SLinus Torvalds * lock recursion count and return a pointer to it. 2611da177e4SLinus Torvalds * 2621da177e4SLinus Torvalds * Use the fast path function xfs_trans_buf_item_match() or the buffer 2631da177e4SLinus Torvalds * cache routine incore_match() to find the buffer 2641da177e4SLinus Torvalds * if it is already owned by this transaction. 2651da177e4SLinus Torvalds * 2661da177e4SLinus Torvalds * If we don't already own the buffer, use read_buf() to get it. 2671da177e4SLinus Torvalds * If it doesn't yet have an associated xfs_buf_log_item structure, 2681da177e4SLinus Torvalds * then allocate one and add the item to this transaction. 2691da177e4SLinus Torvalds * 2701da177e4SLinus Torvalds * If the transaction pointer is NULL, make this just a normal 2711da177e4SLinus Torvalds * read_buf() call. 2721da177e4SLinus Torvalds */ 2731da177e4SLinus Torvalds int 2741da177e4SLinus Torvalds xfs_trans_read_buf( 2751da177e4SLinus Torvalds xfs_mount_t *mp, 2761da177e4SLinus Torvalds xfs_trans_t *tp, 2771da177e4SLinus Torvalds xfs_buftarg_t *target, 2781da177e4SLinus Torvalds xfs_daddr_t blkno, 2791da177e4SLinus Torvalds int len, 2801da177e4SLinus Torvalds uint flags, 2811da177e4SLinus Torvalds xfs_buf_t **bpp) 2821da177e4SLinus Torvalds { 2831da177e4SLinus Torvalds xfs_buf_t *bp; 2841da177e4SLinus Torvalds xfs_buf_log_item_t *bip; 2851da177e4SLinus Torvalds int error; 2861da177e4SLinus Torvalds 2871da177e4SLinus Torvalds if (flags == 0) 2880cadda1cSChristoph Hellwig flags = XBF_LOCK | XBF_MAPPED; 2891da177e4SLinus Torvalds 2901da177e4SLinus Torvalds /* 2911da177e4SLinus Torvalds * Default to a normal get_buf() call if the tp is NULL. 2921da177e4SLinus Torvalds */ 2931da177e4SLinus Torvalds if (tp == NULL) { 2940cadda1cSChristoph Hellwig bp = xfs_buf_read(target, blkno, len, flags | XBF_DONT_BLOCK); 2951da177e4SLinus Torvalds if (!bp) 2960cadda1cSChristoph Hellwig return (flags & XBF_TRYLOCK) ? 297a3f74ffbSDavid Chinner EAGAIN : XFS_ERROR(ENOMEM); 2981da177e4SLinus Torvalds 299a0f7bfd3SJulia Lawall if (XFS_BUF_GETERROR(bp) != 0) { 3001da177e4SLinus Torvalds xfs_ioerror_alert("xfs_trans_read_buf", mp, 3011da177e4SLinus Torvalds bp, blkno); 3021da177e4SLinus Torvalds error = XFS_BUF_GETERROR(bp); 3031da177e4SLinus Torvalds xfs_buf_relse(bp); 3041da177e4SLinus Torvalds return error; 3051da177e4SLinus Torvalds } 3061da177e4SLinus Torvalds #ifdef DEBUG 307a0f7bfd3SJulia Lawall if (xfs_do_error) { 3081da177e4SLinus Torvalds if (xfs_error_target == target) { 3091da177e4SLinus Torvalds if (((xfs_req_num++) % xfs_error_mod) == 0) { 3101da177e4SLinus Torvalds xfs_buf_relse(bp); 311b6574520SNathan Scott cmn_err(CE_DEBUG, "Returning error!\n"); 3121da177e4SLinus Torvalds return XFS_ERROR(EIO); 3131da177e4SLinus Torvalds } 3141da177e4SLinus Torvalds } 3151da177e4SLinus Torvalds } 3161da177e4SLinus Torvalds #endif 3171da177e4SLinus Torvalds if (XFS_FORCED_SHUTDOWN(mp)) 3181da177e4SLinus Torvalds goto shutdown_abort; 3191da177e4SLinus Torvalds *bpp = bp; 3201da177e4SLinus Torvalds return 0; 3211da177e4SLinus Torvalds } 3221da177e4SLinus Torvalds 3231da177e4SLinus Torvalds /* 3241da177e4SLinus Torvalds * If we find the buffer in the cache with this transaction 3251da177e4SLinus Torvalds * pointer in its b_fsprivate2 field, then we know we already 3261da177e4SLinus Torvalds * have it locked. If it is already read in we just increment 3271da177e4SLinus Torvalds * the lock recursion count and return the buffer to the caller. 3281da177e4SLinus Torvalds * If the buffer is not yet read in, then we read it in, increment 3291da177e4SLinus Torvalds * the lock recursion count, and return it to the caller. 3301da177e4SLinus Torvalds */ 3311da177e4SLinus Torvalds if (tp->t_items.lic_next == NULL) { 3321da177e4SLinus Torvalds bp = xfs_trans_buf_item_match(tp, target, blkno, len); 3331da177e4SLinus Torvalds } else { 3341da177e4SLinus Torvalds bp = xfs_trans_buf_item_match_all(tp, target, blkno, len); 3351da177e4SLinus Torvalds } 3361da177e4SLinus Torvalds if (bp != NULL) { 3371da177e4SLinus Torvalds ASSERT(XFS_BUF_VALUSEMA(bp) <= 0); 3381da177e4SLinus Torvalds ASSERT(XFS_BUF_FSPRIVATE2(bp, xfs_trans_t *) == tp); 3391da177e4SLinus Torvalds ASSERT(XFS_BUF_FSPRIVATE(bp, void *) != NULL); 3401da177e4SLinus Torvalds ASSERT((XFS_BUF_ISERROR(bp)) == 0); 3411da177e4SLinus Torvalds if (!(XFS_BUF_ISDONE(bp))) { 3420b1b213fSChristoph Hellwig trace_xfs_trans_read_buf_io(bp, _RET_IP_); 3431da177e4SLinus Torvalds ASSERT(!XFS_BUF_ISASYNC(bp)); 3441da177e4SLinus Torvalds XFS_BUF_READ(bp); 3451da177e4SLinus Torvalds xfsbdstrat(tp->t_mountp, bp); 346d64e31a2SDavid Chinner error = xfs_iowait(bp); 347d64e31a2SDavid Chinner if (error) { 3481da177e4SLinus Torvalds xfs_ioerror_alert("xfs_trans_read_buf", mp, 3491da177e4SLinus Torvalds bp, blkno); 3501da177e4SLinus Torvalds xfs_buf_relse(bp); 3511da177e4SLinus Torvalds /* 352d64e31a2SDavid Chinner * We can gracefully recover from most read 353d64e31a2SDavid Chinner * errors. Ones we can't are those that happen 354d64e31a2SDavid Chinner * after the transaction's already dirty. 3551da177e4SLinus Torvalds */ 3561da177e4SLinus Torvalds if (tp->t_flags & XFS_TRANS_DIRTY) 3571da177e4SLinus Torvalds xfs_force_shutdown(tp->t_mountp, 3587d04a335SNathan Scott SHUTDOWN_META_IO_ERROR); 3591da177e4SLinus Torvalds return error; 3601da177e4SLinus Torvalds } 3611da177e4SLinus Torvalds } 3621da177e4SLinus Torvalds /* 3631da177e4SLinus Torvalds * We never locked this buf ourselves, so we shouldn't 3641da177e4SLinus Torvalds * brelse it either. Just get out. 3651da177e4SLinus Torvalds */ 3661da177e4SLinus Torvalds if (XFS_FORCED_SHUTDOWN(mp)) { 3670b1b213fSChristoph Hellwig trace_xfs_trans_read_buf_shut(bp, _RET_IP_); 3681da177e4SLinus Torvalds *bpp = NULL; 3691da177e4SLinus Torvalds return XFS_ERROR(EIO); 3701da177e4SLinus Torvalds } 3711da177e4SLinus Torvalds 3721da177e4SLinus Torvalds 3731da177e4SLinus Torvalds bip = XFS_BUF_FSPRIVATE(bp, xfs_buf_log_item_t*); 3741da177e4SLinus Torvalds bip->bli_recur++; 3751da177e4SLinus Torvalds 3761da177e4SLinus Torvalds ASSERT(atomic_read(&bip->bli_refcount) > 0); 3770b1b213fSChristoph Hellwig trace_xfs_trans_read_buf_recur(bip); 3781da177e4SLinus Torvalds *bpp = bp; 3791da177e4SLinus Torvalds return 0; 3801da177e4SLinus Torvalds } 3811da177e4SLinus Torvalds 3821da177e4SLinus Torvalds /* 3830cadda1cSChristoph Hellwig * We always specify the XBF_DONT_BLOCK flag within a transaction 3840cadda1cSChristoph Hellwig * so that get_buf does not try to push out a delayed write buffer 3851da177e4SLinus Torvalds * which might cause another transaction to take place (if the 3861da177e4SLinus Torvalds * buffer was delayed alloc). Such recursive transactions can 3871da177e4SLinus Torvalds * easily deadlock with our current transaction as well as cause 3881da177e4SLinus Torvalds * us to run out of stack space. 3891da177e4SLinus Torvalds */ 3900cadda1cSChristoph Hellwig bp = xfs_buf_read(target, blkno, len, flags | XBF_DONT_BLOCK); 3911da177e4SLinus Torvalds if (bp == NULL) { 3921da177e4SLinus Torvalds *bpp = NULL; 3931da177e4SLinus Torvalds return 0; 3941da177e4SLinus Torvalds } 3951da177e4SLinus Torvalds if (XFS_BUF_GETERROR(bp) != 0) { 3961da177e4SLinus Torvalds XFS_BUF_SUPER_STALE(bp); 3971da177e4SLinus Torvalds error = XFS_BUF_GETERROR(bp); 3981da177e4SLinus Torvalds 3991da177e4SLinus Torvalds xfs_ioerror_alert("xfs_trans_read_buf", mp, 4001da177e4SLinus Torvalds bp, blkno); 4011da177e4SLinus Torvalds if (tp->t_flags & XFS_TRANS_DIRTY) 4027d04a335SNathan Scott xfs_force_shutdown(tp->t_mountp, SHUTDOWN_META_IO_ERROR); 4031da177e4SLinus Torvalds xfs_buf_relse(bp); 4041da177e4SLinus Torvalds return error; 4051da177e4SLinus Torvalds } 4061da177e4SLinus Torvalds #ifdef DEBUG 4071da177e4SLinus Torvalds if (xfs_do_error && !(tp->t_flags & XFS_TRANS_DIRTY)) { 4081da177e4SLinus Torvalds if (xfs_error_target == target) { 4091da177e4SLinus Torvalds if (((xfs_req_num++) % xfs_error_mod) == 0) { 4101da177e4SLinus Torvalds xfs_force_shutdown(tp->t_mountp, 4117d04a335SNathan Scott SHUTDOWN_META_IO_ERROR); 4121da177e4SLinus Torvalds xfs_buf_relse(bp); 413b6574520SNathan Scott cmn_err(CE_DEBUG, "Returning trans error!\n"); 4141da177e4SLinus Torvalds return XFS_ERROR(EIO); 4151da177e4SLinus Torvalds } 4161da177e4SLinus Torvalds } 4171da177e4SLinus Torvalds } 4181da177e4SLinus Torvalds #endif 4191da177e4SLinus Torvalds if (XFS_FORCED_SHUTDOWN(mp)) 4201da177e4SLinus Torvalds goto shutdown_abort; 4211da177e4SLinus Torvalds 422d7e84f41SChristoph Hellwig _xfs_trans_bjoin(tp, bp, 1); 423d7e84f41SChristoph Hellwig trace_xfs_trans_read_buf(bp->b_fspriv); 4241da177e4SLinus Torvalds 4251da177e4SLinus Torvalds *bpp = bp; 4261da177e4SLinus Torvalds return 0; 4271da177e4SLinus Torvalds 4281da177e4SLinus Torvalds shutdown_abort: 4291da177e4SLinus Torvalds /* 4301da177e4SLinus Torvalds * the theory here is that buffer is good but we're 4311da177e4SLinus Torvalds * bailing out because the filesystem is being forcibly 4321da177e4SLinus Torvalds * shut down. So we should leave the b_flags alone since 4331da177e4SLinus Torvalds * the buffer's not staled and just get out. 4341da177e4SLinus Torvalds */ 4351da177e4SLinus Torvalds #if defined(DEBUG) 4361da177e4SLinus Torvalds if (XFS_BUF_ISSTALE(bp) && XFS_BUF_ISDELAYWRITE(bp)) 4371da177e4SLinus Torvalds cmn_err(CE_NOTE, "about to pop assert, bp == 0x%p", bp); 4381da177e4SLinus Torvalds #endif 4390cadda1cSChristoph Hellwig ASSERT((XFS_BUF_BFLAGS(bp) & (XBF_STALE|XBF_DELWRI)) != 4400cadda1cSChristoph Hellwig (XBF_STALE|XBF_DELWRI)); 4411da177e4SLinus Torvalds 4420b1b213fSChristoph Hellwig trace_xfs_trans_read_buf_shut(bp, _RET_IP_); 4431da177e4SLinus Torvalds xfs_buf_relse(bp); 4441da177e4SLinus Torvalds *bpp = NULL; 4451da177e4SLinus Torvalds return XFS_ERROR(EIO); 4461da177e4SLinus Torvalds } 4471da177e4SLinus Torvalds 4481da177e4SLinus Torvalds 4491da177e4SLinus Torvalds /* 4501da177e4SLinus Torvalds * Release the buffer bp which was previously acquired with one of the 4511da177e4SLinus Torvalds * xfs_trans_... buffer allocation routines if the buffer has not 4521da177e4SLinus Torvalds * been modified within this transaction. If the buffer is modified 4531da177e4SLinus Torvalds * within this transaction, do decrement the recursion count but do 4541da177e4SLinus Torvalds * not release the buffer even if the count goes to 0. If the buffer is not 4551da177e4SLinus Torvalds * modified within the transaction, decrement the recursion count and 4561da177e4SLinus Torvalds * release the buffer if the recursion count goes to 0. 4571da177e4SLinus Torvalds * 4581da177e4SLinus Torvalds * If the buffer is to be released and it was not modified before 4591da177e4SLinus Torvalds * this transaction began, then free the buf_log_item associated with it. 4601da177e4SLinus Torvalds * 4611da177e4SLinus Torvalds * If the transaction pointer is NULL, make this just a normal 4621da177e4SLinus Torvalds * brelse() call. 4631da177e4SLinus Torvalds */ 4641da177e4SLinus Torvalds void 4651da177e4SLinus Torvalds xfs_trans_brelse(xfs_trans_t *tp, 4661da177e4SLinus Torvalds xfs_buf_t *bp) 4671da177e4SLinus Torvalds { 4681da177e4SLinus Torvalds xfs_buf_log_item_t *bip; 4691da177e4SLinus Torvalds xfs_log_item_t *lip; 4701da177e4SLinus Torvalds xfs_log_item_desc_t *lidp; 4711da177e4SLinus Torvalds 4721da177e4SLinus Torvalds /* 4731da177e4SLinus Torvalds * Default to a normal brelse() call if the tp is NULL. 4741da177e4SLinus Torvalds */ 4751da177e4SLinus Torvalds if (tp == NULL) { 4761da177e4SLinus Torvalds ASSERT(XFS_BUF_FSPRIVATE2(bp, void *) == NULL); 4771da177e4SLinus Torvalds /* 4781da177e4SLinus Torvalds * If there's a buf log item attached to the buffer, 4791da177e4SLinus Torvalds * then let the AIL know that the buffer is being 4801da177e4SLinus Torvalds * unlocked. 4811da177e4SLinus Torvalds */ 4821da177e4SLinus Torvalds if (XFS_BUF_FSPRIVATE(bp, void *) != NULL) { 4831da177e4SLinus Torvalds lip = XFS_BUF_FSPRIVATE(bp, xfs_log_item_t *); 4841da177e4SLinus Torvalds if (lip->li_type == XFS_LI_BUF) { 4851da177e4SLinus Torvalds bip = XFS_BUF_FSPRIVATE(bp,xfs_buf_log_item_t*); 486783a2f65SDavid Chinner xfs_trans_unlocked_item(bip->bli_item.li_ailp, 4871da177e4SLinus Torvalds lip); 4881da177e4SLinus Torvalds } 4891da177e4SLinus Torvalds } 4901da177e4SLinus Torvalds xfs_buf_relse(bp); 4911da177e4SLinus Torvalds return; 4921da177e4SLinus Torvalds } 4931da177e4SLinus Torvalds 4941da177e4SLinus Torvalds ASSERT(XFS_BUF_FSPRIVATE2(bp, xfs_trans_t *) == tp); 4951da177e4SLinus Torvalds bip = XFS_BUF_FSPRIVATE(bp, xfs_buf_log_item_t *); 4961da177e4SLinus Torvalds ASSERT(bip->bli_item.li_type == XFS_LI_BUF); 4971da177e4SLinus Torvalds ASSERT(!(bip->bli_flags & XFS_BLI_STALE)); 4981da177e4SLinus Torvalds ASSERT(!(bip->bli_format.blf_flags & XFS_BLI_CANCEL)); 4991da177e4SLinus Torvalds ASSERT(atomic_read(&bip->bli_refcount) > 0); 5001da177e4SLinus Torvalds 5011da177e4SLinus Torvalds /* 5021da177e4SLinus Torvalds * Find the item descriptor pointing to this buffer's 5031da177e4SLinus Torvalds * log item. It must be there. 5041da177e4SLinus Torvalds */ 5051da177e4SLinus Torvalds lidp = xfs_trans_find_item(tp, (xfs_log_item_t*)bip); 5061da177e4SLinus Torvalds ASSERT(lidp != NULL); 5071da177e4SLinus Torvalds 5080b1b213fSChristoph Hellwig trace_xfs_trans_brelse(bip); 5090b1b213fSChristoph Hellwig 5101da177e4SLinus Torvalds /* 5111da177e4SLinus Torvalds * If the release is just for a recursive lock, 5121da177e4SLinus Torvalds * then decrement the count and return. 5131da177e4SLinus Torvalds */ 5141da177e4SLinus Torvalds if (bip->bli_recur > 0) { 5151da177e4SLinus Torvalds bip->bli_recur--; 5161da177e4SLinus Torvalds return; 5171da177e4SLinus Torvalds } 5181da177e4SLinus Torvalds 5191da177e4SLinus Torvalds /* 5201da177e4SLinus Torvalds * If the buffer is dirty within this transaction, we can't 5211da177e4SLinus Torvalds * release it until we commit. 5221da177e4SLinus Torvalds */ 5230b1b213fSChristoph Hellwig if (lidp->lid_flags & XFS_LID_DIRTY) 5241da177e4SLinus Torvalds return; 5251da177e4SLinus Torvalds 5261da177e4SLinus Torvalds /* 5271da177e4SLinus Torvalds * If the buffer has been invalidated, then we can't release 5281da177e4SLinus Torvalds * it until the transaction commits to disk unless it is re-dirtied 5291da177e4SLinus Torvalds * as part of this transaction. This prevents us from pulling 5301da177e4SLinus Torvalds * the item from the AIL before we should. 5311da177e4SLinus Torvalds */ 5320b1b213fSChristoph Hellwig if (bip->bli_flags & XFS_BLI_STALE) 5331da177e4SLinus Torvalds return; 5341da177e4SLinus Torvalds 5351da177e4SLinus Torvalds ASSERT(!(bip->bli_flags & XFS_BLI_LOGGED)); 5361da177e4SLinus Torvalds 5371da177e4SLinus Torvalds /* 5381da177e4SLinus Torvalds * Free up the log item descriptor tracking the released item. 5391da177e4SLinus Torvalds */ 5401da177e4SLinus Torvalds xfs_trans_free_item(tp, lidp); 5411da177e4SLinus Torvalds 5421da177e4SLinus Torvalds /* 5431da177e4SLinus Torvalds * Clear the hold flag in the buf log item if it is set. 5441da177e4SLinus Torvalds * We wouldn't want the next user of the buffer to 5451da177e4SLinus Torvalds * get confused. 5461da177e4SLinus Torvalds */ 5471da177e4SLinus Torvalds if (bip->bli_flags & XFS_BLI_HOLD) { 5481da177e4SLinus Torvalds bip->bli_flags &= ~XFS_BLI_HOLD; 5491da177e4SLinus Torvalds } 5501da177e4SLinus Torvalds 5511da177e4SLinus Torvalds /* 5521da177e4SLinus Torvalds * Drop our reference to the buf log item. 5531da177e4SLinus Torvalds */ 5541da177e4SLinus Torvalds atomic_dec(&bip->bli_refcount); 5551da177e4SLinus Torvalds 5561da177e4SLinus Torvalds /* 5571da177e4SLinus Torvalds * If the buf item is not tracking data in the log, then 5581da177e4SLinus Torvalds * we must free it before releasing the buffer back to the 5591da177e4SLinus Torvalds * free pool. Before releasing the buffer to the free pool, 5601da177e4SLinus Torvalds * clear the transaction pointer in b_fsprivate2 to dissolve 5611da177e4SLinus Torvalds * its relation to this transaction. 5621da177e4SLinus Torvalds */ 5631da177e4SLinus Torvalds if (!xfs_buf_item_dirty(bip)) { 5641da177e4SLinus Torvalds /*** 5651da177e4SLinus Torvalds ASSERT(bp->b_pincount == 0); 5661da177e4SLinus Torvalds ***/ 5671da177e4SLinus Torvalds ASSERT(atomic_read(&bip->bli_refcount) == 0); 5681da177e4SLinus Torvalds ASSERT(!(bip->bli_item.li_flags & XFS_LI_IN_AIL)); 5691da177e4SLinus Torvalds ASSERT(!(bip->bli_flags & XFS_BLI_INODE_ALLOC_BUF)); 5701da177e4SLinus Torvalds xfs_buf_item_relse(bp); 5711da177e4SLinus Torvalds bip = NULL; 5721da177e4SLinus Torvalds } 5731da177e4SLinus Torvalds XFS_BUF_SET_FSPRIVATE2(bp, NULL); 5741da177e4SLinus Torvalds 5751da177e4SLinus Torvalds /* 5761da177e4SLinus Torvalds * If we've still got a buf log item on the buffer, then 5771da177e4SLinus Torvalds * tell the AIL that the buffer is being unlocked. 5781da177e4SLinus Torvalds */ 5791da177e4SLinus Torvalds if (bip != NULL) { 580783a2f65SDavid Chinner xfs_trans_unlocked_item(bip->bli_item.li_ailp, 5811da177e4SLinus Torvalds (xfs_log_item_t*)bip); 5821da177e4SLinus Torvalds } 5831da177e4SLinus Torvalds 5841da177e4SLinus Torvalds xfs_buf_relse(bp); 5851da177e4SLinus Torvalds return; 5861da177e4SLinus Torvalds } 5871da177e4SLinus Torvalds 5881da177e4SLinus Torvalds /* 5891da177e4SLinus Torvalds * Mark the buffer as not needing to be unlocked when the buf item's 5901da177e4SLinus Torvalds * IOP_UNLOCK() routine is called. The buffer must already be locked 5911da177e4SLinus Torvalds * and associated with the given transaction. 5921da177e4SLinus Torvalds */ 5931da177e4SLinus Torvalds /* ARGSUSED */ 5941da177e4SLinus Torvalds void 5951da177e4SLinus Torvalds xfs_trans_bhold(xfs_trans_t *tp, 5961da177e4SLinus Torvalds xfs_buf_t *bp) 5971da177e4SLinus Torvalds { 5981da177e4SLinus Torvalds xfs_buf_log_item_t *bip; 5991da177e4SLinus Torvalds 6001da177e4SLinus Torvalds ASSERT(XFS_BUF_ISBUSY(bp)); 6011da177e4SLinus Torvalds ASSERT(XFS_BUF_FSPRIVATE2(bp, xfs_trans_t *) == tp); 6021da177e4SLinus Torvalds ASSERT(XFS_BUF_FSPRIVATE(bp, void *) != NULL); 6031da177e4SLinus Torvalds 6041da177e4SLinus Torvalds bip = XFS_BUF_FSPRIVATE(bp, xfs_buf_log_item_t *); 6051da177e4SLinus Torvalds ASSERT(!(bip->bli_flags & XFS_BLI_STALE)); 6061da177e4SLinus Torvalds ASSERT(!(bip->bli_format.blf_flags & XFS_BLI_CANCEL)); 6071da177e4SLinus Torvalds ASSERT(atomic_read(&bip->bli_refcount) > 0); 6081da177e4SLinus Torvalds bip->bli_flags |= XFS_BLI_HOLD; 6090b1b213fSChristoph Hellwig trace_xfs_trans_bhold(bip); 6101da177e4SLinus Torvalds } 6111da177e4SLinus Torvalds 6121da177e4SLinus Torvalds /* 613efa092f3STim Shimmin * Cancel the previous buffer hold request made on this buffer 614efa092f3STim Shimmin * for this transaction. 615efa092f3STim Shimmin */ 616efa092f3STim Shimmin void 617efa092f3STim Shimmin xfs_trans_bhold_release(xfs_trans_t *tp, 618efa092f3STim Shimmin xfs_buf_t *bp) 619efa092f3STim Shimmin { 620efa092f3STim Shimmin xfs_buf_log_item_t *bip; 621efa092f3STim Shimmin 622efa092f3STim Shimmin ASSERT(XFS_BUF_ISBUSY(bp)); 623efa092f3STim Shimmin ASSERT(XFS_BUF_FSPRIVATE2(bp, xfs_trans_t *) == tp); 624efa092f3STim Shimmin ASSERT(XFS_BUF_FSPRIVATE(bp, void *) != NULL); 625efa092f3STim Shimmin 626efa092f3STim Shimmin bip = XFS_BUF_FSPRIVATE(bp, xfs_buf_log_item_t *); 627efa092f3STim Shimmin ASSERT(!(bip->bli_flags & XFS_BLI_STALE)); 628efa092f3STim Shimmin ASSERT(!(bip->bli_format.blf_flags & XFS_BLI_CANCEL)); 629efa092f3STim Shimmin ASSERT(atomic_read(&bip->bli_refcount) > 0); 630efa092f3STim Shimmin ASSERT(bip->bli_flags & XFS_BLI_HOLD); 631efa092f3STim Shimmin bip->bli_flags &= ~XFS_BLI_HOLD; 6320b1b213fSChristoph Hellwig 6330b1b213fSChristoph Hellwig trace_xfs_trans_bhold_release(bip); 634efa092f3STim Shimmin } 635efa092f3STim Shimmin 636efa092f3STim Shimmin /* 6371da177e4SLinus Torvalds * This is called to mark bytes first through last inclusive of the given 6381da177e4SLinus Torvalds * buffer as needing to be logged when the transaction is committed. 6391da177e4SLinus Torvalds * The buffer must already be associated with the given transaction. 6401da177e4SLinus Torvalds * 6411da177e4SLinus Torvalds * First and last are numbers relative to the beginning of this buffer, 6421da177e4SLinus Torvalds * so the first byte in the buffer is numbered 0 regardless of the 6431da177e4SLinus Torvalds * value of b_blkno. 6441da177e4SLinus Torvalds */ 6451da177e4SLinus Torvalds void 6461da177e4SLinus Torvalds xfs_trans_log_buf(xfs_trans_t *tp, 6471da177e4SLinus Torvalds xfs_buf_t *bp, 6481da177e4SLinus Torvalds uint first, 6491da177e4SLinus Torvalds uint last) 6501da177e4SLinus Torvalds { 6511da177e4SLinus Torvalds xfs_buf_log_item_t *bip; 6521da177e4SLinus Torvalds xfs_log_item_desc_t *lidp; 6531da177e4SLinus Torvalds 6541da177e4SLinus Torvalds ASSERT(XFS_BUF_ISBUSY(bp)); 6551da177e4SLinus Torvalds ASSERT(XFS_BUF_FSPRIVATE2(bp, xfs_trans_t *) == tp); 6561da177e4SLinus Torvalds ASSERT(XFS_BUF_FSPRIVATE(bp, void *) != NULL); 6571da177e4SLinus Torvalds ASSERT((first <= last) && (last < XFS_BUF_COUNT(bp))); 6581da177e4SLinus Torvalds ASSERT((XFS_BUF_IODONE_FUNC(bp) == NULL) || 6591da177e4SLinus Torvalds (XFS_BUF_IODONE_FUNC(bp) == xfs_buf_iodone_callbacks)); 6601da177e4SLinus Torvalds 6611da177e4SLinus Torvalds /* 6621da177e4SLinus Torvalds * Mark the buffer as needing to be written out eventually, 6631da177e4SLinus Torvalds * and set its iodone function to remove the buffer's buf log 6641da177e4SLinus Torvalds * item from the AIL and free it when the buffer is flushed 6651da177e4SLinus Torvalds * to disk. See xfs_buf_attach_iodone() for more details 6661da177e4SLinus Torvalds * on li_cb and xfs_buf_iodone_callbacks(). 6671da177e4SLinus Torvalds * If we end up aborting this transaction, we trap this buffer 6681da177e4SLinus Torvalds * inside the b_bdstrat callback so that this won't get written to 6691da177e4SLinus Torvalds * disk. 6701da177e4SLinus Torvalds */ 6711da177e4SLinus Torvalds XFS_BUF_DELAYWRITE(bp); 6721da177e4SLinus Torvalds XFS_BUF_DONE(bp); 6731da177e4SLinus Torvalds 6741da177e4SLinus Torvalds bip = XFS_BUF_FSPRIVATE(bp, xfs_buf_log_item_t *); 6751da177e4SLinus Torvalds ASSERT(atomic_read(&bip->bli_refcount) > 0); 6761da177e4SLinus Torvalds XFS_BUF_SET_IODONE_FUNC(bp, xfs_buf_iodone_callbacks); 6771da177e4SLinus Torvalds bip->bli_item.li_cb = (void(*)(xfs_buf_t*,xfs_log_item_t*))xfs_buf_iodone; 6781da177e4SLinus Torvalds 6790b1b213fSChristoph Hellwig trace_xfs_trans_log_buf(bip); 6800b1b213fSChristoph Hellwig 6811da177e4SLinus Torvalds /* 6821da177e4SLinus Torvalds * If we invalidated the buffer within this transaction, then 6831da177e4SLinus Torvalds * cancel the invalidation now that we're dirtying the buffer 6841da177e4SLinus Torvalds * again. There are no races with the code in xfs_buf_item_unpin(), 6851da177e4SLinus Torvalds * because we have a reference to the buffer this entire time. 6861da177e4SLinus Torvalds */ 6871da177e4SLinus Torvalds if (bip->bli_flags & XFS_BLI_STALE) { 6881da177e4SLinus Torvalds bip->bli_flags &= ~XFS_BLI_STALE; 6891da177e4SLinus Torvalds ASSERT(XFS_BUF_ISSTALE(bp)); 6901da177e4SLinus Torvalds XFS_BUF_UNSTALE(bp); 6911da177e4SLinus Torvalds bip->bli_format.blf_flags &= ~XFS_BLI_CANCEL; 6921da177e4SLinus Torvalds } 6931da177e4SLinus Torvalds 6941da177e4SLinus Torvalds lidp = xfs_trans_find_item(tp, (xfs_log_item_t*)bip); 6951da177e4SLinus Torvalds ASSERT(lidp != NULL); 6961da177e4SLinus Torvalds 6971da177e4SLinus Torvalds tp->t_flags |= XFS_TRANS_DIRTY; 6981da177e4SLinus Torvalds lidp->lid_flags |= XFS_LID_DIRTY; 6991da177e4SLinus Torvalds bip->bli_flags |= XFS_BLI_LOGGED; 7001da177e4SLinus Torvalds xfs_buf_item_log(bip, first, last); 7011da177e4SLinus Torvalds } 7021da177e4SLinus Torvalds 7031da177e4SLinus Torvalds 7041da177e4SLinus Torvalds /* 7051da177e4SLinus Torvalds * This called to invalidate a buffer that is being used within 7061da177e4SLinus Torvalds * a transaction. Typically this is because the blocks in the 7071da177e4SLinus Torvalds * buffer are being freed, so we need to prevent it from being 7081da177e4SLinus Torvalds * written out when we're done. Allowing it to be written again 7091da177e4SLinus Torvalds * might overwrite data in the free blocks if they are reallocated 7101da177e4SLinus Torvalds * to a file. 7111da177e4SLinus Torvalds * 7121da177e4SLinus Torvalds * We prevent the buffer from being written out by clearing the 7131da177e4SLinus Torvalds * B_DELWRI flag. We can't always 7141da177e4SLinus Torvalds * get rid of the buf log item at this point, though, because 7151da177e4SLinus Torvalds * the buffer may still be pinned by another transaction. If that 7161da177e4SLinus Torvalds * is the case, then we'll wait until the buffer is committed to 7171da177e4SLinus Torvalds * disk for the last time (we can tell by the ref count) and 7181da177e4SLinus Torvalds * free it in xfs_buf_item_unpin(). Until it is cleaned up we 7191da177e4SLinus Torvalds * will keep the buffer locked so that the buffer and buf log item 7201da177e4SLinus Torvalds * are not reused. 7211da177e4SLinus Torvalds */ 7221da177e4SLinus Torvalds void 7231da177e4SLinus Torvalds xfs_trans_binval( 7241da177e4SLinus Torvalds xfs_trans_t *tp, 7251da177e4SLinus Torvalds xfs_buf_t *bp) 7261da177e4SLinus Torvalds { 7271da177e4SLinus Torvalds xfs_log_item_desc_t *lidp; 7281da177e4SLinus Torvalds xfs_buf_log_item_t *bip; 7291da177e4SLinus Torvalds 7301da177e4SLinus Torvalds ASSERT(XFS_BUF_ISBUSY(bp)); 7311da177e4SLinus Torvalds ASSERT(XFS_BUF_FSPRIVATE2(bp, xfs_trans_t *) == tp); 7321da177e4SLinus Torvalds ASSERT(XFS_BUF_FSPRIVATE(bp, void *) != NULL); 7331da177e4SLinus Torvalds 7341da177e4SLinus Torvalds bip = XFS_BUF_FSPRIVATE(bp, xfs_buf_log_item_t *); 7351da177e4SLinus Torvalds lidp = xfs_trans_find_item(tp, (xfs_log_item_t*)bip); 7361da177e4SLinus Torvalds ASSERT(lidp != NULL); 7371da177e4SLinus Torvalds ASSERT(atomic_read(&bip->bli_refcount) > 0); 7381da177e4SLinus Torvalds 7390b1b213fSChristoph Hellwig trace_xfs_trans_binval(bip); 7400b1b213fSChristoph Hellwig 7411da177e4SLinus Torvalds if (bip->bli_flags & XFS_BLI_STALE) { 7421da177e4SLinus Torvalds /* 7431da177e4SLinus Torvalds * If the buffer is already invalidated, then 7441da177e4SLinus Torvalds * just return. 7451da177e4SLinus Torvalds */ 7461da177e4SLinus Torvalds ASSERT(!(XFS_BUF_ISDELAYWRITE(bp))); 7471da177e4SLinus Torvalds ASSERT(XFS_BUF_ISSTALE(bp)); 7481da177e4SLinus Torvalds ASSERT(!(bip->bli_flags & (XFS_BLI_LOGGED | XFS_BLI_DIRTY))); 7491da177e4SLinus Torvalds ASSERT(!(bip->bli_format.blf_flags & XFS_BLI_INODE_BUF)); 7501da177e4SLinus Torvalds ASSERT(bip->bli_format.blf_flags & XFS_BLI_CANCEL); 7511da177e4SLinus Torvalds ASSERT(lidp->lid_flags & XFS_LID_DIRTY); 7521da177e4SLinus Torvalds ASSERT(tp->t_flags & XFS_TRANS_DIRTY); 7531da177e4SLinus Torvalds return; 7541da177e4SLinus Torvalds } 7551da177e4SLinus Torvalds 7561da177e4SLinus Torvalds /* 7571da177e4SLinus Torvalds * Clear the dirty bit in the buffer and set the STALE flag 7581da177e4SLinus Torvalds * in the buf log item. The STALE flag will be used in 7591da177e4SLinus Torvalds * xfs_buf_item_unpin() to determine if it should clean up 7601da177e4SLinus Torvalds * when the last reference to the buf item is given up. 7611da177e4SLinus Torvalds * We set the XFS_BLI_CANCEL flag in the buf log format structure 7621da177e4SLinus Torvalds * and log the buf item. This will be used at recovery time 7631da177e4SLinus Torvalds * to determine that copies of the buffer in the log before 7641da177e4SLinus Torvalds * this should not be replayed. 7651da177e4SLinus Torvalds * We mark the item descriptor and the transaction dirty so 7661da177e4SLinus Torvalds * that we'll hold the buffer until after the commit. 7671da177e4SLinus Torvalds * 7681da177e4SLinus Torvalds * Since we're invalidating the buffer, we also clear the state 7691da177e4SLinus Torvalds * about which parts of the buffer have been logged. We also 7701da177e4SLinus Torvalds * clear the flag indicating that this is an inode buffer since 7711da177e4SLinus Torvalds * the data in the buffer will no longer be valid. 7721da177e4SLinus Torvalds * 7731da177e4SLinus Torvalds * We set the stale bit in the buffer as well since we're getting 7741da177e4SLinus Torvalds * rid of it. 7751da177e4SLinus Torvalds */ 7761da177e4SLinus Torvalds XFS_BUF_UNDELAYWRITE(bp); 7771da177e4SLinus Torvalds XFS_BUF_STALE(bp); 7781da177e4SLinus Torvalds bip->bli_flags |= XFS_BLI_STALE; 7791da177e4SLinus Torvalds bip->bli_flags &= ~(XFS_BLI_LOGGED | XFS_BLI_DIRTY); 7801da177e4SLinus Torvalds bip->bli_format.blf_flags &= ~XFS_BLI_INODE_BUF; 7811da177e4SLinus Torvalds bip->bli_format.blf_flags |= XFS_BLI_CANCEL; 7821da177e4SLinus Torvalds memset((char *)(bip->bli_format.blf_data_map), 0, 7831da177e4SLinus Torvalds (bip->bli_format.blf_map_size * sizeof(uint))); 784*8e123850SDave Chinner lidp->lid_flags |= XFS_LID_DIRTY; 7851da177e4SLinus Torvalds tp->t_flags |= XFS_TRANS_DIRTY; 7861da177e4SLinus Torvalds } 7871da177e4SLinus Torvalds 7881da177e4SLinus Torvalds /* 7891da177e4SLinus Torvalds * This call is used to indicate that the buffer contains on-disk 7901da177e4SLinus Torvalds * inodes which must be handled specially during recovery. They 7911da177e4SLinus Torvalds * require special handling because only the di_next_unlinked from 7921da177e4SLinus Torvalds * the inodes in the buffer should be recovered. The rest of the 7931da177e4SLinus Torvalds * data in the buffer is logged via the inodes themselves. 7941da177e4SLinus Torvalds * 7951da177e4SLinus Torvalds * All we do is set the XFS_BLI_INODE_BUF flag in the buffer's log 7961da177e4SLinus Torvalds * format structure so that we'll know what to do at recovery time. 7971da177e4SLinus Torvalds */ 7981da177e4SLinus Torvalds /* ARGSUSED */ 7991da177e4SLinus Torvalds void 8001da177e4SLinus Torvalds xfs_trans_inode_buf( 8011da177e4SLinus Torvalds xfs_trans_t *tp, 8021da177e4SLinus Torvalds xfs_buf_t *bp) 8031da177e4SLinus Torvalds { 8041da177e4SLinus Torvalds xfs_buf_log_item_t *bip; 8051da177e4SLinus Torvalds 8061da177e4SLinus Torvalds ASSERT(XFS_BUF_ISBUSY(bp)); 8071da177e4SLinus Torvalds ASSERT(XFS_BUF_FSPRIVATE2(bp, xfs_trans_t *) == tp); 8081da177e4SLinus Torvalds ASSERT(XFS_BUF_FSPRIVATE(bp, void *) != NULL); 8091da177e4SLinus Torvalds 8101da177e4SLinus Torvalds bip = XFS_BUF_FSPRIVATE(bp, xfs_buf_log_item_t *); 8111da177e4SLinus Torvalds ASSERT(atomic_read(&bip->bli_refcount) > 0); 8121da177e4SLinus Torvalds 8131da177e4SLinus Torvalds bip->bli_format.blf_flags |= XFS_BLI_INODE_BUF; 8141da177e4SLinus Torvalds } 8151da177e4SLinus Torvalds 8161da177e4SLinus Torvalds /* 8171da177e4SLinus Torvalds * This call is used to indicate that the buffer is going to 8181da177e4SLinus Torvalds * be staled and was an inode buffer. This means it gets 8191da177e4SLinus Torvalds * special processing during unpin - where any inodes 8201da177e4SLinus Torvalds * associated with the buffer should be removed from ail. 8211da177e4SLinus Torvalds * There is also special processing during recovery, 8221da177e4SLinus Torvalds * any replay of the inodes in the buffer needs to be 8231da177e4SLinus Torvalds * prevented as the buffer may have been reused. 8241da177e4SLinus Torvalds */ 8251da177e4SLinus Torvalds void 8261da177e4SLinus Torvalds xfs_trans_stale_inode_buf( 8271da177e4SLinus Torvalds xfs_trans_t *tp, 8281da177e4SLinus Torvalds xfs_buf_t *bp) 8291da177e4SLinus Torvalds { 8301da177e4SLinus Torvalds xfs_buf_log_item_t *bip; 8311da177e4SLinus Torvalds 8321da177e4SLinus Torvalds ASSERT(XFS_BUF_ISBUSY(bp)); 8331da177e4SLinus Torvalds ASSERT(XFS_BUF_FSPRIVATE2(bp, xfs_trans_t *) == tp); 8341da177e4SLinus Torvalds ASSERT(XFS_BUF_FSPRIVATE(bp, void *) != NULL); 8351da177e4SLinus Torvalds 8361da177e4SLinus Torvalds bip = XFS_BUF_FSPRIVATE(bp, xfs_buf_log_item_t *); 8371da177e4SLinus Torvalds ASSERT(atomic_read(&bip->bli_refcount) > 0); 8381da177e4SLinus Torvalds 8391da177e4SLinus Torvalds bip->bli_flags |= XFS_BLI_STALE_INODE; 8401da177e4SLinus Torvalds bip->bli_item.li_cb = (void(*)(xfs_buf_t*,xfs_log_item_t*)) 8411da177e4SLinus Torvalds xfs_buf_iodone; 8421da177e4SLinus Torvalds } 8431da177e4SLinus Torvalds 8441da177e4SLinus Torvalds 8451da177e4SLinus Torvalds 8461da177e4SLinus Torvalds /* 8471da177e4SLinus Torvalds * Mark the buffer as being one which contains newly allocated 8481da177e4SLinus Torvalds * inodes. We need to make sure that even if this buffer is 8491da177e4SLinus Torvalds * relogged as an 'inode buf' we still recover all of the inode 8501da177e4SLinus Torvalds * images in the face of a crash. This works in coordination with 8511da177e4SLinus Torvalds * xfs_buf_item_committed() to ensure that the buffer remains in the 8521da177e4SLinus Torvalds * AIL at its original location even after it has been relogged. 8531da177e4SLinus Torvalds */ 8541da177e4SLinus Torvalds /* ARGSUSED */ 8551da177e4SLinus Torvalds void 8561da177e4SLinus Torvalds xfs_trans_inode_alloc_buf( 8571da177e4SLinus Torvalds xfs_trans_t *tp, 8581da177e4SLinus Torvalds xfs_buf_t *bp) 8591da177e4SLinus Torvalds { 8601da177e4SLinus Torvalds xfs_buf_log_item_t *bip; 8611da177e4SLinus Torvalds 8621da177e4SLinus Torvalds ASSERT(XFS_BUF_ISBUSY(bp)); 8631da177e4SLinus Torvalds ASSERT(XFS_BUF_FSPRIVATE2(bp, xfs_trans_t *) == tp); 8641da177e4SLinus Torvalds ASSERT(XFS_BUF_FSPRIVATE(bp, void *) != NULL); 8651da177e4SLinus Torvalds 8661da177e4SLinus Torvalds bip = XFS_BUF_FSPRIVATE(bp, xfs_buf_log_item_t *); 8671da177e4SLinus Torvalds ASSERT(atomic_read(&bip->bli_refcount) > 0); 8681da177e4SLinus Torvalds 8691da177e4SLinus Torvalds bip->bli_flags |= XFS_BLI_INODE_ALLOC_BUF; 8701da177e4SLinus Torvalds } 8711da177e4SLinus Torvalds 8721da177e4SLinus Torvalds 8731da177e4SLinus Torvalds /* 8741da177e4SLinus Torvalds * Similar to xfs_trans_inode_buf(), this marks the buffer as a cluster of 8751da177e4SLinus Torvalds * dquots. However, unlike in inode buffer recovery, dquot buffers get 8761da177e4SLinus Torvalds * recovered in their entirety. (Hence, no XFS_BLI_DQUOT_ALLOC_BUF flag). 8771da177e4SLinus Torvalds * The only thing that makes dquot buffers different from regular 8781da177e4SLinus Torvalds * buffers is that we must not replay dquot bufs when recovering 8791da177e4SLinus Torvalds * if a _corresponding_ quotaoff has happened. We also have to distinguish 8801da177e4SLinus Torvalds * between usr dquot bufs and grp dquot bufs, because usr and grp quotas 8811da177e4SLinus Torvalds * can be turned off independently. 8821da177e4SLinus Torvalds */ 8831da177e4SLinus Torvalds /* ARGSUSED */ 8841da177e4SLinus Torvalds void 8851da177e4SLinus Torvalds xfs_trans_dquot_buf( 8861da177e4SLinus Torvalds xfs_trans_t *tp, 8871da177e4SLinus Torvalds xfs_buf_t *bp, 8881da177e4SLinus Torvalds uint type) 8891da177e4SLinus Torvalds { 8901da177e4SLinus Torvalds xfs_buf_log_item_t *bip; 8911da177e4SLinus Torvalds 8921da177e4SLinus Torvalds ASSERT(XFS_BUF_ISBUSY(bp)); 8931da177e4SLinus Torvalds ASSERT(XFS_BUF_FSPRIVATE2(bp, xfs_trans_t *) == tp); 8941da177e4SLinus Torvalds ASSERT(XFS_BUF_FSPRIVATE(bp, void *) != NULL); 8951da177e4SLinus Torvalds ASSERT(type == XFS_BLI_UDQUOT_BUF || 896c8ad20ffSNathan Scott type == XFS_BLI_PDQUOT_BUF || 8971da177e4SLinus Torvalds type == XFS_BLI_GDQUOT_BUF); 8981da177e4SLinus Torvalds 8991da177e4SLinus Torvalds bip = XFS_BUF_FSPRIVATE(bp, xfs_buf_log_item_t *); 9001da177e4SLinus Torvalds ASSERT(atomic_read(&bip->bli_refcount) > 0); 9011da177e4SLinus Torvalds 9021da177e4SLinus Torvalds bip->bli_format.blf_flags |= type; 9031da177e4SLinus Torvalds } 9041da177e4SLinus Torvalds 9051da177e4SLinus Torvalds /* 9061da177e4SLinus Torvalds * Check to see if a buffer matching the given parameters is already 9071da177e4SLinus Torvalds * a part of the given transaction. Only check the first, embedded 9081da177e4SLinus Torvalds * chunk, since we don't want to spend all day scanning large transactions. 9091da177e4SLinus Torvalds */ 9101da177e4SLinus Torvalds STATIC xfs_buf_t * 9111da177e4SLinus Torvalds xfs_trans_buf_item_match( 9121da177e4SLinus Torvalds xfs_trans_t *tp, 9131da177e4SLinus Torvalds xfs_buftarg_t *target, 9141da177e4SLinus Torvalds xfs_daddr_t blkno, 9151da177e4SLinus Torvalds int len) 9161da177e4SLinus Torvalds { 9171da177e4SLinus Torvalds xfs_log_item_chunk_t *licp; 9181da177e4SLinus Torvalds xfs_log_item_desc_t *lidp; 9191da177e4SLinus Torvalds xfs_buf_log_item_t *blip; 9201da177e4SLinus Torvalds xfs_buf_t *bp; 9211da177e4SLinus Torvalds int i; 9221da177e4SLinus Torvalds 9231da177e4SLinus Torvalds bp = NULL; 9241da177e4SLinus Torvalds len = BBTOB(len); 9251da177e4SLinus Torvalds licp = &tp->t_items; 92639dab9d7SEric Sandeen if (!xfs_lic_are_all_free(licp)) { 9271da177e4SLinus Torvalds for (i = 0; i < licp->lic_unused; i++) { 9281da177e4SLinus Torvalds /* 9291da177e4SLinus Torvalds * Skip unoccupied slots. 9301da177e4SLinus Torvalds */ 93139dab9d7SEric Sandeen if (xfs_lic_isfree(licp, i)) { 9321da177e4SLinus Torvalds continue; 9331da177e4SLinus Torvalds } 9341da177e4SLinus Torvalds 93539dab9d7SEric Sandeen lidp = xfs_lic_slot(licp, i); 9361da177e4SLinus Torvalds blip = (xfs_buf_log_item_t *)lidp->lid_item; 9371da177e4SLinus Torvalds if (blip->bli_item.li_type != XFS_LI_BUF) { 9381da177e4SLinus Torvalds continue; 9391da177e4SLinus Torvalds } 9401da177e4SLinus Torvalds 9411da177e4SLinus Torvalds bp = blip->bli_buf; 9421da177e4SLinus Torvalds if ((XFS_BUF_TARGET(bp) == target) && 9431da177e4SLinus Torvalds (XFS_BUF_ADDR(bp) == blkno) && 9441da177e4SLinus Torvalds (XFS_BUF_COUNT(bp) == len)) { 9451da177e4SLinus Torvalds /* 9461da177e4SLinus Torvalds * We found it. Break out and 9471da177e4SLinus Torvalds * return the pointer to the buffer. 9481da177e4SLinus Torvalds */ 9491da177e4SLinus Torvalds break; 9501da177e4SLinus Torvalds } else { 9511da177e4SLinus Torvalds bp = NULL; 9521da177e4SLinus Torvalds } 9531da177e4SLinus Torvalds } 9541da177e4SLinus Torvalds } 9551da177e4SLinus Torvalds return bp; 9561da177e4SLinus Torvalds } 9571da177e4SLinus Torvalds 9581da177e4SLinus Torvalds /* 9591da177e4SLinus Torvalds * Check to see if a buffer matching the given parameters is already 9601da177e4SLinus Torvalds * a part of the given transaction. Check all the chunks, we 9611da177e4SLinus Torvalds * want to be thorough. 9621da177e4SLinus Torvalds */ 9631da177e4SLinus Torvalds STATIC xfs_buf_t * 9641da177e4SLinus Torvalds xfs_trans_buf_item_match_all( 9651da177e4SLinus Torvalds xfs_trans_t *tp, 9661da177e4SLinus Torvalds xfs_buftarg_t *target, 9671da177e4SLinus Torvalds xfs_daddr_t blkno, 9681da177e4SLinus Torvalds int len) 9691da177e4SLinus Torvalds { 9701da177e4SLinus Torvalds xfs_log_item_chunk_t *licp; 9711da177e4SLinus Torvalds xfs_log_item_desc_t *lidp; 9721da177e4SLinus Torvalds xfs_buf_log_item_t *blip; 9731da177e4SLinus Torvalds xfs_buf_t *bp; 9741da177e4SLinus Torvalds int i; 9751da177e4SLinus Torvalds 9761da177e4SLinus Torvalds bp = NULL; 9771da177e4SLinus Torvalds len = BBTOB(len); 9781da177e4SLinus Torvalds for (licp = &tp->t_items; licp != NULL; licp = licp->lic_next) { 97939dab9d7SEric Sandeen if (xfs_lic_are_all_free(licp)) { 9801da177e4SLinus Torvalds ASSERT(licp == &tp->t_items); 9811da177e4SLinus Torvalds ASSERT(licp->lic_next == NULL); 9821da177e4SLinus Torvalds return NULL; 9831da177e4SLinus Torvalds } 9841da177e4SLinus Torvalds for (i = 0; i < licp->lic_unused; i++) { 9851da177e4SLinus Torvalds /* 9861da177e4SLinus Torvalds * Skip unoccupied slots. 9871da177e4SLinus Torvalds */ 98839dab9d7SEric Sandeen if (xfs_lic_isfree(licp, i)) { 9891da177e4SLinus Torvalds continue; 9901da177e4SLinus Torvalds } 9911da177e4SLinus Torvalds 99239dab9d7SEric Sandeen lidp = xfs_lic_slot(licp, i); 9931da177e4SLinus Torvalds blip = (xfs_buf_log_item_t *)lidp->lid_item; 9941da177e4SLinus Torvalds if (blip->bli_item.li_type != XFS_LI_BUF) { 9951da177e4SLinus Torvalds continue; 9961da177e4SLinus Torvalds } 9971da177e4SLinus Torvalds 9981da177e4SLinus Torvalds bp = blip->bli_buf; 9991da177e4SLinus Torvalds if ((XFS_BUF_TARGET(bp) == target) && 10001da177e4SLinus Torvalds (XFS_BUF_ADDR(bp) == blkno) && 10011da177e4SLinus Torvalds (XFS_BUF_COUNT(bp) == len)) { 10021da177e4SLinus Torvalds /* 10031da177e4SLinus Torvalds * We found it. Break out and 10041da177e4SLinus Torvalds * return the pointer to the buffer. 10051da177e4SLinus Torvalds */ 10061da177e4SLinus Torvalds return bp; 10071da177e4SLinus Torvalds } 10081da177e4SLinus Torvalds } 10091da177e4SLinus Torvalds } 10101da177e4SLinus Torvalds return NULL; 10111da177e4SLinus Torvalds } 1012