Commit 5ff0b9e1 authored by Linus Torvalds

Merge tag 'xfs-for-linus-3.18-rc1' of git://git.kernel.org/pub/scm/linux/kernel/git/dgc/linux-xfs

Pull xfs update from Dave Chinner:
 "This update contains:
   - various cleanups
   - log recovery debug hooks
   - seek hole/data implementation merge
   - extent shift rework to fix collapse range bugs
   - various sparse warning fixes
   - log recovery transaction processing rework to fix use after free
     bugs
   - metadata buffer IO infrastructure rework to ensure all buffers
     under IO have valid reference counts
   - various fixes for ondisk flags, writeback and zero range corner
     cases"

* tag 'xfs-for-linus-3.18-rc1' of git://git.kernel.org/pub/scm/linux/kernel/git/dgc/linux-xfs: (56 commits)
  xfs: fix agno increment in xfs_inumbers() loop
  xfs: xfs_iflush_done checks the wrong log item callback
  xfs: flush the range before zero range conversion
  xfs: restore buffer_head unwritten bit on ioend cancel
  xfs: check for null dquot in xfs_quota_calc_throttle()
  xfs: fix crc field handling in xfs_sb_to/from_disk
  xfs: don't send null bp to xfs_trans_brelse()
  xfs: check for inode size overflow in xfs_new_eof()
  xfs: only set extent size hint when asked
  xfs: project id inheritance is a directory only flag
  xfs: kill time.h
  xfs: compat_xfs_bstat does not have forkoff
  xfs: simplify xfs_zero_remaining_bytes
  xfs: check xfs_buf_read_uncached returns correctly
  xfs: introduce xfs_buf_submit[_wait]
  xfs: kill xfs_bioerror_relse
  xfs: xfs_bioerror can die.
  xfs: kill xfs_bdstrat_cb
  xfs: rework xfs_buf_bio_endio error handling
  xfs: xfs_buf_ioend and xfs_buf_iodone_work duplicate functionality
  ...
parents 77c688ac 6889e783
...@@ -21,7 +21,6 @@ ...@@ -21,7 +21,6 @@
#include <linux/swap.h> #include <linux/swap.h>
#include <linux/blkdev.h> #include <linux/blkdev.h>
#include <linux/backing-dev.h> #include <linux/backing-dev.h>
#include "time.h"
#include "kmem.h" #include "kmem.h"
#include "xfs_message.h" #include "xfs_message.h"
......
...@@ -2209,6 +2209,10 @@ xfs_agf_verify( ...@@ -2209,6 +2209,10 @@ xfs_agf_verify(
be32_to_cpu(agf->agf_flcount) <= XFS_AGFL_SIZE(mp))) be32_to_cpu(agf->agf_flcount) <= XFS_AGFL_SIZE(mp)))
return false; return false;
if (be32_to_cpu(agf->agf_levels[XFS_BTNUM_BNO]) > XFS_BTREE_MAXLEVELS ||
be32_to_cpu(agf->agf_levels[XFS_BTNUM_CNT]) > XFS_BTREE_MAXLEVELS)
return false;
/* /*
* during growfs operations, the perag is not fully initialised, * during growfs operations, the perag is not fully initialised,
* so we can't use it for any useful checking. growfs ensures we can't * so we can't use it for any useful checking. growfs ensures we can't
......
This diff is collapsed.
...@@ -178,9 +178,8 @@ int xfs_check_nostate_extents(struct xfs_ifork *ifp, xfs_extnum_t idx, ...@@ -178,9 +178,8 @@ int xfs_check_nostate_extents(struct xfs_ifork *ifp, xfs_extnum_t idx,
xfs_extnum_t num); xfs_extnum_t num);
uint xfs_default_attroffset(struct xfs_inode *ip); uint xfs_default_attroffset(struct xfs_inode *ip);
int xfs_bmap_shift_extents(struct xfs_trans *tp, struct xfs_inode *ip, int xfs_bmap_shift_extents(struct xfs_trans *tp, struct xfs_inode *ip,
int *done, xfs_fileoff_t start_fsb, xfs_fileoff_t start_fsb, xfs_fileoff_t offset_shift_fsb,
xfs_fileoff_t offset_shift_fsb, xfs_extnum_t *current_ext, int *done, xfs_fileoff_t *next_fsb, xfs_fsblock_t *firstblock,
xfs_fsblock_t *firstblock, struct xfs_bmap_free *flist, struct xfs_bmap_free *flist, int num_exts);
int num_exts);
#endif /* __XFS_BMAP_H__ */ #endif /* __XFS_BMAP_H__ */
...@@ -2563,6 +2563,7 @@ xfs_da_get_buf( ...@@ -2563,6 +2563,7 @@ xfs_da_get_buf(
mapp, nmap, 0); mapp, nmap, 0);
error = bp ? bp->b_error : -EIO; error = bp ? bp->b_error : -EIO;
if (error) { if (error) {
if (bp)
xfs_trans_brelse(trans, bp); xfs_trans_brelse(trans, bp);
goto out_free; goto out_free;
} }
......
...@@ -270,7 +270,6 @@ xfs_dir3_data_get_ftype( ...@@ -270,7 +270,6 @@ xfs_dir3_data_get_ftype(
{ {
__uint8_t ftype = dep->name[dep->namelen]; __uint8_t ftype = dep->name[dep->namelen];
ASSERT(ftype < XFS_DIR3_FT_MAX);
if (ftype >= XFS_DIR3_FT_MAX) if (ftype >= XFS_DIR3_FT_MAX)
return XFS_DIR3_FT_UNKNOWN; return XFS_DIR3_FT_UNKNOWN;
return ftype; return ftype;
......
...@@ -237,7 +237,8 @@ xfs_dir_init( ...@@ -237,7 +237,8 @@ xfs_dir_init(
} }
/* /*
Enter a name in a directory. * Enter a name in a directory, or check for available space.
* If inum is 0, only the available space test is performed.
*/ */
int int
xfs_dir_createname( xfs_dir_createname(
...@@ -254,10 +255,12 @@ xfs_dir_createname( ...@@ -254,10 +255,12 @@ xfs_dir_createname(
int v; /* type-checking value */ int v; /* type-checking value */
ASSERT(S_ISDIR(dp->i_d.di_mode)); ASSERT(S_ISDIR(dp->i_d.di_mode));
if (inum) {
rval = xfs_dir_ino_validate(tp->t_mountp, inum); rval = xfs_dir_ino_validate(tp->t_mountp, inum);
if (rval) if (rval)
return rval; return rval;
XFS_STATS_INC(xs_dir_create); XFS_STATS_INC(xs_dir_create);
}
args = kmem_zalloc(sizeof(*args), KM_SLEEP | KM_NOFS); args = kmem_zalloc(sizeof(*args), KM_SLEEP | KM_NOFS);
if (!args) if (!args)
...@@ -276,6 +279,8 @@ xfs_dir_createname( ...@@ -276,6 +279,8 @@ xfs_dir_createname(
args->whichfork = XFS_DATA_FORK; args->whichfork = XFS_DATA_FORK;
args->trans = tp; args->trans = tp;
args->op_flags = XFS_DA_OP_ADDNAME | XFS_DA_OP_OKNOENT; args->op_flags = XFS_DA_OP_ADDNAME | XFS_DA_OP_OKNOENT;
if (!inum)
args->op_flags |= XFS_DA_OP_JUSTCHECK;
if (dp->i_d.di_format == XFS_DINODE_FMT_LOCAL) { if (dp->i_d.di_format == XFS_DINODE_FMT_LOCAL) {
rval = xfs_dir2_sf_addname(args); rval = xfs_dir2_sf_addname(args);
...@@ -535,62 +540,14 @@ xfs_dir_replace( ...@@ -535,62 +540,14 @@ xfs_dir_replace(
/* /*
* See if this entry can be added to the directory without allocating space. * See if this entry can be added to the directory without allocating space.
* First checks that the caller couldn't reserve enough space (resblks = 0).
*/ */
int int
xfs_dir_canenter( xfs_dir_canenter(
xfs_trans_t *tp, xfs_trans_t *tp,
xfs_inode_t *dp, xfs_inode_t *dp,
struct xfs_name *name, /* name of entry to add */ struct xfs_name *name) /* name of entry to add */
uint resblks)
{ {
struct xfs_da_args *args; return xfs_dir_createname(tp, dp, name, 0, NULL, NULL, 0);
int rval;
int v; /* type-checking value */
if (resblks)
return 0;
ASSERT(S_ISDIR(dp->i_d.di_mode));
args = kmem_zalloc(sizeof(*args), KM_SLEEP | KM_NOFS);
if (!args)
return -ENOMEM;
args->geo = dp->i_mount->m_dir_geo;
args->name = name->name;
args->namelen = name->len;
args->filetype = name->type;
args->hashval = dp->i_mount->m_dirnameops->hashname(name);
args->dp = dp;
args->whichfork = XFS_DATA_FORK;
args->trans = tp;
args->op_flags = XFS_DA_OP_JUSTCHECK | XFS_DA_OP_ADDNAME |
XFS_DA_OP_OKNOENT;
if (dp->i_d.di_format == XFS_DINODE_FMT_LOCAL) {
rval = xfs_dir2_sf_addname(args);
goto out_free;
}
rval = xfs_dir2_isblock(args, &v);
if (rval)
goto out_free;
if (v) {
rval = xfs_dir2_block_addname(args);
goto out_free;
}
rval = xfs_dir2_isleaf(args, &v);
if (rval)
goto out_free;
if (v)
rval = xfs_dir2_leaf_addname(args);
else
rval = xfs_dir2_node_addname(args);
out_free:
kmem_free(args);
return rval;
} }
/* /*
......
...@@ -136,7 +136,7 @@ extern int xfs_dir_replace(struct xfs_trans *tp, struct xfs_inode *dp, ...@@ -136,7 +136,7 @@ extern int xfs_dir_replace(struct xfs_trans *tp, struct xfs_inode *dp,
xfs_fsblock_t *first, xfs_fsblock_t *first,
struct xfs_bmap_free *flist, xfs_extlen_t tot); struct xfs_bmap_free *flist, xfs_extlen_t tot);
extern int xfs_dir_canenter(struct xfs_trans *tp, struct xfs_inode *dp, extern int xfs_dir_canenter(struct xfs_trans *tp, struct xfs_inode *dp,
struct xfs_name *name, uint resblks); struct xfs_name *name);
/* /*
* Direct call from the bmap code, bypassing the generic directory layer. * Direct call from the bmap code, bypassing the generic directory layer.
......
...@@ -1076,8 +1076,8 @@ xfs_dialloc_ag_finobt_newino( ...@@ -1076,8 +1076,8 @@ xfs_dialloc_ag_finobt_newino(
int i; int i;
if (agi->agi_newino != cpu_to_be32(NULLAGINO)) { if (agi->agi_newino != cpu_to_be32(NULLAGINO)) {
error = xfs_inobt_lookup(cur, agi->agi_newino, XFS_LOOKUP_EQ, error = xfs_inobt_lookup(cur, be32_to_cpu(agi->agi_newino),
&i); XFS_LOOKUP_EQ, &i);
if (error) if (error)
return error; return error;
if (i == 1) { if (i == 1) {
...@@ -1085,7 +1085,6 @@ xfs_dialloc_ag_finobt_newino( ...@@ -1085,7 +1085,6 @@ xfs_dialloc_ag_finobt_newino(
if (error) if (error)
return error; return error;
XFS_WANT_CORRUPTED_RETURN(i == 1); XFS_WANT_CORRUPTED_RETURN(i == 1);
return 0; return 0;
} }
} }
...@@ -2051,6 +2050,8 @@ xfs_agi_verify( ...@@ -2051,6 +2050,8 @@ xfs_agi_verify(
if (!XFS_AGI_GOOD_VERSION(be32_to_cpu(agi->agi_versionnum))) if (!XFS_AGI_GOOD_VERSION(be32_to_cpu(agi->agi_versionnum)))
return false; return false;
if (be32_to_cpu(agi->agi_level) > XFS_BTREE_MAXLEVELS)
return false;
/* /*
* during growfs operations, the perag is not fully initialised, * during growfs operations, the perag is not fully initialised,
* so we can't use it for any useful checking. growfs ensures we can't * so we can't use it for any useful checking. growfs ensures we can't
......
...@@ -424,20 +424,24 @@ xfs_rtfind_forw( ...@@ -424,20 +424,24 @@ xfs_rtfind_forw(
} }
/* /*
* Read and modify the summary information for a given extent size, * Read and/or modify the summary information for a given extent size,
* bitmap block combination. * bitmap block combination.
* Keeps track of a current summary block, so we don't keep reading * Keeps track of a current summary block, so we don't keep reading
* it from the buffer cache. * it from the buffer cache.
*
* Summary information is returned in *sum if specified.
* If no delta is specified, returns summary only.
*/ */
int int
xfs_rtmodify_summary( xfs_rtmodify_summary_int(
xfs_mount_t *mp, /* file system mount point */ xfs_mount_t *mp, /* file system mount structure */
xfs_trans_t *tp, /* transaction pointer */ xfs_trans_t *tp, /* transaction pointer */
int log, /* log2 of extent size */ int log, /* log2 of extent size */
xfs_rtblock_t bbno, /* bitmap block number */ xfs_rtblock_t bbno, /* bitmap block number */
int delta, /* change to make to summary info */ int delta, /* change to make to summary info */
xfs_buf_t **rbpp, /* in/out: summary block buffer */ xfs_buf_t **rbpp, /* in/out: summary block buffer */
xfs_fsblock_t *rsb) /* in/out: summary block number */ xfs_fsblock_t *rsb, /* in/out: summary block number */
xfs_suminfo_t *sum) /* out: summary info for this block */
{ {
xfs_buf_t *bp; /* buffer for the summary block */ xfs_buf_t *bp; /* buffer for the summary block */
int error; /* error value */ int error; /* error value */
...@@ -456,7 +460,7 @@ xfs_rtmodify_summary( ...@@ -456,7 +460,7 @@ xfs_rtmodify_summary(
/* /*
* If we have an old buffer, and the block number matches, use that. * If we have an old buffer, and the block number matches, use that.
*/ */
if (rbpp && *rbpp && *rsb == sb) if (*rbpp && *rsb == sb)
bp = *rbpp; bp = *rbpp;
/* /*
* Otherwise we have to get the buffer. * Otherwise we have to get the buffer.
...@@ -465,7 +469,7 @@ xfs_rtmodify_summary( ...@@ -465,7 +469,7 @@ xfs_rtmodify_summary(
/* /*
* If there was an old one, get rid of it first. * If there was an old one, get rid of it first.
*/ */
if (rbpp && *rbpp) if (*rbpp)
xfs_trans_brelse(tp, *rbpp); xfs_trans_brelse(tp, *rbpp);
error = xfs_rtbuf_get(mp, tp, sb, 1, &bp); error = xfs_rtbuf_get(mp, tp, sb, 1, &bp);
if (error) { if (error) {
...@@ -474,21 +478,38 @@ xfs_rtmodify_summary( ...@@ -474,21 +478,38 @@ xfs_rtmodify_summary(
/* /*
* Remember this buffer and block for the next call. * Remember this buffer and block for the next call.
*/ */
if (rbpp) {
*rbpp = bp; *rbpp = bp;
*rsb = sb; *rsb = sb;
} }
}
/* /*
* Point to the summary information, modify and log it. * Point to the summary information, modify/log it, and/or copy it out.
*/ */
sp = XFS_SUMPTR(mp, bp, so); sp = XFS_SUMPTR(mp, bp, so);
if (delta) {
uint first = (uint)((char *)sp - (char *)bp->b_addr);
*sp += delta; *sp += delta;
xfs_trans_log_buf(tp, bp, (uint)((char *)sp - (char *)bp->b_addr), xfs_trans_log_buf(tp, bp, first, first + sizeof(*sp) - 1);
(uint)((char *)sp - (char *)bp->b_addr + sizeof(*sp) - 1)); }
if (sum)
*sum = *sp;
return 0; return 0;
} }
/*
 * Thin wrapper around xfs_rtmodify_summary_int() for callers that do not
 * need the summary value handed back: every argument is forwarded unchanged
 * and NULL is passed for the trailing "sum" output parameter.
 *
 * Returns whatever xfs_rtmodify_summary_int() returns.
 */
int
xfs_rtmodify_summary(
xfs_mount_t *mp, /* file system mount structure */
xfs_trans_t *tp, /* transaction pointer */
int log, /* log2 of extent size */
xfs_rtblock_t bbno, /* bitmap block number */
int delta, /* change to make to summary info */
xfs_buf_t **rbpp, /* in/out: summary block buffer */
xfs_fsblock_t *rsb) /* in/out: summary block number */
{
return xfs_rtmodify_summary_int(mp, tp, log, bbno,
delta, rbpp, rsb, NULL);
}
/* /*
* Set the given range of bitmap bits to the given value. * Set the given range of bitmap bits to the given value.
* Do whatever I/O and logging is required. * Do whatever I/O and logging is required.
......
...@@ -279,11 +279,13 @@ xfs_mount_validate_sb( ...@@ -279,11 +279,13 @@ xfs_mount_validate_sb(
sbp->sb_blocklog < XFS_MIN_BLOCKSIZE_LOG || sbp->sb_blocklog < XFS_MIN_BLOCKSIZE_LOG ||
sbp->sb_blocklog > XFS_MAX_BLOCKSIZE_LOG || sbp->sb_blocklog > XFS_MAX_BLOCKSIZE_LOG ||
sbp->sb_blocksize != (1 << sbp->sb_blocklog) || sbp->sb_blocksize != (1 << sbp->sb_blocklog) ||
sbp->sb_dirblklog > XFS_MAX_BLOCKSIZE_LOG ||
sbp->sb_inodesize < XFS_DINODE_MIN_SIZE || sbp->sb_inodesize < XFS_DINODE_MIN_SIZE ||
sbp->sb_inodesize > XFS_DINODE_MAX_SIZE || sbp->sb_inodesize > XFS_DINODE_MAX_SIZE ||
sbp->sb_inodelog < XFS_DINODE_MIN_LOG || sbp->sb_inodelog < XFS_DINODE_MIN_LOG ||
sbp->sb_inodelog > XFS_DINODE_MAX_LOG || sbp->sb_inodelog > XFS_DINODE_MAX_LOG ||
sbp->sb_inodesize != (1 << sbp->sb_inodelog) || sbp->sb_inodesize != (1 << sbp->sb_inodelog) ||
sbp->sb_logsunit > XLOG_MAX_RECORD_BSIZE ||
sbp->sb_inopblock != howmany(sbp->sb_blocksize,sbp->sb_inodesize) || sbp->sb_inopblock != howmany(sbp->sb_blocksize,sbp->sb_inodesize) ||
(sbp->sb_blocklog - sbp->sb_inodelog != sbp->sb_inopblog) || (sbp->sb_blocklog - sbp->sb_inodelog != sbp->sb_inopblog) ||
(sbp->sb_rextsize * sbp->sb_blocksize > XFS_MAX_RTEXTSIZE) || (sbp->sb_rextsize * sbp->sb_blocksize > XFS_MAX_RTEXTSIZE) ||
...@@ -443,6 +445,8 @@ __xfs_sb_from_disk( ...@@ -443,6 +445,8 @@ __xfs_sb_from_disk(
to->sb_features_incompat = be32_to_cpu(from->sb_features_incompat); to->sb_features_incompat = be32_to_cpu(from->sb_features_incompat);
to->sb_features_log_incompat = to->sb_features_log_incompat =
be32_to_cpu(from->sb_features_log_incompat); be32_to_cpu(from->sb_features_log_incompat);
/* crc is only used on disk, not in memory; just init to 0 here. */
to->sb_crc = 0;
to->sb_pad = 0; to->sb_pad = 0;
to->sb_pquotino = be64_to_cpu(from->sb_pquotino); to->sb_pquotino = be64_to_cpu(from->sb_pquotino);
to->sb_lsn = be64_to_cpu(from->sb_lsn); to->sb_lsn = be64_to_cpu(from->sb_lsn);
...@@ -548,6 +552,9 @@ xfs_sb_to_disk( ...@@ -548,6 +552,9 @@ xfs_sb_to_disk(
if (!fields) if (!fields)
return; return;
/* We should never write the crc here, it's updated in the IO path */
fields &= ~XFS_SB_CRC;
xfs_sb_quota_to_disk(to, from, &fields); xfs_sb_quota_to_disk(to, from, &fields);
while (fields) { while (fields) {
f = (xfs_sb_field_t)xfs_lowbit64((__uint64_t)fields); f = (xfs_sb_field_t)xfs_lowbit64((__uint64_t)fields);
......
/*
* Copyright (c) 2000-2003,2005 Silicon Graphics, Inc.
* All Rights Reserved.
*
* This program is free software; you can redistribute it and/or
* modify it under the terms of the GNU General Public License as
* published by the Free Software Foundation.
*
* This program is distributed in the hope that it would be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program; if not, write the Free Software Foundation,
* Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
*/
#ifndef __XFS_SUPPORT_TIME_H__
#define __XFS_SUPPORT_TIME_H__
#include <linux/sched.h>
#include <linux/time.h>
typedef struct timespec timespec_t;
/*
 * Sleep helper: hands "ticks" straight to schedule_timeout_uninterruptible().
 * NOTE(review): the unit of "ticks" is presumably jiffies - confirm against
 * the schedule_timeout_uninterruptible() documentation.
 */
static inline void delay(long ticks)
{
schedule_timeout_uninterruptible(ticks);
}
/*
 * Store the value of the CURRENT_TIME macro into *tvp.
 * tvp is dereferenced unconditionally, so it must not be NULL.
 */
static inline void nanotime(struct timespec *tvp)
{
*tvp = CURRENT_TIME;
}
#endif /* __XFS_SUPPORT_TIME_H__ */
...@@ -434,10 +434,22 @@ xfs_start_page_writeback( ...@@ -434,10 +434,22 @@ xfs_start_page_writeback(
{ {
ASSERT(PageLocked(page)); ASSERT(PageLocked(page));
ASSERT(!PageWriteback(page)); ASSERT(!PageWriteback(page));
if (clear_dirty)
/*
* if the page was not fully cleaned, we need to ensure that the higher
* layers come back to it correctly. That means we need to keep the page
* dirty, and for WB_SYNC_ALL writeback we need to ensure the
* PAGECACHE_TAG_TOWRITE index mark is not removed so another attempt to
* write this page in this writeback sweep will be made.
*/
if (clear_dirty) {
clear_page_dirty_for_io(page); clear_page_dirty_for_io(page);
set_page_writeback(page); set_page_writeback(page);
} else
set_page_writeback_keepwrite(page);
unlock_page(page); unlock_page(page);
/* If no buffers on the page are to be written, finish it here */ /* If no buffers on the page are to be written, finish it here */
if (!buffers) if (!buffers)
end_page_writeback(page); end_page_writeback(page);
...@@ -548,6 +560,13 @@ xfs_cancel_ioend( ...@@ -548,6 +560,13 @@ xfs_cancel_ioend(
do { do {
next_bh = bh->b_private; next_bh = bh->b_private;
clear_buffer_async_write(bh); clear_buffer_async_write(bh);
/*
* The unwritten flag is cleared when added to the
* ioend. We're not submitting for I/O so mark the
* buffer unwritten again for next time around.
*/
if (ioend->io_type == XFS_IO_UNWRITTEN)
set_buffer_unwritten(bh);
unlock_buffer(bh); unlock_buffer(bh);
} while ((bh = next_bh) != NULL); } while ((bh = next_bh) != NULL);
......
...@@ -1122,14 +1122,6 @@ xfs_zero_remaining_bytes( ...@@ -1122,14 +1122,6 @@ xfs_zero_remaining_bytes(
if (endoff > XFS_ISIZE(ip)) if (endoff > XFS_ISIZE(ip))
endoff = XFS_ISIZE(ip); endoff = XFS_ISIZE(ip);
bp = xfs_buf_get_uncached(XFS_IS_REALTIME_INODE(ip) ?
mp->m_rtdev_targp : mp->m_ddev_targp,
BTOBB(mp->m_sb.sb_blocksize), 0);
if (!bp)
return -ENOMEM;
xfs_buf_unlock(bp);
for (offset = startoff; offset <= endoff; offset = lastoffset + 1) { for (offset = startoff; offset <= endoff; offset = lastoffset + 1) {
uint lock_mode; uint lock_mode;
...@@ -1152,42 +1144,24 @@ xfs_zero_remaining_bytes( ...@@ -1152,42 +1144,24 @@ xfs_zero_remaining_bytes(
ASSERT(imap.br_startblock != DELAYSTARTBLOCK); ASSERT(imap.br_startblock != DELAYSTARTBLOCK);
if (imap.br_state == XFS_EXT_UNWRITTEN) if (imap.br_state == XFS_EXT_UNWRITTEN)
continue; continue;
XFS_BUF_UNDONE(bp);
XFS_BUF_UNWRITE(bp);
XFS_BUF_READ(bp);
XFS_BUF_SET_ADDR(bp, xfs_fsb_to_db(ip, imap.br_startblock));
if (XFS_FORCED_SHUTDOWN(mp)) { error = xfs_buf_read_uncached(XFS_IS_REALTIME_INODE(ip) ?
error = -EIO; mp->m_rtdev_targp : mp->m_ddev_targp,
break; xfs_fsb_to_db(ip, imap.br_startblock),
} BTOBB(mp->m_sb.sb_blocksize),
xfs_buf_iorequest(bp); 0, &bp, NULL);
error = xfs_buf_iowait(bp); if (error)
if (error) { return error;
xfs_buf_ioerror_alert(bp,
"xfs_zero_remaining_bytes(read)");
break;
}
memset(bp->b_addr + memset(bp->b_addr +
(offset - XFS_FSB_TO_B(mp, imap.br_startoff)), (offset - XFS_FSB_TO_B(mp, imap.br_startoff)),
0, lastoffset - offset + 1); 0, lastoffset - offset + 1);
XFS_BUF_UNDONE(bp);
XFS_BUF_UNREAD(bp);
XFS_BUF_WRITE(bp);
if (XFS_FORCED_SHUTDOWN(mp)) { error = xfs_bwrite(bp);
error = -EIO; xfs_buf_relse(bp);
break; if (error)
} return error;
xfs_buf_iorequest(bp);
error = xfs_buf_iowait(bp);
if (error) {
xfs_buf_ioerror_alert(bp,
"xfs_zero_remaining_bytes(write)");
break;
}
} }
xfs_buf_free(bp);
return error; return error;
} }
...@@ -1205,6 +1179,7 @@ xfs_free_file_space( ...@@ -1205,6 +1179,7 @@ xfs_free_file_space(
xfs_bmap_free_t free_list; xfs_bmap_free_t free_list;
xfs_bmbt_irec_t imap; xfs_bmbt_irec_t imap;
xfs_off_t ioffset; xfs_off_t ioffset;
xfs_off_t iendoffset;
xfs_extlen_t mod=0; xfs_extlen_t mod=0;
xfs_mount_t *mp; xfs_mount_t *mp;
int nimap; int nimap;
...@@ -1233,12 +1208,13 @@ xfs_free_file_space( ...@@ -1233,12 +1208,13 @@ xfs_free_file_space(
inode_dio_wait(VFS_I(ip)); inode_dio_wait(VFS_I(ip));
rounding = max_t(xfs_off_t, 1 << mp->m_sb.sb_blocklog, PAGE_CACHE_SIZE); rounding = max_t(xfs_off_t, 1 << mp->m_sb.sb_blocklog, PAGE_CACHE_SIZE);
ioffset = offset & ~(rounding - 1); ioffset = round_down(offset, rounding);
error = filemap_write_and_wait_range(VFS_I(ip)->i_mapping, iendoffset = round_up(offset + len, rounding) - 1;
ioffset, -1); error = filemap_write_and_wait_range(VFS_I(ip)->i_mapping, ioffset,
iendoffset);
if (error) if (error)
goto out; goto out;
truncate_pagecache_range(VFS_I(ip), ioffset, -1); truncate_pagecache_range(VFS_I(ip), ioffset, iendoffset);
/* /*
* Need to zero the stuff we're not freeing, on disk. * Need to zero the stuff we're not freeing, on disk.
...@@ -1392,14 +1368,14 @@ xfs_zero_file_space( ...@@ -1392,14 +1368,14 @@ xfs_zero_file_space(
if (start_boundary < end_boundary - 1) { if (start_boundary < end_boundary - 1) {
/* /*
* punch out delayed allocation blocks and the page cache over * Writeback the range to ensure any inode size updates due to
* the conversion range * appending writes make it to disk (otherwise we could just
* punch out the delalloc blocks).
*/ */
xfs_ilock(ip, XFS_ILOCK_EXCL); error = filemap_write_and_wait_range(VFS_I(ip)->i_mapping,
error = xfs_bmap_punch_delalloc_range(ip, start_boundary, end_boundary - 1);
XFS_B_TO_FSBT(mp, start_boundary), if (error)
XFS_B_TO_FSB(mp, end_boundary - start_boundary)); goto out;
xfs_iunlock(ip, XFS_ILOCK_EXCL);
truncate_pagecache_range(VFS_I(ip), start_boundary, truncate_pagecache_range(VFS_I(ip), start_boundary,
end_boundary - 1); end_boundary - 1);
...@@ -1456,41 +1432,47 @@ xfs_collapse_file_space( ...@@ -1456,41 +1432,47 @@ xfs_collapse_file_space(
struct xfs_mount *mp = ip->i_mount; struct xfs_mount *mp = ip->i_mount;
struct xfs_trans *tp; struct xfs_trans *tp;
int error; int error;
xfs_extnum_t current_ext = 0;
struct xfs_bmap_free free_list; struct xfs_bmap_free free_list;
xfs_fsblock_t first_block; xfs_fsblock_t first_block;
int committed; int committed;
xfs_fileoff_t start_fsb; xfs_fileoff_t start_fsb;
xfs_fileoff_t next_fsb;
xfs_fileoff_t shift_fsb; xfs_fileoff_t shift_fsb;
ASSERT(xfs_isilocked(ip, XFS_IOLOCK_EXCL)); ASSERT(xfs_isilocked(ip, XFS_IOLOCK_EXCL));
trace_xfs_collapse_file_space(ip); trace_xfs_collapse_file_space(ip);
start_fsb = XFS_B_TO_FSB(mp, offset + len); next_fsb = XFS_B_TO_FSB(mp, offset + len);
shift_fsb = XFS_B_TO_FSB(mp, len); shift_fsb = XFS_B_TO_FSB(mp, len);
/* error = xfs_free_file_space(ip, offset, len);
* Writeback the entire file and force remove any post-eof blocks. The
* writeback prevents changes to the extent list via concurrent
* writeback and the eofblocks trim prevents the extent shift algorithm
* from running into a post-eof delalloc extent.
*
* XXX: This is a temporary fix until the extent shift loop below is
* converted to use offsets and lookups within the ILOCK rather than
* carrying around the index into the extent list for the next
* iteration.
*/
error = filemap_write_and_wait(VFS_I(ip)->i_mapping);
if (error) if (error)
return error; return error;
/*
* Trim eofblocks to avoid shifting uninitialized post-eof preallocation
* into the accessible region of the file.
*/
if (xfs_can_free_eofblocks(ip, true)) { if (xfs_can_free_eofblocks(ip, true)) {
error = xfs_free_eofblocks(mp, ip, false); error = xfs_free_eofblocks(mp, ip, false);
if (error) if (error)
return error; return error;
} }
error = xfs_free_file_space(ip, offset, len); /*
* Writeback and invalidate cache for the remainder of the file as we're
* about to shift down every extent from the collapse range to EOF. The
* free of the collapse range above might have already done some of
* this, but we shouldn't rely on it to do anything outside of the range
* that was freed.
*/
error = filemap_write_and_wait_range(VFS_I(ip)->i_mapping,
offset + len, -1);
if (error)
return error;
error = invalidate_inode_pages2_range(VFS_I(ip)->i_mapping,
(offset + len) >> PAGE_CACHE_SHIFT, -1);
if (error) if (error)
return error; return error;
...@@ -1525,9 +1507,9 @@ xfs_collapse_file_space( ...@@ -1525,9 +1507,9 @@ xfs_collapse_file_space(
* We are using the write transaction in which max 2 bmbt * We are using the write transaction in which max 2 bmbt
* updates are allowed * updates are allowed
*/ */
error = xfs_bmap_shift_extents(tp, ip, &done, start_fsb, start_fsb = next_fsb;
shift_fsb, &current_ext, error = xfs_bmap_shift_extents(tp, ip, start_fsb, shift_fsb,
&first_block, &free_list, &done, &next_fsb, &first_block, &free_list,
XFS_BMAP_MAX_SHIFT_EXTENTS); XFS_BMAP_MAX_SHIFT_EXTENTS);
if (error) if (error)
goto out; goto out;
...@@ -1638,7 +1620,7 @@ xfs_swap_extents_check_format( ...@@ -1638,7 +1620,7 @@ xfs_swap_extents_check_format(
return 0; return 0;
} }
int static int
xfs_swap_extent_flush( xfs_swap_extent_flush(
struct xfs_inode *ip) struct xfs_inode *ip)
{ {
......
This diff is collapsed.
...@@ -158,6 +158,7 @@ typedef struct xfs_buf { ...@@ -158,6 +158,7 @@ typedef struct xfs_buf {
struct list_head b_lru; /* lru list */ struct list_head b_lru; /* lru list */
spinlock_t b_lock; /* internal state lock */ spinlock_t b_lock; /* internal state lock */
unsigned int b_state; /* internal state flags */ unsigned int b_state; /* internal state flags */
int b_io_error; /* internal IO error state */
wait_queue_head_t b_waiters; /* unpin waiters */ wait_queue_head_t b_waiters; /* unpin waiters */
struct list_head b_list; struct list_head b_list;
struct xfs_perag *b_pag; /* contains rbtree root */ struct xfs_perag *b_pag; /* contains rbtree root */
...@@ -268,8 +269,8 @@ int xfs_buf_associate_memory(struct xfs_buf *bp, void *mem, size_t length); ...@@ -268,8 +269,8 @@ int xfs_buf_associate_memory(struct xfs_buf *bp, void *mem, size_t length);
struct xfs_buf *xfs_buf_get_uncached(struct xfs_buftarg *target, size_t numblks, struct xfs_buf *xfs_buf_get_uncached(struct xfs_buftarg *target, size_t numblks,
int flags); int flags);
struct xfs_buf *xfs_buf_read_uncached(struct xfs_buftarg *target, int xfs_buf_read_uncached(struct xfs_buftarg *target, xfs_daddr_t daddr,
xfs_daddr_t daddr, size_t numblks, int flags, size_t numblks, int flags, struct xfs_buf **bpp,
const struct xfs_buf_ops *ops); const struct xfs_buf_ops *ops);
void xfs_buf_hold(struct xfs_buf *bp); void xfs_buf_hold(struct xfs_buf *bp);
...@@ -286,18 +287,16 @@ extern void xfs_buf_unlock(xfs_buf_t *); ...@@ -286,18 +287,16 @@ extern void xfs_buf_unlock(xfs_buf_t *);
/* Buffer Read and Write Routines */ /* Buffer Read and Write Routines */
extern int xfs_bwrite(struct xfs_buf *bp); extern int xfs_bwrite(struct xfs_buf *bp);
extern void xfs_buf_ioend(xfs_buf_t *, int); extern void xfs_buf_ioend(struct xfs_buf *bp);
extern void xfs_buf_ioerror(xfs_buf_t *, int); extern void xfs_buf_ioerror(xfs_buf_t *, int);
extern void xfs_buf_ioerror_alert(struct xfs_buf *, const char *func); extern void xfs_buf_ioerror_alert(struct xfs_buf *, const char *func);
extern void xfs_buf_iorequest(xfs_buf_t *); extern void xfs_buf_submit(struct xfs_buf *bp);
extern int xfs_buf_iowait(xfs_buf_t *); extern int xfs_buf_submit_wait(struct xfs_buf *bp);
extern void xfs_buf_iomove(xfs_buf_t *, size_t, size_t, void *, extern void xfs_buf_iomove(xfs_buf_t *, size_t, size_t, void *,
xfs_buf_rw_t); xfs_buf_rw_t);
#define xfs_buf_zero(bp, off, len) \ #define xfs_buf_zero(bp, off, len) \
xfs_buf_iomove((bp), (off), (len), NULL, XBRW_ZERO) xfs_buf_iomove((bp), (off), (len), NULL, XBRW_ZERO)
extern int xfs_bioerror_relse(struct xfs_buf *);
/* Buffer Utility Routines */ /* Buffer Utility Routines */
extern xfs_caddr_t xfs_buf_offset(xfs_buf_t *, size_t); extern xfs_caddr_t xfs_buf_offset(xfs_buf_t *, size_t);
......
...@@ -491,7 +491,7 @@ xfs_buf_item_unpin( ...@@ -491,7 +491,7 @@ xfs_buf_item_unpin(
xfs_buf_ioerror(bp, -EIO); xfs_buf_ioerror(bp, -EIO);
XFS_BUF_UNDONE(bp); XFS_BUF_UNDONE(bp);
xfs_buf_stale(bp); xfs_buf_stale(bp);
xfs_buf_ioend(bp, 0); xfs_buf_ioend(bp);
} }
} }
...@@ -501,7 +501,7 @@ xfs_buf_item_unpin( ...@@ -501,7 +501,7 @@ xfs_buf_item_unpin(
* buffer being bad.. * buffer being bad..
*/ */
DEFINE_RATELIMIT_STATE(xfs_buf_write_fail_rl_state, 30 * HZ, 10); static DEFINE_RATELIMIT_STATE(xfs_buf_write_fail_rl_state, 30 * HZ, 10);
STATIC uint STATIC uint
xfs_buf_item_push( xfs_buf_item_push(
...@@ -1081,7 +1081,7 @@ xfs_buf_iodone_callbacks( ...@@ -1081,7 +1081,7 @@ xfs_buf_iodone_callbacks(
* a way to shut the filesystem down if the writes keep failing. * a way to shut the filesystem down if the writes keep failing.
* *
* In practice we'll shut the filesystem down soon as non-transient * In practice we'll shut the filesystem down soon as non-transient
* erorrs tend to affect the whole device and a failing log write * errors tend to affect the whole device and a failing log write
* will make us give up. But we really ought to do better here. * will make us give up. But we really ought to do better here.
*/ */
if (XFS_BUF_ISASYNC(bp)) { if (XFS_BUF_ISASYNC(bp)) {
...@@ -1094,7 +1094,7 @@ xfs_buf_iodone_callbacks( ...@@ -1094,7 +1094,7 @@ xfs_buf_iodone_callbacks(
if (!(bp->b_flags & (XBF_STALE|XBF_WRITE_FAIL))) { if (!(bp->b_flags & (XBF_STALE|XBF_WRITE_FAIL))) {
bp->b_flags |= XBF_WRITE | XBF_ASYNC | bp->b_flags |= XBF_WRITE | XBF_ASYNC |
XBF_DONE | XBF_WRITE_FAIL; XBF_DONE | XBF_WRITE_FAIL;
xfs_buf_iorequest(bp); xfs_buf_submit(bp);
} else { } else {
xfs_buf_relse(bp); xfs_buf_relse(bp);
} }
...@@ -1115,7 +1115,7 @@ xfs_buf_iodone_callbacks( ...@@ -1115,7 +1115,7 @@ xfs_buf_iodone_callbacks(
xfs_buf_do_callbacks(bp); xfs_buf_do_callbacks(bp);
bp->b_fspriv = NULL; bp->b_fspriv = NULL;
bp->b_iodone = NULL; bp->b_iodone = NULL;
xfs_buf_ioend(bp, 0); xfs_buf_ioend(bp);
} }
/* /*
......
...@@ -983,7 +983,7 @@ xfs_vm_page_mkwrite( ...@@ -983,7 +983,7 @@ xfs_vm_page_mkwrite(
/* /*
* This type is designed to indicate the type of offset we would like * This type is designed to indicate the type of offset we would like
* to search from page cache for either xfs_seek_data() or xfs_seek_hole(). * to search from page cache for xfs_seek_hole_data().
*/ */
enum { enum {
HOLE_OFF = 0, HOLE_OFF = 0,
...@@ -1040,7 +1040,7 @@ xfs_lookup_buffer_offset( ...@@ -1040,7 +1040,7 @@ xfs_lookup_buffer_offset(
/* /*
* This routine is called to find out and return a data or hole offset * This routine is called to find out and return a data or hole offset
* from the page cache for unwritten extents according to the desired * from the page cache for unwritten extents according to the desired
* type for xfs_seek_data() or xfs_seek_hole(). * type for xfs_seek_hole_data().
* *
* The argument offset is used to tell where we start to search from the * The argument offset is used to tell where we start to search from the
* page cache. Map is used to figure out the end points of the range to * page cache. Map is used to figure out the end points of the range to
...@@ -1200,9 +1200,10 @@ xfs_find_get_desired_pgoff( ...@@ -1200,9 +1200,10 @@ xfs_find_get_desired_pgoff(
} }
STATIC loff_t STATIC loff_t
xfs_seek_data( xfs_seek_hole_data(
struct file *file, struct file *file,
loff_t start) loff_t start,
int whence)
{ {
struct inode *inode = file->f_mapping->host; struct inode *inode = file->f_mapping->host;
struct xfs_inode *ip = XFS_I(inode); struct xfs_inode *ip = XFS_I(inode);
...@@ -1214,6 +1215,9 @@ xfs_seek_data( ...@@ -1214,6 +1215,9 @@ xfs_seek_data(
uint lock; uint lock;
int error; int error;
if (XFS_FORCED_SHUTDOWN(mp))
return -EIO;
lock = xfs_ilock_data_map_shared(ip); lock = xfs_ilock_data_map_shared(ip);
isize = i_size_read(inode); isize = i_size_read(inode);
...@@ -1228,6 +1232,7 @@ xfs_seek_data( ...@@ -1228,6 +1232,7 @@ xfs_seek_data(
*/ */
fsbno = XFS_B_TO_FSBT(mp, start); fsbno = XFS_B_TO_FSBT(mp, start);
end = XFS_B_TO_FSB(mp, isize); end = XFS_B_TO_FSB(mp, isize);
for (;;) { for (;;) {
struct xfs_bmbt_irec map[2]; struct xfs_bmbt_irec map[2];
int nmap = 2; int nmap = 2;
...@@ -1248,155 +1253,79 @@ xfs_seek_data( ...@@ -1248,155 +1253,79 @@ xfs_seek_data(
offset = max_t(loff_t, start, offset = max_t(loff_t, start,
XFS_FSB_TO_B(mp, map[i].br_startoff)); XFS_FSB_TO_B(mp, map[i].br_startoff));
/* Landed in a data extent */ /* Landed in the hole we wanted? */
if (map[i].br_startblock == DELAYSTARTBLOCK || if (whence == SEEK_HOLE &&
map[i].br_startblock == HOLESTARTBLOCK)
goto out;
/* Landed in the data extent we wanted? */
if (whence == SEEK_DATA &&
(map[i].br_startblock == DELAYSTARTBLOCK ||
(map[i].br_state == XFS_EXT_NORM && (map[i].br_state == XFS_EXT_NORM &&
!isnullstartblock(map[i].br_startblock))) !isnullstartblock(map[i].br_startblock))))
goto out; goto out;
/* /*
* Landed in an unwritten extent, try to search data * Landed in an unwritten extent, try to search
* from page cache. * for hole or data from page cache.
*/ */
if (map[i].br_state == XFS_EXT_UNWRITTEN) { if (map[i].br_state == XFS_EXT_UNWRITTEN) {
if (xfs_find_get_desired_pgoff(inode, &map[i], if (xfs_find_get_desired_pgoff(inode, &map[i],
DATA_OFF, &offset)) whence == SEEK_HOLE ? HOLE_OFF : DATA_OFF,
&offset))
goto out; goto out;
} }
} }
/* /*
* map[0] is hole or its an unwritten extent but * We only received one extent out of the two requested. This
* without data in page cache. Probably means that * means we've hit EOF and didn't find what we are looking for.
* we are reading after EOF if nothing in map[1].
*/ */
if (nmap == 1) { if (nmap == 1) {
error = -ENXIO;
goto out_unlock;
}
ASSERT(i > 1);
/*
* Nothing was found, proceed to the next round of search
* if reading offset not beyond or hit EOF.
*/
fsbno = map[i - 1].br_startoff + map[i - 1].br_blockcount;
start = XFS_FSB_TO_B(mp, fsbno);
if (start >= isize) {
error = -ENXIO;
goto out_unlock;
}
}
out:
offset = vfs_setpos(file, offset, inode->i_sb->s_maxbytes);
out_unlock:
xfs_iunlock(ip, lock);
if (error)
return error;
return offset;
}
STATIC loff_t
xfs_seek_hole(
struct file *file,
loff_t start)
{
struct inode *inode = file->f_mapping->host;
struct xfs_inode *ip = XFS_I(inode);
struct xfs_mount *mp = ip->i_mount;
loff_t uninitialized_var(offset);
xfs_fsize_t isize;
xfs_fileoff_t fsbno;
xfs_filblks_t end;
uint lock;
int error;
if (XFS_FORCED_SHUTDOWN(mp))
return -EIO;
lock = xfs_ilock_data_map_shared(ip);
isize = i_size_read(inode);
if (start >= isize) {
error = -ENXIO;
goto out_unlock;
}
fsbno = XFS_B_TO_FSBT(mp, start);
end = XFS_B_TO_FSB(mp, isize);
for (;;) {
struct xfs_bmbt_irec map[2];
int nmap = 2;
unsigned int i;
error = xfs_bmapi_read(ip, fsbno, end - fsbno, map, &nmap,
XFS_BMAPI_ENTIRE);
if (error)
goto out_unlock;
/* No extents at given offset, must be beyond EOF */
if (nmap == 0) {
error = -ENXIO;
goto out_unlock;
}
for (i = 0; i < nmap; i++) {
offset = max_t(loff_t, start,
XFS_FSB_TO_B(mp, map[i].br_startoff));
/* Landed in a hole */
if (map[i].br_startblock == HOLESTARTBLOCK)
goto out;
/*
* Landed in an unwritten extent, try to search hole
* from page cache.
*/
if (map[i].br_state == XFS_EXT_UNWRITTEN) {
if (xfs_find_get_desired_pgoff(inode, &map[i],
HOLE_OFF, &offset))
goto out;
}
}
/* /*
* map[0] contains data or its unwritten but contains * If we were looking for a hole, set offset to
* data in page cache, probably means that we are * the end of the file (i.e., there is an implicit
* reading after EOF. We should fix offset to point
* to the end of the file(i.e., there is an implicit
* hole at the end of any file). * hole at the end of any file).
*/ */
if (nmap == 1) { if (whence == SEEK_HOLE) {
offset = isize; offset = isize;
break; break;
} }
/*
* If we were looking for data, it's nowhere to be found
*/
ASSERT(whence == SEEK_DATA);
error = -ENXIO;
goto out_unlock;
}
ASSERT(i > 1); ASSERT(i > 1);
/* /*
* Both mappings contains data, proceed to the next round of * Nothing was found, proceed to the next round of search
* search if the current reading offset not beyond or hit EOF. * if the next reading offset is not at or beyond EOF.
*/ */
fsbno = map[i - 1].br_startoff + map[i - 1].br_blockcount; fsbno = map[i - 1].br_startoff + map[i - 1].br_blockcount;
start = XFS_FSB_TO_B(mp, fsbno); start = XFS_FSB_TO_B(mp, fsbno);
if (start >= isize) { if (start >= isize) {
if (whence == SEEK_HOLE) {
offset = isize; offset = isize;
break; break;
} }
ASSERT(whence == SEEK_DATA);
error = -ENXIO;
goto out_unlock;
}
} }
out: out:
/* /*
* At this point, we must have found a hole. However, the returned * If at this point we have found the hole we wanted, the returned
* offset may be bigger than the file size as it may be aligned to * offset may be bigger than the file size as it may be aligned to
* page boundary for unwritten extents, we need to deal with this * page boundary for unwritten extents. We need to deal with this
* situation in particular. * situation in particular.
*/ */
if (whence == SEEK_HOLE)
offset = min_t(loff_t, offset, isize); offset = min_t(loff_t, offset, isize);
offset = vfs_setpos(file, offset, inode->i_sb->s_maxbytes); offset = vfs_setpos(file, offset, inode->i_sb->s_maxbytes);
...@@ -1412,17 +1341,16 @@ STATIC loff_t ...@@ -1412,17 +1341,16 @@ STATIC loff_t
xfs_file_llseek( xfs_file_llseek(
struct file *file, struct file *file,
loff_t offset, loff_t offset,
int origin) int whence)
{ {
switch (origin) { switch (whence) {
case SEEK_END: case SEEK_END:
case SEEK_CUR: case SEEK_CUR:
case SEEK_SET: case SEEK_SET:
return generic_file_llseek(file, offset, origin); return generic_file_llseek(file, offset, whence);
case SEEK_DATA:
return xfs_seek_data(file, offset);
case SEEK_HOLE: case SEEK_HOLE:
return xfs_seek_hole(file, offset); case SEEK_DATA:
return xfs_seek_hole_data(file, offset, whence);
default: default:
return -EINVAL; return -EINVAL;
} }
......
...@@ -172,16 +172,11 @@ xfs_growfs_data_private( ...@@ -172,16 +172,11 @@ xfs_growfs_data_private(
if ((error = xfs_sb_validate_fsb_count(&mp->m_sb, nb))) if ((error = xfs_sb_validate_fsb_count(&mp->m_sb, nb)))
return error; return error;
dpct = pct - mp->m_sb.sb_imax_pct; dpct = pct - mp->m_sb.sb_imax_pct;
bp = xfs_buf_read_uncached(mp->m_ddev_targp, error = xfs_buf_read_uncached(mp->m_ddev_targp,
XFS_FSB_TO_BB(mp, nb) - XFS_FSS_TO_BB(mp, 1), XFS_FSB_TO_BB(mp, nb) - XFS_FSS_TO_BB(mp, 1),
XFS_FSS_TO_BB(mp, 1), 0, NULL); XFS_FSS_TO_BB(mp, 1), 0, &bp, NULL);
if (!bp) if (error)
return -EIO;
if (bp->b_error) {
error = bp->b_error;
xfs_buf_relse(bp);
return error; return error;
}
xfs_buf_relse(bp); xfs_buf_relse(bp);
new = nb; /* use new as a temporary here */ new = nb; /* use new as a temporary here */
......
...@@ -43,3 +43,7 @@ xfs_param_t xfs_params = { ...@@ -43,3 +43,7 @@ xfs_param_t xfs_params = {
.fstrm_timer = { 1, 30*100, 3600*100}, .fstrm_timer = { 1, 30*100, 3600*100},
.eofb_timer = { 1, 300, 3600*24}, .eofb_timer = { 1, 300, 3600*24},
}; };
struct xfs_globals xfs_globals = {
.log_recovery_delay = 0, /* no delay by default */
};
...@@ -33,7 +33,6 @@ ...@@ -33,7 +33,6 @@
#include "xfs_trace.h" #include "xfs_trace.h"
#include "xfs_icache.h" #include "xfs_icache.h"
#include "xfs_bmap_util.h" #include "xfs_bmap_util.h"
#include "xfs_quota.h"
#include "xfs_dquot_item.h" #include "xfs_dquot_item.h"
#include "xfs_dquot.h" #include "xfs_dquot.h"
......
...@@ -654,7 +654,7 @@ xfs_ialloc( ...@@ -654,7 +654,7 @@ xfs_ialloc(
xfs_inode_t *ip; xfs_inode_t *ip;
uint flags; uint flags;
int error; int error;
timespec_t tv; struct timespec tv;
/* /*
* Call the space management code to pick * Call the space management code to pick
...@@ -720,7 +720,7 @@ xfs_ialloc( ...@@ -720,7 +720,7 @@ xfs_ialloc(
ip->i_d.di_nextents = 0; ip->i_d.di_nextents = 0;
ASSERT(ip->i_d.di_nblocks == 0); ASSERT(ip->i_d.di_nblocks == 0);
nanotime(&tv); tv = current_fs_time(mp->m_super);
ip->i_d.di_mtime.t_sec = (__int32_t)tv.tv_sec; ip->i_d.di_mtime.t_sec = (__int32_t)tv.tv_sec;
ip->i_d.di_mtime.t_nsec = (__int32_t)tv.tv_nsec; ip->i_d.di_mtime.t_nsec = (__int32_t)tv.tv_nsec;
ip->i_d.di_atime = ip->i_d.di_mtime; ip->i_d.di_atime = ip->i_d.di_mtime;
...@@ -769,6 +769,8 @@ xfs_ialloc( ...@@ -769,6 +769,8 @@ xfs_ialloc(
di_flags |= XFS_DIFLAG_EXTSZINHERIT; di_flags |= XFS_DIFLAG_EXTSZINHERIT;
ip->i_d.di_extsize = pip->i_d.di_extsize; ip->i_d.di_extsize = pip->i_d.di_extsize;
} }
if (pip->i_d.di_flags & XFS_DIFLAG_PROJINHERIT)
di_flags |= XFS_DIFLAG_PROJINHERIT;
} else if (S_ISREG(mode)) { } else if (S_ISREG(mode)) {
if (pip->i_d.di_flags & XFS_DIFLAG_RTINHERIT) if (pip->i_d.di_flags & XFS_DIFLAG_RTINHERIT)
di_flags |= XFS_DIFLAG_REALTIME; di_flags |= XFS_DIFLAG_REALTIME;
...@@ -789,8 +791,6 @@ xfs_ialloc( ...@@ -789,8 +791,6 @@ xfs_ialloc(
if ((pip->i_d.di_flags & XFS_DIFLAG_NOSYMLINKS) && if ((pip->i_d.di_flags & XFS_DIFLAG_NOSYMLINKS) &&
xfs_inherit_nosymlinks) xfs_inherit_nosymlinks)
di_flags |= XFS_DIFLAG_NOSYMLINKS; di_flags |= XFS_DIFLAG_NOSYMLINKS;
if (pip->i_d.di_flags & XFS_DIFLAG_PROJINHERIT)
di_flags |= XFS_DIFLAG_PROJINHERIT;
if ((pip->i_d.di_flags & XFS_DIFLAG_NODEFRAG) && if ((pip->i_d.di_flags & XFS_DIFLAG_NODEFRAG) &&
xfs_inherit_nodefrag) xfs_inherit_nodefrag)
di_flags |= XFS_DIFLAG_NODEFRAG; di_flags |= XFS_DIFLAG_NODEFRAG;
...@@ -1153,9 +1153,11 @@ xfs_create( ...@@ -1153,9 +1153,11 @@ xfs_create(
if (error) if (error)
goto out_trans_cancel; goto out_trans_cancel;
error = xfs_dir_canenter(tp, dp, name, resblks); if (!resblks) {
error = xfs_dir_canenter(tp, dp, name);
if (error) if (error)
goto out_trans_cancel; goto out_trans_cancel;
}
/* /*
* A newly created regular or special file just has one directory * A newly created regular or special file just has one directory
...@@ -1421,9 +1423,11 @@ xfs_link( ...@@ -1421,9 +1423,11 @@ xfs_link(
goto error_return; goto error_return;
} }
error = xfs_dir_canenter(tp, tdp, target_name, resblks); if (!resblks) {
error = xfs_dir_canenter(tp, tdp, target_name);
if (error) if (error)
goto error_return; goto error_return;
}
xfs_bmap_init(&free_list, &first_block); xfs_bmap_init(&free_list, &first_block);
...@@ -2759,9 +2763,11 @@ xfs_rename( ...@@ -2759,9 +2763,11 @@ xfs_rename(
* If there's no space reservation, check the entry will * If there's no space reservation, check the entry will
* fit before actually inserting it. * fit before actually inserting it.
*/ */
error = xfs_dir_canenter(tp, target_dp, target_name, spaceres); if (!spaceres) {
error = xfs_dir_canenter(tp, target_dp, target_name);
if (error) if (error)
goto error_return; goto error_return;
}
/* /*
* If target does not exist and the rename crosses * If target does not exist and the rename crosses
* directories, adjust the target directory link count * directories, adjust the target directory link count
...@@ -3056,7 +3062,7 @@ xfs_iflush_cluster( ...@@ -3056,7 +3062,7 @@ xfs_iflush_cluster(
XFS_BUF_UNDONE(bp); XFS_BUF_UNDONE(bp);
xfs_buf_stale(bp); xfs_buf_stale(bp);
xfs_buf_ioerror(bp, -EIO); xfs_buf_ioerror(bp, -EIO);
xfs_buf_ioend(bp, 0); xfs_buf_ioend(bp);
} else { } else {
xfs_buf_stale(bp); xfs_buf_stale(bp);
xfs_buf_relse(bp); xfs_buf_relse(bp);
......
...@@ -102,7 +102,7 @@ xfs_new_eof(struct xfs_inode *ip, xfs_fsize_t new_size) ...@@ -102,7 +102,7 @@ xfs_new_eof(struct xfs_inode *ip, xfs_fsize_t new_size)
{ {
xfs_fsize_t i_size = i_size_read(VFS_I(ip)); xfs_fsize_t i_size = i_size_read(VFS_I(ip));
if (new_size > i_size) if (new_size > i_size || new_size < 0)
new_size = i_size; new_size = i_size;
return new_size > ip->i_d.di_size ? new_size : 0; return new_size > ip->i_d.di_size ? new_size : 0;
} }
......
...@@ -615,7 +615,7 @@ xfs_iflush_done( ...@@ -615,7 +615,7 @@ xfs_iflush_done(
blip = bp->b_fspriv; blip = bp->b_fspriv;
prev = NULL; prev = NULL;
while (blip != NULL) { while (blip != NULL) {
if (lip->li_cb != xfs_iflush_done) { if (blip->li_cb != xfs_iflush_done) {
prev = blip; prev = blip;
blip = blip->li_bio_list; blip = blip->li_bio_list;
continue; continue;
......
...@@ -968,8 +968,6 @@ xfs_set_diflags( ...@@ -968,8 +968,6 @@ xfs_set_diflags(
di_flags |= XFS_DIFLAG_NOATIME; di_flags |= XFS_DIFLAG_NOATIME;
if (xflags & XFS_XFLAG_NODUMP) if (xflags & XFS_XFLAG_NODUMP)
di_flags |= XFS_DIFLAG_NODUMP; di_flags |= XFS_DIFLAG_NODUMP;
if (xflags & XFS_XFLAG_PROJINHERIT)
di_flags |= XFS_DIFLAG_PROJINHERIT;
if (xflags & XFS_XFLAG_NODEFRAG) if (xflags & XFS_XFLAG_NODEFRAG)
di_flags |= XFS_DIFLAG_NODEFRAG; di_flags |= XFS_DIFLAG_NODEFRAG;
if (xflags & XFS_XFLAG_FILESTREAM) if (xflags & XFS_XFLAG_FILESTREAM)
...@@ -981,6 +979,8 @@ xfs_set_diflags( ...@@ -981,6 +979,8 @@ xfs_set_diflags(
di_flags |= XFS_DIFLAG_NOSYMLINKS; di_flags |= XFS_DIFLAG_NOSYMLINKS;
if (xflags & XFS_XFLAG_EXTSZINHERIT) if (xflags & XFS_XFLAG_EXTSZINHERIT)
di_flags |= XFS_DIFLAG_EXTSZINHERIT; di_flags |= XFS_DIFLAG_EXTSZINHERIT;
if (xflags & XFS_XFLAG_PROJINHERIT)
di_flags |= XFS_DIFLAG_PROJINHERIT;
} else if (S_ISREG(ip->i_d.di_mode)) { } else if (S_ISREG(ip->i_d.di_mode)) {
if (xflags & XFS_XFLAG_REALTIME) if (xflags & XFS_XFLAG_REALTIME)
di_flags |= XFS_DIFLAG_REALTIME; di_flags |= XFS_DIFLAG_REALTIME;
...@@ -1231,13 +1231,25 @@ xfs_ioctl_setattr( ...@@ -1231,13 +1231,25 @@ xfs_ioctl_setattr(
} }
if (mask & FSX_EXTSIZE)
ip->i_d.di_extsize = fa->fsx_extsize >> mp->m_sb.sb_blocklog;
if (mask & FSX_XFLAGS) { if (mask & FSX_XFLAGS) {
xfs_set_diflags(ip, fa->fsx_xflags); xfs_set_diflags(ip, fa->fsx_xflags);
xfs_diflags_to_linux(ip); xfs_diflags_to_linux(ip);
} }
/*
* Only set the extent size hint if we've already determined that the
* extent size hint should be set on the inode. If no extent size flags
* are set on the inode then unconditionally clear the extent size hint.
*/
if (mask & FSX_EXTSIZE) {
int extsize = 0;
if (ip->i_d.di_flags &
(XFS_DIFLAG_EXTSIZE | XFS_DIFLAG_EXTSZINHERIT))
extsize = fa->fsx_extsize >> mp->m_sb.sb_blocklog;
ip->i_d.di_extsize = extsize;
}
xfs_trans_ichgtime(tp, ip, XFS_ICHGTIME_CHG); xfs_trans_ichgtime(tp, ip, XFS_ICHGTIME_CHG);
xfs_trans_log_inode(tp, ip, XFS_ILOG_CORE); xfs_trans_log_inode(tp, ip, XFS_ILOG_CORE);
...@@ -1349,7 +1361,7 @@ xfs_ioc_setxflags( ...@@ -1349,7 +1361,7 @@ xfs_ioc_setxflags(
STATIC int STATIC int
xfs_getbmap_format(void **ap, struct getbmapx *bmv, int *full) xfs_getbmap_format(void **ap, struct getbmapx *bmv, int *full)
{ {
struct getbmap __user *base = *ap; struct getbmap __user *base = (struct getbmap __user *)*ap;
/* copy only getbmap portion (not getbmapx) */ /* copy only getbmap portion (not getbmapx) */
if (copy_to_user(base, bmv, sizeof(struct getbmap))) if (copy_to_user(base, bmv, sizeof(struct getbmap)))
...@@ -1380,7 +1392,7 @@ xfs_ioc_getbmap( ...@@ -1380,7 +1392,7 @@ xfs_ioc_getbmap(
bmx.bmv_iflags |= BMV_IF_NO_DMAPI_READ; bmx.bmv_iflags |= BMV_IF_NO_DMAPI_READ;
error = xfs_getbmap(ip, &bmx, xfs_getbmap_format, error = xfs_getbmap(ip, &bmx, xfs_getbmap_format,
(struct getbmap *)arg+1); (__force struct getbmap *)arg+1);
if (error) if (error)
return error; return error;
...@@ -1393,7 +1405,7 @@ xfs_ioc_getbmap( ...@@ -1393,7 +1405,7 @@ xfs_ioc_getbmap(
STATIC int STATIC int
xfs_getbmapx_format(void **ap, struct getbmapx *bmv, int *full) xfs_getbmapx_format(void **ap, struct getbmapx *bmv, int *full)
{ {
struct getbmapx __user *base = *ap; struct getbmapx __user *base = (struct getbmapx __user *)*ap;
if (copy_to_user(base, bmv, sizeof(struct getbmapx))) if (copy_to_user(base, bmv, sizeof(struct getbmapx)))
return -EFAULT; return -EFAULT;
...@@ -1420,7 +1432,7 @@ xfs_ioc_getbmapx( ...@@ -1420,7 +1432,7 @@ xfs_ioc_getbmapx(
return -EINVAL; return -EINVAL;
error = xfs_getbmap(ip, &bmx, xfs_getbmapx_format, error = xfs_getbmap(ip, &bmx, xfs_getbmapx_format,
(struct getbmapx *)arg+1); (__force struct getbmapx *)arg+1);
if (error) if (error)
return error; return error;
......
...@@ -160,6 +160,7 @@ xfs_ioctl32_bstat_copyin( ...@@ -160,6 +160,7 @@ xfs_ioctl32_bstat_copyin(
get_user(bstat->bs_gen, &bstat32->bs_gen) || get_user(bstat->bs_gen, &bstat32->bs_gen) ||
get_user(bstat->bs_projid_lo, &bstat32->bs_projid_lo) || get_user(bstat->bs_projid_lo, &bstat32->bs_projid_lo) ||
get_user(bstat->bs_projid_hi, &bstat32->bs_projid_hi) || get_user(bstat->bs_projid_hi, &bstat32->bs_projid_hi) ||
get_user(bstat->bs_forkoff, &bstat32->bs_forkoff) ||
get_user(bstat->bs_dmevmask, &bstat32->bs_dmevmask) || get_user(bstat->bs_dmevmask, &bstat32->bs_dmevmask) ||
get_user(bstat->bs_dmstate, &bstat32->bs_dmstate) || get_user(bstat->bs_dmstate, &bstat32->bs_dmstate) ||
get_user(bstat->bs_aextents, &bstat32->bs_aextents)) get_user(bstat->bs_aextents, &bstat32->bs_aextents))
...@@ -214,6 +215,7 @@ xfs_bulkstat_one_fmt_compat( ...@@ -214,6 +215,7 @@ xfs_bulkstat_one_fmt_compat(
put_user(buffer->bs_gen, &p32->bs_gen) || put_user(buffer->bs_gen, &p32->bs_gen) ||
put_user(buffer->bs_projid, &p32->bs_projid) || put_user(buffer->bs_projid, &p32->bs_projid) ||
put_user(buffer->bs_projid_hi, &p32->bs_projid_hi) || put_user(buffer->bs_projid_hi, &p32->bs_projid_hi) ||
put_user(buffer->bs_forkoff, &p32->bs_forkoff) ||
put_user(buffer->bs_dmevmask, &p32->bs_dmevmask) || put_user(buffer->bs_dmevmask, &p32->bs_dmevmask) ||
put_user(buffer->bs_dmstate, &p32->bs_dmstate) || put_user(buffer->bs_dmstate, &p32->bs_dmstate) ||
put_user(buffer->bs_aextents, &p32->bs_aextents)) put_user(buffer->bs_aextents, &p32->bs_aextents))
......
...@@ -67,8 +67,9 @@ typedef struct compat_xfs_bstat { ...@@ -67,8 +67,9 @@ typedef struct compat_xfs_bstat {
__u32 bs_gen; /* generation count */ __u32 bs_gen; /* generation count */
__u16 bs_projid_lo; /* lower part of project id */ __u16 bs_projid_lo; /* lower part of project id */
#define bs_projid bs_projid_lo /* (previously just bs_projid) */ #define bs_projid bs_projid_lo /* (previously just bs_projid) */
__u16 bs_forkoff; /* inode fork offset in bytes */
__u16 bs_projid_hi; /* high part of project id */ __u16 bs_projid_hi; /* high part of project id */
unsigned char bs_pad[12]; /* pad space, unused */ unsigned char bs_pad[10]; /* pad space, unused */
__u32 bs_dmevmask; /* DMIG event mask */ __u32 bs_dmevmask; /* DMIG event mask */
__u16 bs_dmstate; /* DMIG state info */ __u16 bs_dmstate; /* DMIG state info */
__u16 bs_aextents; /* attribute number of extents */ __u16 bs_aextents; /* attribute number of extents */
......
...@@ -404,8 +404,8 @@ xfs_quota_calc_throttle( ...@@ -404,8 +404,8 @@ xfs_quota_calc_throttle(
int shift = 0; int shift = 0;
struct xfs_dquot *dq = xfs_inode_dquot(ip, type); struct xfs_dquot *dq = xfs_inode_dquot(ip, type);
/* over hi wmark, squash the prealloc completely */ /* no dq, or over hi wmark, squash the prealloc completely */
if (dq->q_res_bcount >= dq->q_prealloc_hi_wmark) { if (!dq || dq->q_res_bcount >= dq->q_prealloc_hi_wmark) {
*qblocks = 0; *qblocks = 0;
*qfreesp = 0; *qfreesp = 0;
return; return;
......
...@@ -849,6 +849,36 @@ xfs_setattr_size( ...@@ -849,6 +849,36 @@ xfs_setattr_size(
return error; return error;
truncate_setsize(inode, newsize); truncate_setsize(inode, newsize);
/*
* The "we can't serialise against page faults" pain gets worse.
*
* If the file is mapped then we have to clean the page at the old EOF
* when extending the file. Extending the file can expose changes to the
* underlying page mapping (e.g. from beyond EOF to a hole or
* unwritten), and so on the next attempt to write to that page we need
* to remap it for write. i.e. we need .page_mkwrite() to be called.
* Hence we need to clean the page to clean the pte and so a new write
* fault will be triggered appropriately.
*
* If we do it before we change the inode size, then we can race with a
* page fault that maps the page with exactly the same problem. If we do
* it after we change the file size, then a new page fault can come in
* and allocate space before we've run the rest of the truncate
* transaction. That's kinda grotesque, but it's better than having data
* over a hole, and so that's the lesser evil that has been chosen here.
*
* The real solution, however, is to have some mechanism for locking out
* page faults while a truncate is in progress.
*/
if (newsize > oldsize && mapping_mapped(VFS_I(ip)->i_mapping)) {
error = filemap_write_and_wait_range(
VFS_I(ip)->i_mapping,
round_down(oldsize, PAGE_CACHE_SIZE),
round_up(oldsize, PAGE_CACHE_SIZE) - 1);
if (error)
return error;
}
tp = xfs_trans_alloc(mp, XFS_TRANS_SETATTR_SIZE); tp = xfs_trans_alloc(mp, XFS_TRANS_SETATTR_SIZE);
error = xfs_trans_reserve(tp, &M_RES(mp)->tr_itruncate, 0, 0); error = xfs_trans_reserve(tp, &M_RES(mp)->tr_itruncate, 0, 0);
if (error) if (error)
......
...@@ -639,7 +639,8 @@ xfs_inumbers( ...@@ -639,7 +639,8 @@ xfs_inumbers(
xfs_buf_relse(agbp); xfs_buf_relse(agbp);
agbp = NULL; agbp = NULL;
agino = 0; agino = 0;
} while (++agno < mp->m_sb.sb_agcount); agno++;
} while (agno < mp->m_sb.sb_agcount);
if (!error) { if (!error) {
if (bufidx) { if (bufidx) {
......
...@@ -56,7 +56,6 @@ typedef __uint64_t __psunsigned_t; ...@@ -56,7 +56,6 @@ typedef __uint64_t __psunsigned_t;
#include "kmem.h" #include "kmem.h"
#include "mrlock.h" #include "mrlock.h"
#include "time.h"
#include "uuid.h" #include "uuid.h"
#include <linux/semaphore.h> #include <linux/semaphore.h>
...@@ -179,6 +178,11 @@ typedef __uint64_t __psunsigned_t; ...@@ -179,6 +178,11 @@ typedef __uint64_t __psunsigned_t;
#define MAX(a,b) (max(a,b)) #define MAX(a,b) (max(a,b))
#define howmany(x, y) (((x)+((y)-1))/(y)) #define howmany(x, y) (((x)+((y)-1))/(y))
/*
 * Thin wrapper that hands the requested tick count straight to
 * schedule_timeout_uninterruptible() and ignores its return value.
 * NOTE(review): ticks is presumably a jiffies count - confirm with callers.
 */
static inline void delay(long ticks)
{
schedule_timeout_uninterruptible(ticks);
}
/* /*
* XFS wrapper structure for sysfs support. It depends on external data * XFS wrapper structure for sysfs support. It depends on external data
* structures and is embedded in various internal data structures to implement * structures and is embedded in various internal data structures to implement
......
...@@ -1678,7 +1678,7 @@ xlog_bdstrat( ...@@ -1678,7 +1678,7 @@ xlog_bdstrat(
if (iclog->ic_state & XLOG_STATE_IOERROR) { if (iclog->ic_state & XLOG_STATE_IOERROR) {
xfs_buf_ioerror(bp, -EIO); xfs_buf_ioerror(bp, -EIO);
xfs_buf_stale(bp); xfs_buf_stale(bp);
xfs_buf_ioend(bp, 0); xfs_buf_ioend(bp);
/* /*
* It would seem logical to return EIO here, but we rely on * It would seem logical to return EIO here, but we rely on
* the log state machine to propagate I/O errors instead of * the log state machine to propagate I/O errors instead of
...@@ -1688,7 +1688,7 @@ xlog_bdstrat( ...@@ -1688,7 +1688,7 @@ xlog_bdstrat(
return 0; return 0;
} }
xfs_buf_iorequest(bp); xfs_buf_submit(bp);
return 0; return 0;
} }
...@@ -3867,18 +3867,17 @@ xlog_state_ioerror( ...@@ -3867,18 +3867,17 @@ xlog_state_ioerror(
* This is called from xfs_force_shutdown, when we're forcibly * This is called from xfs_force_shutdown, when we're forcibly
* shutting down the filesystem, typically because of an IO error. * shutting down the filesystem, typically because of an IO error.
* Our main objectives here are to make sure that: * Our main objectives here are to make sure that:
* a. the filesystem gets marked 'SHUTDOWN' for all interested * a. if !logerror, flush the logs to disk. Anything modified
* after this is ignored.
* b. the filesystem gets marked 'SHUTDOWN' for all interested
* parties to find out, 'atomically'. * parties to find out, 'atomically'.
* b. those who're sleeping on log reservations, pinned objects and * c. those who're sleeping on log reservations, pinned objects and
* other resources get woken up, and be told the bad news. * other resources get woken up, and be told the bad news.
* c. nothing new gets queued up after (a) and (b) are done. * d. nothing new gets queued up after (b) and (c) are done.
* d. if !logerror, flush the iclogs to disk, then seal them off
* for business.
* *
* Note: for delayed logging the !logerror case needs to flush the regions * Note: for the !logerror case we need to flush the regions held in memory out
* held in memory out to the iclogs before flushing them to disk. This needs * to disk first. This needs to be done before the log is marked as shutdown,
* to be done before the log is marked as shutdown, otherwise the flush to the * otherwise the iclog writes will fail.
* iclogs will fail.
*/ */
int int
xfs_log_force_umount( xfs_log_force_umount(
...@@ -3910,16 +3909,16 @@ xfs_log_force_umount( ...@@ -3910,16 +3909,16 @@ xfs_log_force_umount(
ASSERT(XLOG_FORCED_SHUTDOWN(log)); ASSERT(XLOG_FORCED_SHUTDOWN(log));
return 1; return 1;
} }
retval = 0;
/* /*
* Flush the in memory commit item list before marking the log as * Flush all the completed transactions to disk before marking the log
* being shut down. We need to do it in this order to ensure all the * being shut down. We need to do it in this order to ensure that
* completed transactions are flushed to disk with the xfs_log_force() * completed operations are safely on disk before we shut down, and that
* call below. * we don't have to issue any buffer IO after the shutdown flags are set
* to guarantee this.
*/ */
if (!logerror) if (!logerror)
xlog_cil_force(log); _xfs_log_force(mp, XFS_LOG_SYNC, NULL);
/* /*
* mark the filesystem and the log as in a shutdown state and wake * mark the filesystem and the log as in a shutdown state and wake
...@@ -3931,17 +3930,10 @@ xfs_log_force_umount( ...@@ -3931,17 +3930,10 @@ xfs_log_force_umount(
XFS_BUF_DONE(mp->m_sb_bp); XFS_BUF_DONE(mp->m_sb_bp);
/* /*
* This flag is sort of redundant because of the mount flag, but * Mark the log and the iclogs with IO error flags to prevent any
* it's good to maintain the separation between the log and the rest * further log IO from being issued or completed.
* of XFS.
*/ */
log->l_flags |= XLOG_IO_ERROR; log->l_flags |= XLOG_IO_ERROR;
/*
* If we hit a log error, we want to mark all the iclogs IOERROR
* while we're still holding the loglock.
*/
if (logerror)
retval = xlog_state_ioerror(log); retval = xlog_state_ioerror(log);
spin_unlock(&log->l_icloglock); spin_unlock(&log->l_icloglock);
...@@ -3955,19 +3947,6 @@ xfs_log_force_umount( ...@@ -3955,19 +3947,6 @@ xfs_log_force_umount(
xlog_grant_head_wake_all(&log->l_reserve_head); xlog_grant_head_wake_all(&log->l_reserve_head);
xlog_grant_head_wake_all(&log->l_write_head); xlog_grant_head_wake_all(&log->l_write_head);
if (!(log->l_iclog->ic_state & XLOG_STATE_IOERROR)) {
ASSERT(!logerror);
/*
* Force the incore logs to disk before shutting the
* log down completely.
*/
_xfs_log_force(mp, XFS_LOG_SYNC, NULL);
spin_lock(&log->l_icloglock);
retval = xlog_state_ioerror(log);
spin_unlock(&log->l_icloglock);
}
/* /*
* Wake up everybody waiting on xfs_log_force. Wake the CIL push first * Wake up everybody waiting on xfs_log_force. Wake the CIL push first
* as if the log writes were completed. The abort handling in the log * as if the log writes were completed. The abort handling in the log
......
...@@ -463,12 +463,40 @@ xlog_cil_push( ...@@ -463,12 +463,40 @@ xlog_cil_push(
spin_unlock(&cil->xc_push_lock); spin_unlock(&cil->xc_push_lock);
goto out_skip; goto out_skip;
} }
spin_unlock(&cil->xc_push_lock);
/* check for a previously pushed sequence */ /* check for a previously pushed sequence */
if (push_seq < cil->xc_ctx->sequence) if (push_seq < cil->xc_ctx->sequence) {
spin_unlock(&cil->xc_push_lock);
goto out_skip; goto out_skip;
}
/*
* We are now going to push this context, so add it to the committing
* list before we do anything else. This ensures that anyone waiting on
* this push can easily detect the difference between a "push in
* progress" and "CIL is empty, nothing to do".
*
* IOWs, a wait loop can now check for:
* the current sequence not being found on the committing list;
* an empty CIL; and
* an unchanged sequence number
* to detect a push that had nothing to do and therefore does not need
* waiting on. If the CIL is not empty, we get put on the committing
* list before emptying the CIL and bumping the sequence number. Hence
* an empty CIL and an unchanged sequence number means we jumped out
* above after doing nothing.
*
* Hence the waiter will either find the commit sequence on the
* committing list or the sequence number will be unchanged and the CIL
* still dirty. In that latter case, the push has not yet started, and
* so the waiter will have to continue trying to check the CIL
* committing list until it is found. In extreme cases of delay, the
* sequence may fully commit between the attempts the wait makes to wait
* on the commit sequence.
*/
list_add(&ctx->committing, &cil->xc_committing);
spin_unlock(&cil->xc_push_lock);
/* /*
* pull all the log vectors off the items in the CIL, and * pull all the log vectors off the items in the CIL, and
...@@ -532,7 +560,6 @@ xlog_cil_push( ...@@ -532,7 +560,6 @@ xlog_cil_push(
*/ */
spin_lock(&cil->xc_push_lock); spin_lock(&cil->xc_push_lock);
cil->xc_current_sequence = new_ctx->sequence; cil->xc_current_sequence = new_ctx->sequence;
list_add(&ctx->committing, &cil->xc_committing);
spin_unlock(&cil->xc_push_lock); spin_unlock(&cil->xc_push_lock);
up_write(&cil->xc_ctx_lock); up_write(&cil->xc_ctx_lock);
...@@ -855,13 +882,15 @@ xlog_cil_force_lsn( ...@@ -855,13 +882,15 @@ xlog_cil_force_lsn(
* Hence by the time we have got here our sequence may not have been * Hence by the time we have got here our sequence may not have been
* pushed yet. This is true if the current sequence still matches the * pushed yet. This is true if the current sequence still matches the
* push sequence after the above wait loop and the CIL still contains * push sequence after the above wait loop and the CIL still contains
* dirty objects. * dirty objects. This is guaranteed by the push code first adding the
* context to the committing list before emptying the CIL.
* *
* When the push occurs, it will empty the CIL and atomically increment * Hence if we don't find the context in the committing list and the
* the current sequence past the push sequence and move it into the * current sequence number is unchanged then the CIL contents are
* committing list. Of course, if the CIL is clean at the time of the * significant. If the CIL is empty, it means there was nothing to push
* push, it won't have pushed the CIL at all, so in that case we should * and that means there is nothing to wait for. If the CIL is not empty,
* try the push for this sequence again from the start just in case. * it means we haven't yet started the push, because if it had started
* we would have found the context on the committing list.
*/ */
if (sequence == cil->xc_current_sequence && if (sequence == cil->xc_current_sequence &&
!list_empty(&cil->xc_cil)) { !list_empty(&cil->xc_cil)) {
......
This diff is collapsed.
...@@ -61,8 +61,6 @@ static DEFINE_MUTEX(xfs_uuid_table_mutex); ...@@ -61,8 +61,6 @@ static DEFINE_MUTEX(xfs_uuid_table_mutex);
static int xfs_uuid_table_size; static int xfs_uuid_table_size;
static uuid_t *xfs_uuid_table; static uuid_t *xfs_uuid_table;
extern struct kset *xfs_kset;
/* /*
* See if the UUID is unique among mounted XFS filesystems. * See if the UUID is unique among mounted XFS filesystems.
* Mount fails if UUID is nil or a FS with the same UUID is already mounted. * Mount fails if UUID is nil or a FS with the same UUID is already mounted.
...@@ -302,21 +300,15 @@ xfs_readsb( ...@@ -302,21 +300,15 @@ xfs_readsb(
* access to the superblock. * access to the superblock.
*/ */
reread: reread:
bp = xfs_buf_read_uncached(mp->m_ddev_targp, XFS_SB_DADDR, error = xfs_buf_read_uncached(mp->m_ddev_targp, XFS_SB_DADDR,
BTOBB(sector_size), 0, buf_ops); BTOBB(sector_size), 0, &bp, buf_ops);
if (!bp) { if (error) {
if (loud)
xfs_warn(mp, "SB buffer read failed");
return -EIO;
}
if (bp->b_error) {
error = bp->b_error;
if (loud) if (loud)
xfs_warn(mp, "SB validate failed with error %d.", error); xfs_warn(mp, "SB validate failed with error %d.", error);
/* bad CRC means corrupted metadata */ /* bad CRC means corrupted metadata */
if (error == -EFSBADCRC) if (error == -EFSBADCRC)
error = -EFSCORRUPTED; error = -EFSCORRUPTED;
goto release_buf; return error;
} }
/* /*
...@@ -546,40 +538,43 @@ xfs_set_inoalignment(xfs_mount_t *mp) ...@@ -546,40 +538,43 @@ xfs_set_inoalignment(xfs_mount_t *mp)
* Check that the data (and log if separate) is an ok size. * Check that the data (and log if separate) is an ok size.
*/ */
STATIC int STATIC int
xfs_check_sizes(xfs_mount_t *mp) xfs_check_sizes(
struct xfs_mount *mp)
{ {
xfs_buf_t *bp; struct xfs_buf *bp;
xfs_daddr_t d; xfs_daddr_t d;
int error;
d = (xfs_daddr_t)XFS_FSB_TO_BB(mp, mp->m_sb.sb_dblocks); d = (xfs_daddr_t)XFS_FSB_TO_BB(mp, mp->m_sb.sb_dblocks);
if (XFS_BB_TO_FSB(mp, d) != mp->m_sb.sb_dblocks) { if (XFS_BB_TO_FSB(mp, d) != mp->m_sb.sb_dblocks) {
xfs_warn(mp, "filesystem size mismatch detected"); xfs_warn(mp, "filesystem size mismatch detected");
return -EFBIG; return -EFBIG;
} }
bp = xfs_buf_read_uncached(mp->m_ddev_targp, error = xfs_buf_read_uncached(mp->m_ddev_targp,
d - XFS_FSS_TO_BB(mp, 1), d - XFS_FSS_TO_BB(mp, 1),
XFS_FSS_TO_BB(mp, 1), 0, NULL); XFS_FSS_TO_BB(mp, 1), 0, &bp, NULL);
if (!bp) { if (error) {
xfs_warn(mp, "last sector read failed"); xfs_warn(mp, "last sector read failed");
return -EIO; return error;
} }
xfs_buf_relse(bp); xfs_buf_relse(bp);
if (mp->m_logdev_targp != mp->m_ddev_targp) { if (mp->m_logdev_targp == mp->m_ddev_targp)
return 0;
d = (xfs_daddr_t)XFS_FSB_TO_BB(mp, mp->m_sb.sb_logblocks); d = (xfs_daddr_t)XFS_FSB_TO_BB(mp, mp->m_sb.sb_logblocks);
if (XFS_BB_TO_FSB(mp, d) != mp->m_sb.sb_logblocks) { if (XFS_BB_TO_FSB(mp, d) != mp->m_sb.sb_logblocks) {
xfs_warn(mp, "log size mismatch detected"); xfs_warn(mp, "log size mismatch detected");
return -EFBIG; return -EFBIG;
} }
bp = xfs_buf_read_uncached(mp->m_logdev_targp, error = xfs_buf_read_uncached(mp->m_logdev_targp,
d - XFS_FSB_TO_BB(mp, 1), d - XFS_FSB_TO_BB(mp, 1),
XFS_FSB_TO_BB(mp, 1), 0, NULL); XFS_FSB_TO_BB(mp, 1), 0, &bp, NULL);
if (!bp) { if (error) {
xfs_warn(mp, "log device read failed"); xfs_warn(mp, "log device read failed");
return -EIO; return error;
} }
xfs_buf_relse(bp); xfs_buf_relse(bp);
}
return 0; return 0;
} }
...@@ -729,7 +724,6 @@ xfs_mountfs( ...@@ -729,7 +724,6 @@ xfs_mountfs(
xfs_set_maxicount(mp); xfs_set_maxicount(mp);
mp->m_kobj.kobject.kset = xfs_kset;
error = xfs_sysfs_init(&mp->m_kobj, &xfs_mp_ktype, NULL, mp->m_fsname); error = xfs_sysfs_init(&mp->m_kobj, &xfs_mp_ktype, NULL, mp->m_fsname);
if (error) if (error)
goto out; goto out;
......
...@@ -304,7 +304,8 @@ _xfs_mru_cache_reap( ...@@ -304,7 +304,8 @@ _xfs_mru_cache_reap(
int int
xfs_mru_cache_init(void) xfs_mru_cache_init(void)
{ {
xfs_mru_reap_wq = alloc_workqueue("xfs_mru_cache", WQ_MEM_RECLAIM, 1); xfs_mru_reap_wq = alloc_workqueue("xfs_mru_cache",
WQ_MEM_RECLAIM|WQ_FREEZABLE, 1);
if (!xfs_mru_reap_wq) if (!xfs_mru_reap_wq)
return -ENOMEM; return -ENOMEM;
return 0; return 0;
......
...@@ -434,6 +434,7 @@ xfs_qm_dquot_isolate( ...@@ -434,6 +434,7 @@ xfs_qm_dquot_isolate(
struct list_head *item, struct list_head *item,
spinlock_t *lru_lock, spinlock_t *lru_lock,
void *arg) void *arg)
__releases(lru_lock) __acquires(lru_lock)
{ {
struct xfs_dquot *dqp = container_of(item, struct xfs_dquot *dqp = container_of(item,
struct xfs_dquot, q_lru); struct xfs_dquot, q_lru);
......
...@@ -46,7 +46,7 @@ ...@@ -46,7 +46,7 @@
* Keeps track of a current summary block, so we don't keep reading * Keeps track of a current summary block, so we don't keep reading
* it from the buffer cache. * it from the buffer cache.
*/ */
STATIC int /* error */ static int
xfs_rtget_summary( xfs_rtget_summary(
xfs_mount_t *mp, /* file system mount structure */ xfs_mount_t *mp, /* file system mount structure */
xfs_trans_t *tp, /* transaction pointer */ xfs_trans_t *tp, /* transaction pointer */
...@@ -56,60 +56,9 @@ xfs_rtget_summary( ...@@ -56,60 +56,9 @@ xfs_rtget_summary(
xfs_fsblock_t *rsb, /* in/out: summary block number */ xfs_fsblock_t *rsb, /* in/out: summary block number */
xfs_suminfo_t *sum) /* out: summary info for this block */ xfs_suminfo_t *sum) /* out: summary info for this block */
{ {
xfs_buf_t *bp; /* buffer for summary block */ return xfs_rtmodify_summary_int(mp, tp, log, bbno, 0, rbpp, rsb, sum);
int error; /* error value */
xfs_fsblock_t sb; /* summary fsblock */
int so; /* index into the summary file */
xfs_suminfo_t *sp; /* pointer to returned data */
/*
* Compute entry number in the summary file.
*/
so = XFS_SUMOFFS(mp, log, bbno);
/*
* Compute the block number in the summary file.
*/
sb = XFS_SUMOFFSTOBLOCK(mp, so);
/*
* If we have an old buffer, and the block number matches, use that.
*/
if (rbpp && *rbpp && *rsb == sb)
bp = *rbpp;
/*
* Otherwise we have to get the buffer.
*/
else {
/*
* If there was an old one, get rid of it first.
*/
if (rbpp && *rbpp)
xfs_trans_brelse(tp, *rbpp);
error = xfs_rtbuf_get(mp, tp, sb, 1, &bp);
if (error) {
return error;
}
/*
* Remember this buffer and block for the next call.
*/
if (rbpp) {
*rbpp = bp;
*rsb = sb;
}
}
/*
* Point to the summary information & copy it out.
*/
sp = XFS_SUMPTR(mp, bp, so);
*sum = *sp;
/*
* Drop the buffer if we're not asked to remember it.
*/
if (!rbpp)
xfs_trans_brelse(tp, bp);
return 0;
} }
/* /*
* Return whether there are any free extents in the size range given * Return whether there are any free extents in the size range given
* by low and high, for the bitmap block bbno. * by low and high, for the bitmap block bbno.
...@@ -972,16 +921,11 @@ xfs_growfs_rt( ...@@ -972,16 +921,11 @@ xfs_growfs_rt(
/* /*
* Read in the last block of the device, make sure it exists. * Read in the last block of the device, make sure it exists.
*/ */
bp = xfs_buf_read_uncached(mp->m_rtdev_targp, error = xfs_buf_read_uncached(mp->m_rtdev_targp,
XFS_FSB_TO_BB(mp, nrblocks - 1), XFS_FSB_TO_BB(mp, nrblocks - 1),
XFS_FSB_TO_BB(mp, 1), 0, NULL); XFS_FSB_TO_BB(mp, 1), 0, &bp, NULL);
if (!bp) if (error)
return -EIO;
if (bp->b_error) {
error = bp->b_error;
xfs_buf_relse(bp);
return error; return error;
}
xfs_buf_relse(bp); xfs_buf_relse(bp);
/* /*
...@@ -1235,11 +1179,12 @@ xfs_rtallocate_extent( ...@@ -1235,11 +1179,12 @@ xfs_rtallocate_extent(
*/ */
int /* error */ int /* error */
xfs_rtmount_init( xfs_rtmount_init(
xfs_mount_t *mp) /* file system mount structure */ struct xfs_mount *mp) /* file system mount structure */
{ {
xfs_buf_t *bp; /* buffer for last block of subvolume */ struct xfs_buf *bp; /* buffer for last block of subvolume */
struct xfs_sb *sbp; /* filesystem superblock copy in mount */
xfs_daddr_t d; /* address of last block of subvolume */ xfs_daddr_t d; /* address of last block of subvolume */
xfs_sb_t *sbp; /* filesystem superblock copy in mount */ int error;
sbp = &mp->m_sb; sbp = &mp->m_sb;
if (sbp->sb_rblocks == 0) if (sbp->sb_rblocks == 0)
...@@ -1265,14 +1210,12 @@ xfs_rtmount_init( ...@@ -1265,14 +1210,12 @@ xfs_rtmount_init(
(unsigned long long) mp->m_sb.sb_rblocks); (unsigned long long) mp->m_sb.sb_rblocks);
return -EFBIG; return -EFBIG;
} }
bp = xfs_buf_read_uncached(mp->m_rtdev_targp, error = xfs_buf_read_uncached(mp->m_rtdev_targp,
d - XFS_FSB_TO_BB(mp, 1), d - XFS_FSB_TO_BB(mp, 1),
XFS_FSB_TO_BB(mp, 1), 0, NULL); XFS_FSB_TO_BB(mp, 1), 0, &bp, NULL);
if (!bp || bp->b_error) { if (error) {
xfs_warn(mp, "realtime device size check failed"); xfs_warn(mp, "realtime device size check failed");
if (bp) return error;
xfs_buf_relse(bp);
return -EIO;
} }
xfs_buf_relse(bp); xfs_buf_relse(bp);
return 0; return 0;
......
...@@ -111,6 +111,10 @@ int xfs_rtfind_forw(struct xfs_mount *mp, struct xfs_trans *tp, ...@@ -111,6 +111,10 @@ int xfs_rtfind_forw(struct xfs_mount *mp, struct xfs_trans *tp,
xfs_rtblock_t *rtblock); xfs_rtblock_t *rtblock);
int xfs_rtmodify_range(struct xfs_mount *mp, struct xfs_trans *tp, int xfs_rtmodify_range(struct xfs_mount *mp, struct xfs_trans *tp,
xfs_rtblock_t start, xfs_extlen_t len, int val); xfs_rtblock_t start, xfs_extlen_t len, int val);
int xfs_rtmodify_summary_int(struct xfs_mount *mp, struct xfs_trans *tp,
int log, xfs_rtblock_t bbno, int delta,
xfs_buf_t **rbpp, xfs_fsblock_t *rsb,
xfs_suminfo_t *sum);
int xfs_rtmodify_summary(struct xfs_mount *mp, struct xfs_trans *tp, int log, int xfs_rtmodify_summary(struct xfs_mount *mp, struct xfs_trans *tp, int log,
xfs_rtblock_t bbno, int delta, xfs_buf_t **rbpp, xfs_rtblock_t bbno, int delta, xfs_buf_t **rbpp,
xfs_fsblock_t *rsb); xfs_fsblock_t *rsb);
......
...@@ -47,6 +47,7 @@ ...@@ -47,6 +47,7 @@
#include "xfs_dinode.h" #include "xfs_dinode.h"
#include "xfs_filestream.h" #include "xfs_filestream.h"
#include "xfs_quota.h" #include "xfs_quota.h"
#include "xfs_sysfs.h"
#include <linux/namei.h> #include <linux/namei.h>
#include <linux/init.h> #include <linux/init.h>
...@@ -61,7 +62,11 @@ ...@@ -61,7 +62,11 @@
static const struct super_operations xfs_super_operations; static const struct super_operations xfs_super_operations;
static kmem_zone_t *xfs_ioend_zone; static kmem_zone_t *xfs_ioend_zone;
mempool_t *xfs_ioend_pool; mempool_t *xfs_ioend_pool;
struct kset *xfs_kset;
static struct kset *xfs_kset; /* top-level xfs sysfs dir */
#ifdef DEBUG
static struct xfs_kobj xfs_dbg_kobj; /* global debug sysfs attrs */
#endif
#define MNTOPT_LOGBUFS "logbufs" /* number of XFS log buffers */ #define MNTOPT_LOGBUFS "logbufs" /* number of XFS log buffers */
#define MNTOPT_LOGBSIZE "logbsize" /* size of XFS log buffers */ #define MNTOPT_LOGBSIZE "logbsize" /* size of XFS log buffers */
...@@ -838,32 +843,32 @@ xfs_init_mount_workqueues( ...@@ -838,32 +843,32 @@ xfs_init_mount_workqueues(
struct xfs_mount *mp) struct xfs_mount *mp)
{ {
mp->m_data_workqueue = alloc_workqueue("xfs-data/%s", mp->m_data_workqueue = alloc_workqueue("xfs-data/%s",
WQ_MEM_RECLAIM, 0, mp->m_fsname); WQ_MEM_RECLAIM|WQ_FREEZABLE, 0, mp->m_fsname);
if (!mp->m_data_workqueue) if (!mp->m_data_workqueue)
goto out; goto out;
mp->m_unwritten_workqueue = alloc_workqueue("xfs-conv/%s", mp->m_unwritten_workqueue = alloc_workqueue("xfs-conv/%s",
WQ_MEM_RECLAIM, 0, mp->m_fsname); WQ_MEM_RECLAIM|WQ_FREEZABLE, 0, mp->m_fsname);
if (!mp->m_unwritten_workqueue) if (!mp->m_unwritten_workqueue)
goto out_destroy_data_iodone_queue; goto out_destroy_data_iodone_queue;
mp->m_cil_workqueue = alloc_workqueue("xfs-cil/%s", mp->m_cil_workqueue = alloc_workqueue("xfs-cil/%s",
WQ_MEM_RECLAIM, 0, mp->m_fsname); WQ_MEM_RECLAIM|WQ_FREEZABLE, 0, mp->m_fsname);
if (!mp->m_cil_workqueue) if (!mp->m_cil_workqueue)
goto out_destroy_unwritten; goto out_destroy_unwritten;
mp->m_reclaim_workqueue = alloc_workqueue("xfs-reclaim/%s", mp->m_reclaim_workqueue = alloc_workqueue("xfs-reclaim/%s",
0, 0, mp->m_fsname); WQ_FREEZABLE, 0, mp->m_fsname);
if (!mp->m_reclaim_workqueue) if (!mp->m_reclaim_workqueue)
goto out_destroy_cil; goto out_destroy_cil;
mp->m_log_workqueue = alloc_workqueue("xfs-log/%s", mp->m_log_workqueue = alloc_workqueue("xfs-log/%s",
0, 0, mp->m_fsname); WQ_FREEZABLE, 0, mp->m_fsname);
if (!mp->m_log_workqueue) if (!mp->m_log_workqueue)
goto out_destroy_reclaim; goto out_destroy_reclaim;
mp->m_eofblocks_workqueue = alloc_workqueue("xfs-eofblocks/%s", mp->m_eofblocks_workqueue = alloc_workqueue("xfs-eofblocks/%s",
0, 0, mp->m_fsname); WQ_FREEZABLE, 0, mp->m_fsname);
if (!mp->m_eofblocks_workqueue) if (!mp->m_eofblocks_workqueue)
goto out_destroy_log; goto out_destroy_log;
...@@ -1406,6 +1411,7 @@ xfs_fs_fill_super( ...@@ -1406,6 +1411,7 @@ xfs_fs_fill_super(
atomic_set(&mp->m_active_trans, 0); atomic_set(&mp->m_active_trans, 0);
INIT_DELAYED_WORK(&mp->m_reclaim_work, xfs_reclaim_worker); INIT_DELAYED_WORK(&mp->m_reclaim_work, xfs_reclaim_worker);
INIT_DELAYED_WORK(&mp->m_eofblocks_work, xfs_eofblocks_worker); INIT_DELAYED_WORK(&mp->m_eofblocks_work, xfs_eofblocks_worker);
mp->m_kobj.kobject.kset = xfs_kset;
mp->m_super = sb; mp->m_super = sb;
sb->s_fs_info = mp; sb->s_fs_info = mp;
...@@ -1715,7 +1721,8 @@ xfs_init_workqueues(void) ...@@ -1715,7 +1721,8 @@ xfs_init_workqueues(void)
* AGs in all the filesystems mounted. Hence use the default large * AGs in all the filesystems mounted. Hence use the default large
* max_active value for this workqueue. * max_active value for this workqueue.
*/ */
xfs_alloc_wq = alloc_workqueue("xfsalloc", WQ_MEM_RECLAIM, 0); xfs_alloc_wq = alloc_workqueue("xfsalloc",
WQ_MEM_RECLAIM|WQ_FREEZABLE, 0);
if (!xfs_alloc_wq) if (!xfs_alloc_wq)
return -ENOMEM; return -ENOMEM;
...@@ -1768,9 +1775,16 @@ init_xfs_fs(void) ...@@ -1768,9 +1775,16 @@ init_xfs_fs(void)
goto out_sysctl_unregister;; goto out_sysctl_unregister;;
} }
error = xfs_qm_init(); #ifdef DEBUG
xfs_dbg_kobj.kobject.kset = xfs_kset;
error = xfs_sysfs_init(&xfs_dbg_kobj, &xfs_dbg_ktype, NULL, "debug");
if (error) if (error)
goto out_kset_unregister; goto out_kset_unregister;
#endif
error = xfs_qm_init();
if (error)
goto out_remove_kobj;
error = register_filesystem(&xfs_fs_type); error = register_filesystem(&xfs_fs_type);
if (error) if (error)
...@@ -1779,7 +1793,11 @@ init_xfs_fs(void) ...@@ -1779,7 +1793,11 @@ init_xfs_fs(void)
out_qm_exit: out_qm_exit:
xfs_qm_exit(); xfs_qm_exit();
out_remove_kobj:
#ifdef DEBUG
xfs_sysfs_del(&xfs_dbg_kobj);
out_kset_unregister: out_kset_unregister:
#endif
kset_unregister(xfs_kset); kset_unregister(xfs_kset);
out_sysctl_unregister: out_sysctl_unregister:
xfs_sysctl_unregister(); xfs_sysctl_unregister();
...@@ -1802,6 +1820,9 @@ exit_xfs_fs(void) ...@@ -1802,6 +1820,9 @@ exit_xfs_fs(void)
{ {
xfs_qm_exit(); xfs_qm_exit();
unregister_filesystem(&xfs_fs_type); unregister_filesystem(&xfs_fs_type);
#ifdef DEBUG
xfs_sysfs_del(&xfs_dbg_kobj);
#endif
kset_unregister(xfs_kset); kset_unregister(xfs_kset);
xfs_sysctl_unregister(); xfs_sysctl_unregister();
xfs_cleanup_procfs(); xfs_cleanup_procfs();
......
...@@ -269,9 +269,11 @@ xfs_symlink( ...@@ -269,9 +269,11 @@ xfs_symlink(
/* /*
* Check for ability to enter directory entry, if no space reserved. * Check for ability to enter directory entry, if no space reserved.
*/ */
error = xfs_dir_canenter(tp, dp, link_name, resblks); if (!resblks) {
error = xfs_dir_canenter(tp, dp, link_name);
if (error) if (error)
goto error_return; goto error_return;
}
/* /*
* Initialize the bmap freelist prior to calling either * Initialize the bmap freelist prior to calling either
* bmapi or the directory create code. * bmapi or the directory create code.
......
...@@ -92,6 +92,11 @@ enum { ...@@ -92,6 +92,11 @@ enum {
extern xfs_param_t xfs_params; extern xfs_param_t xfs_params;
struct xfs_globals {
int log_recovery_delay; /* log recovery delay (secs) */
};
extern struct xfs_globals xfs_globals;
#ifdef CONFIG_SYSCTL #ifdef CONFIG_SYSCTL
extern int xfs_sysctl_register(void); extern int xfs_sysctl_register(void);
extern void xfs_sysctl_unregister(void); extern void xfs_sysctl_unregister(void);
......
...@@ -51,6 +51,80 @@ struct kobj_type xfs_mp_ktype = { ...@@ -51,6 +51,80 @@ struct kobj_type xfs_mp_ktype = {
.release = xfs_sysfs_release, .release = xfs_sysfs_release,
}; };
#ifdef DEBUG
/* debug */
STATIC ssize_t
log_recovery_delay_store(
const char *buf,
size_t count,
void *data)
{
int ret;
int val;
ret = kstrtoint(buf, 0, &val);
if (ret)
return ret;
if (val < 0 || val > 60)
return -EINVAL;
xfs_globals.log_recovery_delay = val;
return count;
}
STATIC ssize_t
log_recovery_delay_show(
char *buf,
void *data)
{
return snprintf(buf, PAGE_SIZE, "%d\n", xfs_globals.log_recovery_delay);
}
XFS_SYSFS_ATTR_RW(log_recovery_delay);
static struct attribute *xfs_dbg_attrs[] = {
ATTR_LIST(log_recovery_delay),
NULL,
};
STATIC ssize_t
xfs_dbg_show(
struct kobject *kobject,
struct attribute *attr,
char *buf)
{
struct xfs_sysfs_attr *xfs_attr = to_attr(attr);
return xfs_attr->show ? xfs_attr->show(buf, NULL) : 0;
}
STATIC ssize_t
xfs_dbg_store(
struct kobject *kobject,
struct attribute *attr,
const char *buf,
size_t count)
{
struct xfs_sysfs_attr *xfs_attr = to_attr(attr);
return xfs_attr->store ? xfs_attr->store(buf, count, NULL) : 0;
}
static struct sysfs_ops xfs_dbg_ops = {
.show = xfs_dbg_show,
.store = xfs_dbg_store,
};
struct kobj_type xfs_dbg_ktype = {
.release = xfs_sysfs_release,
.sysfs_ops = &xfs_dbg_ops,
.default_attrs = xfs_dbg_attrs,
};
#endif /* DEBUG */
/* xlog */ /* xlog */
STATIC ssize_t STATIC ssize_t
......
...@@ -20,6 +20,7 @@ ...@@ -20,6 +20,7 @@
#define __XFS_SYSFS_H__ #define __XFS_SYSFS_H__
extern struct kobj_type xfs_mp_ktype; /* xfs_mount */ extern struct kobj_type xfs_mp_ktype; /* xfs_mount */
extern struct kobj_type xfs_dbg_ktype; /* debug */
extern struct kobj_type xfs_log_ktype; /* xlog */ extern struct kobj_type xfs_log_ktype; /* xlog */
static inline struct xfs_kobj * static inline struct xfs_kobj *
......
...@@ -349,7 +349,8 @@ DEFINE_BUF_EVENT(xfs_buf_free); ...@@ -349,7 +349,8 @@ DEFINE_BUF_EVENT(xfs_buf_free);
DEFINE_BUF_EVENT(xfs_buf_hold); DEFINE_BUF_EVENT(xfs_buf_hold);
DEFINE_BUF_EVENT(xfs_buf_rele); DEFINE_BUF_EVENT(xfs_buf_rele);
DEFINE_BUF_EVENT(xfs_buf_iodone); DEFINE_BUF_EVENT(xfs_buf_iodone);
DEFINE_BUF_EVENT(xfs_buf_iorequest); DEFINE_BUF_EVENT(xfs_buf_submit);
DEFINE_BUF_EVENT(xfs_buf_submit_wait);
DEFINE_BUF_EVENT(xfs_buf_bawrite); DEFINE_BUF_EVENT(xfs_buf_bawrite);
DEFINE_BUF_EVENT(xfs_buf_lock); DEFINE_BUF_EVENT(xfs_buf_lock);
DEFINE_BUF_EVENT(xfs_buf_lock_done); DEFINE_BUF_EVENT(xfs_buf_lock_done);
......
...@@ -318,19 +318,9 @@ xfs_trans_read_buf_map( ...@@ -318,19 +318,9 @@ xfs_trans_read_buf_map(
XFS_BUF_READ(bp); XFS_BUF_READ(bp);
bp->b_ops = ops; bp->b_ops = ops;
/* error = xfs_buf_submit_wait(bp);
* XXX(hch): clean up the error handling here to be less
* of a mess..
*/
if (XFS_FORCED_SHUTDOWN(mp)) {
trace_xfs_bdstrat_shut(bp, _RET_IP_);
xfs_bioerror_relse(bp);
} else {
xfs_buf_iorequest(bp);
}
error = xfs_buf_iowait(bp);
if (error) { if (error) {
if (!XFS_FORCED_SHUTDOWN(mp))
xfs_buf_ioerror_alert(bp, __func__); xfs_buf_ioerror_alert(bp, __func__);
xfs_buf_relse(bp); xfs_buf_relse(bp);
/* /*
......
...@@ -70,7 +70,7 @@ xfs_trans_ichgtime( ...@@ -70,7 +70,7 @@ xfs_trans_ichgtime(
int flags) int flags)
{ {
struct inode *inode = VFS_I(ip); struct inode *inode = VFS_I(ip);
timespec_t tv; struct timespec tv;
ASSERT(tp); ASSERT(tp);
ASSERT(xfs_isilocked(ip, XFS_ILOCK_EXCL)); ASSERT(xfs_isilocked(ip, XFS_ILOCK_EXCL));
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment