2005-04-16 22:20:36 +00:00
|
|
|
/*
|
2006-06-09 04:48:12 +00:00
|
|
|
* Copyright (c) 2000-2006 Silicon Graphics, Inc.
|
2005-11-02 03:58:39 +00:00
|
|
|
* All Rights Reserved.
|
2005-04-16 22:20:36 +00:00
|
|
|
*
|
2005-11-02 03:58:39 +00:00
|
|
|
* This program is free software; you can redistribute it and/or
|
|
|
|
* modify it under the terms of the GNU General Public License as
|
2005-04-16 22:20:36 +00:00
|
|
|
* published by the Free Software Foundation.
|
|
|
|
*
|
2005-11-02 03:58:39 +00:00
|
|
|
* This program is distributed in the hope that it would be useful,
|
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
* GNU General Public License for more details.
|
2005-04-16 22:20:36 +00:00
|
|
|
*
|
2005-11-02 03:58:39 +00:00
|
|
|
* You should have received a copy of the GNU General Public License
|
|
|
|
* along with this program; if not, write the Free Software Foundation,
|
|
|
|
* Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
|
2005-04-16 22:20:36 +00:00
|
|
|
*/
|
|
|
|
#ifndef __XFS_BMAP_H__
|
|
|
|
#define __XFS_BMAP_H__
|
|
|
|
|
|
|
|
struct getbmap;
|
|
|
|
struct xfs_bmbt_irec;
|
2006-03-14 02:29:52 +00:00
|
|
|
struct xfs_ifork;
|
2005-04-16 22:20:36 +00:00
|
|
|
struct xfs_inode;
|
|
|
|
struct xfs_mount;
|
|
|
|
struct xfs_trans;
|
|
|
|
|
2007-11-23 05:28:09 +00:00
|
|
|
extern kmem_zone_t *xfs_bmap_free_item_zone;
|
|
|
|
|
2015-01-08 23:46:49 +00:00
|
|
|
/*
|
|
|
|
* Argument structure for xfs_bmap_alloc.
|
|
|
|
*/
|
|
|
|
struct xfs_bmalloca {
|
|
|
|
xfs_fsblock_t *firstblock; /* i/o first block allocated */
|
2016-08-03 01:19:29 +00:00
|
|
|
struct xfs_defer_ops *dfops; /* bmap freelist */
|
2015-01-08 23:46:49 +00:00
|
|
|
struct xfs_trans *tp; /* transaction pointer */
|
|
|
|
struct xfs_inode *ip; /* incore inode pointer */
|
|
|
|
struct xfs_bmbt_irec prev; /* extent before the new one */
|
|
|
|
struct xfs_bmbt_irec got; /* extent after, or delayed */
|
|
|
|
|
|
|
|
xfs_fileoff_t offset; /* offset in file filling in */
|
|
|
|
xfs_extlen_t length; /* i/o length asked/allocated */
|
|
|
|
xfs_fsblock_t blkno; /* starting block of new extent */
|
|
|
|
|
|
|
|
struct xfs_btree_cur *cur; /* btree cursor */
|
|
|
|
xfs_extnum_t idx; /* current extent index */
|
|
|
|
int nallocs;/* number of extents alloc'd */
|
|
|
|
int logflags;/* flags for transaction logging */
|
|
|
|
|
|
|
|
xfs_extlen_t total; /* total blocks needed for xaction */
|
|
|
|
xfs_extlen_t minlen; /* minimum allocation size (blocks) */
|
|
|
|
xfs_extlen_t minleft; /* amount must be left after alloc */
|
|
|
|
bool eof; /* set if allocating past last extent */
|
|
|
|
bool wasdel; /* replacing a delayed allocation */
|
|
|
|
bool aeof; /* allocated space at eof */
|
|
|
|
bool conv; /* overwriting unwritten extents */
|
xfs: remote attribute blocks aren't really userdata
When adding a new remote attribute, we write the attribute to the
new extent before the allocation transaction is committed. This
means we cannot reuse busy extents as that violates crash
consistency semantics. Hence we currently treat remote attribute
extent allocation like userdata because it has the same overwrite
ordering constraints as userdata.
Unfortunately, this also allows the allocator to incorrectly apply
extent size hints to the remote attribute extent allocation. This
results in interesting failures, such as transaction block
reservation overruns and in-memory inode attribute fork corruption.
To fix this, we need to separate the busy extent reuse configuration
from the userdata configuration. This changes the definition of
XFS_BMAPI_METADATA slightly - it now means that allocation is
metadata and reuse of busy extents is acceptible due to the metadata
ordering semantics of the journal. If this flag is not set, it
means the allocation is that has unordered data writeback, and hence
busy extent reuse is not allowed. It no longer implies the
allocation is for user data, just that the data write will not be
strictly ordered. This matches the semantics for both user data
and remote attribute block allocation.
As such, This patch changes the "userdata" field to a "datatype"
field, and adds a "no busy reuse" flag to the field.
When we detect an unordered data extent allocation, we immediately set
the no reuse flag. We then set the "user data" flags based on the
inode fork we are allocating the extent to. Hence we only set
userdata flags on data fork allocations now and consider attribute
fork remote extents to be an unordered metadata extent.
The result is that remote attribute extents now have the expected
allocation semantics, and the data fork allocation behaviour is
completely unchanged.
It should be noted that there may be other ways to fix this (e.g.
use ordered metadata buffers for the remote attribute extent data
write) but they are more invasive and difficult to validate both
from a design and implementation POV. Hence this patch takes the
simple, obvious route to fixing the problem...
Reported-and-tested-by: Ross Zwisler <ross.zwisler@linux.intel.com>
Signed-off-by: Dave Chinner <dchinner@redhat.com>
Reviewed-by: Christoph Hellwig <hch@lst.de>
Signed-off-by: Dave Chinner <david@fromorbit.com>
2016-09-25 22:21:28 +00:00
|
|
|
int datatype;/* data type being allocated */
|
2015-01-08 23:46:49 +00:00
|
|
|
int flags;
|
|
|
|
};
|
|
|
|
|
2005-04-16 22:20:36 +00:00
|
|
|
/*
|
|
|
|
* List of extents to be free "later".
|
|
|
|
* The list is kept sorted on xbf_startblock.
|
|
|
|
*/
|
2016-08-03 01:18:10 +00:00
|
|
|
struct xfs_extent_free_item
|
2005-04-16 22:20:36 +00:00
|
|
|
{
|
2016-08-03 01:18:10 +00:00
|
|
|
xfs_fsblock_t xefi_startblock;/* starting fs block number */
|
|
|
|
xfs_extlen_t xefi_blockcount;/* number of blocks in extent */
|
|
|
|
struct list_head xefi_list;
|
2016-08-03 01:33:42 +00:00
|
|
|
struct xfs_owner_info xefi_oinfo; /* extent owner */
|
2016-06-21 01:53:28 +00:00
|
|
|
};
|
2005-04-16 22:20:36 +00:00
|
|
|
|
|
|
|
/*
 * NOTE(review): presumably the largest number of mappings a caller may ask
 * for through the nmap argument of xfs_bmapi_*; confirm against callers.
 */
#define	XFS_BMAP_MAX_NMAP	4
|
|
|
|
|
|
|
|
/*
 * Flags for xfs_bmapi_*
 */
#define XFS_BMAPI_ENTIRE	0x001	/* return entire extent, not trimmed */
#define XFS_BMAPI_METADATA	0x002	/* mapping metadata not user data */
#define XFS_BMAPI_ATTRFORK	0x004	/* use attribute fork not data */
#define XFS_BMAPI_PREALLOC	0x008	/* preallocation op: unwritten space */
#define XFS_BMAPI_IGSTATE	0x010	/* ignore state - combine contig. space */
#define XFS_BMAPI_CONTIG	0x020	/* must allocate only one extent */

/*
 * Unwritten extent conversion - this needs write cache flushing and no
 * additional allocation alignments.  When specified with XFS_BMAPI_PREALLOC
 * it converts from written to unwritten, otherwise it converts from
 * unwritten to written.
 */
#define XFS_BMAPI_CONVERT	0x040

/*
 * Allocate zeroed extents - this requires all newly allocated user data
 * extents to be initialised to zero.  It will be ignored if
 * XFS_BMAPI_METADATA is set.  Use in conjunction with XFS_BMAPI_CONVERT to
 * convert unwritten extents found during the allocation range to zeroed
 * written extents.
 */
#define XFS_BMAPI_ZERO		0x080

/*
 * Map the inode offset to the block given in ap->firstblock.  Primarily
 * used for reflink.  The range must be in a hole, and this flag cannot be
 * turned on with PREALLOC or CONVERT, and cannot be used on the attr fork.
 */
#define XFS_BMAPI_REMAP		0x100

/*
 * { flag, "name" } initializer pairs, one per XFS_BMAPI_* flag above.
 * NOTE(review): presumably consumed by trace-event flag printing; confirm.
 */
#define XFS_BMAPI_FLAGS \
	{ XFS_BMAPI_ENTIRE,	"ENTIRE" }, \
	{ XFS_BMAPI_METADATA,	"METADATA" }, \
	{ XFS_BMAPI_ATTRFORK,	"ATTRFORK" }, \
	{ XFS_BMAPI_PREALLOC,	"PREALLOC" }, \
	{ XFS_BMAPI_IGSTATE,	"IGSTATE" }, \
	{ XFS_BMAPI_CONTIG,	"CONTIG" }, \
	{ XFS_BMAPI_CONVERT,	"CONVERT" }, \
	{ XFS_BMAPI_ZERO,	"ZERO" }, \
	{ XFS_BMAPI_REMAP,	"REMAP" }
|
2009-12-14 23:14:59 +00:00
|
|
|
|
|
|
|
|
2005-11-02 03:38:42 +00:00
|
|
|
static inline int xfs_bmapi_aflag(int w)
|
|
|
|
{
|
|
|
|
return (w == XFS_ATTR_FORK ? XFS_BMAPI_ATTRFORK : 0);
|
|
|
|
}
|
2005-04-16 22:20:36 +00:00
|
|
|
|
|
|
|
/*
 * Special values for xfs_bmbt_irec_t br_startblock field.
 */
#define	DELAYSTARTBLOCK		((xfs_fsblock_t)-1LL)
#define	HOLESTARTBLOCK		((xfs_fsblock_t)-2LL)
|
|
|
|
|
2009-11-25 00:00:19 +00:00
|
|
|
/*
 * Flags for xfs_bmap_add_extent*.
 */
#define BMAP_LEFT_CONTIG	(1 << 0)
#define BMAP_RIGHT_CONTIG	(1 << 1)
#define BMAP_LEFT_FILLING	(1 << 2)
#define BMAP_RIGHT_FILLING	(1 << 3)
#define BMAP_LEFT_DELAY		(1 << 4)
#define BMAP_RIGHT_DELAY	(1 << 5)
#define BMAP_LEFT_VALID		(1 << 6)
#define BMAP_RIGHT_VALID	(1 << 7)
#define BMAP_ATTRFORK		(1 << 8)

/*
 * { flag, "name" } initializer pairs for a subset of the BMAP_* flags above;
 * the DELAY and VALID flags have no entry here.
 * NOTE(review): presumably consumed by trace-event flag printing; confirm.
 */
#define XFS_BMAP_EXT_FLAGS \
	{ BMAP_LEFT_CONTIG,	"LC" }, \
	{ BMAP_RIGHT_CONTIG,	"RC" }, \
	{ BMAP_LEFT_FILLING,	"LF" }, \
	{ BMAP_RIGHT_FILLING,	"RF" }, \
	{ BMAP_ATTRFORK,	"ATTR" }
|
2005-04-16 22:20:36 +00:00
|
|
|
|
2014-02-23 23:58:19 +00:00
|
|
|
|
|
|
|
/*
 * This macro is used to determine how many extents will be shifted
 * in one write transaction.  We could require two splits, an extent move
 * on the first and an extent merge on the second, so it is proper that
 * one extent is shifted inside a write transaction at a time.
 */
#define XFS_BMAP_MAX_SHIFT_EXTENTS	1
|
|
|
|
|
2015-03-25 04:08:56 +00:00
|
|
|
/* Direction argument taken by xfs_bmap_shift_extents(). */
enum shift_direction {
	SHIFT_LEFT = 0,
	SHIFT_RIGHT,
};
|
|
|
|
|
2013-08-12 10:49:51 +00:00
|
|
|
/*
 * Extent list tracing hook.
 *
 * With DEBUG defined, XFS_BMAP_TRACE_EXLIST(ip, c, w) calls
 * xfs_bmap_trace_exlist() and passes _THIS_IP_ as the caller address.
 * Without DEBUG the macro expands to nothing, so its arguments are not
 * evaluated.
 */
#ifdef DEBUG
void	xfs_bmap_trace_exlist(struct xfs_inode *ip, xfs_extnum_t cnt,
		int whichfork, unsigned long caller_ip);
#define	XFS_BMAP_TRACE_EXLIST(ip,c,w)	\
	xfs_bmap_trace_exlist(ip,c,w, _THIS_IP_)
#else
#define	XFS_BMAP_TRACE_EXLIST(ip,c,w)
#endif
|
2005-04-16 22:20:36 +00:00
|
|
|
|
2011-09-18 20:41:07 +00:00
|
|
|
int xfs_bmap_add_attrfork(struct xfs_inode *ip, int size, int rsvd);
|
2013-07-09 21:04:00 +00:00
|
|
|
void xfs_bmap_local_to_extents_empty(struct xfs_inode *ip, int whichfork);
|
2016-08-03 01:19:29 +00:00
|
|
|
void xfs_bmap_add_free(struct xfs_mount *mp, struct xfs_defer_ops *dfops,
|
2016-08-03 01:33:42 +00:00
|
|
|
xfs_fsblock_t bno, xfs_filblks_t len,
|
|
|
|
struct xfs_owner_info *oinfo);
|
2011-09-18 20:41:07 +00:00
|
|
|
void xfs_bmap_compute_maxlevels(struct xfs_mount *mp, int whichfork);
|
|
|
|
int xfs_bmap_first_unused(struct xfs_trans *tp, struct xfs_inode *ip,
|
|
|
|
xfs_extlen_t len, xfs_fileoff_t *unused, int whichfork);
|
|
|
|
int xfs_bmap_last_before(struct xfs_trans *tp, struct xfs_inode *ip,
|
|
|
|
xfs_fileoff_t *last_block, int whichfork);
|
2014-04-14 08:58:05 +00:00
|
|
|
int xfs_bmap_last_offset(struct xfs_inode *ip, xfs_fileoff_t *unused,
|
|
|
|
int whichfork);
|
2011-09-18 20:41:07 +00:00
|
|
|
int xfs_bmap_one_block(struct xfs_inode *ip, int whichfork);
|
|
|
|
int xfs_bmap_read_extents(struct xfs_trans *tp, struct xfs_inode *ip,
|
|
|
|
int whichfork);
|
2011-09-18 20:40:45 +00:00
|
|
|
int xfs_bmapi_read(struct xfs_inode *ip, xfs_fileoff_t bno,
|
|
|
|
xfs_filblks_t len, struct xfs_bmbt_irec *mval,
|
|
|
|
int *nmap, int flags);
|
2011-09-18 20:40:52 +00:00
|
|
|
int xfs_bmapi_write(struct xfs_trans *tp, struct xfs_inode *ip,
|
|
|
|
xfs_fileoff_t bno, xfs_filblks_t len, int flags,
|
|
|
|
xfs_fsblock_t *firstblock, xfs_extlen_t total,
|
|
|
|
struct xfs_bmbt_irec *mval, int *nmap,
|
2016-08-03 01:19:29 +00:00
|
|
|
struct xfs_defer_ops *dfops);
|
2011-09-18 20:41:07 +00:00
|
|
|
int xfs_bunmapi(struct xfs_trans *tp, struct xfs_inode *ip,
|
|
|
|
xfs_fileoff_t bno, xfs_filblks_t len, int flags,
|
|
|
|
xfs_extnum_t nexts, xfs_fsblock_t *firstblock,
|
2016-08-03 01:19:29 +00:00
|
|
|
struct xfs_defer_ops *dfops, int *done);
|
2011-09-18 20:41:07 +00:00
|
|
|
int xfs_check_nostate_extents(struct xfs_ifork *ifp, xfs_extnum_t idx,
|
|
|
|
xfs_extnum_t num);
|
|
|
|
uint xfs_default_attroffset(struct xfs_inode *ip);
|
2014-02-23 23:58:19 +00:00
|
|
|
int xfs_bmap_shift_extents(struct xfs_trans *tp, struct xfs_inode *ip,
|
2015-03-25 04:08:56 +00:00
|
|
|
xfs_fileoff_t *next_fsb, xfs_fileoff_t offset_shift_fsb,
|
|
|
|
int *done, xfs_fileoff_t stop_fsb, xfs_fsblock_t *firstblock,
|
2016-08-03 01:19:29 +00:00
|
|
|
struct xfs_defer_ops *dfops, enum shift_direction direction,
|
2015-03-25 04:08:56 +00:00
|
|
|
int num_exts);
|
|
|
|
int xfs_bmap_split_extent(struct xfs_inode *ip, xfs_fileoff_t split_offset);
|
2016-09-19 01:10:21 +00:00
|
|
|
struct xfs_bmbt_rec_host *
|
|
|
|
xfs_bmap_search_extents(struct xfs_inode *ip, xfs_fileoff_t bno,
|
|
|
|
int fork, int *eofp, xfs_extnum_t *lastxp,
|
|
|
|
struct xfs_bmbt_irec *gotp, struct xfs_bmbt_irec *prevp);
|
|
|
|
int xfs_bmapi_reserve_delalloc(struct xfs_inode *ip, xfs_fileoff_t aoff,
|
|
|
|
xfs_filblks_t len, struct xfs_bmbt_irec *got,
|
|
|
|
struct xfs_bmbt_irec *prev, xfs_extnum_t *lastx, int eof);
|
2009-03-29 17:26:46 +00:00
|
|
|
|
2016-10-03 16:11:26 +00:00
|
|
|
/* Kind of operation recorded in a struct xfs_bmap_intent (bi_type). */
enum xfs_bmap_intent_type {
	XFS_BMAP_MAP = 1,
	XFS_BMAP_UNMAP,
};
|
|
|
|
|
|
|
|
struct xfs_bmap_intent {
|
|
|
|
struct list_head bi_list;
|
|
|
|
enum xfs_bmap_intent_type bi_type;
|
|
|
|
struct xfs_inode *bi_owner;
|
|
|
|
int bi_whichfork;
|
|
|
|
struct xfs_bmbt_irec bi_bmap;
|
|
|
|
};
|
|
|
|
|
2005-04-16 22:20:36 +00:00
|
|
|
#endif /* __XFS_BMAP_H__ */
|