mirror of
https://github.com/torvalds/linux.git
synced 2024-12-23 03:11:46 +00:00
260074cd84
For loosely coupled pNFS/flexfiles systems, there is often no advantage at all in going through the MDS for I/O, since the MDS is subject to the same limitations as all other clients when talking to DSes. If a DS is unresponsive, I/O through the MDS will fail. For such systems, the only scalable solution is to have the pNFS clients retry doing pNFS, and so the protocol now provides a flag that allows the pNFS server to signal this. If LAYOUTGET returns FF_FLAGS_NO_IO_THRU_MDS, then we should assume that the MDS wants the client to retry using these devices, even if they were previously marked as being unavailable. To do so, we add a helper, ff_layout_mark_devices_valid() that will be called from layoutget. Signed-off-by: Trond Myklebust <trond.myklebust@primarydata.com>
195 lines
5.2 KiB
C
195 lines
5.2 KiB
C
/*
|
|
* NFSv4 flexfile layout driver data structures.
|
|
*
|
|
* Copyright (c) 2014, Primary Data, Inc. All rights reserved.
|
|
*
|
|
* Tao Peng <bergwolf@primarydata.com>
|
|
*/
|
|
|
|
#ifndef FS_NFS_NFS4FLEXFILELAYOUT_H
|
|
#define FS_NFS_NFS4FLEXFILELAYOUT_H
|
|
|
|
/*
 * Flag bits kept in nfs4_ff_layout_segment::flags.
 *
 * FF_FLAGS_NO_IO_THRU_MDS is the bit tested by ff_layout_no_fallback_to_mds():
 * when the server sets it, the client is expected to keep retrying pNFS I/O
 * against the data servers rather than falling back to I/O through the MDS.
 *
 * NOTE(review): FF_FLAGS_NO_LAYOUTCOMMIT presumably tells the client that no
 * LAYOUTCOMMIT is needed -- confirm against the flexfiles layout spec.
 */
#define FF_FLAGS_NO_LAYOUTCOMMIT	0x00000001
#define FF_FLAGS_NO_IO_THRU_MDS		0x00000002
|
|
|
|
#include "../pnfs.h"
|
|
|
|
/*
 * XXX: For now, filter out insanely large mirror counts so that a bogus
 * value (caused by a network error etc.) cannot lead to an OOM.
 */
#define NFS4_FLEXFILE_LAYOUT_MAX_MIRROR_CNT	4096
|
|
|
|
/* Interval between LAYOUTSTATS reports, in milliseconds (60 seconds) */
#define FF_LAYOUTSTATS_REPORT_INTERVAL	(60L * 1000L)
|
|
|
|
struct nfs4_ff_ds_version {
|
|
u32 version;
|
|
u32 minor_version;
|
|
u32 rsize;
|
|
u32 wsize;
|
|
bool tightly_coupled;
|
|
};
|
|
|
|
/* chained in global deviceid hlist */
|
|
struct nfs4_ff_layout_ds {
|
|
struct nfs4_deviceid_node id_node;
|
|
u32 ds_versions_cnt;
|
|
struct nfs4_ff_ds_version *ds_versions;
|
|
struct nfs4_pnfs_ds *ds;
|
|
};
|
|
|
|
struct nfs4_ff_layout_ds_err {
|
|
struct list_head list; /* linked in mirror error_list */
|
|
u64 offset;
|
|
u64 length;
|
|
int status;
|
|
enum nfs_opnum4 opnum;
|
|
nfs4_stateid stateid;
|
|
struct nfs4_deviceid deviceid;
|
|
};
|
|
|
|
struct nfs4_ff_io_stat {
|
|
__u64 ops_requested;
|
|
__u64 bytes_requested;
|
|
__u64 ops_completed;
|
|
__u64 bytes_completed;
|
|
__u64 bytes_not_delivered;
|
|
ktime_t total_busy_time;
|
|
ktime_t aggregate_completion_time;
|
|
};
|
|
|
|
struct nfs4_ff_busy_timer {
|
|
ktime_t start_time;
|
|
atomic_t n_ops;
|
|
};
|
|
|
|
struct nfs4_ff_layoutstat {
|
|
struct nfs4_ff_io_stat io_stat;
|
|
struct nfs4_ff_busy_timer busy_timer;
|
|
};
|
|
|
|
struct nfs4_ff_layout_mirror {
|
|
struct pnfs_layout_hdr *layout;
|
|
struct list_head mirrors;
|
|
u32 ds_count;
|
|
u32 efficiency;
|
|
struct nfs4_ff_layout_ds *mirror_ds;
|
|
u32 fh_versions_cnt;
|
|
struct nfs_fh *fh_versions;
|
|
nfs4_stateid stateid;
|
|
u32 uid;
|
|
u32 gid;
|
|
struct rpc_cred *cred;
|
|
atomic_t ref;
|
|
spinlock_t lock;
|
|
struct nfs4_ff_layoutstat read_stat;
|
|
struct nfs4_ff_layoutstat write_stat;
|
|
ktime_t start_time;
|
|
ktime_t last_report_time;
|
|
};
|
|
|
|
struct nfs4_ff_layout_segment {
|
|
struct pnfs_layout_segment generic_hdr;
|
|
u64 stripe_unit;
|
|
u32 flags;
|
|
u32 mirror_array_cnt;
|
|
struct nfs4_ff_layout_mirror **mirror_array;
|
|
};
|
|
|
|
struct nfs4_flexfile_layout {
|
|
struct pnfs_layout_hdr generic_hdr;
|
|
struct pnfs_ds_commit_info commit_info;
|
|
struct list_head mirrors;
|
|
struct list_head error_list; /* nfs4_ff_layout_ds_err */
|
|
};
|
|
|
|
static inline struct nfs4_flexfile_layout *
|
|
FF_LAYOUT_FROM_HDR(struct pnfs_layout_hdr *lo)
|
|
{
|
|
return container_of(lo, struct nfs4_flexfile_layout, generic_hdr);
|
|
}
|
|
|
|
static inline struct nfs4_ff_layout_segment *
|
|
FF_LAYOUT_LSEG(struct pnfs_layout_segment *lseg)
|
|
{
|
|
return container_of(lseg,
|
|
struct nfs4_ff_layout_segment,
|
|
generic_hdr);
|
|
}
|
|
|
|
static inline struct nfs4_deviceid_node *
|
|
FF_LAYOUT_DEVID_NODE(struct pnfs_layout_segment *lseg, u32 idx)
|
|
{
|
|
if (idx >= FF_LAYOUT_LSEG(lseg)->mirror_array_cnt ||
|
|
FF_LAYOUT_LSEG(lseg)->mirror_array[idx] == NULL ||
|
|
FF_LAYOUT_LSEG(lseg)->mirror_array[idx]->mirror_ds == NULL)
|
|
return NULL;
|
|
return &FF_LAYOUT_LSEG(lseg)->mirror_array[idx]->mirror_ds->id_node;
|
|
}
|
|
|
|
static inline struct nfs4_ff_layout_ds *
|
|
FF_LAYOUT_MIRROR_DS(struct nfs4_deviceid_node *node)
|
|
{
|
|
return container_of(node, struct nfs4_ff_layout_ds, id_node);
|
|
}
|
|
|
|
static inline struct nfs4_ff_layout_mirror *
|
|
FF_LAYOUT_COMP(struct pnfs_layout_segment *lseg, u32 idx)
|
|
{
|
|
if (idx >= FF_LAYOUT_LSEG(lseg)->mirror_array_cnt)
|
|
return NULL;
|
|
return FF_LAYOUT_LSEG(lseg)->mirror_array[idx];
|
|
}
|
|
|
|
static inline u32
|
|
FF_LAYOUT_MIRROR_COUNT(struct pnfs_layout_segment *lseg)
|
|
{
|
|
return FF_LAYOUT_LSEG(lseg)->mirror_array_cnt;
|
|
}
|
|
|
|
static inline bool
|
|
ff_layout_no_fallback_to_mds(struct pnfs_layout_segment *lseg)
|
|
{
|
|
return FF_LAYOUT_LSEG(lseg)->flags & FF_FLAGS_NO_IO_THRU_MDS;
|
|
}
|
|
|
|
static inline bool
|
|
ff_layout_test_devid_unavailable(struct nfs4_deviceid_node *node)
|
|
{
|
|
return nfs4_test_deviceid_unavailable(node);
|
|
}
|
|
|
|
static inline int
|
|
nfs4_ff_layout_ds_version(struct pnfs_layout_segment *lseg, u32 ds_idx)
|
|
{
|
|
return FF_LAYOUT_COMP(lseg, ds_idx)->mirror_ds->ds_versions[0].version;
|
|
}
|
|
|
|
struct nfs4_ff_layout_ds *
|
|
nfs4_ff_alloc_deviceid_node(struct nfs_server *server, struct pnfs_device *pdev,
|
|
gfp_t gfp_flags);
|
|
void nfs4_ff_layout_put_deviceid(struct nfs4_ff_layout_ds *mirror_ds);
|
|
void nfs4_ff_layout_free_deviceid(struct nfs4_ff_layout_ds *mirror_ds);
|
|
int ff_layout_track_ds_error(struct nfs4_flexfile_layout *flo,
|
|
struct nfs4_ff_layout_mirror *mirror, u64 offset,
|
|
u64 length, int status, enum nfs_opnum4 opnum,
|
|
gfp_t gfp_flags);
|
|
int ff_layout_encode_ds_ioerr(struct nfs4_flexfile_layout *flo,
|
|
struct xdr_stream *xdr, int *count,
|
|
const struct pnfs_layout_range *range);
|
|
struct nfs_fh *
|
|
nfs4_ff_layout_select_ds_fh(struct pnfs_layout_segment *lseg, u32 mirror_idx);
|
|
|
|
struct nfs4_pnfs_ds *
|
|
nfs4_ff_layout_prepare_ds(struct pnfs_layout_segment *lseg, u32 ds_idx,
|
|
bool fail_return);
|
|
|
|
struct rpc_clnt *
|
|
nfs4_ff_find_or_create_ds_client(struct pnfs_layout_segment *lseg,
|
|
u32 ds_idx,
|
|
struct nfs_client *ds_clp,
|
|
struct inode *inode);
|
|
struct rpc_cred *ff_layout_get_ds_cred(struct pnfs_layout_segment *lseg,
|
|
u32 ds_idx, struct rpc_cred *mdscred);
|
|
bool ff_layout_has_available_ds(struct pnfs_layout_segment *lseg);
|
|
#endif /* FS_NFS_NFS4FLEXFILELAYOUT_H */
|