/* xref: /OK3568_Linux_fs/kernel/fs/nfs/flexfilelayout/flexfilelayout.h (revision 4882a59341e53eb6f0b4789bf948001014eff981) */
/* SPDX-License-Identifier: GPL-2.0 */
/*
 * NFSv4 flexfile layout driver data structures.
 *
 * Copyright (c) 2014, Primary Data, Inc. All rights reserved.
 *
 * Tao Peng <bergwolf@primarydata.com>
 */

10*4882a593Smuzhiyun #ifndef FS_NFS_NFS4FLEXFILELAYOUT_H
11*4882a593Smuzhiyun #define FS_NFS_NFS4FLEXFILELAYOUT_H
12*4882a593Smuzhiyun 
/*
 * Single-bit flag values.  FF_FLAGS_NO_IO_THRU_MDS and FF_FLAGS_NO_READ_IO
 * are tested against nfs4_ff_layout_segment.flags by the inline helpers
 * ff_layout_no_fallback_to_mds() and ff_layout_no_read_on_rw() in this
 * header; presumably FF_FLAGS_NO_LAYOUTCOMMIT is tested against the same
 * word elsewhere (TODO confirm against the .c users).
 */
#define FF_FLAGS_NO_LAYOUTCOMMIT 1
#define FF_FLAGS_NO_IO_THRU_MDS  2
#define FF_FLAGS_NO_READ_IO      4

17*4882a593Smuzhiyun #include <linux/refcount.h>
18*4882a593Smuzhiyun #include "../pnfs.h"
19*4882a593Smuzhiyun 
/*
 * XXX: Filter out insanely large mirror counts for now, to avoid OOM
 * caused by network errors etc.
 */
#define NFS4_FLEXFILE_LAYOUT_MAX_MIRROR_CNT 4096

/* LAYOUTSTATS report interval in ms */
#define FF_LAYOUTSTATS_REPORT_INTERVAL (60000L)
/* Number of entries in nfs4_flexfile_layoutreturn_args.devinfo[] */
#define FF_LAYOUTSTATS_MAXDEV 4

28*4882a593Smuzhiyun struct nfs4_ff_ds_version {
29*4882a593Smuzhiyun 	u32				version;
30*4882a593Smuzhiyun 	u32				minor_version;
31*4882a593Smuzhiyun 	u32				rsize;
32*4882a593Smuzhiyun 	u32				wsize;
33*4882a593Smuzhiyun 	bool				tightly_coupled;
34*4882a593Smuzhiyun };
35*4882a593Smuzhiyun 
36*4882a593Smuzhiyun /* chained in global deviceid hlist */
37*4882a593Smuzhiyun struct nfs4_ff_layout_ds {
38*4882a593Smuzhiyun 	struct nfs4_deviceid_node	id_node;
39*4882a593Smuzhiyun 	u32				ds_versions_cnt;
40*4882a593Smuzhiyun 	struct nfs4_ff_ds_version	*ds_versions;
41*4882a593Smuzhiyun 	struct nfs4_pnfs_ds		*ds;
42*4882a593Smuzhiyun };
43*4882a593Smuzhiyun 
44*4882a593Smuzhiyun struct nfs4_ff_layout_ds_err {
45*4882a593Smuzhiyun 	struct list_head		list; /* linked in mirror error_list */
46*4882a593Smuzhiyun 	u64				offset;
47*4882a593Smuzhiyun 	u64				length;
48*4882a593Smuzhiyun 	int				status;
49*4882a593Smuzhiyun 	enum nfs_opnum4			opnum;
50*4882a593Smuzhiyun 	nfs4_stateid			stateid;
51*4882a593Smuzhiyun 	struct nfs4_deviceid		deviceid;
52*4882a593Smuzhiyun };
53*4882a593Smuzhiyun 
54*4882a593Smuzhiyun struct nfs4_ff_io_stat {
55*4882a593Smuzhiyun 	__u64				ops_requested;
56*4882a593Smuzhiyun 	__u64				bytes_requested;
57*4882a593Smuzhiyun 	__u64				ops_completed;
58*4882a593Smuzhiyun 	__u64				bytes_completed;
59*4882a593Smuzhiyun 	__u64				bytes_not_delivered;
60*4882a593Smuzhiyun 	ktime_t				total_busy_time;
61*4882a593Smuzhiyun 	ktime_t				aggregate_completion_time;
62*4882a593Smuzhiyun };
63*4882a593Smuzhiyun 
64*4882a593Smuzhiyun struct nfs4_ff_busy_timer {
65*4882a593Smuzhiyun 	ktime_t start_time;
66*4882a593Smuzhiyun 	atomic_t n_ops;
67*4882a593Smuzhiyun };
68*4882a593Smuzhiyun 
69*4882a593Smuzhiyun struct nfs4_ff_layoutstat {
70*4882a593Smuzhiyun 	struct nfs4_ff_io_stat io_stat;
71*4882a593Smuzhiyun 	struct nfs4_ff_busy_timer busy_timer;
72*4882a593Smuzhiyun };
73*4882a593Smuzhiyun 
74*4882a593Smuzhiyun struct nfs4_ff_layout_mirror {
75*4882a593Smuzhiyun 	struct pnfs_layout_hdr		*layout;
76*4882a593Smuzhiyun 	struct list_head		mirrors;
77*4882a593Smuzhiyun 	u32				ds_count;
78*4882a593Smuzhiyun 	u32				efficiency;
79*4882a593Smuzhiyun 	struct nfs4_deviceid		devid;
80*4882a593Smuzhiyun 	struct nfs4_ff_layout_ds	*mirror_ds;
81*4882a593Smuzhiyun 	u32				fh_versions_cnt;
82*4882a593Smuzhiyun 	struct nfs_fh			*fh_versions;
83*4882a593Smuzhiyun 	nfs4_stateid			stateid;
84*4882a593Smuzhiyun 	const struct cred __rcu		*ro_cred;
85*4882a593Smuzhiyun 	const struct cred __rcu		*rw_cred;
86*4882a593Smuzhiyun 	refcount_t			ref;
87*4882a593Smuzhiyun 	spinlock_t			lock;
88*4882a593Smuzhiyun 	unsigned long			flags;
89*4882a593Smuzhiyun 	struct nfs4_ff_layoutstat	read_stat;
90*4882a593Smuzhiyun 	struct nfs4_ff_layoutstat	write_stat;
91*4882a593Smuzhiyun 	ktime_t				start_time;
92*4882a593Smuzhiyun 	u32				report_interval;
93*4882a593Smuzhiyun };
94*4882a593Smuzhiyun 
/* NOTE(review): presumably a bit number in nfs4_ff_layout_mirror.flags - confirm */
#define NFS4_FF_MIRROR_STAT_AVAIL	(0)

97*4882a593Smuzhiyun struct nfs4_ff_layout_segment {
98*4882a593Smuzhiyun 	struct pnfs_layout_segment	generic_hdr;
99*4882a593Smuzhiyun 	u64				stripe_unit;
100*4882a593Smuzhiyun 	u32				flags;
101*4882a593Smuzhiyun 	u32				mirror_array_cnt;
102*4882a593Smuzhiyun 	struct nfs4_ff_layout_mirror	*mirror_array[];
103*4882a593Smuzhiyun };
104*4882a593Smuzhiyun 
105*4882a593Smuzhiyun struct nfs4_flexfile_layout {
106*4882a593Smuzhiyun 	struct pnfs_layout_hdr generic_hdr;
107*4882a593Smuzhiyun 	struct pnfs_ds_commit_info commit_info;
108*4882a593Smuzhiyun 	struct list_head	mirrors;
109*4882a593Smuzhiyun 	struct list_head	error_list; /* nfs4_ff_layout_ds_err */
110*4882a593Smuzhiyun 	ktime_t			last_report_time; /* Layoutstat report times */
111*4882a593Smuzhiyun };
112*4882a593Smuzhiyun 
113*4882a593Smuzhiyun struct nfs4_flexfile_layoutreturn_args {
114*4882a593Smuzhiyun 	struct list_head errors;
115*4882a593Smuzhiyun 	struct nfs42_layoutstat_devinfo devinfo[FF_LAYOUTSTATS_MAXDEV];
116*4882a593Smuzhiyun 	unsigned int num_errors;
117*4882a593Smuzhiyun 	unsigned int num_dev;
118*4882a593Smuzhiyun 	struct page *pages[1];
119*4882a593Smuzhiyun };
120*4882a593Smuzhiyun 
121*4882a593Smuzhiyun static inline struct nfs4_flexfile_layout *
FF_LAYOUT_FROM_HDR(struct pnfs_layout_hdr * lo)122*4882a593Smuzhiyun FF_LAYOUT_FROM_HDR(struct pnfs_layout_hdr *lo)
123*4882a593Smuzhiyun {
124*4882a593Smuzhiyun 	return container_of(lo, struct nfs4_flexfile_layout, generic_hdr);
125*4882a593Smuzhiyun }
126*4882a593Smuzhiyun 
127*4882a593Smuzhiyun static inline struct nfs4_ff_layout_segment *
FF_LAYOUT_LSEG(struct pnfs_layout_segment * lseg)128*4882a593Smuzhiyun FF_LAYOUT_LSEG(struct pnfs_layout_segment *lseg)
129*4882a593Smuzhiyun {
130*4882a593Smuzhiyun 	return container_of(lseg,
131*4882a593Smuzhiyun 			    struct nfs4_ff_layout_segment,
132*4882a593Smuzhiyun 			    generic_hdr);
133*4882a593Smuzhiyun }
134*4882a593Smuzhiyun 
135*4882a593Smuzhiyun static inline struct nfs4_ff_layout_ds *
FF_LAYOUT_MIRROR_DS(struct nfs4_deviceid_node * node)136*4882a593Smuzhiyun FF_LAYOUT_MIRROR_DS(struct nfs4_deviceid_node *node)
137*4882a593Smuzhiyun {
138*4882a593Smuzhiyun 	return container_of(node, struct nfs4_ff_layout_ds, id_node);
139*4882a593Smuzhiyun }
140*4882a593Smuzhiyun 
141*4882a593Smuzhiyun static inline struct nfs4_ff_layout_mirror *
FF_LAYOUT_COMP(struct pnfs_layout_segment * lseg,u32 idx)142*4882a593Smuzhiyun FF_LAYOUT_COMP(struct pnfs_layout_segment *lseg, u32 idx)
143*4882a593Smuzhiyun {
144*4882a593Smuzhiyun 	struct nfs4_ff_layout_segment *fls = FF_LAYOUT_LSEG(lseg);
145*4882a593Smuzhiyun 
146*4882a593Smuzhiyun 	if (idx < fls->mirror_array_cnt)
147*4882a593Smuzhiyun 		return fls->mirror_array[idx];
148*4882a593Smuzhiyun 	return NULL;
149*4882a593Smuzhiyun }
150*4882a593Smuzhiyun 
151*4882a593Smuzhiyun static inline struct nfs4_deviceid_node *
FF_LAYOUT_DEVID_NODE(struct pnfs_layout_segment * lseg,u32 idx)152*4882a593Smuzhiyun FF_LAYOUT_DEVID_NODE(struct pnfs_layout_segment *lseg, u32 idx)
153*4882a593Smuzhiyun {
154*4882a593Smuzhiyun 	struct nfs4_ff_layout_mirror *mirror = FF_LAYOUT_COMP(lseg, idx);
155*4882a593Smuzhiyun 
156*4882a593Smuzhiyun 	if (mirror != NULL) {
157*4882a593Smuzhiyun 		struct nfs4_ff_layout_ds *mirror_ds = mirror->mirror_ds;
158*4882a593Smuzhiyun 
159*4882a593Smuzhiyun 		if (!IS_ERR_OR_NULL(mirror_ds))
160*4882a593Smuzhiyun 			return &mirror_ds->id_node;
161*4882a593Smuzhiyun 	}
162*4882a593Smuzhiyun 	return NULL;
163*4882a593Smuzhiyun }
164*4882a593Smuzhiyun 
165*4882a593Smuzhiyun static inline u32
FF_LAYOUT_MIRROR_COUNT(struct pnfs_layout_segment * lseg)166*4882a593Smuzhiyun FF_LAYOUT_MIRROR_COUNT(struct pnfs_layout_segment *lseg)
167*4882a593Smuzhiyun {
168*4882a593Smuzhiyun 	return FF_LAYOUT_LSEG(lseg)->mirror_array_cnt;
169*4882a593Smuzhiyun }
170*4882a593Smuzhiyun 
171*4882a593Smuzhiyun static inline bool
ff_layout_no_fallback_to_mds(struct pnfs_layout_segment * lseg)172*4882a593Smuzhiyun ff_layout_no_fallback_to_mds(struct pnfs_layout_segment *lseg)
173*4882a593Smuzhiyun {
174*4882a593Smuzhiyun 	return FF_LAYOUT_LSEG(lseg)->flags & FF_FLAGS_NO_IO_THRU_MDS;
175*4882a593Smuzhiyun }
176*4882a593Smuzhiyun 
177*4882a593Smuzhiyun static inline bool
ff_layout_no_read_on_rw(struct pnfs_layout_segment * lseg)178*4882a593Smuzhiyun ff_layout_no_read_on_rw(struct pnfs_layout_segment *lseg)
179*4882a593Smuzhiyun {
180*4882a593Smuzhiyun 	return FF_LAYOUT_LSEG(lseg)->flags & FF_FLAGS_NO_READ_IO;
181*4882a593Smuzhiyun }
182*4882a593Smuzhiyun 
183*4882a593Smuzhiyun static inline int
nfs4_ff_layout_ds_version(const struct nfs4_ff_layout_mirror * mirror)184*4882a593Smuzhiyun nfs4_ff_layout_ds_version(const struct nfs4_ff_layout_mirror *mirror)
185*4882a593Smuzhiyun {
186*4882a593Smuzhiyun 	return mirror->mirror_ds->ds_versions[0].version;
187*4882a593Smuzhiyun }
188*4882a593Smuzhiyun 
189*4882a593Smuzhiyun struct nfs4_ff_layout_ds *
190*4882a593Smuzhiyun nfs4_ff_alloc_deviceid_node(struct nfs_server *server, struct pnfs_device *pdev,
191*4882a593Smuzhiyun 			    gfp_t gfp_flags);
192*4882a593Smuzhiyun void nfs4_ff_layout_put_deviceid(struct nfs4_ff_layout_ds *mirror_ds);
193*4882a593Smuzhiyun void nfs4_ff_layout_free_deviceid(struct nfs4_ff_layout_ds *mirror_ds);
194*4882a593Smuzhiyun int ff_layout_track_ds_error(struct nfs4_flexfile_layout *flo,
195*4882a593Smuzhiyun 			     struct nfs4_ff_layout_mirror *mirror, u64 offset,
196*4882a593Smuzhiyun 			     u64 length, int status, enum nfs_opnum4 opnum,
197*4882a593Smuzhiyun 			     gfp_t gfp_flags);
198*4882a593Smuzhiyun void ff_layout_send_layouterror(struct pnfs_layout_segment *lseg);
199*4882a593Smuzhiyun int ff_layout_encode_ds_ioerr(struct xdr_stream *xdr, const struct list_head *head);
200*4882a593Smuzhiyun void ff_layout_free_ds_ioerr(struct list_head *head);
201*4882a593Smuzhiyun unsigned int ff_layout_fetch_ds_ioerr(struct pnfs_layout_hdr *lo,
202*4882a593Smuzhiyun 		const struct pnfs_layout_range *range,
203*4882a593Smuzhiyun 		struct list_head *head,
204*4882a593Smuzhiyun 		unsigned int maxnum);
205*4882a593Smuzhiyun struct nfs_fh *
206*4882a593Smuzhiyun nfs4_ff_layout_select_ds_fh(struct nfs4_ff_layout_mirror *mirror);
207*4882a593Smuzhiyun void
208*4882a593Smuzhiyun nfs4_ff_layout_select_ds_stateid(const struct nfs4_ff_layout_mirror *mirror,
209*4882a593Smuzhiyun 		nfs4_stateid *stateid);
210*4882a593Smuzhiyun 
211*4882a593Smuzhiyun struct nfs4_pnfs_ds *
212*4882a593Smuzhiyun nfs4_ff_layout_prepare_ds(struct pnfs_layout_segment *lseg,
213*4882a593Smuzhiyun 			  struct nfs4_ff_layout_mirror *mirror,
214*4882a593Smuzhiyun 			  bool fail_return);
215*4882a593Smuzhiyun 
216*4882a593Smuzhiyun struct rpc_clnt *
217*4882a593Smuzhiyun nfs4_ff_find_or_create_ds_client(struct nfs4_ff_layout_mirror *mirror,
218*4882a593Smuzhiyun 				 struct nfs_client *ds_clp,
219*4882a593Smuzhiyun 				 struct inode *inode);
220*4882a593Smuzhiyun const struct cred *ff_layout_get_ds_cred(struct nfs4_ff_layout_mirror *mirror,
221*4882a593Smuzhiyun 					 const struct pnfs_layout_range *range,
222*4882a593Smuzhiyun 					 const struct cred *mdscred);
223*4882a593Smuzhiyun bool ff_layout_avoid_mds_available_ds(struct pnfs_layout_segment *lseg);
224*4882a593Smuzhiyun bool ff_layout_avoid_read_on_rw(struct pnfs_layout_segment *lseg);
225*4882a593Smuzhiyun 
226*4882a593Smuzhiyun #endif /* FS_NFS_NFS4FLEXFILELAYOUT_H */
227