1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0-only
2*4882a593Smuzhiyun
3*4882a593Smuzhiyun #include <linux/ceph/ceph_debug.h>
4*4882a593Smuzhiyun
5*4882a593Smuzhiyun #include <linux/backing-dev.h>
6*4882a593Smuzhiyun #include <linux/ctype.h>
7*4882a593Smuzhiyun #include <linux/fs.h>
8*4882a593Smuzhiyun #include <linux/inet.h>
9*4882a593Smuzhiyun #include <linux/in6.h>
10*4882a593Smuzhiyun #include <linux/module.h>
11*4882a593Smuzhiyun #include <linux/mount.h>
12*4882a593Smuzhiyun #include <linux/fs_context.h>
13*4882a593Smuzhiyun #include <linux/fs_parser.h>
14*4882a593Smuzhiyun #include <linux/sched.h>
15*4882a593Smuzhiyun #include <linux/seq_file.h>
16*4882a593Smuzhiyun #include <linux/slab.h>
17*4882a593Smuzhiyun #include <linux/statfs.h>
18*4882a593Smuzhiyun #include <linux/string.h>
19*4882a593Smuzhiyun
20*4882a593Smuzhiyun #include "super.h"
21*4882a593Smuzhiyun #include "mds_client.h"
22*4882a593Smuzhiyun #include "cache.h"
23*4882a593Smuzhiyun
24*4882a593Smuzhiyun #include <linux/ceph/ceph_features.h>
25*4882a593Smuzhiyun #include <linux/ceph/decode.h>
26*4882a593Smuzhiyun #include <linux/ceph/mon_client.h>
27*4882a593Smuzhiyun #include <linux/ceph/auth.h>
28*4882a593Smuzhiyun #include <linux/ceph/debugfs.h>
29*4882a593Smuzhiyun
/*
 * Every ceph_fs_client set up by create_fs_client() is linked onto
 * ceph_fsc_list through its metric_wakeup member; the insertion is done
 * with ceph_fsc_lock held.
 */
static DEFINE_SPINLOCK(ceph_fsc_lock);
static LIST_HEAD(ceph_fsc_list);
32*4882a593Smuzhiyun
/*
 * Ceph superblock operations
 *
 * Handle the basics of mounting and unmounting.
 */
38*4882a593Smuzhiyun
39*4882a593Smuzhiyun /*
40*4882a593Smuzhiyun * super ops
41*4882a593Smuzhiyun */
ceph_put_super(struct super_block * s)42*4882a593Smuzhiyun static void ceph_put_super(struct super_block *s)
43*4882a593Smuzhiyun {
44*4882a593Smuzhiyun struct ceph_fs_client *fsc = ceph_sb_to_client(s);
45*4882a593Smuzhiyun
46*4882a593Smuzhiyun dout("put_super\n");
47*4882a593Smuzhiyun ceph_mdsc_close_sessions(fsc->mdsc);
48*4882a593Smuzhiyun }
49*4882a593Smuzhiyun
ceph_statfs(struct dentry * dentry,struct kstatfs * buf)50*4882a593Smuzhiyun static int ceph_statfs(struct dentry *dentry, struct kstatfs *buf)
51*4882a593Smuzhiyun {
52*4882a593Smuzhiyun struct ceph_fs_client *fsc = ceph_inode_to_client(d_inode(dentry));
53*4882a593Smuzhiyun struct ceph_mon_client *monc = &fsc->client->monc;
54*4882a593Smuzhiyun struct ceph_statfs st;
55*4882a593Smuzhiyun int i, err;
56*4882a593Smuzhiyun u64 data_pool;
57*4882a593Smuzhiyun
58*4882a593Smuzhiyun if (fsc->mdsc->mdsmap->m_num_data_pg_pools == 1) {
59*4882a593Smuzhiyun data_pool = fsc->mdsc->mdsmap->m_data_pg_pools[0];
60*4882a593Smuzhiyun } else {
61*4882a593Smuzhiyun data_pool = CEPH_NOPOOL;
62*4882a593Smuzhiyun }
63*4882a593Smuzhiyun
64*4882a593Smuzhiyun dout("statfs\n");
65*4882a593Smuzhiyun err = ceph_monc_do_statfs(monc, data_pool, &st);
66*4882a593Smuzhiyun if (err < 0)
67*4882a593Smuzhiyun return err;
68*4882a593Smuzhiyun
69*4882a593Smuzhiyun /* fill in kstatfs */
70*4882a593Smuzhiyun buf->f_type = CEPH_SUPER_MAGIC; /* ?? */
71*4882a593Smuzhiyun
72*4882a593Smuzhiyun /*
73*4882a593Smuzhiyun * express utilization in terms of large blocks to avoid
74*4882a593Smuzhiyun * overflow on 32-bit machines.
75*4882a593Smuzhiyun *
76*4882a593Smuzhiyun * NOTE: for the time being, we make bsize == frsize to humor
77*4882a593Smuzhiyun * not-yet-ancient versions of glibc that are broken.
78*4882a593Smuzhiyun * Someday, we will probably want to report a real block
79*4882a593Smuzhiyun * size... whatever that may mean for a network file system!
80*4882a593Smuzhiyun */
81*4882a593Smuzhiyun buf->f_bsize = 1 << CEPH_BLOCK_SHIFT;
82*4882a593Smuzhiyun buf->f_frsize = 1 << CEPH_BLOCK_SHIFT;
83*4882a593Smuzhiyun
84*4882a593Smuzhiyun /*
85*4882a593Smuzhiyun * By default use root quota for stats; fallback to overall filesystem
86*4882a593Smuzhiyun * usage if using 'noquotadf' mount option or if the root dir doesn't
87*4882a593Smuzhiyun * have max_bytes quota set.
88*4882a593Smuzhiyun */
89*4882a593Smuzhiyun if (ceph_test_mount_opt(fsc, NOQUOTADF) ||
90*4882a593Smuzhiyun !ceph_quota_update_statfs(fsc, buf)) {
91*4882a593Smuzhiyun buf->f_blocks = le64_to_cpu(st.kb) >> (CEPH_BLOCK_SHIFT-10);
92*4882a593Smuzhiyun buf->f_bfree = le64_to_cpu(st.kb_avail) >> (CEPH_BLOCK_SHIFT-10);
93*4882a593Smuzhiyun buf->f_bavail = le64_to_cpu(st.kb_avail) >> (CEPH_BLOCK_SHIFT-10);
94*4882a593Smuzhiyun }
95*4882a593Smuzhiyun
96*4882a593Smuzhiyun buf->f_files = le64_to_cpu(st.num_objects);
97*4882a593Smuzhiyun buf->f_ffree = -1;
98*4882a593Smuzhiyun buf->f_namelen = NAME_MAX;
99*4882a593Smuzhiyun
100*4882a593Smuzhiyun /* Must convert the fsid, for consistent values across arches */
101*4882a593Smuzhiyun buf->f_fsid.val[0] = 0;
102*4882a593Smuzhiyun mutex_lock(&monc->mutex);
103*4882a593Smuzhiyun for (i = 0 ; i < sizeof(monc->monmap->fsid) / sizeof(__le32) ; ++i)
104*4882a593Smuzhiyun buf->f_fsid.val[0] ^= le32_to_cpu(((__le32 *)&monc->monmap->fsid)[i]);
105*4882a593Smuzhiyun mutex_unlock(&monc->mutex);
106*4882a593Smuzhiyun
107*4882a593Smuzhiyun /* fold the fs_cluster_id into the upper bits */
108*4882a593Smuzhiyun buf->f_fsid.val[1] = monc->fs_cluster_id;
109*4882a593Smuzhiyun
110*4882a593Smuzhiyun return 0;
111*4882a593Smuzhiyun }
112*4882a593Smuzhiyun
ceph_sync_fs(struct super_block * sb,int wait)113*4882a593Smuzhiyun static int ceph_sync_fs(struct super_block *sb, int wait)
114*4882a593Smuzhiyun {
115*4882a593Smuzhiyun struct ceph_fs_client *fsc = ceph_sb_to_client(sb);
116*4882a593Smuzhiyun
117*4882a593Smuzhiyun if (!wait) {
118*4882a593Smuzhiyun dout("sync_fs (non-blocking)\n");
119*4882a593Smuzhiyun ceph_flush_dirty_caps(fsc->mdsc);
120*4882a593Smuzhiyun dout("sync_fs (non-blocking) done\n");
121*4882a593Smuzhiyun return 0;
122*4882a593Smuzhiyun }
123*4882a593Smuzhiyun
124*4882a593Smuzhiyun dout("sync_fs (blocking)\n");
125*4882a593Smuzhiyun ceph_osdc_sync(&fsc->client->osdc);
126*4882a593Smuzhiyun ceph_mdsc_sync(fsc->mdsc);
127*4882a593Smuzhiyun dout("sync_fs (blocking) done\n");
128*4882a593Smuzhiyun return 0;
129*4882a593Smuzhiyun }
130*4882a593Smuzhiyun
/*
 * mount options
 *
 * Tokens returned by fs_parse() for the entries of ceph_mount_parameters
 * and dispatched on in ceph_parse_mount_param().
 */
enum {
	Opt_wsize,
	Opt_rsize,
	Opt_rasize,
	Opt_caps_wanted_delay_min,
	Opt_caps_wanted_delay_max,
	Opt_caps_max,
	Opt_readdir_max_entries,
	Opt_readdir_max_bytes,
	Opt_congestion_kb,
	/* int args above */
	Opt_snapdirname,
	Opt_mds_namespace,
	Opt_recover_session,
	Opt_source,
	/* string args above */
	Opt_dirstat,
	Opt_rbytes,
	Opt_asyncreaddir,
	Opt_dcache,
	Opt_ino32,
	Opt_fscache,
	Opt_poolperm,
	Opt_require_active_mds,
	Opt_acl,
	Opt_quotadf,
	Opt_copyfrom,
	Opt_wsync,
};
163*4882a593Smuzhiyun
/* Values accepted by the "recover_session" mount option. */
enum ceph_recover_session_mode {
	ceph_recover_session_no,
	ceph_recover_session_clean
};
168*4882a593Smuzhiyun
169*4882a593Smuzhiyun static const struct constant_table ceph_param_recover[] = {
170*4882a593Smuzhiyun { "no", ceph_recover_session_no },
171*4882a593Smuzhiyun { "clean", ceph_recover_session_clean },
172*4882a593Smuzhiyun {}
173*4882a593Smuzhiyun };
174*4882a593Smuzhiyun
175*4882a593Smuzhiyun static const struct fs_parameter_spec ceph_mount_parameters[] = {
176*4882a593Smuzhiyun fsparam_flag_no ("acl", Opt_acl),
177*4882a593Smuzhiyun fsparam_flag_no ("asyncreaddir", Opt_asyncreaddir),
178*4882a593Smuzhiyun fsparam_s32 ("caps_max", Opt_caps_max),
179*4882a593Smuzhiyun fsparam_u32 ("caps_wanted_delay_max", Opt_caps_wanted_delay_max),
180*4882a593Smuzhiyun fsparam_u32 ("caps_wanted_delay_min", Opt_caps_wanted_delay_min),
181*4882a593Smuzhiyun fsparam_u32 ("write_congestion_kb", Opt_congestion_kb),
182*4882a593Smuzhiyun fsparam_flag_no ("copyfrom", Opt_copyfrom),
183*4882a593Smuzhiyun fsparam_flag_no ("dcache", Opt_dcache),
184*4882a593Smuzhiyun fsparam_flag_no ("dirstat", Opt_dirstat),
185*4882a593Smuzhiyun fsparam_flag_no ("fsc", Opt_fscache), // fsc|nofsc
186*4882a593Smuzhiyun fsparam_string ("fsc", Opt_fscache), // fsc=...
187*4882a593Smuzhiyun fsparam_flag_no ("ino32", Opt_ino32),
188*4882a593Smuzhiyun fsparam_string ("mds_namespace", Opt_mds_namespace),
189*4882a593Smuzhiyun fsparam_flag_no ("poolperm", Opt_poolperm),
190*4882a593Smuzhiyun fsparam_flag_no ("quotadf", Opt_quotadf),
191*4882a593Smuzhiyun fsparam_u32 ("rasize", Opt_rasize),
192*4882a593Smuzhiyun fsparam_flag_no ("rbytes", Opt_rbytes),
193*4882a593Smuzhiyun fsparam_u32 ("readdir_max_bytes", Opt_readdir_max_bytes),
194*4882a593Smuzhiyun fsparam_u32 ("readdir_max_entries", Opt_readdir_max_entries),
195*4882a593Smuzhiyun fsparam_enum ("recover_session", Opt_recover_session, ceph_param_recover),
196*4882a593Smuzhiyun fsparam_flag_no ("require_active_mds", Opt_require_active_mds),
197*4882a593Smuzhiyun fsparam_u32 ("rsize", Opt_rsize),
198*4882a593Smuzhiyun fsparam_string ("snapdirname", Opt_snapdirname),
199*4882a593Smuzhiyun fsparam_string ("source", Opt_source),
200*4882a593Smuzhiyun fsparam_u32 ("wsize", Opt_wsize),
201*4882a593Smuzhiyun fsparam_flag_no ("wsync", Opt_wsync),
202*4882a593Smuzhiyun {}
203*4882a593Smuzhiyun };
204*4882a593Smuzhiyun
/*
 * Parsing state stored in fs_context::fs_private while mount parameters
 * are being processed.
 */
struct ceph_parse_opts_ctx {
	struct ceph_options		*copts;	/* passed to ceph_parse_param() and ceph_parse_mon_ips() */
	struct ceph_mount_options	*opts;	/* filesystem-level mount options */
};
209*4882a593Smuzhiyun
/*
 * Remove adjacent slashes and then the trailing slash, unless it is
 * the only remaining character.
 *
 * E.g. "//dir1////dir2///" --> "/dir1/dir2", "///" --> "/".
 *
 * @path is rewritten in place; the result is never longer than the input.
 */
static void canonicalize_path(char *path)
{
	size_t rd, wr = 0;

	for (rd = 0; path[rd] != '\0'; rd++) {
		/* Drop a '/' that directly follows an already kept '/'. */
		if (path[rd] == '/' && wr > 0 && path[wr - 1] == '/')
			continue;
		path[wr++] = path[rd];
	}

	/* Strip one trailing '/', but never reduce "/" to "". */
	if (wr > 1 && path[wr - 1] == '/')
		wr--;
	path[wr] = '\0';
}
229*4882a593Smuzhiyun
230*4882a593Smuzhiyun /*
231*4882a593Smuzhiyun * Parse the source parameter. Distinguish the server list from the path.
232*4882a593Smuzhiyun *
233*4882a593Smuzhiyun * The source will look like:
234*4882a593Smuzhiyun * <server_spec>[,<server_spec>...]:[<path>]
235*4882a593Smuzhiyun * where
236*4882a593Smuzhiyun * <server_spec> is <ip>[:<port>]
237*4882a593Smuzhiyun * <path> is optional, but if present must begin with '/'
238*4882a593Smuzhiyun */
ceph_parse_source(struct fs_parameter * param,struct fs_context * fc)239*4882a593Smuzhiyun static int ceph_parse_source(struct fs_parameter *param, struct fs_context *fc)
240*4882a593Smuzhiyun {
241*4882a593Smuzhiyun struct ceph_parse_opts_ctx *pctx = fc->fs_private;
242*4882a593Smuzhiyun struct ceph_mount_options *fsopt = pctx->opts;
243*4882a593Smuzhiyun char *dev_name = param->string, *dev_name_end;
244*4882a593Smuzhiyun int ret;
245*4882a593Smuzhiyun
246*4882a593Smuzhiyun dout("%s '%s'\n", __func__, dev_name);
247*4882a593Smuzhiyun if (!dev_name || !*dev_name)
248*4882a593Smuzhiyun return invalfc(fc, "Empty source");
249*4882a593Smuzhiyun
250*4882a593Smuzhiyun dev_name_end = strchr(dev_name, '/');
251*4882a593Smuzhiyun if (dev_name_end) {
252*4882a593Smuzhiyun /*
253*4882a593Smuzhiyun * The server_path will include the whole chars from userland
254*4882a593Smuzhiyun * including the leading '/'.
255*4882a593Smuzhiyun */
256*4882a593Smuzhiyun kfree(fsopt->server_path);
257*4882a593Smuzhiyun fsopt->server_path = kstrdup(dev_name_end, GFP_KERNEL);
258*4882a593Smuzhiyun if (!fsopt->server_path)
259*4882a593Smuzhiyun return -ENOMEM;
260*4882a593Smuzhiyun
261*4882a593Smuzhiyun canonicalize_path(fsopt->server_path);
262*4882a593Smuzhiyun } else {
263*4882a593Smuzhiyun dev_name_end = dev_name + strlen(dev_name);
264*4882a593Smuzhiyun }
265*4882a593Smuzhiyun
266*4882a593Smuzhiyun dev_name_end--; /* back up to ':' separator */
267*4882a593Smuzhiyun if (dev_name_end < dev_name || *dev_name_end != ':')
268*4882a593Smuzhiyun return invalfc(fc, "No path or : separator in source");
269*4882a593Smuzhiyun
270*4882a593Smuzhiyun dout("device name '%.*s'\n", (int)(dev_name_end - dev_name), dev_name);
271*4882a593Smuzhiyun if (fsopt->server_path)
272*4882a593Smuzhiyun dout("server path '%s'\n", fsopt->server_path);
273*4882a593Smuzhiyun
274*4882a593Smuzhiyun ret = ceph_parse_mon_ips(param->string, dev_name_end - dev_name,
275*4882a593Smuzhiyun pctx->copts, fc->log.log);
276*4882a593Smuzhiyun if (ret)
277*4882a593Smuzhiyun return ret;
278*4882a593Smuzhiyun
279*4882a593Smuzhiyun fc->source = param->string;
280*4882a593Smuzhiyun param->string = NULL;
281*4882a593Smuzhiyun return 0;
282*4882a593Smuzhiyun }
283*4882a593Smuzhiyun
ceph_parse_mount_param(struct fs_context * fc,struct fs_parameter * param)284*4882a593Smuzhiyun static int ceph_parse_mount_param(struct fs_context *fc,
285*4882a593Smuzhiyun struct fs_parameter *param)
286*4882a593Smuzhiyun {
287*4882a593Smuzhiyun struct ceph_parse_opts_ctx *pctx = fc->fs_private;
288*4882a593Smuzhiyun struct ceph_mount_options *fsopt = pctx->opts;
289*4882a593Smuzhiyun struct fs_parse_result result;
290*4882a593Smuzhiyun unsigned int mode;
291*4882a593Smuzhiyun int token, ret;
292*4882a593Smuzhiyun
293*4882a593Smuzhiyun ret = ceph_parse_param(param, pctx->copts, fc->log.log);
294*4882a593Smuzhiyun if (ret != -ENOPARAM)
295*4882a593Smuzhiyun return ret;
296*4882a593Smuzhiyun
297*4882a593Smuzhiyun token = fs_parse(fc, ceph_mount_parameters, param, &result);
298*4882a593Smuzhiyun dout("%s fs_parse '%s' token %d\n", __func__, param->key, token);
299*4882a593Smuzhiyun if (token < 0)
300*4882a593Smuzhiyun return token;
301*4882a593Smuzhiyun
302*4882a593Smuzhiyun switch (token) {
303*4882a593Smuzhiyun case Opt_snapdirname:
304*4882a593Smuzhiyun kfree(fsopt->snapdir_name);
305*4882a593Smuzhiyun fsopt->snapdir_name = param->string;
306*4882a593Smuzhiyun param->string = NULL;
307*4882a593Smuzhiyun break;
308*4882a593Smuzhiyun case Opt_mds_namespace:
309*4882a593Smuzhiyun kfree(fsopt->mds_namespace);
310*4882a593Smuzhiyun fsopt->mds_namespace = param->string;
311*4882a593Smuzhiyun param->string = NULL;
312*4882a593Smuzhiyun break;
313*4882a593Smuzhiyun case Opt_recover_session:
314*4882a593Smuzhiyun mode = result.uint_32;
315*4882a593Smuzhiyun if (mode == ceph_recover_session_no)
316*4882a593Smuzhiyun fsopt->flags &= ~CEPH_MOUNT_OPT_CLEANRECOVER;
317*4882a593Smuzhiyun else if (mode == ceph_recover_session_clean)
318*4882a593Smuzhiyun fsopt->flags |= CEPH_MOUNT_OPT_CLEANRECOVER;
319*4882a593Smuzhiyun else
320*4882a593Smuzhiyun BUG();
321*4882a593Smuzhiyun break;
322*4882a593Smuzhiyun case Opt_source:
323*4882a593Smuzhiyun if (fc->source)
324*4882a593Smuzhiyun return invalfc(fc, "Multiple sources specified");
325*4882a593Smuzhiyun return ceph_parse_source(param, fc);
326*4882a593Smuzhiyun case Opt_wsize:
327*4882a593Smuzhiyun if (result.uint_32 < PAGE_SIZE ||
328*4882a593Smuzhiyun result.uint_32 > CEPH_MAX_WRITE_SIZE)
329*4882a593Smuzhiyun goto out_of_range;
330*4882a593Smuzhiyun fsopt->wsize = ALIGN(result.uint_32, PAGE_SIZE);
331*4882a593Smuzhiyun break;
332*4882a593Smuzhiyun case Opt_rsize:
333*4882a593Smuzhiyun if (result.uint_32 < PAGE_SIZE ||
334*4882a593Smuzhiyun result.uint_32 > CEPH_MAX_READ_SIZE)
335*4882a593Smuzhiyun goto out_of_range;
336*4882a593Smuzhiyun fsopt->rsize = ALIGN(result.uint_32, PAGE_SIZE);
337*4882a593Smuzhiyun break;
338*4882a593Smuzhiyun case Opt_rasize:
339*4882a593Smuzhiyun fsopt->rasize = ALIGN(result.uint_32, PAGE_SIZE);
340*4882a593Smuzhiyun break;
341*4882a593Smuzhiyun case Opt_caps_wanted_delay_min:
342*4882a593Smuzhiyun if (result.uint_32 < 1)
343*4882a593Smuzhiyun goto out_of_range;
344*4882a593Smuzhiyun fsopt->caps_wanted_delay_min = result.uint_32;
345*4882a593Smuzhiyun break;
346*4882a593Smuzhiyun case Opt_caps_wanted_delay_max:
347*4882a593Smuzhiyun if (result.uint_32 < 1)
348*4882a593Smuzhiyun goto out_of_range;
349*4882a593Smuzhiyun fsopt->caps_wanted_delay_max = result.uint_32;
350*4882a593Smuzhiyun break;
351*4882a593Smuzhiyun case Opt_caps_max:
352*4882a593Smuzhiyun if (result.int_32 < 0)
353*4882a593Smuzhiyun goto out_of_range;
354*4882a593Smuzhiyun fsopt->caps_max = result.int_32;
355*4882a593Smuzhiyun break;
356*4882a593Smuzhiyun case Opt_readdir_max_entries:
357*4882a593Smuzhiyun if (result.uint_32 < 1)
358*4882a593Smuzhiyun goto out_of_range;
359*4882a593Smuzhiyun fsopt->max_readdir = result.uint_32;
360*4882a593Smuzhiyun break;
361*4882a593Smuzhiyun case Opt_readdir_max_bytes:
362*4882a593Smuzhiyun if (result.uint_32 < PAGE_SIZE && result.uint_32 != 0)
363*4882a593Smuzhiyun goto out_of_range;
364*4882a593Smuzhiyun fsopt->max_readdir_bytes = result.uint_32;
365*4882a593Smuzhiyun break;
366*4882a593Smuzhiyun case Opt_congestion_kb:
367*4882a593Smuzhiyun if (result.uint_32 < 1024) /* at least 1M */
368*4882a593Smuzhiyun goto out_of_range;
369*4882a593Smuzhiyun fsopt->congestion_kb = result.uint_32;
370*4882a593Smuzhiyun break;
371*4882a593Smuzhiyun case Opt_dirstat:
372*4882a593Smuzhiyun if (!result.negated)
373*4882a593Smuzhiyun fsopt->flags |= CEPH_MOUNT_OPT_DIRSTAT;
374*4882a593Smuzhiyun else
375*4882a593Smuzhiyun fsopt->flags &= ~CEPH_MOUNT_OPT_DIRSTAT;
376*4882a593Smuzhiyun break;
377*4882a593Smuzhiyun case Opt_rbytes:
378*4882a593Smuzhiyun if (!result.negated)
379*4882a593Smuzhiyun fsopt->flags |= CEPH_MOUNT_OPT_RBYTES;
380*4882a593Smuzhiyun else
381*4882a593Smuzhiyun fsopt->flags &= ~CEPH_MOUNT_OPT_RBYTES;
382*4882a593Smuzhiyun break;
383*4882a593Smuzhiyun case Opt_asyncreaddir:
384*4882a593Smuzhiyun if (!result.negated)
385*4882a593Smuzhiyun fsopt->flags &= ~CEPH_MOUNT_OPT_NOASYNCREADDIR;
386*4882a593Smuzhiyun else
387*4882a593Smuzhiyun fsopt->flags |= CEPH_MOUNT_OPT_NOASYNCREADDIR;
388*4882a593Smuzhiyun break;
389*4882a593Smuzhiyun case Opt_dcache:
390*4882a593Smuzhiyun if (!result.negated)
391*4882a593Smuzhiyun fsopt->flags |= CEPH_MOUNT_OPT_DCACHE;
392*4882a593Smuzhiyun else
393*4882a593Smuzhiyun fsopt->flags &= ~CEPH_MOUNT_OPT_DCACHE;
394*4882a593Smuzhiyun break;
395*4882a593Smuzhiyun case Opt_ino32:
396*4882a593Smuzhiyun if (!result.negated)
397*4882a593Smuzhiyun fsopt->flags |= CEPH_MOUNT_OPT_INO32;
398*4882a593Smuzhiyun else
399*4882a593Smuzhiyun fsopt->flags &= ~CEPH_MOUNT_OPT_INO32;
400*4882a593Smuzhiyun break;
401*4882a593Smuzhiyun
402*4882a593Smuzhiyun case Opt_fscache:
403*4882a593Smuzhiyun #ifdef CONFIG_CEPH_FSCACHE
404*4882a593Smuzhiyun kfree(fsopt->fscache_uniq);
405*4882a593Smuzhiyun fsopt->fscache_uniq = NULL;
406*4882a593Smuzhiyun if (result.negated) {
407*4882a593Smuzhiyun fsopt->flags &= ~CEPH_MOUNT_OPT_FSCACHE;
408*4882a593Smuzhiyun } else {
409*4882a593Smuzhiyun fsopt->flags |= CEPH_MOUNT_OPT_FSCACHE;
410*4882a593Smuzhiyun fsopt->fscache_uniq = param->string;
411*4882a593Smuzhiyun param->string = NULL;
412*4882a593Smuzhiyun }
413*4882a593Smuzhiyun break;
414*4882a593Smuzhiyun #else
415*4882a593Smuzhiyun return invalfc(fc, "fscache support is disabled");
416*4882a593Smuzhiyun #endif
417*4882a593Smuzhiyun case Opt_poolperm:
418*4882a593Smuzhiyun if (!result.negated)
419*4882a593Smuzhiyun fsopt->flags &= ~CEPH_MOUNT_OPT_NOPOOLPERM;
420*4882a593Smuzhiyun else
421*4882a593Smuzhiyun fsopt->flags |= CEPH_MOUNT_OPT_NOPOOLPERM;
422*4882a593Smuzhiyun break;
423*4882a593Smuzhiyun case Opt_require_active_mds:
424*4882a593Smuzhiyun if (!result.negated)
425*4882a593Smuzhiyun fsopt->flags &= ~CEPH_MOUNT_OPT_MOUNTWAIT;
426*4882a593Smuzhiyun else
427*4882a593Smuzhiyun fsopt->flags |= CEPH_MOUNT_OPT_MOUNTWAIT;
428*4882a593Smuzhiyun break;
429*4882a593Smuzhiyun case Opt_quotadf:
430*4882a593Smuzhiyun if (!result.negated)
431*4882a593Smuzhiyun fsopt->flags &= ~CEPH_MOUNT_OPT_NOQUOTADF;
432*4882a593Smuzhiyun else
433*4882a593Smuzhiyun fsopt->flags |= CEPH_MOUNT_OPT_NOQUOTADF;
434*4882a593Smuzhiyun break;
435*4882a593Smuzhiyun case Opt_copyfrom:
436*4882a593Smuzhiyun if (!result.negated)
437*4882a593Smuzhiyun fsopt->flags &= ~CEPH_MOUNT_OPT_NOCOPYFROM;
438*4882a593Smuzhiyun else
439*4882a593Smuzhiyun fsopt->flags |= CEPH_MOUNT_OPT_NOCOPYFROM;
440*4882a593Smuzhiyun break;
441*4882a593Smuzhiyun case Opt_acl:
442*4882a593Smuzhiyun if (!result.negated) {
443*4882a593Smuzhiyun #ifdef CONFIG_CEPH_FS_POSIX_ACL
444*4882a593Smuzhiyun fc->sb_flags |= SB_POSIXACL;
445*4882a593Smuzhiyun #else
446*4882a593Smuzhiyun return invalfc(fc, "POSIX ACL support is disabled");
447*4882a593Smuzhiyun #endif
448*4882a593Smuzhiyun } else {
449*4882a593Smuzhiyun fc->sb_flags &= ~SB_POSIXACL;
450*4882a593Smuzhiyun }
451*4882a593Smuzhiyun break;
452*4882a593Smuzhiyun case Opt_wsync:
453*4882a593Smuzhiyun if (!result.negated)
454*4882a593Smuzhiyun fsopt->flags &= ~CEPH_MOUNT_OPT_ASYNC_DIROPS;
455*4882a593Smuzhiyun else
456*4882a593Smuzhiyun fsopt->flags |= CEPH_MOUNT_OPT_ASYNC_DIROPS;
457*4882a593Smuzhiyun break;
458*4882a593Smuzhiyun default:
459*4882a593Smuzhiyun BUG();
460*4882a593Smuzhiyun }
461*4882a593Smuzhiyun return 0;
462*4882a593Smuzhiyun
463*4882a593Smuzhiyun out_of_range:
464*4882a593Smuzhiyun return invalfc(fc, "%s out of range", param->key);
465*4882a593Smuzhiyun }
466*4882a593Smuzhiyun
destroy_mount_options(struct ceph_mount_options * args)467*4882a593Smuzhiyun static void destroy_mount_options(struct ceph_mount_options *args)
468*4882a593Smuzhiyun {
469*4882a593Smuzhiyun dout("destroy_mount_options %p\n", args);
470*4882a593Smuzhiyun if (!args)
471*4882a593Smuzhiyun return;
472*4882a593Smuzhiyun
473*4882a593Smuzhiyun kfree(args->snapdir_name);
474*4882a593Smuzhiyun kfree(args->mds_namespace);
475*4882a593Smuzhiyun kfree(args->server_path);
476*4882a593Smuzhiyun kfree(args->fscache_uniq);
477*4882a593Smuzhiyun kfree(args);
478*4882a593Smuzhiyun }
479*4882a593Smuzhiyun
/*
 * strcmp_null - strcmp() that tolerates NULL arguments
 * @s1: first string, may be NULL
 * @s2: second string, may be NULL
 *
 * Returns 0 when both are NULL, -1 when only @s2 is NULL, 1 when only
 * @s1 is NULL, and strcmp(@s1, @s2) when both are set.
 */
static int strcmp_null(const char *s1, const char *s2)
{
	if (!s1 || !s2) {
		if (s1 == s2)	/* both NULL */
			return 0;
		return s1 ? -1 : 1;
	}
	return strcmp(s1, s2);
}
490*4882a593Smuzhiyun
compare_mount_options(struct ceph_mount_options * new_fsopt,struct ceph_options * new_opt,struct ceph_fs_client * fsc)491*4882a593Smuzhiyun static int compare_mount_options(struct ceph_mount_options *new_fsopt,
492*4882a593Smuzhiyun struct ceph_options *new_opt,
493*4882a593Smuzhiyun struct ceph_fs_client *fsc)
494*4882a593Smuzhiyun {
495*4882a593Smuzhiyun struct ceph_mount_options *fsopt1 = new_fsopt;
496*4882a593Smuzhiyun struct ceph_mount_options *fsopt2 = fsc->mount_options;
497*4882a593Smuzhiyun int ofs = offsetof(struct ceph_mount_options, snapdir_name);
498*4882a593Smuzhiyun int ret;
499*4882a593Smuzhiyun
500*4882a593Smuzhiyun ret = memcmp(fsopt1, fsopt2, ofs);
501*4882a593Smuzhiyun if (ret)
502*4882a593Smuzhiyun return ret;
503*4882a593Smuzhiyun
504*4882a593Smuzhiyun ret = strcmp_null(fsopt1->snapdir_name, fsopt2->snapdir_name);
505*4882a593Smuzhiyun if (ret)
506*4882a593Smuzhiyun return ret;
507*4882a593Smuzhiyun
508*4882a593Smuzhiyun ret = strcmp_null(fsopt1->mds_namespace, fsopt2->mds_namespace);
509*4882a593Smuzhiyun if (ret)
510*4882a593Smuzhiyun return ret;
511*4882a593Smuzhiyun
512*4882a593Smuzhiyun ret = strcmp_null(fsopt1->server_path, fsopt2->server_path);
513*4882a593Smuzhiyun if (ret)
514*4882a593Smuzhiyun return ret;
515*4882a593Smuzhiyun
516*4882a593Smuzhiyun ret = strcmp_null(fsopt1->fscache_uniq, fsopt2->fscache_uniq);
517*4882a593Smuzhiyun if (ret)
518*4882a593Smuzhiyun return ret;
519*4882a593Smuzhiyun
520*4882a593Smuzhiyun return ceph_compare_options(new_opt, fsc->client);
521*4882a593Smuzhiyun }
522*4882a593Smuzhiyun
523*4882a593Smuzhiyun /**
524*4882a593Smuzhiyun * ceph_show_options - Show mount options in /proc/mounts
525*4882a593Smuzhiyun * @m: seq_file to write to
526*4882a593Smuzhiyun * @root: root of that (sub)tree
527*4882a593Smuzhiyun */
ceph_show_options(struct seq_file * m,struct dentry * root)528*4882a593Smuzhiyun static int ceph_show_options(struct seq_file *m, struct dentry *root)
529*4882a593Smuzhiyun {
530*4882a593Smuzhiyun struct ceph_fs_client *fsc = ceph_sb_to_client(root->d_sb);
531*4882a593Smuzhiyun struct ceph_mount_options *fsopt = fsc->mount_options;
532*4882a593Smuzhiyun size_t pos;
533*4882a593Smuzhiyun int ret;
534*4882a593Smuzhiyun
535*4882a593Smuzhiyun /* a comma between MNT/MS and client options */
536*4882a593Smuzhiyun seq_putc(m, ',');
537*4882a593Smuzhiyun pos = m->count;
538*4882a593Smuzhiyun
539*4882a593Smuzhiyun ret = ceph_print_client_options(m, fsc->client, false);
540*4882a593Smuzhiyun if (ret)
541*4882a593Smuzhiyun return ret;
542*4882a593Smuzhiyun
543*4882a593Smuzhiyun /* retract our comma if no client options */
544*4882a593Smuzhiyun if (m->count == pos)
545*4882a593Smuzhiyun m->count--;
546*4882a593Smuzhiyun
547*4882a593Smuzhiyun if (fsopt->flags & CEPH_MOUNT_OPT_DIRSTAT)
548*4882a593Smuzhiyun seq_puts(m, ",dirstat");
549*4882a593Smuzhiyun if ((fsopt->flags & CEPH_MOUNT_OPT_RBYTES))
550*4882a593Smuzhiyun seq_puts(m, ",rbytes");
551*4882a593Smuzhiyun if (fsopt->flags & CEPH_MOUNT_OPT_NOASYNCREADDIR)
552*4882a593Smuzhiyun seq_puts(m, ",noasyncreaddir");
553*4882a593Smuzhiyun if ((fsopt->flags & CEPH_MOUNT_OPT_DCACHE) == 0)
554*4882a593Smuzhiyun seq_puts(m, ",nodcache");
555*4882a593Smuzhiyun if (fsopt->flags & CEPH_MOUNT_OPT_INO32)
556*4882a593Smuzhiyun seq_puts(m, ",ino32");
557*4882a593Smuzhiyun if (fsopt->flags & CEPH_MOUNT_OPT_FSCACHE) {
558*4882a593Smuzhiyun seq_show_option(m, "fsc", fsopt->fscache_uniq);
559*4882a593Smuzhiyun }
560*4882a593Smuzhiyun if (fsopt->flags & CEPH_MOUNT_OPT_NOPOOLPERM)
561*4882a593Smuzhiyun seq_puts(m, ",nopoolperm");
562*4882a593Smuzhiyun if (fsopt->flags & CEPH_MOUNT_OPT_NOQUOTADF)
563*4882a593Smuzhiyun seq_puts(m, ",noquotadf");
564*4882a593Smuzhiyun
565*4882a593Smuzhiyun #ifdef CONFIG_CEPH_FS_POSIX_ACL
566*4882a593Smuzhiyun if (root->d_sb->s_flags & SB_POSIXACL)
567*4882a593Smuzhiyun seq_puts(m, ",acl");
568*4882a593Smuzhiyun else
569*4882a593Smuzhiyun seq_puts(m, ",noacl");
570*4882a593Smuzhiyun #endif
571*4882a593Smuzhiyun
572*4882a593Smuzhiyun if ((fsopt->flags & CEPH_MOUNT_OPT_NOCOPYFROM) == 0)
573*4882a593Smuzhiyun seq_puts(m, ",copyfrom");
574*4882a593Smuzhiyun
575*4882a593Smuzhiyun if (fsopt->mds_namespace)
576*4882a593Smuzhiyun seq_show_option(m, "mds_namespace", fsopt->mds_namespace);
577*4882a593Smuzhiyun
578*4882a593Smuzhiyun if (fsopt->flags & CEPH_MOUNT_OPT_CLEANRECOVER)
579*4882a593Smuzhiyun seq_show_option(m, "recover_session", "clean");
580*4882a593Smuzhiyun
581*4882a593Smuzhiyun if (fsopt->flags & CEPH_MOUNT_OPT_ASYNC_DIROPS)
582*4882a593Smuzhiyun seq_puts(m, ",nowsync");
583*4882a593Smuzhiyun
584*4882a593Smuzhiyun if (fsopt->wsize != CEPH_MAX_WRITE_SIZE)
585*4882a593Smuzhiyun seq_printf(m, ",wsize=%u", fsopt->wsize);
586*4882a593Smuzhiyun if (fsopt->rsize != CEPH_MAX_READ_SIZE)
587*4882a593Smuzhiyun seq_printf(m, ",rsize=%u", fsopt->rsize);
588*4882a593Smuzhiyun if (fsopt->rasize != CEPH_RASIZE_DEFAULT)
589*4882a593Smuzhiyun seq_printf(m, ",rasize=%u", fsopt->rasize);
590*4882a593Smuzhiyun if (fsopt->congestion_kb != default_congestion_kb())
591*4882a593Smuzhiyun seq_printf(m, ",write_congestion_kb=%u", fsopt->congestion_kb);
592*4882a593Smuzhiyun if (fsopt->caps_max)
593*4882a593Smuzhiyun seq_printf(m, ",caps_max=%d", fsopt->caps_max);
594*4882a593Smuzhiyun if (fsopt->caps_wanted_delay_min != CEPH_CAPS_WANTED_DELAY_MIN_DEFAULT)
595*4882a593Smuzhiyun seq_printf(m, ",caps_wanted_delay_min=%u",
596*4882a593Smuzhiyun fsopt->caps_wanted_delay_min);
597*4882a593Smuzhiyun if (fsopt->caps_wanted_delay_max != CEPH_CAPS_WANTED_DELAY_MAX_DEFAULT)
598*4882a593Smuzhiyun seq_printf(m, ",caps_wanted_delay_max=%u",
599*4882a593Smuzhiyun fsopt->caps_wanted_delay_max);
600*4882a593Smuzhiyun if (fsopt->max_readdir != CEPH_MAX_READDIR_DEFAULT)
601*4882a593Smuzhiyun seq_printf(m, ",readdir_max_entries=%u", fsopt->max_readdir);
602*4882a593Smuzhiyun if (fsopt->max_readdir_bytes != CEPH_MAX_READDIR_BYTES_DEFAULT)
603*4882a593Smuzhiyun seq_printf(m, ",readdir_max_bytes=%u", fsopt->max_readdir_bytes);
604*4882a593Smuzhiyun if (strcmp(fsopt->snapdir_name, CEPH_SNAPDIRNAME_DEFAULT))
605*4882a593Smuzhiyun seq_show_option(m, "snapdirname", fsopt->snapdir_name);
606*4882a593Smuzhiyun
607*4882a593Smuzhiyun return 0;
608*4882a593Smuzhiyun }
609*4882a593Smuzhiyun
610*4882a593Smuzhiyun /*
611*4882a593Smuzhiyun * handle any mon messages the standard library doesn't understand.
612*4882a593Smuzhiyun * return error if we don't either.
613*4882a593Smuzhiyun */
extra_mon_dispatch(struct ceph_client * client,struct ceph_msg * msg)614*4882a593Smuzhiyun static int extra_mon_dispatch(struct ceph_client *client, struct ceph_msg *msg)
615*4882a593Smuzhiyun {
616*4882a593Smuzhiyun struct ceph_fs_client *fsc = client->private;
617*4882a593Smuzhiyun int type = le16_to_cpu(msg->hdr.type);
618*4882a593Smuzhiyun
619*4882a593Smuzhiyun switch (type) {
620*4882a593Smuzhiyun case CEPH_MSG_MDS_MAP:
621*4882a593Smuzhiyun ceph_mdsc_handle_mdsmap(fsc->mdsc, msg);
622*4882a593Smuzhiyun return 0;
623*4882a593Smuzhiyun case CEPH_MSG_FS_MAP_USER:
624*4882a593Smuzhiyun ceph_mdsc_handle_fsmap(fsc->mdsc, msg);
625*4882a593Smuzhiyun return 0;
626*4882a593Smuzhiyun default:
627*4882a593Smuzhiyun return -1;
628*4882a593Smuzhiyun }
629*4882a593Smuzhiyun }
630*4882a593Smuzhiyun
631*4882a593Smuzhiyun /*
632*4882a593Smuzhiyun * create a new fs client
633*4882a593Smuzhiyun *
634*4882a593Smuzhiyun * Success or not, this function consumes @fsopt and @opt.
635*4882a593Smuzhiyun */
create_fs_client(struct ceph_mount_options * fsopt,struct ceph_options * opt)636*4882a593Smuzhiyun static struct ceph_fs_client *create_fs_client(struct ceph_mount_options *fsopt,
637*4882a593Smuzhiyun struct ceph_options *opt)
638*4882a593Smuzhiyun {
639*4882a593Smuzhiyun struct ceph_fs_client *fsc;
640*4882a593Smuzhiyun int err;
641*4882a593Smuzhiyun
642*4882a593Smuzhiyun fsc = kzalloc(sizeof(*fsc), GFP_KERNEL);
643*4882a593Smuzhiyun if (!fsc) {
644*4882a593Smuzhiyun err = -ENOMEM;
645*4882a593Smuzhiyun goto fail;
646*4882a593Smuzhiyun }
647*4882a593Smuzhiyun
648*4882a593Smuzhiyun fsc->client = ceph_create_client(opt, fsc);
649*4882a593Smuzhiyun if (IS_ERR(fsc->client)) {
650*4882a593Smuzhiyun err = PTR_ERR(fsc->client);
651*4882a593Smuzhiyun goto fail;
652*4882a593Smuzhiyun }
653*4882a593Smuzhiyun opt = NULL; /* fsc->client now owns this */
654*4882a593Smuzhiyun
655*4882a593Smuzhiyun fsc->client->extra_mon_dispatch = extra_mon_dispatch;
656*4882a593Smuzhiyun ceph_set_opt(fsc->client, ABORT_ON_FULL);
657*4882a593Smuzhiyun
658*4882a593Smuzhiyun if (!fsopt->mds_namespace) {
659*4882a593Smuzhiyun ceph_monc_want_map(&fsc->client->monc, CEPH_SUB_MDSMAP,
660*4882a593Smuzhiyun 0, true);
661*4882a593Smuzhiyun } else {
662*4882a593Smuzhiyun ceph_monc_want_map(&fsc->client->monc, CEPH_SUB_FSMAP,
663*4882a593Smuzhiyun 0, false);
664*4882a593Smuzhiyun }
665*4882a593Smuzhiyun
666*4882a593Smuzhiyun fsc->mount_options = fsopt;
667*4882a593Smuzhiyun
668*4882a593Smuzhiyun fsc->sb = NULL;
669*4882a593Smuzhiyun fsc->mount_state = CEPH_MOUNT_MOUNTING;
670*4882a593Smuzhiyun fsc->filp_gen = 1;
671*4882a593Smuzhiyun fsc->have_copy_from2 = true;
672*4882a593Smuzhiyun
673*4882a593Smuzhiyun atomic_long_set(&fsc->writeback_count, 0);
674*4882a593Smuzhiyun
675*4882a593Smuzhiyun err = -ENOMEM;
676*4882a593Smuzhiyun /*
677*4882a593Smuzhiyun * The number of concurrent works can be high but they don't need
678*4882a593Smuzhiyun * to be processed in parallel, limit concurrency.
679*4882a593Smuzhiyun */
680*4882a593Smuzhiyun fsc->inode_wq = alloc_workqueue("ceph-inode", WQ_UNBOUND, 0);
681*4882a593Smuzhiyun if (!fsc->inode_wq)
682*4882a593Smuzhiyun goto fail_client;
683*4882a593Smuzhiyun fsc->cap_wq = alloc_workqueue("ceph-cap", 0, 1);
684*4882a593Smuzhiyun if (!fsc->cap_wq)
685*4882a593Smuzhiyun goto fail_inode_wq;
686*4882a593Smuzhiyun
687*4882a593Smuzhiyun spin_lock(&ceph_fsc_lock);
688*4882a593Smuzhiyun list_add_tail(&fsc->metric_wakeup, &ceph_fsc_list);
689*4882a593Smuzhiyun spin_unlock(&ceph_fsc_lock);
690*4882a593Smuzhiyun
691*4882a593Smuzhiyun return fsc;
692*4882a593Smuzhiyun
693*4882a593Smuzhiyun fail_inode_wq:
694*4882a593Smuzhiyun destroy_workqueue(fsc->inode_wq);
695*4882a593Smuzhiyun fail_client:
696*4882a593Smuzhiyun ceph_destroy_client(fsc->client);
697*4882a593Smuzhiyun fail:
698*4882a593Smuzhiyun kfree(fsc);
699*4882a593Smuzhiyun if (opt)
700*4882a593Smuzhiyun ceph_destroy_options(opt);
701*4882a593Smuzhiyun destroy_mount_options(fsopt);
702*4882a593Smuzhiyun return ERR_PTR(err);
703*4882a593Smuzhiyun }
704*4882a593Smuzhiyun
flush_fs_workqueues(struct ceph_fs_client * fsc)705*4882a593Smuzhiyun static void flush_fs_workqueues(struct ceph_fs_client *fsc)
706*4882a593Smuzhiyun {
707*4882a593Smuzhiyun flush_workqueue(fsc->inode_wq);
708*4882a593Smuzhiyun flush_workqueue(fsc->cap_wq);
709*4882a593Smuzhiyun }
710*4882a593Smuzhiyun
destroy_fs_client(struct ceph_fs_client * fsc)711*4882a593Smuzhiyun static void destroy_fs_client(struct ceph_fs_client *fsc)
712*4882a593Smuzhiyun {
713*4882a593Smuzhiyun dout("destroy_fs_client %p\n", fsc);
714*4882a593Smuzhiyun
715*4882a593Smuzhiyun spin_lock(&ceph_fsc_lock);
716*4882a593Smuzhiyun list_del(&fsc->metric_wakeup);
717*4882a593Smuzhiyun spin_unlock(&ceph_fsc_lock);
718*4882a593Smuzhiyun
719*4882a593Smuzhiyun ceph_mdsc_destroy(fsc);
720*4882a593Smuzhiyun destroy_workqueue(fsc->inode_wq);
721*4882a593Smuzhiyun destroy_workqueue(fsc->cap_wq);
722*4882a593Smuzhiyun
723*4882a593Smuzhiyun destroy_mount_options(fsc->mount_options);
724*4882a593Smuzhiyun
725*4882a593Smuzhiyun ceph_destroy_client(fsc->client);
726*4882a593Smuzhiyun
727*4882a593Smuzhiyun kfree(fsc);
728*4882a593Smuzhiyun dout("destroy_fs_client %p done\n", fsc);
729*4882a593Smuzhiyun }
730*4882a593Smuzhiyun
731*4882a593Smuzhiyun /*
732*4882a593Smuzhiyun * caches
733*4882a593Smuzhiyun */
734*4882a593Smuzhiyun struct kmem_cache *ceph_inode_cachep;
735*4882a593Smuzhiyun struct kmem_cache *ceph_cap_cachep;
736*4882a593Smuzhiyun struct kmem_cache *ceph_cap_flush_cachep;
737*4882a593Smuzhiyun struct kmem_cache *ceph_dentry_cachep;
738*4882a593Smuzhiyun struct kmem_cache *ceph_file_cachep;
739*4882a593Smuzhiyun struct kmem_cache *ceph_dir_file_cachep;
740*4882a593Smuzhiyun struct kmem_cache *ceph_mds_request_cachep;
741*4882a593Smuzhiyun mempool_t *ceph_wb_pagevec_pool;
742*4882a593Smuzhiyun
ceph_inode_init_once(void * foo)743*4882a593Smuzhiyun static void ceph_inode_init_once(void *foo)
744*4882a593Smuzhiyun {
745*4882a593Smuzhiyun struct ceph_inode_info *ci = foo;
746*4882a593Smuzhiyun inode_init_once(&ci->vfs_inode);
747*4882a593Smuzhiyun }
748*4882a593Smuzhiyun
init_caches(void)749*4882a593Smuzhiyun static int __init init_caches(void)
750*4882a593Smuzhiyun {
751*4882a593Smuzhiyun int error = -ENOMEM;
752*4882a593Smuzhiyun
753*4882a593Smuzhiyun ceph_inode_cachep = kmem_cache_create("ceph_inode_info",
754*4882a593Smuzhiyun sizeof(struct ceph_inode_info),
755*4882a593Smuzhiyun __alignof__(struct ceph_inode_info),
756*4882a593Smuzhiyun SLAB_RECLAIM_ACCOUNT|SLAB_MEM_SPREAD|
757*4882a593Smuzhiyun SLAB_ACCOUNT, ceph_inode_init_once);
758*4882a593Smuzhiyun if (!ceph_inode_cachep)
759*4882a593Smuzhiyun return -ENOMEM;
760*4882a593Smuzhiyun
761*4882a593Smuzhiyun ceph_cap_cachep = KMEM_CACHE(ceph_cap, SLAB_MEM_SPREAD);
762*4882a593Smuzhiyun if (!ceph_cap_cachep)
763*4882a593Smuzhiyun goto bad_cap;
764*4882a593Smuzhiyun ceph_cap_flush_cachep = KMEM_CACHE(ceph_cap_flush,
765*4882a593Smuzhiyun SLAB_RECLAIM_ACCOUNT|SLAB_MEM_SPREAD);
766*4882a593Smuzhiyun if (!ceph_cap_flush_cachep)
767*4882a593Smuzhiyun goto bad_cap_flush;
768*4882a593Smuzhiyun
769*4882a593Smuzhiyun ceph_dentry_cachep = KMEM_CACHE(ceph_dentry_info,
770*4882a593Smuzhiyun SLAB_RECLAIM_ACCOUNT|SLAB_MEM_SPREAD);
771*4882a593Smuzhiyun if (!ceph_dentry_cachep)
772*4882a593Smuzhiyun goto bad_dentry;
773*4882a593Smuzhiyun
774*4882a593Smuzhiyun ceph_file_cachep = KMEM_CACHE(ceph_file_info, SLAB_MEM_SPREAD);
775*4882a593Smuzhiyun if (!ceph_file_cachep)
776*4882a593Smuzhiyun goto bad_file;
777*4882a593Smuzhiyun
778*4882a593Smuzhiyun ceph_dir_file_cachep = KMEM_CACHE(ceph_dir_file_info, SLAB_MEM_SPREAD);
779*4882a593Smuzhiyun if (!ceph_dir_file_cachep)
780*4882a593Smuzhiyun goto bad_dir_file;
781*4882a593Smuzhiyun
782*4882a593Smuzhiyun ceph_mds_request_cachep = KMEM_CACHE(ceph_mds_request, SLAB_MEM_SPREAD);
783*4882a593Smuzhiyun if (!ceph_mds_request_cachep)
784*4882a593Smuzhiyun goto bad_mds_req;
785*4882a593Smuzhiyun
786*4882a593Smuzhiyun ceph_wb_pagevec_pool = mempool_create_kmalloc_pool(10, CEPH_MAX_WRITE_SIZE >> PAGE_SHIFT);
787*4882a593Smuzhiyun if (!ceph_wb_pagevec_pool)
788*4882a593Smuzhiyun goto bad_pagevec_pool;
789*4882a593Smuzhiyun
790*4882a593Smuzhiyun error = ceph_fscache_register();
791*4882a593Smuzhiyun if (error)
792*4882a593Smuzhiyun goto bad_fscache;
793*4882a593Smuzhiyun
794*4882a593Smuzhiyun return 0;
795*4882a593Smuzhiyun
796*4882a593Smuzhiyun bad_fscache:
797*4882a593Smuzhiyun kmem_cache_destroy(ceph_mds_request_cachep);
798*4882a593Smuzhiyun bad_pagevec_pool:
799*4882a593Smuzhiyun mempool_destroy(ceph_wb_pagevec_pool);
800*4882a593Smuzhiyun bad_mds_req:
801*4882a593Smuzhiyun kmem_cache_destroy(ceph_dir_file_cachep);
802*4882a593Smuzhiyun bad_dir_file:
803*4882a593Smuzhiyun kmem_cache_destroy(ceph_file_cachep);
804*4882a593Smuzhiyun bad_file:
805*4882a593Smuzhiyun kmem_cache_destroy(ceph_dentry_cachep);
806*4882a593Smuzhiyun bad_dentry:
807*4882a593Smuzhiyun kmem_cache_destroy(ceph_cap_flush_cachep);
808*4882a593Smuzhiyun bad_cap_flush:
809*4882a593Smuzhiyun kmem_cache_destroy(ceph_cap_cachep);
810*4882a593Smuzhiyun bad_cap:
811*4882a593Smuzhiyun kmem_cache_destroy(ceph_inode_cachep);
812*4882a593Smuzhiyun return error;
813*4882a593Smuzhiyun }
814*4882a593Smuzhiyun
destroy_caches(void)815*4882a593Smuzhiyun static void destroy_caches(void)
816*4882a593Smuzhiyun {
817*4882a593Smuzhiyun /*
818*4882a593Smuzhiyun * Make sure all delayed rcu free inodes are flushed before we
819*4882a593Smuzhiyun * destroy cache.
820*4882a593Smuzhiyun */
821*4882a593Smuzhiyun rcu_barrier();
822*4882a593Smuzhiyun
823*4882a593Smuzhiyun kmem_cache_destroy(ceph_inode_cachep);
824*4882a593Smuzhiyun kmem_cache_destroy(ceph_cap_cachep);
825*4882a593Smuzhiyun kmem_cache_destroy(ceph_cap_flush_cachep);
826*4882a593Smuzhiyun kmem_cache_destroy(ceph_dentry_cachep);
827*4882a593Smuzhiyun kmem_cache_destroy(ceph_file_cachep);
828*4882a593Smuzhiyun kmem_cache_destroy(ceph_dir_file_cachep);
829*4882a593Smuzhiyun kmem_cache_destroy(ceph_mds_request_cachep);
830*4882a593Smuzhiyun mempool_destroy(ceph_wb_pagevec_pool);
831*4882a593Smuzhiyun
832*4882a593Smuzhiyun ceph_fscache_unregister();
833*4882a593Smuzhiyun }
834*4882a593Smuzhiyun
835*4882a593Smuzhiyun /*
836*4882a593Smuzhiyun * ceph_umount_begin - initiate forced umount. Tear down the
837*4882a593Smuzhiyun * mount, skipping steps that may hang while waiting for server(s).
838*4882a593Smuzhiyun */
ceph_umount_begin(struct super_block * sb)839*4882a593Smuzhiyun static void ceph_umount_begin(struct super_block *sb)
840*4882a593Smuzhiyun {
841*4882a593Smuzhiyun struct ceph_fs_client *fsc = ceph_sb_to_client(sb);
842*4882a593Smuzhiyun
843*4882a593Smuzhiyun dout("ceph_umount_begin - starting forced umount\n");
844*4882a593Smuzhiyun if (!fsc)
845*4882a593Smuzhiyun return;
846*4882a593Smuzhiyun fsc->mount_state = CEPH_MOUNT_SHUTDOWN;
847*4882a593Smuzhiyun ceph_osdc_abort_requests(&fsc->client->osdc, -EIO);
848*4882a593Smuzhiyun ceph_mdsc_force_umount(fsc->mdsc);
849*4882a593Smuzhiyun fsc->filp_gen++; // invalidate open files
850*4882a593Smuzhiyun }
851*4882a593Smuzhiyun
852*4882a593Smuzhiyun static const struct super_operations ceph_super_ops = {
853*4882a593Smuzhiyun .alloc_inode = ceph_alloc_inode,
854*4882a593Smuzhiyun .free_inode = ceph_free_inode,
855*4882a593Smuzhiyun .write_inode = ceph_write_inode,
856*4882a593Smuzhiyun .drop_inode = generic_delete_inode,
857*4882a593Smuzhiyun .evict_inode = ceph_evict_inode,
858*4882a593Smuzhiyun .sync_fs = ceph_sync_fs,
859*4882a593Smuzhiyun .put_super = ceph_put_super,
860*4882a593Smuzhiyun .show_options = ceph_show_options,
861*4882a593Smuzhiyun .statfs = ceph_statfs,
862*4882a593Smuzhiyun .umount_begin = ceph_umount_begin,
863*4882a593Smuzhiyun };
864*4882a593Smuzhiyun
865*4882a593Smuzhiyun /*
866*4882a593Smuzhiyun * Bootstrap mount by opening the root directory. Note the mount
867*4882a593Smuzhiyun * @started time from caller, and time out if this takes too long.
868*4882a593Smuzhiyun */
open_root_dentry(struct ceph_fs_client * fsc,const char * path,unsigned long started)869*4882a593Smuzhiyun static struct dentry *open_root_dentry(struct ceph_fs_client *fsc,
870*4882a593Smuzhiyun const char *path,
871*4882a593Smuzhiyun unsigned long started)
872*4882a593Smuzhiyun {
873*4882a593Smuzhiyun struct ceph_mds_client *mdsc = fsc->mdsc;
874*4882a593Smuzhiyun struct ceph_mds_request *req = NULL;
875*4882a593Smuzhiyun int err;
876*4882a593Smuzhiyun struct dentry *root;
877*4882a593Smuzhiyun
878*4882a593Smuzhiyun /* open dir */
879*4882a593Smuzhiyun dout("open_root_inode opening '%s'\n", path);
880*4882a593Smuzhiyun req = ceph_mdsc_create_request(mdsc, CEPH_MDS_OP_GETATTR, USE_ANY_MDS);
881*4882a593Smuzhiyun if (IS_ERR(req))
882*4882a593Smuzhiyun return ERR_CAST(req);
883*4882a593Smuzhiyun req->r_path1 = kstrdup(path, GFP_NOFS);
884*4882a593Smuzhiyun if (!req->r_path1) {
885*4882a593Smuzhiyun root = ERR_PTR(-ENOMEM);
886*4882a593Smuzhiyun goto out;
887*4882a593Smuzhiyun }
888*4882a593Smuzhiyun
889*4882a593Smuzhiyun req->r_ino1.ino = CEPH_INO_ROOT;
890*4882a593Smuzhiyun req->r_ino1.snap = CEPH_NOSNAP;
891*4882a593Smuzhiyun req->r_started = started;
892*4882a593Smuzhiyun req->r_timeout = fsc->client->options->mount_timeout;
893*4882a593Smuzhiyun req->r_args.getattr.mask = cpu_to_le32(CEPH_STAT_CAP_INODE);
894*4882a593Smuzhiyun req->r_num_caps = 2;
895*4882a593Smuzhiyun err = ceph_mdsc_do_request(mdsc, NULL, req);
896*4882a593Smuzhiyun if (err == 0) {
897*4882a593Smuzhiyun struct inode *inode = req->r_target_inode;
898*4882a593Smuzhiyun req->r_target_inode = NULL;
899*4882a593Smuzhiyun dout("open_root_inode success\n");
900*4882a593Smuzhiyun root = d_make_root(inode);
901*4882a593Smuzhiyun if (!root) {
902*4882a593Smuzhiyun root = ERR_PTR(-ENOMEM);
903*4882a593Smuzhiyun goto out;
904*4882a593Smuzhiyun }
905*4882a593Smuzhiyun dout("open_root_inode success, root dentry is %p\n", root);
906*4882a593Smuzhiyun } else {
907*4882a593Smuzhiyun root = ERR_PTR(err);
908*4882a593Smuzhiyun }
909*4882a593Smuzhiyun out:
910*4882a593Smuzhiyun ceph_mdsc_put_request(req);
911*4882a593Smuzhiyun return root;
912*4882a593Smuzhiyun }
913*4882a593Smuzhiyun
914*4882a593Smuzhiyun /*
915*4882a593Smuzhiyun * mount: join the ceph cluster, and open root directory.
916*4882a593Smuzhiyun */
ceph_real_mount(struct ceph_fs_client * fsc,struct fs_context * fc)917*4882a593Smuzhiyun static struct dentry *ceph_real_mount(struct ceph_fs_client *fsc,
918*4882a593Smuzhiyun struct fs_context *fc)
919*4882a593Smuzhiyun {
920*4882a593Smuzhiyun int err;
921*4882a593Smuzhiyun unsigned long started = jiffies; /* note the start time */
922*4882a593Smuzhiyun struct dentry *root;
923*4882a593Smuzhiyun
924*4882a593Smuzhiyun dout("mount start %p\n", fsc);
925*4882a593Smuzhiyun mutex_lock(&fsc->client->mount_mutex);
926*4882a593Smuzhiyun
927*4882a593Smuzhiyun if (!fsc->sb->s_root) {
928*4882a593Smuzhiyun const char *path = fsc->mount_options->server_path ?
929*4882a593Smuzhiyun fsc->mount_options->server_path + 1 : "";
930*4882a593Smuzhiyun
931*4882a593Smuzhiyun err = __ceph_open_session(fsc->client, started);
932*4882a593Smuzhiyun if (err < 0)
933*4882a593Smuzhiyun goto out;
934*4882a593Smuzhiyun
935*4882a593Smuzhiyun /* setup fscache */
936*4882a593Smuzhiyun if (fsc->mount_options->flags & CEPH_MOUNT_OPT_FSCACHE) {
937*4882a593Smuzhiyun err = ceph_fscache_register_fs(fsc, fc);
938*4882a593Smuzhiyun if (err < 0)
939*4882a593Smuzhiyun goto out;
940*4882a593Smuzhiyun }
941*4882a593Smuzhiyun
942*4882a593Smuzhiyun dout("mount opening path '%s'\n", path);
943*4882a593Smuzhiyun
944*4882a593Smuzhiyun ceph_fs_debugfs_init(fsc);
945*4882a593Smuzhiyun
946*4882a593Smuzhiyun root = open_root_dentry(fsc, path, started);
947*4882a593Smuzhiyun if (IS_ERR(root)) {
948*4882a593Smuzhiyun err = PTR_ERR(root);
949*4882a593Smuzhiyun goto out;
950*4882a593Smuzhiyun }
951*4882a593Smuzhiyun fsc->sb->s_root = dget(root);
952*4882a593Smuzhiyun } else {
953*4882a593Smuzhiyun root = dget(fsc->sb->s_root);
954*4882a593Smuzhiyun }
955*4882a593Smuzhiyun
956*4882a593Smuzhiyun fsc->mount_state = CEPH_MOUNT_MOUNTED;
957*4882a593Smuzhiyun dout("mount success\n");
958*4882a593Smuzhiyun mutex_unlock(&fsc->client->mount_mutex);
959*4882a593Smuzhiyun return root;
960*4882a593Smuzhiyun
961*4882a593Smuzhiyun out:
962*4882a593Smuzhiyun mutex_unlock(&fsc->client->mount_mutex);
963*4882a593Smuzhiyun return ERR_PTR(err);
964*4882a593Smuzhiyun }
965*4882a593Smuzhiyun
ceph_set_super(struct super_block * s,struct fs_context * fc)966*4882a593Smuzhiyun static int ceph_set_super(struct super_block *s, struct fs_context *fc)
967*4882a593Smuzhiyun {
968*4882a593Smuzhiyun struct ceph_fs_client *fsc = s->s_fs_info;
969*4882a593Smuzhiyun int ret;
970*4882a593Smuzhiyun
971*4882a593Smuzhiyun dout("set_super %p\n", s);
972*4882a593Smuzhiyun
973*4882a593Smuzhiyun s->s_maxbytes = MAX_LFS_FILESIZE;
974*4882a593Smuzhiyun
975*4882a593Smuzhiyun s->s_xattr = ceph_xattr_handlers;
976*4882a593Smuzhiyun fsc->sb = s;
977*4882a593Smuzhiyun fsc->max_file_size = 1ULL << 40; /* temp value until we get mdsmap */
978*4882a593Smuzhiyun
979*4882a593Smuzhiyun s->s_op = &ceph_super_ops;
980*4882a593Smuzhiyun s->s_d_op = &ceph_dentry_ops;
981*4882a593Smuzhiyun s->s_export_op = &ceph_export_ops;
982*4882a593Smuzhiyun
983*4882a593Smuzhiyun s->s_time_gran = 1;
984*4882a593Smuzhiyun s->s_time_min = 0;
985*4882a593Smuzhiyun s->s_time_max = U32_MAX;
986*4882a593Smuzhiyun
987*4882a593Smuzhiyun ret = set_anon_super_fc(s, fc);
988*4882a593Smuzhiyun if (ret != 0)
989*4882a593Smuzhiyun fsc->sb = NULL;
990*4882a593Smuzhiyun return ret;
991*4882a593Smuzhiyun }
992*4882a593Smuzhiyun
993*4882a593Smuzhiyun /*
994*4882a593Smuzhiyun * share superblock if same fs AND options
995*4882a593Smuzhiyun */
ceph_compare_super(struct super_block * sb,struct fs_context * fc)996*4882a593Smuzhiyun static int ceph_compare_super(struct super_block *sb, struct fs_context *fc)
997*4882a593Smuzhiyun {
998*4882a593Smuzhiyun struct ceph_fs_client *new = fc->s_fs_info;
999*4882a593Smuzhiyun struct ceph_mount_options *fsopt = new->mount_options;
1000*4882a593Smuzhiyun struct ceph_options *opt = new->client->options;
1001*4882a593Smuzhiyun struct ceph_fs_client *fsc = ceph_sb_to_client(sb);
1002*4882a593Smuzhiyun
1003*4882a593Smuzhiyun dout("ceph_compare_super %p\n", sb);
1004*4882a593Smuzhiyun
1005*4882a593Smuzhiyun if (compare_mount_options(fsopt, opt, fsc)) {
1006*4882a593Smuzhiyun dout("monitor(s)/mount options don't match\n");
1007*4882a593Smuzhiyun return 0;
1008*4882a593Smuzhiyun }
1009*4882a593Smuzhiyun if ((opt->flags & CEPH_OPT_FSID) &&
1010*4882a593Smuzhiyun ceph_fsid_compare(&opt->fsid, &fsc->client->fsid)) {
1011*4882a593Smuzhiyun dout("fsid doesn't match\n");
1012*4882a593Smuzhiyun return 0;
1013*4882a593Smuzhiyun }
1014*4882a593Smuzhiyun if (fc->sb_flags != (sb->s_flags & ~SB_BORN)) {
1015*4882a593Smuzhiyun dout("flags differ\n");
1016*4882a593Smuzhiyun return 0;
1017*4882a593Smuzhiyun }
1018*4882a593Smuzhiyun
1019*4882a593Smuzhiyun if (fsc->blocklisted && !ceph_test_mount_opt(fsc, CLEANRECOVER)) {
1020*4882a593Smuzhiyun dout("client is blocklisted (and CLEANRECOVER is not set)\n");
1021*4882a593Smuzhiyun return 0;
1022*4882a593Smuzhiyun }
1023*4882a593Smuzhiyun
1024*4882a593Smuzhiyun if (fsc->mount_state == CEPH_MOUNT_SHUTDOWN) {
1025*4882a593Smuzhiyun dout("client has been forcibly unmounted\n");
1026*4882a593Smuzhiyun return 0;
1027*4882a593Smuzhiyun }
1028*4882a593Smuzhiyun
1029*4882a593Smuzhiyun return 1;
1030*4882a593Smuzhiyun }
1031*4882a593Smuzhiyun
1032*4882a593Smuzhiyun /*
1033*4882a593Smuzhiyun * construct our own bdi so we can control readahead, etc.
1034*4882a593Smuzhiyun */
1035*4882a593Smuzhiyun static atomic_long_t bdi_seq = ATOMIC_LONG_INIT(0);
1036*4882a593Smuzhiyun
ceph_setup_bdi(struct super_block * sb,struct ceph_fs_client * fsc)1037*4882a593Smuzhiyun static int ceph_setup_bdi(struct super_block *sb, struct ceph_fs_client *fsc)
1038*4882a593Smuzhiyun {
1039*4882a593Smuzhiyun int err;
1040*4882a593Smuzhiyun
1041*4882a593Smuzhiyun err = super_setup_bdi_name(sb, "ceph-%ld",
1042*4882a593Smuzhiyun atomic_long_inc_return(&bdi_seq));
1043*4882a593Smuzhiyun if (err)
1044*4882a593Smuzhiyun return err;
1045*4882a593Smuzhiyun
1046*4882a593Smuzhiyun /* set ra_pages based on rasize mount option? */
1047*4882a593Smuzhiyun sb->s_bdi->ra_pages = fsc->mount_options->rasize >> PAGE_SHIFT;
1048*4882a593Smuzhiyun
1049*4882a593Smuzhiyun /* set io_pages based on max osd read size */
1050*4882a593Smuzhiyun sb->s_bdi->io_pages = fsc->mount_options->rsize >> PAGE_SHIFT;
1051*4882a593Smuzhiyun
1052*4882a593Smuzhiyun return 0;
1053*4882a593Smuzhiyun }
1054*4882a593Smuzhiyun
ceph_get_tree(struct fs_context * fc)1055*4882a593Smuzhiyun static int ceph_get_tree(struct fs_context *fc)
1056*4882a593Smuzhiyun {
1057*4882a593Smuzhiyun struct ceph_parse_opts_ctx *pctx = fc->fs_private;
1058*4882a593Smuzhiyun struct super_block *sb;
1059*4882a593Smuzhiyun struct ceph_fs_client *fsc;
1060*4882a593Smuzhiyun struct dentry *res;
1061*4882a593Smuzhiyun int (*compare_super)(struct super_block *, struct fs_context *) =
1062*4882a593Smuzhiyun ceph_compare_super;
1063*4882a593Smuzhiyun int err;
1064*4882a593Smuzhiyun
1065*4882a593Smuzhiyun dout("ceph_get_tree\n");
1066*4882a593Smuzhiyun
1067*4882a593Smuzhiyun if (!fc->source)
1068*4882a593Smuzhiyun return invalfc(fc, "No source");
1069*4882a593Smuzhiyun
1070*4882a593Smuzhiyun /* create client (which we may/may not use) */
1071*4882a593Smuzhiyun fsc = create_fs_client(pctx->opts, pctx->copts);
1072*4882a593Smuzhiyun pctx->opts = NULL;
1073*4882a593Smuzhiyun pctx->copts = NULL;
1074*4882a593Smuzhiyun if (IS_ERR(fsc)) {
1075*4882a593Smuzhiyun err = PTR_ERR(fsc);
1076*4882a593Smuzhiyun goto out_final;
1077*4882a593Smuzhiyun }
1078*4882a593Smuzhiyun
1079*4882a593Smuzhiyun err = ceph_mdsc_init(fsc);
1080*4882a593Smuzhiyun if (err < 0)
1081*4882a593Smuzhiyun goto out;
1082*4882a593Smuzhiyun
1083*4882a593Smuzhiyun if (ceph_test_opt(fsc->client, NOSHARE))
1084*4882a593Smuzhiyun compare_super = NULL;
1085*4882a593Smuzhiyun
1086*4882a593Smuzhiyun fc->s_fs_info = fsc;
1087*4882a593Smuzhiyun sb = sget_fc(fc, compare_super, ceph_set_super);
1088*4882a593Smuzhiyun fc->s_fs_info = NULL;
1089*4882a593Smuzhiyun if (IS_ERR(sb)) {
1090*4882a593Smuzhiyun err = PTR_ERR(sb);
1091*4882a593Smuzhiyun goto out;
1092*4882a593Smuzhiyun }
1093*4882a593Smuzhiyun
1094*4882a593Smuzhiyun if (ceph_sb_to_client(sb) != fsc) {
1095*4882a593Smuzhiyun destroy_fs_client(fsc);
1096*4882a593Smuzhiyun fsc = ceph_sb_to_client(sb);
1097*4882a593Smuzhiyun dout("get_sb got existing client %p\n", fsc);
1098*4882a593Smuzhiyun } else {
1099*4882a593Smuzhiyun dout("get_sb using new client %p\n", fsc);
1100*4882a593Smuzhiyun err = ceph_setup_bdi(sb, fsc);
1101*4882a593Smuzhiyun if (err < 0)
1102*4882a593Smuzhiyun goto out_splat;
1103*4882a593Smuzhiyun }
1104*4882a593Smuzhiyun
1105*4882a593Smuzhiyun res = ceph_real_mount(fsc, fc);
1106*4882a593Smuzhiyun if (IS_ERR(res)) {
1107*4882a593Smuzhiyun err = PTR_ERR(res);
1108*4882a593Smuzhiyun goto out_splat;
1109*4882a593Smuzhiyun }
1110*4882a593Smuzhiyun dout("root %p inode %p ino %llx.%llx\n", res,
1111*4882a593Smuzhiyun d_inode(res), ceph_vinop(d_inode(res)));
1112*4882a593Smuzhiyun fc->root = fsc->sb->s_root;
1113*4882a593Smuzhiyun return 0;
1114*4882a593Smuzhiyun
1115*4882a593Smuzhiyun out_splat:
1116*4882a593Smuzhiyun if (!ceph_mdsmap_is_cluster_available(fsc->mdsc->mdsmap)) {
1117*4882a593Smuzhiyun pr_info("No mds server is up or the cluster is laggy\n");
1118*4882a593Smuzhiyun err = -EHOSTUNREACH;
1119*4882a593Smuzhiyun }
1120*4882a593Smuzhiyun
1121*4882a593Smuzhiyun ceph_mdsc_close_sessions(fsc->mdsc);
1122*4882a593Smuzhiyun deactivate_locked_super(sb);
1123*4882a593Smuzhiyun goto out_final;
1124*4882a593Smuzhiyun
1125*4882a593Smuzhiyun out:
1126*4882a593Smuzhiyun destroy_fs_client(fsc);
1127*4882a593Smuzhiyun out_final:
1128*4882a593Smuzhiyun dout("ceph_get_tree fail %d\n", err);
1129*4882a593Smuzhiyun return err;
1130*4882a593Smuzhiyun }
1131*4882a593Smuzhiyun
ceph_free_fc(struct fs_context * fc)1132*4882a593Smuzhiyun static void ceph_free_fc(struct fs_context *fc)
1133*4882a593Smuzhiyun {
1134*4882a593Smuzhiyun struct ceph_parse_opts_ctx *pctx = fc->fs_private;
1135*4882a593Smuzhiyun
1136*4882a593Smuzhiyun if (pctx) {
1137*4882a593Smuzhiyun destroy_mount_options(pctx->opts);
1138*4882a593Smuzhiyun ceph_destroy_options(pctx->copts);
1139*4882a593Smuzhiyun kfree(pctx);
1140*4882a593Smuzhiyun }
1141*4882a593Smuzhiyun }
1142*4882a593Smuzhiyun
ceph_reconfigure_fc(struct fs_context * fc)1143*4882a593Smuzhiyun static int ceph_reconfigure_fc(struct fs_context *fc)
1144*4882a593Smuzhiyun {
1145*4882a593Smuzhiyun struct ceph_parse_opts_ctx *pctx = fc->fs_private;
1146*4882a593Smuzhiyun struct ceph_mount_options *fsopt = pctx->opts;
1147*4882a593Smuzhiyun struct ceph_fs_client *fsc = ceph_sb_to_client(fc->root->d_sb);
1148*4882a593Smuzhiyun
1149*4882a593Smuzhiyun if (fsopt->flags & CEPH_MOUNT_OPT_ASYNC_DIROPS)
1150*4882a593Smuzhiyun ceph_set_mount_opt(fsc, ASYNC_DIROPS);
1151*4882a593Smuzhiyun else
1152*4882a593Smuzhiyun ceph_clear_mount_opt(fsc, ASYNC_DIROPS);
1153*4882a593Smuzhiyun
1154*4882a593Smuzhiyun sync_filesystem(fc->root->d_sb);
1155*4882a593Smuzhiyun return 0;
1156*4882a593Smuzhiyun }
1157*4882a593Smuzhiyun
1158*4882a593Smuzhiyun static const struct fs_context_operations ceph_context_ops = {
1159*4882a593Smuzhiyun .free = ceph_free_fc,
1160*4882a593Smuzhiyun .parse_param = ceph_parse_mount_param,
1161*4882a593Smuzhiyun .get_tree = ceph_get_tree,
1162*4882a593Smuzhiyun .reconfigure = ceph_reconfigure_fc,
1163*4882a593Smuzhiyun };
1164*4882a593Smuzhiyun
1165*4882a593Smuzhiyun /*
1166*4882a593Smuzhiyun * Set up the filesystem mount context.
1167*4882a593Smuzhiyun */
ceph_init_fs_context(struct fs_context * fc)1168*4882a593Smuzhiyun static int ceph_init_fs_context(struct fs_context *fc)
1169*4882a593Smuzhiyun {
1170*4882a593Smuzhiyun struct ceph_parse_opts_ctx *pctx;
1171*4882a593Smuzhiyun struct ceph_mount_options *fsopt;
1172*4882a593Smuzhiyun
1173*4882a593Smuzhiyun pctx = kzalloc(sizeof(*pctx), GFP_KERNEL);
1174*4882a593Smuzhiyun if (!pctx)
1175*4882a593Smuzhiyun return -ENOMEM;
1176*4882a593Smuzhiyun
1177*4882a593Smuzhiyun pctx->copts = ceph_alloc_options();
1178*4882a593Smuzhiyun if (!pctx->copts)
1179*4882a593Smuzhiyun goto nomem;
1180*4882a593Smuzhiyun
1181*4882a593Smuzhiyun pctx->opts = kzalloc(sizeof(*pctx->opts), GFP_KERNEL);
1182*4882a593Smuzhiyun if (!pctx->opts)
1183*4882a593Smuzhiyun goto nomem;
1184*4882a593Smuzhiyun
1185*4882a593Smuzhiyun fsopt = pctx->opts;
1186*4882a593Smuzhiyun fsopt->flags = CEPH_MOUNT_OPT_DEFAULT;
1187*4882a593Smuzhiyun
1188*4882a593Smuzhiyun fsopt->wsize = CEPH_MAX_WRITE_SIZE;
1189*4882a593Smuzhiyun fsopt->rsize = CEPH_MAX_READ_SIZE;
1190*4882a593Smuzhiyun fsopt->rasize = CEPH_RASIZE_DEFAULT;
1191*4882a593Smuzhiyun fsopt->snapdir_name = kstrdup(CEPH_SNAPDIRNAME_DEFAULT, GFP_KERNEL);
1192*4882a593Smuzhiyun if (!fsopt->snapdir_name)
1193*4882a593Smuzhiyun goto nomem;
1194*4882a593Smuzhiyun
1195*4882a593Smuzhiyun fsopt->caps_wanted_delay_min = CEPH_CAPS_WANTED_DELAY_MIN_DEFAULT;
1196*4882a593Smuzhiyun fsopt->caps_wanted_delay_max = CEPH_CAPS_WANTED_DELAY_MAX_DEFAULT;
1197*4882a593Smuzhiyun fsopt->max_readdir = CEPH_MAX_READDIR_DEFAULT;
1198*4882a593Smuzhiyun fsopt->max_readdir_bytes = CEPH_MAX_READDIR_BYTES_DEFAULT;
1199*4882a593Smuzhiyun fsopt->congestion_kb = default_congestion_kb();
1200*4882a593Smuzhiyun
1201*4882a593Smuzhiyun #ifdef CONFIG_CEPH_FS_POSIX_ACL
1202*4882a593Smuzhiyun fc->sb_flags |= SB_POSIXACL;
1203*4882a593Smuzhiyun #endif
1204*4882a593Smuzhiyun
1205*4882a593Smuzhiyun fc->fs_private = pctx;
1206*4882a593Smuzhiyun fc->ops = &ceph_context_ops;
1207*4882a593Smuzhiyun return 0;
1208*4882a593Smuzhiyun
1209*4882a593Smuzhiyun nomem:
1210*4882a593Smuzhiyun destroy_mount_options(pctx->opts);
1211*4882a593Smuzhiyun ceph_destroy_options(pctx->copts);
1212*4882a593Smuzhiyun kfree(pctx);
1213*4882a593Smuzhiyun return -ENOMEM;
1214*4882a593Smuzhiyun }
1215*4882a593Smuzhiyun
ceph_kill_sb(struct super_block * s)1216*4882a593Smuzhiyun static void ceph_kill_sb(struct super_block *s)
1217*4882a593Smuzhiyun {
1218*4882a593Smuzhiyun struct ceph_fs_client *fsc = ceph_sb_to_client(s);
1219*4882a593Smuzhiyun
1220*4882a593Smuzhiyun dout("kill_sb %p\n", s);
1221*4882a593Smuzhiyun
1222*4882a593Smuzhiyun ceph_mdsc_pre_umount(fsc->mdsc);
1223*4882a593Smuzhiyun flush_fs_workqueues(fsc);
1224*4882a593Smuzhiyun
1225*4882a593Smuzhiyun kill_anon_super(s);
1226*4882a593Smuzhiyun
1227*4882a593Smuzhiyun fsc->client->extra_mon_dispatch = NULL;
1228*4882a593Smuzhiyun ceph_fs_debugfs_cleanup(fsc);
1229*4882a593Smuzhiyun
1230*4882a593Smuzhiyun ceph_fscache_unregister_fs(fsc);
1231*4882a593Smuzhiyun
1232*4882a593Smuzhiyun destroy_fs_client(fsc);
1233*4882a593Smuzhiyun }
1234*4882a593Smuzhiyun
1235*4882a593Smuzhiyun static struct file_system_type ceph_fs_type = {
1236*4882a593Smuzhiyun .owner = THIS_MODULE,
1237*4882a593Smuzhiyun .name = "ceph",
1238*4882a593Smuzhiyun .init_fs_context = ceph_init_fs_context,
1239*4882a593Smuzhiyun .kill_sb = ceph_kill_sb,
1240*4882a593Smuzhiyun .fs_flags = FS_RENAME_DOES_D_MOVE,
1241*4882a593Smuzhiyun };
1242*4882a593Smuzhiyun MODULE_ALIAS_FS("ceph");
1243*4882a593Smuzhiyun
ceph_force_reconnect(struct super_block * sb)1244*4882a593Smuzhiyun int ceph_force_reconnect(struct super_block *sb)
1245*4882a593Smuzhiyun {
1246*4882a593Smuzhiyun struct ceph_fs_client *fsc = ceph_sb_to_client(sb);
1247*4882a593Smuzhiyun int err = 0;
1248*4882a593Smuzhiyun
1249*4882a593Smuzhiyun ceph_umount_begin(sb);
1250*4882a593Smuzhiyun
1251*4882a593Smuzhiyun /* Make sure all page caches get invalidated.
1252*4882a593Smuzhiyun * see remove_session_caps_cb() */
1253*4882a593Smuzhiyun flush_workqueue(fsc->inode_wq);
1254*4882a593Smuzhiyun
1255*4882a593Smuzhiyun /* In case that we were blocklisted. This also reset
1256*4882a593Smuzhiyun * all mon/osd connections */
1257*4882a593Smuzhiyun ceph_reset_client_addr(fsc->client);
1258*4882a593Smuzhiyun
1259*4882a593Smuzhiyun ceph_osdc_clear_abort_err(&fsc->client->osdc);
1260*4882a593Smuzhiyun
1261*4882a593Smuzhiyun fsc->blocklisted = false;
1262*4882a593Smuzhiyun fsc->mount_state = CEPH_MOUNT_MOUNTED;
1263*4882a593Smuzhiyun
1264*4882a593Smuzhiyun if (sb->s_root) {
1265*4882a593Smuzhiyun err = __ceph_do_getattr(d_inode(sb->s_root), NULL,
1266*4882a593Smuzhiyun CEPH_STAT_CAP_INODE, true);
1267*4882a593Smuzhiyun }
1268*4882a593Smuzhiyun return err;
1269*4882a593Smuzhiyun }
1270*4882a593Smuzhiyun
init_ceph(void)1271*4882a593Smuzhiyun static int __init init_ceph(void)
1272*4882a593Smuzhiyun {
1273*4882a593Smuzhiyun int ret = init_caches();
1274*4882a593Smuzhiyun if (ret)
1275*4882a593Smuzhiyun goto out;
1276*4882a593Smuzhiyun
1277*4882a593Smuzhiyun ceph_flock_init();
1278*4882a593Smuzhiyun ret = register_filesystem(&ceph_fs_type);
1279*4882a593Smuzhiyun if (ret)
1280*4882a593Smuzhiyun goto out_caches;
1281*4882a593Smuzhiyun
1282*4882a593Smuzhiyun pr_info("loaded (mds proto %d)\n", CEPH_MDSC_PROTOCOL);
1283*4882a593Smuzhiyun
1284*4882a593Smuzhiyun return 0;
1285*4882a593Smuzhiyun
1286*4882a593Smuzhiyun out_caches:
1287*4882a593Smuzhiyun destroy_caches();
1288*4882a593Smuzhiyun out:
1289*4882a593Smuzhiyun return ret;
1290*4882a593Smuzhiyun }
1291*4882a593Smuzhiyun
exit_ceph(void)1292*4882a593Smuzhiyun static void __exit exit_ceph(void)
1293*4882a593Smuzhiyun {
1294*4882a593Smuzhiyun dout("exit_ceph\n");
1295*4882a593Smuzhiyun unregister_filesystem(&ceph_fs_type);
1296*4882a593Smuzhiyun destroy_caches();
1297*4882a593Smuzhiyun }
1298*4882a593Smuzhiyun
param_set_metrics(const char * val,const struct kernel_param * kp)1299*4882a593Smuzhiyun static int param_set_metrics(const char *val, const struct kernel_param *kp)
1300*4882a593Smuzhiyun {
1301*4882a593Smuzhiyun struct ceph_fs_client *fsc;
1302*4882a593Smuzhiyun int ret;
1303*4882a593Smuzhiyun
1304*4882a593Smuzhiyun ret = param_set_bool(val, kp);
1305*4882a593Smuzhiyun if (ret) {
1306*4882a593Smuzhiyun pr_err("Failed to parse sending metrics switch value '%s'\n",
1307*4882a593Smuzhiyun val);
1308*4882a593Smuzhiyun return ret;
1309*4882a593Smuzhiyun } else if (!disable_send_metrics) {
1310*4882a593Smuzhiyun // wake up all the mds clients
1311*4882a593Smuzhiyun spin_lock(&ceph_fsc_lock);
1312*4882a593Smuzhiyun list_for_each_entry(fsc, &ceph_fsc_list, metric_wakeup) {
1313*4882a593Smuzhiyun metric_schedule_delayed(&fsc->mdsc->metric);
1314*4882a593Smuzhiyun }
1315*4882a593Smuzhiyun spin_unlock(&ceph_fsc_lock);
1316*4882a593Smuzhiyun }
1317*4882a593Smuzhiyun
1318*4882a593Smuzhiyun return 0;
1319*4882a593Smuzhiyun }
1320*4882a593Smuzhiyun
1321*4882a593Smuzhiyun static const struct kernel_param_ops param_ops_metrics = {
1322*4882a593Smuzhiyun .set = param_set_metrics,
1323*4882a593Smuzhiyun .get = param_get_bool,
1324*4882a593Smuzhiyun };
1325*4882a593Smuzhiyun
1326*4882a593Smuzhiyun bool disable_send_metrics = false;
1327*4882a593Smuzhiyun module_param_cb(disable_send_metrics, ¶m_ops_metrics, &disable_send_metrics, 0644);
1328*4882a593Smuzhiyun MODULE_PARM_DESC(disable_send_metrics, "Enable sending perf metrics to ceph cluster (default: on)");
1329*4882a593Smuzhiyun
1330*4882a593Smuzhiyun module_init(init_ceph);
1331*4882a593Smuzhiyun module_exit(exit_ceph);
1332*4882a593Smuzhiyun
1333*4882a593Smuzhiyun MODULE_AUTHOR("Sage Weil <sage@newdream.net>");
1334*4882a593Smuzhiyun MODULE_AUTHOR("Yehuda Sadeh <yehuda@hq.newdream.net>");
1335*4882a593Smuzhiyun MODULE_AUTHOR("Patience Warnick <patience@newdream.net>");
1336*4882a593Smuzhiyun MODULE_DESCRIPTION("Ceph filesystem for Linux");
1337*4882a593Smuzhiyun MODULE_LICENSE("GPL");
1338*4882a593Smuzhiyun MODULE_IMPORT_NS(ANDROID_GKI_VFS_EXPORT_ONLY);
1339