xref: /OK3568_Linux_fs/kernel/fs/nfs/blocklayout/dev.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun  * Copyright (c) 2014-2016 Christoph Hellwig.
4*4882a593Smuzhiyun  */
5*4882a593Smuzhiyun #include <linux/sunrpc/svc.h>
6*4882a593Smuzhiyun #include <linux/blkdev.h>
7*4882a593Smuzhiyun #include <linux/nfs4.h>
8*4882a593Smuzhiyun #include <linux/nfs_fs.h>
9*4882a593Smuzhiyun #include <linux/nfs_xdr.h>
10*4882a593Smuzhiyun #include <linux/pr.h>
11*4882a593Smuzhiyun 
12*4882a593Smuzhiyun #include "blocklayout.h"
13*4882a593Smuzhiyun 
14*4882a593Smuzhiyun #define NFSDBG_FACILITY		NFSDBG_PNFS_LD
15*4882a593Smuzhiyun 
16*4882a593Smuzhiyun static void
bl_free_device(struct pnfs_block_dev * dev)17*4882a593Smuzhiyun bl_free_device(struct pnfs_block_dev *dev)
18*4882a593Smuzhiyun {
19*4882a593Smuzhiyun 	if (dev->nr_children) {
20*4882a593Smuzhiyun 		int i;
21*4882a593Smuzhiyun 
22*4882a593Smuzhiyun 		for (i = 0; i < dev->nr_children; i++)
23*4882a593Smuzhiyun 			bl_free_device(&dev->children[i]);
24*4882a593Smuzhiyun 		kfree(dev->children);
25*4882a593Smuzhiyun 	} else {
26*4882a593Smuzhiyun 		if (dev->pr_registered) {
27*4882a593Smuzhiyun 			const struct pr_ops *ops =
28*4882a593Smuzhiyun 				dev->bdev->bd_disk->fops->pr_ops;
29*4882a593Smuzhiyun 			int error;
30*4882a593Smuzhiyun 
31*4882a593Smuzhiyun 			error = ops->pr_register(dev->bdev, dev->pr_key, 0,
32*4882a593Smuzhiyun 				false);
33*4882a593Smuzhiyun 			if (error)
34*4882a593Smuzhiyun 				pr_err("failed to unregister PR key.\n");
35*4882a593Smuzhiyun 		}
36*4882a593Smuzhiyun 
37*4882a593Smuzhiyun 		if (dev->bdev)
38*4882a593Smuzhiyun 			blkdev_put(dev->bdev, FMODE_READ | FMODE_WRITE);
39*4882a593Smuzhiyun 	}
40*4882a593Smuzhiyun }
41*4882a593Smuzhiyun 
42*4882a593Smuzhiyun void
bl_free_deviceid_node(struct nfs4_deviceid_node * d)43*4882a593Smuzhiyun bl_free_deviceid_node(struct nfs4_deviceid_node *d)
44*4882a593Smuzhiyun {
45*4882a593Smuzhiyun 	struct pnfs_block_dev *dev =
46*4882a593Smuzhiyun 		container_of(d, struct pnfs_block_dev, node);
47*4882a593Smuzhiyun 
48*4882a593Smuzhiyun 	bl_free_device(dev);
49*4882a593Smuzhiyun 	kfree_rcu(dev, node.rcu);
50*4882a593Smuzhiyun }
51*4882a593Smuzhiyun 
52*4882a593Smuzhiyun static int
nfs4_block_decode_volume(struct xdr_stream * xdr,struct pnfs_block_volume * b)53*4882a593Smuzhiyun nfs4_block_decode_volume(struct xdr_stream *xdr, struct pnfs_block_volume *b)
54*4882a593Smuzhiyun {
55*4882a593Smuzhiyun 	__be32 *p;
56*4882a593Smuzhiyun 	int i;
57*4882a593Smuzhiyun 
58*4882a593Smuzhiyun 	p = xdr_inline_decode(xdr, 4);
59*4882a593Smuzhiyun 	if (!p)
60*4882a593Smuzhiyun 		return -EIO;
61*4882a593Smuzhiyun 	b->type = be32_to_cpup(p++);
62*4882a593Smuzhiyun 
63*4882a593Smuzhiyun 	switch (b->type) {
64*4882a593Smuzhiyun 	case PNFS_BLOCK_VOLUME_SIMPLE:
65*4882a593Smuzhiyun 		p = xdr_inline_decode(xdr, 4);
66*4882a593Smuzhiyun 		if (!p)
67*4882a593Smuzhiyun 			return -EIO;
68*4882a593Smuzhiyun 		b->simple.nr_sigs = be32_to_cpup(p++);
69*4882a593Smuzhiyun 		if (!b->simple.nr_sigs || b->simple.nr_sigs > PNFS_BLOCK_MAX_UUIDS) {
70*4882a593Smuzhiyun 			dprintk("Bad signature count: %d\n", b->simple.nr_sigs);
71*4882a593Smuzhiyun 			return -EIO;
72*4882a593Smuzhiyun 		}
73*4882a593Smuzhiyun 
74*4882a593Smuzhiyun 		b->simple.len = 4 + 4;
75*4882a593Smuzhiyun 		for (i = 0; i < b->simple.nr_sigs; i++) {
76*4882a593Smuzhiyun 			p = xdr_inline_decode(xdr, 8 + 4);
77*4882a593Smuzhiyun 			if (!p)
78*4882a593Smuzhiyun 				return -EIO;
79*4882a593Smuzhiyun 			p = xdr_decode_hyper(p, &b->simple.sigs[i].offset);
80*4882a593Smuzhiyun 			b->simple.sigs[i].sig_len = be32_to_cpup(p++);
81*4882a593Smuzhiyun 			if (b->simple.sigs[i].sig_len > PNFS_BLOCK_UUID_LEN) {
82*4882a593Smuzhiyun 				pr_info("signature too long: %d\n",
83*4882a593Smuzhiyun 					b->simple.sigs[i].sig_len);
84*4882a593Smuzhiyun 				return -EIO;
85*4882a593Smuzhiyun 			}
86*4882a593Smuzhiyun 
87*4882a593Smuzhiyun 			p = xdr_inline_decode(xdr, b->simple.sigs[i].sig_len);
88*4882a593Smuzhiyun 			if (!p)
89*4882a593Smuzhiyun 				return -EIO;
90*4882a593Smuzhiyun 			memcpy(&b->simple.sigs[i].sig, p,
91*4882a593Smuzhiyun 				b->simple.sigs[i].sig_len);
92*4882a593Smuzhiyun 
93*4882a593Smuzhiyun 			b->simple.len += 8 + 4 + \
94*4882a593Smuzhiyun 				(XDR_QUADLEN(b->simple.sigs[i].sig_len) << 2);
95*4882a593Smuzhiyun 		}
96*4882a593Smuzhiyun 		break;
97*4882a593Smuzhiyun 	case PNFS_BLOCK_VOLUME_SLICE:
98*4882a593Smuzhiyun 		p = xdr_inline_decode(xdr, 8 + 8 + 4);
99*4882a593Smuzhiyun 		if (!p)
100*4882a593Smuzhiyun 			return -EIO;
101*4882a593Smuzhiyun 		p = xdr_decode_hyper(p, &b->slice.start);
102*4882a593Smuzhiyun 		p = xdr_decode_hyper(p, &b->slice.len);
103*4882a593Smuzhiyun 		b->slice.volume = be32_to_cpup(p++);
104*4882a593Smuzhiyun 		break;
105*4882a593Smuzhiyun 	case PNFS_BLOCK_VOLUME_CONCAT:
106*4882a593Smuzhiyun 		p = xdr_inline_decode(xdr, 4);
107*4882a593Smuzhiyun 		if (!p)
108*4882a593Smuzhiyun 			return -EIO;
109*4882a593Smuzhiyun 
110*4882a593Smuzhiyun 		b->concat.volumes_count = be32_to_cpup(p++);
111*4882a593Smuzhiyun 		if (b->concat.volumes_count > PNFS_BLOCK_MAX_DEVICES) {
112*4882a593Smuzhiyun 			dprintk("Too many volumes: %d\n", b->concat.volumes_count);
113*4882a593Smuzhiyun 			return -EIO;
114*4882a593Smuzhiyun 		}
115*4882a593Smuzhiyun 
116*4882a593Smuzhiyun 		p = xdr_inline_decode(xdr, b->concat.volumes_count * 4);
117*4882a593Smuzhiyun 		if (!p)
118*4882a593Smuzhiyun 			return -EIO;
119*4882a593Smuzhiyun 		for (i = 0; i < b->concat.volumes_count; i++)
120*4882a593Smuzhiyun 			b->concat.volumes[i] = be32_to_cpup(p++);
121*4882a593Smuzhiyun 		break;
122*4882a593Smuzhiyun 	case PNFS_BLOCK_VOLUME_STRIPE:
123*4882a593Smuzhiyun 		p = xdr_inline_decode(xdr, 8 + 4);
124*4882a593Smuzhiyun 		if (!p)
125*4882a593Smuzhiyun 			return -EIO;
126*4882a593Smuzhiyun 
127*4882a593Smuzhiyun 		p = xdr_decode_hyper(p, &b->stripe.chunk_size);
128*4882a593Smuzhiyun 		b->stripe.volumes_count = be32_to_cpup(p++);
129*4882a593Smuzhiyun 		if (b->stripe.volumes_count > PNFS_BLOCK_MAX_DEVICES) {
130*4882a593Smuzhiyun 			dprintk("Too many volumes: %d\n", b->stripe.volumes_count);
131*4882a593Smuzhiyun 			return -EIO;
132*4882a593Smuzhiyun 		}
133*4882a593Smuzhiyun 
134*4882a593Smuzhiyun 		p = xdr_inline_decode(xdr, b->stripe.volumes_count * 4);
135*4882a593Smuzhiyun 		if (!p)
136*4882a593Smuzhiyun 			return -EIO;
137*4882a593Smuzhiyun 		for (i = 0; i < b->stripe.volumes_count; i++)
138*4882a593Smuzhiyun 			b->stripe.volumes[i] = be32_to_cpup(p++);
139*4882a593Smuzhiyun 		break;
140*4882a593Smuzhiyun 	case PNFS_BLOCK_VOLUME_SCSI:
141*4882a593Smuzhiyun 		p = xdr_inline_decode(xdr, 4 + 4 + 4);
142*4882a593Smuzhiyun 		if (!p)
143*4882a593Smuzhiyun 			return -EIO;
144*4882a593Smuzhiyun 		b->scsi.code_set = be32_to_cpup(p++);
145*4882a593Smuzhiyun 		b->scsi.designator_type = be32_to_cpup(p++);
146*4882a593Smuzhiyun 		b->scsi.designator_len = be32_to_cpup(p++);
147*4882a593Smuzhiyun 		p = xdr_inline_decode(xdr, b->scsi.designator_len);
148*4882a593Smuzhiyun 		if (!p)
149*4882a593Smuzhiyun 			return -EIO;
150*4882a593Smuzhiyun 		if (b->scsi.designator_len > 256)
151*4882a593Smuzhiyun 			return -EIO;
152*4882a593Smuzhiyun 		memcpy(&b->scsi.designator, p, b->scsi.designator_len);
153*4882a593Smuzhiyun 		p = xdr_inline_decode(xdr, 8);
154*4882a593Smuzhiyun 		if (!p)
155*4882a593Smuzhiyun 			return -EIO;
156*4882a593Smuzhiyun 		p = xdr_decode_hyper(p, &b->scsi.pr_key);
157*4882a593Smuzhiyun 		break;
158*4882a593Smuzhiyun 	default:
159*4882a593Smuzhiyun 		dprintk("unknown volume type!\n");
160*4882a593Smuzhiyun 		return -EIO;
161*4882a593Smuzhiyun 	}
162*4882a593Smuzhiyun 
163*4882a593Smuzhiyun 	return 0;
164*4882a593Smuzhiyun }
165*4882a593Smuzhiyun 
bl_map_simple(struct pnfs_block_dev * dev,u64 offset,struct pnfs_block_dev_map * map)166*4882a593Smuzhiyun static bool bl_map_simple(struct pnfs_block_dev *dev, u64 offset,
167*4882a593Smuzhiyun 		struct pnfs_block_dev_map *map)
168*4882a593Smuzhiyun {
169*4882a593Smuzhiyun 	map->start = dev->start;
170*4882a593Smuzhiyun 	map->len = dev->len;
171*4882a593Smuzhiyun 	map->disk_offset = dev->disk_offset;
172*4882a593Smuzhiyun 	map->bdev = dev->bdev;
173*4882a593Smuzhiyun 	return true;
174*4882a593Smuzhiyun }
175*4882a593Smuzhiyun 
bl_map_concat(struct pnfs_block_dev * dev,u64 offset,struct pnfs_block_dev_map * map)176*4882a593Smuzhiyun static bool bl_map_concat(struct pnfs_block_dev *dev, u64 offset,
177*4882a593Smuzhiyun 		struct pnfs_block_dev_map *map)
178*4882a593Smuzhiyun {
179*4882a593Smuzhiyun 	int i;
180*4882a593Smuzhiyun 
181*4882a593Smuzhiyun 	for (i = 0; i < dev->nr_children; i++) {
182*4882a593Smuzhiyun 		struct pnfs_block_dev *child = &dev->children[i];
183*4882a593Smuzhiyun 
184*4882a593Smuzhiyun 		if (child->start > offset ||
185*4882a593Smuzhiyun 		    child->start + child->len <= offset)
186*4882a593Smuzhiyun 			continue;
187*4882a593Smuzhiyun 
188*4882a593Smuzhiyun 		child->map(child, offset - child->start, map);
189*4882a593Smuzhiyun 		return true;
190*4882a593Smuzhiyun 	}
191*4882a593Smuzhiyun 
192*4882a593Smuzhiyun 	dprintk("%s: ran off loop!\n", __func__);
193*4882a593Smuzhiyun 	return false;
194*4882a593Smuzhiyun }
195*4882a593Smuzhiyun 
bl_map_stripe(struct pnfs_block_dev * dev,u64 offset,struct pnfs_block_dev_map * map)196*4882a593Smuzhiyun static bool bl_map_stripe(struct pnfs_block_dev *dev, u64 offset,
197*4882a593Smuzhiyun 		struct pnfs_block_dev_map *map)
198*4882a593Smuzhiyun {
199*4882a593Smuzhiyun 	struct pnfs_block_dev *child;
200*4882a593Smuzhiyun 	u64 chunk;
201*4882a593Smuzhiyun 	u32 chunk_idx;
202*4882a593Smuzhiyun 	u64 disk_offset;
203*4882a593Smuzhiyun 
204*4882a593Smuzhiyun 	chunk = div_u64(offset, dev->chunk_size);
205*4882a593Smuzhiyun 	div_u64_rem(chunk, dev->nr_children, &chunk_idx);
206*4882a593Smuzhiyun 
207*4882a593Smuzhiyun 	if (chunk_idx >= dev->nr_children) {
208*4882a593Smuzhiyun 		dprintk("%s: invalid chunk idx %d (%lld/%lld)\n",
209*4882a593Smuzhiyun 			__func__, chunk_idx, offset, dev->chunk_size);
210*4882a593Smuzhiyun 		/* error, should not happen */
211*4882a593Smuzhiyun 		return false;
212*4882a593Smuzhiyun 	}
213*4882a593Smuzhiyun 
214*4882a593Smuzhiyun 	/* truncate offset to the beginning of the stripe */
215*4882a593Smuzhiyun 	offset = chunk * dev->chunk_size;
216*4882a593Smuzhiyun 
217*4882a593Smuzhiyun 	/* disk offset of the stripe */
218*4882a593Smuzhiyun 	disk_offset = div_u64(offset, dev->nr_children);
219*4882a593Smuzhiyun 
220*4882a593Smuzhiyun 	child = &dev->children[chunk_idx];
221*4882a593Smuzhiyun 	child->map(child, disk_offset, map);
222*4882a593Smuzhiyun 
223*4882a593Smuzhiyun 	map->start += offset;
224*4882a593Smuzhiyun 	map->disk_offset += disk_offset;
225*4882a593Smuzhiyun 	map->len = dev->chunk_size;
226*4882a593Smuzhiyun 	return true;
227*4882a593Smuzhiyun }
228*4882a593Smuzhiyun 
229*4882a593Smuzhiyun static int
230*4882a593Smuzhiyun bl_parse_deviceid(struct nfs_server *server, struct pnfs_block_dev *d,
231*4882a593Smuzhiyun 		struct pnfs_block_volume *volumes, int idx, gfp_t gfp_mask);
232*4882a593Smuzhiyun 
233*4882a593Smuzhiyun 
234*4882a593Smuzhiyun static int
bl_parse_simple(struct nfs_server * server,struct pnfs_block_dev * d,struct pnfs_block_volume * volumes,int idx,gfp_t gfp_mask)235*4882a593Smuzhiyun bl_parse_simple(struct nfs_server *server, struct pnfs_block_dev *d,
236*4882a593Smuzhiyun 		struct pnfs_block_volume *volumes, int idx, gfp_t gfp_mask)
237*4882a593Smuzhiyun {
238*4882a593Smuzhiyun 	struct pnfs_block_volume *v = &volumes[idx];
239*4882a593Smuzhiyun 	struct block_device *bdev;
240*4882a593Smuzhiyun 	dev_t dev;
241*4882a593Smuzhiyun 
242*4882a593Smuzhiyun 	dev = bl_resolve_deviceid(server, v, gfp_mask);
243*4882a593Smuzhiyun 	if (!dev)
244*4882a593Smuzhiyun 		return -EIO;
245*4882a593Smuzhiyun 
246*4882a593Smuzhiyun 	bdev = blkdev_get_by_dev(dev, FMODE_READ | FMODE_WRITE, NULL);
247*4882a593Smuzhiyun 	if (IS_ERR(bdev)) {
248*4882a593Smuzhiyun 		printk(KERN_WARNING "pNFS: failed to open device %d:%d (%ld)\n",
249*4882a593Smuzhiyun 			MAJOR(dev), MINOR(dev), PTR_ERR(bdev));
250*4882a593Smuzhiyun 		return PTR_ERR(bdev);
251*4882a593Smuzhiyun 	}
252*4882a593Smuzhiyun 	d->bdev = bdev;
253*4882a593Smuzhiyun 
254*4882a593Smuzhiyun 
255*4882a593Smuzhiyun 	d->len = i_size_read(d->bdev->bd_inode);
256*4882a593Smuzhiyun 	d->map = bl_map_simple;
257*4882a593Smuzhiyun 
258*4882a593Smuzhiyun 	printk(KERN_INFO "pNFS: using block device %s\n",
259*4882a593Smuzhiyun 		d->bdev->bd_disk->disk_name);
260*4882a593Smuzhiyun 	return 0;
261*4882a593Smuzhiyun }
262*4882a593Smuzhiyun 
263*4882a593Smuzhiyun static bool
bl_validate_designator(struct pnfs_block_volume * v)264*4882a593Smuzhiyun bl_validate_designator(struct pnfs_block_volume *v)
265*4882a593Smuzhiyun {
266*4882a593Smuzhiyun 	switch (v->scsi.designator_type) {
267*4882a593Smuzhiyun 	case PS_DESIGNATOR_EUI64:
268*4882a593Smuzhiyun 		if (v->scsi.code_set != PS_CODE_SET_BINARY)
269*4882a593Smuzhiyun 			return false;
270*4882a593Smuzhiyun 
271*4882a593Smuzhiyun 		if (v->scsi.designator_len != 8 &&
272*4882a593Smuzhiyun 		    v->scsi.designator_len != 10 &&
273*4882a593Smuzhiyun 		    v->scsi.designator_len != 16)
274*4882a593Smuzhiyun 			return false;
275*4882a593Smuzhiyun 
276*4882a593Smuzhiyun 		return true;
277*4882a593Smuzhiyun 	case PS_DESIGNATOR_NAA:
278*4882a593Smuzhiyun 		if (v->scsi.code_set != PS_CODE_SET_BINARY)
279*4882a593Smuzhiyun 			return false;
280*4882a593Smuzhiyun 
281*4882a593Smuzhiyun 		if (v->scsi.designator_len != 8 &&
282*4882a593Smuzhiyun 		    v->scsi.designator_len != 16)
283*4882a593Smuzhiyun 			return false;
284*4882a593Smuzhiyun 
285*4882a593Smuzhiyun 		return true;
286*4882a593Smuzhiyun 	case PS_DESIGNATOR_T10:
287*4882a593Smuzhiyun 	case PS_DESIGNATOR_NAME:
288*4882a593Smuzhiyun 		pr_err("pNFS: unsupported designator "
289*4882a593Smuzhiyun 			"(code set %d, type %d, len %d.\n",
290*4882a593Smuzhiyun 			v->scsi.code_set,
291*4882a593Smuzhiyun 			v->scsi.designator_type,
292*4882a593Smuzhiyun 			v->scsi.designator_len);
293*4882a593Smuzhiyun 		return false;
294*4882a593Smuzhiyun 	default:
295*4882a593Smuzhiyun 		pr_err("pNFS: invalid designator "
296*4882a593Smuzhiyun 			"(code set %d, type %d, len %d.\n",
297*4882a593Smuzhiyun 			v->scsi.code_set,
298*4882a593Smuzhiyun 			v->scsi.designator_type,
299*4882a593Smuzhiyun 			v->scsi.designator_len);
300*4882a593Smuzhiyun 		return false;
301*4882a593Smuzhiyun 	}
302*4882a593Smuzhiyun }
303*4882a593Smuzhiyun 
304*4882a593Smuzhiyun /*
305*4882a593Smuzhiyun  * Try to open the udev path for the WWN.  At least on Debian the udev
306*4882a593Smuzhiyun  * by-id path will always point to the dm-multipath device if one exists.
307*4882a593Smuzhiyun  */
308*4882a593Smuzhiyun static struct block_device *
bl_open_udev_path(struct pnfs_block_volume * v)309*4882a593Smuzhiyun bl_open_udev_path(struct pnfs_block_volume *v)
310*4882a593Smuzhiyun {
311*4882a593Smuzhiyun 	struct block_device *bdev;
312*4882a593Smuzhiyun 	const char *devname;
313*4882a593Smuzhiyun 
314*4882a593Smuzhiyun 	devname = kasprintf(GFP_KERNEL, "/dev/disk/by-id/wwn-0x%*phN",
315*4882a593Smuzhiyun 				v->scsi.designator_len, v->scsi.designator);
316*4882a593Smuzhiyun 	if (!devname)
317*4882a593Smuzhiyun 		return ERR_PTR(-ENOMEM);
318*4882a593Smuzhiyun 
319*4882a593Smuzhiyun 	bdev = blkdev_get_by_path(devname, FMODE_READ | FMODE_WRITE, NULL);
320*4882a593Smuzhiyun 	if (IS_ERR(bdev)) {
321*4882a593Smuzhiyun 		pr_warn("pNFS: failed to open device %s (%ld)\n",
322*4882a593Smuzhiyun 			devname, PTR_ERR(bdev));
323*4882a593Smuzhiyun 	}
324*4882a593Smuzhiyun 
325*4882a593Smuzhiyun 	kfree(devname);
326*4882a593Smuzhiyun 	return bdev;
327*4882a593Smuzhiyun }
328*4882a593Smuzhiyun 
329*4882a593Smuzhiyun /*
330*4882a593Smuzhiyun  * Try to open the RH/Fedora specific dm-mpath udev path for this WWN, as the
331*4882a593Smuzhiyun  * wwn- links will only point to the first discovered SCSI device there.
332*4882a593Smuzhiyun  */
333*4882a593Smuzhiyun static struct block_device *
bl_open_dm_mpath_udev_path(struct pnfs_block_volume * v)334*4882a593Smuzhiyun bl_open_dm_mpath_udev_path(struct pnfs_block_volume *v)
335*4882a593Smuzhiyun {
336*4882a593Smuzhiyun 	struct block_device *bdev;
337*4882a593Smuzhiyun 	const char *devname;
338*4882a593Smuzhiyun 
339*4882a593Smuzhiyun 	devname = kasprintf(GFP_KERNEL,
340*4882a593Smuzhiyun 			"/dev/disk/by-id/dm-uuid-mpath-%d%*phN",
341*4882a593Smuzhiyun 			v->scsi.designator_type,
342*4882a593Smuzhiyun 			v->scsi.designator_len, v->scsi.designator);
343*4882a593Smuzhiyun 	if (!devname)
344*4882a593Smuzhiyun 		return ERR_PTR(-ENOMEM);
345*4882a593Smuzhiyun 
346*4882a593Smuzhiyun 	bdev = blkdev_get_by_path(devname, FMODE_READ | FMODE_WRITE, NULL);
347*4882a593Smuzhiyun 	kfree(devname);
348*4882a593Smuzhiyun 	return bdev;
349*4882a593Smuzhiyun }
350*4882a593Smuzhiyun 
351*4882a593Smuzhiyun static int
bl_parse_scsi(struct nfs_server * server,struct pnfs_block_dev * d,struct pnfs_block_volume * volumes,int idx,gfp_t gfp_mask)352*4882a593Smuzhiyun bl_parse_scsi(struct nfs_server *server, struct pnfs_block_dev *d,
353*4882a593Smuzhiyun 		struct pnfs_block_volume *volumes, int idx, gfp_t gfp_mask)
354*4882a593Smuzhiyun {
355*4882a593Smuzhiyun 	struct pnfs_block_volume *v = &volumes[idx];
356*4882a593Smuzhiyun 	struct block_device *bdev;
357*4882a593Smuzhiyun 	const struct pr_ops *ops;
358*4882a593Smuzhiyun 	int error;
359*4882a593Smuzhiyun 
360*4882a593Smuzhiyun 	if (!bl_validate_designator(v))
361*4882a593Smuzhiyun 		return -EINVAL;
362*4882a593Smuzhiyun 
363*4882a593Smuzhiyun 	bdev = bl_open_dm_mpath_udev_path(v);
364*4882a593Smuzhiyun 	if (IS_ERR(bdev))
365*4882a593Smuzhiyun 		bdev = bl_open_udev_path(v);
366*4882a593Smuzhiyun 	if (IS_ERR(bdev))
367*4882a593Smuzhiyun 		return PTR_ERR(bdev);
368*4882a593Smuzhiyun 	d->bdev = bdev;
369*4882a593Smuzhiyun 
370*4882a593Smuzhiyun 	d->len = i_size_read(d->bdev->bd_inode);
371*4882a593Smuzhiyun 	d->map = bl_map_simple;
372*4882a593Smuzhiyun 	d->pr_key = v->scsi.pr_key;
373*4882a593Smuzhiyun 
374*4882a593Smuzhiyun 	pr_info("pNFS: using block device %s (reservation key 0x%llx)\n",
375*4882a593Smuzhiyun 		d->bdev->bd_disk->disk_name, d->pr_key);
376*4882a593Smuzhiyun 
377*4882a593Smuzhiyun 	ops = d->bdev->bd_disk->fops->pr_ops;
378*4882a593Smuzhiyun 	if (!ops) {
379*4882a593Smuzhiyun 		pr_err("pNFS: block device %s does not support reservations.",
380*4882a593Smuzhiyun 				d->bdev->bd_disk->disk_name);
381*4882a593Smuzhiyun 		error = -EINVAL;
382*4882a593Smuzhiyun 		goto out_blkdev_put;
383*4882a593Smuzhiyun 	}
384*4882a593Smuzhiyun 
385*4882a593Smuzhiyun 	error = ops->pr_register(d->bdev, 0, d->pr_key, true);
386*4882a593Smuzhiyun 	if (error) {
387*4882a593Smuzhiyun 		pr_err("pNFS: failed to register key for block device %s.",
388*4882a593Smuzhiyun 				d->bdev->bd_disk->disk_name);
389*4882a593Smuzhiyun 		goto out_blkdev_put;
390*4882a593Smuzhiyun 	}
391*4882a593Smuzhiyun 
392*4882a593Smuzhiyun 	d->pr_registered = true;
393*4882a593Smuzhiyun 	return 0;
394*4882a593Smuzhiyun 
395*4882a593Smuzhiyun out_blkdev_put:
396*4882a593Smuzhiyun 	blkdev_put(d->bdev, FMODE_READ | FMODE_WRITE);
397*4882a593Smuzhiyun 	return error;
398*4882a593Smuzhiyun }
399*4882a593Smuzhiyun 
400*4882a593Smuzhiyun static int
bl_parse_slice(struct nfs_server * server,struct pnfs_block_dev * d,struct pnfs_block_volume * volumes,int idx,gfp_t gfp_mask)401*4882a593Smuzhiyun bl_parse_slice(struct nfs_server *server, struct pnfs_block_dev *d,
402*4882a593Smuzhiyun 		struct pnfs_block_volume *volumes, int idx, gfp_t gfp_mask)
403*4882a593Smuzhiyun {
404*4882a593Smuzhiyun 	struct pnfs_block_volume *v = &volumes[idx];
405*4882a593Smuzhiyun 	int ret;
406*4882a593Smuzhiyun 
407*4882a593Smuzhiyun 	ret = bl_parse_deviceid(server, d, volumes, v->slice.volume, gfp_mask);
408*4882a593Smuzhiyun 	if (ret)
409*4882a593Smuzhiyun 		return ret;
410*4882a593Smuzhiyun 
411*4882a593Smuzhiyun 	d->disk_offset = v->slice.start;
412*4882a593Smuzhiyun 	d->len = v->slice.len;
413*4882a593Smuzhiyun 	return 0;
414*4882a593Smuzhiyun }
415*4882a593Smuzhiyun 
416*4882a593Smuzhiyun static int
bl_parse_concat(struct nfs_server * server,struct pnfs_block_dev * d,struct pnfs_block_volume * volumes,int idx,gfp_t gfp_mask)417*4882a593Smuzhiyun bl_parse_concat(struct nfs_server *server, struct pnfs_block_dev *d,
418*4882a593Smuzhiyun 		struct pnfs_block_volume *volumes, int idx, gfp_t gfp_mask)
419*4882a593Smuzhiyun {
420*4882a593Smuzhiyun 	struct pnfs_block_volume *v = &volumes[idx];
421*4882a593Smuzhiyun 	u64 len = 0;
422*4882a593Smuzhiyun 	int ret, i;
423*4882a593Smuzhiyun 
424*4882a593Smuzhiyun 	d->children = kcalloc(v->concat.volumes_count,
425*4882a593Smuzhiyun 			sizeof(struct pnfs_block_dev), GFP_KERNEL);
426*4882a593Smuzhiyun 	if (!d->children)
427*4882a593Smuzhiyun 		return -ENOMEM;
428*4882a593Smuzhiyun 
429*4882a593Smuzhiyun 	for (i = 0; i < v->concat.volumes_count; i++) {
430*4882a593Smuzhiyun 		ret = bl_parse_deviceid(server, &d->children[i],
431*4882a593Smuzhiyun 				volumes, v->concat.volumes[i], gfp_mask);
432*4882a593Smuzhiyun 		if (ret)
433*4882a593Smuzhiyun 			return ret;
434*4882a593Smuzhiyun 
435*4882a593Smuzhiyun 		d->nr_children++;
436*4882a593Smuzhiyun 		d->children[i].start += len;
437*4882a593Smuzhiyun 		len += d->children[i].len;
438*4882a593Smuzhiyun 	}
439*4882a593Smuzhiyun 
440*4882a593Smuzhiyun 	d->len = len;
441*4882a593Smuzhiyun 	d->map = bl_map_concat;
442*4882a593Smuzhiyun 	return 0;
443*4882a593Smuzhiyun }
444*4882a593Smuzhiyun 
445*4882a593Smuzhiyun static int
bl_parse_stripe(struct nfs_server * server,struct pnfs_block_dev * d,struct pnfs_block_volume * volumes,int idx,gfp_t gfp_mask)446*4882a593Smuzhiyun bl_parse_stripe(struct nfs_server *server, struct pnfs_block_dev *d,
447*4882a593Smuzhiyun 		struct pnfs_block_volume *volumes, int idx, gfp_t gfp_mask)
448*4882a593Smuzhiyun {
449*4882a593Smuzhiyun 	struct pnfs_block_volume *v = &volumes[idx];
450*4882a593Smuzhiyun 	u64 len = 0;
451*4882a593Smuzhiyun 	int ret, i;
452*4882a593Smuzhiyun 
453*4882a593Smuzhiyun 	d->children = kcalloc(v->stripe.volumes_count,
454*4882a593Smuzhiyun 			sizeof(struct pnfs_block_dev), GFP_KERNEL);
455*4882a593Smuzhiyun 	if (!d->children)
456*4882a593Smuzhiyun 		return -ENOMEM;
457*4882a593Smuzhiyun 
458*4882a593Smuzhiyun 	for (i = 0; i < v->stripe.volumes_count; i++) {
459*4882a593Smuzhiyun 		ret = bl_parse_deviceid(server, &d->children[i],
460*4882a593Smuzhiyun 				volumes, v->stripe.volumes[i], gfp_mask);
461*4882a593Smuzhiyun 		if (ret)
462*4882a593Smuzhiyun 			return ret;
463*4882a593Smuzhiyun 
464*4882a593Smuzhiyun 		d->nr_children++;
465*4882a593Smuzhiyun 		len += d->children[i].len;
466*4882a593Smuzhiyun 	}
467*4882a593Smuzhiyun 
468*4882a593Smuzhiyun 	d->len = len;
469*4882a593Smuzhiyun 	d->chunk_size = v->stripe.chunk_size;
470*4882a593Smuzhiyun 	d->map = bl_map_stripe;
471*4882a593Smuzhiyun 	return 0;
472*4882a593Smuzhiyun }
473*4882a593Smuzhiyun 
474*4882a593Smuzhiyun static int
bl_parse_deviceid(struct nfs_server * server,struct pnfs_block_dev * d,struct pnfs_block_volume * volumes,int idx,gfp_t gfp_mask)475*4882a593Smuzhiyun bl_parse_deviceid(struct nfs_server *server, struct pnfs_block_dev *d,
476*4882a593Smuzhiyun 		struct pnfs_block_volume *volumes, int idx, gfp_t gfp_mask)
477*4882a593Smuzhiyun {
478*4882a593Smuzhiyun 	switch (volumes[idx].type) {
479*4882a593Smuzhiyun 	case PNFS_BLOCK_VOLUME_SIMPLE:
480*4882a593Smuzhiyun 		return bl_parse_simple(server, d, volumes, idx, gfp_mask);
481*4882a593Smuzhiyun 	case PNFS_BLOCK_VOLUME_SLICE:
482*4882a593Smuzhiyun 		return bl_parse_slice(server, d, volumes, idx, gfp_mask);
483*4882a593Smuzhiyun 	case PNFS_BLOCK_VOLUME_CONCAT:
484*4882a593Smuzhiyun 		return bl_parse_concat(server, d, volumes, idx, gfp_mask);
485*4882a593Smuzhiyun 	case PNFS_BLOCK_VOLUME_STRIPE:
486*4882a593Smuzhiyun 		return bl_parse_stripe(server, d, volumes, idx, gfp_mask);
487*4882a593Smuzhiyun 	case PNFS_BLOCK_VOLUME_SCSI:
488*4882a593Smuzhiyun 		return bl_parse_scsi(server, d, volumes, idx, gfp_mask);
489*4882a593Smuzhiyun 	default:
490*4882a593Smuzhiyun 		dprintk("unsupported volume type: %d\n", volumes[idx].type);
491*4882a593Smuzhiyun 		return -EIO;
492*4882a593Smuzhiyun 	}
493*4882a593Smuzhiyun }
494*4882a593Smuzhiyun 
495*4882a593Smuzhiyun struct nfs4_deviceid_node *
bl_alloc_deviceid_node(struct nfs_server * server,struct pnfs_device * pdev,gfp_t gfp_mask)496*4882a593Smuzhiyun bl_alloc_deviceid_node(struct nfs_server *server, struct pnfs_device *pdev,
497*4882a593Smuzhiyun 		gfp_t gfp_mask)
498*4882a593Smuzhiyun {
499*4882a593Smuzhiyun 	struct nfs4_deviceid_node *node = NULL;
500*4882a593Smuzhiyun 	struct pnfs_block_volume *volumes;
501*4882a593Smuzhiyun 	struct pnfs_block_dev *top;
502*4882a593Smuzhiyun 	struct xdr_stream xdr;
503*4882a593Smuzhiyun 	struct xdr_buf buf;
504*4882a593Smuzhiyun 	struct page *scratch;
505*4882a593Smuzhiyun 	int nr_volumes, ret, i;
506*4882a593Smuzhiyun 	__be32 *p;
507*4882a593Smuzhiyun 
508*4882a593Smuzhiyun 	scratch = alloc_page(gfp_mask);
509*4882a593Smuzhiyun 	if (!scratch)
510*4882a593Smuzhiyun 		goto out;
511*4882a593Smuzhiyun 
512*4882a593Smuzhiyun 	xdr_init_decode_pages(&xdr, &buf, pdev->pages, pdev->pglen);
513*4882a593Smuzhiyun 	xdr_set_scratch_buffer(&xdr, page_address(scratch), PAGE_SIZE);
514*4882a593Smuzhiyun 
515*4882a593Smuzhiyun 	p = xdr_inline_decode(&xdr, sizeof(__be32));
516*4882a593Smuzhiyun 	if (!p)
517*4882a593Smuzhiyun 		goto out_free_scratch;
518*4882a593Smuzhiyun 	nr_volumes = be32_to_cpup(p++);
519*4882a593Smuzhiyun 
520*4882a593Smuzhiyun 	volumes = kcalloc(nr_volumes, sizeof(struct pnfs_block_volume),
521*4882a593Smuzhiyun 			  gfp_mask);
522*4882a593Smuzhiyun 	if (!volumes)
523*4882a593Smuzhiyun 		goto out_free_scratch;
524*4882a593Smuzhiyun 
525*4882a593Smuzhiyun 	for (i = 0; i < nr_volumes; i++) {
526*4882a593Smuzhiyun 		ret = nfs4_block_decode_volume(&xdr, &volumes[i]);
527*4882a593Smuzhiyun 		if (ret < 0)
528*4882a593Smuzhiyun 			goto out_free_volumes;
529*4882a593Smuzhiyun 	}
530*4882a593Smuzhiyun 
531*4882a593Smuzhiyun 	top = kzalloc(sizeof(*top), gfp_mask);
532*4882a593Smuzhiyun 	if (!top)
533*4882a593Smuzhiyun 		goto out_free_volumes;
534*4882a593Smuzhiyun 
535*4882a593Smuzhiyun 	ret = bl_parse_deviceid(server, top, volumes, nr_volumes - 1, gfp_mask);
536*4882a593Smuzhiyun 
537*4882a593Smuzhiyun 	node = &top->node;
538*4882a593Smuzhiyun 	nfs4_init_deviceid_node(node, server, &pdev->dev_id);
539*4882a593Smuzhiyun 	if (ret)
540*4882a593Smuzhiyun 		nfs4_mark_deviceid_unavailable(node);
541*4882a593Smuzhiyun 
542*4882a593Smuzhiyun out_free_volumes:
543*4882a593Smuzhiyun 	kfree(volumes);
544*4882a593Smuzhiyun out_free_scratch:
545*4882a593Smuzhiyun 	__free_page(scratch);
546*4882a593Smuzhiyun out:
547*4882a593Smuzhiyun 	return node;
548*4882a593Smuzhiyun }
549