xref: /OK3568_Linux_fs/kernel/drivers/md/dm-switch.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
/*
 * Copyright (C) 2010-2012 by Dell Inc.  All rights reserved.
 * Copyright (C) 2011-2013 Red Hat, Inc.
 *
 * This file is released under the GPL.
 *
 * dm-switch is a device-mapper target that maps IO to underlying block
 * devices efficiently when there are a large number of fixed-sized
 * address regions but there is no simple pattern to allow for a compact
 * mapping representation such as dm-stripe.
 */
12*4882a593Smuzhiyun 
13*4882a593Smuzhiyun #include <linux/device-mapper.h>
14*4882a593Smuzhiyun 
15*4882a593Smuzhiyun #include <linux/module.h>
16*4882a593Smuzhiyun #include <linux/init.h>
17*4882a593Smuzhiyun #include <linux/vmalloc.h>
18*4882a593Smuzhiyun 
19*4882a593Smuzhiyun #define DM_MSG_PREFIX "switch"
20*4882a593Smuzhiyun 
/*
 * The region table is an array of slots.  A slot is a single unsigned long
 * that packs <region_entries_per_slot> table entries, each of them
 * <region_table_entry_bits> bits wide.
 */
typedef unsigned long region_table_slot_t;
26*4882a593Smuzhiyun 
27*4882a593Smuzhiyun /*
28*4882a593Smuzhiyun  * A device with the offset to its start sector.
29*4882a593Smuzhiyun  */
30*4882a593Smuzhiyun struct switch_path {
31*4882a593Smuzhiyun 	struct dm_dev *dmdev;
32*4882a593Smuzhiyun 	sector_t start;
33*4882a593Smuzhiyun };
34*4882a593Smuzhiyun 
35*4882a593Smuzhiyun /*
36*4882a593Smuzhiyun  * Context block for a dm switch device.
37*4882a593Smuzhiyun  */
38*4882a593Smuzhiyun struct switch_ctx {
39*4882a593Smuzhiyun 	struct dm_target *ti;
40*4882a593Smuzhiyun 
41*4882a593Smuzhiyun 	unsigned nr_paths;		/* Number of paths in path_list. */
42*4882a593Smuzhiyun 
43*4882a593Smuzhiyun 	unsigned region_size;		/* Region size in 512-byte sectors */
44*4882a593Smuzhiyun 	unsigned long nr_regions;	/* Number of regions making up the device */
45*4882a593Smuzhiyun 	signed char region_size_bits;	/* log2 of region_size or -1 */
46*4882a593Smuzhiyun 
47*4882a593Smuzhiyun 	unsigned char region_table_entry_bits;	/* Number of bits in one region table entry */
48*4882a593Smuzhiyun 	unsigned char region_entries_per_slot;	/* Number of entries in one region table slot */
49*4882a593Smuzhiyun 	signed char region_entries_per_slot_bits;	/* log2 of region_entries_per_slot or -1 */
50*4882a593Smuzhiyun 
51*4882a593Smuzhiyun 	region_table_slot_t *region_table;	/* Region table */
52*4882a593Smuzhiyun 
53*4882a593Smuzhiyun 	/*
54*4882a593Smuzhiyun 	 * Array of dm devices to switch between.
55*4882a593Smuzhiyun 	 */
56*4882a593Smuzhiyun 	struct switch_path path_list[];
57*4882a593Smuzhiyun };
58*4882a593Smuzhiyun 
alloc_switch_ctx(struct dm_target * ti,unsigned nr_paths,unsigned region_size)59*4882a593Smuzhiyun static struct switch_ctx *alloc_switch_ctx(struct dm_target *ti, unsigned nr_paths,
60*4882a593Smuzhiyun 					   unsigned region_size)
61*4882a593Smuzhiyun {
62*4882a593Smuzhiyun 	struct switch_ctx *sctx;
63*4882a593Smuzhiyun 
64*4882a593Smuzhiyun 	sctx = kzalloc(struct_size(sctx, path_list, nr_paths), GFP_KERNEL);
65*4882a593Smuzhiyun 	if (!sctx)
66*4882a593Smuzhiyun 		return NULL;
67*4882a593Smuzhiyun 
68*4882a593Smuzhiyun 	sctx->ti = ti;
69*4882a593Smuzhiyun 	sctx->region_size = region_size;
70*4882a593Smuzhiyun 
71*4882a593Smuzhiyun 	ti->private = sctx;
72*4882a593Smuzhiyun 
73*4882a593Smuzhiyun 	return sctx;
74*4882a593Smuzhiyun }
75*4882a593Smuzhiyun 
alloc_region_table(struct dm_target * ti,unsigned nr_paths)76*4882a593Smuzhiyun static int alloc_region_table(struct dm_target *ti, unsigned nr_paths)
77*4882a593Smuzhiyun {
78*4882a593Smuzhiyun 	struct switch_ctx *sctx = ti->private;
79*4882a593Smuzhiyun 	sector_t nr_regions = ti->len;
80*4882a593Smuzhiyun 	sector_t nr_slots;
81*4882a593Smuzhiyun 
82*4882a593Smuzhiyun 	if (!(sctx->region_size & (sctx->region_size - 1)))
83*4882a593Smuzhiyun 		sctx->region_size_bits = __ffs(sctx->region_size);
84*4882a593Smuzhiyun 	else
85*4882a593Smuzhiyun 		sctx->region_size_bits = -1;
86*4882a593Smuzhiyun 
87*4882a593Smuzhiyun 	sctx->region_table_entry_bits = 1;
88*4882a593Smuzhiyun 	while (sctx->region_table_entry_bits < sizeof(region_table_slot_t) * 8 &&
89*4882a593Smuzhiyun 	       (region_table_slot_t)1 << sctx->region_table_entry_bits < nr_paths)
90*4882a593Smuzhiyun 		sctx->region_table_entry_bits++;
91*4882a593Smuzhiyun 
92*4882a593Smuzhiyun 	sctx->region_entries_per_slot = (sizeof(region_table_slot_t) * 8) / sctx->region_table_entry_bits;
93*4882a593Smuzhiyun 	if (!(sctx->region_entries_per_slot & (sctx->region_entries_per_slot - 1)))
94*4882a593Smuzhiyun 		sctx->region_entries_per_slot_bits = __ffs(sctx->region_entries_per_slot);
95*4882a593Smuzhiyun 	else
96*4882a593Smuzhiyun 		sctx->region_entries_per_slot_bits = -1;
97*4882a593Smuzhiyun 
98*4882a593Smuzhiyun 	if (sector_div(nr_regions, sctx->region_size))
99*4882a593Smuzhiyun 		nr_regions++;
100*4882a593Smuzhiyun 
101*4882a593Smuzhiyun 	if (nr_regions >= ULONG_MAX) {
102*4882a593Smuzhiyun 		ti->error = "Region table too large";
103*4882a593Smuzhiyun 		return -EINVAL;
104*4882a593Smuzhiyun 	}
105*4882a593Smuzhiyun 	sctx->nr_regions = nr_regions;
106*4882a593Smuzhiyun 
107*4882a593Smuzhiyun 	nr_slots = nr_regions;
108*4882a593Smuzhiyun 	if (sector_div(nr_slots, sctx->region_entries_per_slot))
109*4882a593Smuzhiyun 		nr_slots++;
110*4882a593Smuzhiyun 
111*4882a593Smuzhiyun 	if (nr_slots > ULONG_MAX / sizeof(region_table_slot_t)) {
112*4882a593Smuzhiyun 		ti->error = "Region table too large";
113*4882a593Smuzhiyun 		return -EINVAL;
114*4882a593Smuzhiyun 	}
115*4882a593Smuzhiyun 
116*4882a593Smuzhiyun 	sctx->region_table = vmalloc(array_size(nr_slots,
117*4882a593Smuzhiyun 						sizeof(region_table_slot_t)));
118*4882a593Smuzhiyun 	if (!sctx->region_table) {
119*4882a593Smuzhiyun 		ti->error = "Cannot allocate region table";
120*4882a593Smuzhiyun 		return -ENOMEM;
121*4882a593Smuzhiyun 	}
122*4882a593Smuzhiyun 
123*4882a593Smuzhiyun 	return 0;
124*4882a593Smuzhiyun }
125*4882a593Smuzhiyun 
switch_get_position(struct switch_ctx * sctx,unsigned long region_nr,unsigned long * region_index,unsigned * bit)126*4882a593Smuzhiyun static void switch_get_position(struct switch_ctx *sctx, unsigned long region_nr,
127*4882a593Smuzhiyun 				unsigned long *region_index, unsigned *bit)
128*4882a593Smuzhiyun {
129*4882a593Smuzhiyun 	if (sctx->region_entries_per_slot_bits >= 0) {
130*4882a593Smuzhiyun 		*region_index = region_nr >> sctx->region_entries_per_slot_bits;
131*4882a593Smuzhiyun 		*bit = region_nr & (sctx->region_entries_per_slot - 1);
132*4882a593Smuzhiyun 	} else {
133*4882a593Smuzhiyun 		*region_index = region_nr / sctx->region_entries_per_slot;
134*4882a593Smuzhiyun 		*bit = region_nr % sctx->region_entries_per_slot;
135*4882a593Smuzhiyun 	}
136*4882a593Smuzhiyun 
137*4882a593Smuzhiyun 	*bit *= sctx->region_table_entry_bits;
138*4882a593Smuzhiyun }
139*4882a593Smuzhiyun 
switch_region_table_read(struct switch_ctx * sctx,unsigned long region_nr)140*4882a593Smuzhiyun static unsigned switch_region_table_read(struct switch_ctx *sctx, unsigned long region_nr)
141*4882a593Smuzhiyun {
142*4882a593Smuzhiyun 	unsigned long region_index;
143*4882a593Smuzhiyun 	unsigned bit;
144*4882a593Smuzhiyun 
145*4882a593Smuzhiyun 	switch_get_position(sctx, region_nr, &region_index, &bit);
146*4882a593Smuzhiyun 
147*4882a593Smuzhiyun 	return (READ_ONCE(sctx->region_table[region_index]) >> bit) &
148*4882a593Smuzhiyun 		((1 << sctx->region_table_entry_bits) - 1);
149*4882a593Smuzhiyun }
150*4882a593Smuzhiyun 
151*4882a593Smuzhiyun /*
152*4882a593Smuzhiyun  * Find which path to use at given offset.
153*4882a593Smuzhiyun  */
switch_get_path_nr(struct switch_ctx * sctx,sector_t offset)154*4882a593Smuzhiyun static unsigned switch_get_path_nr(struct switch_ctx *sctx, sector_t offset)
155*4882a593Smuzhiyun {
156*4882a593Smuzhiyun 	unsigned path_nr;
157*4882a593Smuzhiyun 	sector_t p;
158*4882a593Smuzhiyun 
159*4882a593Smuzhiyun 	p = offset;
160*4882a593Smuzhiyun 	if (sctx->region_size_bits >= 0)
161*4882a593Smuzhiyun 		p >>= sctx->region_size_bits;
162*4882a593Smuzhiyun 	else
163*4882a593Smuzhiyun 		sector_div(p, sctx->region_size);
164*4882a593Smuzhiyun 
165*4882a593Smuzhiyun 	path_nr = switch_region_table_read(sctx, p);
166*4882a593Smuzhiyun 
167*4882a593Smuzhiyun 	/* This can only happen if the processor uses non-atomic stores. */
168*4882a593Smuzhiyun 	if (unlikely(path_nr >= sctx->nr_paths))
169*4882a593Smuzhiyun 		path_nr = 0;
170*4882a593Smuzhiyun 
171*4882a593Smuzhiyun 	return path_nr;
172*4882a593Smuzhiyun }
173*4882a593Smuzhiyun 
switch_region_table_write(struct switch_ctx * sctx,unsigned long region_nr,unsigned value)174*4882a593Smuzhiyun static void switch_region_table_write(struct switch_ctx *sctx, unsigned long region_nr,
175*4882a593Smuzhiyun 				      unsigned value)
176*4882a593Smuzhiyun {
177*4882a593Smuzhiyun 	unsigned long region_index;
178*4882a593Smuzhiyun 	unsigned bit;
179*4882a593Smuzhiyun 	region_table_slot_t pte;
180*4882a593Smuzhiyun 
181*4882a593Smuzhiyun 	switch_get_position(sctx, region_nr, &region_index, &bit);
182*4882a593Smuzhiyun 
183*4882a593Smuzhiyun 	pte = sctx->region_table[region_index];
184*4882a593Smuzhiyun 	pte &= ~((((region_table_slot_t)1 << sctx->region_table_entry_bits) - 1) << bit);
185*4882a593Smuzhiyun 	pte |= (region_table_slot_t)value << bit;
186*4882a593Smuzhiyun 	sctx->region_table[region_index] = pte;
187*4882a593Smuzhiyun }
188*4882a593Smuzhiyun 
189*4882a593Smuzhiyun /*
190*4882a593Smuzhiyun  * Fill the region table with an initial round robin pattern.
191*4882a593Smuzhiyun  */
initialise_region_table(struct switch_ctx * sctx)192*4882a593Smuzhiyun static void initialise_region_table(struct switch_ctx *sctx)
193*4882a593Smuzhiyun {
194*4882a593Smuzhiyun 	unsigned path_nr = 0;
195*4882a593Smuzhiyun 	unsigned long region_nr;
196*4882a593Smuzhiyun 
197*4882a593Smuzhiyun 	for (region_nr = 0; region_nr < sctx->nr_regions; region_nr++) {
198*4882a593Smuzhiyun 		switch_region_table_write(sctx, region_nr, path_nr);
199*4882a593Smuzhiyun 		if (++path_nr >= sctx->nr_paths)
200*4882a593Smuzhiyun 			path_nr = 0;
201*4882a593Smuzhiyun 	}
202*4882a593Smuzhiyun }
203*4882a593Smuzhiyun 
parse_path(struct dm_arg_set * as,struct dm_target * ti)204*4882a593Smuzhiyun static int parse_path(struct dm_arg_set *as, struct dm_target *ti)
205*4882a593Smuzhiyun {
206*4882a593Smuzhiyun 	struct switch_ctx *sctx = ti->private;
207*4882a593Smuzhiyun 	unsigned long long start;
208*4882a593Smuzhiyun 	int r;
209*4882a593Smuzhiyun 
210*4882a593Smuzhiyun 	r = dm_get_device(ti, dm_shift_arg(as), dm_table_get_mode(ti->table),
211*4882a593Smuzhiyun 			  &sctx->path_list[sctx->nr_paths].dmdev);
212*4882a593Smuzhiyun 	if (r) {
213*4882a593Smuzhiyun 		ti->error = "Device lookup failed";
214*4882a593Smuzhiyun 		return r;
215*4882a593Smuzhiyun 	}
216*4882a593Smuzhiyun 
217*4882a593Smuzhiyun 	if (kstrtoull(dm_shift_arg(as), 10, &start) || start != (sector_t)start) {
218*4882a593Smuzhiyun 		ti->error = "Invalid device starting offset";
219*4882a593Smuzhiyun 		dm_put_device(ti, sctx->path_list[sctx->nr_paths].dmdev);
220*4882a593Smuzhiyun 		return -EINVAL;
221*4882a593Smuzhiyun 	}
222*4882a593Smuzhiyun 
223*4882a593Smuzhiyun 	sctx->path_list[sctx->nr_paths].start = start;
224*4882a593Smuzhiyun 
225*4882a593Smuzhiyun 	sctx->nr_paths++;
226*4882a593Smuzhiyun 
227*4882a593Smuzhiyun 	return 0;
228*4882a593Smuzhiyun }
229*4882a593Smuzhiyun 
230*4882a593Smuzhiyun /*
231*4882a593Smuzhiyun  * Destructor: Don't free the dm_target, just the ti->private data (if any).
232*4882a593Smuzhiyun  */
switch_dtr(struct dm_target * ti)233*4882a593Smuzhiyun static void switch_dtr(struct dm_target *ti)
234*4882a593Smuzhiyun {
235*4882a593Smuzhiyun 	struct switch_ctx *sctx = ti->private;
236*4882a593Smuzhiyun 
237*4882a593Smuzhiyun 	while (sctx->nr_paths--)
238*4882a593Smuzhiyun 		dm_put_device(ti, sctx->path_list[sctx->nr_paths].dmdev);
239*4882a593Smuzhiyun 
240*4882a593Smuzhiyun 	vfree(sctx->region_table);
241*4882a593Smuzhiyun 	kfree(sctx);
242*4882a593Smuzhiyun }
243*4882a593Smuzhiyun 
244*4882a593Smuzhiyun /*
245*4882a593Smuzhiyun  * Constructor arguments:
246*4882a593Smuzhiyun  *   <num_paths> <region_size> <num_optional_args> [<optional_args>...]
247*4882a593Smuzhiyun  *   [<dev_path> <offset>]+
248*4882a593Smuzhiyun  *
249*4882a593Smuzhiyun  * Optional args are to allow for future extension: currently this
250*4882a593Smuzhiyun  * parameter must be 0.
251*4882a593Smuzhiyun  */
switch_ctr(struct dm_target * ti,unsigned argc,char ** argv)252*4882a593Smuzhiyun static int switch_ctr(struct dm_target *ti, unsigned argc, char **argv)
253*4882a593Smuzhiyun {
254*4882a593Smuzhiyun 	static const struct dm_arg _args[] = {
255*4882a593Smuzhiyun 		{1, (KMALLOC_MAX_SIZE - sizeof(struct switch_ctx)) / sizeof(struct switch_path), "Invalid number of paths"},
256*4882a593Smuzhiyun 		{1, UINT_MAX, "Invalid region size"},
257*4882a593Smuzhiyun 		{0, 0, "Invalid number of optional args"},
258*4882a593Smuzhiyun 	};
259*4882a593Smuzhiyun 
260*4882a593Smuzhiyun 	struct switch_ctx *sctx;
261*4882a593Smuzhiyun 	struct dm_arg_set as;
262*4882a593Smuzhiyun 	unsigned nr_paths, region_size, nr_optional_args;
263*4882a593Smuzhiyun 	int r;
264*4882a593Smuzhiyun 
265*4882a593Smuzhiyun 	as.argc = argc;
266*4882a593Smuzhiyun 	as.argv = argv;
267*4882a593Smuzhiyun 
268*4882a593Smuzhiyun 	r = dm_read_arg(_args, &as, &nr_paths, &ti->error);
269*4882a593Smuzhiyun 	if (r)
270*4882a593Smuzhiyun 		return -EINVAL;
271*4882a593Smuzhiyun 
272*4882a593Smuzhiyun 	r = dm_read_arg(_args + 1, &as, &region_size, &ti->error);
273*4882a593Smuzhiyun 	if (r)
274*4882a593Smuzhiyun 		return r;
275*4882a593Smuzhiyun 
276*4882a593Smuzhiyun 	r = dm_read_arg_group(_args + 2, &as, &nr_optional_args, &ti->error);
277*4882a593Smuzhiyun 	if (r)
278*4882a593Smuzhiyun 		return r;
279*4882a593Smuzhiyun 	/* parse optional arguments here, if we add any */
280*4882a593Smuzhiyun 
281*4882a593Smuzhiyun 	if (as.argc != nr_paths * 2) {
282*4882a593Smuzhiyun 		ti->error = "Incorrect number of path arguments";
283*4882a593Smuzhiyun 		return -EINVAL;
284*4882a593Smuzhiyun 	}
285*4882a593Smuzhiyun 
286*4882a593Smuzhiyun 	sctx = alloc_switch_ctx(ti, nr_paths, region_size);
287*4882a593Smuzhiyun 	if (!sctx) {
288*4882a593Smuzhiyun 		ti->error = "Cannot allocate redirection context";
289*4882a593Smuzhiyun 		return -ENOMEM;
290*4882a593Smuzhiyun 	}
291*4882a593Smuzhiyun 
292*4882a593Smuzhiyun 	r = dm_set_target_max_io_len(ti, region_size);
293*4882a593Smuzhiyun 	if (r)
294*4882a593Smuzhiyun 		goto error;
295*4882a593Smuzhiyun 
296*4882a593Smuzhiyun 	while (as.argc) {
297*4882a593Smuzhiyun 		r = parse_path(&as, ti);
298*4882a593Smuzhiyun 		if (r)
299*4882a593Smuzhiyun 			goto error;
300*4882a593Smuzhiyun 	}
301*4882a593Smuzhiyun 
302*4882a593Smuzhiyun 	r = alloc_region_table(ti, nr_paths);
303*4882a593Smuzhiyun 	if (r)
304*4882a593Smuzhiyun 		goto error;
305*4882a593Smuzhiyun 
306*4882a593Smuzhiyun 	initialise_region_table(sctx);
307*4882a593Smuzhiyun 
308*4882a593Smuzhiyun 	/* For UNMAP, sending the request down any path is sufficient */
309*4882a593Smuzhiyun 	ti->num_discard_bios = 1;
310*4882a593Smuzhiyun 
311*4882a593Smuzhiyun 	return 0;
312*4882a593Smuzhiyun 
313*4882a593Smuzhiyun error:
314*4882a593Smuzhiyun 	switch_dtr(ti);
315*4882a593Smuzhiyun 
316*4882a593Smuzhiyun 	return r;
317*4882a593Smuzhiyun }
318*4882a593Smuzhiyun 
switch_map(struct dm_target * ti,struct bio * bio)319*4882a593Smuzhiyun static int switch_map(struct dm_target *ti, struct bio *bio)
320*4882a593Smuzhiyun {
321*4882a593Smuzhiyun 	struct switch_ctx *sctx = ti->private;
322*4882a593Smuzhiyun 	sector_t offset = dm_target_offset(ti, bio->bi_iter.bi_sector);
323*4882a593Smuzhiyun 	unsigned path_nr = switch_get_path_nr(sctx, offset);
324*4882a593Smuzhiyun 
325*4882a593Smuzhiyun 	bio_set_dev(bio, sctx->path_list[path_nr].dmdev->bdev);
326*4882a593Smuzhiyun 	bio->bi_iter.bi_sector = sctx->path_list[path_nr].start + offset;
327*4882a593Smuzhiyun 
328*4882a593Smuzhiyun 	return DM_MAPIO_REMAPPED;
329*4882a593Smuzhiyun }
330*4882a593Smuzhiyun 
/*
 * We need to parse hex numbers in the message as quickly as possible.
 *
 * This table-based hex parser improves performance.
 * It improves the time to load 1000000 entries compared to the
 * condition-based parser.
 *		table-based parser	condition-based parser
 * PA-RISC	0.29s			0.31s
 * Opteron	0.0495s			0.0498s
 *
 * The table maps a character code to the value of that hex digit; every
 * character that is not a hex digit maps to 255.
 */
static const unsigned char hex_table[256] = {
	[0 ... 255] = 255,	/* default: not a hex digit */

	['0'] = 0,  ['1'] = 1,  ['2'] = 2,  ['3'] = 3,  ['4'] = 4,
	['5'] = 5,  ['6'] = 6,  ['7'] = 7,  ['8'] = 8,  ['9'] = 9,

	['A'] = 10, ['B'] = 11, ['C'] = 12, ['D'] = 13, ['E'] = 14, ['F'] = 15,

	['a'] = 10, ['b'] = 11, ['c'] = 12, ['d'] = 13, ['e'] = 14, ['f'] = 15,
};
359*4882a593Smuzhiyun 
parse_hex(const char ** string)360*4882a593Smuzhiyun static __always_inline unsigned long parse_hex(const char **string)
361*4882a593Smuzhiyun {
362*4882a593Smuzhiyun 	unsigned char d;
363*4882a593Smuzhiyun 	unsigned long r = 0;
364*4882a593Smuzhiyun 
365*4882a593Smuzhiyun 	while ((d = hex_table[(unsigned char)**string]) < 16) {
366*4882a593Smuzhiyun 		r = (r << 4) | d;
367*4882a593Smuzhiyun 		(*string)++;
368*4882a593Smuzhiyun 	}
369*4882a593Smuzhiyun 
370*4882a593Smuzhiyun 	return r;
371*4882a593Smuzhiyun }
372*4882a593Smuzhiyun 
process_set_region_mappings(struct switch_ctx * sctx,unsigned argc,char ** argv)373*4882a593Smuzhiyun static int process_set_region_mappings(struct switch_ctx *sctx,
374*4882a593Smuzhiyun 				       unsigned argc, char **argv)
375*4882a593Smuzhiyun {
376*4882a593Smuzhiyun 	unsigned i;
377*4882a593Smuzhiyun 	unsigned long region_index = 0;
378*4882a593Smuzhiyun 
379*4882a593Smuzhiyun 	for (i = 1; i < argc; i++) {
380*4882a593Smuzhiyun 		unsigned long path_nr;
381*4882a593Smuzhiyun 		const char *string = argv[i];
382*4882a593Smuzhiyun 
383*4882a593Smuzhiyun 		if ((*string & 0xdf) == 'R') {
384*4882a593Smuzhiyun 			unsigned long cycle_length, num_write;
385*4882a593Smuzhiyun 
386*4882a593Smuzhiyun 			string++;
387*4882a593Smuzhiyun 			if (unlikely(*string == ',')) {
388*4882a593Smuzhiyun 				DMWARN("invalid set_region_mappings argument: '%s'", argv[i]);
389*4882a593Smuzhiyun 				return -EINVAL;
390*4882a593Smuzhiyun 			}
391*4882a593Smuzhiyun 			cycle_length = parse_hex(&string);
392*4882a593Smuzhiyun 			if (unlikely(*string != ',')) {
393*4882a593Smuzhiyun 				DMWARN("invalid set_region_mappings argument: '%s'", argv[i]);
394*4882a593Smuzhiyun 				return -EINVAL;
395*4882a593Smuzhiyun 			}
396*4882a593Smuzhiyun 			string++;
397*4882a593Smuzhiyun 			if (unlikely(!*string)) {
398*4882a593Smuzhiyun 				DMWARN("invalid set_region_mappings argument: '%s'", argv[i]);
399*4882a593Smuzhiyun 				return -EINVAL;
400*4882a593Smuzhiyun 			}
401*4882a593Smuzhiyun 			num_write = parse_hex(&string);
402*4882a593Smuzhiyun 			if (unlikely(*string)) {
403*4882a593Smuzhiyun 				DMWARN("invalid set_region_mappings argument: '%s'", argv[i]);
404*4882a593Smuzhiyun 				return -EINVAL;
405*4882a593Smuzhiyun 			}
406*4882a593Smuzhiyun 
407*4882a593Smuzhiyun 			if (unlikely(!cycle_length) || unlikely(cycle_length - 1 > region_index)) {
408*4882a593Smuzhiyun 				DMWARN("invalid set_region_mappings cycle length: %lu > %lu",
409*4882a593Smuzhiyun 				       cycle_length - 1, region_index);
410*4882a593Smuzhiyun 				return -EINVAL;
411*4882a593Smuzhiyun 			}
412*4882a593Smuzhiyun 			if (unlikely(region_index + num_write < region_index) ||
413*4882a593Smuzhiyun 			    unlikely(region_index + num_write >= sctx->nr_regions)) {
414*4882a593Smuzhiyun 				DMWARN("invalid set_region_mappings region number: %lu + %lu >= %lu",
415*4882a593Smuzhiyun 				       region_index, num_write, sctx->nr_regions);
416*4882a593Smuzhiyun 				return -EINVAL;
417*4882a593Smuzhiyun 			}
418*4882a593Smuzhiyun 
419*4882a593Smuzhiyun 			while (num_write--) {
420*4882a593Smuzhiyun 				region_index++;
421*4882a593Smuzhiyun 				path_nr = switch_region_table_read(sctx, region_index - cycle_length);
422*4882a593Smuzhiyun 				switch_region_table_write(sctx, region_index, path_nr);
423*4882a593Smuzhiyun 			}
424*4882a593Smuzhiyun 
425*4882a593Smuzhiyun 			continue;
426*4882a593Smuzhiyun 		}
427*4882a593Smuzhiyun 
428*4882a593Smuzhiyun 		if (*string == ':')
429*4882a593Smuzhiyun 			region_index++;
430*4882a593Smuzhiyun 		else {
431*4882a593Smuzhiyun 			region_index = parse_hex(&string);
432*4882a593Smuzhiyun 			if (unlikely(*string != ':')) {
433*4882a593Smuzhiyun 				DMWARN("invalid set_region_mappings argument: '%s'", argv[i]);
434*4882a593Smuzhiyun 				return -EINVAL;
435*4882a593Smuzhiyun 			}
436*4882a593Smuzhiyun 		}
437*4882a593Smuzhiyun 
438*4882a593Smuzhiyun 		string++;
439*4882a593Smuzhiyun 		if (unlikely(!*string)) {
440*4882a593Smuzhiyun 			DMWARN("invalid set_region_mappings argument: '%s'", argv[i]);
441*4882a593Smuzhiyun 			return -EINVAL;
442*4882a593Smuzhiyun 		}
443*4882a593Smuzhiyun 
444*4882a593Smuzhiyun 		path_nr = parse_hex(&string);
445*4882a593Smuzhiyun 		if (unlikely(*string)) {
446*4882a593Smuzhiyun 			DMWARN("invalid set_region_mappings argument: '%s'", argv[i]);
447*4882a593Smuzhiyun 			return -EINVAL;
448*4882a593Smuzhiyun 		}
449*4882a593Smuzhiyun 		if (unlikely(region_index >= sctx->nr_regions)) {
450*4882a593Smuzhiyun 			DMWARN("invalid set_region_mappings region number: %lu >= %lu", region_index, sctx->nr_regions);
451*4882a593Smuzhiyun 			return -EINVAL;
452*4882a593Smuzhiyun 		}
453*4882a593Smuzhiyun 		if (unlikely(path_nr >= sctx->nr_paths)) {
454*4882a593Smuzhiyun 			DMWARN("invalid set_region_mappings device: %lu >= %u", path_nr, sctx->nr_paths);
455*4882a593Smuzhiyun 			return -EINVAL;
456*4882a593Smuzhiyun 		}
457*4882a593Smuzhiyun 
458*4882a593Smuzhiyun 		switch_region_table_write(sctx, region_index, path_nr);
459*4882a593Smuzhiyun 	}
460*4882a593Smuzhiyun 
461*4882a593Smuzhiyun 	return 0;
462*4882a593Smuzhiyun }
463*4882a593Smuzhiyun 
464*4882a593Smuzhiyun /*
465*4882a593Smuzhiyun  * Messages are processed one-at-a-time.
466*4882a593Smuzhiyun  *
467*4882a593Smuzhiyun  * Only set_region_mappings is supported.
468*4882a593Smuzhiyun  */
switch_message(struct dm_target * ti,unsigned argc,char ** argv,char * result,unsigned maxlen)469*4882a593Smuzhiyun static int switch_message(struct dm_target *ti, unsigned argc, char **argv,
470*4882a593Smuzhiyun 			  char *result, unsigned maxlen)
471*4882a593Smuzhiyun {
472*4882a593Smuzhiyun 	static DEFINE_MUTEX(message_mutex);
473*4882a593Smuzhiyun 
474*4882a593Smuzhiyun 	struct switch_ctx *sctx = ti->private;
475*4882a593Smuzhiyun 	int r = -EINVAL;
476*4882a593Smuzhiyun 
477*4882a593Smuzhiyun 	mutex_lock(&message_mutex);
478*4882a593Smuzhiyun 
479*4882a593Smuzhiyun 	if (!strcasecmp(argv[0], "set_region_mappings"))
480*4882a593Smuzhiyun 		r = process_set_region_mappings(sctx, argc, argv);
481*4882a593Smuzhiyun 	else
482*4882a593Smuzhiyun 		DMWARN("Unrecognised message received.");
483*4882a593Smuzhiyun 
484*4882a593Smuzhiyun 	mutex_unlock(&message_mutex);
485*4882a593Smuzhiyun 
486*4882a593Smuzhiyun 	return r;
487*4882a593Smuzhiyun }
488*4882a593Smuzhiyun 
/*
 * Status function.
 *
 * STATUSTYPE_INFO yields an empty string.  STATUSTYPE_TABLE emits the
 * table line: "<nr_paths> <region_size> 0" followed by one
 * " <device name> <start>" pair per path.  Other types emit nothing.
 */
static void switch_status(struct dm_target *ti, status_type_t type,
			  unsigned status_flags, char *result, unsigned maxlen)
{
	struct switch_ctx *sctx = ti->private;
	unsigned sz = 0;	/* Output position, advanced by DMEMIT() */
	int path_nr;

	if (type == STATUSTYPE_INFO) {
		result[0] = '\0';
		return;
	}

	if (type != STATUSTYPE_TABLE)
		return;

	DMEMIT("%u %u 0", sctx->nr_paths, sctx->region_size);
	for (path_nr = 0; path_nr < sctx->nr_paths; path_nr++) {
		struct switch_path *path = &sctx->path_list[path_nr];

		DMEMIT(" %s %llu", path->dmdev->name,
		       (unsigned long long)path->start);
	}
}
509*4882a593Smuzhiyun 
510*4882a593Smuzhiyun /*
511*4882a593Smuzhiyun  * Switch ioctl:
512*4882a593Smuzhiyun  *
513*4882a593Smuzhiyun  * Passthrough all ioctls to the path for sector 0
514*4882a593Smuzhiyun  */
switch_prepare_ioctl(struct dm_target * ti,struct block_device ** bdev)515*4882a593Smuzhiyun static int switch_prepare_ioctl(struct dm_target *ti, struct block_device **bdev)
516*4882a593Smuzhiyun {
517*4882a593Smuzhiyun 	struct switch_ctx *sctx = ti->private;
518*4882a593Smuzhiyun 	unsigned path_nr;
519*4882a593Smuzhiyun 
520*4882a593Smuzhiyun 	path_nr = switch_get_path_nr(sctx, 0);
521*4882a593Smuzhiyun 
522*4882a593Smuzhiyun 	*bdev = sctx->path_list[path_nr].dmdev->bdev;
523*4882a593Smuzhiyun 
524*4882a593Smuzhiyun 	/*
525*4882a593Smuzhiyun 	 * Only pass ioctls through if the device sizes match exactly.
526*4882a593Smuzhiyun 	 */
527*4882a593Smuzhiyun 	if (ti->len + sctx->path_list[path_nr].start !=
528*4882a593Smuzhiyun 	    i_size_read((*bdev)->bd_inode) >> SECTOR_SHIFT)
529*4882a593Smuzhiyun 		return 1;
530*4882a593Smuzhiyun 	return 0;
531*4882a593Smuzhiyun }
532*4882a593Smuzhiyun 
/*
 * Call fn for every path with the path's device, its start offset and the
 * target length.  Iteration stops at the first non-zero return from fn and
 * that value is returned; 0 is returned if every call returned 0.
 */
static int switch_iterate_devices(struct dm_target *ti,
				  iterate_devices_callout_fn fn, void *data)
{
	struct switch_ctx *sctx = ti->private;
	int path_nr;
	int r = 0;

	for (path_nr = 0; !r && path_nr < sctx->nr_paths; path_nr++) {
		struct switch_path *path = &sctx->path_list[path_nr];

		r = fn(ti, path->dmdev, path->start, ti->len, data);
	}

	return r;
}
549*4882a593Smuzhiyun 
550*4882a593Smuzhiyun static struct target_type switch_target = {
551*4882a593Smuzhiyun 	.name = "switch",
552*4882a593Smuzhiyun 	.version = {1, 1, 0},
553*4882a593Smuzhiyun 	.module = THIS_MODULE,
554*4882a593Smuzhiyun 	.ctr = switch_ctr,
555*4882a593Smuzhiyun 	.dtr = switch_dtr,
556*4882a593Smuzhiyun 	.map = switch_map,
557*4882a593Smuzhiyun 	.message = switch_message,
558*4882a593Smuzhiyun 	.status = switch_status,
559*4882a593Smuzhiyun 	.prepare_ioctl = switch_prepare_ioctl,
560*4882a593Smuzhiyun 	.iterate_devices = switch_iterate_devices,
561*4882a593Smuzhiyun };
562*4882a593Smuzhiyun 
dm_switch_init(void)563*4882a593Smuzhiyun static int __init dm_switch_init(void)
564*4882a593Smuzhiyun {
565*4882a593Smuzhiyun 	int r;
566*4882a593Smuzhiyun 
567*4882a593Smuzhiyun 	r = dm_register_target(&switch_target);
568*4882a593Smuzhiyun 	if (r < 0)
569*4882a593Smuzhiyun 		DMERR("dm_register_target() failed %d", r);
570*4882a593Smuzhiyun 
571*4882a593Smuzhiyun 	return r;
572*4882a593Smuzhiyun }
573*4882a593Smuzhiyun 
dm_switch_exit(void)574*4882a593Smuzhiyun static void __exit dm_switch_exit(void)
575*4882a593Smuzhiyun {
576*4882a593Smuzhiyun 	dm_unregister_target(&switch_target);
577*4882a593Smuzhiyun }
578*4882a593Smuzhiyun 
579*4882a593Smuzhiyun module_init(dm_switch_init);
580*4882a593Smuzhiyun module_exit(dm_switch_exit);
581*4882a593Smuzhiyun 
582*4882a593Smuzhiyun MODULE_DESCRIPTION(DM_NAME " dynamic path switching target");
583*4882a593Smuzhiyun MODULE_AUTHOR("Kevin D. O'Kelley <Kevin_OKelley@dell.com>");
584*4882a593Smuzhiyun MODULE_AUTHOR("Narendran Ganapathy <Narendran_Ganapathy@dell.com>");
585*4882a593Smuzhiyun MODULE_AUTHOR("Jim Ramsay <Jim_Ramsay@dell.com>");
586*4882a593Smuzhiyun MODULE_AUTHOR("Mikulas Patocka <mpatocka@redhat.com>");
587*4882a593Smuzhiyun MODULE_LICENSE("GPL");
588