/*
 * Copyright (C) 2010-2012 by Dell Inc.  All rights reserved.
 * Copyright (C) 2011-2013 Red Hat, Inc.
 *
 * This file is released under the GPL.
 *
 * dm-switch is a device-mapper target that maps IO to underlying block
 * devices efficiently when there are a large number of fixed-sized
 * address regions but there is no simple pattern to allow for a compact
 * mapping representation such as dm-stripe.
 */

#include <linux/device-mapper.h>

#include <linux/compiler.h>
#include <linux/module.h>
#include <linux/init.h>
#include <linux/vmalloc.h>

#define DM_MSG_PREFIX "switch"

/*
 * The region table is an array of region_table_slot_t words.  Each word
 * packs <region_entries_per_slot> region table entries, and every entry
 * is <region_table_entry_bits> bits wide.
 */
typedef unsigned long region_table_slot_t;

27*4882a593Smuzhiyun /*
28*4882a593Smuzhiyun * A device with the offset to its start sector.
29*4882a593Smuzhiyun */
30*4882a593Smuzhiyun struct switch_path {
31*4882a593Smuzhiyun struct dm_dev *dmdev;
32*4882a593Smuzhiyun sector_t start;
33*4882a593Smuzhiyun };
34*4882a593Smuzhiyun
35*4882a593Smuzhiyun /*
36*4882a593Smuzhiyun * Context block for a dm switch device.
37*4882a593Smuzhiyun */
38*4882a593Smuzhiyun struct switch_ctx {
39*4882a593Smuzhiyun struct dm_target *ti;
40*4882a593Smuzhiyun
41*4882a593Smuzhiyun unsigned nr_paths; /* Number of paths in path_list. */
42*4882a593Smuzhiyun
43*4882a593Smuzhiyun unsigned region_size; /* Region size in 512-byte sectors */
44*4882a593Smuzhiyun unsigned long nr_regions; /* Number of regions making up the device */
45*4882a593Smuzhiyun signed char region_size_bits; /* log2 of region_size or -1 */
46*4882a593Smuzhiyun
47*4882a593Smuzhiyun unsigned char region_table_entry_bits; /* Number of bits in one region table entry */
48*4882a593Smuzhiyun unsigned char region_entries_per_slot; /* Number of entries in one region table slot */
49*4882a593Smuzhiyun signed char region_entries_per_slot_bits; /* log2 of region_entries_per_slot or -1 */
50*4882a593Smuzhiyun
51*4882a593Smuzhiyun region_table_slot_t *region_table; /* Region table */
52*4882a593Smuzhiyun
53*4882a593Smuzhiyun /*
54*4882a593Smuzhiyun * Array of dm devices to switch between.
55*4882a593Smuzhiyun */
56*4882a593Smuzhiyun struct switch_path path_list[];
57*4882a593Smuzhiyun };
58*4882a593Smuzhiyun
alloc_switch_ctx(struct dm_target * ti,unsigned nr_paths,unsigned region_size)59*4882a593Smuzhiyun static struct switch_ctx *alloc_switch_ctx(struct dm_target *ti, unsigned nr_paths,
60*4882a593Smuzhiyun unsigned region_size)
61*4882a593Smuzhiyun {
62*4882a593Smuzhiyun struct switch_ctx *sctx;
63*4882a593Smuzhiyun
64*4882a593Smuzhiyun sctx = kzalloc(struct_size(sctx, path_list, nr_paths), GFP_KERNEL);
65*4882a593Smuzhiyun if (!sctx)
66*4882a593Smuzhiyun return NULL;
67*4882a593Smuzhiyun
68*4882a593Smuzhiyun sctx->ti = ti;
69*4882a593Smuzhiyun sctx->region_size = region_size;
70*4882a593Smuzhiyun
71*4882a593Smuzhiyun ti->private = sctx;
72*4882a593Smuzhiyun
73*4882a593Smuzhiyun return sctx;
74*4882a593Smuzhiyun }
75*4882a593Smuzhiyun
alloc_region_table(struct dm_target * ti,unsigned nr_paths)76*4882a593Smuzhiyun static int alloc_region_table(struct dm_target *ti, unsigned nr_paths)
77*4882a593Smuzhiyun {
78*4882a593Smuzhiyun struct switch_ctx *sctx = ti->private;
79*4882a593Smuzhiyun sector_t nr_regions = ti->len;
80*4882a593Smuzhiyun sector_t nr_slots;
81*4882a593Smuzhiyun
82*4882a593Smuzhiyun if (!(sctx->region_size & (sctx->region_size - 1)))
83*4882a593Smuzhiyun sctx->region_size_bits = __ffs(sctx->region_size);
84*4882a593Smuzhiyun else
85*4882a593Smuzhiyun sctx->region_size_bits = -1;
86*4882a593Smuzhiyun
87*4882a593Smuzhiyun sctx->region_table_entry_bits = 1;
88*4882a593Smuzhiyun while (sctx->region_table_entry_bits < sizeof(region_table_slot_t) * 8 &&
89*4882a593Smuzhiyun (region_table_slot_t)1 << sctx->region_table_entry_bits < nr_paths)
90*4882a593Smuzhiyun sctx->region_table_entry_bits++;
91*4882a593Smuzhiyun
92*4882a593Smuzhiyun sctx->region_entries_per_slot = (sizeof(region_table_slot_t) * 8) / sctx->region_table_entry_bits;
93*4882a593Smuzhiyun if (!(sctx->region_entries_per_slot & (sctx->region_entries_per_slot - 1)))
94*4882a593Smuzhiyun sctx->region_entries_per_slot_bits = __ffs(sctx->region_entries_per_slot);
95*4882a593Smuzhiyun else
96*4882a593Smuzhiyun sctx->region_entries_per_slot_bits = -1;
97*4882a593Smuzhiyun
98*4882a593Smuzhiyun if (sector_div(nr_regions, sctx->region_size))
99*4882a593Smuzhiyun nr_regions++;
100*4882a593Smuzhiyun
101*4882a593Smuzhiyun if (nr_regions >= ULONG_MAX) {
102*4882a593Smuzhiyun ti->error = "Region table too large";
103*4882a593Smuzhiyun return -EINVAL;
104*4882a593Smuzhiyun }
105*4882a593Smuzhiyun sctx->nr_regions = nr_regions;
106*4882a593Smuzhiyun
107*4882a593Smuzhiyun nr_slots = nr_regions;
108*4882a593Smuzhiyun if (sector_div(nr_slots, sctx->region_entries_per_slot))
109*4882a593Smuzhiyun nr_slots++;
110*4882a593Smuzhiyun
111*4882a593Smuzhiyun if (nr_slots > ULONG_MAX / sizeof(region_table_slot_t)) {
112*4882a593Smuzhiyun ti->error = "Region table too large";
113*4882a593Smuzhiyun return -EINVAL;
114*4882a593Smuzhiyun }
115*4882a593Smuzhiyun
116*4882a593Smuzhiyun sctx->region_table = vmalloc(array_size(nr_slots,
117*4882a593Smuzhiyun sizeof(region_table_slot_t)));
118*4882a593Smuzhiyun if (!sctx->region_table) {
119*4882a593Smuzhiyun ti->error = "Cannot allocate region table";
120*4882a593Smuzhiyun return -ENOMEM;
121*4882a593Smuzhiyun }
122*4882a593Smuzhiyun
123*4882a593Smuzhiyun return 0;
124*4882a593Smuzhiyun }
125*4882a593Smuzhiyun
switch_get_position(struct switch_ctx * sctx,unsigned long region_nr,unsigned long * region_index,unsigned * bit)126*4882a593Smuzhiyun static void switch_get_position(struct switch_ctx *sctx, unsigned long region_nr,
127*4882a593Smuzhiyun unsigned long *region_index, unsigned *bit)
128*4882a593Smuzhiyun {
129*4882a593Smuzhiyun if (sctx->region_entries_per_slot_bits >= 0) {
130*4882a593Smuzhiyun *region_index = region_nr >> sctx->region_entries_per_slot_bits;
131*4882a593Smuzhiyun *bit = region_nr & (sctx->region_entries_per_slot - 1);
132*4882a593Smuzhiyun } else {
133*4882a593Smuzhiyun *region_index = region_nr / sctx->region_entries_per_slot;
134*4882a593Smuzhiyun *bit = region_nr % sctx->region_entries_per_slot;
135*4882a593Smuzhiyun }
136*4882a593Smuzhiyun
137*4882a593Smuzhiyun *bit *= sctx->region_table_entry_bits;
138*4882a593Smuzhiyun }
139*4882a593Smuzhiyun
switch_region_table_read(struct switch_ctx * sctx,unsigned long region_nr)140*4882a593Smuzhiyun static unsigned switch_region_table_read(struct switch_ctx *sctx, unsigned long region_nr)
141*4882a593Smuzhiyun {
142*4882a593Smuzhiyun unsigned long region_index;
143*4882a593Smuzhiyun unsigned bit;
144*4882a593Smuzhiyun
145*4882a593Smuzhiyun switch_get_position(sctx, region_nr, ®ion_index, &bit);
146*4882a593Smuzhiyun
147*4882a593Smuzhiyun return (READ_ONCE(sctx->region_table[region_index]) >> bit) &
148*4882a593Smuzhiyun ((1 << sctx->region_table_entry_bits) - 1);
149*4882a593Smuzhiyun }
150*4882a593Smuzhiyun
151*4882a593Smuzhiyun /*
152*4882a593Smuzhiyun * Find which path to use at given offset.
153*4882a593Smuzhiyun */
switch_get_path_nr(struct switch_ctx * sctx,sector_t offset)154*4882a593Smuzhiyun static unsigned switch_get_path_nr(struct switch_ctx *sctx, sector_t offset)
155*4882a593Smuzhiyun {
156*4882a593Smuzhiyun unsigned path_nr;
157*4882a593Smuzhiyun sector_t p;
158*4882a593Smuzhiyun
159*4882a593Smuzhiyun p = offset;
160*4882a593Smuzhiyun if (sctx->region_size_bits >= 0)
161*4882a593Smuzhiyun p >>= sctx->region_size_bits;
162*4882a593Smuzhiyun else
163*4882a593Smuzhiyun sector_div(p, sctx->region_size);
164*4882a593Smuzhiyun
165*4882a593Smuzhiyun path_nr = switch_region_table_read(sctx, p);
166*4882a593Smuzhiyun
167*4882a593Smuzhiyun /* This can only happen if the processor uses non-atomic stores. */
168*4882a593Smuzhiyun if (unlikely(path_nr >= sctx->nr_paths))
169*4882a593Smuzhiyun path_nr = 0;
170*4882a593Smuzhiyun
171*4882a593Smuzhiyun return path_nr;
172*4882a593Smuzhiyun }
173*4882a593Smuzhiyun
switch_region_table_write(struct switch_ctx * sctx,unsigned long region_nr,unsigned value)174*4882a593Smuzhiyun static void switch_region_table_write(struct switch_ctx *sctx, unsigned long region_nr,
175*4882a593Smuzhiyun unsigned value)
176*4882a593Smuzhiyun {
177*4882a593Smuzhiyun unsigned long region_index;
178*4882a593Smuzhiyun unsigned bit;
179*4882a593Smuzhiyun region_table_slot_t pte;
180*4882a593Smuzhiyun
181*4882a593Smuzhiyun switch_get_position(sctx, region_nr, ®ion_index, &bit);
182*4882a593Smuzhiyun
183*4882a593Smuzhiyun pte = sctx->region_table[region_index];
184*4882a593Smuzhiyun pte &= ~((((region_table_slot_t)1 << sctx->region_table_entry_bits) - 1) << bit);
185*4882a593Smuzhiyun pte |= (region_table_slot_t)value << bit;
186*4882a593Smuzhiyun sctx->region_table[region_index] = pte;
187*4882a593Smuzhiyun }
188*4882a593Smuzhiyun
189*4882a593Smuzhiyun /*
190*4882a593Smuzhiyun * Fill the region table with an initial round robin pattern.
191*4882a593Smuzhiyun */
initialise_region_table(struct switch_ctx * sctx)192*4882a593Smuzhiyun static void initialise_region_table(struct switch_ctx *sctx)
193*4882a593Smuzhiyun {
194*4882a593Smuzhiyun unsigned path_nr = 0;
195*4882a593Smuzhiyun unsigned long region_nr;
196*4882a593Smuzhiyun
197*4882a593Smuzhiyun for (region_nr = 0; region_nr < sctx->nr_regions; region_nr++) {
198*4882a593Smuzhiyun switch_region_table_write(sctx, region_nr, path_nr);
199*4882a593Smuzhiyun if (++path_nr >= sctx->nr_paths)
200*4882a593Smuzhiyun path_nr = 0;
201*4882a593Smuzhiyun }
202*4882a593Smuzhiyun }
203*4882a593Smuzhiyun
parse_path(struct dm_arg_set * as,struct dm_target * ti)204*4882a593Smuzhiyun static int parse_path(struct dm_arg_set *as, struct dm_target *ti)
205*4882a593Smuzhiyun {
206*4882a593Smuzhiyun struct switch_ctx *sctx = ti->private;
207*4882a593Smuzhiyun unsigned long long start;
208*4882a593Smuzhiyun int r;
209*4882a593Smuzhiyun
210*4882a593Smuzhiyun r = dm_get_device(ti, dm_shift_arg(as), dm_table_get_mode(ti->table),
211*4882a593Smuzhiyun &sctx->path_list[sctx->nr_paths].dmdev);
212*4882a593Smuzhiyun if (r) {
213*4882a593Smuzhiyun ti->error = "Device lookup failed";
214*4882a593Smuzhiyun return r;
215*4882a593Smuzhiyun }
216*4882a593Smuzhiyun
217*4882a593Smuzhiyun if (kstrtoull(dm_shift_arg(as), 10, &start) || start != (sector_t)start) {
218*4882a593Smuzhiyun ti->error = "Invalid device starting offset";
219*4882a593Smuzhiyun dm_put_device(ti, sctx->path_list[sctx->nr_paths].dmdev);
220*4882a593Smuzhiyun return -EINVAL;
221*4882a593Smuzhiyun }
222*4882a593Smuzhiyun
223*4882a593Smuzhiyun sctx->path_list[sctx->nr_paths].start = start;
224*4882a593Smuzhiyun
225*4882a593Smuzhiyun sctx->nr_paths++;
226*4882a593Smuzhiyun
227*4882a593Smuzhiyun return 0;
228*4882a593Smuzhiyun }
229*4882a593Smuzhiyun
230*4882a593Smuzhiyun /*
231*4882a593Smuzhiyun * Destructor: Don't free the dm_target, just the ti->private data (if any).
232*4882a593Smuzhiyun */
switch_dtr(struct dm_target * ti)233*4882a593Smuzhiyun static void switch_dtr(struct dm_target *ti)
234*4882a593Smuzhiyun {
235*4882a593Smuzhiyun struct switch_ctx *sctx = ti->private;
236*4882a593Smuzhiyun
237*4882a593Smuzhiyun while (sctx->nr_paths--)
238*4882a593Smuzhiyun dm_put_device(ti, sctx->path_list[sctx->nr_paths].dmdev);
239*4882a593Smuzhiyun
240*4882a593Smuzhiyun vfree(sctx->region_table);
241*4882a593Smuzhiyun kfree(sctx);
242*4882a593Smuzhiyun }
243*4882a593Smuzhiyun
244*4882a593Smuzhiyun /*
245*4882a593Smuzhiyun * Constructor arguments:
246*4882a593Smuzhiyun * <num_paths> <region_size> <num_optional_args> [<optional_args>...]
247*4882a593Smuzhiyun * [<dev_path> <offset>]+
248*4882a593Smuzhiyun *
249*4882a593Smuzhiyun * Optional args are to allow for future extension: currently this
250*4882a593Smuzhiyun * parameter must be 0.
251*4882a593Smuzhiyun */
switch_ctr(struct dm_target * ti,unsigned argc,char ** argv)252*4882a593Smuzhiyun static int switch_ctr(struct dm_target *ti, unsigned argc, char **argv)
253*4882a593Smuzhiyun {
254*4882a593Smuzhiyun static const struct dm_arg _args[] = {
255*4882a593Smuzhiyun {1, (KMALLOC_MAX_SIZE - sizeof(struct switch_ctx)) / sizeof(struct switch_path), "Invalid number of paths"},
256*4882a593Smuzhiyun {1, UINT_MAX, "Invalid region size"},
257*4882a593Smuzhiyun {0, 0, "Invalid number of optional args"},
258*4882a593Smuzhiyun };
259*4882a593Smuzhiyun
260*4882a593Smuzhiyun struct switch_ctx *sctx;
261*4882a593Smuzhiyun struct dm_arg_set as;
262*4882a593Smuzhiyun unsigned nr_paths, region_size, nr_optional_args;
263*4882a593Smuzhiyun int r;
264*4882a593Smuzhiyun
265*4882a593Smuzhiyun as.argc = argc;
266*4882a593Smuzhiyun as.argv = argv;
267*4882a593Smuzhiyun
268*4882a593Smuzhiyun r = dm_read_arg(_args, &as, &nr_paths, &ti->error);
269*4882a593Smuzhiyun if (r)
270*4882a593Smuzhiyun return -EINVAL;
271*4882a593Smuzhiyun
272*4882a593Smuzhiyun r = dm_read_arg(_args + 1, &as, ®ion_size, &ti->error);
273*4882a593Smuzhiyun if (r)
274*4882a593Smuzhiyun return r;
275*4882a593Smuzhiyun
276*4882a593Smuzhiyun r = dm_read_arg_group(_args + 2, &as, &nr_optional_args, &ti->error);
277*4882a593Smuzhiyun if (r)
278*4882a593Smuzhiyun return r;
279*4882a593Smuzhiyun /* parse optional arguments here, if we add any */
280*4882a593Smuzhiyun
281*4882a593Smuzhiyun if (as.argc != nr_paths * 2) {
282*4882a593Smuzhiyun ti->error = "Incorrect number of path arguments";
283*4882a593Smuzhiyun return -EINVAL;
284*4882a593Smuzhiyun }
285*4882a593Smuzhiyun
286*4882a593Smuzhiyun sctx = alloc_switch_ctx(ti, nr_paths, region_size);
287*4882a593Smuzhiyun if (!sctx) {
288*4882a593Smuzhiyun ti->error = "Cannot allocate redirection context";
289*4882a593Smuzhiyun return -ENOMEM;
290*4882a593Smuzhiyun }
291*4882a593Smuzhiyun
292*4882a593Smuzhiyun r = dm_set_target_max_io_len(ti, region_size);
293*4882a593Smuzhiyun if (r)
294*4882a593Smuzhiyun goto error;
295*4882a593Smuzhiyun
296*4882a593Smuzhiyun while (as.argc) {
297*4882a593Smuzhiyun r = parse_path(&as, ti);
298*4882a593Smuzhiyun if (r)
299*4882a593Smuzhiyun goto error;
300*4882a593Smuzhiyun }
301*4882a593Smuzhiyun
302*4882a593Smuzhiyun r = alloc_region_table(ti, nr_paths);
303*4882a593Smuzhiyun if (r)
304*4882a593Smuzhiyun goto error;
305*4882a593Smuzhiyun
306*4882a593Smuzhiyun initialise_region_table(sctx);
307*4882a593Smuzhiyun
308*4882a593Smuzhiyun /* For UNMAP, sending the request down any path is sufficient */
309*4882a593Smuzhiyun ti->num_discard_bios = 1;
310*4882a593Smuzhiyun
311*4882a593Smuzhiyun return 0;
312*4882a593Smuzhiyun
313*4882a593Smuzhiyun error:
314*4882a593Smuzhiyun switch_dtr(ti);
315*4882a593Smuzhiyun
316*4882a593Smuzhiyun return r;
317*4882a593Smuzhiyun }
318*4882a593Smuzhiyun
switch_map(struct dm_target * ti,struct bio * bio)319*4882a593Smuzhiyun static int switch_map(struct dm_target *ti, struct bio *bio)
320*4882a593Smuzhiyun {
321*4882a593Smuzhiyun struct switch_ctx *sctx = ti->private;
322*4882a593Smuzhiyun sector_t offset = dm_target_offset(ti, bio->bi_iter.bi_sector);
323*4882a593Smuzhiyun unsigned path_nr = switch_get_path_nr(sctx, offset);
324*4882a593Smuzhiyun
325*4882a593Smuzhiyun bio_set_dev(bio, sctx->path_list[path_nr].dmdev->bdev);
326*4882a593Smuzhiyun bio->bi_iter.bi_sector = sctx->path_list[path_nr].start + offset;
327*4882a593Smuzhiyun
328*4882a593Smuzhiyun return DM_MAPIO_REMAPPED;
329*4882a593Smuzhiyun }
330*4882a593Smuzhiyun
/*
 * We need to parse hex numbers in the message as quickly as possible.
 *
 * This table-based hex parser improves performance.  Time taken to load
 * 1000000 entries, compared with a condition-based parser:
 *
 *		table-based parser	condition-based parser
 * PA-RISC	0.29s			0.31s
 * Opteron	0.0495s			0.0498s
 *
 * The table is indexed by character code.  Hex digits map to their value
 * (0-15, either letter case); every other character maps to 0xff.
 */
static const unsigned char hex_table[256] = {
	/* 0x00 */ 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff,
	/* 0x10 */ 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff,
	/* 0x20 */ 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff,
	/* '0'-'9' */ 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff,
	/* 'A'-'F' */ 0xff, 10, 11, 12, 13, 14, 15, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff,
	/* 0x50 */ 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff,
	/* 'a'-'f' */ 0xff, 10, 11, 12, 13, 14, 15, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff,
	/* 0x70 */ 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff,
	/* 0x80 */ 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff,
	/* 0x90 */ 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff,
	/* 0xa0 */ 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff,
	/* 0xb0 */ 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff,
	/* 0xc0 */ 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff,
	/* 0xd0 */ 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff,
	/* 0xe0 */ 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff,
	/* 0xf0 */ 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff
};

parse_hex(const char ** string)360*4882a593Smuzhiyun static __always_inline unsigned long parse_hex(const char **string)
361*4882a593Smuzhiyun {
362*4882a593Smuzhiyun unsigned char d;
363*4882a593Smuzhiyun unsigned long r = 0;
364*4882a593Smuzhiyun
365*4882a593Smuzhiyun while ((d = hex_table[(unsigned char)**string]) < 16) {
366*4882a593Smuzhiyun r = (r << 4) | d;
367*4882a593Smuzhiyun (*string)++;
368*4882a593Smuzhiyun }
369*4882a593Smuzhiyun
370*4882a593Smuzhiyun return r;
371*4882a593Smuzhiyun }
372*4882a593Smuzhiyun
process_set_region_mappings(struct switch_ctx * sctx,unsigned argc,char ** argv)373*4882a593Smuzhiyun static int process_set_region_mappings(struct switch_ctx *sctx,
374*4882a593Smuzhiyun unsigned argc, char **argv)
375*4882a593Smuzhiyun {
376*4882a593Smuzhiyun unsigned i;
377*4882a593Smuzhiyun unsigned long region_index = 0;
378*4882a593Smuzhiyun
379*4882a593Smuzhiyun for (i = 1; i < argc; i++) {
380*4882a593Smuzhiyun unsigned long path_nr;
381*4882a593Smuzhiyun const char *string = argv[i];
382*4882a593Smuzhiyun
383*4882a593Smuzhiyun if ((*string & 0xdf) == 'R') {
384*4882a593Smuzhiyun unsigned long cycle_length, num_write;
385*4882a593Smuzhiyun
386*4882a593Smuzhiyun string++;
387*4882a593Smuzhiyun if (unlikely(*string == ',')) {
388*4882a593Smuzhiyun DMWARN("invalid set_region_mappings argument: '%s'", argv[i]);
389*4882a593Smuzhiyun return -EINVAL;
390*4882a593Smuzhiyun }
391*4882a593Smuzhiyun cycle_length = parse_hex(&string);
392*4882a593Smuzhiyun if (unlikely(*string != ',')) {
393*4882a593Smuzhiyun DMWARN("invalid set_region_mappings argument: '%s'", argv[i]);
394*4882a593Smuzhiyun return -EINVAL;
395*4882a593Smuzhiyun }
396*4882a593Smuzhiyun string++;
397*4882a593Smuzhiyun if (unlikely(!*string)) {
398*4882a593Smuzhiyun DMWARN("invalid set_region_mappings argument: '%s'", argv[i]);
399*4882a593Smuzhiyun return -EINVAL;
400*4882a593Smuzhiyun }
401*4882a593Smuzhiyun num_write = parse_hex(&string);
402*4882a593Smuzhiyun if (unlikely(*string)) {
403*4882a593Smuzhiyun DMWARN("invalid set_region_mappings argument: '%s'", argv[i]);
404*4882a593Smuzhiyun return -EINVAL;
405*4882a593Smuzhiyun }
406*4882a593Smuzhiyun
407*4882a593Smuzhiyun if (unlikely(!cycle_length) || unlikely(cycle_length - 1 > region_index)) {
408*4882a593Smuzhiyun DMWARN("invalid set_region_mappings cycle length: %lu > %lu",
409*4882a593Smuzhiyun cycle_length - 1, region_index);
410*4882a593Smuzhiyun return -EINVAL;
411*4882a593Smuzhiyun }
412*4882a593Smuzhiyun if (unlikely(region_index + num_write < region_index) ||
413*4882a593Smuzhiyun unlikely(region_index + num_write >= sctx->nr_regions)) {
414*4882a593Smuzhiyun DMWARN("invalid set_region_mappings region number: %lu + %lu >= %lu",
415*4882a593Smuzhiyun region_index, num_write, sctx->nr_regions);
416*4882a593Smuzhiyun return -EINVAL;
417*4882a593Smuzhiyun }
418*4882a593Smuzhiyun
419*4882a593Smuzhiyun while (num_write--) {
420*4882a593Smuzhiyun region_index++;
421*4882a593Smuzhiyun path_nr = switch_region_table_read(sctx, region_index - cycle_length);
422*4882a593Smuzhiyun switch_region_table_write(sctx, region_index, path_nr);
423*4882a593Smuzhiyun }
424*4882a593Smuzhiyun
425*4882a593Smuzhiyun continue;
426*4882a593Smuzhiyun }
427*4882a593Smuzhiyun
428*4882a593Smuzhiyun if (*string == ':')
429*4882a593Smuzhiyun region_index++;
430*4882a593Smuzhiyun else {
431*4882a593Smuzhiyun region_index = parse_hex(&string);
432*4882a593Smuzhiyun if (unlikely(*string != ':')) {
433*4882a593Smuzhiyun DMWARN("invalid set_region_mappings argument: '%s'", argv[i]);
434*4882a593Smuzhiyun return -EINVAL;
435*4882a593Smuzhiyun }
436*4882a593Smuzhiyun }
437*4882a593Smuzhiyun
438*4882a593Smuzhiyun string++;
439*4882a593Smuzhiyun if (unlikely(!*string)) {
440*4882a593Smuzhiyun DMWARN("invalid set_region_mappings argument: '%s'", argv[i]);
441*4882a593Smuzhiyun return -EINVAL;
442*4882a593Smuzhiyun }
443*4882a593Smuzhiyun
444*4882a593Smuzhiyun path_nr = parse_hex(&string);
445*4882a593Smuzhiyun if (unlikely(*string)) {
446*4882a593Smuzhiyun DMWARN("invalid set_region_mappings argument: '%s'", argv[i]);
447*4882a593Smuzhiyun return -EINVAL;
448*4882a593Smuzhiyun }
449*4882a593Smuzhiyun if (unlikely(region_index >= sctx->nr_regions)) {
450*4882a593Smuzhiyun DMWARN("invalid set_region_mappings region number: %lu >= %lu", region_index, sctx->nr_regions);
451*4882a593Smuzhiyun return -EINVAL;
452*4882a593Smuzhiyun }
453*4882a593Smuzhiyun if (unlikely(path_nr >= sctx->nr_paths)) {
454*4882a593Smuzhiyun DMWARN("invalid set_region_mappings device: %lu >= %u", path_nr, sctx->nr_paths);
455*4882a593Smuzhiyun return -EINVAL;
456*4882a593Smuzhiyun }
457*4882a593Smuzhiyun
458*4882a593Smuzhiyun switch_region_table_write(sctx, region_index, path_nr);
459*4882a593Smuzhiyun }
460*4882a593Smuzhiyun
461*4882a593Smuzhiyun return 0;
462*4882a593Smuzhiyun }
463*4882a593Smuzhiyun
464*4882a593Smuzhiyun /*
465*4882a593Smuzhiyun * Messages are processed one-at-a-time.
466*4882a593Smuzhiyun *
467*4882a593Smuzhiyun * Only set_region_mappings is supported.
468*4882a593Smuzhiyun */
switch_message(struct dm_target * ti,unsigned argc,char ** argv,char * result,unsigned maxlen)469*4882a593Smuzhiyun static int switch_message(struct dm_target *ti, unsigned argc, char **argv,
470*4882a593Smuzhiyun char *result, unsigned maxlen)
471*4882a593Smuzhiyun {
472*4882a593Smuzhiyun static DEFINE_MUTEX(message_mutex);
473*4882a593Smuzhiyun
474*4882a593Smuzhiyun struct switch_ctx *sctx = ti->private;
475*4882a593Smuzhiyun int r = -EINVAL;
476*4882a593Smuzhiyun
477*4882a593Smuzhiyun mutex_lock(&message_mutex);
478*4882a593Smuzhiyun
479*4882a593Smuzhiyun if (!strcasecmp(argv[0], "set_region_mappings"))
480*4882a593Smuzhiyun r = process_set_region_mappings(sctx, argc, argv);
481*4882a593Smuzhiyun else
482*4882a593Smuzhiyun DMWARN("Unrecognised message received.");
483*4882a593Smuzhiyun
484*4882a593Smuzhiyun mutex_unlock(&message_mutex);
485*4882a593Smuzhiyun
486*4882a593Smuzhiyun return r;
487*4882a593Smuzhiyun }
488*4882a593Smuzhiyun
/*
 * Report target status into 'result'.
 *
 * STATUSTYPE_INFO yields an empty string.  STATUSTYPE_TABLE emits the
 * table line: "<nr_paths> <region_size> 0" followed by a
 * " <device name> <start>" pair for every path.
 */
static void switch_status(struct dm_target *ti, status_type_t type,
			  unsigned status_flags, char *result, unsigned maxlen)
{
	struct switch_ctx *sctx = ti->private;
	unsigned sz = 0;	/* output position, advanced by DMEMIT() */
	int path_nr;

	switch (type) {
	case STATUSTYPE_TABLE:
		DMEMIT("%u %u 0", sctx->nr_paths, sctx->region_size);
		for (path_nr = 0; path_nr < sctx->nr_paths; path_nr++) {
			const struct switch_path *path = &sctx->path_list[path_nr];

			DMEMIT(" %s %llu", path->dmdev->name,
			       (unsigned long long)path->start);
		}
		break;

	case STATUSTYPE_INFO:
		result[0] = '\0';
		break;
	}
}

510*4882a593Smuzhiyun /*
511*4882a593Smuzhiyun * Switch ioctl:
512*4882a593Smuzhiyun *
513*4882a593Smuzhiyun * Passthrough all ioctls to the path for sector 0
514*4882a593Smuzhiyun */
switch_prepare_ioctl(struct dm_target * ti,struct block_device ** bdev)515*4882a593Smuzhiyun static int switch_prepare_ioctl(struct dm_target *ti, struct block_device **bdev)
516*4882a593Smuzhiyun {
517*4882a593Smuzhiyun struct switch_ctx *sctx = ti->private;
518*4882a593Smuzhiyun unsigned path_nr;
519*4882a593Smuzhiyun
520*4882a593Smuzhiyun path_nr = switch_get_path_nr(sctx, 0);
521*4882a593Smuzhiyun
522*4882a593Smuzhiyun *bdev = sctx->path_list[path_nr].dmdev->bdev;
523*4882a593Smuzhiyun
524*4882a593Smuzhiyun /*
525*4882a593Smuzhiyun * Only pass ioctls through if the device sizes match exactly.
526*4882a593Smuzhiyun */
527*4882a593Smuzhiyun if (ti->len + sctx->path_list[path_nr].start !=
528*4882a593Smuzhiyun i_size_read((*bdev)->bd_inode) >> SECTOR_SHIFT)
529*4882a593Smuzhiyun return 1;
530*4882a593Smuzhiyun return 0;
531*4882a593Smuzhiyun }
532*4882a593Smuzhiyun
/*
 * Invoke fn on every path, passing the path's device, its start offset
 * and the full target length.  Iteration stops at the first non-zero
 * return value, which is handed back to the caller; 0 is returned when
 * every call returned 0.
 */
static int switch_iterate_devices(struct dm_target *ti,
				  iterate_devices_callout_fn fn, void *data)
{
	struct switch_ctx *sctx = ti->private;
	int path_nr;
	int r = 0;

	for (path_nr = 0; !r && path_nr < sctx->nr_paths; path_nr++) {
		struct switch_path *path = &sctx->path_list[path_nr];

		r = fn(ti, path->dmdev, path->start, ti->len, data);
	}

	return r;
}

550*4882a593Smuzhiyun static struct target_type switch_target = {
551*4882a593Smuzhiyun .name = "switch",
552*4882a593Smuzhiyun .version = {1, 1, 0},
553*4882a593Smuzhiyun .module = THIS_MODULE,
554*4882a593Smuzhiyun .ctr = switch_ctr,
555*4882a593Smuzhiyun .dtr = switch_dtr,
556*4882a593Smuzhiyun .map = switch_map,
557*4882a593Smuzhiyun .message = switch_message,
558*4882a593Smuzhiyun .status = switch_status,
559*4882a593Smuzhiyun .prepare_ioctl = switch_prepare_ioctl,
560*4882a593Smuzhiyun .iterate_devices = switch_iterate_devices,
561*4882a593Smuzhiyun };
562*4882a593Smuzhiyun
dm_switch_init(void)563*4882a593Smuzhiyun static int __init dm_switch_init(void)
564*4882a593Smuzhiyun {
565*4882a593Smuzhiyun int r;
566*4882a593Smuzhiyun
567*4882a593Smuzhiyun r = dm_register_target(&switch_target);
568*4882a593Smuzhiyun if (r < 0)
569*4882a593Smuzhiyun DMERR("dm_register_target() failed %d", r);
570*4882a593Smuzhiyun
571*4882a593Smuzhiyun return r;
572*4882a593Smuzhiyun }
573*4882a593Smuzhiyun
dm_switch_exit(void)574*4882a593Smuzhiyun static void __exit dm_switch_exit(void)
575*4882a593Smuzhiyun {
576*4882a593Smuzhiyun dm_unregister_target(&switch_target);
577*4882a593Smuzhiyun }
578*4882a593Smuzhiyun
579*4882a593Smuzhiyun module_init(dm_switch_init);
580*4882a593Smuzhiyun module_exit(dm_switch_exit);
581*4882a593Smuzhiyun
582*4882a593Smuzhiyun MODULE_DESCRIPTION(DM_NAME " dynamic path switching target");
583*4882a593Smuzhiyun MODULE_AUTHOR("Kevin D. O'Kelley <Kevin_OKelley@dell.com>");
584*4882a593Smuzhiyun MODULE_AUTHOR("Narendran Ganapathy <Narendran_Ganapathy@dell.com>");
585*4882a593Smuzhiyun MODULE_AUTHOR("Jim Ramsay <Jim_Ramsay@dell.com>");
586*4882a593Smuzhiyun MODULE_AUTHOR("Mikulas Patocka <mpatocka@redhat.com>");
587*4882a593Smuzhiyun MODULE_LICENSE("GPL");
588