xref: /OK3568_Linux_fs/kernel/drivers/md/dm-zoned.h (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun /* SPDX-License-Identifier: GPL-2.0 */
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun  * Copyright (C) 2017 Western Digital Corporation or its affiliates.
4*4882a593Smuzhiyun  *
5*4882a593Smuzhiyun  * This file is released under the GPL.
6*4882a593Smuzhiyun  */
7*4882a593Smuzhiyun 
8*4882a593Smuzhiyun #ifndef DM_ZONED_H
9*4882a593Smuzhiyun #define DM_ZONED_H
10*4882a593Smuzhiyun 
11*4882a593Smuzhiyun #include <linux/types.h>
12*4882a593Smuzhiyun #include <linux/blkdev.h>
13*4882a593Smuzhiyun #include <linux/device-mapper.h>
14*4882a593Smuzhiyun #include <linux/dm-kcopyd.h>
15*4882a593Smuzhiyun #include <linux/list.h>
16*4882a593Smuzhiyun #include <linux/spinlock.h>
17*4882a593Smuzhiyun #include <linux/mutex.h>
18*4882a593Smuzhiyun #include <linux/workqueue.h>
19*4882a593Smuzhiyun #include <linux/rwsem.h>
20*4882a593Smuzhiyun #include <linux/rbtree.h>
21*4882a593Smuzhiyun #include <linux/radix-tree.h>
22*4882a593Smuzhiyun #include <linux/shrinker.h>
23*4882a593Smuzhiyun 
/*
 * dm-zoned creates block devices with 4KB blocks, always.
 */
#define DMZ_BLOCK_SHIFT		12
#define DMZ_BLOCK_SIZE		(1 << DMZ_BLOCK_SHIFT)
#define DMZ_BLOCK_MASK		(DMZ_BLOCK_SIZE - 1)

/* Same block geometry counted in bits: 8 bits per byte, hence the +3 shift. */
#define DMZ_BLOCK_SHIFT_BITS	(DMZ_BLOCK_SHIFT + 3)
#define DMZ_BLOCK_SIZE_BITS	(1 << DMZ_BLOCK_SHIFT_BITS)
#define DMZ_BLOCK_MASK_BITS	(DMZ_BLOCK_SIZE_BITS - 1)

/* Same block geometry counted in sectors (sector size is 1 << SECTOR_SHIFT). */
#define DMZ_BLOCK_SECTORS_SHIFT	(DMZ_BLOCK_SHIFT - SECTOR_SHIFT)
#define DMZ_BLOCK_SECTORS	(DMZ_BLOCK_SIZE >> SECTOR_SHIFT)
#define DMZ_BLOCK_SECTORS_MASK	(DMZ_BLOCK_SECTORS - 1)

/*
 * 4KB block <-> 512B sector conversion.
 * The argument is widened to sector_t before shifting.
 */
#define dmz_blk2sect(b)		((sector_t)(b) << DMZ_BLOCK_SECTORS_SHIFT)
#define dmz_sect2blk(s)		((sector_t)(s) >> DMZ_BLOCK_SECTORS_SHIFT)

/* Start position and length of a BIO, converted from sectors to blocks. */
#define dmz_bio_block(bio)	dmz_sect2blk((bio)->bi_iter.bi_sector)
#define dmz_bio_blocks(bio)	dmz_sect2blk(bio_sectors(bio))
47*4882a593Smuzhiyun 
48*4882a593Smuzhiyun struct dmz_metadata;
49*4882a593Smuzhiyun struct dmz_reclaim;
50*4882a593Smuzhiyun 
51*4882a593Smuzhiyun /*
52*4882a593Smuzhiyun  * Zoned block device information.
53*4882a593Smuzhiyun  */
54*4882a593Smuzhiyun struct dmz_dev {
55*4882a593Smuzhiyun 	struct block_device	*bdev;
56*4882a593Smuzhiyun 	struct dmz_metadata	*metadata;
57*4882a593Smuzhiyun 	struct dmz_reclaim	*reclaim;
58*4882a593Smuzhiyun 
59*4882a593Smuzhiyun 	char			name[BDEVNAME_SIZE];
60*4882a593Smuzhiyun 	uuid_t			uuid;
61*4882a593Smuzhiyun 
62*4882a593Smuzhiyun 	sector_t		capacity;
63*4882a593Smuzhiyun 
64*4882a593Smuzhiyun 	unsigned int		dev_idx;
65*4882a593Smuzhiyun 
66*4882a593Smuzhiyun 	unsigned int		nr_zones;
67*4882a593Smuzhiyun 	unsigned int		zone_offset;
68*4882a593Smuzhiyun 
69*4882a593Smuzhiyun 	unsigned int		flags;
70*4882a593Smuzhiyun 
71*4882a593Smuzhiyun 	sector_t		zone_nr_sectors;
72*4882a593Smuzhiyun 
73*4882a593Smuzhiyun 	unsigned int		nr_rnd;
74*4882a593Smuzhiyun 	atomic_t		unmap_nr_rnd;
75*4882a593Smuzhiyun 	struct list_head	unmap_rnd_list;
76*4882a593Smuzhiyun 	struct list_head	map_rnd_list;
77*4882a593Smuzhiyun 
78*4882a593Smuzhiyun 	unsigned int		nr_seq;
79*4882a593Smuzhiyun 	atomic_t		unmap_nr_seq;
80*4882a593Smuzhiyun 	struct list_head	unmap_seq_list;
81*4882a593Smuzhiyun 	struct list_head	map_seq_list;
82*4882a593Smuzhiyun };
83*4882a593Smuzhiyun 
/*
 * Chunk targeted by a BIO: its start sector shifted right by
 * dmz_zone_nr_sectors_shift().
 */
#define dmz_bio_chunk(zmd, bio)	((bio)->bi_iter.bi_sector >> \
				 dmz_zone_nr_sectors_shift(zmd))
/*
 * Block offset within a chunk. The mask form is only correct when
 * dmz_zone_nr_blocks() returns a power of two.
 */
#define dmz_chunk_block(zmd, b)	((b) & (dmz_zone_nr_blocks(zmd) - 1))

/* Device flags. */
#define DMZ_BDEV_DYING		(1 << 0)
#define DMZ_CHECK_BDEV		(1 << 1)
#define DMZ_BDEV_REGULAR	(1 << 2)
92*4882a593Smuzhiyun 
93*4882a593Smuzhiyun /*
94*4882a593Smuzhiyun  * Zone descriptor.
95*4882a593Smuzhiyun  */
96*4882a593Smuzhiyun struct dm_zone {
97*4882a593Smuzhiyun 	/* For listing the zone depending on its state */
98*4882a593Smuzhiyun 	struct list_head	link;
99*4882a593Smuzhiyun 
100*4882a593Smuzhiyun 	/* Device containing this zone */
101*4882a593Smuzhiyun 	struct dmz_dev		*dev;
102*4882a593Smuzhiyun 
103*4882a593Smuzhiyun 	/* Zone type and state */
104*4882a593Smuzhiyun 	unsigned long		flags;
105*4882a593Smuzhiyun 
106*4882a593Smuzhiyun 	/* Zone activation reference count */
107*4882a593Smuzhiyun 	atomic_t		refcount;
108*4882a593Smuzhiyun 
109*4882a593Smuzhiyun 	/* Zone id */
110*4882a593Smuzhiyun 	unsigned int		id;
111*4882a593Smuzhiyun 
112*4882a593Smuzhiyun 	/* Zone write pointer block (relative to the zone start block) */
113*4882a593Smuzhiyun 	unsigned int		wp_block;
114*4882a593Smuzhiyun 
115*4882a593Smuzhiyun 	/* Zone weight (number of valid blocks in the zone) */
116*4882a593Smuzhiyun 	unsigned int		weight;
117*4882a593Smuzhiyun 
118*4882a593Smuzhiyun 	/* The chunk that the zone maps */
119*4882a593Smuzhiyun 	unsigned int		chunk;
120*4882a593Smuzhiyun 
121*4882a593Smuzhiyun 	/*
122*4882a593Smuzhiyun 	 * For a sequential data zone, pointer to the random zone
123*4882a593Smuzhiyun 	 * used as a buffer for processing unaligned writes.
124*4882a593Smuzhiyun 	 * For a buffer zone, this points back to the data zone.
125*4882a593Smuzhiyun 	 */
126*4882a593Smuzhiyun 	struct dm_zone		*bzone;
127*4882a593Smuzhiyun };
128*4882a593Smuzhiyun 
/*
 * Zone flags.
 *
 * These are bit numbers (not masks): the zone accessors pass them to
 * test_bit() together with the address of the flags field of struct dm_zone.
 */
enum {
	/* Zone write type */
	DMZ_CACHE,
	DMZ_RND,
	DMZ_SEQ,

	/* Zone critical condition */
	DMZ_OFFLINE,
	DMZ_READ_ONLY,

	/* How the zone is being used */
	DMZ_META,
	DMZ_DATA,
	DMZ_BUF,
	DMZ_RESERVED,

	/* Zone internal state */
	DMZ_RECLAIM,
	DMZ_SEQ_WRITE_ERR,
	DMZ_RECLAIM_TERMINATE,
};
153*4882a593Smuzhiyun 
/*
 * Zone data accessors.
 *
 * Each takes a pointer to a struct dm_zone. The flag tests go through
 * test_bit() on the zone flags word.
 */
#define dmz_is_cache(z)		test_bit(DMZ_CACHE, &(z)->flags)
#define dmz_is_rnd(z)		test_bit(DMZ_RND, &(z)->flags)
#define dmz_is_seq(z)		test_bit(DMZ_SEQ, &(z)->flags)
/* A zone is empty when its write pointer is still at the zone start */
#define dmz_is_empty(z)		((z)->wp_block == 0)
#define dmz_is_offline(z)	test_bit(DMZ_OFFLINE, &(z)->flags)
#define dmz_is_readonly(z)	test_bit(DMZ_READ_ONLY, &(z)->flags)
#define dmz_in_reclaim(z)	test_bit(DMZ_RECLAIM, &(z)->flags)
#define dmz_is_reserved(z)	test_bit(DMZ_RESERVED, &(z)->flags)
#define dmz_seq_write_err(z)	test_bit(DMZ_SEQ_WRITE_ERR, &(z)->flags)
#define dmz_reclaim_should_terminate(z) \
				test_bit(DMZ_RECLAIM_TERMINATE, &(z)->flags)

#define dmz_is_meta(z)		test_bit(DMZ_META, &(z)->flags)
#define dmz_is_buf(z)		test_bit(DMZ_BUF, &(z)->flags)
#define dmz_is_data(z)		test_bit(DMZ_DATA, &(z)->flags)

#define dmz_weight(z)		((z)->weight)
174*4882a593Smuzhiyun 
/*
 * Message functions.
 *
 * Thin wrappers around DMINFO/DMERR/DMWARN/DMDEBUG that prefix the message
 * with the device name, "(name): ". dev is a pointer to an object with a
 * name member (struct dmz_dev here); format must be a string literal because
 * it is concatenated with the prefix at compile time.
 */
#define dmz_dev_info(dev, format, args...)	\
	DMINFO("(%s): " format, (dev)->name, ## args)

#define dmz_dev_err(dev, format, args...)	\
	DMERR("(%s): " format, (dev)->name, ## args)

#define dmz_dev_warn(dev, format, args...)	\
	DMWARN("(%s): " format, (dev)->name, ## args)

#define dmz_dev_debug(dev, format, args...)	\
	DMDEBUG("(%s): " format, (dev)->name, ## args)
189*4882a593Smuzhiyun 
190*4882a593Smuzhiyun /*
191*4882a593Smuzhiyun  * Functions defined in dm-zoned-metadata.c
192*4882a593Smuzhiyun  */
193*4882a593Smuzhiyun int dmz_ctr_metadata(struct dmz_dev *dev, int num_dev,
194*4882a593Smuzhiyun 		     struct dmz_metadata **zmd, const char *devname);
195*4882a593Smuzhiyun void dmz_dtr_metadata(struct dmz_metadata *zmd);
196*4882a593Smuzhiyun int dmz_resume_metadata(struct dmz_metadata *zmd);
197*4882a593Smuzhiyun 
198*4882a593Smuzhiyun void dmz_lock_map(struct dmz_metadata *zmd);
199*4882a593Smuzhiyun void dmz_unlock_map(struct dmz_metadata *zmd);
200*4882a593Smuzhiyun void dmz_lock_metadata(struct dmz_metadata *zmd);
201*4882a593Smuzhiyun void dmz_unlock_metadata(struct dmz_metadata *zmd);
202*4882a593Smuzhiyun void dmz_lock_flush(struct dmz_metadata *zmd);
203*4882a593Smuzhiyun void dmz_unlock_flush(struct dmz_metadata *zmd);
204*4882a593Smuzhiyun int dmz_flush_metadata(struct dmz_metadata *zmd);
205*4882a593Smuzhiyun const char *dmz_metadata_label(struct dmz_metadata *zmd);
206*4882a593Smuzhiyun 
207*4882a593Smuzhiyun sector_t dmz_start_sect(struct dmz_metadata *zmd, struct dm_zone *zone);
208*4882a593Smuzhiyun sector_t dmz_start_block(struct dmz_metadata *zmd, struct dm_zone *zone);
209*4882a593Smuzhiyun unsigned int dmz_nr_chunks(struct dmz_metadata *zmd);
210*4882a593Smuzhiyun 
211*4882a593Smuzhiyun bool dmz_check_dev(struct dmz_metadata *zmd);
212*4882a593Smuzhiyun bool dmz_dev_is_dying(struct dmz_metadata *zmd);
213*4882a593Smuzhiyun 
/*
 * Zone allocation flags: distinct bits, so they can be OR-ed together.
 * NOTE(review): presumably the values accepted by the flags argument of
 * dmz_alloc_zone() - confirm against dm-zoned-metadata.c.
 */
#define DMZ_ALLOC_RND		0x01
#define DMZ_ALLOC_CACHE		0x02
#define DMZ_ALLOC_SEQ		0x04
#define DMZ_ALLOC_RECLAIM	0x10
218*4882a593Smuzhiyun 
/* Zone allocation and release. */
struct dm_zone *dmz_alloc_zone(struct dmz_metadata *zmd,
			       unsigned int dev_idx, unsigned long flags);
void dmz_free_zone(struct dmz_metadata *zmd, struct dm_zone *zone);

/* Zone <-> chunk mapping. */
void dmz_map_zone(struct dmz_metadata *zmd, struct dm_zone *zone,
		  unsigned int chunk);
void dmz_unmap_zone(struct dmz_metadata *zmd, struct dm_zone *zone);

/* Zone counters; the idx variants take an index (presumably a device index - confirm). */
unsigned int dmz_nr_zones(struct dmz_metadata *zmd);
unsigned int dmz_nr_cache_zones(struct dmz_metadata *zmd);
unsigned int dmz_nr_unmap_cache_zones(struct dmz_metadata *zmd);
unsigned int dmz_nr_rnd_zones(struct dmz_metadata *zmd, int idx);
unsigned int dmz_nr_unmap_rnd_zones(struct dmz_metadata *zmd, int idx);
unsigned int dmz_nr_seq_zones(struct dmz_metadata *zmd, int idx);
unsigned int dmz_nr_unmap_seq_zones(struct dmz_metadata *zmd, int idx);

/* Zone geometry; the shift variants are used by dmz_bio_chunk(). */
unsigned int dmz_zone_nr_blocks(struct dmz_metadata *zmd);
unsigned int dmz_zone_nr_blocks_shift(struct dmz_metadata *zmd);
unsigned int dmz_zone_nr_sectors(struct dmz_metadata *zmd);
unsigned int dmz_zone_nr_sectors_shift(struct dmz_metadata *zmd);
237*4882a593Smuzhiyun 
238*4882a593Smuzhiyun /*
239*4882a593Smuzhiyun  * Activate a zone (increment its reference count).
240*4882a593Smuzhiyun  */
dmz_activate_zone(struct dm_zone * zone)241*4882a593Smuzhiyun static inline void dmz_activate_zone(struct dm_zone *zone)
242*4882a593Smuzhiyun {
243*4882a593Smuzhiyun 	atomic_inc(&zone->refcount);
244*4882a593Smuzhiyun }
245*4882a593Smuzhiyun 
246*4882a593Smuzhiyun int dmz_lock_zone_reclaim(struct dm_zone *zone);
247*4882a593Smuzhiyun void dmz_unlock_zone_reclaim(struct dm_zone *zone);
248*4882a593Smuzhiyun struct dm_zone *dmz_get_zone_for_reclaim(struct dmz_metadata *zmd,
249*4882a593Smuzhiyun 					 unsigned int dev_idx, bool idle);
250*4882a593Smuzhiyun 
251*4882a593Smuzhiyun struct dm_zone *dmz_get_chunk_mapping(struct dmz_metadata *zmd,
252*4882a593Smuzhiyun 				      unsigned int chunk, int op);
253*4882a593Smuzhiyun void dmz_put_chunk_mapping(struct dmz_metadata *zmd, struct dm_zone *zone);
254*4882a593Smuzhiyun struct dm_zone *dmz_get_chunk_buffer(struct dmz_metadata *zmd,
255*4882a593Smuzhiyun 				     struct dm_zone *dzone);
256*4882a593Smuzhiyun 
257*4882a593Smuzhiyun int dmz_validate_blocks(struct dmz_metadata *zmd, struct dm_zone *zone,
258*4882a593Smuzhiyun 			sector_t chunk_block, unsigned int nr_blocks);
259*4882a593Smuzhiyun int dmz_invalidate_blocks(struct dmz_metadata *zmd, struct dm_zone *zone,
260*4882a593Smuzhiyun 			  sector_t chunk_block, unsigned int nr_blocks);
261*4882a593Smuzhiyun int dmz_block_valid(struct dmz_metadata *zmd, struct dm_zone *zone,
262*4882a593Smuzhiyun 		    sector_t chunk_block);
263*4882a593Smuzhiyun int dmz_first_valid_block(struct dmz_metadata *zmd, struct dm_zone *zone,
264*4882a593Smuzhiyun 			  sector_t *chunk_block);
265*4882a593Smuzhiyun int dmz_copy_valid_blocks(struct dmz_metadata *zmd, struct dm_zone *from_zone,
266*4882a593Smuzhiyun 			  struct dm_zone *to_zone);
267*4882a593Smuzhiyun int dmz_merge_valid_blocks(struct dmz_metadata *zmd, struct dm_zone *from_zone,
268*4882a593Smuzhiyun 			   struct dm_zone *to_zone, sector_t chunk_block);
269*4882a593Smuzhiyun 
/*
 * Functions defined in dm-zoned-reclaim.c
 */
int dmz_ctr_reclaim(struct dmz_metadata *zmd, struct dmz_reclaim **zrc, int idx);
void dmz_dtr_reclaim(struct dmz_reclaim *zrc);
void dmz_suspend_reclaim(struct dmz_reclaim *zrc);
void dmz_resume_reclaim(struct dmz_reclaim *zrc);
/* Called by dmz_deactivate_zone() before it drops the zone reference */
void dmz_reclaim_bio_acc(struct dmz_reclaim *zrc);
void dmz_schedule_reclaim(struct dmz_reclaim *zrc);
279*4882a593Smuzhiyun 
280*4882a593Smuzhiyun /*
281*4882a593Smuzhiyun  * Functions defined in dm-zoned-target.c
282*4882a593Smuzhiyun  */
283*4882a593Smuzhiyun bool dmz_bdev_is_dying(struct dmz_dev *dmz_dev);
284*4882a593Smuzhiyun bool dmz_check_bdev(struct dmz_dev *dmz_dev);
285*4882a593Smuzhiyun 
286*4882a593Smuzhiyun /*
287*4882a593Smuzhiyun  * Deactivate a zone. This decrement the zone reference counter
288*4882a593Smuzhiyun  * indicating that all BIOs to the zone have completed when the count is 0.
289*4882a593Smuzhiyun  */
dmz_deactivate_zone(struct dm_zone * zone)290*4882a593Smuzhiyun static inline void dmz_deactivate_zone(struct dm_zone *zone)
291*4882a593Smuzhiyun {
292*4882a593Smuzhiyun 	dmz_reclaim_bio_acc(zone->dev->reclaim);
293*4882a593Smuzhiyun 	atomic_dec(&zone->refcount);
294*4882a593Smuzhiyun }
295*4882a593Smuzhiyun 
296*4882a593Smuzhiyun /*
297*4882a593Smuzhiyun  * Test if a zone is active, that is, has a refcount > 0.
298*4882a593Smuzhiyun  */
dmz_is_active(struct dm_zone * zone)299*4882a593Smuzhiyun static inline bool dmz_is_active(struct dm_zone *zone)
300*4882a593Smuzhiyun {
301*4882a593Smuzhiyun 	return atomic_read(&zone->refcount);
302*4882a593Smuzhiyun }
303*4882a593Smuzhiyun 
304*4882a593Smuzhiyun #endif /* DM_ZONED_H */
305