1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0-or-later
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun * Filename: dev.c
4*4882a593Smuzhiyun *
5*4882a593Smuzhiyun * Authors: Joshua Morris <josh.h.morris@us.ibm.com>
6*4882a593Smuzhiyun * Philip Kelleher <pjk1939@linux.vnet.ibm.com>
7*4882a593Smuzhiyun *
8*4882a593Smuzhiyun * (C) Copyright 2013 IBM Corporation
9*4882a593Smuzhiyun */
10*4882a593Smuzhiyun
11*4882a593Smuzhiyun #include <linux/kernel.h>
12*4882a593Smuzhiyun #include <linux/interrupt.h>
13*4882a593Smuzhiyun #include <linux/module.h>
14*4882a593Smuzhiyun #include <linux/pci.h>
15*4882a593Smuzhiyun #include <linux/slab.h>
16*4882a593Smuzhiyun
17*4882a593Smuzhiyun #include <linux/hdreg.h>
18*4882a593Smuzhiyun #include <linux/genhd.h>
19*4882a593Smuzhiyun #include <linux/blkdev.h>
20*4882a593Smuzhiyun #include <linux/bio.h>
21*4882a593Smuzhiyun
22*4882a593Smuzhiyun #include <linux/fs.h>
23*4882a593Smuzhiyun
24*4882a593Smuzhiyun #include "rsxx_priv.h"
25*4882a593Smuzhiyun
26*4882a593Smuzhiyun static unsigned int blkdev_minors = 64;
27*4882a593Smuzhiyun module_param(blkdev_minors, uint, 0444);
28*4882a593Smuzhiyun MODULE_PARM_DESC(blkdev_minors, "Number of minors(partitions)");
29*4882a593Smuzhiyun
30*4882a593Smuzhiyun /*
31*4882a593Smuzhiyun * For now I'm making this tweakable in case any applications hit this limit.
32*4882a593Smuzhiyun * If you see a "bio too big" error in the log you will need to raise this
33*4882a593Smuzhiyun * value.
34*4882a593Smuzhiyun */
35*4882a593Smuzhiyun static unsigned int blkdev_max_hw_sectors = 1024;
36*4882a593Smuzhiyun module_param(blkdev_max_hw_sectors, uint, 0444);
37*4882a593Smuzhiyun MODULE_PARM_DESC(blkdev_max_hw_sectors, "Max hw sectors for a single BIO");
38*4882a593Smuzhiyun
39*4882a593Smuzhiyun static unsigned int enable_blkdev = 1;
40*4882a593Smuzhiyun module_param(enable_blkdev , uint, 0444);
41*4882a593Smuzhiyun MODULE_PARM_DESC(enable_blkdev, "Enable block device interfaces");
42*4882a593Smuzhiyun
43*4882a593Smuzhiyun
44*4882a593Smuzhiyun struct rsxx_bio_meta {
45*4882a593Smuzhiyun struct bio *bio;
46*4882a593Smuzhiyun atomic_t pending_dmas;
47*4882a593Smuzhiyun atomic_t error;
48*4882a593Smuzhiyun unsigned long start_time;
49*4882a593Smuzhiyun };
50*4882a593Smuzhiyun
51*4882a593Smuzhiyun static struct kmem_cache *bio_meta_pool;
52*4882a593Smuzhiyun
53*4882a593Smuzhiyun static blk_qc_t rsxx_submit_bio(struct bio *bio);
54*4882a593Smuzhiyun
55*4882a593Smuzhiyun /*----------------- Block Device Operations -----------------*/
/*
 * rsxx_blkdev_ioctl - handle the driver-private ioctls of the block device.
 * @bdev: block device the ioctl was issued on
 * @mode: open mode of the caller (unused)
 * @cmd:  ioctl command number
 * @arg:  user-space pointer forwarded to rsxx_reg_access()
 *
 * Returns the result of rsxx_reg_access() for RSXX_GETREG and RSXX_SETREG,
 * and -ENOTTY for every other command.
 */
static int rsxx_blkdev_ioctl(struct block_device *bdev, fmode_t mode,
			     unsigned int cmd, unsigned long arg)
{
	struct rsxx_cardinfo *card = bdev->bd_disk->private_data;
	void __user *uarg = (void __user *)arg;

	/* Last argument of rsxx_reg_access(): 1 for GETREG, 0 for SETREG. */
	if (cmd == RSXX_GETREG)
		return rsxx_reg_access(card, uarg, 1);

	if (cmd == RSXX_SETREG)
		return rsxx_reg_access(card, uarg, 0);

	return -ENOTTY;
}
72*4882a593Smuzhiyun
rsxx_getgeo(struct block_device * bdev,struct hd_geometry * geo)73*4882a593Smuzhiyun static int rsxx_getgeo(struct block_device *bdev, struct hd_geometry *geo)
74*4882a593Smuzhiyun {
75*4882a593Smuzhiyun struct rsxx_cardinfo *card = bdev->bd_disk->private_data;
76*4882a593Smuzhiyun u64 blocks = card->size8 >> 9;
77*4882a593Smuzhiyun
78*4882a593Smuzhiyun /*
79*4882a593Smuzhiyun * get geometry: Fake it. I haven't found any drivers that set
80*4882a593Smuzhiyun * geo->start, so we won't either.
81*4882a593Smuzhiyun */
82*4882a593Smuzhiyun if (card->size8) {
83*4882a593Smuzhiyun geo->heads = 64;
84*4882a593Smuzhiyun geo->sectors = 16;
85*4882a593Smuzhiyun do_div(blocks, (geo->heads * geo->sectors));
86*4882a593Smuzhiyun geo->cylinders = blocks;
87*4882a593Smuzhiyun } else {
88*4882a593Smuzhiyun geo->heads = 0;
89*4882a593Smuzhiyun geo->sectors = 0;
90*4882a593Smuzhiyun geo->cylinders = 0;
91*4882a593Smuzhiyun }
92*4882a593Smuzhiyun return 0;
93*4882a593Smuzhiyun }
94*4882a593Smuzhiyun
95*4882a593Smuzhiyun static const struct block_device_operations rsxx_fops = {
96*4882a593Smuzhiyun .owner = THIS_MODULE,
97*4882a593Smuzhiyun .submit_bio = rsxx_submit_bio,
98*4882a593Smuzhiyun .getgeo = rsxx_getgeo,
99*4882a593Smuzhiyun .ioctl = rsxx_blkdev_ioctl,
100*4882a593Smuzhiyun };
101*4882a593Smuzhiyun
bio_dma_done_cb(struct rsxx_cardinfo * card,void * cb_data,unsigned int error)102*4882a593Smuzhiyun static void bio_dma_done_cb(struct rsxx_cardinfo *card,
103*4882a593Smuzhiyun void *cb_data,
104*4882a593Smuzhiyun unsigned int error)
105*4882a593Smuzhiyun {
106*4882a593Smuzhiyun struct rsxx_bio_meta *meta = cb_data;
107*4882a593Smuzhiyun
108*4882a593Smuzhiyun if (error)
109*4882a593Smuzhiyun atomic_set(&meta->error, 1);
110*4882a593Smuzhiyun
111*4882a593Smuzhiyun if (atomic_dec_and_test(&meta->pending_dmas)) {
112*4882a593Smuzhiyun if (!card->eeh_state && card->gendisk)
113*4882a593Smuzhiyun bio_end_io_acct(meta->bio, meta->start_time);
114*4882a593Smuzhiyun
115*4882a593Smuzhiyun if (atomic_read(&meta->error))
116*4882a593Smuzhiyun bio_io_error(meta->bio);
117*4882a593Smuzhiyun else
118*4882a593Smuzhiyun bio_endio(meta->bio);
119*4882a593Smuzhiyun kmem_cache_free(bio_meta_pool, meta);
120*4882a593Smuzhiyun }
121*4882a593Smuzhiyun }
122*4882a593Smuzhiyun
rsxx_submit_bio(struct bio * bio)123*4882a593Smuzhiyun static blk_qc_t rsxx_submit_bio(struct bio *bio)
124*4882a593Smuzhiyun {
125*4882a593Smuzhiyun struct rsxx_cardinfo *card = bio->bi_disk->private_data;
126*4882a593Smuzhiyun struct rsxx_bio_meta *bio_meta;
127*4882a593Smuzhiyun blk_status_t st = BLK_STS_IOERR;
128*4882a593Smuzhiyun
129*4882a593Smuzhiyun blk_queue_split(&bio);
130*4882a593Smuzhiyun
131*4882a593Smuzhiyun might_sleep();
132*4882a593Smuzhiyun
133*4882a593Smuzhiyun if (!card)
134*4882a593Smuzhiyun goto req_err;
135*4882a593Smuzhiyun
136*4882a593Smuzhiyun if (bio_end_sector(bio) > get_capacity(card->gendisk))
137*4882a593Smuzhiyun goto req_err;
138*4882a593Smuzhiyun
139*4882a593Smuzhiyun if (unlikely(card->halt))
140*4882a593Smuzhiyun goto req_err;
141*4882a593Smuzhiyun
142*4882a593Smuzhiyun if (unlikely(card->dma_fault))
143*4882a593Smuzhiyun goto req_err;
144*4882a593Smuzhiyun
145*4882a593Smuzhiyun if (bio->bi_iter.bi_size == 0) {
146*4882a593Smuzhiyun dev_err(CARD_TO_DEV(card), "size zero BIO!\n");
147*4882a593Smuzhiyun goto req_err;
148*4882a593Smuzhiyun }
149*4882a593Smuzhiyun
150*4882a593Smuzhiyun bio_meta = kmem_cache_alloc(bio_meta_pool, GFP_KERNEL);
151*4882a593Smuzhiyun if (!bio_meta) {
152*4882a593Smuzhiyun st = BLK_STS_RESOURCE;
153*4882a593Smuzhiyun goto req_err;
154*4882a593Smuzhiyun }
155*4882a593Smuzhiyun
156*4882a593Smuzhiyun bio_meta->bio = bio;
157*4882a593Smuzhiyun atomic_set(&bio_meta->error, 0);
158*4882a593Smuzhiyun atomic_set(&bio_meta->pending_dmas, 0);
159*4882a593Smuzhiyun
160*4882a593Smuzhiyun if (!unlikely(card->halt))
161*4882a593Smuzhiyun bio_meta->start_time = bio_start_io_acct(bio);
162*4882a593Smuzhiyun
163*4882a593Smuzhiyun dev_dbg(CARD_TO_DEV(card), "BIO[%c]: meta: %p addr8: x%llx size: %d\n",
164*4882a593Smuzhiyun bio_data_dir(bio) ? 'W' : 'R', bio_meta,
165*4882a593Smuzhiyun (u64)bio->bi_iter.bi_sector << 9, bio->bi_iter.bi_size);
166*4882a593Smuzhiyun
167*4882a593Smuzhiyun st = rsxx_dma_queue_bio(card, bio, &bio_meta->pending_dmas,
168*4882a593Smuzhiyun bio_dma_done_cb, bio_meta);
169*4882a593Smuzhiyun if (st)
170*4882a593Smuzhiyun goto queue_err;
171*4882a593Smuzhiyun
172*4882a593Smuzhiyun return BLK_QC_T_NONE;
173*4882a593Smuzhiyun
174*4882a593Smuzhiyun queue_err:
175*4882a593Smuzhiyun kmem_cache_free(bio_meta_pool, bio_meta);
176*4882a593Smuzhiyun req_err:
177*4882a593Smuzhiyun if (st)
178*4882a593Smuzhiyun bio->bi_status = st;
179*4882a593Smuzhiyun bio_endio(bio);
180*4882a593Smuzhiyun return BLK_QC_T_NONE;
181*4882a593Smuzhiyun }
182*4882a593Smuzhiyun
183*4882a593Smuzhiyun /*----------------- Device Setup -------------------*/
rsxx_discard_supported(struct rsxx_cardinfo * card)184*4882a593Smuzhiyun static bool rsxx_discard_supported(struct rsxx_cardinfo *card)
185*4882a593Smuzhiyun {
186*4882a593Smuzhiyun unsigned char pci_rev;
187*4882a593Smuzhiyun
188*4882a593Smuzhiyun pci_read_config_byte(card->dev, PCI_REVISION_ID, &pci_rev);
189*4882a593Smuzhiyun
190*4882a593Smuzhiyun return (pci_rev >= RSXX_DISCARD_SUPPORT);
191*4882a593Smuzhiyun }
192*4882a593Smuzhiyun
rsxx_attach_dev(struct rsxx_cardinfo * card)193*4882a593Smuzhiyun int rsxx_attach_dev(struct rsxx_cardinfo *card)
194*4882a593Smuzhiyun {
195*4882a593Smuzhiyun mutex_lock(&card->dev_lock);
196*4882a593Smuzhiyun
197*4882a593Smuzhiyun /* The block device requires the stripe size from the config. */
198*4882a593Smuzhiyun if (enable_blkdev) {
199*4882a593Smuzhiyun if (card->config_valid)
200*4882a593Smuzhiyun set_capacity(card->gendisk, card->size8 >> 9);
201*4882a593Smuzhiyun else
202*4882a593Smuzhiyun set_capacity(card->gendisk, 0);
203*4882a593Smuzhiyun device_add_disk(CARD_TO_DEV(card), card->gendisk, NULL);
204*4882a593Smuzhiyun card->bdev_attached = 1;
205*4882a593Smuzhiyun }
206*4882a593Smuzhiyun
207*4882a593Smuzhiyun mutex_unlock(&card->dev_lock);
208*4882a593Smuzhiyun
209*4882a593Smuzhiyun return 0;
210*4882a593Smuzhiyun }
211*4882a593Smuzhiyun
rsxx_detach_dev(struct rsxx_cardinfo * card)212*4882a593Smuzhiyun void rsxx_detach_dev(struct rsxx_cardinfo *card)
213*4882a593Smuzhiyun {
214*4882a593Smuzhiyun mutex_lock(&card->dev_lock);
215*4882a593Smuzhiyun
216*4882a593Smuzhiyun if (card->bdev_attached) {
217*4882a593Smuzhiyun del_gendisk(card->gendisk);
218*4882a593Smuzhiyun card->bdev_attached = 0;
219*4882a593Smuzhiyun }
220*4882a593Smuzhiyun
221*4882a593Smuzhiyun mutex_unlock(&card->dev_lock);
222*4882a593Smuzhiyun }
223*4882a593Smuzhiyun
rsxx_setup_dev(struct rsxx_cardinfo * card)224*4882a593Smuzhiyun int rsxx_setup_dev(struct rsxx_cardinfo *card)
225*4882a593Smuzhiyun {
226*4882a593Smuzhiyun unsigned short blk_size;
227*4882a593Smuzhiyun
228*4882a593Smuzhiyun mutex_init(&card->dev_lock);
229*4882a593Smuzhiyun
230*4882a593Smuzhiyun if (!enable_blkdev)
231*4882a593Smuzhiyun return 0;
232*4882a593Smuzhiyun
233*4882a593Smuzhiyun card->major = register_blkdev(0, DRIVER_NAME);
234*4882a593Smuzhiyun if (card->major < 0) {
235*4882a593Smuzhiyun dev_err(CARD_TO_DEV(card), "Failed to get major number\n");
236*4882a593Smuzhiyun return -ENOMEM;
237*4882a593Smuzhiyun }
238*4882a593Smuzhiyun
239*4882a593Smuzhiyun card->queue = blk_alloc_queue(NUMA_NO_NODE);
240*4882a593Smuzhiyun if (!card->queue) {
241*4882a593Smuzhiyun dev_err(CARD_TO_DEV(card), "Failed queue alloc\n");
242*4882a593Smuzhiyun unregister_blkdev(card->major, DRIVER_NAME);
243*4882a593Smuzhiyun return -ENOMEM;
244*4882a593Smuzhiyun }
245*4882a593Smuzhiyun
246*4882a593Smuzhiyun card->gendisk = alloc_disk(blkdev_minors);
247*4882a593Smuzhiyun if (!card->gendisk) {
248*4882a593Smuzhiyun dev_err(CARD_TO_DEV(card), "Failed disk alloc\n");
249*4882a593Smuzhiyun blk_cleanup_queue(card->queue);
250*4882a593Smuzhiyun unregister_blkdev(card->major, DRIVER_NAME);
251*4882a593Smuzhiyun return -ENOMEM;
252*4882a593Smuzhiyun }
253*4882a593Smuzhiyun
254*4882a593Smuzhiyun if (card->config_valid) {
255*4882a593Smuzhiyun blk_size = card->config.data.block_size;
256*4882a593Smuzhiyun blk_queue_dma_alignment(card->queue, blk_size - 1);
257*4882a593Smuzhiyun blk_queue_logical_block_size(card->queue, blk_size);
258*4882a593Smuzhiyun }
259*4882a593Smuzhiyun
260*4882a593Smuzhiyun blk_queue_max_hw_sectors(card->queue, blkdev_max_hw_sectors);
261*4882a593Smuzhiyun blk_queue_physical_block_size(card->queue, RSXX_HW_BLK_SIZE);
262*4882a593Smuzhiyun
263*4882a593Smuzhiyun blk_queue_flag_set(QUEUE_FLAG_NONROT, card->queue);
264*4882a593Smuzhiyun blk_queue_flag_clear(QUEUE_FLAG_ADD_RANDOM, card->queue);
265*4882a593Smuzhiyun if (rsxx_discard_supported(card)) {
266*4882a593Smuzhiyun blk_queue_flag_set(QUEUE_FLAG_DISCARD, card->queue);
267*4882a593Smuzhiyun blk_queue_max_discard_sectors(card->queue,
268*4882a593Smuzhiyun RSXX_HW_BLK_SIZE >> 9);
269*4882a593Smuzhiyun card->queue->limits.discard_granularity = RSXX_HW_BLK_SIZE;
270*4882a593Smuzhiyun card->queue->limits.discard_alignment = RSXX_HW_BLK_SIZE;
271*4882a593Smuzhiyun }
272*4882a593Smuzhiyun
273*4882a593Smuzhiyun snprintf(card->gendisk->disk_name, sizeof(card->gendisk->disk_name),
274*4882a593Smuzhiyun "rsxx%d", card->disk_id);
275*4882a593Smuzhiyun card->gendisk->major = card->major;
276*4882a593Smuzhiyun card->gendisk->first_minor = 0;
277*4882a593Smuzhiyun card->gendisk->fops = &rsxx_fops;
278*4882a593Smuzhiyun card->gendisk->private_data = card;
279*4882a593Smuzhiyun card->gendisk->queue = card->queue;
280*4882a593Smuzhiyun
281*4882a593Smuzhiyun return 0;
282*4882a593Smuzhiyun }
283*4882a593Smuzhiyun
rsxx_destroy_dev(struct rsxx_cardinfo * card)284*4882a593Smuzhiyun void rsxx_destroy_dev(struct rsxx_cardinfo *card)
285*4882a593Smuzhiyun {
286*4882a593Smuzhiyun if (!enable_blkdev)
287*4882a593Smuzhiyun return;
288*4882a593Smuzhiyun
289*4882a593Smuzhiyun put_disk(card->gendisk);
290*4882a593Smuzhiyun card->gendisk = NULL;
291*4882a593Smuzhiyun
292*4882a593Smuzhiyun blk_cleanup_queue(card->queue);
293*4882a593Smuzhiyun unregister_blkdev(card->major, DRIVER_NAME);
294*4882a593Smuzhiyun }
295*4882a593Smuzhiyun
rsxx_dev_init(void)296*4882a593Smuzhiyun int rsxx_dev_init(void)
297*4882a593Smuzhiyun {
298*4882a593Smuzhiyun bio_meta_pool = KMEM_CACHE(rsxx_bio_meta, SLAB_HWCACHE_ALIGN);
299*4882a593Smuzhiyun if (!bio_meta_pool)
300*4882a593Smuzhiyun return -ENOMEM;
301*4882a593Smuzhiyun
302*4882a593Smuzhiyun return 0;
303*4882a593Smuzhiyun }
304*4882a593Smuzhiyun
rsxx_dev_cleanup(void)305*4882a593Smuzhiyun void rsxx_dev_cleanup(void)
306*4882a593Smuzhiyun {
307*4882a593Smuzhiyun kmem_cache_destroy(bio_meta_pool);
308*4882a593Smuzhiyun }
309*4882a593Smuzhiyun
310*4882a593Smuzhiyun
311