xref: /OK3568_Linux_fs/kernel/drivers/vfio/virqfd.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
// SPDX-License-Identifier: GPL-2.0-only
/*
 * VFIO generic eventfd code for IRQFD support.
 * Derived from drivers/vfio/pci/vfio_pci_intrs.c
 *
 * Copyright (C) 2012 Red Hat, Inc.  All rights reserved.
 *     Author: Alex Williamson <alex.williamson@redhat.com>
 */
9*4882a593Smuzhiyun 
10*4882a593Smuzhiyun #include <linux/vfio.h>
11*4882a593Smuzhiyun #include <linux/eventfd.h>
12*4882a593Smuzhiyun #include <linux/file.h>
13*4882a593Smuzhiyun #include <linux/module.h>
14*4882a593Smuzhiyun #include <linux/slab.h>
15*4882a593Smuzhiyun 
/* Module metadata strings consumed by the MODULE_*() macros at end of file. */
#define DRIVER_VERSION  "0.1"
#define DRIVER_AUTHOR   "Alex Williamson <alex.williamson@redhat.com>"
#define DRIVER_DESC     "IRQFD support for VFIO bus drivers"

/* Workqueue on which virqfd shutdown (release) work is queued. */
static struct workqueue_struct *vfio_irqfd_cleanup_wq;

/* Serializes updates of the callers' virqfd pointers (*pvirqfd). */
static DEFINE_SPINLOCK(virqfd_lock);
22*4882a593Smuzhiyun 
vfio_virqfd_init(void)23*4882a593Smuzhiyun static int __init vfio_virqfd_init(void)
24*4882a593Smuzhiyun {
25*4882a593Smuzhiyun 	vfio_irqfd_cleanup_wq =
26*4882a593Smuzhiyun 		create_singlethread_workqueue("vfio-irqfd-cleanup");
27*4882a593Smuzhiyun 	if (!vfio_irqfd_cleanup_wq)
28*4882a593Smuzhiyun 		return -ENOMEM;
29*4882a593Smuzhiyun 
30*4882a593Smuzhiyun 	return 0;
31*4882a593Smuzhiyun }
32*4882a593Smuzhiyun 
vfio_virqfd_exit(void)33*4882a593Smuzhiyun static void __exit vfio_virqfd_exit(void)
34*4882a593Smuzhiyun {
35*4882a593Smuzhiyun 	destroy_workqueue(vfio_irqfd_cleanup_wq);
36*4882a593Smuzhiyun }
37*4882a593Smuzhiyun 
virqfd_deactivate(struct virqfd * virqfd)38*4882a593Smuzhiyun static void virqfd_deactivate(struct virqfd *virqfd)
39*4882a593Smuzhiyun {
40*4882a593Smuzhiyun 	queue_work(vfio_irqfd_cleanup_wq, &virqfd->shutdown);
41*4882a593Smuzhiyun }
42*4882a593Smuzhiyun 
/*
 * Wait-queue callback registered for the virqfd's eventfd (see
 * init_waitqueue_func_entry() in vfio_virqfd_enable()).
 *
 * @wait: wait queue entry embedded in the struct virqfd
 * @mode: unused
 * @sync: unused
 * @key:  poll event mask, decoded with key_to_poll()
 *
 * On EPOLLIN the optional handler is invoked; the inject work is scheduled
 * when there is no handler or the handler returns non-zero, provided a
 * thread callback is set.  On EPOLLHUP the virqfd is queued for release
 * unless that has already been done.
 *
 * Always returns 0.
 */
static int virqfd_wakeup(wait_queue_entry_t *wait, unsigned mode, int sync, void *key)
{
	struct virqfd *virqfd = container_of(wait, struct virqfd, wait);
	__poll_t flags = key_to_poll(key);

	if (flags & EPOLLIN) {
		/* An event has been signaled, call function */
		if ((!virqfd->handler ||
		     virqfd->handler(virqfd->opaque, virqfd->data)) &&
		    virqfd->thread)
			schedule_work(&virqfd->inject);
	}

	if (flags & EPOLLHUP) {
		/*
		 * Saved IRQ state for the spinlock; named distinctly so it
		 * does not shadow the poll mask 'flags' above.
		 */
		unsigned long irq_flags;

		spin_lock_irqsave(&virqfd_lock, irq_flags);

		/*
		 * The eventfd is closing, if the virqfd has not yet been
		 * queued for release, as determined by testing whether the
		 * virqfd pointer to it is still valid, queue it now.  As
		 * with kvm irqfds, we know we won't race against the virqfd
		 * going away because we hold the lock to get here.
		 */
		if (*(virqfd->pvirqfd) == virqfd) {
			*(virqfd->pvirqfd) = NULL;
			virqfd_deactivate(virqfd);
		}

		spin_unlock_irqrestore(&virqfd_lock, irq_flags);
	}

	return 0;
}
77*4882a593Smuzhiyun 
/*
 * poll_table queue callback (installed via init_poll_funcptr() in
 * vfio_virqfd_enable()): adds the virqfd's wait entry to the wait queue
 * head handed in by the poll implementation.
 */
static void virqfd_ptable_queue_proc(struct file *file,
				     wait_queue_head_t *wqh, poll_table *pt)
{
	struct virqfd *virqfd;

	virqfd = container_of(pt, struct virqfd, pt);
	add_wait_queue(wqh, &virqfd->wait);
}
84*4882a593Smuzhiyun 
virqfd_shutdown(struct work_struct * work)85*4882a593Smuzhiyun static void virqfd_shutdown(struct work_struct *work)
86*4882a593Smuzhiyun {
87*4882a593Smuzhiyun 	struct virqfd *virqfd = container_of(work, struct virqfd, shutdown);
88*4882a593Smuzhiyun 	u64 cnt;
89*4882a593Smuzhiyun 
90*4882a593Smuzhiyun 	eventfd_ctx_remove_wait_queue(virqfd->eventfd, &virqfd->wait, &cnt);
91*4882a593Smuzhiyun 	flush_work(&virqfd->inject);
92*4882a593Smuzhiyun 	eventfd_ctx_put(virqfd->eventfd);
93*4882a593Smuzhiyun 
94*4882a593Smuzhiyun 	kfree(virqfd);
95*4882a593Smuzhiyun }
96*4882a593Smuzhiyun 
virqfd_inject(struct work_struct * work)97*4882a593Smuzhiyun static void virqfd_inject(struct work_struct *work)
98*4882a593Smuzhiyun {
99*4882a593Smuzhiyun 	struct virqfd *virqfd = container_of(work, struct virqfd, inject);
100*4882a593Smuzhiyun 	if (virqfd->thread)
101*4882a593Smuzhiyun 		virqfd->thread(virqfd->opaque, virqfd->data);
102*4882a593Smuzhiyun }
103*4882a593Smuzhiyun 
vfio_virqfd_enable(void * opaque,int (* handler)(void *,void *),void (* thread)(void *,void *),void * data,struct virqfd ** pvirqfd,int fd)104*4882a593Smuzhiyun int vfio_virqfd_enable(void *opaque,
105*4882a593Smuzhiyun 		       int (*handler)(void *, void *),
106*4882a593Smuzhiyun 		       void (*thread)(void *, void *),
107*4882a593Smuzhiyun 		       void *data, struct virqfd **pvirqfd, int fd)
108*4882a593Smuzhiyun {
109*4882a593Smuzhiyun 	struct fd irqfd;
110*4882a593Smuzhiyun 	struct eventfd_ctx *ctx;
111*4882a593Smuzhiyun 	struct virqfd *virqfd;
112*4882a593Smuzhiyun 	int ret = 0;
113*4882a593Smuzhiyun 	__poll_t events;
114*4882a593Smuzhiyun 
115*4882a593Smuzhiyun 	virqfd = kzalloc(sizeof(*virqfd), GFP_KERNEL);
116*4882a593Smuzhiyun 	if (!virqfd)
117*4882a593Smuzhiyun 		return -ENOMEM;
118*4882a593Smuzhiyun 
119*4882a593Smuzhiyun 	virqfd->pvirqfd = pvirqfd;
120*4882a593Smuzhiyun 	virqfd->opaque = opaque;
121*4882a593Smuzhiyun 	virqfd->handler = handler;
122*4882a593Smuzhiyun 	virqfd->thread = thread;
123*4882a593Smuzhiyun 	virqfd->data = data;
124*4882a593Smuzhiyun 
125*4882a593Smuzhiyun 	INIT_WORK(&virqfd->shutdown, virqfd_shutdown);
126*4882a593Smuzhiyun 	INIT_WORK(&virqfd->inject, virqfd_inject);
127*4882a593Smuzhiyun 
128*4882a593Smuzhiyun 	irqfd = fdget(fd);
129*4882a593Smuzhiyun 	if (!irqfd.file) {
130*4882a593Smuzhiyun 		ret = -EBADF;
131*4882a593Smuzhiyun 		goto err_fd;
132*4882a593Smuzhiyun 	}
133*4882a593Smuzhiyun 
134*4882a593Smuzhiyun 	ctx = eventfd_ctx_fileget(irqfd.file);
135*4882a593Smuzhiyun 	if (IS_ERR(ctx)) {
136*4882a593Smuzhiyun 		ret = PTR_ERR(ctx);
137*4882a593Smuzhiyun 		goto err_ctx;
138*4882a593Smuzhiyun 	}
139*4882a593Smuzhiyun 
140*4882a593Smuzhiyun 	virqfd->eventfd = ctx;
141*4882a593Smuzhiyun 
142*4882a593Smuzhiyun 	/*
143*4882a593Smuzhiyun 	 * virqfds can be released by closing the eventfd or directly
144*4882a593Smuzhiyun 	 * through ioctl.  These are both done through a workqueue, so
145*4882a593Smuzhiyun 	 * we update the pointer to the virqfd under lock to avoid
146*4882a593Smuzhiyun 	 * pushing multiple jobs to release the same virqfd.
147*4882a593Smuzhiyun 	 */
148*4882a593Smuzhiyun 	spin_lock_irq(&virqfd_lock);
149*4882a593Smuzhiyun 
150*4882a593Smuzhiyun 	if (*pvirqfd) {
151*4882a593Smuzhiyun 		spin_unlock_irq(&virqfd_lock);
152*4882a593Smuzhiyun 		ret = -EBUSY;
153*4882a593Smuzhiyun 		goto err_busy;
154*4882a593Smuzhiyun 	}
155*4882a593Smuzhiyun 	*pvirqfd = virqfd;
156*4882a593Smuzhiyun 
157*4882a593Smuzhiyun 	spin_unlock_irq(&virqfd_lock);
158*4882a593Smuzhiyun 
159*4882a593Smuzhiyun 	/*
160*4882a593Smuzhiyun 	 * Install our own custom wake-up handling so we are notified via
161*4882a593Smuzhiyun 	 * a callback whenever someone signals the underlying eventfd.
162*4882a593Smuzhiyun 	 */
163*4882a593Smuzhiyun 	init_waitqueue_func_entry(&virqfd->wait, virqfd_wakeup);
164*4882a593Smuzhiyun 	init_poll_funcptr(&virqfd->pt, virqfd_ptable_queue_proc);
165*4882a593Smuzhiyun 
166*4882a593Smuzhiyun 	events = vfs_poll(irqfd.file, &virqfd->pt);
167*4882a593Smuzhiyun 
168*4882a593Smuzhiyun 	/*
169*4882a593Smuzhiyun 	 * Check if there was an event already pending on the eventfd
170*4882a593Smuzhiyun 	 * before we registered and trigger it as if we didn't miss it.
171*4882a593Smuzhiyun 	 */
172*4882a593Smuzhiyun 	if (events & EPOLLIN) {
173*4882a593Smuzhiyun 		if ((!handler || handler(opaque, data)) && thread)
174*4882a593Smuzhiyun 			schedule_work(&virqfd->inject);
175*4882a593Smuzhiyun 	}
176*4882a593Smuzhiyun 
177*4882a593Smuzhiyun 	/*
178*4882a593Smuzhiyun 	 * Do not drop the file until the irqfd is fully initialized,
179*4882a593Smuzhiyun 	 * otherwise we might race against the EPOLLHUP.
180*4882a593Smuzhiyun 	 */
181*4882a593Smuzhiyun 	fdput(irqfd);
182*4882a593Smuzhiyun 
183*4882a593Smuzhiyun 	return 0;
184*4882a593Smuzhiyun err_busy:
185*4882a593Smuzhiyun 	eventfd_ctx_put(ctx);
186*4882a593Smuzhiyun err_ctx:
187*4882a593Smuzhiyun 	fdput(irqfd);
188*4882a593Smuzhiyun err_fd:
189*4882a593Smuzhiyun 	kfree(virqfd);
190*4882a593Smuzhiyun 
191*4882a593Smuzhiyun 	return ret;
192*4882a593Smuzhiyun }
193*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(vfio_virqfd_enable);
194*4882a593Smuzhiyun 
vfio_virqfd_disable(struct virqfd ** pvirqfd)195*4882a593Smuzhiyun void vfio_virqfd_disable(struct virqfd **pvirqfd)
196*4882a593Smuzhiyun {
197*4882a593Smuzhiyun 	unsigned long flags;
198*4882a593Smuzhiyun 
199*4882a593Smuzhiyun 	spin_lock_irqsave(&virqfd_lock, flags);
200*4882a593Smuzhiyun 
201*4882a593Smuzhiyun 	if (*pvirqfd) {
202*4882a593Smuzhiyun 		virqfd_deactivate(*pvirqfd);
203*4882a593Smuzhiyun 		*pvirqfd = NULL;
204*4882a593Smuzhiyun 	}
205*4882a593Smuzhiyun 
206*4882a593Smuzhiyun 	spin_unlock_irqrestore(&virqfd_lock, flags);
207*4882a593Smuzhiyun 
208*4882a593Smuzhiyun 	/*
209*4882a593Smuzhiyun 	 * Block until we know all outstanding shutdown jobs have completed.
210*4882a593Smuzhiyun 	 * Even if we don't queue the job, flush the wq to be sure it's
211*4882a593Smuzhiyun 	 * been released.
212*4882a593Smuzhiyun 	 */
213*4882a593Smuzhiyun 	flush_workqueue(vfio_irqfd_cleanup_wq);
214*4882a593Smuzhiyun }
215*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(vfio_virqfd_disable);
216*4882a593Smuzhiyun 
217*4882a593Smuzhiyun module_init(vfio_virqfd_init);
218*4882a593Smuzhiyun module_exit(vfio_virqfd_exit);
219*4882a593Smuzhiyun 
220*4882a593Smuzhiyun MODULE_VERSION(DRIVER_VERSION);
221*4882a593Smuzhiyun MODULE_LICENSE("GPL v2");
222*4882a593Smuzhiyun MODULE_AUTHOR(DRIVER_AUTHOR);
223*4882a593Smuzhiyun MODULE_DESCRIPTION(DRIVER_DESC);
224