1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0-or-later
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun * Virtio vhost-user driver
4*4882a593Smuzhiyun *
5*4882a593Smuzhiyun * Copyright(c) 2019 Intel Corporation
6*4882a593Smuzhiyun *
7*4882a593Smuzhiyun * This driver allows virtio devices to be used over a vhost-user socket.
8*4882a593Smuzhiyun *
9*4882a593Smuzhiyun * Guest devices can be instantiated by kernel module or command line
10*4882a593Smuzhiyun * parameters. One device will be created for each parameter. Syntax:
11*4882a593Smuzhiyun *
12*4882a593Smuzhiyun * virtio_uml.device=<socket>:<virtio_id>[:<platform_id>]
13*4882a593Smuzhiyun * where:
14*4882a593Smuzhiyun * <socket> := vhost-user socket path to connect
15*4882a593Smuzhiyun * <virtio_id> := virtio device id (as in virtio_ids.h)
16*4882a593Smuzhiyun * <platform_id> := (optional) platform device id
17*4882a593Smuzhiyun *
18*4882a593Smuzhiyun * example:
19*4882a593Smuzhiyun * virtio_uml.device=/var/uml.socket:1
20*4882a593Smuzhiyun *
21*4882a593Smuzhiyun * Based on Virtio MMIO driver by Pawel Moll, copyright 2011-2014, ARM Ltd.
22*4882a593Smuzhiyun */
23*4882a593Smuzhiyun #include <linux/module.h>
24*4882a593Smuzhiyun #include <linux/platform_device.h>
25*4882a593Smuzhiyun #include <linux/slab.h>
26*4882a593Smuzhiyun #include <linux/virtio.h>
27*4882a593Smuzhiyun #include <linux/virtio_config.h>
28*4882a593Smuzhiyun #include <linux/virtio_ring.h>
29*4882a593Smuzhiyun #include <linux/time-internal.h>
30*4882a593Smuzhiyun #include <shared/as-layout.h>
31*4882a593Smuzhiyun #include <irq_kern.h>
32*4882a593Smuzhiyun #include <init.h>
33*4882a593Smuzhiyun #include <os.h>
34*4882a593Smuzhiyun #include "vhost_user.h"
35*4882a593Smuzhiyun
/*
 * Workaround due to a conflict between irq_user.h and irqreturn.h:
 * drop any IRQ_NONE macro that is already defined at this point, so the
 * IRQ_NONE value returned by the interrupt handler in this file is not
 * replaced by that macro.
 */
#ifdef IRQ_NONE
#undef IRQ_NONE
#endif
40*4882a593Smuzhiyun
/*
 * Largest queue size this driver supports.
 * NOTE(review): presumably counted in vring entries; the users of this
 * constant are outside this part of the file - confirm.
 */
#define MAX_SUPPORTED_QUEUE_SIZE 256
42*4882a593Smuzhiyun
/*
 * Convert a pointer to the embedded struct virtio_device (the "vdev"
 * member) back into a pointer to its containing struct virtio_uml_device.
 */
#define to_virtio_uml_device(_vdev) \
	container_of(_vdev, struct virtio_uml_device, vdev)
45*4882a593Smuzhiyun
/*
 * Platform data attached to the platform device of one virtio-uml
 * instance (reached through pdev->dev.platform_data).
 */
struct virtio_uml_platform_data {
	/* virtio device id, the <virtio_id> part of the device parameter */
	u32 virtio_device_id;
	/* vhost-user socket path, the <socket> part of the device parameter */
	const char *socket_path;
	/* scheduled when the vhost-user connection is found to be reset */
	struct work_struct conn_broken_wk;
	/* NOTE(review): presumably the owning platform device - confirm */
	struct platform_device *pdev;
};
52*4882a593Smuzhiyun
/* Per-device state of one vhost-user backed virtio device. */
struct virtio_uml_device {
	/* embedded virtio device; see to_virtio_uml_device() */
	struct virtio_device vdev;
	/* platform device, used for error logging and platform data lookup */
	struct platform_device *pdev;

	/* held while a message is sent (and its ACK awaited) on sock */
	spinlock_t sock_lock;
	/*
	 * sock: vhost-user socket used for our requests and their responses
	 * req_fd: read end of the pipe on which the device sends us requests
	 */
	int sock, req_fd;
	/* feature bits as returned by VHOST_USER_GET_FEATURES */
	u64 features;
	/* protocol features, masked to what this driver supports */
	u64 protocol_features;
	/* NOTE(review): presumably the virtio device status byte - confirm */
	u8 status;
	/* when set, a connection reset breaks the device and schedules work */
	u8 registered:1;
};
64*4882a593Smuzhiyun
/*
 * Per-virtqueue bookkeeping.
 * NOTE(review): the users of this structure are outside this part of the
 * file; the field descriptions below are inferred from the names only.
 */
struct virtio_uml_vq_info {
	/* presumably the kick and call file descriptors of the queue */
	int kick_fd, call_fd;
	/* presumably a name for the queue (e.g. for its interrupt) */
	char name[32];
#ifdef CONFIG_UML_TIME_TRAVEL_SUPPORT
	/* only present when time-travel support is built in */
	struct virtqueue *vq;
	vq_callback_t *callback;
	struct time_travel_event defer;
#endif
};
74*4882a593Smuzhiyun
/*
 * Defined elsewhere; used below to describe the physical memory and
 * highmem regions in the memory table sent to the vhost-user device.
 */
extern unsigned long long physmem_size, highmem;
76*4882a593Smuzhiyun
/* dev_err() against the platform device backing a virtio_uml_device. */
#define vu_err(vu_dev, ...)	dev_err(&(vu_dev)->pdev->dev, ##__VA_ARGS__)
78*4882a593Smuzhiyun
79*4882a593Smuzhiyun /* Vhost-user protocol */
80*4882a593Smuzhiyun
/*
 * Send the complete buffer over @fd, retrying after short writes and
 * after -EINTR.
 *
 * The descriptors in @fds accompany the data only until a send call has
 * transferred something; later retries carry no descriptors.
 *
 * Returns 0 once everything was sent, otherwise the negative error
 * reported by os_sendmsg_fds().
 */
static int full_sendmsg_fds(int fd, const void *buf, unsigned int len,
			    const int *fds, unsigned int fds_num)
{
	int sent;

	for (;;) {
		sent = os_sendmsg_fds(fd, buf, len, fds, fds_num);
		if (sent > 0) {
			/* progress was made: advance and drop the fds */
			buf += sent;
			len -= sent;
			fds = NULL;
			fds_num = 0;
		}

		if (!len)
			break;
		/* any error other than an interrupted call is final */
		if (sent < 0 && sent != -EINTR)
			break;
	}

	return sent < 0 ? sent : 0;
}
100*4882a593Smuzhiyun
/*
 * Read exactly @len bytes from @fd into @buf.
 *
 * Short reads and -EINTR are retried. -EAGAIN is retried as well, unless
 * @abortable is set, in which case it is handed back to the caller.
 *
 * Returns 0 on success (including when @len is 0), -ECONNRESET when a
 * read returned 0 bytes, or the negative error from os_read_file().
 */
static int full_read(int fd, void *buf, int len, bool abortable)
{
	int rc;

	/*
	 * Nothing to read, e.g. a message that consists of a header only.
	 * Without this check the loop below would still issue one read and
	 * report its result (0, or an error such as -EAGAIN) as a failure
	 * even though no data was expected.
	 */
	if (!len)
		return 0;

	do {
		rc = os_read_file(fd, buf, len);
		if (rc > 0) {
			buf += rc;
			len -= rc;
		}
	} while (len && (rc > 0 || rc == -EINTR || (!abortable && rc == -EAGAIN)));

	if (rc < 0)
		return rc;
	/* a read of 0 bytes while data was still expected */
	if (rc == 0)
		return -ECONNRESET;
	return 0;
}
119*4882a593Smuzhiyun
vhost_user_recv_header(int fd,struct vhost_user_msg * msg)120*4882a593Smuzhiyun static int vhost_user_recv_header(int fd, struct vhost_user_msg *msg)
121*4882a593Smuzhiyun {
122*4882a593Smuzhiyun return full_read(fd, msg, sizeof(msg->header), true);
123*4882a593Smuzhiyun }
124*4882a593Smuzhiyun
vhost_user_recv(struct virtio_uml_device * vu_dev,int fd,struct vhost_user_msg * msg,size_t max_payload_size,bool wait)125*4882a593Smuzhiyun static int vhost_user_recv(struct virtio_uml_device *vu_dev,
126*4882a593Smuzhiyun int fd, struct vhost_user_msg *msg,
127*4882a593Smuzhiyun size_t max_payload_size, bool wait)
128*4882a593Smuzhiyun {
129*4882a593Smuzhiyun size_t size;
130*4882a593Smuzhiyun int rc;
131*4882a593Smuzhiyun
132*4882a593Smuzhiyun /*
133*4882a593Smuzhiyun * In virtio time-travel mode, we're handling all the vhost-user
134*4882a593Smuzhiyun * FDs by polling them whenever appropriate. However, we may get
135*4882a593Smuzhiyun * into a situation where we're sending out an interrupt message
136*4882a593Smuzhiyun * to a device (e.g. a net device) and need to handle a simulation
137*4882a593Smuzhiyun * time message while doing so, e.g. one that tells us to update
138*4882a593Smuzhiyun * our idea of how long we can run without scheduling.
139*4882a593Smuzhiyun *
140*4882a593Smuzhiyun * Thus, we need to not just read() from the given fd, but need
141*4882a593Smuzhiyun * to also handle messages for the simulation time - this function
142*4882a593Smuzhiyun * does that for us while waiting for the given fd to be readable.
143*4882a593Smuzhiyun */
144*4882a593Smuzhiyun if (wait)
145*4882a593Smuzhiyun time_travel_wait_readable(fd);
146*4882a593Smuzhiyun
147*4882a593Smuzhiyun rc = vhost_user_recv_header(fd, msg);
148*4882a593Smuzhiyun
149*4882a593Smuzhiyun if (rc == -ECONNRESET && vu_dev->registered) {
150*4882a593Smuzhiyun struct virtio_uml_platform_data *pdata;
151*4882a593Smuzhiyun
152*4882a593Smuzhiyun pdata = vu_dev->pdev->dev.platform_data;
153*4882a593Smuzhiyun
154*4882a593Smuzhiyun virtio_break_device(&vu_dev->vdev);
155*4882a593Smuzhiyun schedule_work(&pdata->conn_broken_wk);
156*4882a593Smuzhiyun }
157*4882a593Smuzhiyun if (rc)
158*4882a593Smuzhiyun return rc;
159*4882a593Smuzhiyun size = msg->header.size;
160*4882a593Smuzhiyun if (size > max_payload_size)
161*4882a593Smuzhiyun return -EPROTO;
162*4882a593Smuzhiyun return full_read(fd, &msg->payload, size, false);
163*4882a593Smuzhiyun }
164*4882a593Smuzhiyun
vhost_user_recv_resp(struct virtio_uml_device * vu_dev,struct vhost_user_msg * msg,size_t max_payload_size)165*4882a593Smuzhiyun static int vhost_user_recv_resp(struct virtio_uml_device *vu_dev,
166*4882a593Smuzhiyun struct vhost_user_msg *msg,
167*4882a593Smuzhiyun size_t max_payload_size)
168*4882a593Smuzhiyun {
169*4882a593Smuzhiyun int rc = vhost_user_recv(vu_dev, vu_dev->sock, msg,
170*4882a593Smuzhiyun max_payload_size, true);
171*4882a593Smuzhiyun
172*4882a593Smuzhiyun if (rc)
173*4882a593Smuzhiyun return rc;
174*4882a593Smuzhiyun
175*4882a593Smuzhiyun if (msg->header.flags != (VHOST_USER_FLAG_REPLY | VHOST_USER_VERSION))
176*4882a593Smuzhiyun return -EPROTO;
177*4882a593Smuzhiyun
178*4882a593Smuzhiyun return 0;
179*4882a593Smuzhiyun }
180*4882a593Smuzhiyun
/*
 * Receive a response whose payload is a single 64-bit integer and store
 * it in @value.
 *
 * Returns 0 on success, -EPROTO if the payload size does not match, or
 * the error from vhost_user_recv_resp().
 */
static int vhost_user_recv_u64(struct virtio_uml_device *vu_dev,
			       u64 *value)
{
	struct vhost_user_msg reply;
	int err;

	err = vhost_user_recv_resp(vu_dev, &reply,
				   sizeof(reply.payload.integer));
	if (err)
		return err;

	/* shorter payloads pass the max-size check above, reject them here */
	if (reply.header.size != sizeof(reply.payload.integer))
		return -EPROTO;

	*value = reply.payload.integer;
	return 0;
}
195*4882a593Smuzhiyun
vhost_user_recv_req(struct virtio_uml_device * vu_dev,struct vhost_user_msg * msg,size_t max_payload_size)196*4882a593Smuzhiyun static int vhost_user_recv_req(struct virtio_uml_device *vu_dev,
197*4882a593Smuzhiyun struct vhost_user_msg *msg,
198*4882a593Smuzhiyun size_t max_payload_size)
199*4882a593Smuzhiyun {
200*4882a593Smuzhiyun int rc = vhost_user_recv(vu_dev, vu_dev->req_fd, msg,
201*4882a593Smuzhiyun max_payload_size, false);
202*4882a593Smuzhiyun
203*4882a593Smuzhiyun if (rc)
204*4882a593Smuzhiyun return rc;
205*4882a593Smuzhiyun
206*4882a593Smuzhiyun if ((msg->header.flags & ~VHOST_USER_FLAG_NEED_REPLY) !=
207*4882a593Smuzhiyun VHOST_USER_VERSION)
208*4882a593Smuzhiyun return -EPROTO;
209*4882a593Smuzhiyun
210*4882a593Smuzhiyun return 0;
211*4882a593Smuzhiyun }
212*4882a593Smuzhiyun
vhost_user_send(struct virtio_uml_device * vu_dev,bool need_response,struct vhost_user_msg * msg,int * fds,size_t num_fds)213*4882a593Smuzhiyun static int vhost_user_send(struct virtio_uml_device *vu_dev,
214*4882a593Smuzhiyun bool need_response, struct vhost_user_msg *msg,
215*4882a593Smuzhiyun int *fds, size_t num_fds)
216*4882a593Smuzhiyun {
217*4882a593Smuzhiyun size_t size = sizeof(msg->header) + msg->header.size;
218*4882a593Smuzhiyun unsigned long flags;
219*4882a593Smuzhiyun bool request_ack;
220*4882a593Smuzhiyun int rc;
221*4882a593Smuzhiyun
222*4882a593Smuzhiyun msg->header.flags |= VHOST_USER_VERSION;
223*4882a593Smuzhiyun
224*4882a593Smuzhiyun /*
225*4882a593Smuzhiyun * The need_response flag indicates that we already need a response,
226*4882a593Smuzhiyun * e.g. to read the features. In these cases, don't request an ACK as
227*4882a593Smuzhiyun * it is meaningless. Also request an ACK only if supported.
228*4882a593Smuzhiyun */
229*4882a593Smuzhiyun request_ack = !need_response;
230*4882a593Smuzhiyun if (!(vu_dev->protocol_features &
231*4882a593Smuzhiyun BIT_ULL(VHOST_USER_PROTOCOL_F_REPLY_ACK)))
232*4882a593Smuzhiyun request_ack = false;
233*4882a593Smuzhiyun
234*4882a593Smuzhiyun if (request_ack)
235*4882a593Smuzhiyun msg->header.flags |= VHOST_USER_FLAG_NEED_REPLY;
236*4882a593Smuzhiyun
237*4882a593Smuzhiyun spin_lock_irqsave(&vu_dev->sock_lock, flags);
238*4882a593Smuzhiyun rc = full_sendmsg_fds(vu_dev->sock, msg, size, fds, num_fds);
239*4882a593Smuzhiyun if (rc < 0)
240*4882a593Smuzhiyun goto out;
241*4882a593Smuzhiyun
242*4882a593Smuzhiyun if (request_ack) {
243*4882a593Smuzhiyun uint64_t status;
244*4882a593Smuzhiyun
245*4882a593Smuzhiyun rc = vhost_user_recv_u64(vu_dev, &status);
246*4882a593Smuzhiyun if (rc)
247*4882a593Smuzhiyun goto out;
248*4882a593Smuzhiyun
249*4882a593Smuzhiyun if (status) {
250*4882a593Smuzhiyun vu_err(vu_dev, "slave reports error: %llu\n", status);
251*4882a593Smuzhiyun rc = -EIO;
252*4882a593Smuzhiyun goto out;
253*4882a593Smuzhiyun }
254*4882a593Smuzhiyun }
255*4882a593Smuzhiyun
256*4882a593Smuzhiyun out:
257*4882a593Smuzhiyun spin_unlock_irqrestore(&vu_dev->sock_lock, flags);
258*4882a593Smuzhiyun return rc;
259*4882a593Smuzhiyun }
260*4882a593Smuzhiyun
/*
 * Send a request that consists of a header only (no payload, no fds).
 * @need_response is passed through to vhost_user_send().
 */
static int vhost_user_send_no_payload(struct virtio_uml_device *vu_dev,
				      bool need_response, u32 request)
{
	struct vhost_user_msg req = {
		.header.request = request,
	};
	int err;

	err = vhost_user_send(vu_dev, need_response, &req, NULL, 0);
	return err;
}
270*4882a593Smuzhiyun
/*
 * Send a header-only request that carries exactly one file descriptor.
 * No response is read by the caller, so an ACK may be requested.
 */
static int vhost_user_send_no_payload_fd(struct virtio_uml_device *vu_dev,
					 u32 request, int fd)
{
	struct vhost_user_msg req = {
		.header.request = request,
	};
	int err;

	err = vhost_user_send(vu_dev, false, &req, &fd, 1);
	return err;
}
280*4882a593Smuzhiyun
/*
 * Send a request whose payload is a single 64-bit integer.
 * No response is read by the caller, so an ACK may be requested.
 */
static int vhost_user_send_u64(struct virtio_uml_device *vu_dev,
			       u32 request, u64 value)
{
	struct vhost_user_msg req = {
		.header.request = request,
		.header.size = sizeof(req.payload.integer),
		.payload.integer = value,
	};
	int err;

	err = vhost_user_send(vu_dev, false, &req, NULL, 0);
	return err;
}
292*4882a593Smuzhiyun
vhost_user_set_owner(struct virtio_uml_device * vu_dev)293*4882a593Smuzhiyun static int vhost_user_set_owner(struct virtio_uml_device *vu_dev)
294*4882a593Smuzhiyun {
295*4882a593Smuzhiyun return vhost_user_send_no_payload(vu_dev, false, VHOST_USER_SET_OWNER);
296*4882a593Smuzhiyun }
297*4882a593Smuzhiyun
/*
 * Query the device with VHOST_USER_GET_FEATURES and store the answer in
 * @features. Returns 0 or a negative error code.
 */
static int vhost_user_get_features(struct virtio_uml_device *vu_dev,
				   u64 *features)
{
	int err;

	/* we read the response ourselves, so no ACK is requested */
	err = vhost_user_send_no_payload(vu_dev, true,
					 VHOST_USER_GET_FEATURES);
	if (err)
		return err;

	err = vhost_user_recv_u64(vu_dev, features);
	return err;
}
308*4882a593Smuzhiyun
/* Send @features with VHOST_USER_SET_FEATURES; returns 0 or an error. */
static int vhost_user_set_features(struct virtio_uml_device *vu_dev,
				   u64 features)
{
	const u32 request = VHOST_USER_SET_FEATURES;

	return vhost_user_send_u64(vu_dev, request, features);
}
314*4882a593Smuzhiyun
/*
 * Query the device with VHOST_USER_GET_PROTOCOL_FEATURES and store the
 * answer in @protocol_features. Returns 0 or a negative error code.
 */
static int vhost_user_get_protocol_features(struct virtio_uml_device *vu_dev,
					    u64 *protocol_features)
{
	int err;

	/* we read the response ourselves, so no ACK is requested */
	err = vhost_user_send_no_payload(vu_dev, true,
					 VHOST_USER_GET_PROTOCOL_FEATURES);
	if (err)
		return err;

	err = vhost_user_recv_u64(vu_dev, protocol_features);
	return err;
}
325*4882a593Smuzhiyun
/*
 * Send @protocol_features with VHOST_USER_SET_PROTOCOL_FEATURES;
 * returns 0 or a negative error code.
 */
static int vhost_user_set_protocol_features(struct virtio_uml_device *vu_dev,
					    u64 protocol_features)
{
	const u32 request = VHOST_USER_SET_PROTOCOL_FEATURES;

	return vhost_user_send_u64(vu_dev, request, protocol_features);
}
332*4882a593Smuzhiyun
vhost_user_reply(struct virtio_uml_device * vu_dev,struct vhost_user_msg * msg,int response)333*4882a593Smuzhiyun static void vhost_user_reply(struct virtio_uml_device *vu_dev,
334*4882a593Smuzhiyun struct vhost_user_msg *msg, int response)
335*4882a593Smuzhiyun {
336*4882a593Smuzhiyun struct vhost_user_msg reply = {
337*4882a593Smuzhiyun .payload.integer = response,
338*4882a593Smuzhiyun };
339*4882a593Smuzhiyun size_t size = sizeof(reply.header) + sizeof(reply.payload.integer);
340*4882a593Smuzhiyun int rc;
341*4882a593Smuzhiyun
342*4882a593Smuzhiyun reply.header = msg->header;
343*4882a593Smuzhiyun reply.header.flags &= ~VHOST_USER_FLAG_NEED_REPLY;
344*4882a593Smuzhiyun reply.header.flags |= VHOST_USER_FLAG_REPLY;
345*4882a593Smuzhiyun reply.header.size = sizeof(reply.payload.integer);
346*4882a593Smuzhiyun
347*4882a593Smuzhiyun rc = full_sendmsg_fds(vu_dev->req_fd, &reply, size, NULL, 0);
348*4882a593Smuzhiyun
349*4882a593Smuzhiyun if (rc)
350*4882a593Smuzhiyun vu_err(vu_dev,
351*4882a593Smuzhiyun "sending reply to slave request failed: %d (size %zu)\n",
352*4882a593Smuzhiyun rc, size);
353*4882a593Smuzhiyun }
354*4882a593Smuzhiyun
/*
 * Interrupt handler for the slave request fd.
 *
 * Reads one request from the device, dispatches it and, if the sender
 * set VHOST_USER_FLAG_NEED_REPLY, answers with 0 when the request was
 * handled or 1 when it was not.
 *
 * @data is the struct virtio_uml_device the IRQ was registered for.
 *
 * Returns IRQ_NONE if no valid request could be received, IRQ_HANDLED
 * otherwise.
 */
static irqreturn_t vu_req_interrupt(int irq, void *data)
{
	struct virtio_uml_device *vu_dev = data;
	struct virtqueue *vq;
	/* reply value: non-zero until a case below handles the request */
	int response = 1;
	/* receive buffer: a regular message plus room for extra payload */
	struct {
		struct vhost_user_msg msg;
		u8 extra_payload[512];
	} msg;
	int rc;

	rc = vhost_user_recv_req(vu_dev, &msg.msg,
				 sizeof(msg.msg.payload) +
				 sizeof(msg.extra_payload));

	if (rc)
		return IRQ_NONE;

	switch (msg.msg.header.request) {
	case VHOST_USER_SLAVE_CONFIG_CHANGE_MSG:
		virtio_config_changed(&vu_dev->vdev);
		response = 0;
		break;
	case VHOST_USER_SLAVE_VRING_CALL:
		/* deliver the interrupt to the queue named in the payload */
		virtio_device_for_each_vq((&vu_dev->vdev), vq) {
			if (vq->index == msg.msg.payload.vring_state.index) {
				response = 0;
				vring_interrupt(0 /* ignored */, vq);
				break;
			}
		}
		break;
	/* the two unsupported requests fall through to the default case */
	case VHOST_USER_SLAVE_IOTLB_MSG:
		/* not supported - VIRTIO_F_ACCESS_PLATFORM */
	case VHOST_USER_SLAVE_VRING_HOST_NOTIFIER_MSG:
		/* not supported - VHOST_USER_PROTOCOL_F_HOST_NOTIFIER */
	default:
		vu_err(vu_dev, "unexpected slave request %d\n",
		       msg.msg.header.request);
	}

	if (msg.msg.header.flags & VHOST_USER_FLAG_NEED_REPLY)
		vhost_user_reply(vu_dev, &msg.msg, response);

	return IRQ_HANDLED;
}
401*4882a593Smuzhiyun
/*
 * Set up the channel on which the device sends requests to us.
 *
 * Creates a pipe, registers vu_req_interrupt() for its read end on
 * VIRTIO_IRQ and hands the write end to the device with
 * VHOST_USER_SET_SLAVE_REQ_FD.
 *
 * Returns 0 on success, otherwise the error of the failing step; on
 * failure the IRQ (if it was registered) is freed and the read end is
 * closed.
 */
static int vhost_user_init_slave_req(struct virtio_uml_device *vu_dev)
{
	int rc, req_fds[2];

	/* Use a pipe for slave req fd, SIGIO is not supported for eventfd */
	rc = os_pipe(req_fds, true, true);
	if (rc < 0)
		return rc;
	/*
	 * NOTE(review): req_fd keeps this value on the error paths below
	 * even though the descriptor is closed there.
	 */
	vu_dev->req_fd = req_fds[0];

	rc = um_request_irq(VIRTIO_IRQ, vu_dev->req_fd, IRQ_READ,
			    vu_req_interrupt, IRQF_SHARED,
			    vu_dev->pdev->name, vu_dev);
	if (rc)
		goto err_close;

	rc = vhost_user_send_no_payload_fd(vu_dev, VHOST_USER_SET_SLAVE_REQ_FD,
					   req_fds[1]);
	if (rc)
		goto err_free_irq;

	/* success: skip the error unwinding, but still close the write end */
	goto out;

err_free_irq:
	um_free_irq(VIRTIO_IRQ, vu_dev);
err_close:
	os_close_file(req_fds[0]);
out:
	/* Close unused write end of request fds */
	os_close_file(req_fds[1]);
	return rc;
}
434*4882a593Smuzhiyun
vhost_user_init(struct virtio_uml_device * vu_dev)435*4882a593Smuzhiyun static int vhost_user_init(struct virtio_uml_device *vu_dev)
436*4882a593Smuzhiyun {
437*4882a593Smuzhiyun int rc = vhost_user_set_owner(vu_dev);
438*4882a593Smuzhiyun
439*4882a593Smuzhiyun if (rc)
440*4882a593Smuzhiyun return rc;
441*4882a593Smuzhiyun rc = vhost_user_get_features(vu_dev, &vu_dev->features);
442*4882a593Smuzhiyun if (rc)
443*4882a593Smuzhiyun return rc;
444*4882a593Smuzhiyun
445*4882a593Smuzhiyun if (vu_dev->features & BIT_ULL(VHOST_USER_F_PROTOCOL_FEATURES)) {
446*4882a593Smuzhiyun rc = vhost_user_get_protocol_features(vu_dev,
447*4882a593Smuzhiyun &vu_dev->protocol_features);
448*4882a593Smuzhiyun if (rc)
449*4882a593Smuzhiyun return rc;
450*4882a593Smuzhiyun vu_dev->protocol_features &= VHOST_USER_SUPPORTED_PROTOCOL_F;
451*4882a593Smuzhiyun rc = vhost_user_set_protocol_features(vu_dev,
452*4882a593Smuzhiyun vu_dev->protocol_features);
453*4882a593Smuzhiyun if (rc)
454*4882a593Smuzhiyun return rc;
455*4882a593Smuzhiyun }
456*4882a593Smuzhiyun
457*4882a593Smuzhiyun if (vu_dev->protocol_features &
458*4882a593Smuzhiyun BIT_ULL(VHOST_USER_PROTOCOL_F_SLAVE_REQ)) {
459*4882a593Smuzhiyun rc = vhost_user_init_slave_req(vu_dev);
460*4882a593Smuzhiyun if (rc)
461*4882a593Smuzhiyun return rc;
462*4882a593Smuzhiyun }
463*4882a593Smuzhiyun
464*4882a593Smuzhiyun return 0;
465*4882a593Smuzhiyun }
466*4882a593Smuzhiyun
/*
 * Read @len bytes at @offset of the device config space into @buf.
 *
 * The config space is requested from offset 0 up to @offset + @len with
 * VHOST_USER_GET_CONFIG and the wanted part is copied out of the
 * response. Does nothing if the CONFIG protocol feature was not
 * negotiated. On any failure @buf is left untouched and, except for an
 * allocation failure, an error is logged.
 */
static void vhost_user_get_config(struct virtio_uml_device *vu_dev,
				  u32 offset, void *buf, u32 len)
{
	u32 cfg_size = offset + len;
	struct vhost_user_msg *msg;
	size_t payload_size = sizeof(msg->payload.config) + cfg_size;
	size_t msg_size = sizeof(msg->header) + payload_size;
	int rc;

	if (!(vu_dev->protocol_features &
	      BIT_ULL(VHOST_USER_PROTOCOL_F_CONFIG)))
		return;

	/*
	 * offset + len wrapped around: the buffer would be sized for the
	 * wrapped value while the copy below would still use offset and len.
	 */
	if (cfg_size < offset) {
		vu_err(vu_dev, "invalid config read: offset %u, len %u\n",
		       offset, len);
		return;
	}

	msg = kzalloc(msg_size, GFP_KERNEL);
	if (!msg)
		return;
	msg->header.request = VHOST_USER_GET_CONFIG;
	msg->header.size = payload_size;
	msg->payload.config.offset = 0;
	msg->payload.config.size = cfg_size;

	rc = vhost_user_send(vu_dev, true, msg, NULL, 0);
	if (rc) {
		vu_err(vu_dev, "sending VHOST_USER_GET_CONFIG failed: %d\n",
		       rc);
		goto free;
	}

	/*
	 * The limit is a payload size: the buffer has room for exactly
	 * payload_size bytes after the header. Passing msg_size here would
	 * let an oversized response be written past the end of the buffer
	 * before the size check below gets a chance to reject it.
	 */
	rc = vhost_user_recv_resp(vu_dev, msg, payload_size);
	if (rc) {
		vu_err(vu_dev,
		       "receiving VHOST_USER_GET_CONFIG response failed: %d\n",
		       rc);
		goto free;
	}

	if (msg->header.size != payload_size ||
	    msg->payload.config.size != cfg_size) {
		rc = -EPROTO;
		vu_err(vu_dev,
		       "Invalid VHOST_USER_GET_CONFIG sizes (payload %d expected %zu, config %u expected %u)\n",
		       msg->header.size, payload_size,
		       msg->payload.config.size, cfg_size);
		goto free;
	}
	memcpy(buf, msg->payload.config.payload + offset, len);

free:
	kfree(msg);
}
517*4882a593Smuzhiyun
/*
 * Write @len bytes from @buf to the device config space at @offset with
 * VHOST_USER_SET_CONFIG.
 *
 * Does nothing if the CONFIG protocol feature was not negotiated or the
 * message cannot be allocated; a send failure is only logged.
 */
static void vhost_user_set_config(struct virtio_uml_device *vu_dev,
				  u32 offset, const void *buf, u32 len)
{
	struct vhost_user_msg *req;
	size_t body_len = sizeof(req->payload.config) + len;
	size_t total_len = sizeof(req->header) + body_len;
	int err;

	if (!(vu_dev->protocol_features &
	      BIT_ULL(VHOST_USER_PROTOCOL_F_CONFIG)))
		return;

	req = kzalloc(total_len, GFP_KERNEL);
	if (!req)
		return;

	req->header.request = VHOST_USER_SET_CONFIG;
	req->header.size = body_len;
	req->payload.config.offset = offset;
	req->payload.config.size = len;
	memcpy(req->payload.config.payload, buf, len);

	err = vhost_user_send(vu_dev, false, req, NULL, 0);
	if (err)
		vu_err(vu_dev, "sending VHOST_USER_SET_CONFIG failed: %d\n",
		       err);

	kfree(req);
}
546*4882a593Smuzhiyun
/*
 * Describe the memory range [@addr, @addr + @size) for the memory table.
 *
 * Looks up the fd and file offset backing @addr, fills @region_out
 * (guest and user address are both @addr) and stores the fd in @fd_out.
 * The last byte of the range must be backed by the same fd.
 *
 * Returns 0 on success, -EFAULT (after a warning) otherwise.
 */
static int vhost_user_init_mem_region(u64 addr, u64 size, int *fd_out,
				      struct vhost_user_mem_region *region_out)
{
	unsigned long long mem_offset;
	int fd, last_fd;

	fd = phys_mapping(addr, &mem_offset);
	if (WARN(fd < 0, "phys_mapping of 0x%llx returned %d\n", addr, fd))
		return -EFAULT;

	*fd_out = fd;
	region_out->guest_addr = addr;
	region_out->user_addr = addr;
	region_out->size = size;
	region_out->mmap_offset = mem_offset;

	/* Ensure mapping is valid for the entire region */
	last_fd = phys_mapping(addr + size - 1, &mem_offset);
	if (WARN(last_fd != *fd_out, "phys_mapping of 0x%llx failed: %d != %d\n",
		 addr + size - 1, last_fd, *fd_out))
		return -EFAULT;

	return 0;
}
568*4882a593Smuzhiyun
/*
 * Tell the device which of our memory it may access, using
 * VHOST_USER_SET_MEM_TABLE.
 *
 * One region covers physical memory from the end of the reserved area up
 * to physmem_size; a second region is added for highmem when there is
 * any. The fd backing each region is passed along with the message.
 *
 * Returns 0 on success or a negative error code.
 */
static int vhost_user_set_mem_table(struct virtio_uml_device *vu_dev)
{
	struct vhost_user_msg msg = {
		.header.request = VHOST_USER_SET_MEM_TABLE,
		.header.size = sizeof(msg.payload.mem_regions),
		.payload.mem_regions.num = 1,
	};
	/* size of the leading part of physmem that is not advertised */
	unsigned long reserved = uml_reserved - uml_physmem;
	/* one fd per region: [0] physmem, [1] highmem (if present) */
	int fds[2];
	int rc;

	/*
	 * This is a bit tricky, see also the comment with setup_physmem().
	 *
	 * Essentially, setup_physmem() uses a file to mmap() our physmem,
	 * but the code and data we *already* have is omitted. To us, this
	 * is no difference, since they both become part of our address
	 * space and memory consumption. To somebody looking in from the
	 * outside, however, it is different because the part of our memory
	 * consumption that's already part of the binary (code/data) is not
	 * mapped from the file, so it's not visible to another mmap from
	 * the file descriptor.
	 *
	 * Thus, don't advertise this space to the vhost-user slave. This
	 * means that the slave will likely abort or similar when we give
	 * it an address from the hidden range, since it's not marked as
	 * a valid address, but at least that way we detect the issue and
	 * don't just have the slave read an all-zeroes buffer from the
	 * shared memory file, or write something there that we can never
	 * see (depending on the direction of the virtqueue traffic.)
	 *
	 * Since we usually don't want to use .text for virtio buffers,
	 * this effectively means that you cannot use
	 *  1) global variables, which are in the .bss and not in the shm
	 *     file-backed memory
	 *  2) the stack in some processes, depending on where they have
	 *     their stack (or maybe only no interrupt stack?)
	 *
	 * The stack is already not typically valid for DMA, so this isn't
	 * much of a restriction, but global variables might be encountered.
	 *
	 * It might be possible to fix it by copying around the data that's
	 * between bss_start and where we map the file now, but it's not
	 * something that you typically encounter with virtio drivers, so
	 * it didn't seem worthwhile.
	 */
	rc = vhost_user_init_mem_region(reserved, physmem_size - reserved,
					&fds[0],
					&msg.payload.mem_regions.regions[0]);

	if (rc < 0)
		return rc;
	if (highmem) {
		/* second region: highmem, starting at end_iomem */
		msg.payload.mem_regions.num++;
		rc = vhost_user_init_mem_region(__pa(end_iomem), highmem,
				&fds[1], &msg.payload.mem_regions.regions[1]);
		if (rc < 0)
			return rc;
	}

	/* the number of fds sent equals the number of regions */
	return vhost_user_send(vu_dev, false, &msg, fds,
			       msg.payload.mem_regions.num);
}
632*4882a593Smuzhiyun
/*
 * Send a vring-state request (@request) for queue @index with the value
 * @num. Returns 0 or a negative error code.
 */
static int vhost_user_set_vring_state(struct virtio_uml_device *vu_dev,
				      u32 request, u32 index, u32 num)
{
	struct vhost_user_msg req = {
		.header.request = request,
		.header.size = sizeof(req.payload.vring_state),
		.payload.vring_state.index = index,
		.payload.vring_state.num = num,
	};
	int err;

	err = vhost_user_send(vu_dev, false, &req, NULL, 0);
	return err;
}
645*4882a593Smuzhiyun
/* Send VHOST_USER_SET_VRING_NUM with the value @num for queue @index. */
static int vhost_user_set_vring_num(struct virtio_uml_device *vu_dev,
				    u32 index, u32 num)
{
	const u32 request = VHOST_USER_SET_VRING_NUM;

	return vhost_user_set_vring_state(vu_dev, request, index, num);
}
652*4882a593Smuzhiyun
/*
 * Issue VHOST_USER_SET_VRING_BASE for queue @index with value @offset.
 * Returns the result of vhost_user_set_vring_state().
 */
static int vhost_user_set_vring_base(struct virtio_uml_device *vu_dev,
				     u32 index, u32 offset)
{
	const u32 request = VHOST_USER_SET_VRING_BASE;

	return vhost_user_set_vring_state(vu_dev, request, index, offset);
}
659*4882a593Smuzhiyun
/*
 * Send VHOST_USER_SET_VRING_ADDR for queue @index, carrying the descriptor,
 * used, avail and log addresses exactly as supplied by the caller.
 *
 * Returns the result of vhost_user_send().
 */
static int vhost_user_set_vring_addr(struct virtio_uml_device *vu_dev,
				     u32 index, u64 desc, u64 used, u64 avail,
				     u64 log)
{
	struct vhost_user_msg req = {
		.header = {
			.request = VHOST_USER_SET_VRING_ADDR,
			.size = sizeof(req.payload.vring_addr),
		},
		.payload.vring_addr = {
			.index = index,
			.desc = desc,
			.used = used,
			.avail = avail,
			.log = log,
		},
	};
	int rc;

	rc = vhost_user_send(vu_dev, false, &req, NULL, 0);
	return rc;
}
676*4882a593Smuzhiyun
/*
 * Send a request that associates a file descriptor with queue @index.
 *
 * The integer payload carries the queue index. When @fd is negative, no
 * descriptor is attached and VHOST_USER_VRING_POLL_MASK is set in the
 * payload instead.
 *
 * Returns -EINVAL if @index has bits outside VHOST_USER_VRING_INDEX_MASK,
 * otherwise the result of vhost_user_send().
 */
static int vhost_user_set_vring_fd(struct virtio_uml_device *vu_dev,
				   u32 request, int index, int fd)
{
	struct vhost_user_msg req = {
		.header = {
			.request = request,
			.size = sizeof(req.payload.integer),
		},
		.payload.integer = index,
	};
	const bool have_fd = fd >= 0;

	if (index & ~VHOST_USER_VRING_INDEX_MASK)
		return -EINVAL;

	if (!have_fd)
		req.payload.integer |= VHOST_USER_VRING_POLL_MASK;

	return vhost_user_send(vu_dev, false, &req,
			       have_fd ? &fd : NULL, have_fd ? 1 : 0);
}
694*4882a593Smuzhiyun
vhost_user_set_vring_call(struct virtio_uml_device * vu_dev,int index,int fd)695*4882a593Smuzhiyun static int vhost_user_set_vring_call(struct virtio_uml_device *vu_dev,
696*4882a593Smuzhiyun int index, int fd)
697*4882a593Smuzhiyun {
698*4882a593Smuzhiyun return vhost_user_set_vring_fd(vu_dev, VHOST_USER_SET_VRING_CALL,
699*4882a593Smuzhiyun index, fd);
700*4882a593Smuzhiyun }
701*4882a593Smuzhiyun
vhost_user_set_vring_kick(struct virtio_uml_device * vu_dev,int index,int fd)702*4882a593Smuzhiyun static int vhost_user_set_vring_kick(struct virtio_uml_device *vu_dev,
703*4882a593Smuzhiyun int index, int fd)
704*4882a593Smuzhiyun {
705*4882a593Smuzhiyun return vhost_user_set_vring_fd(vu_dev, VHOST_USER_SET_VRING_KICK,
706*4882a593Smuzhiyun index, fd);
707*4882a593Smuzhiyun }
708*4882a593Smuzhiyun
/*
 * Enable or disable queue @index via VHOST_USER_SET_VRING_ENABLE.
 *
 * The message is only sent when VHOST_USER_F_PROTOCOL_FEATURES is set in
 * the device features; otherwise this is a no-op that returns 0.
 */
static int vhost_user_set_vring_enable(struct virtio_uml_device *vu_dev,
				       u32 index, bool enable)
{
	const u64 proto_features = BIT_ULL(VHOST_USER_F_PROTOCOL_FEATURES);

	if (vu_dev->features & proto_features)
		return vhost_user_set_vring_state(vu_dev,
						  VHOST_USER_SET_VRING_ENABLE,
						  index, enable);

	return 0;
}
718*4882a593Smuzhiyun
719*4882a593Smuzhiyun
720*4882a593Smuzhiyun /* Virtio interface */
721*4882a593Smuzhiyun
vu_notify(struct virtqueue * vq)722*4882a593Smuzhiyun static bool vu_notify(struct virtqueue *vq)
723*4882a593Smuzhiyun {
724*4882a593Smuzhiyun struct virtio_uml_vq_info *info = vq->priv;
725*4882a593Smuzhiyun const uint64_t n = 1;
726*4882a593Smuzhiyun int rc;
727*4882a593Smuzhiyun
728*4882a593Smuzhiyun time_travel_propagate_time();
729*4882a593Smuzhiyun
730*4882a593Smuzhiyun if (info->kick_fd < 0) {
731*4882a593Smuzhiyun struct virtio_uml_device *vu_dev;
732*4882a593Smuzhiyun
733*4882a593Smuzhiyun vu_dev = to_virtio_uml_device(vq->vdev);
734*4882a593Smuzhiyun
735*4882a593Smuzhiyun return vhost_user_set_vring_state(vu_dev, VHOST_USER_VRING_KICK,
736*4882a593Smuzhiyun vq->index, 0) == 0;
737*4882a593Smuzhiyun }
738*4882a593Smuzhiyun
739*4882a593Smuzhiyun do {
740*4882a593Smuzhiyun rc = os_write_file(info->kick_fd, &n, sizeof(n));
741*4882a593Smuzhiyun } while (rc == -EINTR);
742*4882a593Smuzhiyun return !WARN(rc != sizeof(n), "write returned %d\n", rc);
743*4882a593Smuzhiyun }
744*4882a593Smuzhiyun
vu_interrupt(int irq,void * opaque)745*4882a593Smuzhiyun static irqreturn_t vu_interrupt(int irq, void *opaque)
746*4882a593Smuzhiyun {
747*4882a593Smuzhiyun struct virtqueue *vq = opaque;
748*4882a593Smuzhiyun struct virtio_uml_vq_info *info = vq->priv;
749*4882a593Smuzhiyun uint64_t n;
750*4882a593Smuzhiyun int rc;
751*4882a593Smuzhiyun irqreturn_t ret = IRQ_NONE;
752*4882a593Smuzhiyun
753*4882a593Smuzhiyun do {
754*4882a593Smuzhiyun rc = os_read_file(info->call_fd, &n, sizeof(n));
755*4882a593Smuzhiyun if (rc == sizeof(n))
756*4882a593Smuzhiyun ret |= vring_interrupt(irq, vq);
757*4882a593Smuzhiyun } while (rc == sizeof(n) || rc == -EINTR);
758*4882a593Smuzhiyun WARN(rc != -EAGAIN, "read returned %d\n", rc);
759*4882a593Smuzhiyun return ret;
760*4882a593Smuzhiyun }
761*4882a593Smuzhiyun
762*4882a593Smuzhiyun
/*
 * Config-space read hook: fetch @len bytes at @offset into @buf by
 * delegating to vhost_user_get_config().
 */
static void vu_get(struct virtio_device *vdev, unsigned offset,
		   void *buf, unsigned len)
{
	vhost_user_get_config(to_virtio_uml_device(vdev), offset, buf, len);
}
770*4882a593Smuzhiyun
/*
 * Config-space write hook: push @len bytes from @buf at @offset by
 * delegating to vhost_user_set_config().
 */
static void vu_set(struct virtio_device *vdev, unsigned offset,
		   const void *buf, unsigned len)
{
	vhost_user_set_config(to_virtio_uml_device(vdev), offset, buf, len);
}
778*4882a593Smuzhiyun
vu_get_status(struct virtio_device * vdev)779*4882a593Smuzhiyun static u8 vu_get_status(struct virtio_device *vdev)
780*4882a593Smuzhiyun {
781*4882a593Smuzhiyun struct virtio_uml_device *vu_dev = to_virtio_uml_device(vdev);
782*4882a593Smuzhiyun
783*4882a593Smuzhiyun return vu_dev->status;
784*4882a593Smuzhiyun }
785*4882a593Smuzhiyun
/* Store @status in the driver's per-device structure; nothing is sent. */
static void vu_set_status(struct virtio_device *vdev, u8 status)
{
	to_virtio_uml_device(vdev)->status = status;
}
792*4882a593Smuzhiyun
vu_reset(struct virtio_device * vdev)793*4882a593Smuzhiyun static void vu_reset(struct virtio_device *vdev)
794*4882a593Smuzhiyun {
795*4882a593Smuzhiyun struct virtio_uml_device *vu_dev = to_virtio_uml_device(vdev);
796*4882a593Smuzhiyun
797*4882a593Smuzhiyun vu_dev->status = 0;
798*4882a593Smuzhiyun }
799*4882a593Smuzhiyun
vu_del_vq(struct virtqueue * vq)800*4882a593Smuzhiyun static void vu_del_vq(struct virtqueue *vq)
801*4882a593Smuzhiyun {
802*4882a593Smuzhiyun struct virtio_uml_vq_info *info = vq->priv;
803*4882a593Smuzhiyun
804*4882a593Smuzhiyun if (info->call_fd >= 0) {
805*4882a593Smuzhiyun um_free_irq(VIRTIO_IRQ, vq);
806*4882a593Smuzhiyun os_close_file(info->call_fd);
807*4882a593Smuzhiyun }
808*4882a593Smuzhiyun
809*4882a593Smuzhiyun if (info->kick_fd >= 0)
810*4882a593Smuzhiyun os_close_file(info->kick_fd);
811*4882a593Smuzhiyun
812*4882a593Smuzhiyun vring_del_virtqueue(vq);
813*4882a593Smuzhiyun kfree(info);
814*4882a593Smuzhiyun }
815*4882a593Smuzhiyun
vu_del_vqs(struct virtio_device * vdev)816*4882a593Smuzhiyun static void vu_del_vqs(struct virtio_device *vdev)
817*4882a593Smuzhiyun {
818*4882a593Smuzhiyun struct virtio_uml_device *vu_dev = to_virtio_uml_device(vdev);
819*4882a593Smuzhiyun struct virtqueue *vq, *n;
820*4882a593Smuzhiyun u64 features;
821*4882a593Smuzhiyun
822*4882a593Smuzhiyun /* Note: reverse order as a workaround to a decoding bug in snabb */
823*4882a593Smuzhiyun list_for_each_entry_reverse(vq, &vdev->vqs, list)
824*4882a593Smuzhiyun WARN_ON(vhost_user_set_vring_enable(vu_dev, vq->index, false));
825*4882a593Smuzhiyun
826*4882a593Smuzhiyun /* Ensure previous messages have been processed */
827*4882a593Smuzhiyun WARN_ON(vhost_user_get_features(vu_dev, &features));
828*4882a593Smuzhiyun
829*4882a593Smuzhiyun list_for_each_entry_safe(vq, n, &vdev->vqs, list)
830*4882a593Smuzhiyun vu_del_vq(vq);
831*4882a593Smuzhiyun }
832*4882a593Smuzhiyun
vu_setup_vq_call_fd(struct virtio_uml_device * vu_dev,struct virtqueue * vq)833*4882a593Smuzhiyun static int vu_setup_vq_call_fd(struct virtio_uml_device *vu_dev,
834*4882a593Smuzhiyun struct virtqueue *vq)
835*4882a593Smuzhiyun {
836*4882a593Smuzhiyun struct virtio_uml_vq_info *info = vq->priv;
837*4882a593Smuzhiyun int call_fds[2];
838*4882a593Smuzhiyun int rc;
839*4882a593Smuzhiyun
840*4882a593Smuzhiyun /* no call FD needed/desired in this case */
841*4882a593Smuzhiyun if (vu_dev->protocol_features &
842*4882a593Smuzhiyun BIT_ULL(VHOST_USER_PROTOCOL_F_INBAND_NOTIFICATIONS) &&
843*4882a593Smuzhiyun vu_dev->protocol_features &
844*4882a593Smuzhiyun BIT_ULL(VHOST_USER_PROTOCOL_F_SLAVE_REQ)) {
845*4882a593Smuzhiyun info->call_fd = -1;
846*4882a593Smuzhiyun return 0;
847*4882a593Smuzhiyun }
848*4882a593Smuzhiyun
849*4882a593Smuzhiyun /* Use a pipe for call fd, since SIGIO is not supported for eventfd */
850*4882a593Smuzhiyun rc = os_pipe(call_fds, true, true);
851*4882a593Smuzhiyun if (rc < 0)
852*4882a593Smuzhiyun return rc;
853*4882a593Smuzhiyun
854*4882a593Smuzhiyun info->call_fd = call_fds[0];
855*4882a593Smuzhiyun rc = um_request_irq(VIRTIO_IRQ, info->call_fd, IRQ_READ,
856*4882a593Smuzhiyun vu_interrupt, IRQF_SHARED, info->name, vq);
857*4882a593Smuzhiyun if (rc)
858*4882a593Smuzhiyun goto close_both;
859*4882a593Smuzhiyun
860*4882a593Smuzhiyun rc = vhost_user_set_vring_call(vu_dev, vq->index, call_fds[1]);
861*4882a593Smuzhiyun if (rc)
862*4882a593Smuzhiyun goto release_irq;
863*4882a593Smuzhiyun
864*4882a593Smuzhiyun goto out;
865*4882a593Smuzhiyun
866*4882a593Smuzhiyun release_irq:
867*4882a593Smuzhiyun um_free_irq(VIRTIO_IRQ, vq);
868*4882a593Smuzhiyun close_both:
869*4882a593Smuzhiyun os_close_file(call_fds[0]);
870*4882a593Smuzhiyun out:
871*4882a593Smuzhiyun /* Close (unused) write end of call fds */
872*4882a593Smuzhiyun os_close_file(call_fds[1]);
873*4882a593Smuzhiyun
874*4882a593Smuzhiyun return rc;
875*4882a593Smuzhiyun }
876*4882a593Smuzhiyun
877*4882a593Smuzhiyun #ifdef CONFIG_UML_TIME_TRAVEL_SUPPORT
vu_defer_irq_handle(struct time_travel_event * d)878*4882a593Smuzhiyun static void vu_defer_irq_handle(struct time_travel_event *d)
879*4882a593Smuzhiyun {
880*4882a593Smuzhiyun struct virtio_uml_vq_info *info;
881*4882a593Smuzhiyun
882*4882a593Smuzhiyun info = container_of(d, struct virtio_uml_vq_info, defer);
883*4882a593Smuzhiyun info->callback(info->vq);
884*4882a593Smuzhiyun }
885*4882a593Smuzhiyun
vu_defer_irq_callback(struct virtqueue * vq)886*4882a593Smuzhiyun static void vu_defer_irq_callback(struct virtqueue *vq)
887*4882a593Smuzhiyun {
888*4882a593Smuzhiyun struct virtio_uml_vq_info *info = vq->priv;
889*4882a593Smuzhiyun
890*4882a593Smuzhiyun time_travel_add_irq_event(&info->defer);
891*4882a593Smuzhiyun }
892*4882a593Smuzhiyun #endif
893*4882a593Smuzhiyun
/*
 * Create and configure one virtqueue.
 *
 * Allocates the per-queue info, names it "<pdev name>.<pdev id>-<name>",
 * creates the vring (requesting up to MAX_SUPPORTED_QUEUE_SIZE entries),
 * sets up the kick and call notification paths and finally tells the
 * device the ring size, base index and ring addresses.
 *
 * Returns the new virtqueue, or an ERR_PTR() with everything that had been
 * set up so far undone.
 */
static struct virtqueue *vu_setup_vq(struct virtio_device *vdev,
				     unsigned index, vq_callback_t *callback,
				     const char *name, bool ctx)
{
	struct virtio_uml_device *vu_dev = to_virtio_uml_device(vdev);
	struct platform_device *pdev = vu_dev->pdev;
	struct virtio_uml_vq_info *vq_info;
	struct virtqueue *vq;
	int ring_size = MAX_SUPPORTED_QUEUE_SIZE;
	int err;

	vq_info = kzalloc(sizeof(*vq_info), GFP_KERNEL);
	if (!vq_info)
		return ERR_PTR(-ENOMEM);

	snprintf(vq_info->name, sizeof(vq_info->name), "%s.%d-%s",
		 pdev->name, pdev->id, name);

#ifdef CONFIG_UML_TIME_TRAVEL_SUPPORT
	/*
	 * When we get an interrupt, we must bounce it through the simulation
	 * calendar (the simtime device), except for the simtime device itself
	 * since that's part of the simulation control.
	 */
	if (time_travel_mode == TT_MODE_EXTERNAL && callback) {
		vq_info->callback = callback;
		callback = vu_defer_irq_callback;
		time_travel_set_event_fn(&vq_info->defer, vu_defer_irq_handle);
	}
#endif

	vq = vring_create_virtqueue(index, ring_size, PAGE_SIZE, vdev, true,
				    true, ctx, vu_notify, callback,
				    vq_info->name);
	if (!vq) {
		err = -ENOMEM;
		goto free_info;
	}
	vq->priv = vq_info;
	/* Use the size the vring actually ended up with from here on. */
	ring_size = virtqueue_get_vring_size(vq);
#ifdef CONFIG_UML_TIME_TRAVEL_SUPPORT
	vq_info->vq = vq;
#endif

	if (!(vu_dev->protocol_features &
	      BIT_ULL(VHOST_USER_PROTOCOL_F_INBAND_NOTIFICATIONS))) {
		err = os_eventfd(0, 0);
		if (err < 0)
			goto del_vring;
		vq_info->kick_fd = err;
	} else {
		/* Kicks are sent as messages; see vu_notify(). */
		vq_info->kick_fd = -1;
	}

	err = vu_setup_vq_call_fd(vu_dev, vq);
	if (err)
		goto close_kick;

	err = vhost_user_set_vring_num(vu_dev, index, ring_size);
	if (!err)
		err = vhost_user_set_vring_base(vu_dev, index, 0);
	if (!err)
		err = vhost_user_set_vring_addr(vu_dev, index,
						virtqueue_get_desc_addr(vq),
						virtqueue_get_used_addr(vq),
						virtqueue_get_avail_addr(vq),
						(u64) -1);
	if (err)
		goto undo_call;

	return vq;

undo_call:
	if (vq_info->call_fd >= 0) {
		um_free_irq(VIRTIO_IRQ, vq);
		os_close_file(vq_info->call_fd);
	}
close_kick:
	if (vq_info->kick_fd >= 0)
		os_close_file(vq_info->kick_fd);
del_vring:
	vring_del_virtqueue(vq);
free_info:
	kfree(vq_info);
	return ERR_PTR(err);
}
985*4882a593Smuzhiyun
/*
 * find_vqs hook: create all requested virtqueues.
 *
 * The memory table is sent first. Each entry with a non-NULL name gets a
 * queue, numbered consecutively from 0 (entries with a NULL name are
 * skipped and reported as NULL in @vqs). Once every queue exists, each one
 * gets its kick descriptor registered (if it has one) and is enabled.
 *
 * Returns 0 on success. On any failure after the memory table was set, all
 * queues created so far are deleted and the error is returned.
 */
static int vu_find_vqs(struct virtio_device *vdev, unsigned nvqs,
		       struct virtqueue *vqs[], vq_callback_t *callbacks[],
		       const char * const names[], const bool *ctx,
		       struct irq_affinity *desc)
{
	struct virtio_uml_device *vu_dev = to_virtio_uml_device(vdev);
	struct virtqueue *vq;
	int next_queue = 0;
	int i, err;

	err = vhost_user_set_mem_table(vu_dev);
	if (err)
		return err;

	for (i = 0; i < nvqs; ++i) {
		const char *vq_name = names[i];

		if (!vq_name) {
			vqs[i] = NULL;
			continue;
		}

		vq = vu_setup_vq(vdev, next_queue++, callbacks[i], vq_name,
				 ctx ? ctx[i] : false);
		vqs[i] = vq;
		if (IS_ERR(vq)) {
			err = PTR_ERR(vq);
			goto teardown;
		}
	}

	list_for_each_entry(vq, &vdev->vqs, list) {
		struct virtio_uml_vq_info *vq_info = vq->priv;

		err = 0;
		if (vq_info->kick_fd >= 0)
			err = vhost_user_set_vring_kick(vu_dev, vq->index,
							vq_info->kick_fd);
		if (!err)
			err = vhost_user_set_vring_enable(vu_dev, vq->index,
							  true);
		if (err)
			goto teardown;
	}

	return 0;

teardown:
	vu_del_vqs(vdev);
	return err;
}
1034*4882a593Smuzhiyun
vu_get_features(struct virtio_device * vdev)1035*4882a593Smuzhiyun static u64 vu_get_features(struct virtio_device *vdev)
1036*4882a593Smuzhiyun {
1037*4882a593Smuzhiyun struct virtio_uml_device *vu_dev = to_virtio_uml_device(vdev);
1038*4882a593Smuzhiyun
1039*4882a593Smuzhiyun return vu_dev->features;
1040*4882a593Smuzhiyun }
1041*4882a593Smuzhiyun
vu_finalize_features(struct virtio_device * vdev)1042*4882a593Smuzhiyun static int vu_finalize_features(struct virtio_device *vdev)
1043*4882a593Smuzhiyun {
1044*4882a593Smuzhiyun struct virtio_uml_device *vu_dev = to_virtio_uml_device(vdev);
1045*4882a593Smuzhiyun u64 supported = vdev->features & VHOST_USER_SUPPORTED_F;
1046*4882a593Smuzhiyun
1047*4882a593Smuzhiyun vring_transport_features(vdev);
1048*4882a593Smuzhiyun vu_dev->features = vdev->features | supported;
1049*4882a593Smuzhiyun
1050*4882a593Smuzhiyun return vhost_user_set_features(vu_dev, vu_dev->features);
1051*4882a593Smuzhiyun }
1052*4882a593Smuzhiyun
vu_bus_name(struct virtio_device * vdev)1053*4882a593Smuzhiyun static const char *vu_bus_name(struct virtio_device *vdev)
1054*4882a593Smuzhiyun {
1055*4882a593Smuzhiyun struct virtio_uml_device *vu_dev = to_virtio_uml_device(vdev);
1056*4882a593Smuzhiyun
1057*4882a593Smuzhiyun return vu_dev->pdev->name;
1058*4882a593Smuzhiyun }
1059*4882a593Smuzhiyun
1060*4882a593Smuzhiyun static const struct virtio_config_ops virtio_uml_config_ops = {
1061*4882a593Smuzhiyun .get = vu_get,
1062*4882a593Smuzhiyun .set = vu_set,
1063*4882a593Smuzhiyun .get_status = vu_get_status,
1064*4882a593Smuzhiyun .set_status = vu_set_status,
1065*4882a593Smuzhiyun .reset = vu_reset,
1066*4882a593Smuzhiyun .find_vqs = vu_find_vqs,
1067*4882a593Smuzhiyun .del_vqs = vu_del_vqs,
1068*4882a593Smuzhiyun .get_features = vu_get_features,
1069*4882a593Smuzhiyun .finalize_features = vu_finalize_features,
1070*4882a593Smuzhiyun .bus_name = vu_bus_name,
1071*4882a593Smuzhiyun };
1072*4882a593Smuzhiyun
virtio_uml_release_dev(struct device * d)1073*4882a593Smuzhiyun static void virtio_uml_release_dev(struct device *d)
1074*4882a593Smuzhiyun {
1075*4882a593Smuzhiyun struct virtio_device *vdev =
1076*4882a593Smuzhiyun container_of(d, struct virtio_device, dev);
1077*4882a593Smuzhiyun struct virtio_uml_device *vu_dev = to_virtio_uml_device(vdev);
1078*4882a593Smuzhiyun
1079*4882a593Smuzhiyun time_travel_propagate_time();
1080*4882a593Smuzhiyun
1081*4882a593Smuzhiyun /* might not have been opened due to not negotiating the feature */
1082*4882a593Smuzhiyun if (vu_dev->req_fd >= 0) {
1083*4882a593Smuzhiyun um_free_irq(VIRTIO_IRQ, vu_dev);
1084*4882a593Smuzhiyun os_close_file(vu_dev->req_fd);
1085*4882a593Smuzhiyun }
1086*4882a593Smuzhiyun
1087*4882a593Smuzhiyun os_close_file(vu_dev->sock);
1088*4882a593Smuzhiyun kfree(vu_dev);
1089*4882a593Smuzhiyun }
1090*4882a593Smuzhiyun
1091*4882a593Smuzhiyun /* Platform device */
1092*4882a593Smuzhiyun
virtio_uml_probe(struct platform_device * pdev)1093*4882a593Smuzhiyun static int virtio_uml_probe(struct platform_device *pdev)
1094*4882a593Smuzhiyun {
1095*4882a593Smuzhiyun struct virtio_uml_platform_data *pdata = pdev->dev.platform_data;
1096*4882a593Smuzhiyun struct virtio_uml_device *vu_dev;
1097*4882a593Smuzhiyun int rc;
1098*4882a593Smuzhiyun
1099*4882a593Smuzhiyun if (!pdata)
1100*4882a593Smuzhiyun return -EINVAL;
1101*4882a593Smuzhiyun
1102*4882a593Smuzhiyun vu_dev = kzalloc(sizeof(*vu_dev), GFP_KERNEL);
1103*4882a593Smuzhiyun if (!vu_dev)
1104*4882a593Smuzhiyun return -ENOMEM;
1105*4882a593Smuzhiyun
1106*4882a593Smuzhiyun vu_dev->vdev.dev.parent = &pdev->dev;
1107*4882a593Smuzhiyun vu_dev->vdev.dev.release = virtio_uml_release_dev;
1108*4882a593Smuzhiyun vu_dev->vdev.config = &virtio_uml_config_ops;
1109*4882a593Smuzhiyun vu_dev->vdev.id.device = pdata->virtio_device_id;
1110*4882a593Smuzhiyun vu_dev->vdev.id.vendor = VIRTIO_DEV_ANY_ID;
1111*4882a593Smuzhiyun vu_dev->pdev = pdev;
1112*4882a593Smuzhiyun vu_dev->req_fd = -1;
1113*4882a593Smuzhiyun
1114*4882a593Smuzhiyun time_travel_propagate_time();
1115*4882a593Smuzhiyun
1116*4882a593Smuzhiyun do {
1117*4882a593Smuzhiyun rc = os_connect_socket(pdata->socket_path);
1118*4882a593Smuzhiyun } while (rc == -EINTR);
1119*4882a593Smuzhiyun if (rc < 0)
1120*4882a593Smuzhiyun goto error_free;
1121*4882a593Smuzhiyun vu_dev->sock = rc;
1122*4882a593Smuzhiyun
1123*4882a593Smuzhiyun spin_lock_init(&vu_dev->sock_lock);
1124*4882a593Smuzhiyun
1125*4882a593Smuzhiyun rc = vhost_user_init(vu_dev);
1126*4882a593Smuzhiyun if (rc)
1127*4882a593Smuzhiyun goto error_init;
1128*4882a593Smuzhiyun
1129*4882a593Smuzhiyun platform_set_drvdata(pdev, vu_dev);
1130*4882a593Smuzhiyun
1131*4882a593Smuzhiyun rc = register_virtio_device(&vu_dev->vdev);
1132*4882a593Smuzhiyun if (rc)
1133*4882a593Smuzhiyun put_device(&vu_dev->vdev.dev);
1134*4882a593Smuzhiyun vu_dev->registered = 1;
1135*4882a593Smuzhiyun return rc;
1136*4882a593Smuzhiyun
1137*4882a593Smuzhiyun error_init:
1138*4882a593Smuzhiyun os_close_file(vu_dev->sock);
1139*4882a593Smuzhiyun error_free:
1140*4882a593Smuzhiyun kfree(vu_dev);
1141*4882a593Smuzhiyun return rc;
1142*4882a593Smuzhiyun }
1143*4882a593Smuzhiyun
virtio_uml_remove(struct platform_device * pdev)1144*4882a593Smuzhiyun static int virtio_uml_remove(struct platform_device *pdev)
1145*4882a593Smuzhiyun {
1146*4882a593Smuzhiyun struct virtio_uml_device *vu_dev = platform_get_drvdata(pdev);
1147*4882a593Smuzhiyun
1148*4882a593Smuzhiyun unregister_virtio_device(&vu_dev->vdev);
1149*4882a593Smuzhiyun return 0;
1150*4882a593Smuzhiyun }
1151*4882a593Smuzhiyun
1152*4882a593Smuzhiyun /* Command line device list */
1153*4882a593Smuzhiyun
/* Release callback for the static command-line parent device. */
static void vu_cmdline_release_dev(struct device *d)
{
	/* Intentionally empty: vu_cmdline_parent is a static object. */
}
1157*4882a593Smuzhiyun
1158*4882a593Smuzhiyun static struct device vu_cmdline_parent = {
1159*4882a593Smuzhiyun .init_name = "virtio-uml-cmdline",
1160*4882a593Smuzhiyun .release = vu_cmdline_release_dev,
1161*4882a593Smuzhiyun };
1162*4882a593Smuzhiyun
1163*4882a593Smuzhiyun static bool vu_cmdline_parent_registered;
1164*4882a593Smuzhiyun static int vu_cmdline_id;
1165*4882a593Smuzhiyun
vu_unregister_cmdline_device(struct device * dev,void * data)1166*4882a593Smuzhiyun static int vu_unregister_cmdline_device(struct device *dev, void *data)
1167*4882a593Smuzhiyun {
1168*4882a593Smuzhiyun struct platform_device *pdev = to_platform_device(dev);
1169*4882a593Smuzhiyun struct virtio_uml_platform_data *pdata = pdev->dev.platform_data;
1170*4882a593Smuzhiyun
1171*4882a593Smuzhiyun kfree(pdata->socket_path);
1172*4882a593Smuzhiyun platform_device_unregister(pdev);
1173*4882a593Smuzhiyun return 0;
1174*4882a593Smuzhiyun }
1175*4882a593Smuzhiyun
vu_conn_broken(struct work_struct * wk)1176*4882a593Smuzhiyun static void vu_conn_broken(struct work_struct *wk)
1177*4882a593Smuzhiyun {
1178*4882a593Smuzhiyun struct virtio_uml_platform_data *pdata;
1179*4882a593Smuzhiyun
1180*4882a593Smuzhiyun pdata = container_of(wk, struct virtio_uml_platform_data, conn_broken_wk);
1181*4882a593Smuzhiyun vu_unregister_cmdline_device(&pdata->pdev->dev, NULL);
1182*4882a593Smuzhiyun }
1183*4882a593Smuzhiyun
vu_cmdline_set(const char * device,const struct kernel_param * kp)1184*4882a593Smuzhiyun static int vu_cmdline_set(const char *device, const struct kernel_param *kp)
1185*4882a593Smuzhiyun {
1186*4882a593Smuzhiyun const char *ids = strchr(device, ':');
1187*4882a593Smuzhiyun unsigned int virtio_device_id;
1188*4882a593Smuzhiyun int processed, consumed, err;
1189*4882a593Smuzhiyun char *socket_path;
1190*4882a593Smuzhiyun struct virtio_uml_platform_data pdata, *ppdata;
1191*4882a593Smuzhiyun struct platform_device *pdev;
1192*4882a593Smuzhiyun
1193*4882a593Smuzhiyun if (!ids || ids == device)
1194*4882a593Smuzhiyun return -EINVAL;
1195*4882a593Smuzhiyun
1196*4882a593Smuzhiyun processed = sscanf(ids, ":%u%n:%d%n",
1197*4882a593Smuzhiyun &virtio_device_id, &consumed,
1198*4882a593Smuzhiyun &vu_cmdline_id, &consumed);
1199*4882a593Smuzhiyun
1200*4882a593Smuzhiyun if (processed < 1 || ids[consumed])
1201*4882a593Smuzhiyun return -EINVAL;
1202*4882a593Smuzhiyun
1203*4882a593Smuzhiyun if (!vu_cmdline_parent_registered) {
1204*4882a593Smuzhiyun err = device_register(&vu_cmdline_parent);
1205*4882a593Smuzhiyun if (err) {
1206*4882a593Smuzhiyun pr_err("Failed to register parent device!\n");
1207*4882a593Smuzhiyun put_device(&vu_cmdline_parent);
1208*4882a593Smuzhiyun return err;
1209*4882a593Smuzhiyun }
1210*4882a593Smuzhiyun vu_cmdline_parent_registered = true;
1211*4882a593Smuzhiyun }
1212*4882a593Smuzhiyun
1213*4882a593Smuzhiyun socket_path = kmemdup_nul(device, ids - device, GFP_KERNEL);
1214*4882a593Smuzhiyun if (!socket_path)
1215*4882a593Smuzhiyun return -ENOMEM;
1216*4882a593Smuzhiyun
1217*4882a593Smuzhiyun pdata.virtio_device_id = (u32) virtio_device_id;
1218*4882a593Smuzhiyun pdata.socket_path = socket_path;
1219*4882a593Smuzhiyun
1220*4882a593Smuzhiyun pr_info("Registering device virtio-uml.%d id=%d at %s\n",
1221*4882a593Smuzhiyun vu_cmdline_id, virtio_device_id, socket_path);
1222*4882a593Smuzhiyun
1223*4882a593Smuzhiyun pdev = platform_device_register_data(&vu_cmdline_parent, "virtio-uml",
1224*4882a593Smuzhiyun vu_cmdline_id++, &pdata,
1225*4882a593Smuzhiyun sizeof(pdata));
1226*4882a593Smuzhiyun err = PTR_ERR_OR_ZERO(pdev);
1227*4882a593Smuzhiyun if (err)
1228*4882a593Smuzhiyun goto free;
1229*4882a593Smuzhiyun
1230*4882a593Smuzhiyun ppdata = pdev->dev.platform_data;
1231*4882a593Smuzhiyun ppdata->pdev = pdev;
1232*4882a593Smuzhiyun INIT_WORK(&ppdata->conn_broken_wk, vu_conn_broken);
1233*4882a593Smuzhiyun
1234*4882a593Smuzhiyun return 0;
1235*4882a593Smuzhiyun
1236*4882a593Smuzhiyun free:
1237*4882a593Smuzhiyun kfree(socket_path);
1238*4882a593Smuzhiyun return err;
1239*4882a593Smuzhiyun }
1240*4882a593Smuzhiyun
vu_cmdline_get_device(struct device * dev,void * data)1241*4882a593Smuzhiyun static int vu_cmdline_get_device(struct device *dev, void *data)
1242*4882a593Smuzhiyun {
1243*4882a593Smuzhiyun struct platform_device *pdev = to_platform_device(dev);
1244*4882a593Smuzhiyun struct virtio_uml_platform_data *pdata = pdev->dev.platform_data;
1245*4882a593Smuzhiyun char *buffer = data;
1246*4882a593Smuzhiyun unsigned int len = strlen(buffer);
1247*4882a593Smuzhiyun
1248*4882a593Smuzhiyun snprintf(buffer + len, PAGE_SIZE - len, "%s:%d:%d\n",
1249*4882a593Smuzhiyun pdata->socket_path, pdata->virtio_device_id, pdev->id);
1250*4882a593Smuzhiyun return 0;
1251*4882a593Smuzhiyun }
1252*4882a593Smuzhiyun
vu_cmdline_get(char * buffer,const struct kernel_param * kp)1253*4882a593Smuzhiyun static int vu_cmdline_get(char *buffer, const struct kernel_param *kp)
1254*4882a593Smuzhiyun {
1255*4882a593Smuzhiyun buffer[0] = '\0';
1256*4882a593Smuzhiyun if (vu_cmdline_parent_registered)
1257*4882a593Smuzhiyun device_for_each_child(&vu_cmdline_parent, buffer,
1258*4882a593Smuzhiyun vu_cmdline_get_device);
1259*4882a593Smuzhiyun return strlen(buffer) + 1;
1260*4882a593Smuzhiyun }
1261*4882a593Smuzhiyun
1262*4882a593Smuzhiyun static const struct kernel_param_ops vu_cmdline_param_ops = {
1263*4882a593Smuzhiyun .set = vu_cmdline_set,
1264*4882a593Smuzhiyun .get = vu_cmdline_get,
1265*4882a593Smuzhiyun };
1266*4882a593Smuzhiyun
1267*4882a593Smuzhiyun device_param_cb(device, &vu_cmdline_param_ops, NULL, S_IRUSR);
1268*4882a593Smuzhiyun __uml_help(vu_cmdline_param_ops,
1269*4882a593Smuzhiyun "virtio_uml.device=<socket>:<virtio_id>[:<platform_id>]\n"
1270*4882a593Smuzhiyun " Configure a virtio device over a vhost-user socket.\n"
1271*4882a593Smuzhiyun " See virtio_ids.h for a list of possible virtio device id values.\n"
1272*4882a593Smuzhiyun " Optionally use a specific platform_device id.\n\n"
1273*4882a593Smuzhiyun );
1274*4882a593Smuzhiyun
1275*4882a593Smuzhiyun
vu_unregister_cmdline_devices(void)1276*4882a593Smuzhiyun static void vu_unregister_cmdline_devices(void)
1277*4882a593Smuzhiyun {
1278*4882a593Smuzhiyun if (vu_cmdline_parent_registered) {
1279*4882a593Smuzhiyun device_for_each_child(&vu_cmdline_parent, NULL,
1280*4882a593Smuzhiyun vu_unregister_cmdline_device);
1281*4882a593Smuzhiyun device_unregister(&vu_cmdline_parent);
1282*4882a593Smuzhiyun vu_cmdline_parent_registered = false;
1283*4882a593Smuzhiyun }
1284*4882a593Smuzhiyun }
1285*4882a593Smuzhiyun
1286*4882a593Smuzhiyun /* Platform driver */
1287*4882a593Smuzhiyun
1288*4882a593Smuzhiyun static const struct of_device_id virtio_uml_match[] = {
1289*4882a593Smuzhiyun { .compatible = "virtio,uml", },
1290*4882a593Smuzhiyun { }
1291*4882a593Smuzhiyun };
1292*4882a593Smuzhiyun MODULE_DEVICE_TABLE(of, virtio_uml_match);
1293*4882a593Smuzhiyun
1294*4882a593Smuzhiyun static struct platform_driver virtio_uml_driver = {
1295*4882a593Smuzhiyun .probe = virtio_uml_probe,
1296*4882a593Smuzhiyun .remove = virtio_uml_remove,
1297*4882a593Smuzhiyun .driver = {
1298*4882a593Smuzhiyun .name = "virtio-uml",
1299*4882a593Smuzhiyun .of_match_table = virtio_uml_match,
1300*4882a593Smuzhiyun },
1301*4882a593Smuzhiyun };
1302*4882a593Smuzhiyun
virtio_uml_init(void)1303*4882a593Smuzhiyun static int __init virtio_uml_init(void)
1304*4882a593Smuzhiyun {
1305*4882a593Smuzhiyun return platform_driver_register(&virtio_uml_driver);
1306*4882a593Smuzhiyun }
1307*4882a593Smuzhiyun
virtio_uml_exit(void)1308*4882a593Smuzhiyun static void __exit virtio_uml_exit(void)
1309*4882a593Smuzhiyun {
1310*4882a593Smuzhiyun platform_driver_unregister(&virtio_uml_driver);
1311*4882a593Smuzhiyun vu_unregister_cmdline_devices();
1312*4882a593Smuzhiyun }
1313*4882a593Smuzhiyun
1314*4882a593Smuzhiyun module_init(virtio_uml_init);
1315*4882a593Smuzhiyun module_exit(virtio_uml_exit);
1316*4882a593Smuzhiyun __uml_exitcall(virtio_uml_exit);
1317*4882a593Smuzhiyun
1318*4882a593Smuzhiyun MODULE_DESCRIPTION("UML driver for vhost-user virtio devices");
1319*4882a593Smuzhiyun MODULE_LICENSE("GPL");
1320