]> git.proxmox.com Git - qemu.git/blame - hw/virtio-pci.c
vhost: force vhost off for non-MSI guests
[qemu.git] / hw / virtio-pci.c
CommitLineData
53c25cea
PB
1/*
2 * Virtio PCI Bindings
3 *
4 * Copyright IBM, Corp. 2007
5 * Copyright (c) 2009 CodeSourcery
6 *
7 * Authors:
8 * Anthony Liguori <aliguori@us.ibm.com>
9 * Paul Brook <paul@codesourcery.com>
10 *
11 * This work is licensed under the terms of the GNU GPL, version 2. See
12 * the COPYING file in the top-level directory.
13 *
14 */
15
16#include <inttypes.h>
17
18#include "virtio.h"
8172539d
MT
19#include "virtio-blk.h"
20#include "virtio-net.h"
53c25cea 21#include "pci.h"
2f792016 22#include "qemu-error.h"
aba800a3 23#include "msix.h"
a1e0fea5 24#include "net.h"
97b15621 25#include "loader.h"
ade80dc8 26#include "kvm.h"
2446333c 27#include "blockdev.h"
53c25cea
PB
28
/*
 * Register layout taken from Linux's linux/virtio_pci.h.  The values are
 * offsets relative to the start of the device's I/O region.
 */

/* 32-bit, read-only: feature bits supported by the host */
#define VIRTIO_PCI_HOST_FEATURES        0

/* 32-bit, read/write: feature bits activated by the guest */
#define VIRTIO_PCI_GUEST_FEATURES       4

/* 32-bit, read/write: PFN of the currently selected queue */
#define VIRTIO_PCI_QUEUE_PFN            8

/* 16-bit, read-only: size of the currently selected queue */
#define VIRTIO_PCI_QUEUE_NUM            12

/* 16-bit, read/write: queue selector */
#define VIRTIO_PCI_QUEUE_SEL            14

/* 16-bit, read/write: queue notifier */
#define VIRTIO_PCI_QUEUE_NOTIFY         16

/* 8-bit: device status register */
#define VIRTIO_PCI_STATUS               18

/* 8-bit, read-only: interrupt status.  A read returns the current ISR
 * contents and clears them, i.e. it is a combined read-and-acknowledge. */
#define VIRTIO_PCI_ISR                  19

/* MSI-X registers; only part of the layout while MSI-X is enabled. */
/* 16-bit: vector used for configuration change notifications */
#define VIRTIO_MSI_CONFIG_VECTOR        20
/* 16-bit: vector used for notifications of the selected queue */
#define VIRTIO_MSI_QUEUE_VECTOR         22

/* Size of the register header without / with the MSI-X registers */
#define VIRTIO_PCI_CONFIG_NOMSI         20
#define VIRTIO_PCI_CONFIG_MSI           24
#define VIRTIO_PCI_REGION_SIZE(dev)     (msix_present(dev) ? \
                                         VIRTIO_PCI_CONFIG_MSI : \
                                         VIRTIO_PCI_CONFIG_NOMSI)

/* Everything after the header is the per-driver configuration space; its
 * start depends on whether MSI-X is currently enabled. */
#define VIRTIO_PCI_CONFIG(dev)          (msix_enabled(dev) ? \
                                         VIRTIO_PCI_CONFIG_MSI : \
                                         VIRTIO_PCI_CONFIG_NOMSI)

/* Virtio ABI version.  Incrementing it breaks the guest driver. */
#define VIRTIO_PCI_ABI_VERSION          0

/* Number of bits the value written to QUEUE_PFN is shifted left by to get
 * the physical queue address.  12 is historical (x86 page size). */
#define VIRTIO_PCI_QUEUE_ADDR_SHIFT     12

/* Per-device flags, e.g. workarounds for quirks in older guests. */
#define VIRTIO_PCI_FLAG_BUS_MASTER_BUG  (1 << 0)

/* For some devices performance improves when virtqueue kicks are handled
 * outside the vcpu thread by means of ioeventfd. */
#define VIRTIO_PCI_FLAG_USE_IOEVENTFD_BIT 1
#define VIRTIO_PCI_FLAG_USE_IOEVENTFD   (1 << VIRTIO_PCI_FLAG_USE_IOEVENTFD_BIT)

/* Write barriers are not strictly required because QEMU runs everything in
 * lock-step.  The wmb() calls are kept as markers in case KVM needs them or
 * kqemu gains SMP support.
 */
#define wmb() do { } while (0)
96
97/* PCI bindings. */
98
99typedef struct {
100 PCIDevice pci_dev;
101 VirtIODevice *vdev;
3dbca8e6 102 uint32_t flags;
53c25cea 103 uint32_t addr;
ab73ff29 104 uint32_t class_code;
a1e0fea5 105 uint32_t nvectors;
428c149b 106 BlockConf block;
97b15621 107 NICConf nic;
8172539d 108 uint32_t host_features;
9f107513
AL
109#ifdef CONFIG_LINUX
110 V9fsConf fsconf;
111#endif
98b19252
AS
112 /* Max. number of ports we can have for a the virtio-serial device */
113 uint32_t max_virtserial_ports;
f0c07c7c 114 virtio_net_conf net;
25db9ebe
SH
115 bool ioeventfd_disabled;
116 bool ioeventfd_started;
53c25cea
PB
117} VirtIOPCIProxy;
118
119/* virtio device */
120
7055e687 121static void virtio_pci_notify(void *opaque, uint16_t vector)
53c25cea
PB
122{
123 VirtIOPCIProxy *proxy = opaque;
aba800a3
MT
124 if (msix_enabled(&proxy->pci_dev))
125 msix_notify(&proxy->pci_dev, vector);
126 else
127 qemu_set_irq(proxy->pci_dev.irq[0], proxy->vdev->isr & 1);
53c25cea
PB
128}
129
ff24bd58
MT
130static void virtio_pci_save_config(void * opaque, QEMUFile *f)
131{
132 VirtIOPCIProxy *proxy = opaque;
133 pci_device_save(&proxy->pci_dev, f);
134 msix_save(&proxy->pci_dev, f);
135 if (msix_present(&proxy->pci_dev))
136 qemu_put_be16(f, proxy->vdev->config_vector);
137}
138
139static void virtio_pci_save_queue(void * opaque, int n, QEMUFile *f)
140{
141 VirtIOPCIProxy *proxy = opaque;
142 if (msix_present(&proxy->pci_dev))
143 qemu_put_be16(f, virtio_queue_vector(proxy->vdev, n));
144}
145
146static int virtio_pci_load_config(void * opaque, QEMUFile *f)
147{
148 VirtIOPCIProxy *proxy = opaque;
149 int ret;
150 ret = pci_device_load(&proxy->pci_dev, f);
e6da7680 151 if (ret) {
ff24bd58 152 return ret;
e6da7680 153 }
ff24bd58 154 msix_load(&proxy->pci_dev, f);
e6da7680 155 if (msix_present(&proxy->pci_dev)) {
ff24bd58 156 qemu_get_be16s(f, &proxy->vdev->config_vector);
e6da7680
MT
157 } else {
158 proxy->vdev->config_vector = VIRTIO_NO_VECTOR;
159 }
160 if (proxy->vdev->config_vector != VIRTIO_NO_VECTOR) {
161 return msix_vector_use(&proxy->pci_dev, proxy->vdev->config_vector);
162 }
c81131db
AG
163
164 /* Try to find out if the guest has bus master disabled, but is
165 in ready state. Then we have a buggy guest OS. */
8a911107 166 if ((proxy->vdev->status & VIRTIO_CONFIG_S_DRIVER_OK) &&
c81131db 167 !(proxy->pci_dev.config[PCI_COMMAND] & PCI_COMMAND_MASTER)) {
3dbca8e6 168 proxy->flags |= VIRTIO_PCI_FLAG_BUS_MASTER_BUG;
c81131db 169 }
ff24bd58
MT
170 return 0;
171}
172
173static int virtio_pci_load_queue(void * opaque, int n, QEMUFile *f)
174{
175 VirtIOPCIProxy *proxy = opaque;
176 uint16_t vector;
e6da7680
MT
177 if (msix_present(&proxy->pci_dev)) {
178 qemu_get_be16s(f, &vector);
179 } else {
180 vector = VIRTIO_NO_VECTOR;
181 }
ff24bd58 182 virtio_queue_set_vector(proxy->vdev, n, vector);
e6da7680
MT
183 if (vector != VIRTIO_NO_VECTOR) {
184 return msix_vector_use(&proxy->pci_dev, vector);
185 }
ff24bd58
MT
186 return 0;
187}
188
25db9ebe
SH
189static int virtio_pci_set_host_notifier_internal(VirtIOPCIProxy *proxy,
190 int n, bool assign)
191{
192 VirtQueue *vq = virtio_get_queue(proxy->vdev, n);
193 EventNotifier *notifier = virtio_queue_get_host_notifier(vq);
194 int r;
195 if (assign) {
196 r = event_notifier_init(notifier, 1);
197 if (r < 0) {
b36e3914
MT
198 error_report("%s: unable to init event notifier: %d",
199 __func__, r);
25db9ebe
SH
200 return r;
201 }
202 r = kvm_set_ioeventfd_pio_word(event_notifier_get_fd(notifier),
203 proxy->addr + VIRTIO_PCI_QUEUE_NOTIFY,
204 n, assign);
205 if (r < 0) {
b36e3914
MT
206 error_report("%s: unable to map ioeventfd: %d",
207 __func__, r);
25db9ebe
SH
208 event_notifier_cleanup(notifier);
209 }
210 } else {
211 r = kvm_set_ioeventfd_pio_word(event_notifier_get_fd(notifier),
212 proxy->addr + VIRTIO_PCI_QUEUE_NOTIFY,
213 n, assign);
214 if (r < 0) {
b36e3914
MT
215 error_report("%s: unable to unmap ioeventfd: %d",
216 __func__, r);
25db9ebe
SH
217 return r;
218 }
219
220 /* Handle the race condition where the guest kicked and we deassigned
221 * before we got around to handling the kick.
222 */
223 if (event_notifier_test_and_clear(notifier)) {
224 virtio_queue_notify_vq(vq);
225 }
226
227 event_notifier_cleanup(notifier);
228 }
229 return r;
230}
231
232static void virtio_pci_host_notifier_read(void *opaque)
233{
234 VirtQueue *vq = opaque;
235 EventNotifier *n = virtio_queue_get_host_notifier(vq);
236 if (event_notifier_test_and_clear(n)) {
237 virtio_queue_notify_vq(vq);
238 }
239}
240
241static void virtio_pci_set_host_notifier_fd_handler(VirtIOPCIProxy *proxy,
242 int n, bool assign)
243{
244 VirtQueue *vq = virtio_get_queue(proxy->vdev, n);
245 EventNotifier *notifier = virtio_queue_get_host_notifier(vq);
246 if (assign) {
247 qemu_set_fd_handler(event_notifier_get_fd(notifier),
248 virtio_pci_host_notifier_read, NULL, vq);
249 } else {
250 qemu_set_fd_handler(event_notifier_get_fd(notifier),
251 NULL, NULL, NULL);
252 }
253}
254
b36e3914 255static void virtio_pci_start_ioeventfd(VirtIOPCIProxy *proxy)
25db9ebe
SH
256{
257 int n, r;
258
259 if (!(proxy->flags & VIRTIO_PCI_FLAG_USE_IOEVENTFD) ||
260 proxy->ioeventfd_disabled ||
261 proxy->ioeventfd_started) {
b36e3914 262 return;
25db9ebe
SH
263 }
264
265 for (n = 0; n < VIRTIO_PCI_QUEUE_MAX; n++) {
266 if (!virtio_queue_get_num(proxy->vdev, n)) {
267 continue;
268 }
269
270 r = virtio_pci_set_host_notifier_internal(proxy, n, true);
271 if (r < 0) {
272 goto assign_error;
273 }
274
275 virtio_pci_set_host_notifier_fd_handler(proxy, n, true);
276 }
277 proxy->ioeventfd_started = true;
b36e3914 278 return;
25db9ebe
SH
279
280assign_error:
281 while (--n >= 0) {
282 if (!virtio_queue_get_num(proxy->vdev, n)) {
283 continue;
284 }
285
286 virtio_pci_set_host_notifier_fd_handler(proxy, n, false);
b36e3914
MT
287 r = virtio_pci_set_host_notifier_internal(proxy, n, false);
288 assert(r >= 0);
25db9ebe
SH
289 }
290 proxy->ioeventfd_started = false;
b36e3914 291 error_report("%s: failed. Fallback to a userspace (slower).", __func__);
25db9ebe
SH
292}
293
b36e3914 294static void virtio_pci_stop_ioeventfd(VirtIOPCIProxy *proxy)
25db9ebe 295{
b36e3914 296 int r;
25db9ebe
SH
297 int n;
298
299 if (!proxy->ioeventfd_started) {
b36e3914 300 return;
25db9ebe
SH
301 }
302
303 for (n = 0; n < VIRTIO_PCI_QUEUE_MAX; n++) {
304 if (!virtio_queue_get_num(proxy->vdev, n)) {
305 continue;
306 }
307
308 virtio_pci_set_host_notifier_fd_handler(proxy, n, false);
b36e3914
MT
309 r = virtio_pci_set_host_notifier_internal(proxy, n, false);
310 assert(r >= 0);
25db9ebe
SH
311 }
312 proxy->ioeventfd_started = false;
25db9ebe
SH
313}
314
e489030d 315static void virtio_pci_reset(DeviceState *d)
7055e687 316{
e489030d 317 VirtIOPCIProxy *proxy = container_of(d, VirtIOPCIProxy, pci_dev.qdev);
25db9ebe 318 virtio_pci_stop_ioeventfd(proxy);
7055e687 319 virtio_reset(proxy->vdev);
aba800a3 320 msix_reset(&proxy->pci_dev);
25db9ebe 321 proxy->flags &= ~VIRTIO_PCI_FLAG_BUS_MASTER_BUG;
7055e687
MT
322}
323
53c25cea
PB
324static void virtio_ioport_write(void *opaque, uint32_t addr, uint32_t val)
325{
326 VirtIOPCIProxy *proxy = opaque;
327 VirtIODevice *vdev = proxy->vdev;
c227f099 328 target_phys_addr_t pa;
53c25cea 329
53c25cea
PB
330 switch (addr) {
331 case VIRTIO_PCI_GUEST_FEATURES:
332 /* Guest does not negotiate properly? We have to assume nothing. */
333 if (val & (1 << VIRTIO_F_BAD_FEATURE)) {
334 if (vdev->bad_features)
8172539d 335 val = proxy->host_features & vdev->bad_features(vdev);
53c25cea
PB
336 else
337 val = 0;
338 }
339 if (vdev->set_features)
340 vdev->set_features(vdev, val);
704a76fc 341 vdev->guest_features = val;
53c25cea
PB
342 break;
343 case VIRTIO_PCI_QUEUE_PFN:
c227f099 344 pa = (target_phys_addr_t)val << VIRTIO_PCI_QUEUE_ADDR_SHIFT;
1b8e9b27 345 if (pa == 0) {
25db9ebe 346 virtio_pci_stop_ioeventfd(proxy);
1b8e9b27
MT
347 virtio_reset(proxy->vdev);
348 msix_unuse_all_vectors(&proxy->pci_dev);
349 }
7055e687
MT
350 else
351 virtio_queue_set_addr(vdev, vdev->queue_sel, pa);
53c25cea
PB
352 break;
353 case VIRTIO_PCI_QUEUE_SEL:
354 if (val < VIRTIO_PCI_QUEUE_MAX)
355 vdev->queue_sel = val;
356 break;
357 case VIRTIO_PCI_QUEUE_NOTIFY:
358 virtio_queue_notify(vdev, val);
359 break;
360 case VIRTIO_PCI_STATUS:
25db9ebe
SH
361 if (!(val & VIRTIO_CONFIG_S_DRIVER_OK)) {
362 virtio_pci_stop_ioeventfd(proxy);
363 }
364
3e607cb5 365 virtio_set_status(vdev, val & 0xFF);
25db9ebe
SH
366
367 if (val & VIRTIO_CONFIG_S_DRIVER_OK) {
368 virtio_pci_start_ioeventfd(proxy);
369 }
370
1b8e9b27
MT
371 if (vdev->status == 0) {
372 virtio_reset(proxy->vdev);
373 msix_unuse_all_vectors(&proxy->pci_dev);
374 }
c81131db
AG
375
376 /* Linux before 2.6.34 sets the device as OK without enabling
377 the PCI device bus master bit. In this case we need to disable
378 some safety checks. */
379 if ((val & VIRTIO_CONFIG_S_DRIVER_OK) &&
380 !(proxy->pci_dev.config[PCI_COMMAND] & PCI_COMMAND_MASTER)) {
3dbca8e6 381 proxy->flags |= VIRTIO_PCI_FLAG_BUS_MASTER_BUG;
c81131db 382 }
53c25cea 383 break;
aba800a3
MT
384 case VIRTIO_MSI_CONFIG_VECTOR:
385 msix_vector_unuse(&proxy->pci_dev, vdev->config_vector);
386 /* Make it possible for guest to discover an error took place. */
387 if (msix_vector_use(&proxy->pci_dev, val) < 0)
388 val = VIRTIO_NO_VECTOR;
389 vdev->config_vector = val;
390 break;
391 case VIRTIO_MSI_QUEUE_VECTOR:
392 msix_vector_unuse(&proxy->pci_dev,
393 virtio_queue_vector(vdev, vdev->queue_sel));
394 /* Make it possible for guest to discover an error took place. */
395 if (msix_vector_use(&proxy->pci_dev, val) < 0)
396 val = VIRTIO_NO_VECTOR;
397 virtio_queue_set_vector(vdev, vdev->queue_sel, val);
398 break;
399 default:
4e02d460
SH
400 error_report("%s: unexpected address 0x%x value 0x%x",
401 __func__, addr, val);
aba800a3 402 break;
53c25cea
PB
403 }
404}
405
aba800a3 406static uint32_t virtio_ioport_read(VirtIOPCIProxy *proxy, uint32_t addr)
53c25cea 407{
53c25cea
PB
408 VirtIODevice *vdev = proxy->vdev;
409 uint32_t ret = 0xFFFFFFFF;
410
53c25cea
PB
411 switch (addr) {
412 case VIRTIO_PCI_HOST_FEATURES:
8172539d 413 ret = proxy->host_features;
53c25cea
PB
414 break;
415 case VIRTIO_PCI_GUEST_FEATURES:
704a76fc 416 ret = vdev->guest_features;
53c25cea
PB
417 break;
418 case VIRTIO_PCI_QUEUE_PFN:
419 ret = virtio_queue_get_addr(vdev, vdev->queue_sel)
420 >> VIRTIO_PCI_QUEUE_ADDR_SHIFT;
421 break;
422 case VIRTIO_PCI_QUEUE_NUM:
423 ret = virtio_queue_get_num(vdev, vdev->queue_sel);
424 break;
425 case VIRTIO_PCI_QUEUE_SEL:
426 ret = vdev->queue_sel;
427 break;
428 case VIRTIO_PCI_STATUS:
429 ret = vdev->status;
430 break;
431 case VIRTIO_PCI_ISR:
432 /* reading from the ISR also clears it. */
433 ret = vdev->isr;
434 vdev->isr = 0;
7055e687 435 qemu_set_irq(proxy->pci_dev.irq[0], 0);
53c25cea 436 break;
aba800a3
MT
437 case VIRTIO_MSI_CONFIG_VECTOR:
438 ret = vdev->config_vector;
439 break;
440 case VIRTIO_MSI_QUEUE_VECTOR:
441 ret = virtio_queue_vector(vdev, vdev->queue_sel);
442 break;
53c25cea
PB
443 default:
444 break;
445 }
446
447 return ret;
448}
449
450static uint32_t virtio_pci_config_readb(void *opaque, uint32_t addr)
451{
452 VirtIOPCIProxy *proxy = opaque;
aba800a3
MT
453 uint32_t config = VIRTIO_PCI_CONFIG(&proxy->pci_dev);
454 addr -= proxy->addr;
455 if (addr < config)
456 return virtio_ioport_read(proxy, addr);
457 addr -= config;
53c25cea
PB
458 return virtio_config_readb(proxy->vdev, addr);
459}
460
461static uint32_t virtio_pci_config_readw(void *opaque, uint32_t addr)
462{
463 VirtIOPCIProxy *proxy = opaque;
aba800a3
MT
464 uint32_t config = VIRTIO_PCI_CONFIG(&proxy->pci_dev);
465 addr -= proxy->addr;
466 if (addr < config)
467 return virtio_ioport_read(proxy, addr);
468 addr -= config;
53c25cea
PB
469 return virtio_config_readw(proxy->vdev, addr);
470}
471
472static uint32_t virtio_pci_config_readl(void *opaque, uint32_t addr)
473{
474 VirtIOPCIProxy *proxy = opaque;
aba800a3
MT
475 uint32_t config = VIRTIO_PCI_CONFIG(&proxy->pci_dev);
476 addr -= proxy->addr;
477 if (addr < config)
478 return virtio_ioport_read(proxy, addr);
479 addr -= config;
53c25cea
PB
480 return virtio_config_readl(proxy->vdev, addr);
481}
482
483static void virtio_pci_config_writeb(void *opaque, uint32_t addr, uint32_t val)
484{
485 VirtIOPCIProxy *proxy = opaque;
aba800a3
MT
486 uint32_t config = VIRTIO_PCI_CONFIG(&proxy->pci_dev);
487 addr -= proxy->addr;
488 if (addr < config) {
489 virtio_ioport_write(proxy, addr, val);
490 return;
491 }
492 addr -= config;
53c25cea
PB
493 virtio_config_writeb(proxy->vdev, addr, val);
494}
495
496static void virtio_pci_config_writew(void *opaque, uint32_t addr, uint32_t val)
497{
498 VirtIOPCIProxy *proxy = opaque;
aba800a3
MT
499 uint32_t config = VIRTIO_PCI_CONFIG(&proxy->pci_dev);
500 addr -= proxy->addr;
501 if (addr < config) {
502 virtio_ioport_write(proxy, addr, val);
503 return;
504 }
505 addr -= config;
53c25cea
PB
506 virtio_config_writew(proxy->vdev, addr, val);
507}
508
509static void virtio_pci_config_writel(void *opaque, uint32_t addr, uint32_t val)
510{
511 VirtIOPCIProxy *proxy = opaque;
aba800a3
MT
512 uint32_t config = VIRTIO_PCI_CONFIG(&proxy->pci_dev);
513 addr -= proxy->addr;
514 if (addr < config) {
515 virtio_ioport_write(proxy, addr, val);
516 return;
517 }
518 addr -= config;
53c25cea
PB
519 virtio_config_writel(proxy->vdev, addr, val);
520}
521
522static void virtio_map(PCIDevice *pci_dev, int region_num,
6e355d90 523 pcibus_t addr, pcibus_t size, int type)
53c25cea
PB
524{
525 VirtIOPCIProxy *proxy = container_of(pci_dev, VirtIOPCIProxy, pci_dev);
526 VirtIODevice *vdev = proxy->vdev;
aba800a3 527 unsigned config_len = VIRTIO_PCI_REGION_SIZE(pci_dev) + vdev->config_len;
53c25cea
PB
528
529 proxy->addr = addr;
53c25cea 530
aba800a3
MT
531 register_ioport_write(addr, config_len, 1, virtio_pci_config_writeb, proxy);
532 register_ioport_write(addr, config_len, 2, virtio_pci_config_writew, proxy);
533 register_ioport_write(addr, config_len, 4, virtio_pci_config_writel, proxy);
534 register_ioport_read(addr, config_len, 1, virtio_pci_config_readb, proxy);
535 register_ioport_read(addr, config_len, 2, virtio_pci_config_readw, proxy);
536 register_ioport_read(addr, config_len, 4, virtio_pci_config_readl, proxy);
53c25cea 537
aba800a3 538 if (vdev->config_len)
53c25cea 539 vdev->get_config(vdev, vdev->config);
aba800a3
MT
540}
541
542static void virtio_write_config(PCIDevice *pci_dev, uint32_t address,
543 uint32_t val, int len)
544{
ed757e14
YV
545 VirtIOPCIProxy *proxy = DO_UPCAST(VirtIOPCIProxy, pci_dev, pci_dev);
546
547 if (PCI_COMMAND == address) {
548 if (!(val & PCI_COMMAND_MASTER)) {
3dbca8e6 549 if (!(proxy->flags & VIRTIO_PCI_FLAG_BUS_MASTER_BUG)) {
25db9ebe 550 virtio_pci_stop_ioeventfd(proxy);
3e607cb5
MT
551 virtio_set_status(proxy->vdev,
552 proxy->vdev->status & ~VIRTIO_CONFIG_S_DRIVER_OK);
c81131db 553 }
ed757e14
YV
554 }
555 }
556
aba800a3 557 pci_default_write_config(pci_dev, address, val, len);
85352471 558 msix_write_config(pci_dev, address, val, len);
53c25cea
PB
559}
560
6d74ca5a
MT
561static unsigned virtio_pci_get_features(void *opaque)
562{
8172539d
MT
563 VirtIOPCIProxy *proxy = opaque;
564 return proxy->host_features;
6d74ca5a
MT
565}
566
ade80dc8
MT
567static void virtio_pci_guest_notifier_read(void *opaque)
568{
569 VirtQueue *vq = opaque;
570 EventNotifier *n = virtio_queue_get_guest_notifier(vq);
571 if (event_notifier_test_and_clear(n)) {
572 virtio_irq(vq);
573 }
574}
575
576static int virtio_pci_set_guest_notifier(void *opaque, int n, bool assign)
577{
578 VirtIOPCIProxy *proxy = opaque;
579 VirtQueue *vq = virtio_get_queue(proxy->vdev, n);
580 EventNotifier *notifier = virtio_queue_get_guest_notifier(vq);
581
582 if (assign) {
583 int r = event_notifier_init(notifier, 0);
584 if (r < 0) {
585 return r;
586 }
587 qemu_set_fd_handler(event_notifier_get_fd(notifier),
588 virtio_pci_guest_notifier_read, NULL, vq);
589 } else {
590 qemu_set_fd_handler(event_notifier_get_fd(notifier),
591 NULL, NULL, NULL);
592 event_notifier_cleanup(notifier);
593 }
594
595 return 0;
596}
597
5430a28f 598static bool virtio_pci_query_guest_notifiers(void *opaque)
599{
600 VirtIOPCIProxy *proxy = opaque;
601 return msix_enabled(&proxy->pci_dev);
602}
603
54dd9321
MT
604static int virtio_pci_set_guest_notifiers(void *opaque, bool assign)
605{
606 VirtIOPCIProxy *proxy = opaque;
607 VirtIODevice *vdev = proxy->vdev;
608 int r, n;
609
610 for (n = 0; n < VIRTIO_PCI_QUEUE_MAX; n++) {
611 if (!virtio_queue_get_num(vdev, n)) {
612 break;
613 }
614
615 r = virtio_pci_set_guest_notifier(opaque, n, assign);
616 if (r < 0) {
617 goto assign_error;
618 }
619 }
620
621 return 0;
622
623assign_error:
624 /* We get here on assignment failure. Recover by undoing for VQs 0 .. n. */
625 while (--n >= 0) {
626 virtio_pci_set_guest_notifier(opaque, n, !assign);
627 }
628 return r;
629}
630
ade80dc8
MT
631static int virtio_pci_set_host_notifier(void *opaque, int n, bool assign)
632{
633 VirtIOPCIProxy *proxy = opaque;
25db9ebe
SH
634
635 /* Stop using ioeventfd for virtqueue kick if the device starts using host
636 * notifiers. This makes it easy to avoid stepping on each others' toes.
637 */
638 proxy->ioeventfd_disabled = assign;
ade80dc8 639 if (assign) {
25db9ebe
SH
640 virtio_pci_stop_ioeventfd(proxy);
641 }
642 /* We don't need to start here: it's not needed because backend
643 * currently only stops on status change away from ok,
644 * reset, vmstop and such. If we do add code to start here,
645 * need to check vmstate, device state etc. */
646 return virtio_pci_set_host_notifier_internal(proxy, n, assign);
647}
648
649static void virtio_pci_vmstate_change(void *opaque, bool running)
650{
651 VirtIOPCIProxy *proxy = opaque;
652
653 if (running) {
654 virtio_pci_start_ioeventfd(proxy);
ade80dc8 655 } else {
25db9ebe 656 virtio_pci_stop_ioeventfd(proxy);
ade80dc8 657 }
ade80dc8
MT
658}
659
53c25cea 660static const VirtIOBindings virtio_pci_bindings = {
ff24bd58
MT
661 .notify = virtio_pci_notify,
662 .save_config = virtio_pci_save_config,
663 .load_config = virtio_pci_load_config,
664 .save_queue = virtio_pci_save_queue,
665 .load_queue = virtio_pci_load_queue,
6d74ca5a 666 .get_features = virtio_pci_get_features,
5430a28f 667 .query_guest_notifiers = virtio_pci_query_guest_notifiers,
ade80dc8 668 .set_host_notifier = virtio_pci_set_host_notifier,
54dd9321 669 .set_guest_notifiers = virtio_pci_set_guest_notifiers,
25db9ebe 670 .vmstate_change = virtio_pci_vmstate_change,
53c25cea
PB
671};
672
673static void virtio_init_pci(VirtIOPCIProxy *proxy, VirtIODevice *vdev,
674 uint16_t vendor, uint16_t device,
675 uint16_t class_code, uint8_t pif)
676{
677 uint8_t *config;
678 uint32_t size;
679
680 proxy->vdev = vdev;
681
682 config = proxy->pci_dev.config;
683 pci_config_set_vendor_id(config, vendor);
684 pci_config_set_device_id(config, device);
685
686 config[0x08] = VIRTIO_PCI_ABI_VERSION;
687
688 config[0x09] = pif;
689 pci_config_set_class(config, class_code);
53c25cea
PB
690
691 config[0x2c] = vendor & 0xFF;
692 config[0x2d] = (vendor >> 8) & 0xFF;
693 config[0x2e] = vdev->device_id & 0xFF;
694 config[0x2f] = (vdev->device_id >> 8) & 0xFF;
695
696 config[0x3d] = 1;
697
5a1fc5e8 698 if (vdev->nvectors && !msix_init(&proxy->pci_dev, vdev->nvectors, 1, 0)) {
aba800a3
MT
699 pci_register_bar(&proxy->pci_dev, 1,
700 msix_bar_size(&proxy->pci_dev),
0392a017 701 PCI_BASE_ADDRESS_SPACE_MEMORY,
aba800a3 702 msix_mmio_map);
aba800a3
MT
703 } else
704 vdev->nvectors = 0;
705
ed757e14
YV
706 proxy->pci_dev.config_write = virtio_write_config;
707
aba800a3 708 size = VIRTIO_PCI_REGION_SIZE(&proxy->pci_dev) + vdev->config_len;
53c25cea
PB
709 if (size & (size-1))
710 size = 1 << qemu_fls(size);
711
0392a017 712 pci_register_bar(&proxy->pci_dev, 0, size, PCI_BASE_ADDRESS_SPACE_IO,
53c25cea
PB
713 virtio_map);
714
25db9ebe
SH
715 if (!kvm_has_many_ioeventfds()) {
716 proxy->flags &= ~VIRTIO_PCI_FLAG_USE_IOEVENTFD;
717 }
718
53c25cea 719 virtio_bind_device(vdev, &virtio_pci_bindings, proxy);
8172539d
MT
720 proxy->host_features |= 0x1 << VIRTIO_F_NOTIFY_ON_EMPTY;
721 proxy->host_features |= 0x1 << VIRTIO_F_BAD_FEATURE;
722 proxy->host_features = vdev->get_features(vdev, proxy->host_features);
53c25cea
PB
723}
724
81a322d4 725static int virtio_blk_init_pci(PCIDevice *pci_dev)
53c25cea
PB
726{
727 VirtIOPCIProxy *proxy = DO_UPCAST(VirtIOPCIProxy, pci_dev, pci_dev);
728 VirtIODevice *vdev;
729
ab73ff29
GH
730 if (proxy->class_code != PCI_CLASS_STORAGE_SCSI &&
731 proxy->class_code != PCI_CLASS_STORAGE_OTHER)
732 proxy->class_code = PCI_CLASS_STORAGE_SCSI;
53c25cea 733
428c149b 734 vdev = virtio_blk_init(&pci_dev->qdev, &proxy->block);
ac0c14d7
MA
735 if (!vdev) {
736 return -1;
737 }
177539e0 738 vdev->nvectors = proxy->nvectors;
53c25cea
PB
739 virtio_init_pci(proxy, vdev,
740 PCI_VENDOR_ID_REDHAT_QUMRANET,
85c2c735
MM
741 PCI_DEVICE_ID_VIRTIO_BLOCK,
742 proxy->class_code, 0x00);
177539e0
GH
743 /* make the actual value visible */
744 proxy->nvectors = vdev->nvectors;
81a322d4 745 return 0;
21d58b57
MM
746}
747
0f457d91
MT
748static int virtio_exit_pci(PCIDevice *pci_dev)
749{
750 return msix_uninit(pci_dev);
751}
752
56a14938
GH
753static int virtio_blk_exit_pci(PCIDevice *pci_dev)
754{
755 VirtIOPCIProxy *proxy = DO_UPCAST(VirtIOPCIProxy, pci_dev, pci_dev);
756
25db9ebe 757 virtio_pci_stop_ioeventfd(proxy);
9d0d3138 758 virtio_blk_exit(proxy->vdev);
f8b6cc00 759 blockdev_mark_auto_del(proxy->block.bs);
0f457d91 760 return virtio_exit_pci(pci_dev);
56a14938
GH
761}
762
98b19252 763static int virtio_serial_init_pci(PCIDevice *pci_dev)
21d58b57 764{
d6beee99 765 VirtIOPCIProxy *proxy = DO_UPCAST(VirtIOPCIProxy, pci_dev, pci_dev);
85c2c735
MM
766 VirtIODevice *vdev;
767
d6beee99
GH
768 if (proxy->class_code != PCI_CLASS_COMMUNICATION_OTHER &&
769 proxy->class_code != PCI_CLASS_DISPLAY_OTHER && /* qemu 0.10 */
770 proxy->class_code != PCI_CLASS_OTHERS) /* qemu-kvm */
771 proxy->class_code = PCI_CLASS_COMMUNICATION_OTHER;
772
98b19252 773 vdev = virtio_serial_init(&pci_dev->qdev, proxy->max_virtserial_ports);
25fe3654
AS
774 if (!vdev) {
775 return -1;
776 }
573fb60c
AS
777 vdev->nvectors = proxy->nvectors == DEV_NVECTORS_UNSPECIFIED
778 ? proxy->max_virtserial_ports + 1
779 : proxy->nvectors;
85c2c735
MM
780 virtio_init_pci(proxy, vdev,
781 PCI_VENDOR_ID_REDHAT_QUMRANET,
782 PCI_DEVICE_ID_VIRTIO_CONSOLE,
783 proxy->class_code, 0x00);
a1829205 784 proxy->nvectors = vdev->nvectors;
81a322d4 785 return 0;
53c25cea
PB
786}
787
8b53a865
AS
788static int virtio_serial_exit_pci(PCIDevice *pci_dev)
789{
790 VirtIOPCIProxy *proxy = DO_UPCAST(VirtIOPCIProxy, pci_dev, pci_dev);
791
792 virtio_serial_exit(proxy->vdev);
793 return virtio_exit_pci(pci_dev);
794}
795
81a322d4 796static int virtio_net_init_pci(PCIDevice *pci_dev)
53c25cea
PB
797{
798 VirtIOPCIProxy *proxy = DO_UPCAST(VirtIOPCIProxy, pci_dev, pci_dev);
799 VirtIODevice *vdev;
800
f0c07c7c 801 vdev = virtio_net_init(&pci_dev->qdev, &proxy->nic, &proxy->net);
a1e0fea5 802
97b15621 803 vdev->nvectors = proxy->nvectors;
53c25cea
PB
804 virtio_init_pci(proxy, vdev,
805 PCI_VENDOR_ID_REDHAT_QUMRANET,
806 PCI_DEVICE_ID_VIRTIO_NET,
807 PCI_CLASS_NETWORK_ETHERNET,
808 0x00);
a1e0fea5
GH
809
810 /* make the actual value visible */
811 proxy->nvectors = vdev->nvectors;
81a322d4 812 return 0;
53c25cea
PB
813}
814
97b15621
GH
815static int virtio_net_exit_pci(PCIDevice *pci_dev)
816{
817 VirtIOPCIProxy *proxy = DO_UPCAST(VirtIOPCIProxy, pci_dev, pci_dev);
818
25db9ebe 819 virtio_pci_stop_ioeventfd(proxy);
97b15621
GH
820 virtio_net_exit(proxy->vdev);
821 return virtio_exit_pci(pci_dev);
822}
823
81a322d4 824static int virtio_balloon_init_pci(PCIDevice *pci_dev)
53c25cea
PB
825{
826 VirtIOPCIProxy *proxy = DO_UPCAST(VirtIOPCIProxy, pci_dev, pci_dev);
827 VirtIODevice *vdev;
828
829 vdev = virtio_balloon_init(&pci_dev->qdev);
830 virtio_init_pci(proxy, vdev,
831 PCI_VENDOR_ID_REDHAT_QUMRANET,
832 PCI_DEVICE_ID_VIRTIO_BALLOON,
833 PCI_CLASS_MEMORY_RAM,
834 0x00);
81a322d4 835 return 0;
53c25cea
PB
836}
837
#ifdef CONFIG_VIRTFS
/* qdev init for virtio-9p-pci.  Always returns 0. */
static int virtio_9p_init_pci(PCIDevice *pci_dev)
{
    VirtIOPCIProxy *proxy = DO_UPCAST(VirtIOPCIProxy, pci_dev, pci_dev);
    VirtIODevice *vdev = virtio_9p_init(&pci_dev->qdev, &proxy->fsconf);

    vdev->nvectors = proxy->nvectors;
    virtio_init_pci(proxy, vdev,
                    PCI_VENDOR_ID_REDHAT_QUMRANET,
                    0x1009,
                    0x2,
                    0x00);

    /* virtio_init_pci() may have zeroed nvectors; expose the real value */
    proxy->nvectors = vdev->nvectors;
    return 0;
}
#endif
856
0aab0d3a
GH
857static PCIDeviceInfo virtio_info[] = {
858 {
859 .qdev.name = "virtio-blk-pci",
779206de 860 .qdev.alias = "virtio-blk",
0aab0d3a
GH
861 .qdev.size = sizeof(VirtIOPCIProxy),
862 .init = virtio_blk_init_pci,
56a14938 863 .exit = virtio_blk_exit_pci,
ab73ff29 864 .qdev.props = (Property[]) {
72c61d0b 865 DEFINE_PROP_HEX32("class", VirtIOPCIProxy, class_code, 0),
428c149b 866 DEFINE_BLOCK_PROPERTIES(VirtIOPCIProxy, block),
25db9ebe
SH
867 DEFINE_PROP_BIT("ioeventfd", VirtIOPCIProxy, flags,
868 VIRTIO_PCI_FLAG_USE_IOEVENTFD_BIT, true),
177539e0 869 DEFINE_PROP_UINT32("vectors", VirtIOPCIProxy, nvectors, 2),
8172539d 870 DEFINE_VIRTIO_BLK_FEATURES(VirtIOPCIProxy, host_features),
72c61d0b 871 DEFINE_PROP_END_OF_LIST(),
ab73ff29 872 },
e489030d 873 .qdev.reset = virtio_pci_reset,
0aab0d3a 874 },{
a1e0fea5
GH
875 .qdev.name = "virtio-net-pci",
876 .qdev.size = sizeof(VirtIOPCIProxy),
877 .init = virtio_net_init_pci,
97b15621 878 .exit = virtio_net_exit_pci,
8c52c8f3 879 .romfile = "pxe-virtio.bin",
a1e0fea5 880 .qdev.props = (Property[]) {
25db9ebe
SH
881 DEFINE_PROP_BIT("ioeventfd", VirtIOPCIProxy, flags,
882 VIRTIO_PCI_FLAG_USE_IOEVENTFD_BIT, false),
97b15621 883 DEFINE_PROP_UINT32("vectors", VirtIOPCIProxy, nvectors, 3),
8172539d 884 DEFINE_VIRTIO_NET_FEATURES(VirtIOPCIProxy, host_features),
97b15621 885 DEFINE_NIC_PROPERTIES(VirtIOPCIProxy, nic),
f0c07c7c
AW
886 DEFINE_PROP_UINT32("x-txtimer", VirtIOPCIProxy,
887 net.txtimer, TX_TIMER_INTERVAL),
e3f30488
AW
888 DEFINE_PROP_INT32("x-txburst", VirtIOPCIProxy,
889 net.txburst, TX_BURST),
a697a334 890 DEFINE_PROP_STRING("tx", VirtIOPCIProxy, net.tx),
72c61d0b 891 DEFINE_PROP_END_OF_LIST(),
a1e0fea5 892 },
e489030d 893 .qdev.reset = virtio_pci_reset,
0aab0d3a 894 },{
98b19252
AS
895 .qdev.name = "virtio-serial-pci",
896 .qdev.alias = "virtio-serial",
0aab0d3a 897 .qdev.size = sizeof(VirtIOPCIProxy),
98b19252 898 .init = virtio_serial_init_pci,
8b53a865 899 .exit = virtio_serial_exit_pci,
d6beee99 900 .qdev.props = (Property[]) {
573fb60c
AS
901 DEFINE_PROP_UINT32("vectors", VirtIOPCIProxy, nvectors,
902 DEV_NVECTORS_UNSPECIFIED),
72c61d0b 903 DEFINE_PROP_HEX32("class", VirtIOPCIProxy, class_code, 0),
8172539d 904 DEFINE_VIRTIO_COMMON_FEATURES(VirtIOPCIProxy, host_features),
98b19252
AS
905 DEFINE_PROP_UINT32("max_ports", VirtIOPCIProxy, max_virtserial_ports,
906 31),
72c61d0b 907 DEFINE_PROP_END_OF_LIST(),
d6beee99 908 },
e489030d 909 .qdev.reset = virtio_pci_reset,
0aab0d3a
GH
910 },{
911 .qdev.name = "virtio-balloon-pci",
912 .qdev.size = sizeof(VirtIOPCIProxy),
913 .init = virtio_balloon_init_pci,
0f457d91 914 .exit = virtio_exit_pci,
8172539d
MT
915 .qdev.props = (Property[]) {
916 DEFINE_VIRTIO_COMMON_FEATURES(VirtIOPCIProxy, host_features),
917 DEFINE_PROP_END_OF_LIST(),
918 },
e489030d 919 .qdev.reset = virtio_pci_reset,
0aab0d3a 920 },{
758e8e38 921#ifdef CONFIG_VIRTFS
9f107513
AL
922 .qdev.name = "virtio-9p-pci",
923 .qdev.size = sizeof(VirtIOPCIProxy),
924 .init = virtio_9p_init_pci,
925 .qdev.props = (Property[]) {
9dbcca5a 926 DEFINE_PROP_UINT32("vectors", VirtIOPCIProxy, nvectors, 2),
9f107513
AL
927 DEFINE_VIRTIO_COMMON_FEATURES(VirtIOPCIProxy, host_features),
928 DEFINE_PROP_STRING("mount_tag", VirtIOPCIProxy, fsconf.tag),
929 DEFINE_PROP_STRING("fsdev", VirtIOPCIProxy, fsconf.fsdev_id),
930 DEFINE_PROP_END_OF_LIST(),
931 },
932 }, {
933#endif
0aab0d3a
GH
934 /* end of list */
935 }
936};
937
53c25cea
PB
938static void virtio_pci_register_devices(void)
939{
0aab0d3a 940 pci_qdev_register_many(virtio_info);
53c25cea
PB
941}
942
943device_init(virtio_pci_register_devices)