]> git.proxmox.com Git - qemu.git/blame - hw/virtio-pci.c
user: Restore debug usage message for '-d ?' in user mode emulation
[qemu.git] / hw / virtio-pci.c
CommitLineData
53c25cea
PB
1/*
2 * Virtio PCI Bindings
3 *
4 * Copyright IBM, Corp. 2007
5 * Copyright (c) 2009 CodeSourcery
6 *
7 * Authors:
8 * Anthony Liguori <aliguori@us.ibm.com>
9 * Paul Brook <paul@codesourcery.com>
10 *
11 * This work is licensed under the terms of the GNU GPL, version 2. See
12 * the COPYING file in the top-level directory.
13 *
14 */
15
16#include <inttypes.h>
17
18#include "virtio.h"
8172539d
MT
19#include "virtio-blk.h"
20#include "virtio-net.h"
6b331efb 21#include "virtio-serial.h"
53c25cea 22#include "pci.h"
2f792016 23#include "qemu-error.h"
aba800a3 24#include "msix.h"
a1e0fea5 25#include "net.h"
97b15621 26#include "loader.h"
ade80dc8 27#include "kvm.h"
2446333c 28#include "blockdev.h"
9fe1ebeb 29#include "virtio-pci.h"
53c25cea
PB
30
/*
 * Register layout of the virtio PCI I/O region (from Linux's
 * linux/virtio_pci.h).  Values are byte offsets into the region.
 */

/* 32-bit, read-only: bitmask of the features supported by the host */
#define VIRTIO_PCI_HOST_FEATURES        0

/* 32-bit, read/write: bitmask of features activated by the guest */
#define VIRTIO_PCI_GUEST_FEATURES       4

/* 32-bit, read/write: PFN for the currently selected queue */
#define VIRTIO_PCI_QUEUE_PFN            8

/* 16-bit, read-only: queue size for the currently selected queue */
#define VIRTIO_PCI_QUEUE_NUM            12

/* 16-bit, read/write: queue selector */
#define VIRTIO_PCI_QUEUE_SEL            14

/* 16-bit, read/write: queue notifier */
#define VIRTIO_PCI_QUEUE_NOTIFY         16

/* 8-bit: device status register */
#define VIRTIO_PCI_STATUS               18

/* 8-bit, read-only: interrupt status register.  Reading it returns the
 * current ISR contents and clears them, i.e. it is effectively a
 * read-and-acknowledge. */
#define VIRTIO_PCI_ISR                  19

/* MSI-X registers: only enabled if MSI-X is enabled. */
/* 16-bit: vector for configuration changes */
#define VIRTIO_MSI_CONFIG_VECTOR        20
/* 16-bit: vector for selected queue notifications */
#define VIRTIO_MSI_QUEUE_VECTOR         22

/* Size of the register header, without and with the MSI-X registers */
#define VIRTIO_PCI_CONFIG_NOMSI         20
#define VIRTIO_PCI_CONFIG_MSI           24

/* Header size used to size the I/O region: depends on whether the device
 * has an MSI-X capability at all (msix_present). */
#define VIRTIO_PCI_REGION_SIZE(dev)     (msix_present(dev) ? \
                                         VIRTIO_PCI_CONFIG_MSI : \
                                         VIRTIO_PCI_CONFIG_NOMSI)

/* The remaining space is defined by each driver as the per-driver
 * configuration space.  Its start depends on whether MSI-X is currently
 * enabled (msix_enabled). */
#define VIRTIO_PCI_CONFIG(dev)          (msix_enabled(dev) ? \
                                         VIRTIO_PCI_CONFIG_MSI : \
                                         VIRTIO_PCI_CONFIG_NOMSI)

/* How many bits to shift the physical queue address written to QUEUE_PFN.
 * 12 is historical, and due to x86 page size. */
#define VIRTIO_PCI_QUEUE_ADDR_SHIFT     12

/* Flags track per-device state like workarounds for quirks in older guests. */
#define VIRTIO_PCI_FLAG_BUS_MASTER_BUG  (1 << 0)

/* Performance improves when virtqueue kick processing is decoupled from the
 * vcpu thread using ioeventfd for some devices. */
#define VIRTIO_PCI_FLAG_USE_IOEVENTFD_BIT 1
#define VIRTIO_PCI_FLAG_USE_IOEVENTFD   (1 << VIRTIO_PCI_FLAG_USE_IOEVENTFD_BIT)

/* QEMU doesn't strictly need write barriers since everything runs in
 * lock-step.  The wmb() calls are kept (as a no-op) to make the ordering
 * requirement obvious for KVM or if kqemu gets SMP support.
 */
#define wmb() do { } while (0)
95
53c25cea
PB
96/* virtio device */
97
7055e687 98static void virtio_pci_notify(void *opaque, uint16_t vector)
53c25cea
PB
99{
100 VirtIOPCIProxy *proxy = opaque;
aba800a3
MT
101 if (msix_enabled(&proxy->pci_dev))
102 msix_notify(&proxy->pci_dev, vector);
103 else
104 qemu_set_irq(proxy->pci_dev.irq[0], proxy->vdev->isr & 1);
53c25cea
PB
105}
106
ff24bd58
MT
107static void virtio_pci_save_config(void * opaque, QEMUFile *f)
108{
109 VirtIOPCIProxy *proxy = opaque;
110 pci_device_save(&proxy->pci_dev, f);
111 msix_save(&proxy->pci_dev, f);
112 if (msix_present(&proxy->pci_dev))
113 qemu_put_be16(f, proxy->vdev->config_vector);
114}
115
116static void virtio_pci_save_queue(void * opaque, int n, QEMUFile *f)
117{
118 VirtIOPCIProxy *proxy = opaque;
119 if (msix_present(&proxy->pci_dev))
120 qemu_put_be16(f, virtio_queue_vector(proxy->vdev, n));
121}
122
123static int virtio_pci_load_config(void * opaque, QEMUFile *f)
124{
125 VirtIOPCIProxy *proxy = opaque;
126 int ret;
127 ret = pci_device_load(&proxy->pci_dev, f);
e6da7680 128 if (ret) {
ff24bd58 129 return ret;
e6da7680 130 }
ff24bd58 131 msix_load(&proxy->pci_dev, f);
e6da7680 132 if (msix_present(&proxy->pci_dev)) {
ff24bd58 133 qemu_get_be16s(f, &proxy->vdev->config_vector);
e6da7680
MT
134 } else {
135 proxy->vdev->config_vector = VIRTIO_NO_VECTOR;
136 }
137 if (proxy->vdev->config_vector != VIRTIO_NO_VECTOR) {
138 return msix_vector_use(&proxy->pci_dev, proxy->vdev->config_vector);
139 }
ff24bd58
MT
140 return 0;
141}
142
143static int virtio_pci_load_queue(void * opaque, int n, QEMUFile *f)
144{
145 VirtIOPCIProxy *proxy = opaque;
146 uint16_t vector;
e6da7680
MT
147 if (msix_present(&proxy->pci_dev)) {
148 qemu_get_be16s(f, &vector);
149 } else {
150 vector = VIRTIO_NO_VECTOR;
151 }
ff24bd58 152 virtio_queue_set_vector(proxy->vdev, n, vector);
e6da7680
MT
153 if (vector != VIRTIO_NO_VECTOR) {
154 return msix_vector_use(&proxy->pci_dev, vector);
155 }
ff24bd58
MT
156 return 0;
157}
158
25db9ebe
SH
159static int virtio_pci_set_host_notifier_internal(VirtIOPCIProxy *proxy,
160 int n, bool assign)
161{
162 VirtQueue *vq = virtio_get_queue(proxy->vdev, n);
163 EventNotifier *notifier = virtio_queue_get_host_notifier(vq);
164 int r;
165 if (assign) {
166 r = event_notifier_init(notifier, 1);
167 if (r < 0) {
b36e3914
MT
168 error_report("%s: unable to init event notifier: %d",
169 __func__, r);
25db9ebe
SH
170 return r;
171 }
172 r = kvm_set_ioeventfd_pio_word(event_notifier_get_fd(notifier),
173 proxy->addr + VIRTIO_PCI_QUEUE_NOTIFY,
174 n, assign);
175 if (r < 0) {
b36e3914
MT
176 error_report("%s: unable to map ioeventfd: %d",
177 __func__, r);
25db9ebe
SH
178 event_notifier_cleanup(notifier);
179 }
180 } else {
181 r = kvm_set_ioeventfd_pio_word(event_notifier_get_fd(notifier),
182 proxy->addr + VIRTIO_PCI_QUEUE_NOTIFY,
183 n, assign);
184 if (r < 0) {
b36e3914
MT
185 error_report("%s: unable to unmap ioeventfd: %d",
186 __func__, r);
25db9ebe
SH
187 return r;
188 }
189
190 /* Handle the race condition where the guest kicked and we deassigned
191 * before we got around to handling the kick.
192 */
193 if (event_notifier_test_and_clear(notifier)) {
194 virtio_queue_notify_vq(vq);
195 }
196
197 event_notifier_cleanup(notifier);
198 }
199 return r;
200}
201
202static void virtio_pci_host_notifier_read(void *opaque)
203{
204 VirtQueue *vq = opaque;
205 EventNotifier *n = virtio_queue_get_host_notifier(vq);
206 if (event_notifier_test_and_clear(n)) {
207 virtio_queue_notify_vq(vq);
208 }
209}
210
211static void virtio_pci_set_host_notifier_fd_handler(VirtIOPCIProxy *proxy,
212 int n, bool assign)
213{
214 VirtQueue *vq = virtio_get_queue(proxy->vdev, n);
215 EventNotifier *notifier = virtio_queue_get_host_notifier(vq);
216 if (assign) {
217 qemu_set_fd_handler(event_notifier_get_fd(notifier),
218 virtio_pci_host_notifier_read, NULL, vq);
219 } else {
220 qemu_set_fd_handler(event_notifier_get_fd(notifier),
221 NULL, NULL, NULL);
222 }
223}
224
b36e3914 225static void virtio_pci_start_ioeventfd(VirtIOPCIProxy *proxy)
25db9ebe
SH
226{
227 int n, r;
228
229 if (!(proxy->flags & VIRTIO_PCI_FLAG_USE_IOEVENTFD) ||
230 proxy->ioeventfd_disabled ||
231 proxy->ioeventfd_started) {
b36e3914 232 return;
25db9ebe
SH
233 }
234
235 for (n = 0; n < VIRTIO_PCI_QUEUE_MAX; n++) {
236 if (!virtio_queue_get_num(proxy->vdev, n)) {
237 continue;
238 }
239
240 r = virtio_pci_set_host_notifier_internal(proxy, n, true);
241 if (r < 0) {
242 goto assign_error;
243 }
244
245 virtio_pci_set_host_notifier_fd_handler(proxy, n, true);
246 }
247 proxy->ioeventfd_started = true;
b36e3914 248 return;
25db9ebe
SH
249
250assign_error:
251 while (--n >= 0) {
252 if (!virtio_queue_get_num(proxy->vdev, n)) {
253 continue;
254 }
255
256 virtio_pci_set_host_notifier_fd_handler(proxy, n, false);
b36e3914
MT
257 r = virtio_pci_set_host_notifier_internal(proxy, n, false);
258 assert(r >= 0);
25db9ebe
SH
259 }
260 proxy->ioeventfd_started = false;
b36e3914 261 error_report("%s: failed. Fallback to a userspace (slower).", __func__);
25db9ebe
SH
262}
263
b36e3914 264static void virtio_pci_stop_ioeventfd(VirtIOPCIProxy *proxy)
25db9ebe 265{
b36e3914 266 int r;
25db9ebe
SH
267 int n;
268
269 if (!proxy->ioeventfd_started) {
b36e3914 270 return;
25db9ebe
SH
271 }
272
273 for (n = 0; n < VIRTIO_PCI_QUEUE_MAX; n++) {
274 if (!virtio_queue_get_num(proxy->vdev, n)) {
275 continue;
276 }
277
278 virtio_pci_set_host_notifier_fd_handler(proxy, n, false);
b36e3914
MT
279 r = virtio_pci_set_host_notifier_internal(proxy, n, false);
280 assert(r >= 0);
25db9ebe
SH
281 }
282 proxy->ioeventfd_started = false;
25db9ebe
SH
283}
284
e489030d 285static void virtio_pci_reset(DeviceState *d)
7055e687 286{
e489030d 287 VirtIOPCIProxy *proxy = container_of(d, VirtIOPCIProxy, pci_dev.qdev);
25db9ebe 288 virtio_pci_stop_ioeventfd(proxy);
7055e687 289 virtio_reset(proxy->vdev);
aba800a3 290 msix_reset(&proxy->pci_dev);
25db9ebe 291 proxy->flags &= ~VIRTIO_PCI_FLAG_BUS_MASTER_BUG;
7055e687
MT
292}
293
53c25cea
PB
294static void virtio_ioport_write(void *opaque, uint32_t addr, uint32_t val)
295{
296 VirtIOPCIProxy *proxy = opaque;
297 VirtIODevice *vdev = proxy->vdev;
c227f099 298 target_phys_addr_t pa;
53c25cea 299
53c25cea
PB
300 switch (addr) {
301 case VIRTIO_PCI_GUEST_FEATURES:
302 /* Guest does not negotiate properly? We have to assume nothing. */
303 if (val & (1 << VIRTIO_F_BAD_FEATURE)) {
304 if (vdev->bad_features)
8172539d 305 val = proxy->host_features & vdev->bad_features(vdev);
53c25cea
PB
306 else
307 val = 0;
308 }
309 if (vdev->set_features)
310 vdev->set_features(vdev, val);
704a76fc 311 vdev->guest_features = val;
53c25cea
PB
312 break;
313 case VIRTIO_PCI_QUEUE_PFN:
c227f099 314 pa = (target_phys_addr_t)val << VIRTIO_PCI_QUEUE_ADDR_SHIFT;
1b8e9b27 315 if (pa == 0) {
25db9ebe 316 virtio_pci_stop_ioeventfd(proxy);
1b8e9b27
MT
317 virtio_reset(proxy->vdev);
318 msix_unuse_all_vectors(&proxy->pci_dev);
319 }
7055e687
MT
320 else
321 virtio_queue_set_addr(vdev, vdev->queue_sel, pa);
53c25cea
PB
322 break;
323 case VIRTIO_PCI_QUEUE_SEL:
324 if (val < VIRTIO_PCI_QUEUE_MAX)
325 vdev->queue_sel = val;
326 break;
327 case VIRTIO_PCI_QUEUE_NOTIFY:
7157e2e2
SH
328 if (val < VIRTIO_PCI_QUEUE_MAX) {
329 virtio_queue_notify(vdev, val);
330 }
53c25cea
PB
331 break;
332 case VIRTIO_PCI_STATUS:
25db9ebe
SH
333 if (!(val & VIRTIO_CONFIG_S_DRIVER_OK)) {
334 virtio_pci_stop_ioeventfd(proxy);
335 }
336
3e607cb5 337 virtio_set_status(vdev, val & 0xFF);
25db9ebe
SH
338
339 if (val & VIRTIO_CONFIG_S_DRIVER_OK) {
340 virtio_pci_start_ioeventfd(proxy);
341 }
342
1b8e9b27
MT
343 if (vdev->status == 0) {
344 virtio_reset(proxy->vdev);
345 msix_unuse_all_vectors(&proxy->pci_dev);
346 }
c81131db
AG
347
348 /* Linux before 2.6.34 sets the device as OK without enabling
349 the PCI device bus master bit. In this case we need to disable
350 some safety checks. */
351 if ((val & VIRTIO_CONFIG_S_DRIVER_OK) &&
352 !(proxy->pci_dev.config[PCI_COMMAND] & PCI_COMMAND_MASTER)) {
3dbca8e6 353 proxy->flags |= VIRTIO_PCI_FLAG_BUS_MASTER_BUG;
c81131db 354 }
53c25cea 355 break;
aba800a3
MT
356 case VIRTIO_MSI_CONFIG_VECTOR:
357 msix_vector_unuse(&proxy->pci_dev, vdev->config_vector);
358 /* Make it possible for guest to discover an error took place. */
359 if (msix_vector_use(&proxy->pci_dev, val) < 0)
360 val = VIRTIO_NO_VECTOR;
361 vdev->config_vector = val;
362 break;
363 case VIRTIO_MSI_QUEUE_VECTOR:
364 msix_vector_unuse(&proxy->pci_dev,
365 virtio_queue_vector(vdev, vdev->queue_sel));
366 /* Make it possible for guest to discover an error took place. */
367 if (msix_vector_use(&proxy->pci_dev, val) < 0)
368 val = VIRTIO_NO_VECTOR;
369 virtio_queue_set_vector(vdev, vdev->queue_sel, val);
370 break;
371 default:
4e02d460
SH
372 error_report("%s: unexpected address 0x%x value 0x%x",
373 __func__, addr, val);
aba800a3 374 break;
53c25cea
PB
375 }
376}
377
aba800a3 378static uint32_t virtio_ioport_read(VirtIOPCIProxy *proxy, uint32_t addr)
53c25cea 379{
53c25cea
PB
380 VirtIODevice *vdev = proxy->vdev;
381 uint32_t ret = 0xFFFFFFFF;
382
53c25cea
PB
383 switch (addr) {
384 case VIRTIO_PCI_HOST_FEATURES:
8172539d 385 ret = proxy->host_features;
53c25cea
PB
386 break;
387 case VIRTIO_PCI_GUEST_FEATURES:
704a76fc 388 ret = vdev->guest_features;
53c25cea
PB
389 break;
390 case VIRTIO_PCI_QUEUE_PFN:
391 ret = virtio_queue_get_addr(vdev, vdev->queue_sel)
392 >> VIRTIO_PCI_QUEUE_ADDR_SHIFT;
393 break;
394 case VIRTIO_PCI_QUEUE_NUM:
395 ret = virtio_queue_get_num(vdev, vdev->queue_sel);
396 break;
397 case VIRTIO_PCI_QUEUE_SEL:
398 ret = vdev->queue_sel;
399 break;
400 case VIRTIO_PCI_STATUS:
401 ret = vdev->status;
402 break;
403 case VIRTIO_PCI_ISR:
404 /* reading from the ISR also clears it. */
405 ret = vdev->isr;
406 vdev->isr = 0;
7055e687 407 qemu_set_irq(proxy->pci_dev.irq[0], 0);
53c25cea 408 break;
aba800a3
MT
409 case VIRTIO_MSI_CONFIG_VECTOR:
410 ret = vdev->config_vector;
411 break;
412 case VIRTIO_MSI_QUEUE_VECTOR:
413 ret = virtio_queue_vector(vdev, vdev->queue_sel);
414 break;
53c25cea
PB
415 default:
416 break;
417 }
418
419 return ret;
420}
421
422static uint32_t virtio_pci_config_readb(void *opaque, uint32_t addr)
423{
424 VirtIOPCIProxy *proxy = opaque;
aba800a3
MT
425 uint32_t config = VIRTIO_PCI_CONFIG(&proxy->pci_dev);
426 addr -= proxy->addr;
427 if (addr < config)
428 return virtio_ioport_read(proxy, addr);
429 addr -= config;
53c25cea
PB
430 return virtio_config_readb(proxy->vdev, addr);
431}
432
433static uint32_t virtio_pci_config_readw(void *opaque, uint32_t addr)
434{
435 VirtIOPCIProxy *proxy = opaque;
aba800a3
MT
436 uint32_t config = VIRTIO_PCI_CONFIG(&proxy->pci_dev);
437 addr -= proxy->addr;
438 if (addr < config)
439 return virtio_ioport_read(proxy, addr);
440 addr -= config;
53c25cea
PB
441 return virtio_config_readw(proxy->vdev, addr);
442}
443
444static uint32_t virtio_pci_config_readl(void *opaque, uint32_t addr)
445{
446 VirtIOPCIProxy *proxy = opaque;
aba800a3
MT
447 uint32_t config = VIRTIO_PCI_CONFIG(&proxy->pci_dev);
448 addr -= proxy->addr;
449 if (addr < config)
450 return virtio_ioport_read(proxy, addr);
451 addr -= config;
53c25cea
PB
452 return virtio_config_readl(proxy->vdev, addr);
453}
454
455static void virtio_pci_config_writeb(void *opaque, uint32_t addr, uint32_t val)
456{
457 VirtIOPCIProxy *proxy = opaque;
aba800a3
MT
458 uint32_t config = VIRTIO_PCI_CONFIG(&proxy->pci_dev);
459 addr -= proxy->addr;
460 if (addr < config) {
461 virtio_ioport_write(proxy, addr, val);
462 return;
463 }
464 addr -= config;
53c25cea
PB
465 virtio_config_writeb(proxy->vdev, addr, val);
466}
467
468static void virtio_pci_config_writew(void *opaque, uint32_t addr, uint32_t val)
469{
470 VirtIOPCIProxy *proxy = opaque;
aba800a3
MT
471 uint32_t config = VIRTIO_PCI_CONFIG(&proxy->pci_dev);
472 addr -= proxy->addr;
473 if (addr < config) {
474 virtio_ioport_write(proxy, addr, val);
475 return;
476 }
477 addr -= config;
53c25cea
PB
478 virtio_config_writew(proxy->vdev, addr, val);
479}
480
481static void virtio_pci_config_writel(void *opaque, uint32_t addr, uint32_t val)
482{
483 VirtIOPCIProxy *proxy = opaque;
aba800a3
MT
484 uint32_t config = VIRTIO_PCI_CONFIG(&proxy->pci_dev);
485 addr -= proxy->addr;
486 if (addr < config) {
487 virtio_ioport_write(proxy, addr, val);
488 return;
489 }
490 addr -= config;
53c25cea
PB
491 virtio_config_writel(proxy->vdev, addr, val);
492}
493
494static void virtio_map(PCIDevice *pci_dev, int region_num,
6e355d90 495 pcibus_t addr, pcibus_t size, int type)
53c25cea
PB
496{
497 VirtIOPCIProxy *proxy = container_of(pci_dev, VirtIOPCIProxy, pci_dev);
498 VirtIODevice *vdev = proxy->vdev;
aba800a3 499 unsigned config_len = VIRTIO_PCI_REGION_SIZE(pci_dev) + vdev->config_len;
53c25cea
PB
500
501 proxy->addr = addr;
53c25cea 502
aba800a3
MT
503 register_ioport_write(addr, config_len, 1, virtio_pci_config_writeb, proxy);
504 register_ioport_write(addr, config_len, 2, virtio_pci_config_writew, proxy);
505 register_ioport_write(addr, config_len, 4, virtio_pci_config_writel, proxy);
506 register_ioport_read(addr, config_len, 1, virtio_pci_config_readb, proxy);
507 register_ioport_read(addr, config_len, 2, virtio_pci_config_readw, proxy);
508 register_ioport_read(addr, config_len, 4, virtio_pci_config_readl, proxy);
53c25cea 509
aba800a3 510 if (vdev->config_len)
53c25cea 511 vdev->get_config(vdev, vdev->config);
aba800a3
MT
512}
513
514static void virtio_write_config(PCIDevice *pci_dev, uint32_t address,
515 uint32_t val, int len)
516{
ed757e14
YV
517 VirtIOPCIProxy *proxy = DO_UPCAST(VirtIOPCIProxy, pci_dev, pci_dev);
518
519 if (PCI_COMMAND == address) {
520 if (!(val & PCI_COMMAND_MASTER)) {
3dbca8e6 521 if (!(proxy->flags & VIRTIO_PCI_FLAG_BUS_MASTER_BUG)) {
25db9ebe 522 virtio_pci_stop_ioeventfd(proxy);
3e607cb5
MT
523 virtio_set_status(proxy->vdev,
524 proxy->vdev->status & ~VIRTIO_CONFIG_S_DRIVER_OK);
c81131db 525 }
ed757e14
YV
526 }
527 }
528
aba800a3 529 pci_default_write_config(pci_dev, address, val, len);
85352471 530 msix_write_config(pci_dev, address, val, len);
53c25cea
PB
531}
532
6d74ca5a
MT
533static unsigned virtio_pci_get_features(void *opaque)
534{
8172539d
MT
535 VirtIOPCIProxy *proxy = opaque;
536 return proxy->host_features;
6d74ca5a
MT
537}
538
ade80dc8
MT
539static void virtio_pci_guest_notifier_read(void *opaque)
540{
541 VirtQueue *vq = opaque;
542 EventNotifier *n = virtio_queue_get_guest_notifier(vq);
543 if (event_notifier_test_and_clear(n)) {
544 virtio_irq(vq);
545 }
546}
547
548static int virtio_pci_set_guest_notifier(void *opaque, int n, bool assign)
549{
550 VirtIOPCIProxy *proxy = opaque;
551 VirtQueue *vq = virtio_get_queue(proxy->vdev, n);
552 EventNotifier *notifier = virtio_queue_get_guest_notifier(vq);
553
554 if (assign) {
555 int r = event_notifier_init(notifier, 0);
556 if (r < 0) {
557 return r;
558 }
559 qemu_set_fd_handler(event_notifier_get_fd(notifier),
560 virtio_pci_guest_notifier_read, NULL, vq);
561 } else {
562 qemu_set_fd_handler(event_notifier_get_fd(notifier),
563 NULL, NULL, NULL);
564 event_notifier_cleanup(notifier);
565 }
566
567 return 0;
568}
569
5430a28f 570static bool virtio_pci_query_guest_notifiers(void *opaque)
571{
572 VirtIOPCIProxy *proxy = opaque;
573 return msix_enabled(&proxy->pci_dev);
574}
575
54dd9321
MT
576static int virtio_pci_set_guest_notifiers(void *opaque, bool assign)
577{
578 VirtIOPCIProxy *proxy = opaque;
579 VirtIODevice *vdev = proxy->vdev;
580 int r, n;
581
582 for (n = 0; n < VIRTIO_PCI_QUEUE_MAX; n++) {
583 if (!virtio_queue_get_num(vdev, n)) {
584 break;
585 }
586
587 r = virtio_pci_set_guest_notifier(opaque, n, assign);
588 if (r < 0) {
589 goto assign_error;
590 }
591 }
592
593 return 0;
594
595assign_error:
596 /* We get here on assignment failure. Recover by undoing for VQs 0 .. n. */
597 while (--n >= 0) {
598 virtio_pci_set_guest_notifier(opaque, n, !assign);
599 }
600 return r;
601}
602
ade80dc8
MT
603static int virtio_pci_set_host_notifier(void *opaque, int n, bool assign)
604{
605 VirtIOPCIProxy *proxy = opaque;
25db9ebe
SH
606
607 /* Stop using ioeventfd for virtqueue kick if the device starts using host
608 * notifiers. This makes it easy to avoid stepping on each others' toes.
609 */
610 proxy->ioeventfd_disabled = assign;
ade80dc8 611 if (assign) {
25db9ebe
SH
612 virtio_pci_stop_ioeventfd(proxy);
613 }
614 /* We don't need to start here: it's not needed because backend
615 * currently only stops on status change away from ok,
616 * reset, vmstop and such. If we do add code to start here,
617 * need to check vmstate, device state etc. */
618 return virtio_pci_set_host_notifier_internal(proxy, n, assign);
619}
620
621static void virtio_pci_vmstate_change(void *opaque, bool running)
622{
623 VirtIOPCIProxy *proxy = opaque;
624
625 if (running) {
89c473fd
MT
626 /* Try to find out if the guest has bus master disabled, but is
627 in ready state. Then we have a buggy guest OS. */
628 if ((proxy->vdev->status & VIRTIO_CONFIG_S_DRIVER_OK) &&
629 !(proxy->pci_dev.config[PCI_COMMAND] & PCI_COMMAND_MASTER)) {
630 proxy->flags |= VIRTIO_PCI_FLAG_BUS_MASTER_BUG;
631 }
25db9ebe 632 virtio_pci_start_ioeventfd(proxy);
ade80dc8 633 } else {
25db9ebe 634 virtio_pci_stop_ioeventfd(proxy);
ade80dc8 635 }
ade80dc8
MT
636}
637
53c25cea 638static const VirtIOBindings virtio_pci_bindings = {
ff24bd58
MT
639 .notify = virtio_pci_notify,
640 .save_config = virtio_pci_save_config,
641 .load_config = virtio_pci_load_config,
642 .save_queue = virtio_pci_save_queue,
643 .load_queue = virtio_pci_load_queue,
6d74ca5a 644 .get_features = virtio_pci_get_features,
5430a28f 645 .query_guest_notifiers = virtio_pci_query_guest_notifiers,
ade80dc8 646 .set_host_notifier = virtio_pci_set_host_notifier,
54dd9321 647 .set_guest_notifiers = virtio_pci_set_guest_notifiers,
25db9ebe 648 .vmstate_change = virtio_pci_vmstate_change,
53c25cea
PB
649};
650
befeac45 651void virtio_init_pci(VirtIOPCIProxy *proxy, VirtIODevice *vdev)
53c25cea
PB
652{
653 uint8_t *config;
654 uint32_t size;
655
656 proxy->vdev = vdev;
657
658 config = proxy->pci_dev.config;
53c25cea 659
e75ccf2c
IY
660 if (proxy->class_code) {
661 pci_config_set_class(config, proxy->class_code);
662 }
663 pci_set_word(config + 0x2c, pci_get_word(config + PCI_VENDOR_ID));
664 pci_set_word(config + 0x2e, vdev->device_id);
53c25cea
PB
665 config[0x3d] = 1;
666
5a1fc5e8 667 if (vdev->nvectors && !msix_init(&proxy->pci_dev, vdev->nvectors, 1, 0)) {
aba800a3
MT
668 pci_register_bar(&proxy->pci_dev, 1,
669 msix_bar_size(&proxy->pci_dev),
0392a017 670 PCI_BASE_ADDRESS_SPACE_MEMORY,
aba800a3 671 msix_mmio_map);
aba800a3
MT
672 } else
673 vdev->nvectors = 0;
674
ed757e14
YV
675 proxy->pci_dev.config_write = virtio_write_config;
676
aba800a3 677 size = VIRTIO_PCI_REGION_SIZE(&proxy->pci_dev) + vdev->config_len;
53c25cea
PB
678 if (size & (size-1))
679 size = 1 << qemu_fls(size);
680
0392a017 681 pci_register_bar(&proxy->pci_dev, 0, size, PCI_BASE_ADDRESS_SPACE_IO,
53c25cea
PB
682 virtio_map);
683
25db9ebe
SH
684 if (!kvm_has_many_ioeventfds()) {
685 proxy->flags &= ~VIRTIO_PCI_FLAG_USE_IOEVENTFD;
686 }
687
53c25cea 688 virtio_bind_device(vdev, &virtio_pci_bindings, proxy);
8172539d
MT
689 proxy->host_features |= 0x1 << VIRTIO_F_NOTIFY_ON_EMPTY;
690 proxy->host_features |= 0x1 << VIRTIO_F_BAD_FEATURE;
691 proxy->host_features = vdev->get_features(vdev, proxy->host_features);
53c25cea
PB
692}
693
81a322d4 694static int virtio_blk_init_pci(PCIDevice *pci_dev)
53c25cea
PB
695{
696 VirtIOPCIProxy *proxy = DO_UPCAST(VirtIOPCIProxy, pci_dev, pci_dev);
697 VirtIODevice *vdev;
698
ab73ff29
GH
699 if (proxy->class_code != PCI_CLASS_STORAGE_SCSI &&
700 proxy->class_code != PCI_CLASS_STORAGE_OTHER)
701 proxy->class_code = PCI_CLASS_STORAGE_SCSI;
53c25cea 702
a8686a9b
MA
703 vdev = virtio_blk_init(&pci_dev->qdev, &proxy->block,
704 &proxy->block_serial);
ac0c14d7
MA
705 if (!vdev) {
706 return -1;
707 }
177539e0 708 vdev->nvectors = proxy->nvectors;
e75ccf2c 709 virtio_init_pci(proxy, vdev);
177539e0
GH
710 /* make the actual value visible */
711 proxy->nvectors = vdev->nvectors;
81a322d4 712 return 0;
21d58b57
MM
713}
714
0f457d91
MT
715static int virtio_exit_pci(PCIDevice *pci_dev)
716{
717 return msix_uninit(pci_dev);
718}
719
56a14938
GH
720static int virtio_blk_exit_pci(PCIDevice *pci_dev)
721{
722 VirtIOPCIProxy *proxy = DO_UPCAST(VirtIOPCIProxy, pci_dev, pci_dev);
723
25db9ebe 724 virtio_pci_stop_ioeventfd(proxy);
9d0d3138 725 virtio_blk_exit(proxy->vdev);
f8b6cc00 726 blockdev_mark_auto_del(proxy->block.bs);
0f457d91 727 return virtio_exit_pci(pci_dev);
56a14938
GH
728}
729
98b19252 730static int virtio_serial_init_pci(PCIDevice *pci_dev)
21d58b57 731{
d6beee99 732 VirtIOPCIProxy *proxy = DO_UPCAST(VirtIOPCIProxy, pci_dev, pci_dev);
85c2c735
MM
733 VirtIODevice *vdev;
734
d6beee99
GH
735 if (proxy->class_code != PCI_CLASS_COMMUNICATION_OTHER &&
736 proxy->class_code != PCI_CLASS_DISPLAY_OTHER && /* qemu 0.10 */
737 proxy->class_code != PCI_CLASS_OTHERS) /* qemu-kvm */
738 proxy->class_code = PCI_CLASS_COMMUNICATION_OTHER;
739
6b331efb 740 vdev = virtio_serial_init(&pci_dev->qdev, &proxy->serial);
25fe3654
AS
741 if (!vdev) {
742 return -1;
743 }
573fb60c 744 vdev->nvectors = proxy->nvectors == DEV_NVECTORS_UNSPECIFIED
6b331efb 745 ? proxy->serial.max_virtserial_ports + 1
573fb60c 746 : proxy->nvectors;
e75ccf2c 747 virtio_init_pci(proxy, vdev);
a1829205 748 proxy->nvectors = vdev->nvectors;
81a322d4 749 return 0;
53c25cea
PB
750}
751
8b53a865
AS
752static int virtio_serial_exit_pci(PCIDevice *pci_dev)
753{
754 VirtIOPCIProxy *proxy = DO_UPCAST(VirtIOPCIProxy, pci_dev, pci_dev);
755
32059220 756 virtio_pci_stop_ioeventfd(proxy);
8b53a865
AS
757 virtio_serial_exit(proxy->vdev);
758 return virtio_exit_pci(pci_dev);
759}
760
81a322d4 761static int virtio_net_init_pci(PCIDevice *pci_dev)
53c25cea
PB
762{
763 VirtIOPCIProxy *proxy = DO_UPCAST(VirtIOPCIProxy, pci_dev, pci_dev);
764 VirtIODevice *vdev;
765
f0c07c7c 766 vdev = virtio_net_init(&pci_dev->qdev, &proxy->nic, &proxy->net);
a1e0fea5 767
97b15621 768 vdev->nvectors = proxy->nvectors;
e75ccf2c 769 virtio_init_pci(proxy, vdev);
a1e0fea5
GH
770
771 /* make the actual value visible */
772 proxy->nvectors = vdev->nvectors;
81a322d4 773 return 0;
53c25cea
PB
774}
775
97b15621
GH
776static int virtio_net_exit_pci(PCIDevice *pci_dev)
777{
778 VirtIOPCIProxy *proxy = DO_UPCAST(VirtIOPCIProxy, pci_dev, pci_dev);
779
25db9ebe 780 virtio_pci_stop_ioeventfd(proxy);
97b15621
GH
781 virtio_net_exit(proxy->vdev);
782 return virtio_exit_pci(pci_dev);
783}
784
81a322d4 785static int virtio_balloon_init_pci(PCIDevice *pci_dev)
53c25cea
PB
786{
787 VirtIOPCIProxy *proxy = DO_UPCAST(VirtIOPCIProxy, pci_dev, pci_dev);
788 VirtIODevice *vdev;
789
790 vdev = virtio_balloon_init(&pci_dev->qdev);
ab640dbf
AS
791 if (!vdev) {
792 return -1;
793 }
e75ccf2c 794 virtio_init_pci(proxy, vdev);
81a322d4 795 return 0;
53c25cea
PB
796}
797
7e10be8c
AS
798static int virtio_balloon_exit_pci(PCIDevice *pci_dev)
799{
800 VirtIOPCIProxy *proxy = DO_UPCAST(VirtIOPCIProxy, pci_dev, pci_dev);
801
802 virtio_pci_stop_ioeventfd(proxy);
803 virtio_balloon_exit(proxy->vdev);
804 return virtio_exit_pci(pci_dev);
805}
806
0aab0d3a
GH
807static PCIDeviceInfo virtio_info[] = {
808 {
809 .qdev.name = "virtio-blk-pci",
779206de 810 .qdev.alias = "virtio-blk",
0aab0d3a
GH
811 .qdev.size = sizeof(VirtIOPCIProxy),
812 .init = virtio_blk_init_pci,
56a14938 813 .exit = virtio_blk_exit_pci,
e75ccf2c
IY
814 .vendor_id = PCI_VENDOR_ID_REDHAT_QUMRANET,
815 .device_id = PCI_DEVICE_ID_VIRTIO_BLOCK,
816 .revision = VIRTIO_PCI_ABI_VERSION,
817 .class_id = PCI_CLASS_STORAGE_SCSI,
ab73ff29 818 .qdev.props = (Property[]) {
72c61d0b 819 DEFINE_PROP_HEX32("class", VirtIOPCIProxy, class_code, 0),
428c149b 820 DEFINE_BLOCK_PROPERTIES(VirtIOPCIProxy, block),
a8686a9b 821 DEFINE_PROP_STRING("serial", VirtIOPCIProxy, block_serial),
25db9ebe
SH
822 DEFINE_PROP_BIT("ioeventfd", VirtIOPCIProxy, flags,
823 VIRTIO_PCI_FLAG_USE_IOEVENTFD_BIT, true),
177539e0 824 DEFINE_PROP_UINT32("vectors", VirtIOPCIProxy, nvectors, 2),
8172539d 825 DEFINE_VIRTIO_BLK_FEATURES(VirtIOPCIProxy, host_features),
72c61d0b 826 DEFINE_PROP_END_OF_LIST(),
ab73ff29 827 },
e489030d 828 .qdev.reset = virtio_pci_reset,
0aab0d3a 829 },{
a1e0fea5 830 .qdev.name = "virtio-net-pci",
29f82b37 831 .qdev.alias = "virtio-net",
a1e0fea5
GH
832 .qdev.size = sizeof(VirtIOPCIProxy),
833 .init = virtio_net_init_pci,
97b15621 834 .exit = virtio_net_exit_pci,
5ee8ad71 835 .romfile = "pxe-virtio.rom",
e75ccf2c
IY
836 .vendor_id = PCI_VENDOR_ID_REDHAT_QUMRANET,
837 .device_id = PCI_DEVICE_ID_VIRTIO_NET,
838 .revision = VIRTIO_PCI_ABI_VERSION,
839 .class_id = PCI_CLASS_NETWORK_ETHERNET,
a1e0fea5 840 .qdev.props = (Property[]) {
25db9ebe
SH
841 DEFINE_PROP_BIT("ioeventfd", VirtIOPCIProxy, flags,
842 VIRTIO_PCI_FLAG_USE_IOEVENTFD_BIT, false),
97b15621 843 DEFINE_PROP_UINT32("vectors", VirtIOPCIProxy, nvectors, 3),
8172539d 844 DEFINE_VIRTIO_NET_FEATURES(VirtIOPCIProxy, host_features),
97b15621 845 DEFINE_NIC_PROPERTIES(VirtIOPCIProxy, nic),
f0c07c7c
AW
846 DEFINE_PROP_UINT32("x-txtimer", VirtIOPCIProxy,
847 net.txtimer, TX_TIMER_INTERVAL),
e3f30488
AW
848 DEFINE_PROP_INT32("x-txburst", VirtIOPCIProxy,
849 net.txburst, TX_BURST),
a697a334 850 DEFINE_PROP_STRING("tx", VirtIOPCIProxy, net.tx),
72c61d0b 851 DEFINE_PROP_END_OF_LIST(),
a1e0fea5 852 },
e489030d 853 .qdev.reset = virtio_pci_reset,
0aab0d3a 854 },{
98b19252
AS
855 .qdev.name = "virtio-serial-pci",
856 .qdev.alias = "virtio-serial",
0aab0d3a 857 .qdev.size = sizeof(VirtIOPCIProxy),
98b19252 858 .init = virtio_serial_init_pci,
8b53a865 859 .exit = virtio_serial_exit_pci,
e75ccf2c
IY
860 .vendor_id = PCI_VENDOR_ID_REDHAT_QUMRANET,
861 .device_id = PCI_DEVICE_ID_VIRTIO_CONSOLE,
862 .revision = VIRTIO_PCI_ABI_VERSION,
863 .class_id = PCI_CLASS_COMMUNICATION_OTHER,
d6beee99 864 .qdev.props = (Property[]) {
32059220
AS
865 DEFINE_PROP_BIT("ioeventfd", VirtIOPCIProxy, flags,
866 VIRTIO_PCI_FLAG_USE_IOEVENTFD_BIT, true),
573fb60c
AS
867 DEFINE_PROP_UINT32("vectors", VirtIOPCIProxy, nvectors,
868 DEV_NVECTORS_UNSPECIFIED),
72c61d0b 869 DEFINE_PROP_HEX32("class", VirtIOPCIProxy, class_code, 0),
8172539d 870 DEFINE_VIRTIO_COMMON_FEATURES(VirtIOPCIProxy, host_features),
6b331efb
AS
871 DEFINE_PROP_UINT32("max_ports", VirtIOPCIProxy,
872 serial.max_virtserial_ports, 31),
72c61d0b 873 DEFINE_PROP_END_OF_LIST(),
d6beee99 874 },
e489030d 875 .qdev.reset = virtio_pci_reset,
0aab0d3a
GH
876 },{
877 .qdev.name = "virtio-balloon-pci",
29f82b37 878 .qdev.alias = "virtio-balloon",
0aab0d3a
GH
879 .qdev.size = sizeof(VirtIOPCIProxy),
880 .init = virtio_balloon_init_pci,
7e10be8c 881 .exit = virtio_balloon_exit_pci,
e75ccf2c
IY
882 .vendor_id = PCI_VENDOR_ID_REDHAT_QUMRANET,
883 .device_id = PCI_DEVICE_ID_VIRTIO_BALLOON,
884 .revision = VIRTIO_PCI_ABI_VERSION,
885 .class_id = PCI_CLASS_MEMORY_RAM,
8172539d
MT
886 .qdev.props = (Property[]) {
887 DEFINE_VIRTIO_COMMON_FEATURES(VirtIOPCIProxy, host_features),
888 DEFINE_PROP_END_OF_LIST(),
889 },
e489030d 890 .qdev.reset = virtio_pci_reset,
0aab0d3a
GH
891 },{
892 /* end of list */
893 }
894};
895
53c25cea
PB
896static void virtio_pci_register_devices(void)
897{
0aab0d3a 898 pci_qdev_register_many(virtio_info);
53c25cea
PB
899}
900
901device_init(virtio_pci_register_devices)