]> git.proxmox.com Git - mirror_qemu.git/blame - hw/virtio-pci.c
ivshmem: convert to memory API
[mirror_qemu.git] / hw / virtio-pci.c
CommitLineData
53c25cea
PB
1/*
2 * Virtio PCI Bindings
3 *
4 * Copyright IBM, Corp. 2007
5 * Copyright (c) 2009 CodeSourcery
6 *
7 * Authors:
8 * Anthony Liguori <aliguori@us.ibm.com>
9 * Paul Brook <paul@codesourcery.com>
10 *
11 * This work is licensed under the terms of the GNU GPL, version 2. See
12 * the COPYING file in the top-level directory.
13 *
14 */
15
16#include <inttypes.h>
17
18#include "virtio.h"
8172539d
MT
19#include "virtio-blk.h"
20#include "virtio-net.h"
6b331efb 21#include "virtio-serial.h"
53c25cea 22#include "pci.h"
2f792016 23#include "qemu-error.h"
aba800a3 24#include "msix.h"
a1e0fea5 25#include "net.h"
97b15621 26#include "loader.h"
ade80dc8 27#include "kvm.h"
2446333c 28#include "blockdev.h"
9fe1ebeb 29#include "virtio-pci.h"
1129714f 30#include "range.h"
53c25cea
PB
31
/* Register layout below mirrors Linux's linux/virtio_pci.h */

/* Host feature bitmask: 32 bits, read-only */
#define VIRTIO_PCI_HOST_FEATURES        0

/* Guest-activated feature bitmask: 32 bits, read/write */
#define VIRTIO_PCI_GUEST_FEATURES       4

/* PFN of the currently selected queue: 32 bits, read/write */
#define VIRTIO_PCI_QUEUE_PFN            8

/* Size of the currently selected queue: 16 bits, read-only */
#define VIRTIO_PCI_QUEUE_NUM            12

/* Queue selector: 16 bits, read/write */
#define VIRTIO_PCI_QUEUE_SEL            14

/* Queue notifier: 16 bits, read/write */
#define VIRTIO_PCI_QUEUE_NOTIFY         16

/* Device status register: 8 bits */
#define VIRTIO_PCI_STATUS               18

/* Interrupt status register: 8 bits, read-only.  A read returns the current
 * ISR contents and clears them, so it doubles as read-and-acknowledge. */
#define VIRTIO_PCI_ISR                  19

/* MSI-X registers; these exist only while MSI-X is enabled. */
/* Vector used for configuration changes: 16 bits */
#define VIRTIO_MSI_CONFIG_VECTOR        20
/* Vector used for notifications of the selected queue: 16 bits */
#define VIRTIO_MSI_QUEUE_VECTOR         22

/* Size of the common register header, without and with the MSI-X registers */
#define VIRTIO_PCI_CONFIG_NOMSI         20
#define VIRTIO_PCI_CONFIG_MSI           24
/* Header size used for sizing the I/O region: keyed on MSI-X being present */
#define VIRTIO_PCI_REGION_SIZE(dev)     (msix_present(dev) ? \
                                         VIRTIO_PCI_CONFIG_MSI : \
                                         VIRTIO_PCI_CONFIG_NOMSI)

/* Offset at which the per-driver configuration space begins: keyed on
 * MSI-X being enabled (not merely present) */
#define VIRTIO_PCI_CONFIG(dev)          (msix_enabled(dev) ? \
                                         VIRTIO_PCI_CONFIG_MSI : \
                                         VIRTIO_PCI_CONFIG_NOMSI)

/* Shift applied to the value written to QUEUE_PFN to obtain the physical
 * queue address.  12 is historical and stems from the x86 page size. */
#define VIRTIO_PCI_QUEUE_ADDR_SHIFT     12

/* Per-device flags, e.g. workarounds for quirks in older guests. */
#define VIRTIO_PCI_FLAG_BUS_MASTER_BUG  (1 << 0)

/* For some devices performance improves when virtqueue kick processing is
 * decoupled from the vcpu thread by means of ioeventfd. */
#define VIRTIO_PCI_FLAG_USE_IOEVENTFD_BIT 1
#define VIRTIO_PCI_FLAG_USE_IOEVENTFD   (1 << VIRTIO_PCI_FLAG_USE_IOEVENTFD_BIT)

/* QEMU doesn't strictly need write barriers since everything runs in
 * lock-step.  The wmb() calls are kept anyway so the ordering points stay
 * obvious for KVM, or in case kqemu ever gets SMP support.
 */
#define wmb() do { } while (0)
96
53c25cea
PB
97/* virtio device */
98
7055e687 99static void virtio_pci_notify(void *opaque, uint16_t vector)
53c25cea
PB
100{
101 VirtIOPCIProxy *proxy = opaque;
aba800a3
MT
102 if (msix_enabled(&proxy->pci_dev))
103 msix_notify(&proxy->pci_dev, vector);
104 else
105 qemu_set_irq(proxy->pci_dev.irq[0], proxy->vdev->isr & 1);
53c25cea
PB
106}
107
ff24bd58
MT
108static void virtio_pci_save_config(void * opaque, QEMUFile *f)
109{
110 VirtIOPCIProxy *proxy = opaque;
111 pci_device_save(&proxy->pci_dev, f);
112 msix_save(&proxy->pci_dev, f);
113 if (msix_present(&proxy->pci_dev))
114 qemu_put_be16(f, proxy->vdev->config_vector);
115}
116
117static void virtio_pci_save_queue(void * opaque, int n, QEMUFile *f)
118{
119 VirtIOPCIProxy *proxy = opaque;
120 if (msix_present(&proxy->pci_dev))
121 qemu_put_be16(f, virtio_queue_vector(proxy->vdev, n));
122}
123
124static int virtio_pci_load_config(void * opaque, QEMUFile *f)
125{
126 VirtIOPCIProxy *proxy = opaque;
127 int ret;
128 ret = pci_device_load(&proxy->pci_dev, f);
e6da7680 129 if (ret) {
ff24bd58 130 return ret;
e6da7680 131 }
ff24bd58 132 msix_load(&proxy->pci_dev, f);
e6da7680 133 if (msix_present(&proxy->pci_dev)) {
ff24bd58 134 qemu_get_be16s(f, &proxy->vdev->config_vector);
e6da7680
MT
135 } else {
136 proxy->vdev->config_vector = VIRTIO_NO_VECTOR;
137 }
138 if (proxy->vdev->config_vector != VIRTIO_NO_VECTOR) {
139 return msix_vector_use(&proxy->pci_dev, proxy->vdev->config_vector);
140 }
ff24bd58
MT
141 return 0;
142}
143
144static int virtio_pci_load_queue(void * opaque, int n, QEMUFile *f)
145{
146 VirtIOPCIProxy *proxy = opaque;
147 uint16_t vector;
e6da7680
MT
148 if (msix_present(&proxy->pci_dev)) {
149 qemu_get_be16s(f, &vector);
150 } else {
151 vector = VIRTIO_NO_VECTOR;
152 }
ff24bd58 153 virtio_queue_set_vector(proxy->vdev, n, vector);
e6da7680
MT
154 if (vector != VIRTIO_NO_VECTOR) {
155 return msix_vector_use(&proxy->pci_dev, vector);
156 }
ff24bd58
MT
157 return 0;
158}
159
25db9ebe
SH
160static int virtio_pci_set_host_notifier_internal(VirtIOPCIProxy *proxy,
161 int n, bool assign)
162{
163 VirtQueue *vq = virtio_get_queue(proxy->vdev, n);
164 EventNotifier *notifier = virtio_queue_get_host_notifier(vq);
165 int r;
166 if (assign) {
167 r = event_notifier_init(notifier, 1);
168 if (r < 0) {
b36e3914
MT
169 error_report("%s: unable to init event notifier: %d",
170 __func__, r);
25db9ebe
SH
171 return r;
172 }
173 r = kvm_set_ioeventfd_pio_word(event_notifier_get_fd(notifier),
174 proxy->addr + VIRTIO_PCI_QUEUE_NOTIFY,
175 n, assign);
176 if (r < 0) {
b36e3914
MT
177 error_report("%s: unable to map ioeventfd: %d",
178 __func__, r);
25db9ebe
SH
179 event_notifier_cleanup(notifier);
180 }
181 } else {
182 r = kvm_set_ioeventfd_pio_word(event_notifier_get_fd(notifier),
183 proxy->addr + VIRTIO_PCI_QUEUE_NOTIFY,
184 n, assign);
185 if (r < 0) {
b36e3914
MT
186 error_report("%s: unable to unmap ioeventfd: %d",
187 __func__, r);
25db9ebe
SH
188 return r;
189 }
190
191 /* Handle the race condition where the guest kicked and we deassigned
192 * before we got around to handling the kick.
193 */
194 if (event_notifier_test_and_clear(notifier)) {
195 virtio_queue_notify_vq(vq);
196 }
197
198 event_notifier_cleanup(notifier);
199 }
200 return r;
201}
202
203static void virtio_pci_host_notifier_read(void *opaque)
204{
205 VirtQueue *vq = opaque;
206 EventNotifier *n = virtio_queue_get_host_notifier(vq);
207 if (event_notifier_test_and_clear(n)) {
208 virtio_queue_notify_vq(vq);
209 }
210}
211
212static void virtio_pci_set_host_notifier_fd_handler(VirtIOPCIProxy *proxy,
213 int n, bool assign)
214{
215 VirtQueue *vq = virtio_get_queue(proxy->vdev, n);
216 EventNotifier *notifier = virtio_queue_get_host_notifier(vq);
217 if (assign) {
218 qemu_set_fd_handler(event_notifier_get_fd(notifier),
219 virtio_pci_host_notifier_read, NULL, vq);
220 } else {
221 qemu_set_fd_handler(event_notifier_get_fd(notifier),
222 NULL, NULL, NULL);
223 }
224}
225
b36e3914 226static void virtio_pci_start_ioeventfd(VirtIOPCIProxy *proxy)
25db9ebe
SH
227{
228 int n, r;
229
230 if (!(proxy->flags & VIRTIO_PCI_FLAG_USE_IOEVENTFD) ||
231 proxy->ioeventfd_disabled ||
232 proxy->ioeventfd_started) {
b36e3914 233 return;
25db9ebe
SH
234 }
235
236 for (n = 0; n < VIRTIO_PCI_QUEUE_MAX; n++) {
237 if (!virtio_queue_get_num(proxy->vdev, n)) {
238 continue;
239 }
240
241 r = virtio_pci_set_host_notifier_internal(proxy, n, true);
242 if (r < 0) {
243 goto assign_error;
244 }
245
246 virtio_pci_set_host_notifier_fd_handler(proxy, n, true);
247 }
248 proxy->ioeventfd_started = true;
b36e3914 249 return;
25db9ebe
SH
250
251assign_error:
252 while (--n >= 0) {
253 if (!virtio_queue_get_num(proxy->vdev, n)) {
254 continue;
255 }
256
257 virtio_pci_set_host_notifier_fd_handler(proxy, n, false);
b36e3914
MT
258 r = virtio_pci_set_host_notifier_internal(proxy, n, false);
259 assert(r >= 0);
25db9ebe
SH
260 }
261 proxy->ioeventfd_started = false;
b36e3914 262 error_report("%s: failed. Fallback to a userspace (slower).", __func__);
25db9ebe
SH
263}
264
b36e3914 265static void virtio_pci_stop_ioeventfd(VirtIOPCIProxy *proxy)
25db9ebe 266{
b36e3914 267 int r;
25db9ebe
SH
268 int n;
269
270 if (!proxy->ioeventfd_started) {
b36e3914 271 return;
25db9ebe
SH
272 }
273
274 for (n = 0; n < VIRTIO_PCI_QUEUE_MAX; n++) {
275 if (!virtio_queue_get_num(proxy->vdev, n)) {
276 continue;
277 }
278
279 virtio_pci_set_host_notifier_fd_handler(proxy, n, false);
b36e3914
MT
280 r = virtio_pci_set_host_notifier_internal(proxy, n, false);
281 assert(r >= 0);
25db9ebe
SH
282 }
283 proxy->ioeventfd_started = false;
25db9ebe
SH
284}
285
e489030d 286static void virtio_pci_reset(DeviceState *d)
7055e687 287{
e489030d 288 VirtIOPCIProxy *proxy = container_of(d, VirtIOPCIProxy, pci_dev.qdev);
25db9ebe 289 virtio_pci_stop_ioeventfd(proxy);
7055e687 290 virtio_reset(proxy->vdev);
aba800a3 291 msix_reset(&proxy->pci_dev);
25db9ebe 292 proxy->flags &= ~VIRTIO_PCI_FLAG_BUS_MASTER_BUG;
7055e687
MT
293}
294
53c25cea
PB
295static void virtio_ioport_write(void *opaque, uint32_t addr, uint32_t val)
296{
297 VirtIOPCIProxy *proxy = opaque;
298 VirtIODevice *vdev = proxy->vdev;
c227f099 299 target_phys_addr_t pa;
53c25cea 300
53c25cea
PB
301 switch (addr) {
302 case VIRTIO_PCI_GUEST_FEATURES:
303 /* Guest does not negotiate properly? We have to assume nothing. */
304 if (val & (1 << VIRTIO_F_BAD_FEATURE)) {
305 if (vdev->bad_features)
8172539d 306 val = proxy->host_features & vdev->bad_features(vdev);
53c25cea
PB
307 else
308 val = 0;
309 }
310 if (vdev->set_features)
311 vdev->set_features(vdev, val);
704a76fc 312 vdev->guest_features = val;
53c25cea
PB
313 break;
314 case VIRTIO_PCI_QUEUE_PFN:
c227f099 315 pa = (target_phys_addr_t)val << VIRTIO_PCI_QUEUE_ADDR_SHIFT;
1b8e9b27 316 if (pa == 0) {
25db9ebe 317 virtio_pci_stop_ioeventfd(proxy);
1b8e9b27
MT
318 virtio_reset(proxy->vdev);
319 msix_unuse_all_vectors(&proxy->pci_dev);
320 }
7055e687
MT
321 else
322 virtio_queue_set_addr(vdev, vdev->queue_sel, pa);
53c25cea
PB
323 break;
324 case VIRTIO_PCI_QUEUE_SEL:
325 if (val < VIRTIO_PCI_QUEUE_MAX)
326 vdev->queue_sel = val;
327 break;
328 case VIRTIO_PCI_QUEUE_NOTIFY:
7157e2e2
SH
329 if (val < VIRTIO_PCI_QUEUE_MAX) {
330 virtio_queue_notify(vdev, val);
331 }
53c25cea
PB
332 break;
333 case VIRTIO_PCI_STATUS:
25db9ebe
SH
334 if (!(val & VIRTIO_CONFIG_S_DRIVER_OK)) {
335 virtio_pci_stop_ioeventfd(proxy);
336 }
337
3e607cb5 338 virtio_set_status(vdev, val & 0xFF);
25db9ebe
SH
339
340 if (val & VIRTIO_CONFIG_S_DRIVER_OK) {
341 virtio_pci_start_ioeventfd(proxy);
342 }
343
1b8e9b27
MT
344 if (vdev->status == 0) {
345 virtio_reset(proxy->vdev);
346 msix_unuse_all_vectors(&proxy->pci_dev);
347 }
c81131db
AG
348
349 /* Linux before 2.6.34 sets the device as OK without enabling
350 the PCI device bus master bit. In this case we need to disable
351 some safety checks. */
352 if ((val & VIRTIO_CONFIG_S_DRIVER_OK) &&
353 !(proxy->pci_dev.config[PCI_COMMAND] & PCI_COMMAND_MASTER)) {
3dbca8e6 354 proxy->flags |= VIRTIO_PCI_FLAG_BUS_MASTER_BUG;
c81131db 355 }
53c25cea 356 break;
aba800a3
MT
357 case VIRTIO_MSI_CONFIG_VECTOR:
358 msix_vector_unuse(&proxy->pci_dev, vdev->config_vector);
359 /* Make it possible for guest to discover an error took place. */
360 if (msix_vector_use(&proxy->pci_dev, val) < 0)
361 val = VIRTIO_NO_VECTOR;
362 vdev->config_vector = val;
363 break;
364 case VIRTIO_MSI_QUEUE_VECTOR:
365 msix_vector_unuse(&proxy->pci_dev,
366 virtio_queue_vector(vdev, vdev->queue_sel));
367 /* Make it possible for guest to discover an error took place. */
368 if (msix_vector_use(&proxy->pci_dev, val) < 0)
369 val = VIRTIO_NO_VECTOR;
370 virtio_queue_set_vector(vdev, vdev->queue_sel, val);
371 break;
372 default:
4e02d460
SH
373 error_report("%s: unexpected address 0x%x value 0x%x",
374 __func__, addr, val);
aba800a3 375 break;
53c25cea
PB
376 }
377}
378
aba800a3 379static uint32_t virtio_ioport_read(VirtIOPCIProxy *proxy, uint32_t addr)
53c25cea 380{
53c25cea
PB
381 VirtIODevice *vdev = proxy->vdev;
382 uint32_t ret = 0xFFFFFFFF;
383
53c25cea
PB
384 switch (addr) {
385 case VIRTIO_PCI_HOST_FEATURES:
8172539d 386 ret = proxy->host_features;
53c25cea
PB
387 break;
388 case VIRTIO_PCI_GUEST_FEATURES:
704a76fc 389 ret = vdev->guest_features;
53c25cea
PB
390 break;
391 case VIRTIO_PCI_QUEUE_PFN:
392 ret = virtio_queue_get_addr(vdev, vdev->queue_sel)
393 >> VIRTIO_PCI_QUEUE_ADDR_SHIFT;
394 break;
395 case VIRTIO_PCI_QUEUE_NUM:
396 ret = virtio_queue_get_num(vdev, vdev->queue_sel);
397 break;
398 case VIRTIO_PCI_QUEUE_SEL:
399 ret = vdev->queue_sel;
400 break;
401 case VIRTIO_PCI_STATUS:
402 ret = vdev->status;
403 break;
404 case VIRTIO_PCI_ISR:
405 /* reading from the ISR also clears it. */
406 ret = vdev->isr;
407 vdev->isr = 0;
7055e687 408 qemu_set_irq(proxy->pci_dev.irq[0], 0);
53c25cea 409 break;
aba800a3
MT
410 case VIRTIO_MSI_CONFIG_VECTOR:
411 ret = vdev->config_vector;
412 break;
413 case VIRTIO_MSI_QUEUE_VECTOR:
414 ret = virtio_queue_vector(vdev, vdev->queue_sel);
415 break;
53c25cea
PB
416 default:
417 break;
418 }
419
420 return ret;
421}
422
423static uint32_t virtio_pci_config_readb(void *opaque, uint32_t addr)
424{
425 VirtIOPCIProxy *proxy = opaque;
aba800a3
MT
426 uint32_t config = VIRTIO_PCI_CONFIG(&proxy->pci_dev);
427 addr -= proxy->addr;
428 if (addr < config)
429 return virtio_ioport_read(proxy, addr);
430 addr -= config;
53c25cea
PB
431 return virtio_config_readb(proxy->vdev, addr);
432}
433
434static uint32_t virtio_pci_config_readw(void *opaque, uint32_t addr)
435{
436 VirtIOPCIProxy *proxy = opaque;
aba800a3
MT
437 uint32_t config = VIRTIO_PCI_CONFIG(&proxy->pci_dev);
438 addr -= proxy->addr;
439 if (addr < config)
440 return virtio_ioport_read(proxy, addr);
441 addr -= config;
53c25cea
PB
442 return virtio_config_readw(proxy->vdev, addr);
443}
444
445static uint32_t virtio_pci_config_readl(void *opaque, uint32_t addr)
446{
447 VirtIOPCIProxy *proxy = opaque;
aba800a3
MT
448 uint32_t config = VIRTIO_PCI_CONFIG(&proxy->pci_dev);
449 addr -= proxy->addr;
450 if (addr < config)
451 return virtio_ioport_read(proxy, addr);
452 addr -= config;
53c25cea
PB
453 return virtio_config_readl(proxy->vdev, addr);
454}
455
456static void virtio_pci_config_writeb(void *opaque, uint32_t addr, uint32_t val)
457{
458 VirtIOPCIProxy *proxy = opaque;
aba800a3
MT
459 uint32_t config = VIRTIO_PCI_CONFIG(&proxy->pci_dev);
460 addr -= proxy->addr;
461 if (addr < config) {
462 virtio_ioport_write(proxy, addr, val);
463 return;
464 }
465 addr -= config;
53c25cea
PB
466 virtio_config_writeb(proxy->vdev, addr, val);
467}
468
469static void virtio_pci_config_writew(void *opaque, uint32_t addr, uint32_t val)
470{
471 VirtIOPCIProxy *proxy = opaque;
aba800a3
MT
472 uint32_t config = VIRTIO_PCI_CONFIG(&proxy->pci_dev);
473 addr -= proxy->addr;
474 if (addr < config) {
475 virtio_ioport_write(proxy, addr, val);
476 return;
477 }
478 addr -= config;
53c25cea
PB
479 virtio_config_writew(proxy->vdev, addr, val);
480}
481
482static void virtio_pci_config_writel(void *opaque, uint32_t addr, uint32_t val)
483{
484 VirtIOPCIProxy *proxy = opaque;
aba800a3
MT
485 uint32_t config = VIRTIO_PCI_CONFIG(&proxy->pci_dev);
486 addr -= proxy->addr;
487 if (addr < config) {
488 virtio_ioport_write(proxy, addr, val);
489 return;
490 }
491 addr -= config;
53c25cea
PB
492 virtio_config_writel(proxy->vdev, addr, val);
493}
494
495static void virtio_map(PCIDevice *pci_dev, int region_num,
6e355d90 496 pcibus_t addr, pcibus_t size, int type)
53c25cea
PB
497{
498 VirtIOPCIProxy *proxy = container_of(pci_dev, VirtIOPCIProxy, pci_dev);
499 VirtIODevice *vdev = proxy->vdev;
aba800a3 500 unsigned config_len = VIRTIO_PCI_REGION_SIZE(pci_dev) + vdev->config_len;
53c25cea
PB
501
502 proxy->addr = addr;
53c25cea 503
aba800a3
MT
504 register_ioport_write(addr, config_len, 1, virtio_pci_config_writeb, proxy);
505 register_ioport_write(addr, config_len, 2, virtio_pci_config_writew, proxy);
506 register_ioport_write(addr, config_len, 4, virtio_pci_config_writel, proxy);
507 register_ioport_read(addr, config_len, 1, virtio_pci_config_readb, proxy);
508 register_ioport_read(addr, config_len, 2, virtio_pci_config_readw, proxy);
509 register_ioport_read(addr, config_len, 4, virtio_pci_config_readl, proxy);
53c25cea 510
aba800a3 511 if (vdev->config_len)
53c25cea 512 vdev->get_config(vdev, vdev->config);
aba800a3
MT
513}
514
515static void virtio_write_config(PCIDevice *pci_dev, uint32_t address,
516 uint32_t val, int len)
517{
ed757e14
YV
518 VirtIOPCIProxy *proxy = DO_UPCAST(VirtIOPCIProxy, pci_dev, pci_dev);
519
1129714f
MT
520 pci_default_write_config(pci_dev, address, val, len);
521
522 if (range_covers_byte(address, len, PCI_COMMAND) &&
523 !(pci_dev->config[PCI_COMMAND] & PCI_COMMAND_MASTER) &&
524 !(proxy->flags & VIRTIO_PCI_FLAG_BUS_MASTER_BUG)) {
525 virtio_pci_stop_ioeventfd(proxy);
526 virtio_set_status(proxy->vdev,
527 proxy->vdev->status & ~VIRTIO_CONFIG_S_DRIVER_OK);
ed757e14
YV
528 }
529
85352471 530 msix_write_config(pci_dev, address, val, len);
53c25cea
PB
531}
532
6d74ca5a
MT
533static unsigned virtio_pci_get_features(void *opaque)
534{
8172539d
MT
535 VirtIOPCIProxy *proxy = opaque;
536 return proxy->host_features;
6d74ca5a
MT
537}
538
ade80dc8
MT
539static void virtio_pci_guest_notifier_read(void *opaque)
540{
541 VirtQueue *vq = opaque;
542 EventNotifier *n = virtio_queue_get_guest_notifier(vq);
543 if (event_notifier_test_and_clear(n)) {
544 virtio_irq(vq);
545 }
546}
547
548static int virtio_pci_set_guest_notifier(void *opaque, int n, bool assign)
549{
550 VirtIOPCIProxy *proxy = opaque;
551 VirtQueue *vq = virtio_get_queue(proxy->vdev, n);
552 EventNotifier *notifier = virtio_queue_get_guest_notifier(vq);
553
554 if (assign) {
555 int r = event_notifier_init(notifier, 0);
556 if (r < 0) {
557 return r;
558 }
559 qemu_set_fd_handler(event_notifier_get_fd(notifier),
560 virtio_pci_guest_notifier_read, NULL, vq);
561 } else {
562 qemu_set_fd_handler(event_notifier_get_fd(notifier),
563 NULL, NULL, NULL);
564 event_notifier_cleanup(notifier);
565 }
566
567 return 0;
568}
569
5430a28f
MT
570static bool virtio_pci_query_guest_notifiers(void *opaque)
571{
572 VirtIOPCIProxy *proxy = opaque;
573 return msix_enabled(&proxy->pci_dev);
574}
575
54dd9321
MT
576static int virtio_pci_set_guest_notifiers(void *opaque, bool assign)
577{
578 VirtIOPCIProxy *proxy = opaque;
579 VirtIODevice *vdev = proxy->vdev;
580 int r, n;
581
582 for (n = 0; n < VIRTIO_PCI_QUEUE_MAX; n++) {
583 if (!virtio_queue_get_num(vdev, n)) {
584 break;
585 }
586
587 r = virtio_pci_set_guest_notifier(opaque, n, assign);
588 if (r < 0) {
589 goto assign_error;
590 }
591 }
592
593 return 0;
594
595assign_error:
596 /* We get here on assignment failure. Recover by undoing for VQs 0 .. n. */
597 while (--n >= 0) {
598 virtio_pci_set_guest_notifier(opaque, n, !assign);
599 }
600 return r;
601}
602
ade80dc8
MT
603static int virtio_pci_set_host_notifier(void *opaque, int n, bool assign)
604{
605 VirtIOPCIProxy *proxy = opaque;
25db9ebe
SH
606
607 /* Stop using ioeventfd for virtqueue kick if the device starts using host
608 * notifiers. This makes it easy to avoid stepping on each others' toes.
609 */
610 proxy->ioeventfd_disabled = assign;
ade80dc8 611 if (assign) {
25db9ebe
SH
612 virtio_pci_stop_ioeventfd(proxy);
613 }
614 /* We don't need to start here: it's not needed because backend
615 * currently only stops on status change away from ok,
616 * reset, vmstop and such. If we do add code to start here,
617 * need to check vmstate, device state etc. */
618 return virtio_pci_set_host_notifier_internal(proxy, n, assign);
619}
620
621static void virtio_pci_vmstate_change(void *opaque, bool running)
622{
623 VirtIOPCIProxy *proxy = opaque;
624
625 if (running) {
89c473fd
MT
626 /* Try to find out if the guest has bus master disabled, but is
627 in ready state. Then we have a buggy guest OS. */
628 if ((proxy->vdev->status & VIRTIO_CONFIG_S_DRIVER_OK) &&
629 !(proxy->pci_dev.config[PCI_COMMAND] & PCI_COMMAND_MASTER)) {
630 proxy->flags |= VIRTIO_PCI_FLAG_BUS_MASTER_BUG;
631 }
25db9ebe 632 virtio_pci_start_ioeventfd(proxy);
ade80dc8 633 } else {
25db9ebe 634 virtio_pci_stop_ioeventfd(proxy);
ade80dc8 635 }
ade80dc8
MT
636}
637
53c25cea 638static const VirtIOBindings virtio_pci_bindings = {
ff24bd58
MT
639 .notify = virtio_pci_notify,
640 .save_config = virtio_pci_save_config,
641 .load_config = virtio_pci_load_config,
642 .save_queue = virtio_pci_save_queue,
643 .load_queue = virtio_pci_load_queue,
6d74ca5a 644 .get_features = virtio_pci_get_features,
5430a28f 645 .query_guest_notifiers = virtio_pci_query_guest_notifiers,
ade80dc8 646 .set_host_notifier = virtio_pci_set_host_notifier,
54dd9321 647 .set_guest_notifiers = virtio_pci_set_guest_notifiers,
25db9ebe 648 .vmstate_change = virtio_pci_vmstate_change,
53c25cea
PB
649};
650
befeac45 651void virtio_init_pci(VirtIOPCIProxy *proxy, VirtIODevice *vdev)
53c25cea
PB
652{
653 uint8_t *config;
654 uint32_t size;
655
656 proxy->vdev = vdev;
657
658 config = proxy->pci_dev.config;
53c25cea 659
e75ccf2c
IY
660 if (proxy->class_code) {
661 pci_config_set_class(config, proxy->class_code);
662 }
663 pci_set_word(config + 0x2c, pci_get_word(config + PCI_VENDOR_ID));
664 pci_set_word(config + 0x2e, vdev->device_id);
53c25cea
PB
665 config[0x3d] = 1;
666
5a1fc5e8 667 if (vdev->nvectors && !msix_init(&proxy->pci_dev, vdev->nvectors, 1, 0)) {
aba800a3
MT
668 pci_register_bar(&proxy->pci_dev, 1,
669 msix_bar_size(&proxy->pci_dev),
0392a017 670 PCI_BASE_ADDRESS_SPACE_MEMORY,
aba800a3 671 msix_mmio_map);
aba800a3
MT
672 } else
673 vdev->nvectors = 0;
674
ed757e14
YV
675 proxy->pci_dev.config_write = virtio_write_config;
676
aba800a3 677 size = VIRTIO_PCI_REGION_SIZE(&proxy->pci_dev) + vdev->config_len;
53c25cea
PB
678 if (size & (size-1))
679 size = 1 << qemu_fls(size);
680
0392a017 681 pci_register_bar(&proxy->pci_dev, 0, size, PCI_BASE_ADDRESS_SPACE_IO,
53c25cea
PB
682 virtio_map);
683
25db9ebe
SH
684 if (!kvm_has_many_ioeventfds()) {
685 proxy->flags &= ~VIRTIO_PCI_FLAG_USE_IOEVENTFD;
686 }
687
53c25cea 688 virtio_bind_device(vdev, &virtio_pci_bindings, proxy);
8172539d
MT
689 proxy->host_features |= 0x1 << VIRTIO_F_NOTIFY_ON_EMPTY;
690 proxy->host_features |= 0x1 << VIRTIO_F_BAD_FEATURE;
691 proxy->host_features = vdev->get_features(vdev, proxy->host_features);
53c25cea
PB
692}
693
81a322d4 694static int virtio_blk_init_pci(PCIDevice *pci_dev)
53c25cea
PB
695{
696 VirtIOPCIProxy *proxy = DO_UPCAST(VirtIOPCIProxy, pci_dev, pci_dev);
697 VirtIODevice *vdev;
698
ab73ff29
GH
699 if (proxy->class_code != PCI_CLASS_STORAGE_SCSI &&
700 proxy->class_code != PCI_CLASS_STORAGE_OTHER)
701 proxy->class_code = PCI_CLASS_STORAGE_SCSI;
53c25cea 702
a8686a9b
MA
703 vdev = virtio_blk_init(&pci_dev->qdev, &proxy->block,
704 &proxy->block_serial);
ac0c14d7
MA
705 if (!vdev) {
706 return -1;
707 }
177539e0 708 vdev->nvectors = proxy->nvectors;
e75ccf2c 709 virtio_init_pci(proxy, vdev);
177539e0
GH
710 /* make the actual value visible */
711 proxy->nvectors = vdev->nvectors;
81a322d4 712 return 0;
21d58b57
MM
713}
714
0f457d91
MT
715static int virtio_exit_pci(PCIDevice *pci_dev)
716{
717 return msix_uninit(pci_dev);
718}
719
56a14938
GH
720static int virtio_blk_exit_pci(PCIDevice *pci_dev)
721{
722 VirtIOPCIProxy *proxy = DO_UPCAST(VirtIOPCIProxy, pci_dev, pci_dev);
723
25db9ebe 724 virtio_pci_stop_ioeventfd(proxy);
9d0d3138 725 virtio_blk_exit(proxy->vdev);
f8b6cc00 726 blockdev_mark_auto_del(proxy->block.bs);
0f457d91 727 return virtio_exit_pci(pci_dev);
56a14938
GH
728}
729
98b19252 730static int virtio_serial_init_pci(PCIDevice *pci_dev)
21d58b57 731{
d6beee99 732 VirtIOPCIProxy *proxy = DO_UPCAST(VirtIOPCIProxy, pci_dev, pci_dev);
85c2c735
MM
733 VirtIODevice *vdev;
734
d6beee99
GH
735 if (proxy->class_code != PCI_CLASS_COMMUNICATION_OTHER &&
736 proxy->class_code != PCI_CLASS_DISPLAY_OTHER && /* qemu 0.10 */
737 proxy->class_code != PCI_CLASS_OTHERS) /* qemu-kvm */
738 proxy->class_code = PCI_CLASS_COMMUNICATION_OTHER;
739
6b331efb 740 vdev = virtio_serial_init(&pci_dev->qdev, &proxy->serial);
25fe3654
AS
741 if (!vdev) {
742 return -1;
743 }
573fb60c 744 vdev->nvectors = proxy->nvectors == DEV_NVECTORS_UNSPECIFIED
6b331efb 745 ? proxy->serial.max_virtserial_ports + 1
573fb60c 746 : proxy->nvectors;
e75ccf2c 747 virtio_init_pci(proxy, vdev);
a1829205 748 proxy->nvectors = vdev->nvectors;
81a322d4 749 return 0;
53c25cea
PB
750}
751
8b53a865
AS
752static int virtio_serial_exit_pci(PCIDevice *pci_dev)
753{
754 VirtIOPCIProxy *proxy = DO_UPCAST(VirtIOPCIProxy, pci_dev, pci_dev);
755
32059220 756 virtio_pci_stop_ioeventfd(proxy);
8b53a865
AS
757 virtio_serial_exit(proxy->vdev);
758 return virtio_exit_pci(pci_dev);
759}
760
81a322d4 761static int virtio_net_init_pci(PCIDevice *pci_dev)
53c25cea
PB
762{
763 VirtIOPCIProxy *proxy = DO_UPCAST(VirtIOPCIProxy, pci_dev, pci_dev);
764 VirtIODevice *vdev;
765
f0c07c7c 766 vdev = virtio_net_init(&pci_dev->qdev, &proxy->nic, &proxy->net);
a1e0fea5 767
97b15621 768 vdev->nvectors = proxy->nvectors;
e75ccf2c 769 virtio_init_pci(proxy, vdev);
a1e0fea5
GH
770
771 /* make the actual value visible */
772 proxy->nvectors = vdev->nvectors;
81a322d4 773 return 0;
53c25cea
PB
774}
775
97b15621
GH
776static int virtio_net_exit_pci(PCIDevice *pci_dev)
777{
778 VirtIOPCIProxy *proxy = DO_UPCAST(VirtIOPCIProxy, pci_dev, pci_dev);
779
25db9ebe 780 virtio_pci_stop_ioeventfd(proxy);
97b15621
GH
781 virtio_net_exit(proxy->vdev);
782 return virtio_exit_pci(pci_dev);
783}
784
81a322d4 785static int virtio_balloon_init_pci(PCIDevice *pci_dev)
53c25cea
PB
786{
787 VirtIOPCIProxy *proxy = DO_UPCAST(VirtIOPCIProxy, pci_dev, pci_dev);
788 VirtIODevice *vdev;
789
790 vdev = virtio_balloon_init(&pci_dev->qdev);
f76f6655
AS
791 if (!vdev) {
792 return -1;
793 }
e75ccf2c 794 virtio_init_pci(proxy, vdev);
81a322d4 795 return 0;
53c25cea
PB
796}
797
855d7e25
AS
798static int virtio_balloon_exit_pci(PCIDevice *pci_dev)
799{
800 VirtIOPCIProxy *proxy = DO_UPCAST(VirtIOPCIProxy, pci_dev, pci_dev);
801
802 virtio_pci_stop_ioeventfd(proxy);
803 virtio_balloon_exit(proxy->vdev);
804 return virtio_exit_pci(pci_dev);
805}
806
0aab0d3a
GH
807static PCIDeviceInfo virtio_info[] = {
808 {
809 .qdev.name = "virtio-blk-pci",
779206de 810 .qdev.alias = "virtio-blk",
0aab0d3a
GH
811 .qdev.size = sizeof(VirtIOPCIProxy),
812 .init = virtio_blk_init_pci,
56a14938 813 .exit = virtio_blk_exit_pci,
e75ccf2c
IY
814 .vendor_id = PCI_VENDOR_ID_REDHAT_QUMRANET,
815 .device_id = PCI_DEVICE_ID_VIRTIO_BLOCK,
816 .revision = VIRTIO_PCI_ABI_VERSION,
817 .class_id = PCI_CLASS_STORAGE_SCSI,
ab73ff29 818 .qdev.props = (Property[]) {
72c61d0b 819 DEFINE_PROP_HEX32("class", VirtIOPCIProxy, class_code, 0),
428c149b 820 DEFINE_BLOCK_PROPERTIES(VirtIOPCIProxy, block),
a8686a9b 821 DEFINE_PROP_STRING("serial", VirtIOPCIProxy, block_serial),
25db9ebe
SH
822 DEFINE_PROP_BIT("ioeventfd", VirtIOPCIProxy, flags,
823 VIRTIO_PCI_FLAG_USE_IOEVENTFD_BIT, true),
177539e0 824 DEFINE_PROP_UINT32("vectors", VirtIOPCIProxy, nvectors, 2),
8172539d 825 DEFINE_VIRTIO_BLK_FEATURES(VirtIOPCIProxy, host_features),
72c61d0b 826 DEFINE_PROP_END_OF_LIST(),
ab73ff29 827 },
e489030d 828 .qdev.reset = virtio_pci_reset,
0aab0d3a 829 },{
a1e0fea5 830 .qdev.name = "virtio-net-pci",
29f82b37 831 .qdev.alias = "virtio-net",
a1e0fea5
GH
832 .qdev.size = sizeof(VirtIOPCIProxy),
833 .init = virtio_net_init_pci,
97b15621 834 .exit = virtio_net_exit_pci,
5ee8ad71 835 .romfile = "pxe-virtio.rom",
e75ccf2c
IY
836 .vendor_id = PCI_VENDOR_ID_REDHAT_QUMRANET,
837 .device_id = PCI_DEVICE_ID_VIRTIO_NET,
838 .revision = VIRTIO_PCI_ABI_VERSION,
839 .class_id = PCI_CLASS_NETWORK_ETHERNET,
a1e0fea5 840 .qdev.props = (Property[]) {
25db9ebe
SH
841 DEFINE_PROP_BIT("ioeventfd", VirtIOPCIProxy, flags,
842 VIRTIO_PCI_FLAG_USE_IOEVENTFD_BIT, false),
97b15621 843 DEFINE_PROP_UINT32("vectors", VirtIOPCIProxy, nvectors, 3),
8172539d 844 DEFINE_VIRTIO_NET_FEATURES(VirtIOPCIProxy, host_features),
97b15621 845 DEFINE_NIC_PROPERTIES(VirtIOPCIProxy, nic),
f0c07c7c
AW
846 DEFINE_PROP_UINT32("x-txtimer", VirtIOPCIProxy,
847 net.txtimer, TX_TIMER_INTERVAL),
e3f30488
AW
848 DEFINE_PROP_INT32("x-txburst", VirtIOPCIProxy,
849 net.txburst, TX_BURST),
a697a334 850 DEFINE_PROP_STRING("tx", VirtIOPCIProxy, net.tx),
72c61d0b 851 DEFINE_PROP_END_OF_LIST(),
a1e0fea5 852 },
e489030d 853 .qdev.reset = virtio_pci_reset,
0aab0d3a 854 },{
98b19252
AS
855 .qdev.name = "virtio-serial-pci",
856 .qdev.alias = "virtio-serial",
0aab0d3a 857 .qdev.size = sizeof(VirtIOPCIProxy),
98b19252 858 .init = virtio_serial_init_pci,
8b53a865 859 .exit = virtio_serial_exit_pci,
e75ccf2c
IY
860 .vendor_id = PCI_VENDOR_ID_REDHAT_QUMRANET,
861 .device_id = PCI_DEVICE_ID_VIRTIO_CONSOLE,
862 .revision = VIRTIO_PCI_ABI_VERSION,
863 .class_id = PCI_CLASS_COMMUNICATION_OTHER,
d6beee99 864 .qdev.props = (Property[]) {
32059220
AS
865 DEFINE_PROP_BIT("ioeventfd", VirtIOPCIProxy, flags,
866 VIRTIO_PCI_FLAG_USE_IOEVENTFD_BIT, true),
573fb60c
AS
867 DEFINE_PROP_UINT32("vectors", VirtIOPCIProxy, nvectors,
868 DEV_NVECTORS_UNSPECIFIED),
72c61d0b 869 DEFINE_PROP_HEX32("class", VirtIOPCIProxy, class_code, 0),
8172539d 870 DEFINE_VIRTIO_COMMON_FEATURES(VirtIOPCIProxy, host_features),
6b331efb
AS
871 DEFINE_PROP_UINT32("max_ports", VirtIOPCIProxy,
872 serial.max_virtserial_ports, 31),
72c61d0b 873 DEFINE_PROP_END_OF_LIST(),
d6beee99 874 },
e489030d 875 .qdev.reset = virtio_pci_reset,
0aab0d3a
GH
876 },{
877 .qdev.name = "virtio-balloon-pci",
29f82b37 878 .qdev.alias = "virtio-balloon",
0aab0d3a
GH
879 .qdev.size = sizeof(VirtIOPCIProxy),
880 .init = virtio_balloon_init_pci,
855d7e25 881 .exit = virtio_balloon_exit_pci,
e75ccf2c
IY
882 .vendor_id = PCI_VENDOR_ID_REDHAT_QUMRANET,
883 .device_id = PCI_DEVICE_ID_VIRTIO_BALLOON,
884 .revision = VIRTIO_PCI_ABI_VERSION,
885 .class_id = PCI_CLASS_MEMORY_RAM,
8172539d
MT
886 .qdev.props = (Property[]) {
887 DEFINE_VIRTIO_COMMON_FEATURES(VirtIOPCIProxy, host_features),
888 DEFINE_PROP_END_OF_LIST(),
889 },
e489030d 890 .qdev.reset = virtio_pci_reset,
0aab0d3a
GH
891 },{
892 /* end of list */
893 }
894};
895
53c25cea
PB
896static void virtio_pci_register_devices(void)
897{
0aab0d3a 898 pci_qdev_register_many(virtio_info);
53c25cea
PB
899}
900
901device_init(virtio_pci_register_devices)