]> git.proxmox.com Git - mirror_qemu.git/blame - softmmu/dma-helpers.c
block/export: Conditionally ignore set-context error
[mirror_qemu.git] / softmmu / dma-helpers.c
CommitLineData
244ab90e
AL
1/*
2 * DMA helper functions
3 *
bb755f52 4 * Copyright (c) 2009,2020 Red Hat
244ab90e
AL
5 *
6 * This work is licensed under the terms of the GNU General Public License
7 * (GNU GPL), version 2 or later.
8 */
9
d38ea87a 10#include "qemu/osdep.h"
4be74634 11#include "sysemu/block-backend.h"
9c17d615 12#include "sysemu/dma.h"
243af022 13#include "trace/trace-root.h"
1de7afc9 14#include "qemu/thread.h"
6a1751b7 15#include "qemu/main-loop.h"
740b1759 16#include "sysemu/cpu-timers.h"
5fb0a6b5 17#include "qemu/range.h"
244ab90e 18
e5332e63
DG
19/* #define DEBUG_IOMMU */
20
bb755f52
PMD
21MemTxResult dma_memory_set(AddressSpace *as, dma_addr_t addr,
22 uint8_t c, dma_addr_t len)
d86a77f8 23{
df32fd1c 24 dma_barrier(as, DMA_DIRECTION_FROM_DEVICE);
24addbc7 25
d86a77f8
DG
26#define FILLBUF_SIZE 512
27 uint8_t fillbuf[FILLBUF_SIZE];
28 int l;
bb755f52 29 MemTxResult error = MEMTX_OK;
d86a77f8
DG
30
31 memset(fillbuf, c, FILLBUF_SIZE);
32 while (len > 0) {
33 l = len < FILLBUF_SIZE ? len : FILLBUF_SIZE;
19f70347
PM
34 error |= address_space_write(as, addr, MEMTXATTRS_UNSPECIFIED,
35 fillbuf, l);
bc9b78de
BH
36 len -= l;
37 addr += l;
d86a77f8 38 }
e5332e63 39
24addbc7 40 return error;
d86a77f8
DG
41}
42
f487b677
PB
43void qemu_sglist_init(QEMUSGList *qsg, DeviceState *dev, int alloc_hint,
44 AddressSpace *as)
244ab90e 45{
7267c094 46 qsg->sg = g_malloc(alloc_hint * sizeof(ScatterGatherEntry));
244ab90e
AL
47 qsg->nsg = 0;
48 qsg->nalloc = alloc_hint;
49 qsg->size = 0;
df32fd1c 50 qsg->as = as;
f487b677
PB
51 qsg->dev = dev;
52 object_ref(OBJECT(dev));
244ab90e
AL
53}
54
d3231181 55void qemu_sglist_add(QEMUSGList *qsg, dma_addr_t base, dma_addr_t len)
244ab90e
AL
56{
57 if (qsg->nsg == qsg->nalloc) {
58 qsg->nalloc = 2 * qsg->nalloc + 1;
7267c094 59 qsg->sg = g_realloc(qsg->sg, qsg->nalloc * sizeof(ScatterGatherEntry));
244ab90e
AL
60 }
61 qsg->sg[qsg->nsg].base = base;
62 qsg->sg[qsg->nsg].len = len;
63 qsg->size += len;
64 ++qsg->nsg;
65}
66
67void qemu_sglist_destroy(QEMUSGList *qsg)
68{
f487b677 69 object_unref(OBJECT(qsg->dev));
7267c094 70 g_free(qsg->sg);
ea8d82a1 71 memset(qsg, 0, sizeof(*qsg));
244ab90e
AL
72}
73
59a703eb 74typedef struct {
7c84b1b8 75 BlockAIOCB common;
8a8e63eb 76 AioContext *ctx;
7c84b1b8 77 BlockAIOCB *acb;
59a703eb 78 QEMUSGList *sg;
99868af3 79 uint32_t align;
d4f510eb 80 uint64_t offset;
43cf8ae6 81 DMADirection dir;
59a703eb 82 int sg_cur_index;
d3231181 83 dma_addr_t sg_cur_byte;
59a703eb
AL
84 QEMUIOVector iov;
85 QEMUBH *bh;
cb144ccb 86 DMAIOFunc *io_func;
8a8e63eb 87 void *io_func_opaque;
37b7842c 88} DMAAIOCB;
59a703eb 89
4be74634 90static void dma_blk_cb(void *opaque, int ret);
59a703eb
AL
91
92static void reschedule_dma(void *opaque)
93{
37b7842c 94 DMAAIOCB *dbs = (DMAAIOCB *)opaque;
59a703eb 95
539343c0 96 assert(!dbs->acb && dbs->bh);
59a703eb
AL
97 qemu_bh_delete(dbs->bh);
98 dbs->bh = NULL;
4be74634 99 dma_blk_cb(dbs, 0);
59a703eb
AL
100}
101
4be74634 102static void dma_blk_unmap(DMAAIOCB *dbs)
59a703eb 103{
59a703eb
AL
104 int i;
105
59a703eb 106 for (i = 0; i < dbs->iov.niov; ++i) {
df32fd1c 107 dma_memory_unmap(dbs->sg->as, dbs->iov.iov[i].iov_base,
c65bcef3
DG
108 dbs->iov.iov[i].iov_len, dbs->dir,
109 dbs->iov.iov[i].iov_len);
59a703eb 110 }
c3adb5b9
PB
111 qemu_iovec_reset(&dbs->iov);
112}
113
114static void dma_complete(DMAAIOCB *dbs, int ret)
115{
c57c4658
KW
116 trace_dma_complete(dbs, ret, dbs->common.cb);
117
539343c0 118 assert(!dbs->acb && !dbs->bh);
4be74634 119 dma_blk_unmap(dbs);
c3adb5b9
PB
120 if (dbs->common.cb) {
121 dbs->common.cb(dbs->common.opaque, ret);
122 }
123 qemu_iovec_destroy(&dbs->iov);
8007429a 124 qemu_aio_unref(dbs);
7403b14e
AL
125}
126
4be74634 127static void dma_blk_cb(void *opaque, int ret)
7403b14e
AL
128{
129 DMAAIOCB *dbs = (DMAAIOCB *)opaque;
c65bcef3 130 dma_addr_t cur_addr, cur_len;
7403b14e
AL
131 void *mem;
132
4be74634 133 trace_dma_blk_cb(dbs, ret);
c57c4658 134
7403b14e 135 dbs->acb = NULL;
d4f510eb 136 dbs->offset += dbs->iov.size;
59a703eb
AL
137
138 if (dbs->sg_cur_index == dbs->sg->nsg || ret < 0) {
c3adb5b9 139 dma_complete(dbs, ret);
59a703eb
AL
140 return;
141 }
4be74634 142 dma_blk_unmap(dbs);
59a703eb
AL
143
144 while (dbs->sg_cur_index < dbs->sg->nsg) {
145 cur_addr = dbs->sg->sg[dbs->sg_cur_index].base + dbs->sg_cur_byte;
146 cur_len = dbs->sg->sg[dbs->sg_cur_index].len - dbs->sg_cur_byte;
df32fd1c 147 mem = dma_memory_map(dbs->sg->as, cur_addr, &cur_len, dbs->dir);
5fb0a6b5
PD
148 /*
149 * Make reads deterministic in icount mode. Windows sometimes issues
150 * disk read requests with overlapping SGs. It leads
151 * to non-determinism, because resulting buffer contents may be mixed
152 * from several sectors. This code splits all SGs into several
153 * groups. SGs in every group do not overlap.
154 */
740b1759 155 if (mem && icount_enabled() && dbs->dir == DMA_DIRECTION_FROM_DEVICE) {
5fb0a6b5
PD
156 int i;
157 for (i = 0 ; i < dbs->iov.niov ; ++i) {
158 if (ranges_overlap((intptr_t)dbs->iov.iov[i].iov_base,
159 dbs->iov.iov[i].iov_len, (intptr_t)mem,
160 cur_len)) {
161 dma_memory_unmap(dbs->sg->as, mem, cur_len,
162 dbs->dir, cur_len);
163 mem = NULL;
164 break;
165 }
166 }
167 }
59a703eb
AL
168 if (!mem)
169 break;
170 qemu_iovec_add(&dbs->iov, mem, cur_len);
171 dbs->sg_cur_byte += cur_len;
172 if (dbs->sg_cur_byte == dbs->sg->sg[dbs->sg_cur_index].len) {
173 dbs->sg_cur_byte = 0;
174 ++dbs->sg_cur_index;
175 }
176 }
177
178 if (dbs->iov.size == 0) {
c57c4658 179 trace_dma_map_wait(dbs);
8a8e63eb 180 dbs->bh = aio_bh_new(dbs->ctx, reschedule_dma, dbs);
e95205e1 181 cpu_register_map_client(dbs->bh);
59a703eb
AL
182 return;
183 }
184
99868af3
MCA
185 if (!QEMU_IS_ALIGNED(dbs->iov.size, dbs->align)) {
186 qemu_iovec_discard_back(&dbs->iov,
187 QEMU_ALIGN_DOWN(dbs->iov.size, dbs->align));
58f423fb
KW
188 }
189
1919631e 190 aio_context_acquire(dbs->ctx);
8a8e63eb
PB
191 dbs->acb = dbs->io_func(dbs->offset, &dbs->iov,
192 dma_blk_cb, dbs, dbs->io_func_opaque);
1919631e 193 aio_context_release(dbs->ctx);
6bee44ea 194 assert(dbs->acb);
59a703eb
AL
195}
196
7c84b1b8 197static void dma_aio_cancel(BlockAIOCB *acb)
c16b5a2c
CH
198{
199 DMAAIOCB *dbs = container_of(acb, DMAAIOCB, common);
200
c57c4658
KW
201 trace_dma_aio_cancel(dbs);
202
539343c0 203 assert(!(dbs->acb && dbs->bh));
c16b5a2c 204 if (dbs->acb) {
539343c0 205 /* This will invoke dma_blk_cb. */
4be74634 206 blk_aio_cancel_async(dbs->acb);
539343c0 207 return;
c16b5a2c 208 }
539343c0 209
e95205e1
FZ
210 if (dbs->bh) {
211 cpu_unregister_map_client(dbs->bh);
212 qemu_bh_delete(dbs->bh);
213 dbs->bh = NULL;
214 }
539343c0
PB
215 if (dbs->common.cb) {
216 dbs->common.cb(dbs->common.opaque, -ECANCELED);
217 }
c16b5a2c
CH
218}
219
5fa78b2a
SH
220static AioContext *dma_get_aio_context(BlockAIOCB *acb)
221{
222 DMAAIOCB *dbs = container_of(acb, DMAAIOCB, common);
223
224 return dbs->ctx;
225}
9bb9da46 226
d7331bed 227static const AIOCBInfo dma_aiocb_info = {
c16b5a2c 228 .aiocb_size = sizeof(DMAAIOCB),
9bb9da46 229 .cancel_async = dma_aio_cancel,
5fa78b2a 230 .get_aio_context = dma_get_aio_context,
c16b5a2c
CH
231};
232
8a8e63eb 233BlockAIOCB *dma_blk_io(AioContext *ctx,
99868af3 234 QEMUSGList *sg, uint64_t offset, uint32_t align,
8a8e63eb
PB
235 DMAIOFunc *io_func, void *io_func_opaque,
236 BlockCompletionFunc *cb,
43cf8ae6 237 void *opaque, DMADirection dir)
59a703eb 238{
8a8e63eb 239 DMAAIOCB *dbs = qemu_aio_get(&dma_aiocb_info, NULL, cb, opaque);
59a703eb 240
8a8e63eb 241 trace_dma_blk_io(dbs, io_func_opaque, offset, (dir == DMA_DIRECTION_TO_DEVICE));
c57c4658 242
37b7842c 243 dbs->acb = NULL;
59a703eb 244 dbs->sg = sg;
8a8e63eb 245 dbs->ctx = ctx;
cbe0ed62 246 dbs->offset = offset;
99868af3 247 dbs->align = align;
59a703eb
AL
248 dbs->sg_cur_index = 0;
249 dbs->sg_cur_byte = 0;
43cf8ae6 250 dbs->dir = dir;
cb144ccb 251 dbs->io_func = io_func;
8a8e63eb 252 dbs->io_func_opaque = io_func_opaque;
59a703eb
AL
253 dbs->bh = NULL;
254 qemu_iovec_init(&dbs->iov, sg->nsg);
4be74634 255 dma_blk_cb(dbs, 0);
37b7842c 256 return &dbs->common;
59a703eb
AL
257}
258
259
8a8e63eb
PB
260static
261BlockAIOCB *dma_blk_read_io_func(int64_t offset, QEMUIOVector *iov,
262 BlockCompletionFunc *cb, void *cb_opaque,
263 void *opaque)
264{
265 BlockBackend *blk = opaque;
266 return blk_aio_preadv(blk, offset, iov, 0, cb, cb_opaque);
267}
268
4be74634 269BlockAIOCB *dma_blk_read(BlockBackend *blk,
99868af3 270 QEMUSGList *sg, uint64_t offset, uint32_t align,
4be74634 271 void (*cb)(void *opaque, int ret), void *opaque)
59a703eb 272{
99868af3
MCA
273 return dma_blk_io(blk_get_aio_context(blk), sg, offset, align,
274 dma_blk_read_io_func, blk, cb, opaque,
4be74634 275 DMA_DIRECTION_FROM_DEVICE);
59a703eb
AL
276}
277
8a8e63eb
PB
278static
279BlockAIOCB *dma_blk_write_io_func(int64_t offset, QEMUIOVector *iov,
280 BlockCompletionFunc *cb, void *cb_opaque,
281 void *opaque)
282{
283 BlockBackend *blk = opaque;
284 return blk_aio_pwritev(blk, offset, iov, 0, cb, cb_opaque);
285}
286
4be74634 287BlockAIOCB *dma_blk_write(BlockBackend *blk,
99868af3 288 QEMUSGList *sg, uint64_t offset, uint32_t align,
4be74634 289 void (*cb)(void *opaque, int ret), void *opaque)
59a703eb 290{
99868af3
MCA
291 return dma_blk_io(blk_get_aio_context(blk), sg, offset, align,
292 dma_blk_write_io_func, blk, cb, opaque,
4be74634 293 DMA_DIRECTION_TO_DEVICE);
59a703eb 294}
8171ee35
PB
295
296
c65bcef3
DG
297static uint64_t dma_buf_rw(uint8_t *ptr, int32_t len, QEMUSGList *sg,
298 DMADirection dir)
8171ee35
PB
299{
300 uint64_t resid;
301 int sg_cur_index;
302
303 resid = sg->size;
304 sg_cur_index = 0;
305 len = MIN(len, resid);
306 while (len > 0) {
307 ScatterGatherEntry entry = sg->sg[sg_cur_index++];
308 int32_t xfer = MIN(len, entry.len);
df32fd1c 309 dma_memory_rw(sg->as, entry.base, ptr, xfer, dir);
8171ee35
PB
310 ptr += xfer;
311 len -= xfer;
312 resid -= xfer;
313 }
314
315 return resid;
316}
317
318uint64_t dma_buf_read(uint8_t *ptr, int32_t len, QEMUSGList *sg)
319{
c65bcef3 320 return dma_buf_rw(ptr, len, sg, DMA_DIRECTION_FROM_DEVICE);
8171ee35
PB
321}
322
323uint64_t dma_buf_write(uint8_t *ptr, int32_t len, QEMUSGList *sg)
324{
c65bcef3 325 return dma_buf_rw(ptr, len, sg, DMA_DIRECTION_TO_DEVICE);
8171ee35 326}
84a69356 327
4be74634 328void dma_acct_start(BlockBackend *blk, BlockAcctCookie *cookie,
84a69356
PB
329 QEMUSGList *sg, enum BlockAcctType type)
330{
4be74634 331 block_acct_start(blk_get_stats(blk), cookie, sg->size, type);
84a69356 332}
f14fb6c2
EA
333
334uint64_t dma_aligned_pow2_mask(uint64_t start, uint64_t end, int max_addr_bits)
335{
336 uint64_t max_mask = UINT64_MAX, addr_mask = end - start;
337 uint64_t alignment_mask, size_mask;
338
339 if (max_addr_bits != 64) {
340 max_mask = (1ULL << max_addr_bits) - 1;
341 }
342
343 alignment_mask = start ? (start & -start) - 1 : max_mask;
344 alignment_mask = MIN(alignment_mask, max_mask);
345 size_mask = MIN(addr_mask, max_mask);
346
347 if (alignment_mask <= size_mask) {
348 /* Increase the alignment of start */
349 return alignment_mask;
350 } else {
351 /* Find the largest page mask from size */
352 if (addr_mask == UINT64_MAX) {
353 return UINT64_MAX;
354 }
355 return (1ULL << (63 - clz64(addr_mask + 1))) - 1;
356 }
357}
358