dma-helpers.c 9.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331
  1. /*
  2. * DMA helper functions
  3. *
  4. * Copyright (c) 2009 Red Hat
  5. *
  6. * This work is licensed under the terms of the GNU General Public License
  7. * (GNU GPL), version 2 or later.
  8. */
  9. #include "qemu/osdep.h"
  10. #include "sysemu/block-backend.h"
  11. #include "sysemu/dma.h"
  12. #include "trace/trace-root.h"
  13. #include "qemu/thread.h"
  14. #include "qemu/main-loop.h"
  15. #include "sysemu/cpus.h"
  16. #include "qemu/range.h"
  17. /* #define DEBUG_IOMMU */
  18. int dma_memory_set(AddressSpace *as, dma_addr_t addr, uint8_t c, dma_addr_t len)
  19. {
  20. dma_barrier(as, DMA_DIRECTION_FROM_DEVICE);
  21. #define FILLBUF_SIZE 512
  22. uint8_t fillbuf[FILLBUF_SIZE];
  23. int l;
  24. bool error = false;
  25. memset(fillbuf, c, FILLBUF_SIZE);
  26. while (len > 0) {
  27. l = len < FILLBUF_SIZE ? len : FILLBUF_SIZE;
  28. error |= address_space_write(as, addr, MEMTXATTRS_UNSPECIFIED,
  29. fillbuf, l);
  30. len -= l;
  31. addr += l;
  32. }
  33. return error;
  34. }
  35. void qemu_sglist_init(QEMUSGList *qsg, DeviceState *dev, int alloc_hint,
  36. AddressSpace *as)
  37. {
  38. qsg->sg = g_malloc(alloc_hint * sizeof(ScatterGatherEntry));
  39. qsg->nsg = 0;
  40. qsg->nalloc = alloc_hint;
  41. qsg->size = 0;
  42. qsg->as = as;
  43. qsg->dev = dev;
  44. object_ref(OBJECT(dev));
  45. }
  46. void qemu_sglist_add(QEMUSGList *qsg, dma_addr_t base, dma_addr_t len)
  47. {
  48. if (qsg->nsg == qsg->nalloc) {
  49. qsg->nalloc = 2 * qsg->nalloc + 1;
  50. qsg->sg = g_realloc(qsg->sg, qsg->nalloc * sizeof(ScatterGatherEntry));
  51. }
  52. qsg->sg[qsg->nsg].base = base;
  53. qsg->sg[qsg->nsg].len = len;
  54. qsg->size += len;
  55. ++qsg->nsg;
  56. }
  57. void qemu_sglist_destroy(QEMUSGList *qsg)
  58. {
  59. object_unref(OBJECT(qsg->dev));
  60. g_free(qsg->sg);
  61. memset(qsg, 0, sizeof(*qsg));
  62. }
  63. typedef struct {
  64. BlockAIOCB common;
  65. AioContext *ctx;
  66. BlockAIOCB *acb;
  67. QEMUSGList *sg;
  68. uint32_t align;
  69. uint64_t offset;
  70. DMADirection dir;
  71. int sg_cur_index;
  72. dma_addr_t sg_cur_byte;
  73. QEMUIOVector iov;
  74. QEMUBH *bh;
  75. DMAIOFunc *io_func;
  76. void *io_func_opaque;
  77. } DMAAIOCB;
  78. static void dma_blk_cb(void *opaque, int ret);
  79. static void reschedule_dma(void *opaque)
  80. {
  81. DMAAIOCB *dbs = (DMAAIOCB *)opaque;
  82. assert(!dbs->acb && dbs->bh);
  83. qemu_bh_delete(dbs->bh);
  84. dbs->bh = NULL;
  85. dma_blk_cb(dbs, 0);
  86. }
  87. static void dma_blk_unmap(DMAAIOCB *dbs)
  88. {
  89. int i;
  90. for (i = 0; i < dbs->iov.niov; ++i) {
  91. dma_memory_unmap(dbs->sg->as, dbs->iov.iov[i].iov_base,
  92. dbs->iov.iov[i].iov_len, dbs->dir,
  93. dbs->iov.iov[i].iov_len);
  94. }
  95. qemu_iovec_reset(&dbs->iov);
  96. }
  97. static void dma_complete(DMAAIOCB *dbs, int ret)
  98. {
  99. trace_dma_complete(dbs, ret, dbs->common.cb);
  100. assert(!dbs->acb && !dbs->bh);
  101. dma_blk_unmap(dbs);
  102. if (dbs->common.cb) {
  103. dbs->common.cb(dbs->common.opaque, ret);
  104. }
  105. qemu_iovec_destroy(&dbs->iov);
  106. qemu_aio_unref(dbs);
  107. }
  108. static void dma_blk_cb(void *opaque, int ret)
  109. {
  110. DMAAIOCB *dbs = (DMAAIOCB *)opaque;
  111. dma_addr_t cur_addr, cur_len;
  112. void *mem;
  113. trace_dma_blk_cb(dbs, ret);
  114. dbs->acb = NULL;
  115. dbs->offset += dbs->iov.size;
  116. if (dbs->sg_cur_index == dbs->sg->nsg || ret < 0) {
  117. dma_complete(dbs, ret);
  118. return;
  119. }
  120. dma_blk_unmap(dbs);
  121. while (dbs->sg_cur_index < dbs->sg->nsg) {
  122. cur_addr = dbs->sg->sg[dbs->sg_cur_index].base + dbs->sg_cur_byte;
  123. cur_len = dbs->sg->sg[dbs->sg_cur_index].len - dbs->sg_cur_byte;
  124. mem = dma_memory_map(dbs->sg->as, cur_addr, &cur_len, dbs->dir);
  125. /*
  126. * Make reads deterministic in icount mode. Windows sometimes issues
  127. * disk read requests with overlapping SGs. It leads
  128. * to non-determinism, because resulting buffer contents may be mixed
  129. * from several sectors. This code splits all SGs into several
  130. * groups. SGs in every group do not overlap.
  131. */
  132. if (mem && use_icount && dbs->dir == DMA_DIRECTION_FROM_DEVICE) {
  133. int i;
  134. for (i = 0 ; i < dbs->iov.niov ; ++i) {
  135. if (ranges_overlap((intptr_t)dbs->iov.iov[i].iov_base,
  136. dbs->iov.iov[i].iov_len, (intptr_t)mem,
  137. cur_len)) {
  138. dma_memory_unmap(dbs->sg->as, mem, cur_len,
  139. dbs->dir, cur_len);
  140. mem = NULL;
  141. break;
  142. }
  143. }
  144. }
  145. if (!mem)
  146. break;
  147. qemu_iovec_add(&dbs->iov, mem, cur_len);
  148. dbs->sg_cur_byte += cur_len;
  149. if (dbs->sg_cur_byte == dbs->sg->sg[dbs->sg_cur_index].len) {
  150. dbs->sg_cur_byte = 0;
  151. ++dbs->sg_cur_index;
  152. }
  153. }
  154. if (dbs->iov.size == 0) {
  155. trace_dma_map_wait(dbs);
  156. dbs->bh = aio_bh_new(dbs->ctx, reschedule_dma, dbs);
  157. cpu_register_map_client(dbs->bh);
  158. return;
  159. }
  160. if (!QEMU_IS_ALIGNED(dbs->iov.size, dbs->align)) {
  161. qemu_iovec_discard_back(&dbs->iov,
  162. QEMU_ALIGN_DOWN(dbs->iov.size, dbs->align));
  163. }
  164. aio_context_acquire(dbs->ctx);
  165. dbs->acb = dbs->io_func(dbs->offset, &dbs->iov,
  166. dma_blk_cb, dbs, dbs->io_func_opaque);
  167. aio_context_release(dbs->ctx);
  168. assert(dbs->acb);
  169. }
  170. static void dma_aio_cancel(BlockAIOCB *acb)
  171. {
  172. DMAAIOCB *dbs = container_of(acb, DMAAIOCB, common);
  173. trace_dma_aio_cancel(dbs);
  174. assert(!(dbs->acb && dbs->bh));
  175. if (dbs->acb) {
  176. /* This will invoke dma_blk_cb. */
  177. blk_aio_cancel_async(dbs->acb);
  178. return;
  179. }
  180. if (dbs->bh) {
  181. cpu_unregister_map_client(dbs->bh);
  182. qemu_bh_delete(dbs->bh);
  183. dbs->bh = NULL;
  184. }
  185. if (dbs->common.cb) {
  186. dbs->common.cb(dbs->common.opaque, -ECANCELED);
  187. }
  188. }
  189. static AioContext *dma_get_aio_context(BlockAIOCB *acb)
  190. {
  191. DMAAIOCB *dbs = container_of(acb, DMAAIOCB, common);
  192. return dbs->ctx;
  193. }
  194. static const AIOCBInfo dma_aiocb_info = {
  195. .aiocb_size = sizeof(DMAAIOCB),
  196. .cancel_async = dma_aio_cancel,
  197. .get_aio_context = dma_get_aio_context,
  198. };
  199. BlockAIOCB *dma_blk_io(AioContext *ctx,
  200. QEMUSGList *sg, uint64_t offset, uint32_t align,
  201. DMAIOFunc *io_func, void *io_func_opaque,
  202. BlockCompletionFunc *cb,
  203. void *opaque, DMADirection dir)
  204. {
  205. DMAAIOCB *dbs = qemu_aio_get(&dma_aiocb_info, NULL, cb, opaque);
  206. trace_dma_blk_io(dbs, io_func_opaque, offset, (dir == DMA_DIRECTION_TO_DEVICE));
  207. dbs->acb = NULL;
  208. dbs->sg = sg;
  209. dbs->ctx = ctx;
  210. dbs->offset = offset;
  211. dbs->align = align;
  212. dbs->sg_cur_index = 0;
  213. dbs->sg_cur_byte = 0;
  214. dbs->dir = dir;
  215. dbs->io_func = io_func;
  216. dbs->io_func_opaque = io_func_opaque;
  217. dbs->bh = NULL;
  218. qemu_iovec_init(&dbs->iov, sg->nsg);
  219. dma_blk_cb(dbs, 0);
  220. return &dbs->common;
  221. }
  222. static
  223. BlockAIOCB *dma_blk_read_io_func(int64_t offset, QEMUIOVector *iov,
  224. BlockCompletionFunc *cb, void *cb_opaque,
  225. void *opaque)
  226. {
  227. BlockBackend *blk = opaque;
  228. return blk_aio_preadv(blk, offset, iov, 0, cb, cb_opaque);
  229. }
  230. BlockAIOCB *dma_blk_read(BlockBackend *blk,
  231. QEMUSGList *sg, uint64_t offset, uint32_t align,
  232. void (*cb)(void *opaque, int ret), void *opaque)
  233. {
  234. return dma_blk_io(blk_get_aio_context(blk), sg, offset, align,
  235. dma_blk_read_io_func, blk, cb, opaque,
  236. DMA_DIRECTION_FROM_DEVICE);
  237. }
  238. static
  239. BlockAIOCB *dma_blk_write_io_func(int64_t offset, QEMUIOVector *iov,
  240. BlockCompletionFunc *cb, void *cb_opaque,
  241. void *opaque)
  242. {
  243. BlockBackend *blk = opaque;
  244. return blk_aio_pwritev(blk, offset, iov, 0, cb, cb_opaque);
  245. }
  246. BlockAIOCB *dma_blk_write(BlockBackend *blk,
  247. QEMUSGList *sg, uint64_t offset, uint32_t align,
  248. void (*cb)(void *opaque, int ret), void *opaque)
  249. {
  250. return dma_blk_io(blk_get_aio_context(blk), sg, offset, align,
  251. dma_blk_write_io_func, blk, cb, opaque,
  252. DMA_DIRECTION_TO_DEVICE);
  253. }
  254. static uint64_t dma_buf_rw(uint8_t *ptr, int32_t len, QEMUSGList *sg,
  255. DMADirection dir)
  256. {
  257. uint64_t resid;
  258. int sg_cur_index;
  259. resid = sg->size;
  260. sg_cur_index = 0;
  261. len = MIN(len, resid);
  262. while (len > 0) {
  263. ScatterGatherEntry entry = sg->sg[sg_cur_index++];
  264. int32_t xfer = MIN(len, entry.len);
  265. dma_memory_rw(sg->as, entry.base, ptr, xfer, dir);
  266. ptr += xfer;
  267. len -= xfer;
  268. resid -= xfer;
  269. }
  270. return resid;
  271. }
  272. uint64_t dma_buf_read(uint8_t *ptr, int32_t len, QEMUSGList *sg)
  273. {
  274. return dma_buf_rw(ptr, len, sg, DMA_DIRECTION_FROM_DEVICE);
  275. }
  276. uint64_t dma_buf_write(uint8_t *ptr, int32_t len, QEMUSGList *sg)
  277. {
  278. return dma_buf_rw(ptr, len, sg, DMA_DIRECTION_TO_DEVICE);
  279. }
  280. void dma_acct_start(BlockBackend *blk, BlockAcctCookie *cookie,
  281. QEMUSGList *sg, enum BlockAcctType type)
  282. {
  283. block_acct_start(blk_get_stats(blk), cookie, sg->size, type);
  284. }