summaryrefslogtreecommitdiff
path: root/sys/dev/pv
diff options
context:
space:
mode:
authorReyk Floeter <reyk@cvs.openbsd.org>2017-01-21 11:23:02 +0000
committerReyk Floeter <reyk@cvs.openbsd.org>2017-01-21 11:23:02 +0000
commitc04db73516aca488ee775f5d3ab23ff3d35084ef (patch)
tree3ab638008415ec323d6d656821a8708040817bf4 /sys/dev/pv
parentb6e5e7916cbd37066a048886881ef7377a7f1034 (diff)
Move virtio.c to sys/dev/pv/virtio.c
virtio itself is not PCI, it is a paravirtual bus on top of either PCI or MMIO (arm). This is the second step of moving the virtio files to dev/pv. No functional change. Moving the file is done by removing and adding it again - the old history can be found in the Attic of sys/dev/pci/virtio.c. no objections from sf@ mlarkin@
Diffstat (limited to 'sys/dev/pv')
-rw-r--r--sys/dev/pv/virtio.c903
1 files changed, 903 insertions, 0 deletions
diff --git a/sys/dev/pv/virtio.c b/sys/dev/pv/virtio.c
new file mode 100644
index 00000000000..e892971726f
--- /dev/null
+++ b/sys/dev/pv/virtio.c
@@ -0,0 +1,903 @@
+/* $OpenBSD: virtio.c,v 1.1 2017/01/21 11:23:01 reyk Exp $ */
+/* $NetBSD: virtio.c,v 1.3 2011/11/02 23:05:52 njoly Exp $ */
+
+/*
+ * Copyright (c) 2012 Stefan Fritsch, Alexander Fiveg.
+ * Copyright (c) 2010 Minoura Makoto.
+ * All rights reserved.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ * 1. Redistributions of source code must retain the above copyright
+ * notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ * notice, this list of conditions and the following disclaimer in the
+ * documentation and/or other materials provided with the distribution.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
+ * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
+ * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
+ * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
+ * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
+ * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
+ * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
+ * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+ * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
+ * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+ */
+
+#include <sys/param.h>
+#include <sys/systm.h>
+#include <sys/kernel.h>
+#include <sys/device.h>
+#include <sys/mutex.h>
+#include <sys/atomic.h>
+#include <sys/malloc.h>
+
+#include <dev/pv/virtioreg.h>
+#include <dev/pv/virtiovar.h>
+
+#define MINSEG_INDIRECT 2 /* use indirect if nsegs >= this value */
+
+#if VIRTIO_DEBUG
+#define VIRTIO_ASSERT(x) KASSERT(x)
+#else
+#define VIRTIO_ASSERT(x)
+#endif
+
+void virtio_init_vq(struct virtio_softc *,
+ struct virtqueue *, int);
+void vq_free_entry(struct virtqueue *, struct vq_entry *);
+struct vq_entry *vq_alloc_entry(struct virtqueue *);
+
+struct cfdriver virtio_cd = {
+ NULL, "virtio", DV_DULL
+};
+
+#define virtio_set_status(sc, s) (sc)->sc_ops->set_status(sc, s)
+#define virtio_device_reset(sc) virtio_set_status((sc), 0)
+
+static const char * const virtio_device_name[] = {
+ "Unknown (0)", /* 0 */
+ "Network", /* 1 */
+ "Block", /* 2 */
+ "Console", /* 3 */
+ "Entropy", /* 4 */
+ "Memory Balloon", /* 5 */
+ "IO Memory", /* 6 */
+ "Rpmsg", /* 7 */
+ "SCSI host", /* 8 */
+ "9P Transport" /* 9 */
+ "mac80211 wlan" /* 10 */
+};
+#define NDEVNAMES (sizeof(virtio_device_name)/sizeof(char*))
+
+static const struct virtio_feature_name transport_feature_names[] = {
+ { VIRTIO_F_NOTIFY_ON_EMPTY, "NotifyOnEmpty"},
+ { VIRTIO_F_RING_INDIRECT_DESC, "RingIndirectDesc"},
+ { VIRTIO_F_RING_EVENT_IDX, "RingEventIdx"},
+ { VIRTIO_F_BAD_FEATURE, "BadFeature"},
+ { 0, NULL}
+};
+
+const char *
+virtio_device_string(int id)
+{
+ return id < NDEVNAMES ? virtio_device_name[id] : "Unknown";
+}
+
+void
+virtio_log_features(uint32_t host, uint32_t neg,
+ const struct virtio_feature_name *guest_feature_names)
+{
+ const struct virtio_feature_name *namep;
+ int i;
+ char c;
+ uint32_t bit;
+
+ for (i = 0; i < 32; i++) {
+ if (i == 30) {
+ /*
+ * VIRTIO_F_BAD_FEATURE is only used for
+ * checking correct negotiation
+ */
+ continue;
+ }
+ bit = 1 << i;
+ if ((host&bit) == 0)
+ continue;
+ namep = (i < 24) ? guest_feature_names :
+ transport_feature_names;
+ while (namep->bit && namep->bit != bit)
+ namep++;
+ c = (neg&bit) ? '+' : '-';
+ if (namep->name)
+ printf(" %c%s", c, namep->name);
+ else
+ printf(" %cUnknown(%d)", c, i);
+ }
+}
+
+/*
+ * Reset the device.
+ */
+/*
+ * To reset the device to a known state, do following:
+ * virtio_reset(sc); // this will stop the device activity
+ * <dequeue finished requests>; // virtio_dequeue() still can be called
+ * <revoke pending requests in the vqs if any>;
+ * virtio_reinit_start(sc); // dequeue prohibitted
+ * newfeatures = virtio_negotiate_features(sc, requestedfeatures);
+ * <some other initialization>;
+ * virtio_reinit_end(sc); // device activated; enqueue allowed
+ * Once attached, feature negotiation can only be allowed after virtio_reset.
+ */
+void
+virtio_reset(struct virtio_softc *sc)
+{
+ virtio_device_reset(sc);
+}
+
+void
+virtio_reinit_start(struct virtio_softc *sc)
+{
+ int i;
+
+ virtio_set_status(sc, VIRTIO_CONFIG_DEVICE_STATUS_ACK);
+ virtio_set_status(sc, VIRTIO_CONFIG_DEVICE_STATUS_DRIVER);
+ for (i = 0; i < sc->sc_nvqs; i++) {
+ int n;
+ struct virtqueue *vq = &sc->sc_vqs[i];
+ n = virtio_read_queue_size(sc, vq->vq_index);
+ if (n == 0) /* vq disappeared */
+ continue;
+ if (n != vq->vq_num) {
+ panic("%s: virtqueue size changed, vq index %d\n",
+ sc->sc_dev.dv_xname, vq->vq_index);
+ }
+ virtio_init_vq(sc, vq, 1);
+ virtio_setup_queue(sc, vq->vq_index,
+ vq->vq_dmamap->dm_segs[0].ds_addr / VIRTIO_PAGE_SIZE);
+ }
+}
+
+void
+virtio_reinit_end(struct virtio_softc *sc)
+{
+ virtio_set_status(sc, VIRTIO_CONFIG_DEVICE_STATUS_DRIVER_OK);
+}
+
+/*
+ * dmamap sync operations for a virtqueue.
+ */
+static inline void
+vq_sync_descs(struct virtio_softc *sc, struct virtqueue *vq, int ops)
+{
+ /* availoffset == sizeof(vring_desc)*vq_num */
+ bus_dmamap_sync(sc->sc_dmat, vq->vq_dmamap, 0, vq->vq_availoffset,
+ ops);
+}
+
+static inline void
+vq_sync_aring(struct virtio_softc *sc, struct virtqueue *vq, int ops)
+{
+ bus_dmamap_sync(sc->sc_dmat, vq->vq_dmamap, vq->vq_availoffset,
+ offsetof(struct vring_avail, ring) + vq->vq_num * sizeof(uint16_t),
+ ops);
+}
+
+static inline void
+vq_sync_uring(struct virtio_softc *sc, struct virtqueue *vq, int ops)
+{
+ bus_dmamap_sync(sc->sc_dmat, vq->vq_dmamap, vq->vq_usedoffset,
+ offsetof(struct vring_used, ring) + vq->vq_num *
+ sizeof(struct vring_used_elem), ops);
+}
+
+static inline void
+vq_sync_indirect(struct virtio_softc *sc, struct virtqueue *vq, int slot,
+ int ops)
+{
+ int offset = vq->vq_indirectoffset +
+ sizeof(struct vring_desc) * vq->vq_maxnsegs * slot;
+
+ bus_dmamap_sync(sc->sc_dmat, vq->vq_dmamap, offset,
+ sizeof(struct vring_desc) * vq->vq_maxnsegs, ops);
+}
+
+/*
+ * Scan vq, bus_dmamap_sync for the vqs (not for the payload),
+ * and calls (*vq_done)() if some entries are consumed.
+ * For use in transport specific irq handlers.
+ */
+int
+virtio_check_vqs(struct virtio_softc *sc)
+{
+ struct virtqueue *vq;
+ int i, r = 0;
+
+ /* going backwards is better for if_vio */
+ for (i = sc->sc_nvqs - 1; i >= 0; i--) {
+ vq = &sc->sc_vqs[i];
+ if (vq->vq_queued) {
+ vq->vq_queued = 0;
+ vq_sync_aring(sc, vq, BUS_DMASYNC_POSTWRITE);
+ }
+ vq_sync_uring(sc, vq, BUS_DMASYNC_POSTREAD);
+ if (vq->vq_used_idx != vq->vq_used->idx) {
+ if (vq->vq_done)
+ r |= (vq->vq_done)(vq);
+ }
+ }
+
+ return r;
+}
+
+/*
+ * Initialize vq structure.
+ */
+void
+virtio_init_vq(struct virtio_softc *sc, struct virtqueue *vq, int reinit)
+{
+ int i, j;
+ int vq_size = vq->vq_num;
+
+ memset(vq->vq_vaddr, 0, vq->vq_bytesize);
+
+ /* build the indirect descriptor chain */
+ if (vq->vq_indirect != NULL) {
+ struct vring_desc *vd;
+
+ for (i = 0; i < vq_size; i++) {
+ vd = vq->vq_indirect;
+ vd += vq->vq_maxnsegs * i;
+ for (j = 0; j < vq->vq_maxnsegs-1; j++)
+ vd[j].next = j + 1;
+ }
+ }
+
+ /* free slot management */
+ SIMPLEQ_INIT(&vq->vq_freelist);
+ for (i = 0; i < vq_size; i++) {
+ SIMPLEQ_INSERT_TAIL(&vq->vq_freelist,
+ &vq->vq_entries[i], qe_list);
+ vq->vq_entries[i].qe_index = i;
+ }
+
+ /* enqueue/dequeue status */
+ vq->vq_avail_idx = 0;
+ vq->vq_used_idx = 0;
+ vq_sync_aring(sc, vq, BUS_DMASYNC_PREWRITE);
+ vq_sync_uring(sc, vq, BUS_DMASYNC_PREREAD);
+ vq->vq_queued = 1;
+}
+
+/*
+ * Allocate/free a vq.
+ */
+int
+virtio_alloc_vq(struct virtio_softc *sc, struct virtqueue *vq, int index,
+ int maxsegsize, int maxnsegs, const char *name)
+{
+ int vq_size, allocsize1, allocsize2, allocsize3, allocsize = 0;
+ int rsegs, r, hdrlen;
+#define VIRTQUEUE_ALIGN(n) (((n)+(VIRTIO_PAGE_SIZE-1))& \
+ ~(VIRTIO_PAGE_SIZE-1))
+
+ memset(vq, 0, sizeof(*vq));
+
+ vq_size = virtio_read_queue_size(sc, index);
+ if (vq_size == 0) {
+ printf("virtqueue not exist, index %d for %s\n", index, name);
+ goto err;
+ }
+ if (((vq_size - 1) & vq_size) != 0)
+ panic("vq_size not power of two: %d", vq_size);
+
+ hdrlen = (sc->sc_features & VIRTIO_F_RING_EVENT_IDX) ? 3 : 2;
+
+ /* allocsize1: descriptor table + avail ring + pad */
+ allocsize1 = VIRTQUEUE_ALIGN(sizeof(struct vring_desc) * vq_size
+ + sizeof(uint16_t) * (hdrlen + vq_size));
+ /* allocsize2: used ring + pad */
+ allocsize2 = VIRTQUEUE_ALIGN(sizeof(uint16_t) * hdrlen
+ + sizeof(struct vring_used_elem) * vq_size);
+ /* allocsize3: indirect table */
+ /* XXX: This is rather inefficient. In practice only a fraction of this
+ * XXX: memory will be used.
+ */
+ if (sc->sc_indirect && maxnsegs >= MINSEG_INDIRECT)
+ allocsize3 = sizeof(struct vring_desc) * maxnsegs * vq_size;
+ else
+ allocsize3 = 0;
+ allocsize = allocsize1 + allocsize2 + allocsize3;
+
+ /* alloc and map the memory */
+ r = bus_dmamem_alloc(sc->sc_dmat, allocsize, VIRTIO_PAGE_SIZE, 0,
+ &vq->vq_segs[0], 1, &rsegs, BUS_DMA_NOWAIT);
+ if (r != 0) {
+ printf("virtqueue %d for %s allocation failed, error %d\n",
+ index, name, r);
+ goto err;
+ }
+ r = bus_dmamem_map(sc->sc_dmat, &vq->vq_segs[0], 1, allocsize,
+ (caddr_t*)&vq->vq_vaddr, BUS_DMA_NOWAIT);
+ if (r != 0) {
+ printf("virtqueue %d for %s map failed, error %d\n", index,
+ name, r);
+ goto err;
+ }
+ r = bus_dmamap_create(sc->sc_dmat, allocsize, 1, allocsize, 0,
+ BUS_DMA_NOWAIT, &vq->vq_dmamap);
+ if (r != 0) {
+ printf("virtqueue %d for %s dmamap creation failed, "
+ "error %d\n", index, name, r);
+ goto err;
+ }
+ r = bus_dmamap_load(sc->sc_dmat, vq->vq_dmamap, vq->vq_vaddr,
+ allocsize, NULL, BUS_DMA_NOWAIT);
+ if (r != 0) {
+ printf("virtqueue %d for %s dmamap load failed, error %d\n",
+ index, name, r);
+ goto err;
+ }
+
+ virtio_setup_queue(sc, index,
+ vq->vq_dmamap->dm_segs[0].ds_addr / VIRTIO_PAGE_SIZE);
+
+ /* remember addresses and offsets for later use */
+ vq->vq_owner = sc;
+ vq->vq_num = vq_size;
+ vq->vq_mask = vq_size - 1;
+ vq->vq_index = index;
+ vq->vq_desc = vq->vq_vaddr;
+ vq->vq_availoffset = sizeof(struct vring_desc)*vq_size;
+ vq->vq_avail = (struct vring_avail*)(((char*)vq->vq_desc) +
+ vq->vq_availoffset);
+ vq->vq_usedoffset = allocsize1;
+ vq->vq_used = (struct vring_used*)(((char*)vq->vq_desc) +
+ vq->vq_usedoffset);
+ if (allocsize3 > 0) {
+ vq->vq_indirectoffset = allocsize1 + allocsize2;
+ vq->vq_indirect = (void*)(((char*)vq->vq_desc)
+ + vq->vq_indirectoffset);
+ }
+ vq->vq_bytesize = allocsize;
+ vq->vq_maxsegsize = maxsegsize;
+ vq->vq_maxnsegs = maxnsegs;
+
+ /* free slot management */
+ vq->vq_entries = mallocarray(vq_size, sizeof(struct vq_entry),
+ M_DEVBUF, M_NOWAIT | M_ZERO);
+ if (vq->vq_entries == NULL) {
+ r = ENOMEM;
+ goto err;
+ }
+
+ virtio_init_vq(sc, vq, 0);
+
+#if VIRTIO_DEBUG
+ printf("\nallocated %u byte for virtqueue %d for %s, size %d\n",
+ allocsize, index, name, vq_size);
+ if (allocsize3 > 0)
+ printf("using %d byte (%d entries) indirect descriptors\n",
+ allocsize3, maxnsegs * vq_size);
+#endif
+ return 0;
+
+err:
+ virtio_setup_queue(sc, index, 0);
+ if (vq->vq_dmamap)
+ bus_dmamap_destroy(sc->sc_dmat, vq->vq_dmamap);
+ if (vq->vq_vaddr)
+ bus_dmamem_unmap(sc->sc_dmat, vq->vq_vaddr, allocsize);
+ if (vq->vq_segs[0].ds_addr)
+ bus_dmamem_free(sc->sc_dmat, &vq->vq_segs[0], 1);
+ memset(vq, 0, sizeof(*vq));
+
+ return -1;
+}
+
+int
+virtio_free_vq(struct virtio_softc *sc, struct virtqueue *vq)
+{
+ struct vq_entry *qe;
+ int i = 0;
+
+ /* device must be already deactivated */
+ /* confirm the vq is empty */
+ SIMPLEQ_FOREACH(qe, &vq->vq_freelist, qe_list) {
+ i++;
+ }
+ if (i != vq->vq_num) {
+ printf("%s: freeing non-empty vq, index %d\n",
+ sc->sc_dev.dv_xname, vq->vq_index);
+ return EBUSY;
+ }
+
+ /* tell device that there's no virtqueue any longer */
+ virtio_setup_queue(sc, vq->vq_index, 0);
+
+ free(vq->vq_entries, M_DEVBUF, 0);
+ bus_dmamap_unload(sc->sc_dmat, vq->vq_dmamap);
+ bus_dmamap_destroy(sc->sc_dmat, vq->vq_dmamap);
+ bus_dmamem_unmap(sc->sc_dmat, vq->vq_vaddr, vq->vq_bytesize);
+ bus_dmamem_free(sc->sc_dmat, &vq->vq_segs[0], 1);
+ memset(vq, 0, sizeof(*vq));
+
+ return 0;
+}
+
+/*
+ * Free descriptor management.
+ */
+struct vq_entry *
+vq_alloc_entry(struct virtqueue *vq)
+{
+ struct vq_entry *qe;
+
+ if (SIMPLEQ_EMPTY(&vq->vq_freelist))
+ return NULL;
+ qe = SIMPLEQ_FIRST(&vq->vq_freelist);
+ SIMPLEQ_REMOVE_HEAD(&vq->vq_freelist, qe_list);
+
+ return qe;
+}
+
+void
+vq_free_entry(struct virtqueue *vq, struct vq_entry *qe)
+{
+ SIMPLEQ_INSERT_TAIL(&vq->vq_freelist, qe, qe_list);
+}
+
+/*
+ * Enqueue several dmamaps as a single request.
+ */
+/*
+ * Typical usage:
+ * <queue size> number of followings are stored in arrays
+ * - command blocks (in dmamem) should be pre-allocated and mapped
+ * - dmamaps for command blocks should be pre-allocated and loaded
+ * - dmamaps for payload should be pre-allocated
+ * r = virtio_enqueue_prep(sc, vq, &slot); // allocate a slot
+ * if (r) // currently 0 or EAGAIN
+ * return r;
+ * r = bus_dmamap_load(dmat, dmamap_payload[slot], data, count, ..);
+ * if (r) {
+ * virtio_enqueue_abort(sc, vq, slot);
+ * bus_dmamap_unload(dmat, dmamap_payload[slot]);
+ * return r;
+ * }
+ * r = virtio_enqueue_reserve(sc, vq, slot,
+ * dmamap_payload[slot]->dm_nsegs+1);
+ * // ^ +1 for command
+ * if (r) { // currently 0 or EAGAIN
+ * bus_dmamap_unload(dmat, dmamap_payload[slot]);
+ * return r; // do not call abort()
+ * }
+ * <setup and prepare commands>
+ * bus_dmamap_sync(dmat, dmamap_cmd[slot],... BUS_DMASYNC_PREWRITE);
+ * bus_dmamap_sync(dmat, dmamap_payload[slot],...);
+ * virtio_enqueue(sc, vq, slot, dmamap_cmd[slot], 0);
+ * virtio_enqueue(sc, vq, slot, dmamap_payload[slot], iswrite);
+ * virtio_enqueue_commit(sc, vq, slot, 1);
+ */
+
+/*
+ * enqueue_prep: allocate a slot number
+ */
+int
+virtio_enqueue_prep(struct virtqueue *vq, int *slotp)
+{
+ struct vq_entry *qe1;
+
+ VIRTIO_ASSERT(slotp != NULL);
+
+ qe1 = vq_alloc_entry(vq);
+ if (qe1 == NULL)
+ return EAGAIN;
+ /* next slot is not allocated yet */
+ qe1->qe_next = -1;
+ *slotp = qe1->qe_index;
+
+ return 0;
+}
+
+/*
+ * enqueue_reserve: allocate remaining slots and build the descriptor chain.
+ * Calls virtio_enqueue_abort() on failure.
+ */
+int
+virtio_enqueue_reserve(struct virtqueue *vq, int slot, int nsegs)
+{
+ int indirect;
+ struct vq_entry *qe1 = &vq->vq_entries[slot];
+
+ VIRTIO_ASSERT(qe1->qe_next == -1);
+ VIRTIO_ASSERT(1 <= nsegs && nsegs <= vq->vq_num);
+
+ if ((vq->vq_indirect != NULL) && (nsegs >= MINSEG_INDIRECT) &&
+ (nsegs <= vq->vq_maxnsegs))
+ indirect = 1;
+ else
+ indirect = 0;
+ qe1->qe_indirect = indirect;
+
+ if (indirect) {
+ struct vring_desc *vd;
+ int i;
+
+ vd = &vq->vq_desc[qe1->qe_index];
+ vd->addr = vq->vq_dmamap->dm_segs[0].ds_addr +
+ vq->vq_indirectoffset;
+ vd->addr += sizeof(struct vring_desc) * vq->vq_maxnsegs *
+ qe1->qe_index;
+ vd->len = sizeof(struct vring_desc) * nsegs;
+ vd->flags = VRING_DESC_F_INDIRECT;
+
+ vd = vq->vq_indirect;
+ vd += vq->vq_maxnsegs * qe1->qe_index;
+ qe1->qe_desc_base = vd;
+
+ for (i = 0; i < nsegs-1; i++)
+ vd[i].flags = VRING_DESC_F_NEXT;
+ vd[i].flags = 0;
+ qe1->qe_next = 0;
+
+ return 0;
+ } else {
+ struct vring_desc *vd;
+ struct vq_entry *qe;
+ int i, s;
+
+ vd = &vq->vq_desc[0];
+ qe1->qe_desc_base = vd;
+ qe1->qe_next = qe1->qe_index;
+ s = slot;
+ for (i = 0; i < nsegs - 1; i++) {
+ qe = vq_alloc_entry(vq);
+ if (qe == NULL) {
+ vd[s].flags = 0;
+ virtio_enqueue_abort(vq, slot);
+ return EAGAIN;
+ }
+ vd[s].flags = VRING_DESC_F_NEXT;
+ vd[s].next = qe->qe_index;
+ s = qe->qe_index;
+ }
+ vd[s].flags = 0;
+
+ return 0;
+ }
+}
+
+/*
+ * enqueue: enqueue a single dmamap.
+ */
+int
+virtio_enqueue(struct virtqueue *vq, int slot, bus_dmamap_t dmamap, int write)
+{
+ struct vq_entry *qe1 = &vq->vq_entries[slot];
+ struct vring_desc *vd = qe1->qe_desc_base;
+ int i;
+ int s = qe1->qe_next;
+
+ VIRTIO_ASSERT(s >= 0);
+ VIRTIO_ASSERT(dmamap->dm_nsegs > 0);
+ if (dmamap->dm_nsegs > vq->vq_maxnsegs) {
+#if VIRTIO_DEBUG
+ for (i = 0; i < dmamap->dm_nsegs; i++) {
+ printf(" %d (%d): %p %lx \n", i, write,
+ (void *)dmamap->dm_segs[i].ds_addr,
+ dmamap->dm_segs[i].ds_len);
+ }
+#endif
+ panic("dmamap->dm_nseg %d > vq->vq_maxnsegs %d\n",
+ dmamap->dm_nsegs, vq->vq_maxnsegs);
+ }
+
+ for (i = 0; i < dmamap->dm_nsegs; i++) {
+ vd[s].addr = dmamap->dm_segs[i].ds_addr;
+ vd[s].len = dmamap->dm_segs[i].ds_len;
+ if (!write)
+ vd[s].flags |= VRING_DESC_F_WRITE;
+ s = vd[s].next;
+ }
+ qe1->qe_next = s;
+
+ return 0;
+}
+
+int
+virtio_enqueue_p(struct virtqueue *vq, int slot, bus_dmamap_t dmamap,
+ bus_addr_t start, bus_size_t len, int write)
+{
+ struct vq_entry *qe1 = &vq->vq_entries[slot];
+ struct vring_desc *vd = qe1->qe_desc_base;
+ int s = qe1->qe_next;
+
+ VIRTIO_ASSERT(s >= 0);
+ /* XXX todo: handle more segments */
+ VIRTIO_ASSERT(dmamap->dm_nsegs == 1);
+ VIRTIO_ASSERT((dmamap->dm_segs[0].ds_len > start) &&
+ (dmamap->dm_segs[0].ds_len >= start + len));
+
+ vd[s].addr = dmamap->dm_segs[0].ds_addr + start;
+ vd[s].len = len;
+ if (!write)
+ vd[s].flags |= VRING_DESC_F_WRITE;
+ qe1->qe_next = vd[s].next;
+
+ return 0;
+}
+
+static void
+publish_avail_idx(struct virtio_softc *sc, struct virtqueue *vq)
+{
+ vq_sync_aring(sc, vq, BUS_DMASYNC_PREWRITE);
+
+ virtio_membar_producer();
+ vq->vq_avail->idx = vq->vq_avail_idx;
+ vq_sync_aring(sc, vq, BUS_DMASYNC_POSTWRITE);
+ vq->vq_queued = 1;
+}
+
+/*
+ * enqueue_commit: add it to the aring.
+ */
+void
+virtio_enqueue_commit(struct virtio_softc *sc, struct virtqueue *vq, int slot,
+ int notifynow)
+{
+ struct vq_entry *qe1;
+
+ if (slot < 0)
+ goto notify;
+ vq_sync_descs(sc, vq, BUS_DMASYNC_PREWRITE);
+ qe1 = &vq->vq_entries[slot];
+ if (qe1->qe_indirect)
+ vq_sync_indirect(sc, vq, slot, BUS_DMASYNC_PREWRITE);
+ vq->vq_avail->ring[(vq->vq_avail_idx++) & vq->vq_mask] = slot;
+
+notify:
+ if (notifynow) {
+ if (vq->vq_owner->sc_features & VIRTIO_F_RING_EVENT_IDX) {
+ uint16_t o = vq->vq_avail->idx;
+ uint16_t n = vq->vq_avail_idx;
+ uint16_t t;
+ publish_avail_idx(sc, vq);
+
+ virtio_membar_sync();
+ t = VQ_AVAIL_EVENT(vq) + 1;
+ if ((uint16_t)(n - t) < (uint16_t)(n - o))
+ sc->sc_ops->kick(sc, vq->vq_index);
+ } else {
+ publish_avail_idx(sc, vq);
+
+ virtio_membar_sync();
+ if (!(vq->vq_used->flags & VRING_USED_F_NO_NOTIFY))
+ sc->sc_ops->kick(sc, vq->vq_index);
+ }
+ }
+}
+
+/*
+ * enqueue_abort: rollback.
+ */
+int
+virtio_enqueue_abort(struct virtqueue *vq, int slot)
+{
+ struct vq_entry *qe = &vq->vq_entries[slot];
+ struct vring_desc *vd;
+ int s;
+
+ if (qe->qe_next < 0) {
+ vq_free_entry(vq, qe);
+ return 0;
+ }
+
+ s = slot;
+ vd = &vq->vq_desc[0];
+ while (vd[s].flags & VRING_DESC_F_NEXT) {
+ s = vd[s].next;
+ vq_free_entry(vq, qe);
+ qe = &vq->vq_entries[s];
+ }
+ vq_free_entry(vq, qe);
+ return 0;
+}
+
+/*
+ * Dequeue a request.
+ */
+/*
+ * dequeue: dequeue a request from uring; dmamap_sync for uring is
+ * already done in the interrupt handler.
+ */
+int
+virtio_dequeue(struct virtio_softc *sc, struct virtqueue *vq,
+ int *slotp, int *lenp)
+{
+ uint16_t slot, usedidx;
+ struct vq_entry *qe;
+
+ if (vq->vq_used_idx == vq->vq_used->idx)
+ return ENOENT;
+ usedidx = vq->vq_used_idx++;
+ usedidx &= vq->vq_mask;
+
+ virtio_membar_consumer();
+ slot = vq->vq_used->ring[usedidx].id;
+ qe = &vq->vq_entries[slot];
+
+ if (qe->qe_indirect)
+ vq_sync_indirect(sc, vq, slot, BUS_DMASYNC_POSTWRITE);
+
+ if (slotp)
+ *slotp = slot;
+ if (lenp)
+ *lenp = vq->vq_used->ring[usedidx].len;
+
+ return 0;
+}
+
+/*
+ * dequeue_commit: complete dequeue; the slot is recycled for future use.
+ * if you forget to call this the slot will be leaked.
+ */
+int
+virtio_dequeue_commit(struct virtqueue *vq, int slot)
+{
+ struct vq_entry *qe = &vq->vq_entries[slot];
+ struct vring_desc *vd = &vq->vq_desc[0];
+ int s = slot;
+
+ while (vd[s].flags & VRING_DESC_F_NEXT) {
+ s = vd[s].next;
+ vq_free_entry(vq, qe);
+ qe = &vq->vq_entries[s];
+ }
+ vq_free_entry(vq, qe);
+
+ return 0;
+}
+
+/*
+ * Increase the event index in order to delay interrupts.
+ * Returns 0 on success; returns 1 if the used ring has already advanced
+ * too far, and the caller must process the queue again (otherewise, no
+ * more interrupts will happen).
+ */
+int
+virtio_postpone_intr(struct virtqueue *vq, uint16_t nslots)
+{
+ uint16_t idx;
+
+ idx = vq->vq_used_idx + nslots;
+
+ /* set the new event index: avail_ring->used_event = idx */
+ VQ_USED_EVENT(vq) = idx;
+ virtio_membar_sync();
+
+ vq_sync_aring(vq->vq_owner, vq, BUS_DMASYNC_PREWRITE);
+ vq->vq_queued++;
+
+ if (nslots < virtio_nused(vq))
+ return 1;
+
+ return 0;
+}
+
+/*
+ * Postpone interrupt until 3/4 of the available descriptors have been
+ * consumed.
+ */
+int
+virtio_postpone_intr_smart(struct virtqueue *vq)
+{
+ uint16_t nslots;
+
+ nslots = (uint16_t)(vq->vq_avail->idx - vq->vq_used_idx) * 3 / 4;
+
+ return virtio_postpone_intr(vq, nslots);
+}
+
+/*
+ * Postpone interrupt until all of the available descriptors have been
+ * consumed.
+ */
+int
+virtio_postpone_intr_far(struct virtqueue *vq)
+{
+ uint16_t nslots;
+
+ nslots = (uint16_t)(vq->vq_avail->idx - vq->vq_used_idx);
+
+ return virtio_postpone_intr(vq, nslots);
+}
+
+
+/*
+ * Start/stop vq interrupt. No guarantee.
+ */
+void
+virtio_stop_vq_intr(struct virtio_softc *sc, struct virtqueue *vq)
+{
+ if ((sc->sc_features & VIRTIO_F_RING_EVENT_IDX)) {
+ /*
+ * No way to disable the interrupt completely with
+ * RingEventIdx. Instead advance used_event by half
+ * the possible value. This won't happen soon and
+ * is far enough in the past to not trigger a spurios
+ * interrupt.
+ */
+ VQ_USED_EVENT(vq) = vq->vq_used_idx + 0x8000;
+ } else {
+ vq->vq_avail->flags |= VRING_AVAIL_F_NO_INTERRUPT;
+ }
+ vq_sync_aring(sc, vq, BUS_DMASYNC_PREWRITE);
+ vq->vq_queued++;
+}
+
+int
+virtio_start_vq_intr(struct virtio_softc *sc, struct virtqueue *vq)
+{
+ /*
+ * If event index feature is negotiated, enabling
+ * interrupts is done through setting the latest
+ * consumed index in the used_event field
+ */
+ if (sc->sc_features & VIRTIO_F_RING_EVENT_IDX)
+ VQ_USED_EVENT(vq) = vq->vq_used_idx;
+ else
+ vq->vq_avail->flags &= ~VRING_AVAIL_F_NO_INTERRUPT;
+
+ virtio_membar_sync();
+
+ vq_sync_aring(sc, vq, BUS_DMASYNC_PREWRITE);
+ vq->vq_queued++;
+
+ if (vq->vq_used_idx != vq->vq_used->idx)
+ return 1;
+
+ return 0;
+}
+
+/*
+ * Returns a number of slots in the used ring available to
+ * be supplied to the avail ring.
+ */
+int
+virtio_nused(struct virtqueue *vq)
+{
+ uint16_t n;
+
+ n = (uint16_t)(vq->vq_used->idx - vq->vq_used_idx);
+ VIRTIO_ASSERT(n <= vq->vq_num);
+
+ return n;
+}
+
+#if VIRTIO_DEBUG
+void
+virtio_vq_dump(struct virtqueue *vq)
+{
+ /* Common fields */
+ printf(" + vq num: %d\n", vq->vq_num);
+ printf(" + vq mask: 0x%X\n", vq->vq_mask);
+ printf(" + vq index: %d\n", vq->vq_index);
+ printf(" + vq used idx: %d\n", vq->vq_used_idx);
+ printf(" + vq avail idx: %d\n", vq->vq_avail_idx);
+ printf(" + vq queued: %d\n",vq->vq_queued);
+ /* Avail ring fields */
+ printf(" + avail flags: 0x%X\n", vq->vq_avail->flags);
+ printf(" + avail idx: %d\n", vq->vq_avail->idx);
+ printf(" + avail event: %d\n", VQ_AVAIL_EVENT(vq));
+ /* Used ring fields */
+ printf(" + used flags: 0x%X\n",vq->vq_used->flags);
+ printf(" + used idx: %d\n",vq->vq_used->idx);
+ printf(" + used event: %d\n", VQ_USED_EVENT(vq));
+ printf(" +++++++++++++++++++++++++++\n");
+}
+#endif