/* $OpenBSD: virtio.c,v 1.32 2024/09/02 08:26:26 sf Exp $ */ /* $NetBSD: virtio.c,v 1.3 2011/11/02 23:05:52 njoly Exp $ */ /* * Copyright (c) 2012 Stefan Fritsch, Alexander Fiveg. * Copyright (c) 2010 Minoura Makoto. * All rights reserved. * * Redistribution and use in source and binary forms, with or without * modification, are permitted provided that the following conditions * are met: * 1. Redistributions of source code must retain the above copyright * notice, this list of conditions and the following disclaimer. * 2. Redistributions in binary form must reproduce the above copyright * notice, this list of conditions and the following disclaimer in the * documentation and/or other materials provided with the distribution. * * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. */ #include #include #include #include #include #include #include #if VIRTIO_DEBUG #define VIRTIO_ASSERT(x) KASSERT(x) #else #define VIRTIO_ASSERT(x) #endif void virtio_init_vq(struct virtio_softc *, struct virtqueue *); void vq_free_entry(struct virtqueue *, struct vq_entry *); struct vq_entry *vq_alloc_entry(struct virtqueue *); struct cfdriver virtio_cd = { NULL, "virtio", DV_DULL }; static const char * const virtio_device_name[] = { "Unknown (0)", /* 0 */ "Network", /* 1 */ "Block", /* 2 */ "Console", /* 3 */ "Entropy", /* 4 */ "Memory Balloon", /* 5 */ "IO Memory", /* 6 */ "Rpmsg", /* 7 */ "SCSI host", /* 8 */ "9P Transport", /* 9 */ "mac80211 wlan", /* 10 */ NULL, /* 11 */ NULL, /* 12 */ NULL, /* 13 */ NULL, /* 14 */ NULL, /* 15 */ "GPU", /* 16 */ }; #define NDEVNAMES (sizeof(virtio_device_name)/sizeof(char*)) const char * virtio_device_string(int id) { return id < NDEVNAMES ? virtio_device_name[id] : "Unknown"; } #if VIRTIO_DEBUG static const struct virtio_feature_name transport_feature_names[] = { { VIRTIO_F_NOTIFY_ON_EMPTY, "NotifyOnEmpty"}, { VIRTIO_F_ANY_LAYOUT, "AnyLayout"}, { VIRTIO_F_RING_INDIRECT_DESC, "RingIndirectDesc"}, { VIRTIO_F_RING_EVENT_IDX, "RingEventIdx"}, { VIRTIO_F_BAD_FEATURE, "BadFeature"}, { VIRTIO_F_VERSION_1, "Version1"}, { VIRTIO_F_ACCESS_PLATFORM, "AccessPlatf"}, { VIRTIO_F_RING_PACKED, "RingPacked"}, { VIRTIO_F_IN_ORDER, "InOrder"}, { VIRTIO_F_ORDER_PLATFORM, "OrderPlatf"}, { VIRTIO_F_SR_IOV, "SrIov"}, { VIRTIO_F_NOTIFICATION_DATA, "NotifData"}, { VIRTIO_F_NOTIF_CONFIG_DATA, "NotifConfData"}, { VIRTIO_F_RING_RESET, "RingReset"}, { 0, NULL} }; void virtio_log_features(uint64_t host, uint64_t neg, const struct virtio_feature_name *guest_feature_names) { const struct virtio_feature_name *namep; int i; char c; uint64_t bit; for (i = 0; i < 64; i++) { if (i == 30) { /* * VIRTIO_F_BAD_FEATURE is only used for * checking correct negotiation */ continue; } bit = 1ULL << i; if ((host&bit) == 0) continue; namep = guest_feature_names; while (namep->bit && namep->bit != bit) namep++; if (namep->name == NULL) { namep = transport_feature_names; while (namep->bit && namep->bit != bit) namep++; } c = (neg&bit) ? '+' : '-'; if (namep->name) printf(" %c%s", c, namep->name); else printf(" %cUnknown(%d)", c, i); } } #endif /* * Reset the device. */ /* * To reset the device to a known state, do following: * virtio_reset(sc); // this will stop the device activity * ; // virtio_dequeue() still can be called * ; * virtio_reinit_start(sc); // dequeue prohibited * ; * virtio_reinit_end(sc); // device activated; enqueue allowed * Once attached, features are assumed to not change again. */ void virtio_reset(struct virtio_softc *sc) { virtio_device_reset(sc); sc->sc_active_features = 0; } void virtio_reinit_start(struct virtio_softc *sc) { int i; virtio_set_status(sc, VIRTIO_CONFIG_DEVICE_STATUS_ACK); virtio_set_status(sc, VIRTIO_CONFIG_DEVICE_STATUS_DRIVER); virtio_negotiate_features(sc, NULL); for (i = 0; i < sc->sc_nvqs; i++) { int n; struct virtqueue *vq = &sc->sc_vqs[i]; n = virtio_read_queue_size(sc, vq->vq_index); if (n == 0) /* vq disappeared */ continue; if (n != vq->vq_num) { panic("%s: virtqueue size changed, vq index %d", sc->sc_dev.dv_xname, vq->vq_index); } virtio_init_vq(sc, vq); virtio_setup_queue(sc, vq, vq->vq_dmamap->dm_segs[0].ds_addr); } sc->sc_ops->setup_intrs(sc); } void virtio_reinit_end(struct virtio_softc *sc) { virtio_set_status(sc, VIRTIO_CONFIG_DEVICE_STATUS_DRIVER_OK); } /* * dmamap sync operations for a virtqueue. * * XXX These should be more fine grained. Syncing the whole ring if we * XXX only need a few bytes is inefficient if we use bounce buffers. */ static inline void vq_sync_descs(struct virtio_softc *sc, struct virtqueue *vq, int ops) { /* availoffset == sizeof(vring_desc)*vq_num */ bus_dmamap_sync(sc->sc_dmat, vq->vq_dmamap, 0, vq->vq_availoffset, ops); } static inline void vq_sync_aring(struct virtio_softc *sc, struct virtqueue *vq, int ops) { bus_dmamap_sync(sc->sc_dmat, vq->vq_dmamap, vq->vq_availoffset, offsetof(struct vring_avail, ring) + vq->vq_num * sizeof(uint16_t), ops); } static inline void vq_sync_aring_used_event(struct virtio_softc *sc, struct virtqueue *vq, int ops) { bus_dmamap_sync(sc->sc_dmat, vq->vq_dmamap, vq->vq_availoffset + offsetof(struct vring_avail, ring) + vq->vq_num * sizeof(uint16_t), sizeof(uint16_t), ops); } static inline void vq_sync_uring(struct virtio_softc *sc, struct virtqueue *vq, int ops) { bus_dmamap_sync(sc->sc_dmat, vq->vq_dmamap, vq->vq_usedoffset, offsetof(struct vring_used, ring) + vq->vq_num * sizeof(struct vring_used_elem), ops); } static inline void vq_sync_uring_avail_event(struct virtio_softc *sc, struct virtqueue *vq, int ops) { bus_dmamap_sync(sc->sc_dmat, vq->vq_dmamap, vq->vq_usedoffset + offsetof(struct vring_used, ring) + vq->vq_num * sizeof(struct vring_used_elem), sizeof(uint16_t), ops); } static inline void vq_sync_indirect(struct virtio_softc *sc, struct virtqueue *vq, int slot, int ops) { int offset = vq->vq_indirectoffset + sizeof(struct vring_desc) * vq->vq_maxnsegs * slot; bus_dmamap_sync(sc->sc_dmat, vq->vq_dmamap, offset, sizeof(struct vring_desc) * vq->vq_maxnsegs, ops); } /* * Scan vq, bus_dmamap_sync for the vqs (not for the payload), * and calls (*vq_done)() if some entries are consumed. * For use in transport specific irq handlers. */ int virtio_check_vqs(struct virtio_softc *sc) { int i, r = 0; /* going backwards is better for if_vio */ for (i = sc->sc_nvqs - 1; i >= 0; i--) r |= virtio_check_vq(sc, &sc->sc_vqs[i]); return r; } int virtio_check_vq(struct virtio_softc *sc, struct virtqueue *vq) { if (vq->vq_queued) { vq->vq_queued = 0; vq_sync_aring(sc, vq, BUS_DMASYNC_POSTWRITE); } vq_sync_uring(sc, vq, BUS_DMASYNC_POSTREAD); if (vq->vq_used_idx != vq->vq_used->idx) { if (vq->vq_done) return (vq->vq_done)(vq); } return 0; } /* * Initialize vq structure. */ void virtio_init_vq(struct virtio_softc *sc, struct virtqueue *vq) { int i, j; int vq_size = vq->vq_num; memset(vq->vq_vaddr, 0, vq->vq_bytesize); /* build the indirect descriptor chain */ if (vq->vq_indirect != NULL) { struct vring_desc *vd; for (i = 0; i < vq_size; i++) { vd = vq->vq_indirect; vd += vq->vq_maxnsegs * i; for (j = 0; j < vq->vq_maxnsegs-1; j++) vd[j].next = j + 1; } } /* free slot management */ SLIST_INIT(&vq->vq_freelist); /* * virtio_enqueue_trim needs monotonely raising entries, therefore * initialize in reverse order */ for (i = vq_size - 1; i >= 0; i--) { SLIST_INSERT_HEAD(&vq->vq_freelist, &vq->vq_entries[i], qe_list); vq->vq_entries[i].qe_index = i; } bus_dmamap_sync(sc->sc_dmat, vq->vq_dmamap, 0, vq->vq_bytesize, BUS_DMASYNC_PREWRITE); /* enqueue/dequeue status */ vq->vq_avail_idx = 0; vq->vq_used_idx = 0; vq_sync_uring(sc, vq, BUS_DMASYNC_PREREAD); vq->vq_queued = 1; } /* * Allocate/free a vq. * * maxnsegs denotes how much space should be allocated for indirect * descriptors. maxnsegs == 1 can be used to disable use indirect * descriptors for this queue. */ int virtio_alloc_vq(struct virtio_softc *sc, struct virtqueue *vq, int index, int maxnsegs, const char *name) { int vq_size, allocsize1, allocsize2, allocsize3, allocsize = 0; int rsegs, r, hdrlen; #define VIRTQUEUE_ALIGN(n) (((n)+(VIRTIO_PAGE_SIZE-1))& \ ~(VIRTIO_PAGE_SIZE-1)) memset(vq, 0, sizeof(*vq)); vq_size = virtio_read_queue_size(sc, index); if (vq_size == 0) { printf("virtqueue not exist, index %d for %s\n", index, name); goto err; } if (((vq_size - 1) & vq_size) != 0) panic("vq_size not power of two: %d", vq_size); hdrlen = virtio_has_feature(sc, VIRTIO_F_RING_EVENT_IDX) ? 3 : 2; /* allocsize1: descriptor table + avail ring + pad */ allocsize1 = VIRTQUEUE_ALIGN(sizeof(struct vring_desc) * vq_size + sizeof(uint16_t) * (hdrlen + vq_size)); /* allocsize2: used ring + pad */ allocsize2 = VIRTQUEUE_ALIGN(sizeof(uint16_t) * hdrlen + sizeof(struct vring_used_elem) * vq_size); /* allocsize3: indirect table */ if (sc->sc_indirect && maxnsegs > 1) allocsize3 = sizeof(struct vring_desc) * maxnsegs * vq_size; else allocsize3 = 0; allocsize = allocsize1 + allocsize2 + allocsize3; /* alloc and map the memory */ r = bus_dmamem_alloc(sc->sc_dmat, allocsize, VIRTIO_PAGE_SIZE, 0, &vq->vq_segs[0], 1, &rsegs, BUS_DMA_NOWAIT); if (r != 0) { printf("virtqueue %d for %s allocation failed, error %d\n", index, name, r); goto err; } r = bus_dmamem_map(sc->sc_dmat, &vq->vq_segs[0], 1, allocsize, (caddr_t*)&vq->vq_vaddr, BUS_DMA_NOWAIT); if (r != 0) { printf("virtqueue %d for %s map failed, error %d\n", index, name, r); goto err; } r = bus_dmamap_create(sc->sc_dmat, allocsize, 1, allocsize, 0, BUS_DMA_NOWAIT, &vq->vq_dmamap); if (r != 0) { printf("virtqueue %d for %s dmamap creation failed, " "error %d\n", index, name, r); goto err; } r = bus_dmamap_load(sc->sc_dmat, vq->vq_dmamap, vq->vq_vaddr, allocsize, NULL, BUS_DMA_NOWAIT); if (r != 0) { printf("virtqueue %d for %s dmamap load failed, error %d\n", index, name, r); goto err; } /* remember addresses and offsets for later use */ vq->vq_owner = sc; vq->vq_num = vq_size; vq->vq_mask = vq_size - 1; vq->vq_index = index; vq->vq_desc = vq->vq_vaddr; vq->vq_availoffset = sizeof(struct vring_desc)*vq_size; vq->vq_avail = (struct vring_avail*)(((char*)vq->vq_desc) + vq->vq_availoffset); vq->vq_usedoffset = allocsize1; vq->vq_used = (struct vring_used*)(((char*)vq->vq_desc) + vq->vq_usedoffset); if (allocsize3 > 0) { vq->vq_indirectoffset = allocsize1 + allocsize2; vq->vq_indirect = (void*)(((char*)vq->vq_desc) + vq->vq_indirectoffset); } vq->vq_bytesize = allocsize; vq->vq_maxnsegs = maxnsegs; /* free slot management */ vq->vq_entries = mallocarray(vq_size, sizeof(struct vq_entry), M_DEVBUF, M_NOWAIT | M_ZERO); if (vq->vq_entries == NULL) { r = ENOMEM; goto err; } virtio_init_vq(sc, vq); virtio_setup_queue(sc, vq, vq->vq_dmamap->dm_segs[0].ds_addr); #if VIRTIO_DEBUG printf("\nallocated %u byte for virtqueue %d for %s, size %d\n", allocsize, index, name, vq_size); if (allocsize3 > 0) printf("using %d byte (%d entries) indirect descriptors\n", allocsize3, maxnsegs * vq_size); #endif return 0; err: if (vq->vq_dmamap) bus_dmamap_destroy(sc->sc_dmat, vq->vq_dmamap); if (vq->vq_vaddr) bus_dmamem_unmap(sc->sc_dmat, vq->vq_vaddr, allocsize); if (vq->vq_segs[0].ds_addr) bus_dmamem_free(sc->sc_dmat, &vq->vq_segs[0], 1); memset(vq, 0, sizeof(*vq)); return -1; } int virtio_free_vq(struct virtio_softc *sc, struct virtqueue *vq) { struct vq_entry *qe; int i = 0; /* device must be already deactivated */ /* confirm the vq is empty */ SLIST_FOREACH(qe, &vq->vq_freelist, qe_list) { i++; } if (i != vq->vq_num) { printf("%s: freeing non-empty vq, index %d\n", sc->sc_dev.dv_xname, vq->vq_index); return EBUSY; } /* tell device that there's no virtqueue any longer */ virtio_setup_queue(sc, vq, 0); free(vq->vq_entries, M_DEVBUF, 0); bus_dmamap_unload(sc->sc_dmat, vq->vq_dmamap); bus_dmamap_destroy(sc->sc_dmat, vq->vq_dmamap); bus_dmamem_unmap(sc->sc_dmat, vq->vq_vaddr, vq->vq_bytesize); bus_dmamem_free(sc->sc_dmat, &vq->vq_segs[0], 1); memset(vq, 0, sizeof(*vq)); return 0; } /* * Free descriptor management. */ struct vq_entry * vq_alloc_entry(struct virtqueue *vq) { struct vq_entry *qe; if (SLIST_EMPTY(&vq->vq_freelist)) return NULL; qe = SLIST_FIRST(&vq->vq_freelist); SLIST_REMOVE_HEAD(&vq->vq_freelist, qe_list); return qe; } void vq_free_entry(struct virtqueue *vq, struct vq_entry *qe) { SLIST_INSERT_HEAD(&vq->vq_freelist, qe, qe_list); } /* * Enqueue several dmamaps as a single request. */ /* * Typical usage: * number of followings are stored in arrays * - command blocks (in dmamem) should be pre-allocated and mapped * - dmamaps for command blocks should be pre-allocated and loaded * - dmamaps for payload should be pre-allocated * r = virtio_enqueue_prep(sc, vq, &slot); // allocate a slot * if (r) // currently 0 or EAGAIN * return r; * r = bus_dmamap_load(dmat, dmamap_payload[slot], data, count, ..); * if (r) { * virtio_enqueue_abort(sc, vq, slot); * bus_dmamap_unload(dmat, dmamap_payload[slot]); * return r; * } * r = virtio_enqueue_reserve(sc, vq, slot, * dmamap_payload[slot]->dm_nsegs+1); * // ^ +1 for command * if (r) { // currently 0 or EAGAIN * bus_dmamap_unload(dmat, dmamap_payload[slot]); * return r; // do not call abort() * } * * bus_dmamap_sync(dmat, dmamap_cmd[slot],... BUS_DMASYNC_PREWRITE); * bus_dmamap_sync(dmat, dmamap_payload[slot],...); * virtio_enqueue(sc, vq, slot, dmamap_cmd[slot], 0); * virtio_enqueue(sc, vq, slot, dmamap_payload[slot], iswrite); * virtio_enqueue_commit(sc, vq, slot, 1); * * Alternative usage with statically allocated slots: * * // while not out of slots, do * virtio_enqueue_prep(sc, vq, &slot); // allocate a slot * virtio_enqueue_reserve(sc, vq, slot, max_segs); // reserve all slots * that may ever be needed * * * // Don't call virtio_enqueue_prep() * bus_dmamap_load(dmat, dmamap_payload[slot], data, count, ..); * bus_dmamap_sync(dmat, dmamap_cmd[slot],... BUS_DMASYNC_PREWRITE); * bus_dmamap_sync(dmat, dmamap_payload[slot],...); * virtio_enqueue_trim(sc, vq, slot, num_segs_needed); * virtio_enqueue(sc, vq, slot, dmamap_cmd[slot], 0); * virtio_enqueue(sc, vq, slot, dmamap_payload[slot], iswrite); * virtio_enqueue_commit(sc, vq, slot, 1); * * * // don't call virtio_dequeue_commit() */ /* * enqueue_prep: allocate a slot number */ int virtio_enqueue_prep(struct virtqueue *vq, int *slotp) { struct vq_entry *qe1; VIRTIO_ASSERT(slotp != NULL); qe1 = vq_alloc_entry(vq); if (qe1 == NULL) return EAGAIN; /* next slot is not allocated yet */ qe1->qe_next = -1; *slotp = qe1->qe_index; return 0; } /* * enqueue_reserve: allocate remaining slots and build the descriptor chain. * Calls virtio_enqueue_abort() on failure. */ int virtio_enqueue_reserve(struct virtqueue *vq, int slot, int nsegs) { struct vq_entry *qe1 = &vq->vq_entries[slot]; VIRTIO_ASSERT(qe1->qe_next == -1); VIRTIO_ASSERT(1 <= nsegs && nsegs <= vq->vq_num); if (vq->vq_indirect != NULL && nsegs > 1 && nsegs <= vq->vq_maxnsegs) { struct vring_desc *vd; int i; qe1->qe_indirect = 1; vd = &vq->vq_desc[qe1->qe_index]; vd->addr = vq->vq_dmamap->dm_segs[0].ds_addr + vq->vq_indirectoffset; vd->addr += sizeof(struct vring_desc) * vq->vq_maxnsegs * qe1->qe_index; vd->len = sizeof(struct vring_desc) * nsegs; vd->flags = VRING_DESC_F_INDIRECT; vd = vq->vq_indirect; vd += vq->vq_maxnsegs * qe1->qe_index; qe1->qe_desc_base = vd; for (i = 0; i < nsegs-1; i++) vd[i].flags = VRING_DESC_F_NEXT; vd[i].flags = 0; qe1->qe_next = 0; return 0; } else { struct vring_desc *vd; struct vq_entry *qe; int i, s; qe1->qe_indirect = 0; vd = &vq->vq_desc[0]; qe1->qe_desc_base = vd; qe1->qe_next = qe1->qe_index; s = slot; for (i = 0; i < nsegs - 1; i++) { qe = vq_alloc_entry(vq); if (qe == NULL) { vd[s].flags = 0; virtio_enqueue_abort(vq, slot); return EAGAIN; } vd[s].flags = VRING_DESC_F_NEXT; vd[s].next = qe->qe_index; s = qe->qe_index; } vd[s].flags = 0; return 0; } } /* * enqueue: enqueue a single dmamap. */ int virtio_enqueue(struct virtqueue *vq, int slot, bus_dmamap_t dmamap, int write) { struct vq_entry *qe1 = &vq->vq_entries[slot]; struct vring_desc *vd = qe1->qe_desc_base; int i; int s = qe1->qe_next; VIRTIO_ASSERT(s >= 0); VIRTIO_ASSERT(dmamap->dm_nsegs > 0); if (dmamap->dm_nsegs > vq->vq_maxnsegs) { #if VIRTIO_DEBUG for (i = 0; i < dmamap->dm_nsegs; i++) { printf(" %d (%d): %p %lx \n", i, write, (void *)dmamap->dm_segs[i].ds_addr, dmamap->dm_segs[i].ds_len); } #endif panic("dmamap->dm_nseg %d > vq->vq_maxnsegs %d", dmamap->dm_nsegs, vq->vq_maxnsegs); } for (i = 0; i < dmamap->dm_nsegs; i++) { vd[s].addr = dmamap->dm_segs[i].ds_addr; vd[s].len = dmamap->dm_segs[i].ds_len; if (!write) vd[s].flags |= VRING_DESC_F_WRITE; s = vd[s].next; } qe1->qe_next = s; return 0; } int virtio_enqueue_p(struct virtqueue *vq, int slot, bus_dmamap_t dmamap, bus_addr_t start, bus_size_t len, int write) { struct vq_entry *qe1 = &vq->vq_entries[slot]; struct vring_desc *vd = qe1->qe_desc_base; int s = qe1->qe_next; VIRTIO_ASSERT(s >= 0); /* XXX todo: handle more segments */ VIRTIO_ASSERT(dmamap->dm_nsegs == 1); VIRTIO_ASSERT((dmamap->dm_segs[0].ds_len > start) && (dmamap->dm_segs[0].ds_len >= start + len)); vd[s].addr = dmamap->dm_segs[0].ds_addr + start; vd[s].len = len; if (!write) vd[s].flags |= VRING_DESC_F_WRITE; qe1->qe_next = vd[s].next; return 0; } static void publish_avail_idx(struct virtio_softc *sc, struct virtqueue *vq) { /* first make sure the avail ring entries are visible to the device */ vq_sync_aring(sc, vq, BUS_DMASYNC_PREWRITE); virtio_membar_producer(); vq->vq_avail->idx = vq->vq_avail_idx; /* make the avail idx visible to the device */ vq_sync_aring(sc, vq, BUS_DMASYNC_PREWRITE); vq->vq_queued = 1; } /* * enqueue_commit: add it to the aring. */ void virtio_enqueue_commit(struct virtio_softc *sc, struct virtqueue *vq, int slot, int notifynow) { struct vq_entry *qe1; if (slot < 0) goto notify; vq_sync_descs(sc, vq, BUS_DMASYNC_PREWRITE); qe1 = &vq->vq_entries[slot]; if (qe1->qe_indirect) vq_sync_indirect(sc, vq, slot, BUS_DMASYNC_PREWRITE); vq->vq_avail->ring[(vq->vq_avail_idx++) & vq->vq_mask] = slot; notify: if (notifynow) { if (virtio_has_feature(vq->vq_owner, VIRTIO_F_RING_EVENT_IDX)) { uint16_t o = vq->vq_avail->idx; uint16_t n = vq->vq_avail_idx; uint16_t t; publish_avail_idx(sc, vq); virtio_membar_sync(); vq_sync_uring_avail_event(sc, vq, BUS_DMASYNC_POSTREAD); t = VQ_AVAIL_EVENT(vq) + 1; if ((uint16_t)(n - t) < (uint16_t)(n - o)) sc->sc_ops->kick(sc, vq->vq_index); } else { publish_avail_idx(sc, vq); virtio_membar_sync(); vq_sync_uring(sc, vq, BUS_DMASYNC_POSTREAD); if (!(vq->vq_used->flags & VRING_USED_F_NO_NOTIFY)) sc->sc_ops->kick(sc, vq->vq_index); } } } /* * enqueue_abort: rollback. */ int virtio_enqueue_abort(struct virtqueue *vq, int slot) { struct vq_entry *qe = &vq->vq_entries[slot]; struct vring_desc *vd; int s; if (qe->qe_next < 0) { vq_free_entry(vq, qe); return 0; } s = slot; vd = &vq->vq_desc[0]; while (vd[s].flags & VRING_DESC_F_NEXT) { s = vd[s].next; vq_free_entry(vq, qe); qe = &vq->vq_entries[s]; } vq_free_entry(vq, qe); return 0; } /* * enqueue_trim: adjust buffer size to given # of segments, a.k.a. * descriptors. */ void virtio_enqueue_trim(struct virtqueue *vq, int slot, int nsegs) { struct vq_entry *qe1 = &vq->vq_entries[slot]; struct vring_desc *vd = &vq->vq_desc[0]; int i; if ((vd[slot].flags & VRING_DESC_F_INDIRECT) == 0) { qe1->qe_next = qe1->qe_index; /* * N.B.: the vq_entries are ASSUMED to be a contiguous * block with slot being the index to the first one. */ } else { qe1->qe_next = 0; vd = &vq->vq_desc[qe1->qe_index]; vd->len = sizeof(struct vring_desc) * nsegs; vd = qe1->qe_desc_base; slot = 0; } for (i = 0; i < nsegs -1 ; i++) { vd[slot].flags = VRING_DESC_F_NEXT; slot++; } vd[slot].flags = 0; } /* * Dequeue a request. */ /* * dequeue: dequeue a request from uring; bus_dmamap_sync for uring must * already have been done, usually by virtio_check_vq() * in the interrupt handler. This means that polling virtio_dequeue() * repeatedly until it returns 0 does not work. */ int virtio_dequeue(struct virtio_softc *sc, struct virtqueue *vq, int *slotp, int *lenp) { uint16_t slot, usedidx; struct vq_entry *qe; if (vq->vq_used_idx == vq->vq_used->idx) return ENOENT; usedidx = vq->vq_used_idx++; usedidx &= vq->vq_mask; virtio_membar_consumer(); vq_sync_uring(sc, vq, BUS_DMASYNC_POSTREAD); slot = vq->vq_used->ring[usedidx].id; qe = &vq->vq_entries[slot]; if (qe->qe_indirect) vq_sync_indirect(sc, vq, slot, BUS_DMASYNC_POSTWRITE); if (slotp) *slotp = slot; if (lenp) *lenp = vq->vq_used->ring[usedidx].len; return 0; } /* * dequeue_commit: complete dequeue; the slot is recycled for future use. * if you forget to call this the slot will be leaked. * * Don't call this if you use statically allocated slots * and virtio_enqueue_trim(). */ int virtio_dequeue_commit(struct virtqueue *vq, int slot) { struct vq_entry *qe = &vq->vq_entries[slot]; struct vring_desc *vd = &vq->vq_desc[0]; int s = slot; while (vd[s].flags & VRING_DESC_F_NEXT) { s = vd[s].next; vq_free_entry(vq, qe); qe = &vq->vq_entries[s]; } vq_free_entry(vq, qe); return 0; } /* * Increase the event index in order to delay interrupts. * Returns 0 on success; returns 1 if the used ring has already advanced * too far, and the caller must process the queue again (otherwise, no * more interrupts will happen). */ int virtio_postpone_intr(struct virtqueue *vq, uint16_t nslots) { uint16_t idx; idx = vq->vq_used_idx + nslots; /* set the new event index: avail_ring->used_event = idx */ VQ_USED_EVENT(vq) = idx; virtio_membar_sync(); vq_sync_aring_used_event(vq->vq_owner, vq, BUS_DMASYNC_PREWRITE); vq->vq_queued++; if (nslots < virtio_nused(vq)) return 1; return 0; } /* * Postpone interrupt until 3/4 of the available descriptors have been * consumed. */ int virtio_postpone_intr_smart(struct virtqueue *vq) { uint16_t nslots; nslots = (uint16_t)(vq->vq_avail->idx - vq->vq_used_idx) * 3 / 4; return virtio_postpone_intr(vq, nslots); } /* * Postpone interrupt until all of the available descriptors have been * consumed. */ int virtio_postpone_intr_far(struct virtqueue *vq) { uint16_t nslots; nslots = (uint16_t)(vq->vq_avail->idx - vq->vq_used_idx); return virtio_postpone_intr(vq, nslots); } /* * Start/stop vq interrupt. No guarantee. */ void virtio_stop_vq_intr(struct virtio_softc *sc, struct virtqueue *vq) { if (virtio_has_feature(sc, VIRTIO_F_RING_EVENT_IDX)) { /* * No way to disable the interrupt completely with * RingEventIdx. Instead advance used_event by half * the possible value. This won't happen soon and * is far enough in the past to not trigger a spurious * interrupt. */ VQ_USED_EVENT(vq) = vq->vq_used_idx + 0x8000; vq_sync_aring_used_event(sc, vq, BUS_DMASYNC_PREWRITE); } else { vq->vq_avail->flags |= VRING_AVAIL_F_NO_INTERRUPT; } vq_sync_aring(sc, vq, BUS_DMASYNC_PREWRITE); vq->vq_queued++; } int virtio_start_vq_intr(struct virtio_softc *sc, struct virtqueue *vq) { /* * If event index feature is negotiated, enabling * interrupts is done through setting the latest * consumed index in the used_event field */ if (virtio_has_feature(sc, VIRTIO_F_RING_EVENT_IDX)) { VQ_USED_EVENT(vq) = vq->vq_used_idx; vq_sync_aring_used_event(sc, vq, BUS_DMASYNC_PREWRITE); } else { vq->vq_avail->flags &= ~VRING_AVAIL_F_NO_INTERRUPT; vq_sync_aring(sc, vq, BUS_DMASYNC_PREWRITE); } virtio_membar_sync(); vq->vq_queued++; vq_sync_uring(sc, vq, BUS_DMASYNC_POSTREAD); if (vq->vq_used_idx != vq->vq_used->idx) return 1; return 0; } /* * Returns a number of slots in the used ring available to * be supplied to the avail ring. */ int virtio_nused(struct virtqueue *vq) { uint16_t n; vq_sync_uring(vq->vq_owner, vq, BUS_DMASYNC_POSTREAD); n = (uint16_t)(vq->vq_used->idx - vq->vq_used_idx); VIRTIO_ASSERT(n <= vq->vq_num); return n; } #if VIRTIO_DEBUG void virtio_vq_dump(struct virtqueue *vq) { #if VIRTIO_DEBUG >= 2 int i; #endif /* Common fields */ printf(" + addr: %p\n", vq); printf(" + vq num: %d\n", vq->vq_num); printf(" + vq mask: 0x%X\n", vq->vq_mask); printf(" + vq index: %d\n", vq->vq_index); printf(" + vq used idx: %d\n", vq->vq_used_idx); printf(" + vq avail idx: %d\n", vq->vq_avail_idx); printf(" + vq queued: %d\n",vq->vq_queued); #if VIRTIO_DEBUG >= 2 for (i = 0; i < vq->vq_num; i++) { struct vring_desc *desc = &vq->vq_desc[i]; printf(" D%-3d len:%d flags:%d next:%d\n", i, desc->len, desc->flags, desc->next); } #endif /* Avail ring fields */ printf(" + avail flags: 0x%X\n", vq->vq_avail->flags); printf(" + avail idx: %d\n", vq->vq_avail->idx); printf(" + avail event: %d\n", VQ_AVAIL_EVENT(vq)); #if VIRTIO_DEBUG >= 2 for (i = 0; i < vq->vq_num; i++) printf(" A%-3d idx:%d\n", i, vq->vq_avail->ring[i]); #endif /* Used ring fields */ printf(" + used flags: 0x%X\n",vq->vq_used->flags); printf(" + used idx: %d\n",vq->vq_used->idx); printf(" + used event: %d\n", VQ_USED_EVENT(vq)); #if VIRTIO_DEBUG >= 2 for (i = 0; i < vq->vq_num; i++) { printf(" U%-3d id:%d len:%d\n", i, vq->vq_used->ring[i].id, vq->vq_used->ring[i].len); } #endif printf(" +++++++++++++++++++++++++++\n"); } #endif