src/sys/dev/pv/virtio.c

1032 lines
27 KiB
C

/* $OpenBSD: virtio.c,v 1.31 2024/08/27 18:44:12 sf Exp $ */
/* $NetBSD: virtio.c,v 1.3 2011/11/02 23:05:52 njoly Exp $ */
/*
* Copyright (c) 2012 Stefan Fritsch, Alexander Fiveg.
* Copyright (c) 2010 Minoura Makoto.
* All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
*
* THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
* IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
* OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
* IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
* INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
* NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
* DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
* THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
* THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*/
#include <sys/param.h>
#include <sys/systm.h>
#include <sys/device.h>
#include <sys/atomic.h>
#include <sys/malloc.h>
#include <dev/pv/virtioreg.h>
#include <dev/pv/virtiovar.h>
#if VIRTIO_DEBUG
#define VIRTIO_ASSERT(x) KASSERT(x)
#else
#define VIRTIO_ASSERT(x)
#endif
void virtio_init_vq(struct virtio_softc *,
struct virtqueue *);
void vq_free_entry(struct virtqueue *, struct vq_entry *);
struct vq_entry *vq_alloc_entry(struct virtqueue *);
struct cfdriver virtio_cd = {
NULL, "virtio", DV_DULL
};
static const char * const virtio_device_name[] = {
"Unknown (0)", /* 0 */
"Network", /* 1 */
"Block", /* 2 */
"Console", /* 3 */
"Entropy", /* 4 */
"Memory Balloon", /* 5 */
"IO Memory", /* 6 */
"Rpmsg", /* 7 */
"SCSI host", /* 8 */
"9P Transport", /* 9 */
"mac80211 wlan", /* 10 */
NULL, /* 11 */
NULL, /* 12 */
NULL, /* 13 */
NULL, /* 14 */
NULL, /* 15 */
"GPU", /* 16 */
};
#define NDEVNAMES (sizeof(virtio_device_name)/sizeof(char*))
const char *
virtio_device_string(int id)
{
return id < NDEVNAMES ? virtio_device_name[id] : "Unknown";
}
#if VIRTIO_DEBUG
static const struct virtio_feature_name transport_feature_names[] = {
{ VIRTIO_F_NOTIFY_ON_EMPTY, "NotifyOnEmpty"},
{ VIRTIO_F_ANY_LAYOUT, "AnyLayout"},
{ VIRTIO_F_RING_INDIRECT_DESC, "RingIndirectDesc"},
{ VIRTIO_F_RING_EVENT_IDX, "RingEventIdx"},
{ VIRTIO_F_BAD_FEATURE, "BadFeature"},
{ VIRTIO_F_VERSION_1, "Version1"},
{ VIRTIO_F_ACCESS_PLATFORM, "AccessPlatf"},
{ VIRTIO_F_RING_PACKED, "RingPacked"},
{ VIRTIO_F_IN_ORDER, "InOrder"},
{ VIRTIO_F_ORDER_PLATFORM, "OrderPlatf"},
{ VIRTIO_F_SR_IOV, "SrIov"},
{ VIRTIO_F_NOTIFICATION_DATA, "NotifData"},
{ VIRTIO_F_NOTIF_CONFIG_DATA, "NotifConfData"},
{ VIRTIO_F_RING_RESET, "RingReset"},
{ 0, NULL}
};
void
virtio_log_features(uint64_t host, uint64_t neg,
const struct virtio_feature_name *guest_feature_names)
{
const struct virtio_feature_name *namep;
int i;
char c;
uint64_t bit;
for (i = 0; i < 64; i++) {
if (i == 30) {
/*
* VIRTIO_F_BAD_FEATURE is only used for
* checking correct negotiation
*/
continue;
}
bit = 1ULL << i;
if ((host&bit) == 0)
continue;
namep = guest_feature_names;
while (namep->bit && namep->bit != bit)
namep++;
if (namep->name == NULL) {
namep = transport_feature_names;
while (namep->bit && namep->bit != bit)
namep++;
}
c = (neg&bit) ? '+' : '-';
if (namep->name)
printf(" %c%s", c, namep->name);
else
printf(" %cUnknown(%d)", c, i);
}
}
#endif
/*
* Reset the device.
*/
/*
* To reset the device to a known state, do following:
* virtio_reset(sc); // this will stop the device activity
* <dequeue finished requests>; // virtio_dequeue() still can be called
* <revoke pending requests in the vqs if any>;
* virtio_reinit_start(sc); // dequeue prohibited
* <some other initialization>;
* virtio_reinit_end(sc); // device activated; enqueue allowed
* Once attached, features are assumed to not change again.
*/
void
virtio_reset(struct virtio_softc *sc)
{
virtio_device_reset(sc);
sc->sc_active_features = 0;
}
void
virtio_reinit_start(struct virtio_softc *sc)
{
int i;
virtio_set_status(sc, VIRTIO_CONFIG_DEVICE_STATUS_ACK);
virtio_set_status(sc, VIRTIO_CONFIG_DEVICE_STATUS_DRIVER);
virtio_negotiate_features(sc, NULL);
for (i = 0; i < sc->sc_nvqs; i++) {
int n;
struct virtqueue *vq = &sc->sc_vqs[i];
n = virtio_read_queue_size(sc, vq->vq_index);
if (n == 0) /* vq disappeared */
continue;
if (n != vq->vq_num) {
panic("%s: virtqueue size changed, vq index %d",
sc->sc_dev.dv_xname, vq->vq_index);
}
virtio_init_vq(sc, vq);
virtio_setup_queue(sc, vq, vq->vq_dmamap->dm_segs[0].ds_addr);
}
}
void
virtio_reinit_end(struct virtio_softc *sc)
{
virtio_set_status(sc, VIRTIO_CONFIG_DEVICE_STATUS_DRIVER_OK);
}
/*
* dmamap sync operations for a virtqueue.
*
* XXX These should be more fine grained. Syncing the whole ring if we
* XXX only need a few bytes is inefficient if we use bounce buffers.
*/
static inline void
vq_sync_descs(struct virtio_softc *sc, struct virtqueue *vq, int ops)
{
/* availoffset == sizeof(vring_desc)*vq_num */
bus_dmamap_sync(sc->sc_dmat, vq->vq_dmamap, 0, vq->vq_availoffset,
ops);
}
static inline void
vq_sync_aring(struct virtio_softc *sc, struct virtqueue *vq, int ops)
{
bus_dmamap_sync(sc->sc_dmat, vq->vq_dmamap, vq->vq_availoffset,
offsetof(struct vring_avail, ring) + vq->vq_num * sizeof(uint16_t),
ops);
}
static inline void
vq_sync_aring_used_event(struct virtio_softc *sc, struct virtqueue *vq, int ops)
{
bus_dmamap_sync(sc->sc_dmat, vq->vq_dmamap, vq->vq_availoffset +
offsetof(struct vring_avail, ring) + vq->vq_num * sizeof(uint16_t),
sizeof(uint16_t), ops);
}
static inline void
vq_sync_uring(struct virtio_softc *sc, struct virtqueue *vq, int ops)
{
bus_dmamap_sync(sc->sc_dmat, vq->vq_dmamap, vq->vq_usedoffset,
offsetof(struct vring_used, ring) + vq->vq_num *
sizeof(struct vring_used_elem), ops);
}
static inline void
vq_sync_uring_avail_event(struct virtio_softc *sc, struct virtqueue *vq, int ops)
{
bus_dmamap_sync(sc->sc_dmat, vq->vq_dmamap,
vq->vq_usedoffset + offsetof(struct vring_used, ring) +
vq->vq_num * sizeof(struct vring_used_elem), sizeof(uint16_t),
ops);
}
static inline void
vq_sync_indirect(struct virtio_softc *sc, struct virtqueue *vq, int slot,
int ops)
{
int offset = vq->vq_indirectoffset +
sizeof(struct vring_desc) * vq->vq_maxnsegs * slot;
bus_dmamap_sync(sc->sc_dmat, vq->vq_dmamap, offset,
sizeof(struct vring_desc) * vq->vq_maxnsegs, ops);
}
/*
* Scan vq, bus_dmamap_sync for the vqs (not for the payload),
* and calls (*vq_done)() if some entries are consumed.
* For use in transport specific irq handlers.
*/
int
virtio_check_vqs(struct virtio_softc *sc)
{
int i, r = 0;
/* going backwards is better for if_vio */
for (i = sc->sc_nvqs - 1; i >= 0; i--)
r |= virtio_check_vq(sc, &sc->sc_vqs[i]);
return r;
}
int
virtio_check_vq(struct virtio_softc *sc, struct virtqueue *vq)
{
if (vq->vq_queued) {
vq->vq_queued = 0;
vq_sync_aring(sc, vq, BUS_DMASYNC_POSTWRITE);
}
vq_sync_uring(sc, vq, BUS_DMASYNC_POSTREAD);
if (vq->vq_used_idx != vq->vq_used->idx) {
if (vq->vq_done)
return (vq->vq_done)(vq);
}
return 0;
}
/*
* Initialize vq structure.
*/
void
virtio_init_vq(struct virtio_softc *sc, struct virtqueue *vq)
{
int i, j;
int vq_size = vq->vq_num;
memset(vq->vq_vaddr, 0, vq->vq_bytesize);
/* build the indirect descriptor chain */
if (vq->vq_indirect != NULL) {
struct vring_desc *vd;
for (i = 0; i < vq_size; i++) {
vd = vq->vq_indirect;
vd += vq->vq_maxnsegs * i;
for (j = 0; j < vq->vq_maxnsegs-1; j++)
vd[j].next = j + 1;
}
}
/* free slot management */
SLIST_INIT(&vq->vq_freelist);
/*
* virtio_enqueue_trim needs monotonely raising entries, therefore
* initialize in reverse order
*/
for (i = vq_size - 1; i >= 0; i--) {
SLIST_INSERT_HEAD(&vq->vq_freelist, &vq->vq_entries[i],
qe_list);
vq->vq_entries[i].qe_index = i;
}
bus_dmamap_sync(sc->sc_dmat, vq->vq_dmamap, 0, vq->vq_bytesize,
BUS_DMASYNC_PREWRITE);
/* enqueue/dequeue status */
vq->vq_avail_idx = 0;
vq->vq_used_idx = 0;
vq_sync_uring(sc, vq, BUS_DMASYNC_PREREAD);
vq->vq_queued = 1;
}
/*
* Allocate/free a vq.
*
* maxnsegs denotes how much space should be allocated for indirect
* descriptors. maxnsegs == 1 can be used to disable use indirect
* descriptors for this queue.
*/
int
virtio_alloc_vq(struct virtio_softc *sc, struct virtqueue *vq, int index,
int maxnsegs, const char *name)
{
int vq_size, allocsize1, allocsize2, allocsize3, allocsize = 0;
int rsegs, r, hdrlen;
#define VIRTQUEUE_ALIGN(n) (((n)+(VIRTIO_PAGE_SIZE-1))& \
~(VIRTIO_PAGE_SIZE-1))
memset(vq, 0, sizeof(*vq));
vq_size = virtio_read_queue_size(sc, index);
if (vq_size == 0) {
printf("virtqueue not exist, index %d for %s\n", index, name);
goto err;
}
if (((vq_size - 1) & vq_size) != 0)
panic("vq_size not power of two: %d", vq_size);
hdrlen = virtio_has_feature(sc, VIRTIO_F_RING_EVENT_IDX) ? 3 : 2;
/* allocsize1: descriptor table + avail ring + pad */
allocsize1 = VIRTQUEUE_ALIGN(sizeof(struct vring_desc) * vq_size
+ sizeof(uint16_t) * (hdrlen + vq_size));
/* allocsize2: used ring + pad */
allocsize2 = VIRTQUEUE_ALIGN(sizeof(uint16_t) * hdrlen
+ sizeof(struct vring_used_elem) * vq_size);
/* allocsize3: indirect table */
if (sc->sc_indirect && maxnsegs > 1)
allocsize3 = sizeof(struct vring_desc) * maxnsegs * vq_size;
else
allocsize3 = 0;
allocsize = allocsize1 + allocsize2 + allocsize3;
/* alloc and map the memory */
r = bus_dmamem_alloc(sc->sc_dmat, allocsize, VIRTIO_PAGE_SIZE, 0,
&vq->vq_segs[0], 1, &rsegs, BUS_DMA_NOWAIT);
if (r != 0) {
printf("virtqueue %d for %s allocation failed, error %d\n",
index, name, r);
goto err;
}
r = bus_dmamem_map(sc->sc_dmat, &vq->vq_segs[0], 1, allocsize,
(caddr_t*)&vq->vq_vaddr, BUS_DMA_NOWAIT);
if (r != 0) {
printf("virtqueue %d for %s map failed, error %d\n", index,
name, r);
goto err;
}
r = bus_dmamap_create(sc->sc_dmat, allocsize, 1, allocsize, 0,
BUS_DMA_NOWAIT, &vq->vq_dmamap);
if (r != 0) {
printf("virtqueue %d for %s dmamap creation failed, "
"error %d\n", index, name, r);
goto err;
}
r = bus_dmamap_load(sc->sc_dmat, vq->vq_dmamap, vq->vq_vaddr,
allocsize, NULL, BUS_DMA_NOWAIT);
if (r != 0) {
printf("virtqueue %d for %s dmamap load failed, error %d\n",
index, name, r);
goto err;
}
/* remember addresses and offsets for later use */
vq->vq_owner = sc;
vq->vq_num = vq_size;
vq->vq_mask = vq_size - 1;
vq->vq_index = index;
vq->vq_desc = vq->vq_vaddr;
vq->vq_availoffset = sizeof(struct vring_desc)*vq_size;
vq->vq_avail = (struct vring_avail*)(((char*)vq->vq_desc) +
vq->vq_availoffset);
vq->vq_usedoffset = allocsize1;
vq->vq_used = (struct vring_used*)(((char*)vq->vq_desc) +
vq->vq_usedoffset);
if (allocsize3 > 0) {
vq->vq_indirectoffset = allocsize1 + allocsize2;
vq->vq_indirect = (void*)(((char*)vq->vq_desc)
+ vq->vq_indirectoffset);
}
vq->vq_bytesize = allocsize;
vq->vq_maxnsegs = maxnsegs;
/* free slot management */
vq->vq_entries = mallocarray(vq_size, sizeof(struct vq_entry),
M_DEVBUF, M_NOWAIT | M_ZERO);
if (vq->vq_entries == NULL) {
r = ENOMEM;
goto err;
}
virtio_init_vq(sc, vq);
virtio_setup_queue(sc, vq, vq->vq_dmamap->dm_segs[0].ds_addr);
#if VIRTIO_DEBUG
printf("\nallocated %u byte for virtqueue %d for %s, size %d\n",
allocsize, index, name, vq_size);
if (allocsize3 > 0)
printf("using %d byte (%d entries) indirect descriptors\n",
allocsize3, maxnsegs * vq_size);
#endif
return 0;
err:
if (vq->vq_dmamap)
bus_dmamap_destroy(sc->sc_dmat, vq->vq_dmamap);
if (vq->vq_vaddr)
bus_dmamem_unmap(sc->sc_dmat, vq->vq_vaddr, allocsize);
if (vq->vq_segs[0].ds_addr)
bus_dmamem_free(sc->sc_dmat, &vq->vq_segs[0], 1);
memset(vq, 0, sizeof(*vq));
return -1;
}
int
virtio_free_vq(struct virtio_softc *sc, struct virtqueue *vq)
{
struct vq_entry *qe;
int i = 0;
/* device must be already deactivated */
/* confirm the vq is empty */
SLIST_FOREACH(qe, &vq->vq_freelist, qe_list) {
i++;
}
if (i != vq->vq_num) {
printf("%s: freeing non-empty vq, index %d\n",
sc->sc_dev.dv_xname, vq->vq_index);
return EBUSY;
}
/* tell device that there's no virtqueue any longer */
virtio_setup_queue(sc, vq, 0);
free(vq->vq_entries, M_DEVBUF, 0);
bus_dmamap_unload(sc->sc_dmat, vq->vq_dmamap);
bus_dmamap_destroy(sc->sc_dmat, vq->vq_dmamap);
bus_dmamem_unmap(sc->sc_dmat, vq->vq_vaddr, vq->vq_bytesize);
bus_dmamem_free(sc->sc_dmat, &vq->vq_segs[0], 1);
memset(vq, 0, sizeof(*vq));
return 0;
}
/*
* Free descriptor management.
*/
struct vq_entry *
vq_alloc_entry(struct virtqueue *vq)
{
struct vq_entry *qe;
if (SLIST_EMPTY(&vq->vq_freelist))
return NULL;
qe = SLIST_FIRST(&vq->vq_freelist);
SLIST_REMOVE_HEAD(&vq->vq_freelist, qe_list);
return qe;
}
void
vq_free_entry(struct virtqueue *vq, struct vq_entry *qe)
{
SLIST_INSERT_HEAD(&vq->vq_freelist, qe, qe_list);
}
/*
* Enqueue several dmamaps as a single request.
*/
/*
* Typical usage:
* <queue size> number of followings are stored in arrays
* - command blocks (in dmamem) should be pre-allocated and mapped
* - dmamaps for command blocks should be pre-allocated and loaded
* - dmamaps for payload should be pre-allocated
* r = virtio_enqueue_prep(sc, vq, &slot); // allocate a slot
* if (r) // currently 0 or EAGAIN
* return r;
* r = bus_dmamap_load(dmat, dmamap_payload[slot], data, count, ..);
* if (r) {
* virtio_enqueue_abort(sc, vq, slot);
* bus_dmamap_unload(dmat, dmamap_payload[slot]);
* return r;
* }
* r = virtio_enqueue_reserve(sc, vq, slot,
* dmamap_payload[slot]->dm_nsegs+1);
* // ^ +1 for command
* if (r) { // currently 0 or EAGAIN
* bus_dmamap_unload(dmat, dmamap_payload[slot]);
* return r; // do not call abort()
* }
* <setup and prepare commands>
* bus_dmamap_sync(dmat, dmamap_cmd[slot],... BUS_DMASYNC_PREWRITE);
* bus_dmamap_sync(dmat, dmamap_payload[slot],...);
* virtio_enqueue(sc, vq, slot, dmamap_cmd[slot], 0);
* virtio_enqueue(sc, vq, slot, dmamap_payload[slot], iswrite);
* virtio_enqueue_commit(sc, vq, slot, 1);
*
* Alternative usage with statically allocated slots:
* <during initialization>
* // while not out of slots, do
* virtio_enqueue_prep(sc, vq, &slot); // allocate a slot
* virtio_enqueue_reserve(sc, vq, slot, max_segs); // reserve all slots
* that may ever be needed
*
* <when enqueuing a request>
* // Don't call virtio_enqueue_prep()
* bus_dmamap_load(dmat, dmamap_payload[slot], data, count, ..);
* bus_dmamap_sync(dmat, dmamap_cmd[slot],... BUS_DMASYNC_PREWRITE);
* bus_dmamap_sync(dmat, dmamap_payload[slot],...);
* virtio_enqueue_trim(sc, vq, slot, num_segs_needed);
* virtio_enqueue(sc, vq, slot, dmamap_cmd[slot], 0);
* virtio_enqueue(sc, vq, slot, dmamap_payload[slot], iswrite);
* virtio_enqueue_commit(sc, vq, slot, 1);
*
* <when dequeuing>
* // don't call virtio_dequeue_commit()
*/
/*
* enqueue_prep: allocate a slot number
*/
int
virtio_enqueue_prep(struct virtqueue *vq, int *slotp)
{
struct vq_entry *qe1;
VIRTIO_ASSERT(slotp != NULL);
qe1 = vq_alloc_entry(vq);
if (qe1 == NULL)
return EAGAIN;
/* next slot is not allocated yet */
qe1->qe_next = -1;
*slotp = qe1->qe_index;
return 0;
}
/*
* enqueue_reserve: allocate remaining slots and build the descriptor chain.
* Calls virtio_enqueue_abort() on failure.
*/
int
virtio_enqueue_reserve(struct virtqueue *vq, int slot, int nsegs)
{
struct vq_entry *qe1 = &vq->vq_entries[slot];
VIRTIO_ASSERT(qe1->qe_next == -1);
VIRTIO_ASSERT(1 <= nsegs && nsegs <= vq->vq_num);
if (vq->vq_indirect != NULL && nsegs > 1 && nsegs <= vq->vq_maxnsegs) {
struct vring_desc *vd;
int i;
qe1->qe_indirect = 1;
vd = &vq->vq_desc[qe1->qe_index];
vd->addr = vq->vq_dmamap->dm_segs[0].ds_addr +
vq->vq_indirectoffset;
vd->addr += sizeof(struct vring_desc) * vq->vq_maxnsegs *
qe1->qe_index;
vd->len = sizeof(struct vring_desc) * nsegs;
vd->flags = VRING_DESC_F_INDIRECT;
vd = vq->vq_indirect;
vd += vq->vq_maxnsegs * qe1->qe_index;
qe1->qe_desc_base = vd;
for (i = 0; i < nsegs-1; i++)
vd[i].flags = VRING_DESC_F_NEXT;
vd[i].flags = 0;
qe1->qe_next = 0;
return 0;
} else {
struct vring_desc *vd;
struct vq_entry *qe;
int i, s;
qe1->qe_indirect = 0;
vd = &vq->vq_desc[0];
qe1->qe_desc_base = vd;
qe1->qe_next = qe1->qe_index;
s = slot;
for (i = 0; i < nsegs - 1; i++) {
qe = vq_alloc_entry(vq);
if (qe == NULL) {
vd[s].flags = 0;
virtio_enqueue_abort(vq, slot);
return EAGAIN;
}
vd[s].flags = VRING_DESC_F_NEXT;
vd[s].next = qe->qe_index;
s = qe->qe_index;
}
vd[s].flags = 0;
return 0;
}
}
/*
* enqueue: enqueue a single dmamap.
*/
int
virtio_enqueue(struct virtqueue *vq, int slot, bus_dmamap_t dmamap, int write)
{
struct vq_entry *qe1 = &vq->vq_entries[slot];
struct vring_desc *vd = qe1->qe_desc_base;
int i;
int s = qe1->qe_next;
VIRTIO_ASSERT(s >= 0);
VIRTIO_ASSERT(dmamap->dm_nsegs > 0);
if (dmamap->dm_nsegs > vq->vq_maxnsegs) {
#if VIRTIO_DEBUG
for (i = 0; i < dmamap->dm_nsegs; i++) {
printf(" %d (%d): %p %lx \n", i, write,
(void *)dmamap->dm_segs[i].ds_addr,
dmamap->dm_segs[i].ds_len);
}
#endif
panic("dmamap->dm_nseg %d > vq->vq_maxnsegs %d",
dmamap->dm_nsegs, vq->vq_maxnsegs);
}
for (i = 0; i < dmamap->dm_nsegs; i++) {
vd[s].addr = dmamap->dm_segs[i].ds_addr;
vd[s].len = dmamap->dm_segs[i].ds_len;
if (!write)
vd[s].flags |= VRING_DESC_F_WRITE;
s = vd[s].next;
}
qe1->qe_next = s;
return 0;
}
int
virtio_enqueue_p(struct virtqueue *vq, int slot, bus_dmamap_t dmamap,
bus_addr_t start, bus_size_t len, int write)
{
struct vq_entry *qe1 = &vq->vq_entries[slot];
struct vring_desc *vd = qe1->qe_desc_base;
int s = qe1->qe_next;
VIRTIO_ASSERT(s >= 0);
/* XXX todo: handle more segments */
VIRTIO_ASSERT(dmamap->dm_nsegs == 1);
VIRTIO_ASSERT((dmamap->dm_segs[0].ds_len > start) &&
(dmamap->dm_segs[0].ds_len >= start + len));
vd[s].addr = dmamap->dm_segs[0].ds_addr + start;
vd[s].len = len;
if (!write)
vd[s].flags |= VRING_DESC_F_WRITE;
qe1->qe_next = vd[s].next;
return 0;
}
static void
publish_avail_idx(struct virtio_softc *sc, struct virtqueue *vq)
{
/* first make sure the avail ring entries are visible to the device */
vq_sync_aring(sc, vq, BUS_DMASYNC_PREWRITE);
virtio_membar_producer();
vq->vq_avail->idx = vq->vq_avail_idx;
/* make the avail idx visible to the device */
vq_sync_aring(sc, vq, BUS_DMASYNC_PREWRITE);
vq->vq_queued = 1;
}
/*
* enqueue_commit: add it to the aring.
*/
void
virtio_enqueue_commit(struct virtio_softc *sc, struct virtqueue *vq, int slot,
int notifynow)
{
struct vq_entry *qe1;
if (slot < 0)
goto notify;
vq_sync_descs(sc, vq, BUS_DMASYNC_PREWRITE);
qe1 = &vq->vq_entries[slot];
if (qe1->qe_indirect)
vq_sync_indirect(sc, vq, slot, BUS_DMASYNC_PREWRITE);
vq->vq_avail->ring[(vq->vq_avail_idx++) & vq->vq_mask] = slot;
notify:
if (notifynow) {
if (virtio_has_feature(vq->vq_owner, VIRTIO_F_RING_EVENT_IDX)) {
uint16_t o = vq->vq_avail->idx;
uint16_t n = vq->vq_avail_idx;
uint16_t t;
publish_avail_idx(sc, vq);
virtio_membar_sync();
vq_sync_uring_avail_event(sc, vq, BUS_DMASYNC_POSTREAD);
t = VQ_AVAIL_EVENT(vq) + 1;
if ((uint16_t)(n - t) < (uint16_t)(n - o))
sc->sc_ops->kick(sc, vq->vq_index);
} else {
publish_avail_idx(sc, vq);
virtio_membar_sync();
vq_sync_uring(sc, vq, BUS_DMASYNC_POSTREAD);
if (!(vq->vq_used->flags & VRING_USED_F_NO_NOTIFY))
sc->sc_ops->kick(sc, vq->vq_index);
}
}
}
/*
* enqueue_abort: rollback.
*/
int
virtio_enqueue_abort(struct virtqueue *vq, int slot)
{
struct vq_entry *qe = &vq->vq_entries[slot];
struct vring_desc *vd;
int s;
if (qe->qe_next < 0) {
vq_free_entry(vq, qe);
return 0;
}
s = slot;
vd = &vq->vq_desc[0];
while (vd[s].flags & VRING_DESC_F_NEXT) {
s = vd[s].next;
vq_free_entry(vq, qe);
qe = &vq->vq_entries[s];
}
vq_free_entry(vq, qe);
return 0;
}
/*
* enqueue_trim: adjust buffer size to given # of segments, a.k.a.
* descriptors.
*/
void
virtio_enqueue_trim(struct virtqueue *vq, int slot, int nsegs)
{
struct vq_entry *qe1 = &vq->vq_entries[slot];
struct vring_desc *vd = &vq->vq_desc[0];
int i;
if ((vd[slot].flags & VRING_DESC_F_INDIRECT) == 0) {
qe1->qe_next = qe1->qe_index;
/*
* N.B.: the vq_entries are ASSUMED to be a contiguous
* block with slot being the index to the first one.
*/
} else {
qe1->qe_next = 0;
vd = &vq->vq_desc[qe1->qe_index];
vd->len = sizeof(struct vring_desc) * nsegs;
vd = qe1->qe_desc_base;
slot = 0;
}
for (i = 0; i < nsegs -1 ; i++) {
vd[slot].flags = VRING_DESC_F_NEXT;
slot++;
}
vd[slot].flags = 0;
}
/*
* Dequeue a request.
*/
/*
* dequeue: dequeue a request from uring; bus_dmamap_sync for uring must
* already have been done, usually by virtio_check_vq()
* in the interrupt handler. This means that polling virtio_dequeue()
* repeatedly until it returns 0 does not work.
*/
int
virtio_dequeue(struct virtio_softc *sc, struct virtqueue *vq,
int *slotp, int *lenp)
{
uint16_t slot, usedidx;
struct vq_entry *qe;
if (vq->vq_used_idx == vq->vq_used->idx)
return ENOENT;
usedidx = vq->vq_used_idx++;
usedidx &= vq->vq_mask;
virtio_membar_consumer();
vq_sync_uring(sc, vq, BUS_DMASYNC_POSTREAD);
slot = vq->vq_used->ring[usedidx].id;
qe = &vq->vq_entries[slot];
if (qe->qe_indirect)
vq_sync_indirect(sc, vq, slot, BUS_DMASYNC_POSTWRITE);
if (slotp)
*slotp = slot;
if (lenp)
*lenp = vq->vq_used->ring[usedidx].len;
return 0;
}
/*
* dequeue_commit: complete dequeue; the slot is recycled for future use.
* if you forget to call this the slot will be leaked.
*
* Don't call this if you use statically allocated slots
* and virtio_enqueue_trim().
*/
int
virtio_dequeue_commit(struct virtqueue *vq, int slot)
{
struct vq_entry *qe = &vq->vq_entries[slot];
struct vring_desc *vd = &vq->vq_desc[0];
int s = slot;
while (vd[s].flags & VRING_DESC_F_NEXT) {
s = vd[s].next;
vq_free_entry(vq, qe);
qe = &vq->vq_entries[s];
}
vq_free_entry(vq, qe);
return 0;
}
/*
* Increase the event index in order to delay interrupts.
* Returns 0 on success; returns 1 if the used ring has already advanced
* too far, and the caller must process the queue again (otherwise, no
* more interrupts will happen).
*/
int
virtio_postpone_intr(struct virtqueue *vq, uint16_t nslots)
{
uint16_t idx;
idx = vq->vq_used_idx + nslots;
/* set the new event index: avail_ring->used_event = idx */
VQ_USED_EVENT(vq) = idx;
virtio_membar_sync();
vq_sync_aring_used_event(vq->vq_owner, vq, BUS_DMASYNC_PREWRITE);
vq->vq_queued++;
if (nslots < virtio_nused(vq))
return 1;
return 0;
}
/*
* Postpone interrupt until 3/4 of the available descriptors have been
* consumed.
*/
int
virtio_postpone_intr_smart(struct virtqueue *vq)
{
uint16_t nslots;
nslots = (uint16_t)(vq->vq_avail->idx - vq->vq_used_idx) * 3 / 4;
return virtio_postpone_intr(vq, nslots);
}
/*
* Postpone interrupt until all of the available descriptors have been
* consumed.
*/
int
virtio_postpone_intr_far(struct virtqueue *vq)
{
uint16_t nslots;
nslots = (uint16_t)(vq->vq_avail->idx - vq->vq_used_idx);
return virtio_postpone_intr(vq, nslots);
}
/*
* Start/stop vq interrupt. No guarantee.
*/
void
virtio_stop_vq_intr(struct virtio_softc *sc, struct virtqueue *vq)
{
if (virtio_has_feature(sc, VIRTIO_F_RING_EVENT_IDX)) {
/*
* No way to disable the interrupt completely with
* RingEventIdx. Instead advance used_event by half
* the possible value. This won't happen soon and
* is far enough in the past to not trigger a spurious
* interrupt.
*/
VQ_USED_EVENT(vq) = vq->vq_used_idx + 0x8000;
vq_sync_aring_used_event(sc, vq, BUS_DMASYNC_PREWRITE);
} else {
vq->vq_avail->flags |= VRING_AVAIL_F_NO_INTERRUPT;
}
vq_sync_aring(sc, vq, BUS_DMASYNC_PREWRITE);
vq->vq_queued++;
}
int
virtio_start_vq_intr(struct virtio_softc *sc, struct virtqueue *vq)
{
/*
* If event index feature is negotiated, enabling
* interrupts is done through setting the latest
* consumed index in the used_event field
*/
if (virtio_has_feature(sc, VIRTIO_F_RING_EVENT_IDX)) {
VQ_USED_EVENT(vq) = vq->vq_used_idx;
vq_sync_aring_used_event(sc, vq, BUS_DMASYNC_PREWRITE);
} else {
vq->vq_avail->flags &= ~VRING_AVAIL_F_NO_INTERRUPT;
vq_sync_aring(sc, vq, BUS_DMASYNC_PREWRITE);
}
virtio_membar_sync();
vq->vq_queued++;
vq_sync_uring(sc, vq, BUS_DMASYNC_POSTREAD);
if (vq->vq_used_idx != vq->vq_used->idx)
return 1;
return 0;
}
/*
* Returns a number of slots in the used ring available to
* be supplied to the avail ring.
*/
int
virtio_nused(struct virtqueue *vq)
{
uint16_t n;
vq_sync_uring(vq->vq_owner, vq, BUS_DMASYNC_POSTREAD);
n = (uint16_t)(vq->vq_used->idx - vq->vq_used_idx);
VIRTIO_ASSERT(n <= vq->vq_num);
return n;
}
#if VIRTIO_DEBUG
void
virtio_vq_dump(struct virtqueue *vq)
{
#if VIRTIO_DEBUG >= 2
int i;
#endif
/* Common fields */
printf(" + addr: %p\n", vq);
printf(" + vq num: %d\n", vq->vq_num);
printf(" + vq mask: 0x%X\n", vq->vq_mask);
printf(" + vq index: %d\n", vq->vq_index);
printf(" + vq used idx: %d\n", vq->vq_used_idx);
printf(" + vq avail idx: %d\n", vq->vq_avail_idx);
printf(" + vq queued: %d\n",vq->vq_queued);
#if VIRTIO_DEBUG >= 2
for (i = 0; i < vq->vq_num; i++) {
struct vring_desc *desc = &vq->vq_desc[i];
printf(" D%-3d len:%d flags:%d next:%d\n", i, desc->len,
desc->flags, desc->next);
}
#endif
/* Avail ring fields */
printf(" + avail flags: 0x%X\n", vq->vq_avail->flags);
printf(" + avail idx: %d\n", vq->vq_avail->idx);
printf(" + avail event: %d\n", VQ_AVAIL_EVENT(vq));
#if VIRTIO_DEBUG >= 2
for (i = 0; i < vq->vq_num; i++)
printf(" A%-3d idx:%d\n", i, vq->vq_avail->ring[i]);
#endif
/* Used ring fields */
printf(" + used flags: 0x%X\n",vq->vq_used->flags);
printf(" + used idx: %d\n",vq->vq_used->idx);
printf(" + used event: %d\n", VQ_USED_EVENT(vq));
#if VIRTIO_DEBUG >= 2
for (i = 0; i < vq->vq_num; i++) {
printf(" U%-3d id:%d len:%d\n", i,
vq->vq_used->ring[i].id,
vq->vq_used->ring[i].len);
}
#endif
printf(" +++++++++++++++++++++++++++\n");
}
#endif