Statistics
| Branch: | Revision:

root / hw / virtio.c @ bb61564c

History | View | Annotate | Download (18.9 kB)

1 967f97fa aliguori
/*
2 967f97fa aliguori
 * Virtio Support
3 967f97fa aliguori
 *
4 967f97fa aliguori
 * Copyright IBM, Corp. 2007
5 967f97fa aliguori
 *
6 967f97fa aliguori
 * Authors:
7 967f97fa aliguori
 *  Anthony Liguori   <aliguori@us.ibm.com>
8 967f97fa aliguori
 *
9 967f97fa aliguori
 * This work is licensed under the terms of the GNU GPL, version 2.  See
10 967f97fa aliguori
 * the COPYING file in the top-level directory.
11 967f97fa aliguori
 *
12 967f97fa aliguori
 */
13 967f97fa aliguori
14 967f97fa aliguori
#include <inttypes.h>
15 967f97fa aliguori
16 967f97fa aliguori
#include "virtio.h"
17 967f97fa aliguori
#include "sysemu.h"
18 967f97fa aliguori
19 f46f15bc aliguori
/* The alignment to use between consumer and producer parts of vring.
20 f46f15bc aliguori
 * x86 pagesize again. */
21 f46f15bc aliguori
#define VIRTIO_PCI_VRING_ALIGN         4096
22 f46f15bc aliguori
23 967f97fa aliguori
/* QEMU doesn't strictly need write barriers since everything runs in
24 967f97fa aliguori
 * lock-step.  We'll leave the calls to wmb() in though to make it obvious for
25 967f97fa aliguori
 * KVM or if kqemu gets SMP support.
26 79758e95 Michael S. Tsirkin
 * In any case, we must prevent the compiler from reordering the code.
27 79758e95 Michael S. Tsirkin
 * TODO: we likely need some rmb()/mb() as well.
28 967f97fa aliguori
 */
29 79758e95 Michael S. Tsirkin
30 79758e95 Michael S. Tsirkin
/* Compiler-only barrier: an empty asm statement with a "memory" clobber, so
 * the compiler may not reorder memory accesses across it.  It emits no CPU
 * fence instruction. */
#define wmb() __asm__ __volatile__("": : :"memory")
31 967f97fa aliguori
32 967f97fa aliguori
/* One entry of the guest-resident descriptor table.  The fields are read
 * from guest memory through the vring_desc_*() accessors using offsetof(),
 * so the member order and widths define the in-memory layout. */
typedef struct VRingDesc {
    uint64_t addr;   /* guest-physical address of the buffer (or of an
                      * indirect descriptor table) */
    uint32_t len;    /* length in bytes of that buffer / table */
    uint16_t flags;  /* VRING_DESC_F_* bits (NEXT, WRITE, INDIRECT) */
    uint16_t next;   /* index of the next descriptor when F_NEXT is set */
} VRingDesc;
39 967f97fa aliguori
40 967f97fa aliguori
/* Layout of the available ring in guest memory.  Only used as a layout
 * template for offsetof(); no object of this type is ever instantiated. */
typedef struct VRingAvail {
    uint16_t flags;   /* VRING_AVAIL_F_* bits, e.g. NO_INTERRUPT */
    uint16_t idx;     /* free-running index written by the guest */
    uint16_t ring[];  /* head descriptor indices; a C99 flexible array member
                       * replaces the GNU zero-length array (same layout) */
} VRingAvail;
46 967f97fa aliguori
47 967f97fa aliguori
/* One entry of the used ring, written by the device side through
 * vring_used_ring_id() and vring_used_ring_len(). */
typedef struct VRingUsedElem {
    uint32_t id;   /* head index of the completed descriptor chain */
    uint32_t len;  /* length value reported for that chain */
} VRingUsedElem;
52 967f97fa aliguori
53 967f97fa aliguori
typedef struct VRingUsed
54 967f97fa aliguori
{
55 967f97fa aliguori
    uint16_t flags;
56 967f97fa aliguori
    uint16_t idx;
57 967f97fa aliguori
    VRingUsedElem ring[0];
58 967f97fa aliguori
} VRingUsed;
59 967f97fa aliguori
60 967f97fa aliguori
typedef struct VRing
61 967f97fa aliguori
{
62 967f97fa aliguori
    unsigned int num;
63 c227f099 Anthony Liguori
    target_phys_addr_t desc;
64 c227f099 Anthony Liguori
    target_phys_addr_t avail;
65 c227f099 Anthony Liguori
    target_phys_addr_t used;
66 967f97fa aliguori
} VRing;
67 967f97fa aliguori
68 967f97fa aliguori
struct VirtQueue
69 967f97fa aliguori
{
70 967f97fa aliguori
    VRing vring;
71 c227f099 Anthony Liguori
    target_phys_addr_t pa;
72 967f97fa aliguori
    uint16_t last_avail_idx;
73 967f97fa aliguori
    int inuse;
74 7055e687 Michael S. Tsirkin
    uint16_t vector;
75 967f97fa aliguori
    void (*handle_output)(VirtIODevice *vdev, VirtQueue *vq);
76 967f97fa aliguori
};
77 967f97fa aliguori
78 967f97fa aliguori
/* virt queue functions */
79 53c25cea Paul Brook
/* Derive the descriptor/avail/used addresses of a queue from its base
 * address vq->pa and its size vq->vring.num.  The used ring starts at the
 * end of the avail ring, rounded with vring_align() to
 * VIRTIO_PCI_VRING_ALIGN. */
static void virtqueue_init(VirtQueue *vq)
{
    const target_phys_addr_t base = vq->pa;

    /* Descriptor table first, avail ring directly after it. */
    vq->vring.desc = base;
    vq->vring.avail = base + vq->vring.num * sizeof(VRingDesc);

    vq->vring.used = vring_align(vq->vring.avail +
                                 offsetof(VRingAvail, ring[vq->vring.num]),
                                 VIRTIO_PCI_VRING_ALIGN);
}
89 967f97fa aliguori
90 c227f099 Anthony Liguori
/* Load the 64-bit 'addr' field of descriptor i from the descriptor table
 * located at guest-physical address desc_pa. */
static inline uint64_t vring_desc_addr(target_phys_addr_t desc_pa, int i)
{
    const target_phys_addr_t field_pa =
        desc_pa + sizeof(VRingDesc) * i + offsetof(VRingDesc, addr);

    return ldq_phys(field_pa);
}
96 967f97fa aliguori
97 c227f099 Anthony Liguori
/* Load the 32-bit 'len' field of descriptor i from the descriptor table
 * located at guest-physical address desc_pa. */
static inline uint32_t vring_desc_len(target_phys_addr_t desc_pa, int i)
{
    const target_phys_addr_t field_pa =
        desc_pa + sizeof(VRingDesc) * i + offsetof(VRingDesc, len);

    return ldl_phys(field_pa);
}
103 967f97fa aliguori
104 c227f099 Anthony Liguori
/* Load the 16-bit 'flags' field of descriptor i from the descriptor table
 * located at guest-physical address desc_pa. */
static inline uint16_t vring_desc_flags(target_phys_addr_t desc_pa, int i)
{
    const target_phys_addr_t field_pa =
        desc_pa + sizeof(VRingDesc) * i + offsetof(VRingDesc, flags);

    return lduw_phys(field_pa);
}
110 967f97fa aliguori
111 c227f099 Anthony Liguori
/* Load the 16-bit 'next' field of descriptor i from the descriptor table
 * located at guest-physical address desc_pa. */
static inline uint16_t vring_desc_next(target_phys_addr_t desc_pa, int i)
{
    const target_phys_addr_t field_pa =
        desc_pa + sizeof(VRingDesc) * i + offsetof(VRingDesc, next);

    return lduw_phys(field_pa);
}
117 967f97fa aliguori
118 967f97fa aliguori
/* Load the 'flags' word of the queue's available ring from guest memory. */
static inline uint16_t vring_avail_flags(VirtQueue *vq)
{
    const target_phys_addr_t flags_pa =
        vq->vring.avail + offsetof(VRingAvail, flags);

    return lduw_phys(flags_pa);
}
124 967f97fa aliguori
125 967f97fa aliguori
/* Load the 'idx' word of the queue's available ring from guest memory. */
static inline uint16_t vring_avail_idx(VirtQueue *vq)
{
    const target_phys_addr_t idx_pa =
        vq->vring.avail + offsetof(VRingAvail, idx);

    return lduw_phys(idx_pa);
}
131 967f97fa aliguori
132 967f97fa aliguori
/* Load entry i of the queue's available ring from guest memory.  The caller
 * is responsible for reducing i modulo the ring size. */
static inline uint16_t vring_avail_ring(VirtQueue *vq, int i)
{
    const target_phys_addr_t slot_pa =
        vq->vring.avail + offsetof(VRingAvail, ring[i]);

    return lduw_phys(slot_pa);
}
138 967f97fa aliguori
139 967f97fa aliguori
/* Store val into the 'id' field of used-ring entry i in guest memory. */
static inline void vring_used_ring_id(VirtQueue *vq, int i, uint32_t val)
{
    const target_phys_addr_t id_pa =
        vq->vring.used + offsetof(VRingUsed, ring[i].id);

    stl_phys(id_pa, val);
}
145 967f97fa aliguori
146 967f97fa aliguori
/* Store val into the 'len' field of used-ring entry i in guest memory. */
static inline void vring_used_ring_len(VirtQueue *vq, int i, uint32_t val)
{
    const target_phys_addr_t len_pa =
        vq->vring.used + offsetof(VRingUsed, ring[i].len);

    stl_phys(len_pa, val);
}
152 967f97fa aliguori
153 967f97fa aliguori
/* Load the 'idx' word of the queue's used ring from guest memory. */
static uint16_t vring_used_idx(VirtQueue *vq)
{
    const target_phys_addr_t idx_pa =
        vq->vring.used + offsetof(VRingUsed, idx);

    return lduw_phys(idx_pa);
}
159 967f97fa aliguori
160 967f97fa aliguori
/* Add val to the used ring's 'idx' word in guest memory (read, add, then
 * 16-bit store). */
static inline void vring_used_idx_increment(VirtQueue *vq, uint16_t val)
{
    const target_phys_addr_t idx_pa =
        vq->vring.used + offsetof(VRingUsed, idx);
    const uint16_t current = vring_used_idx(vq);

    stw_phys(idx_pa, current + val);
}
166 967f97fa aliguori
167 967f97fa aliguori
/* OR mask into the used ring's 'flags' word in guest memory. */
static inline void vring_used_flags_set_bit(VirtQueue *vq, int mask)
{
    const target_phys_addr_t flags_pa =
        vq->vring.used + offsetof(VRingUsed, flags);

    stw_phys(flags_pa, lduw_phys(flags_pa) | mask);
}
173 967f97fa aliguori
174 967f97fa aliguori
/* Clear the bits of mask in the used ring's 'flags' word in guest memory. */
static inline void vring_used_flags_unset_bit(VirtQueue *vq, int mask)
{
    const target_phys_addr_t flags_pa =
        vq->vring.used + offsetof(VRingUsed, flags);

    stw_phys(flags_pa, lduw_phys(flags_pa) & ~mask);
}
180 967f97fa aliguori
181 967f97fa aliguori
/* Enable or disable guest notifications for vq by clearing (enable != 0)
 * or setting (enable == 0) VRING_USED_F_NO_NOTIFY in the used-ring flags. */
void virtio_queue_set_notification(VirtQueue *vq, int enable)
{
    if (!enable) {
        vring_used_flags_set_bit(vq, VRING_USED_F_NO_NOTIFY);
    } else {
        vring_used_flags_unset_bit(vq, VRING_USED_F_NO_NOTIFY);
    }
}
188 967f97fa aliguori
189 967f97fa aliguori
/* Return 1 when the queue's avail-ring address is non-zero (i.e. the ring
 * has been set up via virtqueue_init()), 0 otherwise. */
int virtio_queue_ready(VirtQueue *vq)
{
    return vq->vring.avail ? 1 : 0;
}
193 967f97fa aliguori
194 967f97fa aliguori
/* Return non-zero when the guest's avail index equals the last index this
 * side has consumed, i.e. there is nothing new to pop. */
int virtio_queue_empty(VirtQueue *vq)
{
    const uint16_t guest_idx = vring_avail_idx(vq);

    return guest_idx == vq->last_avail_idx;
}
198 967f97fa aliguori
199 967f97fa aliguori
/* Unmap the buffers of a completed element and record it in the used ring.
 *
 * vq   - queue the element was popped from
 * elem - element whose in_sg/out_sg mappings are released
 * len  - total number of bytes written into the in_sg buffers
 * idx  - offset from the current used index at which to store the entry
 *
 * The used index itself is not advanced here; see virtqueue_flush().
 */
void virtqueue_fill(VirtQueue *vq, const VirtQueueElement *elem,
                    unsigned int len, unsigned int idx)
{
    unsigned int offset;
    int i;

    offset = 0;
    for (i = 0; i < elem->in_num; i++) {
        /* Portion of 'len' that falls into this buffer. */
        size_t size = MIN(len - offset, elem->in_sg[i].iov_len);

        cpu_physical_memory_unmap(elem->in_sg[i].iov_base,
                                  elem->in_sg[i].iov_len,
                                  1, size);

        /* Advance by the bytes actually accounted for.  Advancing by
         * iov_len could push offset past len, making the unsigned
         * 'len - offset' wrap and report later buffers as fully written. */
        offset += size;
    }

    for (i = 0; i < elem->out_num; i++)
        cpu_physical_memory_unmap(elem->out_sg[i].iov_base,
                                  elem->out_sg[i].iov_len,
                                  0, elem->out_sg[i].iov_len);

    idx = (idx + vring_used_idx(vq)) % vq->vring.num;

    /* Fill in the selected entry of the used ring. */
    vring_used_ring_id(vq, idx, elem->index);
    vring_used_ring_len(vq, idx, len);
}
227 967f97fa aliguori
228 967f97fa aliguori
/* Publish 'count' previously filled used-ring entries: advance the used
 * index by count and drop the in-flight counter by the same amount. */
void virtqueue_flush(VirtQueue *vq, unsigned int count)
{
    /* The used-ring entries must be written before the index moves. */
    wmb();

    vring_used_idx_increment(vq, count);
    vq->inuse -= count;
}
235 967f97fa aliguori
236 967f97fa aliguori
/* Complete a single element: fill it at offset 0 of the used ring and
 * immediately flush one entry. */
void virtqueue_push(VirtQueue *vq, const VirtQueueElement *elem,
                    unsigned int len)
{
    virtqueue_fill(vq, elem, len, 0);
    virtqueue_flush(vq, 1);
}
242 967f97fa aliguori
243 967f97fa aliguori
/* Return how many avail-ring entries lie between idx and the guest's
 * current avail index (16-bit wrapping difference).  Terminates the
 * process if that count exceeds the ring size. */
static int virtqueue_num_heads(VirtQueue *vq, unsigned int idx)
{
    const uint16_t pending = vring_avail_idx(vq) - idx;

    /* More pending heads than ring slots means the guest index is bogus. */
    if (pending > vq->vring.num) {
        fprintf(stderr, "Guest moved used index from %u to %u",
                idx, vring_avail_idx(vq));
        exit(1);
    }

    return pending;
}
256 967f97fa aliguori
257 967f97fa aliguori
/* Fetch the head descriptor index stored in avail-ring slot
 * (idx % ring size).  Terminates the process if the guest-supplied value
 * is not a valid descriptor index.  The caller advances its own index. */
static unsigned int virtqueue_get_head(VirtQueue *vq, unsigned int idx)
{
    const unsigned int desc_head = vring_avail_ring(vq, idx % vq->vring.num);

    /* A head outside the descriptor table is a fatal guest error. */
    if (desc_head >= vq->vring.num) {
        fprintf(stderr, "Guest says index %u is available", desc_head);
        exit(1);
    }

    return desc_head;
}
273 967f97fa aliguori
274 c227f099 Anthony Liguori
/* Follow the chain from descriptor i in the table at desc_pa.
 *
 * Returns 'max' when descriptor i has no VRING_DESC_F_NEXT flag (end of
 * chain), otherwise the index of the next descriptor.  Terminates the
 * process if that index is not below max. */
static unsigned virtqueue_next_desc(target_phys_addr_t desc_pa,
                                    unsigned int i, unsigned int max)
{
    unsigned int successor;

    /* End of chain: signal it with the sentinel value 'max'. */
    if (!(vring_desc_flags(desc_pa, i) & VRING_DESC_F_NEXT)) {
        return max;
    }

    successor = vring_desc_next(desc_pa, i);
    /* Compiler barrier: the value validated below must be the one loaded
     * above, not a re-read of guest memory. */
    wmb();

    /* Refuse to be led past the end of the descriptor table. */
    if (successor >= max) {
        fprintf(stderr, "Desc next is %u", successor);
        exit(1);
    }

    return successor;
}
295 967f97fa aliguori
296 967f97fa aliguori
/* Check whether the pending (not yet popped) descriptor chains of vq offer
 * at least in_bytes of device-writable space or out_bytes of
 * device-readable data.
 *
 * Returns 1 as soon as either requested total is reached (a request of 0
 * or less disables that direction), 0 if all pending chains were walked
 * without reaching it.  Terminates the process on malformed rings.
 */
int virtqueue_avail_bytes(VirtQueue *vq, int in_bytes, int out_bytes)
{
    unsigned int idx;
    int total_bufs, in_total, out_total;

    idx = vq->last_avail_idx;

    total_bufs = in_total = out_total = 0;
    while (virtqueue_num_heads(vq, idx)) {
        unsigned int max, num_bufs, indirect = 0;
        target_phys_addr_t desc_pa;
        int i;

        max = vq->vring.num;
        num_bufs = total_bufs;
        i = virtqueue_get_head(vq, idx++);
        desc_pa = vq->vring.desc;

        if (vring_desc_flags(desc_pa, i) & VRING_DESC_F_INDIRECT) {
            if (vring_desc_len(desc_pa, i) % sizeof(VRingDesc)) {
                fprintf(stderr, "Invalid size for indirect buffer table\n");
                exit(1);
            }

            /* If we've got too many, that implies a descriptor loop. */
            if (num_bufs >= max) {
                fprintf(stderr, "Looped descriptor");
                exit(1);
            }

            /* loop over the indirect descriptor table */
            indirect = 1;
            max = vring_desc_len(desc_pa, i) / sizeof(VRingDesc);
            /* Read the table address from head descriptor i BEFORE
             * resetting i; doing it afterwards would fetch the address
             * stored in descriptor 0 instead (virtqueue_pop() uses the
             * same order as below). */
            desc_pa = vring_desc_addr(desc_pa, i);
            num_bufs = i = 0;
        }

        do {
            /* If we've got too many, that implies a descriptor loop. */
            if (++num_bufs > max) {
                fprintf(stderr, "Looped descriptor");
                exit(1);
            }

            if (vring_desc_flags(desc_pa, i) & VRING_DESC_F_WRITE) {
                if (in_bytes > 0 &&
                    (in_total += vring_desc_len(desc_pa, i)) >= in_bytes)
                    return 1;
            } else {
                if (out_bytes > 0 &&
                    (out_total += vring_desc_len(desc_pa, i)) >= out_bytes)
                    return 1;
            }
        } while ((i = virtqueue_next_desc(desc_pa, i, max)) != max);

        /* A direct chain contributes all its descriptors to the running
         * total; an indirect chain occupies a single ring descriptor. */
        if (!indirect)
            total_bufs = num_bufs;
        else
            total_bufs++;
    }

    return 0;
}
359 967f97fa aliguori
360 967f97fa aliguori
/* Pop the next available descriptor chain from vq into elem.
 *
 * Every buffer of the chain is mapped with cpu_physical_memory_map() and
 * stored in elem->in_sg (device-writable, VRING_DESC_F_WRITE) or
 * elem->out_sg (device-readable).  Indirect descriptor tables are followed.
 *
 * Returns 0 when nothing is pending, otherwise the number of buffers in
 * the element.  Terminates the process on malformed guest data.
 */
int virtqueue_pop(VirtQueue *vq, VirtQueueElement *elem)
{
    unsigned int i, head, max;
    target_phys_addr_t desc_pa = vq->vring.desc;
    target_phys_addr_t len;

    if (!virtqueue_num_heads(vq, vq->last_avail_idx))
        return 0;

    /* When we start there are none of either input nor output. */
    elem->out_num = elem->in_num = 0;

    max = vq->vring.num;

    i = head = virtqueue_get_head(vq, vq->last_avail_idx++);

    if (vring_desc_flags(desc_pa, i) & VRING_DESC_F_INDIRECT) {
        if (vring_desc_len(desc_pa, i) % sizeof(VRingDesc)) {
            fprintf(stderr, "Invalid size for indirect buffer table\n");
            exit(1);
        }

        /* loop over the indirect descriptor table */
        max = vring_desc_len(desc_pa, i) / sizeof(VRingDesc);
        desc_pa = vring_desc_addr(desc_pa, i);
        i = 0;
    }

    do {
        struct iovec *sg;
        int is_write = 0;

        /* 'max' can come from a guest-sized indirect table, so the loop
         * check at the bottom does not protect the fixed-size arrays in
         * elem; bound each array explicitly before writing to it.
         * NOTE(review): assumes in_sg/out_sg (and in_addr, sized like
         * in_sg) are arrays inside VirtQueueElement - confirm in virtio.h. */
        if (vring_desc_flags(desc_pa, i) & VRING_DESC_F_WRITE) {
            if (elem->in_num >= sizeof(elem->in_sg) / sizeof(elem->in_sg[0])) {
                fprintf(stderr, "virtio: too many write descriptors in chain\n");
                exit(1);
            }
            elem->in_addr[elem->in_num] = vring_desc_addr(desc_pa, i);
            sg = &elem->in_sg[elem->in_num++];
            is_write = 1;
        } else {
            if (elem->out_num >=
                sizeof(elem->out_sg) / sizeof(elem->out_sg[0])) {
                fprintf(stderr, "virtio: too many read descriptors in chain\n");
                exit(1);
            }
            sg = &elem->out_sg[elem->out_num++];
        }

        /* Map the buffer and make sure the whole length was mapped. */
        sg->iov_len = vring_desc_len(desc_pa, i);
        len = sg->iov_len;

        sg->iov_base = cpu_physical_memory_map(vring_desc_addr(desc_pa, i),
                                               &len, is_write);

        if (sg->iov_base == NULL || len != sg->iov_len) {
            fprintf(stderr, "virtio: trying to map MMIO memory\n");
            exit(1);
        }

        /* If we've got too many, that implies a descriptor loop. */
        if ((elem->in_num + elem->out_num) > max) {
            fprintf(stderr, "Looped descriptor");
            exit(1);
        }
    } while ((i = virtqueue_next_desc(desc_pa, i, max)) != max);

    elem->index = head;

    vq->inuse++;

    return elem->in_num + elem->out_num;
}
424 967f97fa aliguori
425 967f97fa aliguori
/* virtio device */
426 7055e687 Michael S. Tsirkin
/* Forward a notification for 'vector' to the binding's notify hook, if the
 * binding provides one. */
static void virtio_notify_vector(VirtIODevice *vdev, uint16_t vector)
{
    if (!vdev->binding->notify) {
        return;
    }

    vdev->binding->notify(vdev->binding_opaque, vector);
}
432 967f97fa aliguori
433 53c25cea Paul Brook
/* Ask the binding to re-evaluate the interrupt state by notifying with
 * VIRTIO_NO_VECTOR. */
void virtio_update_irq(VirtIODevice *vdev)
{
    const uint16_t no_vector = VIRTIO_NO_VECTOR;

    virtio_notify_vector(vdev, no_vector);
}
437 967f97fa aliguori
438 53c25cea Paul Brook
void virtio_reset(void *opaque)
439 967f97fa aliguori
{
440 967f97fa aliguori
    VirtIODevice *vdev = opaque;
441 967f97fa aliguori
    int i;
442 967f97fa aliguori
443 967f97fa aliguori
    if (vdev->reset)
444 967f97fa aliguori
        vdev->reset(vdev);
445 967f97fa aliguori
446 704a76fc Michael S. Tsirkin
    vdev->guest_features = 0;
447 967f97fa aliguori
    vdev->queue_sel = 0;
448 967f97fa aliguori
    vdev->status = 0;
449 967f97fa aliguori
    vdev->isr = 0;
450 7055e687 Michael S. Tsirkin
    vdev->config_vector = VIRTIO_NO_VECTOR;
451 7055e687 Michael S. Tsirkin
    virtio_notify_vector(vdev, vdev->config_vector);
452 967f97fa aliguori
453 967f97fa aliguori
    for(i = 0; i < VIRTIO_PCI_QUEUE_MAX; i++) {
454 967f97fa aliguori
        vdev->vq[i].vring.desc = 0;
455 967f97fa aliguori
        vdev->vq[i].vring.avail = 0;
456 967f97fa aliguori
        vdev->vq[i].vring.used = 0;
457 967f97fa aliguori
        vdev->vq[i].last_avail_idx = 0;
458 53c25cea Paul Brook
        vdev->vq[i].pa = 0;
459 7055e687 Michael S. Tsirkin
        vdev->vq[i].vector = VIRTIO_NO_VECTOR;
460 967f97fa aliguori
    }
461 967f97fa aliguori
}
462 967f97fa aliguori
463 53c25cea Paul Brook
/* Read one byte at offset addr of the device config space.
 *
 * The config buffer is refreshed through vdev->get_config() first.
 * Returns the byte value, or (uint32_t)-1 when the access would fall
 * outside the config space.
 */
uint32_t virtio_config_readb(VirtIODevice *vdev, uint32_t addr)
{
    uint8_t val;

    vdev->get_config(vdev, vdev->config);

    /* Test config_len first: 'config_len - sizeof(val)' would wrap around
     * for a config space smaller than the access and let any addr pass. */
    if (vdev->config_len < sizeof(val) ||
        addr > (vdev->config_len - sizeof(val)))
        return (uint32_t)-1;

    memcpy(&val, vdev->config + addr, sizeof(val));
    return val;
}
475 967f97fa aliguori
476 53c25cea Paul Brook
/* Read a 16-bit value at offset addr of the device config space.
 *
 * The config buffer is refreshed through vdev->get_config() first.
 * Returns the value, or (uint32_t)-1 when the access would fall outside
 * the config space.
 */
uint32_t virtio_config_readw(VirtIODevice *vdev, uint32_t addr)
{
    uint16_t val;

    vdev->get_config(vdev, vdev->config);

    /* Test config_len first: 'config_len - sizeof(val)' would wrap around
     * for a config space smaller than the access and let any addr pass. */
    if (vdev->config_len < sizeof(val) ||
        addr > (vdev->config_len - sizeof(val)))
        return (uint32_t)-1;

    memcpy(&val, vdev->config + addr, sizeof(val));
    return val;
}
488 967f97fa aliguori
489 53c25cea Paul Brook
/* Read a 32-bit value at offset addr of the device config space.
 *
 * The config buffer is refreshed through vdev->get_config() first.
 * Returns the value, or (uint32_t)-1 when the access would fall outside
 * the config space.
 */
uint32_t virtio_config_readl(VirtIODevice *vdev, uint32_t addr)
{
    uint32_t val;

    vdev->get_config(vdev, vdev->config);

    /* Test config_len first: 'config_len - sizeof(val)' would wrap around
     * for a config space smaller than the access and let any addr pass. */
    if (vdev->config_len < sizeof(val) ||
        addr > (vdev->config_len - sizeof(val)))
        return (uint32_t)-1;

    memcpy(&val, vdev->config + addr, sizeof(val));
    return val;
}
501 967f97fa aliguori
502 53c25cea Paul Brook
/* Write the low byte of data at offset addr of the device config space and
 * then call vdev->set_config(), if set.  Out-of-range accesses are
 * silently ignored. */
void virtio_config_writeb(VirtIODevice *vdev, uint32_t addr, uint32_t data)
{
    uint8_t val = data;

    /* Test config_len first: 'config_len - sizeof(val)' would wrap around
     * for a config space smaller than the access and allow an
     * out-of-bounds write. */
    if (vdev->config_len < sizeof(val) ||
        addr > (vdev->config_len - sizeof(val)))
        return;

    memcpy(vdev->config + addr, &val, sizeof(val));

    if (vdev->set_config)
        vdev->set_config(vdev, vdev->config);
}
514 967f97fa aliguori
515 53c25cea Paul Brook
/* Write the low 16 bits of data at offset addr of the device config space
 * and then call vdev->set_config(), if set.  Out-of-range accesses are
 * silently ignored. */
void virtio_config_writew(VirtIODevice *vdev, uint32_t addr, uint32_t data)
{
    uint16_t val = data;

    /* Test config_len first: 'config_len - sizeof(val)' would wrap around
     * for a config space smaller than the access and allow an
     * out-of-bounds write. */
    if (vdev->config_len < sizeof(val) ||
        addr > (vdev->config_len - sizeof(val)))
        return;

    memcpy(vdev->config + addr, &val, sizeof(val));

    if (vdev->set_config)
        vdev->set_config(vdev, vdev->config);
}
527 967f97fa aliguori
528 53c25cea Paul Brook
/* Write the 32-bit data at offset addr of the device config space and then
 * call vdev->set_config(), if set.  Out-of-range accesses are silently
 * ignored. */
void virtio_config_writel(VirtIODevice *vdev, uint32_t addr, uint32_t data)
{
    uint32_t val = data;

    /* Test config_len first: 'config_len - sizeof(val)' would wrap around
     * for a config space smaller than the access and allow an
     * out-of-bounds write. */
    if (vdev->config_len < sizeof(val) ||
        addr > (vdev->config_len - sizeof(val)))
        return;

    memcpy(vdev->config + addr, &val, sizeof(val));

    if (vdev->set_config)
        vdev->set_config(vdev, vdev->config);
}
540 967f97fa aliguori
541 c227f099 Anthony Liguori
/* Set the guest-physical base address of queue n and recompute its ring
 * layout.  n is not range-checked here. */
void virtio_queue_set_addr(VirtIODevice *vdev, int n, target_phys_addr_t addr)
{
    VirtQueue *queue = &vdev->vq[n];

    queue->pa = addr;
    virtqueue_init(queue);
}
546 53c25cea Paul Brook
547 c227f099 Anthony Liguori
/* Return the guest-physical base address of queue n.  n is not
 * range-checked here. */
target_phys_addr_t virtio_queue_get_addr(VirtIODevice *vdev, int n)
{
    const VirtQueue *queue = &vdev->vq[n];

    return queue->pa;
}
551 53c25cea Paul Brook
552 53c25cea Paul Brook
/* Return the ring size (number of descriptors) of queue n.  n is not
 * range-checked here. */
int virtio_queue_get_num(VirtIODevice *vdev, int n)
{
    const VirtQueue *queue = &vdev->vq[n];

    return queue->vring.num;
}
556 967f97fa aliguori
557 53c25cea Paul Brook
/* Run the output handler of queue n.  Nothing happens when n is not a
 * valid queue index or the queue has no descriptor table address yet. */
void virtio_queue_notify(VirtIODevice *vdev, int n)
{
    /* n is a signed int: reject negative values as well, since they would
     * pass the upper-bound test and index before the start of vq[]. */
    if (n >= 0 && n < VIRTIO_PCI_QUEUE_MAX && vdev->vq[n].vring.desc) {
        vdev->vq[n].handle_output(vdev, &vdev->vq[n]);
    }
}
563 967f97fa aliguori
564 7055e687 Michael S. Tsirkin
/* Return the vector assigned to queue n, or VIRTIO_NO_VECTOR when n is not
 * a valid queue index. */
uint16_t virtio_queue_vector(VirtIODevice *vdev, int n)
{
    /* n is a signed int: a negative value would pass a bare upper-bound
     * test and read before the start of vq[]. */
    if (n < 0 || n >= VIRTIO_PCI_QUEUE_MAX) {
        return VIRTIO_NO_VECTOR;
    }

    return vdev->vq[n].vector;
}
569 7055e687 Michael S. Tsirkin
570 7055e687 Michael S. Tsirkin
/* Assign 'vector' to queue n.  The call is ignored when n is not a valid
 * queue index. */
void virtio_queue_set_vector(VirtIODevice *vdev, int n, uint16_t vector)
{
    /* n is a signed int: a negative value would pass a bare upper-bound
     * test and write before the start of vq[]. */
    if (n >= 0 && n < VIRTIO_PCI_QUEUE_MAX)
        vdev->vq[n].vector = vector;
}
575 7055e687 Michael S. Tsirkin
576 967f97fa aliguori
/* Claim the first unused queue slot of vdev (one whose vring.num is 0),
 * give it queue_size descriptors and the given output handler, and return
 * it.  Aborts when no slot is free or queue_size exceeds
 * VIRTQUEUE_MAX_SIZE. */
VirtQueue *virtio_add_queue(VirtIODevice *vdev, int queue_size,
                            void (*handle_output)(VirtIODevice *, VirtQueue *))
{
    int slot = 0;

    /* Scan for the first slot that has no size assigned yet. */
    while (slot < VIRTIO_PCI_QUEUE_MAX && vdev->vq[slot].vring.num != 0) {
        slot++;
    }

    if (slot == VIRTIO_PCI_QUEUE_MAX || queue_size > VIRTQUEUE_MAX_SIZE) {
        abort();
    }

    vdev->vq[slot].vring.num = queue_size;
    vdev->vq[slot].handle_output = handle_output;

    return &vdev->vq[slot];
}
594 967f97fa aliguori
595 967f97fa aliguori
/* Signal the guest that vq has new used entries: set bit 0 of the ISR and
 * notify the queue's vector.
 *
 * The notification is suppressed when the guest set
 * VRING_AVAIL_F_NO_INTERRUPT, unless VIRTIO_F_NOTIFY_ON_EMPTY was
 * negotiated and the queue is completely drained (nothing in flight and
 * nothing left to pop). */
void virtio_notify(VirtIODevice *vdev, VirtQueue *vq)
{
    if (vring_avail_flags(vq) & VRING_AVAIL_F_NO_INTERRUPT) {
        /* Without the notify-on-empty feature the guest's wish is final. */
        if (!(vdev->guest_features & (1 << VIRTIO_F_NOTIFY_ON_EMPTY))) {
            return;
        }
        /* With it, stay quiet only while work remains on the queue. */
        if (vq->inuse || vring_avail_idx(vq) != vq->last_avail_idx) {
            return;
        }
    }

    vdev->isr |= 0x01;
    virtio_notify_vector(vdev, vq->vector);
}
606 967f97fa aliguori
607 967f97fa aliguori
/* Signal a config-space change to the guest: set bits 0 and 1 of the ISR
 * and notify the config vector.  Does nothing until the driver has set
 * VIRTIO_CONFIG_S_DRIVER_OK in the status field. */
void virtio_notify_config(VirtIODevice *vdev)
{
    if (vdev->status & VIRTIO_CONFIG_S_DRIVER_OK) {
        vdev->isr |= 0x03;
        virtio_notify_vector(vdev, vdev->config_vector);
    }
}
615 967f97fa aliguori
616 967f97fa aliguori
/* Serialize the generic virtio device state to f.
 *
 * Stream order: binding config (optional hook), status, isr, queue_sel,
 * guest_features, config_len, config bytes, number of configured queues,
 * then per queue: ring size, base address, last_avail_idx and the
 * binding's per-queue data (optional hook).  Configured queues are the
 * leading slots whose vring.num is non-zero. */
void virtio_save(VirtIODevice *vdev, QEMUFile *f)
{
    int q;

    if (vdev->binding->save_config) {
        vdev->binding->save_config(vdev->binding_opaque, f);
    }

    qemu_put_8s(f, &vdev->status);
    qemu_put_8s(f, &vdev->isr);
    qemu_put_be16s(f, &vdev->queue_sel);
    qemu_put_be32s(f, &vdev->guest_features);
    qemu_put_be32(f, vdev->config_len);
    qemu_put_buffer(f, vdev->config, vdev->config_len);

    /* Count the leading run of configured queues. */
    q = 0;
    while (q < VIRTIO_PCI_QUEUE_MAX && vdev->vq[q].vring.num != 0) {
        q++;
    }

    qemu_put_be32(f, q);

    /* Emit each configured queue, stopping at the first unused slot. */
    for (q = 0;
         q < VIRTIO_PCI_QUEUE_MAX && vdev->vq[q].vring.num != 0;
         q++) {
        qemu_put_be32(f, vdev->vq[q].vring.num);
        qemu_put_be64(f, vdev->vq[q].pa);
        qemu_put_be16s(f, &vdev->vq[q].last_avail_idx);
        if (vdev->binding->save_queue) {
            vdev->binding->save_queue(vdev->binding_opaque, q, f);
        }
    }
}
648 967f97fa aliguori
649 ff24bd58 Michael S. Tsirkin
/*
 * Restore the generic virtio device state from the migration stream @f.
 * The stream layout mirrors what virtio_save() writes.
 *
 * The stream is treated as untrusted input:
 *   - feature bits not offered by the binding are rejected;
 *   - the config length found in the stream is never used to size the copy
 *     into vdev->config: at most vdev->config_len bytes are stored and any
 *     excess bytes in the stream are read and discarded (a shorter incoming
 *     config leaves the tail of vdev->config untouched);
 *   - the queue count must be within 0..VIRTIO_PCI_QUEUE_MAX, the size of
 *     the vdev->vq array.
 * vdev->config_len is left unchanged so it keeps describing the size of the
 * buffer that was allocated for vdev->config.
 *
 * Returns 0 on success, the non-zero value returned by a failing
 * load_config/load_queue binding callback, or -1 if the stream content is
 * rejected.
 */
int virtio_load(VirtIODevice *vdev, QEMUFile *f)
{
    int num, i, ret;
    uint32_t features;
    uint32_t config_len;
    uint32_t copy_len;
    uint32_t supported_features =
        vdev->binding->get_features(vdev->binding_opaque);

    if (vdev->binding->load_config) {
        ret = vdev->binding->load_config(vdev->binding_opaque, f);
        if (ret) {
            return ret;
        }
    }

    qemu_get_8s(f, &vdev->status);
    qemu_get_8s(f, &vdev->isr);
    qemu_get_be16s(f, &vdev->queue_sel);
    qemu_get_be32s(f, &features);
    if (features & ~supported_features) {
        fprintf(stderr, "Features 0x%x unsupported. Allowed features: 0x%x\n",
                features, supported_features);
        return -1;
    }
    vdev->guest_features = features;

    /*
     * Clamp the copy to the space we actually own; trusting the length from
     * the stream would let a crafted image write past vdev->config.
     */
    config_len = qemu_get_be32(f);
    copy_len = config_len;
    if (copy_len > vdev->config_len) {
        copy_len = vdev->config_len;
    }
    if (copy_len) {
        qemu_get_buffer(f, vdev->config, copy_len);
    }
    /* Consume whatever does not fit so the stream stays in sync. */
    for (; config_len > copy_len; config_len--) {
        uint8_t discard;

        qemu_get_8s(f, &discard);
    }

    num = qemu_get_be32(f);
    /* vdev->vq has exactly VIRTIO_PCI_QUEUE_MAX entries. */
    if (num < 0 || num > VIRTIO_PCI_QUEUE_MAX) {
        fprintf(stderr, "Invalid number of virtio queues: 0x%x\n",
                (unsigned int)num);
        return -1;
    }

    for (i = 0; i < num; i++) {
        vdev->vq[i].vring.num = qemu_get_be32(f);
        vdev->vq[i].pa = qemu_get_be64(f);
        qemu_get_be16s(f, &vdev->vq[i].last_avail_idx);

        /* Only set up the ring when a ring address has been programmed. */
        if (vdev->vq[i].pa) {
            virtqueue_init(&vdev->vq[i]);
        }
        if (vdev->binding->load_queue) {
            ret = vdev->binding->load_queue(vdev->binding_opaque, i, f);
            if (ret) {
                return ret;
            }
        }
    }

    virtio_notify_vector(vdev, VIRTIO_NO_VECTOR);
    return 0;
}
695 967f97fa aliguori
696 b946a153 aliguori
/*
 * Release the memory owned by @vdev's generic virtio state: the device
 * config buffer (when one was allocated) and the virtqueue array.
 * The VirtIODevice structure itself is not freed here.
 */
void virtio_cleanup(VirtIODevice *vdev)
{
    if (vdev->config != NULL) {
        qemu_free(vdev->config);
    }
    qemu_free(vdev->vq);
}
702 b946a153 aliguori
703 53c25cea Paul Brook
VirtIODevice *virtio_common_init(const char *name, uint16_t device_id,
704 53c25cea Paul Brook
                                 size_t config_size, size_t struct_size)
705 967f97fa aliguori
{
706 967f97fa aliguori
    VirtIODevice *vdev;
707 b8193adb Michael S. Tsirkin
    int i;
708 967f97fa aliguori
709 53c25cea Paul Brook
    vdev = qemu_mallocz(struct_size);
710 967f97fa aliguori
711 53c25cea Paul Brook
    vdev->device_id = device_id;
712 967f97fa aliguori
    vdev->status = 0;
713 967f97fa aliguori
    vdev->isr = 0;
714 967f97fa aliguori
    vdev->queue_sel = 0;
715 7055e687 Michael S. Tsirkin
    vdev->config_vector = VIRTIO_NO_VECTOR;
716 967f97fa aliguori
    vdev->vq = qemu_mallocz(sizeof(VirtQueue) * VIRTIO_PCI_QUEUE_MAX);
717 b8193adb Michael S. Tsirkin
    for(i = 0; i < VIRTIO_PCI_QUEUE_MAX; i++)
718 b8193adb Michael S. Tsirkin
        vdev->vq[i].vector = VIRTIO_NO_VECTOR;
719 967f97fa aliguori
720 967f97fa aliguori
    vdev->name = name;
721 967f97fa aliguori
    vdev->config_len = config_size;
722 967f97fa aliguori
    if (vdev->config_len)
723 967f97fa aliguori
        vdev->config = qemu_mallocz(config_size);
724 967f97fa aliguori
    else
725 967f97fa aliguori
        vdev->config = NULL;
726 967f97fa aliguori
727 967f97fa aliguori
    return vdev;
728 967f97fa aliguori
}
729 53c25cea Paul Brook
730 53c25cea Paul Brook
/*
 * Attach a transport binding to @vdev.
 *
 * @binding: table of transport callbacks; stored by pointer, not copied
 * @opaque:  value stored in binding_opaque, which the code in this file
 *           passes as the first argument to the binding callbacks
 */
void virtio_bind_device(VirtIODevice *vdev, const VirtIOBindings *binding,
                        void *opaque)
{
    vdev->binding_opaque = opaque;
    vdev->binding = binding;
}