Statistics
| Branch: | Revision:

root / kvm-all.c @ a2eebe88

History | View | Annotate | Download (28.3 kB)

1 05330448 aliguori
/*
2 05330448 aliguori
 * QEMU KVM support
3 05330448 aliguori
 *
4 05330448 aliguori
 * Copyright IBM, Corp. 2008
5 5832d1f2 aliguori
 *           Red Hat, Inc. 2008
6 05330448 aliguori
 *
7 05330448 aliguori
 * Authors:
8 05330448 aliguori
 *  Anthony Liguori   <aliguori@us.ibm.com>
9 5832d1f2 aliguori
 *  Glauber Costa     <gcosta@redhat.com>
10 05330448 aliguori
 *
11 05330448 aliguori
 * This work is licensed under the terms of the GNU GPL, version 2 or later.
12 05330448 aliguori
 * See the COPYING file in the top-level directory.
13 05330448 aliguori
 *
14 05330448 aliguori
 */
15 05330448 aliguori
16 05330448 aliguori
#include <sys/types.h>
17 05330448 aliguori
#include <sys/ioctl.h>
18 05330448 aliguori
#include <sys/mman.h>
19 984b5181 aliguori
#include <stdarg.h>
20 05330448 aliguori
21 05330448 aliguori
#include <linux/kvm.h>
22 05330448 aliguori
23 05330448 aliguori
#include "qemu-common.h"
24 05330448 aliguori
#include "sysemu.h"
25 d33a1810 Jan Kiszka
#include "hw/hw.h"
26 e22a25c9 aliguori
#include "gdbstub.h"
27 05330448 aliguori
#include "kvm.h"
28 05330448 aliguori
29 f65ed4c1 aliguori
/* KVM uses PAGE_SIZE in its definition of COALESCED_MMIO_MAX */
30 f65ed4c1 aliguori
#define PAGE_SIZE TARGET_PAGE_SIZE
31 f65ed4c1 aliguori
32 05330448 aliguori
//#define DEBUG_KVM
33 05330448 aliguori
34 05330448 aliguori
/* Debug tracing helper: forwards its arguments to fprintf(stderr, ...) when
 * DEBUG_KVM is defined and expands to an empty statement otherwise. */
#ifndef DEBUG_KVM
#define dprintf(fmt, ...) \
    do { } while (0)
#else
#define dprintf(fmt, ...) \
    do { fprintf(stderr, fmt, ## __VA_ARGS__); } while (0)
#endif
41 05330448 aliguori
42 34fc643f aliguori
typedef struct KVMSlot
43 34fc643f aliguori
{
44 c227f099 Anthony Liguori
    target_phys_addr_t start_addr;
45 c227f099 Anthony Liguori
    ram_addr_t memory_size;
46 c227f099 Anthony Liguori
    ram_addr_t phys_offset;
47 34fc643f aliguori
    int slot;
48 34fc643f aliguori
    int flags;
49 34fc643f aliguori
} KVMSlot;
50 05330448 aliguori
51 5832d1f2 aliguori
typedef struct kvm_dirty_log KVMDirtyLog;
52 5832d1f2 aliguori
53 05330448 aliguori
int kvm_allowed = 0;
54 05330448 aliguori
55 05330448 aliguori
struct KVMState
56 05330448 aliguori
{
57 05330448 aliguori
    KVMSlot slots[32];
58 05330448 aliguori
    int fd;
59 05330448 aliguori
    int vmfd;
60 f65ed4c1 aliguori
    int coalesced_mmio;
61 62a2744c Sheng Yang
#ifdef KVM_CAP_COALESCED_MMIO
62 62a2744c Sheng Yang
    struct kvm_coalesced_mmio_ring *coalesced_mmio_ring;
63 62a2744c Sheng Yang
#endif
64 e69917e2 Jan Kiszka
    int broken_set_mem_region;
65 4495d6a7 Jan Kiszka
    int migration_log;
66 a0fb002c Jan Kiszka
    int vcpu_events;
67 e22a25c9 aliguori
#ifdef KVM_CAP_SET_GUEST_DEBUG
68 e22a25c9 aliguori
    struct kvm_sw_breakpoint_head kvm_sw_breakpoints;
69 e22a25c9 aliguori
#endif
70 6f725c13 Glauber Costa
    int irqchip_in_kernel;
71 6f725c13 Glauber Costa
    int pit_in_kernel;
72 05330448 aliguori
};
73 05330448 aliguori
74 05330448 aliguori
static KVMState *kvm_state;
75 05330448 aliguori
76 05330448 aliguori
/*
 * Return the first unused entry of s->slots (memory_size == 0), never handing
 * out slots 8..11, which are reserved as KVM private memory slots.
 * The process is aborted when the table is full, so NULL is never returned.
 */
static KVMSlot *kvm_alloc_slot(KVMState *s)
{
    int idx = 0;

    while (idx < ARRAY_SIZE(s->slots)) {
        KVMSlot *candidate = &s->slots[idx];
        int is_private = (idx >= 8 && idx < 12);

        if (!is_private && candidate->memory_size == 0) {
            return candidate;
        }
        idx++;
    }

    fprintf(stderr, "%s: no free slot available\n", __func__);
    abort();
}
91 d3f8d37f aliguori
92 d3f8d37f aliguori
static KVMSlot *kvm_lookup_matching_slot(KVMState *s,
93 c227f099 Anthony Liguori
                                         target_phys_addr_t start_addr,
94 c227f099 Anthony Liguori
                                         target_phys_addr_t end_addr)
95 d3f8d37f aliguori
{
96 d3f8d37f aliguori
    int i;
97 d3f8d37f aliguori
98 d3f8d37f aliguori
    for (i = 0; i < ARRAY_SIZE(s->slots); i++) {
99 d3f8d37f aliguori
        KVMSlot *mem = &s->slots[i];
100 d3f8d37f aliguori
101 d3f8d37f aliguori
        if (start_addr == mem->start_addr &&
102 d3f8d37f aliguori
            end_addr == mem->start_addr + mem->memory_size) {
103 d3f8d37f aliguori
            return mem;
104 d3f8d37f aliguori
        }
105 d3f8d37f aliguori
    }
106 d3f8d37f aliguori
107 05330448 aliguori
    return NULL;
108 05330448 aliguori
}
109 05330448 aliguori
110 6152e2ae aliguori
/*
111 6152e2ae aliguori
 * Find overlapping slot with lowest start address
112 6152e2ae aliguori
 */
113 6152e2ae aliguori
static KVMSlot *kvm_lookup_overlapping_slot(KVMState *s,
114 c227f099 Anthony Liguori
                                            target_phys_addr_t start_addr,
115 c227f099 Anthony Liguori
                                            target_phys_addr_t end_addr)
116 05330448 aliguori
{
117 6152e2ae aliguori
    KVMSlot *found = NULL;
118 05330448 aliguori
    int i;
119 05330448 aliguori
120 05330448 aliguori
    for (i = 0; i < ARRAY_SIZE(s->slots); i++) {
121 05330448 aliguori
        KVMSlot *mem = &s->slots[i];
122 05330448 aliguori
123 6152e2ae aliguori
        if (mem->memory_size == 0 ||
124 6152e2ae aliguori
            (found && found->start_addr < mem->start_addr)) {
125 6152e2ae aliguori
            continue;
126 6152e2ae aliguori
        }
127 6152e2ae aliguori
128 6152e2ae aliguori
        if (end_addr > mem->start_addr &&
129 6152e2ae aliguori
            start_addr < mem->start_addr + mem->memory_size) {
130 6152e2ae aliguori
            found = mem;
131 6152e2ae aliguori
        }
132 05330448 aliguori
    }
133 05330448 aliguori
134 6152e2ae aliguori
    return found;
135 05330448 aliguori
}
136 05330448 aliguori
137 5832d1f2 aliguori
/*
 * Push the description of @slot to the kernel via KVM_SET_USER_MEMORY_REGION.
 * While s->migration_log is set, KVM_MEM_LOG_DIRTY_PAGES is added to the
 * flags sent to the kernel without touching slot->flags.
 * Returns whatever kvm_vm_ioctl() returns.
 */
static int kvm_set_user_memory_region(KVMState *s, KVMSlot *slot)
{
    struct kvm_userspace_memory_region region;
    int effective_flags = slot->flags;

    if (s->migration_log) {
        effective_flags |= KVM_MEM_LOG_DIRTY_PAGES;
    }

    region.slot = slot->slot;
    region.flags = effective_flags;
    region.guest_phys_addr = slot->start_addr;
    region.memory_size = slot->memory_size;
    region.userspace_addr = (unsigned long)qemu_get_ram_ptr(slot->phys_offset);

    return kvm_vm_ioctl(s, KVM_SET_USER_MEMORY_REGION, &region);
}
151 5832d1f2 aliguori
152 8d2ba1fb Jan Kiszka
static void kvm_reset_vcpu(void *opaque)
153 8d2ba1fb Jan Kiszka
{
154 8d2ba1fb Jan Kiszka
    CPUState *env = opaque;
155 8d2ba1fb Jan Kiszka
156 caa5af0f Jan Kiszka
    kvm_arch_reset_vcpu(env);
157 8d2ba1fb Jan Kiszka
    if (kvm_arch_put_registers(env)) {
158 8d2ba1fb Jan Kiszka
        fprintf(stderr, "Fatal: kvm vcpu reset failed\n");
159 8d2ba1fb Jan Kiszka
        abort();
160 8d2ba1fb Jan Kiszka
    }
161 8d2ba1fb Jan Kiszka
}
162 5832d1f2 aliguori
163 6f725c13 Glauber Costa
int kvm_irqchip_in_kernel(void)
164 6f725c13 Glauber Costa
{
165 6f725c13 Glauber Costa
    return kvm_state->irqchip_in_kernel;
166 6f725c13 Glauber Costa
}
167 6f725c13 Glauber Costa
168 6f725c13 Glauber Costa
int kvm_pit_in_kernel(void)
169 6f725c13 Glauber Costa
{
170 6f725c13 Glauber Costa
    return kvm_state->pit_in_kernel;
171 6f725c13 Glauber Costa
}
172 6f725c13 Glauber Costa
173 6f725c13 Glauber Costa
174 05330448 aliguori
/*
 * Create the KVM vcpu backing @env and bring it into its reset state.
 *
 * Steps: create the vcpu (KVM_CREATE_VCPU), map its shared kvm_run area,
 * locate the coalesced MMIO ring inside that mapping on first use, run the
 * architecture specific initialisation, register the reset handler and write
 * the initial register state.
 *
 * Returns the result of kvm_arch_init_vcpu()/kvm_arch_put_registers() when
 * the generic set-up succeeded, or a negative value when creating the vcpu,
 * querying the mmap size or mapping the vcpu state failed.
 */
int kvm_init_vcpu(CPUState *env)
{
    KVMState *s = kvm_state;
    long mmap_size;
    int ret;

    dprintf("kvm_init_vcpu\n");

    ret = kvm_vm_ioctl(s, KVM_CREATE_VCPU, env->cpu_index);
    if (ret < 0) {
        dprintf("kvm_create_vcpu failed\n");
        goto err;
    }

    env->kvm_fd = ret;
    env->kvm_state = s;

    mmap_size = kvm_ioctl(s, KVM_GET_VCPU_MMAP_SIZE, 0);
    if (mmap_size < 0) {
        /* Propagate the failure: ret still holds the non-negative vcpu
         * descriptor here and would otherwise be reported as success. */
        ret = mmap_size;
        dprintf("KVM_GET_VCPU_MMAP_SIZE failed\n");
        goto err;
    }

    env->kvm_run = mmap(NULL, mmap_size, PROT_READ | PROT_WRITE, MAP_SHARED,
                        env->kvm_fd, 0);
    if (env->kvm_run == MAP_FAILED) {
        ret = -errno;
        dprintf("mmap'ing vcpu state failed\n");
        goto err;
    }

#ifdef KVM_CAP_COALESCED_MMIO
    /* s->coalesced_mmio is the page offset of the ring within the mapping;
     * only the first vcpu that gets here records the ring address. */
    if (s->coalesced_mmio && !s->coalesced_mmio_ring)
        s->coalesced_mmio_ring = (void *) env->kvm_run +
                s->coalesced_mmio * PAGE_SIZE;
#endif

    ret = kvm_arch_init_vcpu(env);
    if (ret == 0) {
        qemu_register_reset(kvm_reset_vcpu, env);
        kvm_arch_reset_vcpu(env);
        ret = kvm_arch_put_registers(env);
    }
err:
    return ret;
}
220 05330448 aliguori
221 5832d1f2 aliguori
/*
222 5832d1f2 aliguori
 * dirty pages logging control
223 5832d1f2 aliguori
 */
224 c227f099 Anthony Liguori
static int kvm_dirty_pages_log_change(target_phys_addr_t phys_addr,
225 c227f099 Anthony Liguori
                                      ram_addr_t size, int flags, int mask)
226 5832d1f2 aliguori
{
227 5832d1f2 aliguori
    KVMState *s = kvm_state;
228 d3f8d37f aliguori
    KVMSlot *mem = kvm_lookup_matching_slot(s, phys_addr, phys_addr + size);
229 4495d6a7 Jan Kiszka
    int old_flags;
230 4495d6a7 Jan Kiszka
231 5832d1f2 aliguori
    if (mem == NULL)  {
232 d3f8d37f aliguori
            fprintf(stderr, "BUG: %s: invalid parameters " TARGET_FMT_plx "-"
233 d3f8d37f aliguori
                    TARGET_FMT_plx "\n", __func__, phys_addr,
234 c227f099 Anthony Liguori
                    (target_phys_addr_t)(phys_addr + size - 1));
235 5832d1f2 aliguori
            return -EINVAL;
236 5832d1f2 aliguori
    }
237 5832d1f2 aliguori
238 4495d6a7 Jan Kiszka
    old_flags = mem->flags;
239 5832d1f2 aliguori
240 4495d6a7 Jan Kiszka
    flags = (mem->flags & ~mask) | flags;
241 5832d1f2 aliguori
    mem->flags = flags;
242 5832d1f2 aliguori
243 4495d6a7 Jan Kiszka
    /* If nothing changed effectively, no need to issue ioctl */
244 4495d6a7 Jan Kiszka
    if (s->migration_log) {
245 4495d6a7 Jan Kiszka
        flags |= KVM_MEM_LOG_DIRTY_PAGES;
246 4495d6a7 Jan Kiszka
    }
247 4495d6a7 Jan Kiszka
    if (flags == old_flags) {
248 4495d6a7 Jan Kiszka
            return 0;
249 4495d6a7 Jan Kiszka
    }
250 4495d6a7 Jan Kiszka
251 5832d1f2 aliguori
    return kvm_set_user_memory_region(s, mem);
252 5832d1f2 aliguori
}
253 5832d1f2 aliguori
254 c227f099 Anthony Liguori
/*
 * Turn dirty page logging on for the slot covering exactly
 * [phys_addr, phys_addr + size).  Returns the result of
 * kvm_dirty_pages_log_change().
 */
int kvm_log_start(target_phys_addr_t phys_addr, ram_addr_t size)
{
    const int log_bit = KVM_MEM_LOG_DIRTY_PAGES;

    return kvm_dirty_pages_log_change(phys_addr, size, log_bit, log_bit);
}
260 5832d1f2 aliguori
261 c227f099 Anthony Liguori
/*
 * Clear the dirty page logging flag of the slot covering exactly
 * [phys_addr, phys_addr + size).  Returns the result of
 * kvm_dirty_pages_log_change().
 */
int kvm_log_stop(target_phys_addr_t phys_addr, ram_addr_t size)
{
    const int log_bit = KVM_MEM_LOG_DIRTY_PAGES;

    return kvm_dirty_pages_log_change(phys_addr, size, 0, log_bit);
}
267 5832d1f2 aliguori
268 7b8f3b78 Michael S. Tsirkin
static int kvm_set_migration_log(int enable)
269 4495d6a7 Jan Kiszka
{
270 4495d6a7 Jan Kiszka
    KVMState *s = kvm_state;
271 4495d6a7 Jan Kiszka
    KVMSlot *mem;
272 4495d6a7 Jan Kiszka
    int i, err;
273 4495d6a7 Jan Kiszka
274 4495d6a7 Jan Kiszka
    s->migration_log = enable;
275 4495d6a7 Jan Kiszka
276 4495d6a7 Jan Kiszka
    for (i = 0; i < ARRAY_SIZE(s->slots); i++) {
277 4495d6a7 Jan Kiszka
        mem = &s->slots[i];
278 4495d6a7 Jan Kiszka
279 4495d6a7 Jan Kiszka
        if (!!(mem->flags & KVM_MEM_LOG_DIRTY_PAGES) == enable) {
280 4495d6a7 Jan Kiszka
            continue;
281 4495d6a7 Jan Kiszka
        }
282 4495d6a7 Jan Kiszka
        err = kvm_set_user_memory_region(s, mem);
283 4495d6a7 Jan Kiszka
        if (err) {
284 4495d6a7 Jan Kiszka
            return err;
285 4495d6a7 Jan Kiszka
        }
286 4495d6a7 Jan Kiszka
    }
287 4495d6a7 Jan Kiszka
    return 0;
288 4495d6a7 Jan Kiszka
}
289 4495d6a7 Jan Kiszka
290 96c1606b Alexander Graf
/*
 * Return bit @nr (0 or 1) of the little-endian bitmap at @addr: bit 0 is the
 * least significant bit of addr[0], bit 8 the least significant of addr[1].
 */
static int test_le_bit(unsigned long nr, unsigned char *addr)
{
    unsigned char byte = addr[nr / 8];
    unsigned int shift = nr % 8;

    return (byte >> shift) & 1;
}
294 96c1606b Alexander Graf
295 5832d1f2 aliguori
/**
296 5832d1f2 aliguori
 * kvm_physical_sync_dirty_bitmap - Grab dirty bitmap from kernel space
297 5832d1f2 aliguori
 * This function updates qemu's dirty bitmap using cpu_physical_memory_set_dirty().
298 5832d1f2 aliguori
 * This means all bits are set to dirty.
299 5832d1f2 aliguori
 *
300 d3f8d37f aliguori
 * @start_add: start of logged region.
301 5832d1f2 aliguori
 * @end_addr: end of logged region.
302 5832d1f2 aliguori
 */
303 7b8f3b78 Michael S. Tsirkin
static int kvm_physical_sync_dirty_bitmap(target_phys_addr_t start_addr,
304 7b8f3b78 Michael S. Tsirkin
                                          target_phys_addr_t end_addr)
305 5832d1f2 aliguori
{
306 5832d1f2 aliguori
    KVMState *s = kvm_state;
307 151f7749 Jan Kiszka
    unsigned long size, allocated_size = 0;
308 c227f099 Anthony Liguori
    target_phys_addr_t phys_addr;
309 c227f099 Anthony Liguori
    ram_addr_t addr;
310 151f7749 Jan Kiszka
    KVMDirtyLog d;
311 151f7749 Jan Kiszka
    KVMSlot *mem;
312 151f7749 Jan Kiszka
    int ret = 0;
313 5832d1f2 aliguori
314 151f7749 Jan Kiszka
    d.dirty_bitmap = NULL;
315 151f7749 Jan Kiszka
    while (start_addr < end_addr) {
316 151f7749 Jan Kiszka
        mem = kvm_lookup_overlapping_slot(s, start_addr, end_addr);
317 151f7749 Jan Kiszka
        if (mem == NULL) {
318 151f7749 Jan Kiszka
            break;
319 151f7749 Jan Kiszka
        }
320 5832d1f2 aliguori
321 151f7749 Jan Kiszka
        size = ((mem->memory_size >> TARGET_PAGE_BITS) + 7) / 8;
322 151f7749 Jan Kiszka
        if (!d.dirty_bitmap) {
323 151f7749 Jan Kiszka
            d.dirty_bitmap = qemu_malloc(size);
324 151f7749 Jan Kiszka
        } else if (size > allocated_size) {
325 151f7749 Jan Kiszka
            d.dirty_bitmap = qemu_realloc(d.dirty_bitmap, size);
326 151f7749 Jan Kiszka
        }
327 151f7749 Jan Kiszka
        allocated_size = size;
328 151f7749 Jan Kiszka
        memset(d.dirty_bitmap, 0, allocated_size);
329 5832d1f2 aliguori
330 151f7749 Jan Kiszka
        d.slot = mem->slot;
331 5832d1f2 aliguori
332 6e489f3f Anthony Liguori
        if (kvm_vm_ioctl(s, KVM_GET_DIRTY_LOG, &d) == -1) {
333 151f7749 Jan Kiszka
            dprintf("ioctl failed %d\n", errno);
334 151f7749 Jan Kiszka
            ret = -1;
335 151f7749 Jan Kiszka
            break;
336 151f7749 Jan Kiszka
        }
337 5832d1f2 aliguori
338 151f7749 Jan Kiszka
        for (phys_addr = mem->start_addr, addr = mem->phys_offset;
339 151f7749 Jan Kiszka
             phys_addr < mem->start_addr + mem->memory_size;
340 151f7749 Jan Kiszka
             phys_addr += TARGET_PAGE_SIZE, addr += TARGET_PAGE_SIZE) {
341 96c1606b Alexander Graf
            unsigned char *bitmap = (unsigned char *)d.dirty_bitmap;
342 151f7749 Jan Kiszka
            unsigned nr = (phys_addr - mem->start_addr) >> TARGET_PAGE_BITS;
343 151f7749 Jan Kiszka
344 96c1606b Alexander Graf
            if (test_le_bit(nr, bitmap)) {
345 151f7749 Jan Kiszka
                cpu_physical_memory_set_dirty(addr);
346 151f7749 Jan Kiszka
            }
347 151f7749 Jan Kiszka
        }
348 151f7749 Jan Kiszka
        start_addr = phys_addr;
349 5832d1f2 aliguori
    }
350 5832d1f2 aliguori
    qemu_free(d.dirty_bitmap);
351 151f7749 Jan Kiszka
352 151f7749 Jan Kiszka
    return ret;
353 5832d1f2 aliguori
}
354 5832d1f2 aliguori
355 c227f099 Anthony Liguori
/*
 * Ask the kernel to coalesce MMIO writes to [start, start + size).
 *
 * Returns -ENOSYS when coalesced MMIO support is compiled out or not
 * available at run time, otherwise the result of the
 * KVM_REGISTER_COALESCED_MMIO request.
 */
int kvm_coalesce_mmio_region(target_phys_addr_t start, ram_addr_t size)
{
    int ret = -ENOSYS;
#ifdef KVM_CAP_COALESCED_MMIO
    KVMState *s = kvm_state;

    if (s->coalesced_mmio) {
        /* The initializer zeroes every member that is not named, so no
         * uninitialized stack contents are handed to the kernel. */
        struct kvm_coalesced_mmio_zone zone = {
            .addr = start,
            .size = size,
        };

        ret = kvm_vm_ioctl(s, KVM_REGISTER_COALESCED_MMIO, &zone);
    }
#endif

    return ret;
}
373 f65ed4c1 aliguori
374 c227f099 Anthony Liguori
/*
 * Stop coalescing MMIO writes to [start, start + size).
 *
 * Returns -ENOSYS when coalesced MMIO support is compiled out or not
 * available at run time, otherwise the result of the
 * KVM_UNREGISTER_COALESCED_MMIO request.
 */
int kvm_uncoalesce_mmio_region(target_phys_addr_t start, ram_addr_t size)
{
    int ret = -ENOSYS;
#ifdef KVM_CAP_COALESCED_MMIO
    KVMState *s = kvm_state;

    if (s->coalesced_mmio) {
        /* The initializer zeroes every member that is not named, so no
         * uninitialized stack contents are handed to the kernel. */
        struct kvm_coalesced_mmio_zone zone = {
            .addr = start,
            .size = size,
        };

        ret = kvm_vm_ioctl(s, KVM_UNREGISTER_COALESCED_MMIO, &zone);
    }
#endif

    return ret;
}
392 f65ed4c1 aliguori
393 ad7b8b33 Anthony Liguori
/*
 * Query KVM_CHECK_EXTENSION for @extension.  A negative result of the request
 * is reported as 0; any other value is passed through unchanged.
 */
int kvm_check_extension(KVMState *s, unsigned int extension)
{
    int ret = kvm_ioctl(s, KVM_CHECK_EXTENSION, extension);

    return ret < 0 ? 0 : ret;
}
404 ad7b8b33 Anthony Liguori
405 7b8f3b78 Michael S. Tsirkin
static void kvm_set_phys_mem(target_phys_addr_t start_addr,
406 7b8f3b78 Michael S. Tsirkin
                             ram_addr_t size,
407 7b8f3b78 Michael S. Tsirkin
                             ram_addr_t phys_offset)
408 46dbef6a Michael S. Tsirkin
{
409 46dbef6a Michael S. Tsirkin
    KVMState *s = kvm_state;
410 46dbef6a Michael S. Tsirkin
    ram_addr_t flags = phys_offset & ~TARGET_PAGE_MASK;
411 46dbef6a Michael S. Tsirkin
    KVMSlot *mem, old;
412 46dbef6a Michael S. Tsirkin
    int err;
413 46dbef6a Michael S. Tsirkin
414 46dbef6a Michael S. Tsirkin
    if (start_addr & ~TARGET_PAGE_MASK) {
415 46dbef6a Michael S. Tsirkin
        if (flags >= IO_MEM_UNASSIGNED) {
416 46dbef6a Michael S. Tsirkin
            if (!kvm_lookup_overlapping_slot(s, start_addr,
417 46dbef6a Michael S. Tsirkin
                                             start_addr + size)) {
418 46dbef6a Michael S. Tsirkin
                return;
419 46dbef6a Michael S. Tsirkin
            }
420 46dbef6a Michael S. Tsirkin
            fprintf(stderr, "Unaligned split of a KVM memory slot\n");
421 46dbef6a Michael S. Tsirkin
        } else {
422 46dbef6a Michael S. Tsirkin
            fprintf(stderr, "Only page-aligned memory slots supported\n");
423 46dbef6a Michael S. Tsirkin
        }
424 46dbef6a Michael S. Tsirkin
        abort();
425 46dbef6a Michael S. Tsirkin
    }
426 46dbef6a Michael S. Tsirkin
427 46dbef6a Michael S. Tsirkin
    /* KVM does not support read-only slots */
428 46dbef6a Michael S. Tsirkin
    phys_offset &= ~IO_MEM_ROM;
429 46dbef6a Michael S. Tsirkin
430 46dbef6a Michael S. Tsirkin
    while (1) {
431 46dbef6a Michael S. Tsirkin
        mem = kvm_lookup_overlapping_slot(s, start_addr, start_addr + size);
432 46dbef6a Michael S. Tsirkin
        if (!mem) {
433 46dbef6a Michael S. Tsirkin
            break;
434 46dbef6a Michael S. Tsirkin
        }
435 46dbef6a Michael S. Tsirkin
436 46dbef6a Michael S. Tsirkin
        if (flags < IO_MEM_UNASSIGNED && start_addr >= mem->start_addr &&
437 46dbef6a Michael S. Tsirkin
            (start_addr + size <= mem->start_addr + mem->memory_size) &&
438 46dbef6a Michael S. Tsirkin
            (phys_offset - start_addr == mem->phys_offset - mem->start_addr)) {
439 46dbef6a Michael S. Tsirkin
            /* The new slot fits into the existing one and comes with
440 46dbef6a Michael S. Tsirkin
             * identical parameters - nothing to be done. */
441 46dbef6a Michael S. Tsirkin
            return;
442 46dbef6a Michael S. Tsirkin
        }
443 46dbef6a Michael S. Tsirkin
444 46dbef6a Michael S. Tsirkin
        old = *mem;
445 46dbef6a Michael S. Tsirkin
446 46dbef6a Michael S. Tsirkin
        /* unregister the overlapping slot */
447 46dbef6a Michael S. Tsirkin
        mem->memory_size = 0;
448 46dbef6a Michael S. Tsirkin
        err = kvm_set_user_memory_region(s, mem);
449 46dbef6a Michael S. Tsirkin
        if (err) {
450 46dbef6a Michael S. Tsirkin
            fprintf(stderr, "%s: error unregistering overlapping slot: %s\n",
451 46dbef6a Michael S. Tsirkin
                    __func__, strerror(-err));
452 46dbef6a Michael S. Tsirkin
            abort();
453 46dbef6a Michael S. Tsirkin
        }
454 46dbef6a Michael S. Tsirkin
455 46dbef6a Michael S. Tsirkin
        /* Workaround for older KVM versions: we can't join slots, even not by
456 46dbef6a Michael S. Tsirkin
         * unregistering the previous ones and then registering the larger
457 46dbef6a Michael S. Tsirkin
         * slot. We have to maintain the existing fragmentation. Sigh.
458 46dbef6a Michael S. Tsirkin
         *
459 46dbef6a Michael S. Tsirkin
         * This workaround assumes that the new slot starts at the same
460 46dbef6a Michael S. Tsirkin
         * address as the first existing one. If not or if some overlapping
461 46dbef6a Michael S. Tsirkin
         * slot comes around later, we will fail (not seen in practice so far)
462 46dbef6a Michael S. Tsirkin
         * - and actually require a recent KVM version. */
463 46dbef6a Michael S. Tsirkin
        if (s->broken_set_mem_region &&
464 46dbef6a Michael S. Tsirkin
            old.start_addr == start_addr && old.memory_size < size &&
465 46dbef6a Michael S. Tsirkin
            flags < IO_MEM_UNASSIGNED) {
466 46dbef6a Michael S. Tsirkin
            mem = kvm_alloc_slot(s);
467 46dbef6a Michael S. Tsirkin
            mem->memory_size = old.memory_size;
468 46dbef6a Michael S. Tsirkin
            mem->start_addr = old.start_addr;
469 46dbef6a Michael S. Tsirkin
            mem->phys_offset = old.phys_offset;
470 46dbef6a Michael S. Tsirkin
            mem->flags = 0;
471 46dbef6a Michael S. Tsirkin
472 46dbef6a Michael S. Tsirkin
            err = kvm_set_user_memory_region(s, mem);
473 46dbef6a Michael S. Tsirkin
            if (err) {
474 46dbef6a Michael S. Tsirkin
                fprintf(stderr, "%s: error updating slot: %s\n", __func__,
475 46dbef6a Michael S. Tsirkin
                        strerror(-err));
476 46dbef6a Michael S. Tsirkin
                abort();
477 46dbef6a Michael S. Tsirkin
            }
478 46dbef6a Michael S. Tsirkin
479 46dbef6a Michael S. Tsirkin
            start_addr += old.memory_size;
480 46dbef6a Michael S. Tsirkin
            phys_offset += old.memory_size;
481 46dbef6a Michael S. Tsirkin
            size -= old.memory_size;
482 46dbef6a Michael S. Tsirkin
            continue;
483 46dbef6a Michael S. Tsirkin
        }
484 46dbef6a Michael S. Tsirkin
485 46dbef6a Michael S. Tsirkin
        /* register prefix slot */
486 46dbef6a Michael S. Tsirkin
        if (old.start_addr < start_addr) {
487 46dbef6a Michael S. Tsirkin
            mem = kvm_alloc_slot(s);
488 46dbef6a Michael S. Tsirkin
            mem->memory_size = start_addr - old.start_addr;
489 46dbef6a Michael S. Tsirkin
            mem->start_addr = old.start_addr;
490 46dbef6a Michael S. Tsirkin
            mem->phys_offset = old.phys_offset;
491 46dbef6a Michael S. Tsirkin
            mem->flags = 0;
492 46dbef6a Michael S. Tsirkin
493 46dbef6a Michael S. Tsirkin
            err = kvm_set_user_memory_region(s, mem);
494 46dbef6a Michael S. Tsirkin
            if (err) {
495 46dbef6a Michael S. Tsirkin
                fprintf(stderr, "%s: error registering prefix slot: %s\n",
496 46dbef6a Michael S. Tsirkin
                        __func__, strerror(-err));
497 46dbef6a Michael S. Tsirkin
                abort();
498 46dbef6a Michael S. Tsirkin
            }
499 46dbef6a Michael S. Tsirkin
        }
500 46dbef6a Michael S. Tsirkin
501 46dbef6a Michael S. Tsirkin
        /* register suffix slot */
502 46dbef6a Michael S. Tsirkin
        if (old.start_addr + old.memory_size > start_addr + size) {
503 46dbef6a Michael S. Tsirkin
            ram_addr_t size_delta;
504 46dbef6a Michael S. Tsirkin
505 46dbef6a Michael S. Tsirkin
            mem = kvm_alloc_slot(s);
506 46dbef6a Michael S. Tsirkin
            mem->start_addr = start_addr + size;
507 46dbef6a Michael S. Tsirkin
            size_delta = mem->start_addr - old.start_addr;
508 46dbef6a Michael S. Tsirkin
            mem->memory_size = old.memory_size - size_delta;
509 46dbef6a Michael S. Tsirkin
            mem->phys_offset = old.phys_offset + size_delta;
510 46dbef6a Michael S. Tsirkin
            mem->flags = 0;
511 46dbef6a Michael S. Tsirkin
512 46dbef6a Michael S. Tsirkin
            err = kvm_set_user_memory_region(s, mem);
513 46dbef6a Michael S. Tsirkin
            if (err) {
514 46dbef6a Michael S. Tsirkin
                fprintf(stderr, "%s: error registering suffix slot: %s\n",
515 46dbef6a Michael S. Tsirkin
                        __func__, strerror(-err));
516 46dbef6a Michael S. Tsirkin
                abort();
517 46dbef6a Michael S. Tsirkin
            }
518 46dbef6a Michael S. Tsirkin
        }
519 46dbef6a Michael S. Tsirkin
    }
520 46dbef6a Michael S. Tsirkin
521 46dbef6a Michael S. Tsirkin
    /* in case the KVM bug workaround already "consumed" the new slot */
522 46dbef6a Michael S. Tsirkin
    if (!size)
523 46dbef6a Michael S. Tsirkin
        return;
524 46dbef6a Michael S. Tsirkin
525 46dbef6a Michael S. Tsirkin
    /* KVM does not need to know about this memory */
526 46dbef6a Michael S. Tsirkin
    if (flags >= IO_MEM_UNASSIGNED)
527 46dbef6a Michael S. Tsirkin
        return;
528 46dbef6a Michael S. Tsirkin
529 46dbef6a Michael S. Tsirkin
    mem = kvm_alloc_slot(s);
530 46dbef6a Michael S. Tsirkin
    mem->memory_size = size;
531 46dbef6a Michael S. Tsirkin
    mem->start_addr = start_addr;
532 46dbef6a Michael S. Tsirkin
    mem->phys_offset = phys_offset;
533 46dbef6a Michael S. Tsirkin
    mem->flags = 0;
534 46dbef6a Michael S. Tsirkin
535 46dbef6a Michael S. Tsirkin
    err = kvm_set_user_memory_region(s, mem);
536 46dbef6a Michael S. Tsirkin
    if (err) {
537 46dbef6a Michael S. Tsirkin
        fprintf(stderr, "%s: error registering slot: %s\n", __func__,
538 46dbef6a Michael S. Tsirkin
                strerror(-err));
539 46dbef6a Michael S. Tsirkin
        abort();
540 46dbef6a Michael S. Tsirkin
    }
541 46dbef6a Michael S. Tsirkin
}
542 46dbef6a Michael S. Tsirkin
543 7b8f3b78 Michael S. Tsirkin
static void kvm_client_set_memory(struct CPUPhysMemoryClient *client,
544 7b8f3b78 Michael S. Tsirkin
                                  target_phys_addr_t start_addr,
545 7b8f3b78 Michael S. Tsirkin
                                  ram_addr_t size,
546 7b8f3b78 Michael S. Tsirkin
                                  ram_addr_t phys_offset)
547 7b8f3b78 Michael S. Tsirkin
{
548 7b8f3b78 Michael S. Tsirkin
        kvm_set_phys_mem(start_addr, size, phys_offset);
549 7b8f3b78 Michael S. Tsirkin
}
550 7b8f3b78 Michael S. Tsirkin
551 7b8f3b78 Michael S. Tsirkin
static int kvm_client_sync_dirty_bitmap(struct CPUPhysMemoryClient *client,
552 7b8f3b78 Michael S. Tsirkin
                                        target_phys_addr_t start_addr,
553 7b8f3b78 Michael S. Tsirkin
                                        target_phys_addr_t end_addr)
554 7b8f3b78 Michael S. Tsirkin
{
555 7b8f3b78 Michael S. Tsirkin
        return kvm_physical_sync_dirty_bitmap(start_addr, end_addr);
556 7b8f3b78 Michael S. Tsirkin
}
557 7b8f3b78 Michael S. Tsirkin
558 7b8f3b78 Michael S. Tsirkin
/* CPUPhysMemoryClient hook: forwards to kvm_set_migration_log() and returns
 * its result; @client is not used. */
static int kvm_client_migration_log(struct CPUPhysMemoryClient *client,
                                    int enable)
{
    int ret;

    (void)client;

    ret = kvm_set_migration_log(enable);
    return ret;
}
563 7b8f3b78 Michael S. Tsirkin
564 7b8f3b78 Michael S. Tsirkin
static CPUPhysMemoryClient kvm_cpu_phys_memory_client = {
565 7b8f3b78 Michael S. Tsirkin
        .set_memory = kvm_client_set_memory,
566 7b8f3b78 Michael S. Tsirkin
        .sync_dirty_bitmap = kvm_client_sync_dirty_bitmap,
567 7b8f3b78 Michael S. Tsirkin
        .migration_log = kvm_client_migration_log,
568 7b8f3b78 Michael S. Tsirkin
};
569 7b8f3b78 Michael S. Tsirkin
570 05330448 aliguori
int kvm_init(int smp_cpus)
571 05330448 aliguori
{
572 168ccc11 Jan Kiszka
    static const char upgrade_note[] =
573 168ccc11 Jan Kiszka
        "Please upgrade to at least kernel 2.6.29 or recent kvm-kmod\n"
574 168ccc11 Jan Kiszka
        "(see http://sourceforge.net/projects/kvm).\n";
575 05330448 aliguori
    KVMState *s;
576 05330448 aliguori
    int ret;
577 05330448 aliguori
    int i;
578 05330448 aliguori
579 9f8fd694 Mark McLoughlin
    if (smp_cpus > 1) {
580 9f8fd694 Mark McLoughlin
        fprintf(stderr, "No SMP KVM support, use '-smp 1'\n");
581 05330448 aliguori
        return -EINVAL;
582 9f8fd694 Mark McLoughlin
    }
583 05330448 aliguori
584 05330448 aliguori
    s = qemu_mallocz(sizeof(KVMState));
585 05330448 aliguori
586 e22a25c9 aliguori
#ifdef KVM_CAP_SET_GUEST_DEBUG
587 72cf2d4f Blue Swirl
    QTAILQ_INIT(&s->kvm_sw_breakpoints);
588 e22a25c9 aliguori
#endif
589 05330448 aliguori
    for (i = 0; i < ARRAY_SIZE(s->slots); i++)
590 05330448 aliguori
        s->slots[i].slot = i;
591 05330448 aliguori
592 05330448 aliguori
    s->vmfd = -1;
593 40ff6d7e Kevin Wolf
    s->fd = qemu_open("/dev/kvm", O_RDWR);
594 05330448 aliguori
    if (s->fd == -1) {
595 05330448 aliguori
        fprintf(stderr, "Could not access KVM kernel module: %m\n");
596 05330448 aliguori
        ret = -errno;
597 05330448 aliguori
        goto err;
598 05330448 aliguori
    }
599 05330448 aliguori
600 05330448 aliguori
    ret = kvm_ioctl(s, KVM_GET_API_VERSION, 0);
601 05330448 aliguori
    if (ret < KVM_API_VERSION) {
602 05330448 aliguori
        if (ret > 0)
603 05330448 aliguori
            ret = -EINVAL;
604 05330448 aliguori
        fprintf(stderr, "kvm version too old\n");
605 05330448 aliguori
        goto err;
606 05330448 aliguori
    }
607 05330448 aliguori
608 05330448 aliguori
    if (ret > KVM_API_VERSION) {
609 05330448 aliguori
        ret = -EINVAL;
610 05330448 aliguori
        fprintf(stderr, "kvm version not supported\n");
611 05330448 aliguori
        goto err;
612 05330448 aliguori
    }
613 05330448 aliguori
614 05330448 aliguori
    s->vmfd = kvm_ioctl(s, KVM_CREATE_VM, 0);
615 05330448 aliguori
    if (s->vmfd < 0)
616 05330448 aliguori
        goto err;
617 05330448 aliguori
618 05330448 aliguori
    /* initially, KVM allocated its own memory and we had to jump through
619 05330448 aliguori
     * hooks to make phys_ram_base point to this.  Modern versions of KVM
620 5579c7f3 pbrook
     * just use a user allocated buffer so we can use regular pages
621 05330448 aliguori
     * unmodified.  Make sure we have a sufficiently modern version of KVM.
622 05330448 aliguori
     */
623 ad7b8b33 Anthony Liguori
    if (!kvm_check_extension(s, KVM_CAP_USER_MEMORY)) {
624 ad7b8b33 Anthony Liguori
        ret = -EINVAL;
625 168ccc11 Jan Kiszka
        fprintf(stderr, "kvm does not support KVM_CAP_USER_MEMORY\n%s",
626 168ccc11 Jan Kiszka
                upgrade_note);
627 05330448 aliguori
        goto err;
628 05330448 aliguori
    }
629 05330448 aliguori
630 d85dc283 aliguori
    /* There was a nasty bug in < kvm-80 that prevents memory slots from being
631 d85dc283 aliguori
     * destroyed properly.  Since we rely on this capability, refuse to work
632 d85dc283 aliguori
     * with any kernel without this capability. */
633 ad7b8b33 Anthony Liguori
    if (!kvm_check_extension(s, KVM_CAP_DESTROY_MEMORY_REGION_WORKS)) {
634 ad7b8b33 Anthony Liguori
        ret = -EINVAL;
635 d85dc283 aliguori
636 d85dc283 aliguori
        fprintf(stderr,
637 168ccc11 Jan Kiszka
                "KVM kernel module broken (DESTROY_MEMORY_REGION).\n%s",
638 168ccc11 Jan Kiszka
                upgrade_note);
639 d85dc283 aliguori
        goto err;
640 d85dc283 aliguori
    }
641 d85dc283 aliguori
642 62a2744c Sheng Yang
    s->coalesced_mmio = 0;
643 f65ed4c1 aliguori
#ifdef KVM_CAP_COALESCED_MMIO
644 ad7b8b33 Anthony Liguori
    s->coalesced_mmio = kvm_check_extension(s, KVM_CAP_COALESCED_MMIO);
645 62a2744c Sheng Yang
    s->coalesced_mmio_ring = NULL;
646 f65ed4c1 aliguori
#endif
647 f65ed4c1 aliguori
648 e69917e2 Jan Kiszka
    s->broken_set_mem_region = 1;
649 e69917e2 Jan Kiszka
#ifdef KVM_CAP_JOIN_MEMORY_REGIONS_WORKS
650 e69917e2 Jan Kiszka
    ret = kvm_ioctl(s, KVM_CHECK_EXTENSION, KVM_CAP_JOIN_MEMORY_REGIONS_WORKS);
651 e69917e2 Jan Kiszka
    if (ret > 0) {
652 e69917e2 Jan Kiszka
        s->broken_set_mem_region = 0;
653 e69917e2 Jan Kiszka
    }
654 e69917e2 Jan Kiszka
#endif
655 e69917e2 Jan Kiszka
656 a0fb002c Jan Kiszka
    s->vcpu_events = 0;
657 a0fb002c Jan Kiszka
#ifdef KVM_CAP_VCPU_EVENTS
658 a0fb002c Jan Kiszka
    s->vcpu_events = kvm_check_extension(s, KVM_CAP_VCPU_EVENTS);
659 a0fb002c Jan Kiszka
#endif
660 a0fb002c Jan Kiszka
661 05330448 aliguori
    ret = kvm_arch_init(s, smp_cpus);
662 05330448 aliguori
    if (ret < 0)
663 05330448 aliguori
        goto err;
664 05330448 aliguori
665 05330448 aliguori
    kvm_state = s;
666 7b8f3b78 Michael S. Tsirkin
    cpu_register_phys_memory_client(&kvm_cpu_phys_memory_client);
667 05330448 aliguori
668 05330448 aliguori
    return 0;
669 05330448 aliguori
670 05330448 aliguori
err:
671 05330448 aliguori
    if (s) {
672 05330448 aliguori
        if (s->vmfd != -1)
673 05330448 aliguori
            close(s->vmfd);
674 05330448 aliguori
        if (s->fd != -1)
675 05330448 aliguori
            close(s->fd);
676 05330448 aliguori
    }
677 05330448 aliguori
    qemu_free(s);
678 05330448 aliguori
679 05330448 aliguori
    return ret;
680 05330448 aliguori
}
681 05330448 aliguori
682 afcea8cb Blue Swirl
static int kvm_handle_io(uint16_t port, void *data, int direction, int size,
683 afcea8cb Blue Swirl
                         uint32_t count)
684 05330448 aliguori
{
685 05330448 aliguori
    int i;
686 05330448 aliguori
    uint8_t *ptr = data;
687 05330448 aliguori
688 05330448 aliguori
    for (i = 0; i < count; i++) {
689 05330448 aliguori
        if (direction == KVM_EXIT_IO_IN) {
690 05330448 aliguori
            switch (size) {
691 05330448 aliguori
            case 1:
692 afcea8cb Blue Swirl
                stb_p(ptr, cpu_inb(port));
693 05330448 aliguori
                break;
694 05330448 aliguori
            case 2:
695 afcea8cb Blue Swirl
                stw_p(ptr, cpu_inw(port));
696 05330448 aliguori
                break;
697 05330448 aliguori
            case 4:
698 afcea8cb Blue Swirl
                stl_p(ptr, cpu_inl(port));
699 05330448 aliguori
                break;
700 05330448 aliguori
            }
701 05330448 aliguori
        } else {
702 05330448 aliguori
            switch (size) {
703 05330448 aliguori
            case 1:
704 afcea8cb Blue Swirl
                cpu_outb(port, ldub_p(ptr));
705 05330448 aliguori
                break;
706 05330448 aliguori
            case 2:
707 afcea8cb Blue Swirl
                cpu_outw(port, lduw_p(ptr));
708 05330448 aliguori
                break;
709 05330448 aliguori
            case 4:
710 afcea8cb Blue Swirl
                cpu_outl(port, ldl_p(ptr));
711 05330448 aliguori
                break;
712 05330448 aliguori
            }
713 05330448 aliguori
        }
714 05330448 aliguori
715 05330448 aliguori
        ptr += size;
716 05330448 aliguori
    }
717 05330448 aliguori
718 05330448 aliguori
    return 1;
719 05330448 aliguori
}
720 05330448 aliguori
721 62a2744c Sheng Yang
/*
 * Drain the coalesced-MMIO ring, if one is set up: every pending entry is
 * written out with cpu_physical_memory_write() and the ring's first index
 * is advanced, wrapping at KVM_COALESCED_MMIO_MAX.  Compiles to a no-op
 * when KVM_CAP_COALESCED_MMIO is not defined.
 */
void kvm_flush_coalesced_mmio_buffer(void)
{
#ifdef KVM_CAP_COALESCED_MMIO
    struct kvm_coalesced_mmio_ring *ring = kvm_state->coalesced_mmio_ring;

    if (!ring) {
        return;
    }

    while (ring->first != ring->last) {
        struct kvm_coalesced_mmio *ent = &ring->coalesced_mmio[ring->first];

        cpu_physical_memory_write(ent->phys_addr, ent->data, ent->len);
        /* FIXME smp_wmb() */
        ring->first = (ring->first + 1) % KVM_COALESCED_MMIO_MAX;
    }
#endif
}
739 f65ed4c1 aliguori
740 4c0960c0 Avi Kivity
/*
 * Fetch the vcpu registers with kvm_arch_get_registers() and flag env as
 * dirty.  Does nothing when env is already flagged dirty.
 */
void kvm_cpu_synchronize_state(CPUState *env)
{
    if (env->kvm_vcpu_dirty) {
        return;
    }

    kvm_arch_get_registers(env);
    env->kvm_vcpu_dirty = 1;
}
747 4c0960c0 Avi Kivity
748 05330448 aliguori
/*
 * Run the vcpu until an exit that cannot be handled by simply re-entering
 * the guest.
 *
 * Each iteration pushes dirty registers back with kvm_arch_put_registers(),
 * issues KVM_RUN with the iothread mutex released, flushes the coalesced
 * MMIO buffer and dispatches on run->exit_reason.  A handler result > 0
 * re-enters the guest; anything else leaves the loop.
 *
 * Returns the last handler result (never positive); 0 when the run was cut
 * short by exit_request, -EINTR or -EAGAIN, or by a debug stop.  Any other
 * KVM_RUN failure is fatal.
 */
int kvm_cpu_exec(CPUState *env)
{
    struct kvm_run *run = env->kvm_run;
    int ret;

    dprintf("kvm_cpu_exec()\n");

    do {
        if (env->exit_request) {
            dprintf("interrupt exit requested\n");
            ret = 0;
            break;
        }

        if (env->kvm_vcpu_dirty) {
            kvm_arch_put_registers(env);
            env->kvm_vcpu_dirty = 0;
        }

        kvm_arch_pre_run(env, run);
        qemu_mutex_unlock_iothread();
        ret = kvm_vcpu_ioctl(env, KVM_RUN, 0);
        qemu_mutex_lock_iothread();
        kvm_arch_post_run(env, run);

        if (ret == -EINTR || ret == -EAGAIN) {
            dprintf("io window exit\n");
            ret = 0;
            break;
        }

        if (ret < 0) {
            /* Always say why we are about to abort, not only in DEBUG_KVM
             * builds. */
            fprintf(stderr, "kvm run failed %s\n", strerror(-ret));
            abort();
        }

        kvm_flush_coalesced_mmio_buffer();

        ret = 0; /* exit loop */
        switch (run->exit_reason) {
        case KVM_EXIT_IO:
            dprintf("handle_io\n");
            ret = kvm_handle_io(run->io.port,
                                (uint8_t *)run + run->io.data_offset,
                                run->io.direction,
                                run->io.size,
                                run->io.count);
            break;
        case KVM_EXIT_MMIO:
            dprintf("handle_mmio\n");
            cpu_physical_memory_rw(run->mmio.phys_addr,
                                   run->mmio.data,
                                   run->mmio.len,
                                   run->mmio.is_write);
            ret = 1;
            break;
        case KVM_EXIT_IRQ_WINDOW_OPEN:
            dprintf("irq_window_open\n");
            break;
        case KVM_EXIT_SHUTDOWN:
            dprintf("shutdown\n");
            qemu_system_reset_request();
            ret = 1;
            break;
        case KVM_EXIT_UNKNOWN:
            dprintf("kvm_exit_unknown\n");
            break;
        case KVM_EXIT_FAIL_ENTRY:
            dprintf("kvm_exit_fail_entry\n");
            break;
        case KVM_EXIT_EXCEPTION:
            dprintf("kvm_exit_exception\n");
            break;
        case KVM_EXIT_DEBUG:
            dprintf("kvm_exit_debug\n");
#ifdef KVM_CAP_SET_GUEST_DEBUG
            if (kvm_arch_debug(&run->debug.arch)) {
                gdb_set_stop_cpu(env);
                vm_stop(EXCP_DEBUG);
                env->exception_index = EXCP_DEBUG;
                return 0;
            }
            /* re-enter, this exception was guest-internal */
            ret = 1;
#endif /* KVM_CAP_SET_GUEST_DEBUG */
            break;
        default:
            dprintf("kvm_arch_handle_exit\n");
            ret = kvm_arch_handle_exit(env, run);
            break;
        }
    } while (ret > 0);

    if (env->exit_request) {
        env->exit_request = 0;
        env->exception_index = EXCP_INTERRUPT;
    }

    return ret;
}
848 05330448 aliguori
849 984b5181 aliguori
/*
 * Issue an ioctl on the /dev/kvm descriptor (s->fd).  Exactly one variadic
 * argument is read, as a pointer, and passed through to ioctl().
 *
 * Returns the ioctl result, or -errno when ioctl() returns -1.
 */
int kvm_ioctl(KVMState *s, int type, ...)
{
    va_list args;
    void *param;
    int rc;

    va_start(args, type);
    param = va_arg(args, void *);
    va_end(args);

    rc = ioctl(s->fd, type, param);

    return (rc == -1) ? -errno : rc;
}
865 05330448 aliguori
866 984b5181 aliguori
/*
 * Issue an ioctl on the VM descriptor (s->vmfd).  Exactly one variadic
 * argument is read, as a pointer, and passed through to ioctl().
 *
 * Returns the ioctl result, or -errno when ioctl() returns -1.
 */
int kvm_vm_ioctl(KVMState *s, int type, ...)
{
    va_list args;
    void *param;
    int rc;

    va_start(args, type);
    param = va_arg(args, void *);
    va_end(args);

    rc = ioctl(s->vmfd, type, param);

    return (rc == -1) ? -errno : rc;
}
882 05330448 aliguori
883 984b5181 aliguori
/*
 * Issue an ioctl on the vcpu descriptor (env->kvm_fd).  Exactly one
 * variadic argument is read, as a pointer, and passed through to ioctl().
 *
 * Returns the ioctl result, or -errno when ioctl() returns -1.
 */
int kvm_vcpu_ioctl(CPUState *env, int type, ...)
{
    va_list args;
    void *param;
    int rc;

    va_start(args, type);
    param = va_arg(args, void *);
    va_end(args);

    rc = ioctl(env->kvm_fd, type, param);

    return (rc == -1) ? -errno : rc;
}
899 bd322087 aliguori
900 bd322087 aliguori
/*
 * Report the result of probing KVM_CAP_SYNC_MMU on the global kvm_state.
 * Returns 0 when the headers do not define that capability.
 */
int kvm_has_sync_mmu(void)
{
#ifdef KVM_CAP_SYNC_MMU
    return kvm_check_extension(kvm_state, KVM_CAP_SYNC_MMU);
#else
    return 0;
#endif
}
910 e22a25c9 aliguori
911 a0fb002c Jan Kiszka
int kvm_has_vcpu_events(void)
912 a0fb002c Jan Kiszka
{
913 a0fb002c Jan Kiszka
    return kvm_state->vcpu_events;
914 a0fb002c Jan Kiszka
}
915 a0fb002c Jan Kiszka
916 6f0437e8 Jan Kiszka
/*
 * Prepare a guest RAM region for use with KVM.
 *
 * When kvm_has_sync_mmu() reports no synchronous MMU, the range
 * [start, start + size) is marked MADV_DONTFORK.  The process exits with
 * status 1 if madvise() fails or if MADV_DONTFORK is not available at build
 * time.  Nothing is done when a synchronous MMU is present.
 */
void kvm_setup_guest_memory(void *start, size_t size)
{
    if (!kvm_has_sync_mmu()) {
#ifdef MADV_DONTFORK
        int ret = madvise(start, size, MADV_DONTFORK);

        if (ret) {
            /* Name the call that actually failed. */
            perror("madvise");
            exit(1);
        }
#else
        fprintf(stderr,
                "Need MADV_DONTFORK in absence of synchronous KVM MMU\n");
        exit(1);
#endif
    }
}
933 6f0437e8 Jan Kiszka
934 e22a25c9 aliguori
#ifdef KVM_CAP_SET_GUEST_DEBUG
935 fc5d642f Luiz Capitulino
/*
 * Invoke func(data) for the given vcpu.  With CONFIG_IOTHREAD the call is
 * only permitted when env is cpu_single_env; any other vcpu aborts.
 */
static void on_vcpu(CPUState *env, void (*func)(void *data), void *data)
{
#ifdef CONFIG_IOTHREAD
    if (cpu_single_env != env) {
        abort();
    }
#endif
    (*func)(data);
}
944 fc5d642f Luiz Capitulino
945 e22a25c9 aliguori
struct kvm_sw_breakpoint *kvm_find_sw_breakpoint(CPUState *env,
946 e22a25c9 aliguori
                                                 target_ulong pc)
947 e22a25c9 aliguori
{
948 e22a25c9 aliguori
    struct kvm_sw_breakpoint *bp;
949 e22a25c9 aliguori
950 72cf2d4f Blue Swirl
    QTAILQ_FOREACH(bp, &env->kvm_state->kvm_sw_breakpoints, entry) {
951 e22a25c9 aliguori
        if (bp->pc == pc)
952 e22a25c9 aliguori
            return bp;
953 e22a25c9 aliguori
    }
954 e22a25c9 aliguori
    return NULL;
955 e22a25c9 aliguori
}
956 e22a25c9 aliguori
957 e22a25c9 aliguori
/* Return non-zero when the software breakpoint list of env's KVM state is
 * not empty. */
int kvm_sw_breakpoints_active(CPUState *env)
{
    KVMState *s = env->kvm_state;

    return !QTAILQ_EMPTY(&s->kvm_sw_breakpoints);
}
961 e22a25c9 aliguori
962 452e4751 Glauber Costa
struct kvm_set_guest_debug_data {
963 452e4751 Glauber Costa
    struct kvm_guest_debug dbg;
964 452e4751 Glauber Costa
    CPUState *env;
965 452e4751 Glauber Costa
    int err;
966 452e4751 Glauber Costa
};
967 452e4751 Glauber Costa
968 452e4751 Glauber Costa
static void kvm_invoke_set_guest_debug(void *data)
969 452e4751 Glauber Costa
{
970 452e4751 Glauber Costa
    struct kvm_set_guest_debug_data *dbg_data = data;
971 b3807725 Jan Kiszka
    CPUState *env = dbg_data->env;
972 b3807725 Jan Kiszka
973 9ded2744 Jan Kiszka
    if (env->kvm_vcpu_dirty) {
974 b3807725 Jan Kiszka
        kvm_arch_put_registers(env);
975 9ded2744 Jan Kiszka
        env->kvm_vcpu_dirty = 0;
976 b3807725 Jan Kiszka
    }
977 b3807725 Jan Kiszka
    dbg_data->err = kvm_vcpu_ioctl(env, KVM_SET_GUEST_DEBUG, &dbg_data->dbg);
978 452e4751 Glauber Costa
}
979 452e4751 Glauber Costa
980 e22a25c9 aliguori
/*
 * Recompute the guest-debug control word for env and apply it.
 *
 * Single-stepping enables KVM_GUESTDBG_ENABLE | KVM_GUESTDBG_SINGLESTEP,
 * kvm_arch_update_guest_debug() then adjusts the settings, and
 * reinject_trap is OR-ed into the control word last.
 *
 * Returns the result of the KVM_SET_GUEST_DEBUG ioctl.
 */
int kvm_update_guest_debug(CPUState *env, unsigned long reinject_trap)
{
    struct kvm_set_guest_debug_data req;

    req.env = env;
    req.dbg.control = 0;
    if (env->singlestep_enabled) {
        req.dbg.control = KVM_GUESTDBG_ENABLE | KVM_GUESTDBG_SINGLESTEP;
    }

    kvm_arch_update_guest_debug(env, &req.dbg);
    req.dbg.control |= reinject_trap;

    on_vcpu(env, kvm_invoke_set_guest_debug, &req);

    return req.err;
}
995 e22a25c9 aliguori
996 e22a25c9 aliguori
/*
 * Insert a breakpoint and refresh the debug state of every vcpu.
 *
 * For GDB_BREAKPOINT_SW an existing entry at addr only has its use count
 * bumped; otherwise a new entry is allocated, inserted into the guest via
 * kvm_arch_insert_sw_breakpoint() and linked at the head of the breakpoint
 * list.  Every other type goes to kvm_arch_insert_hw_breakpoint().
 *
 * Returns 0 on success, -ENOMEM if the entry cannot be allocated, or the
 * first non-zero result of the arch hook or of kvm_update_guest_debug().
 */
int kvm_insert_breakpoint(CPUState *current_env, target_ulong addr,
                          target_ulong len, int type)
{
    struct kvm_sw_breakpoint *bp;
    CPUState *env;
    int err;

    if (type == GDB_BREAKPOINT_SW) {
        bp = kvm_find_sw_breakpoint(current_env, addr);
        if (bp) {
            bp->use_count++;
            return 0;
        }

        bp = qemu_malloc(sizeof(struct kvm_sw_breakpoint));
        if (!bp)
            return -ENOMEM;

        bp->pc = addr;
        bp->use_count = 1;
        err = kvm_arch_insert_sw_breakpoint(current_env, bp);
        if (err) {
            /* Release with the allocator's own counterpart, exactly as
             * kvm_remove_breakpoint() does. */
            qemu_free(bp);
            return err;
        }

        QTAILQ_INSERT_HEAD(&current_env->kvm_state->kvm_sw_breakpoints,
                          bp, entry);
    } else {
        err = kvm_arch_insert_hw_breakpoint(addr, len, type);
        if (err)
            return err;
    }

    for (env = first_cpu; env != NULL; env = env->next_cpu) {
        err = kvm_update_guest_debug(env, 0);
        if (err)
            return err;
    }
    return 0;
}
1037 e22a25c9 aliguori
1038 e22a25c9 aliguori
/*
 * Remove a breakpoint and refresh the debug state of every vcpu.
 *
 * For GDB_BREAKPOINT_SW the entry at addr is looked up; a use count above 1
 * is only decremented, otherwise the breakpoint is removed from the guest,
 * unlinked from the list and freed.  Every other type goes to
 * kvm_arch_remove_hw_breakpoint().
 *
 * Returns 0 on success, -ENOENT if no software breakpoint exists at addr,
 * or the first non-zero result of the arch hook or of
 * kvm_update_guest_debug().
 */
int kvm_remove_breakpoint(CPUState *current_env, target_ulong addr,
                          target_ulong len, int type)
{
    CPUState *cpu;
    int rc;

    if (type != GDB_BREAKPOINT_SW) {
        rc = kvm_arch_remove_hw_breakpoint(addr, len, type);
        if (rc) {
            return rc;
        }
    } else {
        struct kvm_sw_breakpoint *found;

        found = kvm_find_sw_breakpoint(current_env, addr);
        if (found == NULL) {
            return -ENOENT;
        }

        if (found->use_count > 1) {
            found->use_count--;
            return 0;
        }

        rc = kvm_arch_remove_sw_breakpoint(current_env, found);
        if (rc) {
            return rc;
        }

        QTAILQ_REMOVE(&current_env->kvm_state->kvm_sw_breakpoints, found,
                      entry);
        qemu_free(found);
    }

    for (cpu = first_cpu; cpu != NULL; cpu = cpu->next_cpu) {
        rc = kvm_update_guest_debug(cpu, 0);
        if (rc) {
            return rc;
        }
    }

    return 0;
}
1074 e22a25c9 aliguori
1075 e22a25c9 aliguori
/*
 * Drop every software and hardware breakpoint and refresh the debug state
 * of all vcpus.
 *
 * Each software breakpoint is removed from the guest through current_env,
 * falling back to the other vcpus if that fails, and is then unlinked from
 * the list and freed so that no stale entries remain.
 */
void kvm_remove_all_breakpoints(CPUState *current_env)
{
    struct kvm_sw_breakpoint *bp, *next;
    KVMState *s = current_env->kvm_state;
    CPUState *env;

    QTAILQ_FOREACH_SAFE(bp, &s->kvm_sw_breakpoints, entry, next) {
        if (kvm_arch_remove_sw_breakpoint(current_env, bp) != 0) {
            /* Try harder to find a CPU that currently sees the breakpoint. */
            for (env = first_cpu; env != NULL; env = env->next_cpu) {
                if (kvm_arch_remove_sw_breakpoint(env, bp) == 0)
                    break;
            }
        }
        /* Unlink and release the entry; without this the list keeps the
         * entries and their memory is never freed. */
        QTAILQ_REMOVE(&s->kvm_sw_breakpoints, bp, entry);
        qemu_free(bp);
    }
    kvm_arch_remove_all_hw_breakpoints();

    for (env = first_cpu; env != NULL; env = env->next_cpu)
        kvm_update_guest_debug(env, 0);
}
1095 e22a25c9 aliguori
1096 e22a25c9 aliguori
#else /* !KVM_CAP_SET_GUEST_DEBUG */
1097 e22a25c9 aliguori
1098 e22a25c9 aliguori
int kvm_update_guest_debug(CPUState *env, unsigned long reinject_trap)
1099 e22a25c9 aliguori
{
1100 e22a25c9 aliguori
    return -EINVAL;
1101 e22a25c9 aliguori
}
1102 e22a25c9 aliguori
1103 e22a25c9 aliguori
int kvm_insert_breakpoint(CPUState *current_env, target_ulong addr,
1104 e22a25c9 aliguori
                          target_ulong len, int type)
1105 e22a25c9 aliguori
{
1106 e22a25c9 aliguori
    return -EINVAL;
1107 e22a25c9 aliguori
}
1108 e22a25c9 aliguori
1109 e22a25c9 aliguori
int kvm_remove_breakpoint(CPUState *current_env, target_ulong addr,
1110 e22a25c9 aliguori
                          target_ulong len, int type)
1111 e22a25c9 aliguori
{
1112 e22a25c9 aliguori
    return -EINVAL;
1113 e22a25c9 aliguori
}
1114 e22a25c9 aliguori
1115 e22a25c9 aliguori
void kvm_remove_all_breakpoints(CPUState *current_env)
1116 e22a25c9 aliguori
{
1117 e22a25c9 aliguori
}
1118 e22a25c9 aliguori
#endif /* !KVM_CAP_SET_GUEST_DEBUG */