/* xen-all.c @ fd4aa979 */
/*
 * Copyright (C) 2010 Citrix Ltd.
 *
 * This work is licensed under the terms of the GNU GPL, version 2. See
 * the COPYING file in the top-level directory.
 *
 * Contributions after 2012-01-13 are licensed under the terms of the
 * GNU GPL, version 2 or (at your option) any later version.
 */

#include <sys/mman.h>

#include "hw/pci.h"
#include "hw/pc.h"
#include "hw/xen_common.h"
#include "hw/xen_backend.h"

#include "range.h"
#include "xen-mapcache.h"
#include "trace.h"
#include "exec-memory.h"

#include <xen/hvm/ioreq.h>
#include <xen/hvm/params.h>
#include <xen/hvm/e820.h>

//#define DEBUG_XEN

#ifdef DEBUG_XEN
#define DPRINTF(fmt, ...) \
    do { fprintf(stderr, "xen: " fmt, ## __VA_ARGS__); } while (0)
#else
#define DPRINTF(fmt, ...) \
    do { } while (0)
#endif

static MemoryRegion ram_memory, ram_640k, ram_lo, ram_hi;
static MemoryRegion *framebuffer;

/* Compatibility with older versions of Xen */
#if __XEN_LATEST_INTERFACE_VERSION__ < 0x0003020a
static inline uint32_t xen_vcpu_eport(shared_iopage_t *shared_page, int i)
{
    return shared_page->vcpu_iodata[i].vp_eport;
}
static inline ioreq_t *xen_vcpu_ioreq(shared_iopage_t *shared_page, int vcpu)
{
    return &shared_page->vcpu_iodata[vcpu].vp_ioreq;
}
# define FMT_ioreq_size PRIx64
#else
static inline uint32_t xen_vcpu_eport(shared_iopage_t *shared_page, int i)
{
    return shared_page->vcpu_ioreq[i].vp_eport;
}
static inline ioreq_t *xen_vcpu_ioreq(shared_iopage_t *shared_page, int vcpu)
{
    return &shared_page->vcpu_ioreq[vcpu];
}
# define FMT_ioreq_size "u"
#endif
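/*
 * Note: with interface versions older than 0x0003020a, the per-vcpu ioreq
 * state is reached through shared_page->vcpu_iodata[]; newer headers
 * expose the vcpu_ioreq[] array directly. Judging from the two print
 * formats above (PRIx64 vs "u"), the ioreq count/size fields also shrank
 * from 64 to 32 bits across that change.
 */
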

#define BUFFER_IO_MAX_DELAY  100

typedef struct XenPhysmap {
    target_phys_addr_t start_addr;
    ram_addr_t size;
    MemoryRegion *mr;
    target_phys_addr_t phys_offset;

    QLIST_ENTRY(XenPhysmap) list;
} XenPhysmap;

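/*
 * Per-domain state used while serving ioreqs: the shared and buffered io
 * pages mapped from the guest, one local event-channel port per vcpu, and
 * the list of physmap relocations performed for dirty-VRAM tracking.
 */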
typedef struct XenIOState {
    shared_iopage_t *shared_page;
    buffered_iopage_t *buffered_io_page;
    QEMUTimer *buffered_io_timer;
    /* the evtchn port for polling the notification */
    evtchn_port_t *ioreq_local_port;
    /* the evtchn fd for polling */
    XenEvtchn xce_handle;
    /* which vcpu we are serving */
    int send_vcpu;

    struct xs_handle *xenstore;
    MemoryListener memory_listener;
    QLIST_HEAD(, XenPhysmap) physmap;
    target_phys_addr_t free_phys_offset;
    const XenPhysmap *log_for_dirtybit;

    Notifier exit;
} XenIOState;

/* Xen-specific functions for the PIIX PCI bridge */

int xen_pci_slot_get_pirq(PCIDevice *pci_dev, int irq_num)
{
    return irq_num + ((pci_dev->devfn >> 3) << 2);
}

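/*
 * The swizzle in xen_pci_slot_get_pirq() above gives each PCI slot four
 * consecutive link values: for example devfn 0x10 (slot 2, function 0)
 * asserting INTA (irq_num 0) yields 0 + (2 << 2) = pirq 8.
 */
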
void xen_piix3_set_irq(void *opaque, int irq_num, int level)
{
    xc_hvm_set_pci_intx_level(xen_xc, xen_domid, 0, 0, irq_num >> 2,
                              irq_num & 3, level);
}

void xen_piix_pci_write_config_client(uint32_t address, uint32_t val, int len)
{
    int i;

    /* Scan for updates to PCI link routes (0x60-0x63). */
    for (i = 0; i < len; i++) {
        uint8_t v = (val >> (8 * i)) & 0xff;
        if (v & 0x80) {
            v = 0;
        }
        v &= 0xf;
        if (((address + i) >= 0x60) && ((address + i) <= 0x63)) {
            xc_hvm_set_pci_link_route(xen_xc, xen_domid, address + i - 0x60, v);
        }
    }
}

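/*
 * In the PIIX3 PIRQ route control registers written above, a set bit 7
 * means the link's routing is disabled, so such a value is cleared before
 * the low four bits (the routed ISA IRQ) are handed to Xen.
 */
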
void xen_cmos_set_s3_resume(void *opaque, int irq, int level)
{
    pc_cmos_set_s3_resume(opaque, irq, level);
    if (level) {
        xc_set_hvm_param(xen_xc, xen_domid, HVM_PARAM_ACPI_S_STATE, 3);
    }
}

/* Xen Interrupt Controller */

static void xen_set_irq(void *opaque, int irq, int level)
{
    xc_hvm_set_isa_irq_level(xen_xc, xen_domid, irq, level);
}

qemu_irq *xen_interrupt_controller_init(void)
{
    return qemu_allocate_irqs(xen_set_irq, NULL, 16);
}

/* Memory Ops */

static void xen_ram_init(ram_addr_t ram_size)
{
    MemoryRegion *sysmem = get_system_memory();
    ram_addr_t below_4g_mem_size, above_4g_mem_size = 0;
    ram_addr_t block_len;

    block_len = ram_size;
    if (ram_size >= HVM_BELOW_4G_RAM_END) {
        /* Xen does not allocate the memory contiguously: it keeps a hole
         * of size HVM_BELOW_4G_MMIO_LENGTH starting at
         * HVM_BELOW_4G_MMIO_START.
         */
        block_len += HVM_BELOW_4G_MMIO_LENGTH;
    }
    memory_region_init_ram(&ram_memory, "xen.ram", block_len);
    vmstate_register_ram_global(&ram_memory);

    if (ram_size >= HVM_BELOW_4G_RAM_END) {
        above_4g_mem_size = ram_size - HVM_BELOW_4G_RAM_END;
        below_4g_mem_size = HVM_BELOW_4G_RAM_END;
    } else {
        below_4g_mem_size = ram_size;
    }

    memory_region_init_alias(&ram_640k, "xen.ram.640k",
                             &ram_memory, 0, 0xa0000);
    memory_region_add_subregion(sysmem, 0, &ram_640k);
    /* Skip the VGA I/O memory space: it will be registered later by the
     * emulated VGA device.
     *
     * The area between 0xc0000 and 0x100000 will be used by SeaBIOS to
     * load the option ROMs, so it is registered here as RAM.
     */
    memory_region_init_alias(&ram_lo, "xen.ram.lo",
                             &ram_memory, 0xc0000, below_4g_mem_size - 0xc0000);
    memory_region_add_subregion(sysmem, 0xc0000, &ram_lo);
    if (above_4g_mem_size > 0) {
        memory_region_init_alias(&ram_hi, "xen.ram.hi",
                                 &ram_memory, 0x100000000ULL,
                                 above_4g_mem_size);
        memory_region_add_subregion(sysmem, 0x100000000ULL, &ram_hi);
    }
}

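/*
 * The guest-physical layout built by xen_ram_init() above is roughly:
 *
 *   0x000000000 - 0x00009ffff : xen.ram.640k (alias of xen.ram)
 *   0x0000a0000 - 0x0000bffff : hole for the VGA window, registered later
 *   0x0000c0000 - below 4G    : xen.ram.lo   (alias of xen.ram)
 *   0x100000000 and up        : xen.ram.hi, only when ram_size reaches
 *                               HVM_BELOW_4G_RAM_END
 */
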
void xen_ram_alloc(ram_addr_t ram_addr, ram_addr_t size, MemoryRegion *mr)
{
    unsigned long nr_pfn;
    xen_pfn_t *pfn_list;
    int i;

    if (mr == &ram_memory) {
        return;
    }

    trace_xen_ram_alloc(ram_addr, size);

    nr_pfn = size >> TARGET_PAGE_BITS;
    pfn_list = g_malloc(sizeof (*pfn_list) * nr_pfn);

    for (i = 0; i < nr_pfn; i++) {
        pfn_list[i] = (ram_addr >> TARGET_PAGE_BITS) + i;
    }

    if (xc_domain_populate_physmap_exact(xen_xc, xen_domid, nr_pfn, 0, 0, pfn_list)) {
        hw_error("xen: failed to populate ram at " RAM_ADDR_FMT, ram_addr);
    }

    g_free(pfn_list);
}

static XenPhysmap *get_physmapping(XenIOState *state,
                                   target_phys_addr_t start_addr, ram_addr_t size)
{
    XenPhysmap *physmap = NULL;

    start_addr &= TARGET_PAGE_MASK;

    QLIST_FOREACH(physmap, &state->physmap, list) {
        if (range_covers_byte(physmap->start_addr, physmap->size, start_addr)) {
            return physmap;
        }
    }
    return NULL;
}

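/*
 * xen_add_to_physmap() below relocates the pages backing 'mr' into the
 * guest physical address space at start_addr: each XENMAPSPACE_gmfn call
 * moves one page from its frame number in QEMU's RAM block to the target
 * guest frame, so that Xen's dirty-VRAM tracking sees the framebuffer at
 * the address the guest actually scans out from.
 */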
#if CONFIG_XEN_CTRL_INTERFACE_VERSION >= 340
static int xen_add_to_physmap(XenIOState *state,
                              target_phys_addr_t start_addr,
                              ram_addr_t size,
                              MemoryRegion *mr,
                              target_phys_addr_t offset_within_region)
{
    unsigned long i = 0;
    int rc = 0;
    XenPhysmap *physmap = NULL;
    target_phys_addr_t pfn, start_gpfn;
    target_phys_addr_t phys_offset = memory_region_get_ram_addr(mr);

    if (get_physmapping(state, start_addr, size)) {
        return 0;
    }
    if (size <= 0) {
        return -1;
    }

    /* Xen can only handle a single dirty log region for now and we want
     * the linear framebuffer to be that region.
     * Avoid tracking any region that is not videoram, and avoid tracking
     * the legacy VGA region. */
    if (mr == framebuffer && start_addr > 0xbffff) {
        goto go_physmap;
    }
    return -1;

go_physmap:
    DPRINTF("mapping vram to %llx - %llx\n", start_addr, start_addr + size);

    pfn = phys_offset >> TARGET_PAGE_BITS;
    start_gpfn = start_addr >> TARGET_PAGE_BITS;
    for (i = 0; i < size >> TARGET_PAGE_BITS; i++) {
        unsigned long idx = pfn + i;
        xen_pfn_t gpfn = start_gpfn + i;

        rc = xc_domain_add_to_physmap(xen_xc, xen_domid, XENMAPSPACE_gmfn, idx, gpfn);
        if (rc) {
            DPRINTF("add_to_physmap MFN %"PRI_xen_pfn" to PFN %"
                    PRI_xen_pfn" failed: %d\n", idx, gpfn, rc);
            return -rc;
        }
    }

    physmap = g_malloc(sizeof (XenPhysmap));

    physmap->start_addr = start_addr;
    physmap->size = size;
    physmap->phys_offset = phys_offset;

    QLIST_INSERT_HEAD(&state->physmap, physmap, list);

    xc_domain_pin_memory_cacheattr(xen_xc, xen_domid,
                                   start_addr >> TARGET_PAGE_BITS,
                                   (start_addr + size) >> TARGET_PAGE_BITS,
                                   XEN_DOMCTL_MEM_CACHEATTR_WB);
    return 0;
}

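/*
 * Removal is the inverse relocation: the pages are moved from their
 * guest-visible frames at start_addr back to the original phys_offset
 * frames recorded in the XenPhysmap entry, which is then dropped.
 */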
static int xen_remove_from_physmap(XenIOState *state,
                                   target_phys_addr_t start_addr,
                                   ram_addr_t size)
{
    unsigned long i = 0;
    int rc = 0;
    XenPhysmap *physmap = NULL;
    target_phys_addr_t phys_offset = 0;

    physmap = get_physmapping(state, start_addr, size);
    if (physmap == NULL) {
        return -1;
    }

    phys_offset = physmap->phys_offset;
    size = physmap->size;

    DPRINTF("unmapping vram to %llx - %llx, from %llx\n",
            phys_offset, phys_offset + size, start_addr);

    size >>= TARGET_PAGE_BITS;
    start_addr >>= TARGET_PAGE_BITS;
    phys_offset >>= TARGET_PAGE_BITS;
    for (i = 0; i < size; i++) {
        unsigned long idx = start_addr + i;
        xen_pfn_t gpfn = phys_offset + i;

        rc = xc_domain_add_to_physmap(xen_xc, xen_domid, XENMAPSPACE_gmfn, idx, gpfn);
        if (rc) {
            fprintf(stderr, "add_to_physmap MFN %"PRI_xen_pfn" to PFN %"
                    PRI_xen_pfn" failed: %d\n", idx, gpfn, rc);
            return -rc;
        }
    }

    QLIST_REMOVE(physmap, list);
    if (state->log_for_dirtybit == physmap) {
        state->log_for_dirtybit = NULL;
    }
    g_free(physmap);    /* allocated with g_malloc() in xen_add_to_physmap() */

    return 0;
}

#else
static int xen_add_to_physmap(XenIOState *state,
                              target_phys_addr_t start_addr,
                              ram_addr_t size,
                              MemoryRegion *mr,
                              target_phys_addr_t offset_within_region)
{
    return -ENOSYS;
}

static int xen_remove_from_physmap(XenIOState *state,
                                   target_phys_addr_t start_addr,
                                   ram_addr_t size)
{
    return -ENOSYS;
}
#endif

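/*
 * Called for every section added to or removed from the address space.
 * The filter below only lets through RAM sections other than the main
 * xen.ram block, and only when dirty logging is enabled on an add or
 * disabled on a delete; everything else is ignored.
 */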
static void xen_set_memory(struct MemoryListener *listener,
                           MemoryRegionSection *section,
                           bool add)
{
    XenIOState *state = container_of(listener, XenIOState, memory_listener);
    target_phys_addr_t start_addr = section->offset_within_address_space;
    ram_addr_t size = section->size;
    bool log_dirty = memory_region_is_logging(section->mr);
    hvmmem_type_t mem_type;

    if (!memory_region_is_ram(section->mr)) {
        return;
    }

    if (!(section->mr != &ram_memory
          && ((log_dirty && add) || (!log_dirty && !add)))) {
        return;
    }

    trace_xen_client_set_memory(start_addr, size, log_dirty);

    start_addr &= TARGET_PAGE_MASK;
    size = TARGET_PAGE_ALIGN(size);

    if (add) {
        if (!memory_region_is_rom(section->mr)) {
            xen_add_to_physmap(state, start_addr, size,
                               section->mr, section->offset_within_region);
        } else {
            mem_type = HVMMEM_ram_ro;
            if (xc_hvm_set_mem_type(xen_xc, xen_domid, mem_type,
                                    start_addr >> TARGET_PAGE_BITS,
                                    size >> TARGET_PAGE_BITS)) {
                DPRINTF("xc_hvm_set_mem_type error, addr: "TARGET_FMT_plx"\n",
                        start_addr);
            }
        }
    } else {
        if (xen_remove_from_physmap(state, start_addr, size) < 0) {
            DPRINTF("physmapping does not exist at "TARGET_FMT_plx"\n", start_addr);
        }
    }
}

static void xen_region_add(MemoryListener *listener,
                           MemoryRegionSection *section)
{
    xen_set_memory(listener, section, true);
}

static void xen_region_del(MemoryListener *listener,
                           MemoryRegionSection *section)
{
    xen_set_memory(listener, section, false);
}

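/*
 * xen_sync_dirty_bitmap() asks Xen which pages of the tracked VRAM range
 * were written since the last call: one bit per guest page, packed into
 * unsigned longs, which is then replayed into QEMU's own dirty state for
 * the framebuffer region.
 */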
static void xen_sync_dirty_bitmap(XenIOState *state,
                                  target_phys_addr_t start_addr,
                                  ram_addr_t size)
{
    target_phys_addr_t npages = size >> TARGET_PAGE_BITS;
    const int width = sizeof(unsigned long) * 8;
    unsigned long bitmap[(npages + width - 1) / width];
    int rc, i, j;
    const XenPhysmap *physmap = NULL;

    physmap = get_physmapping(state, start_addr, size);
    if (physmap == NULL) {
        /* not handled */
        return;
    }

    if (state->log_for_dirtybit == NULL) {
        state->log_for_dirtybit = physmap;
    } else if (state->log_for_dirtybit != physmap) {
        /* Only one range for dirty bitmap can be tracked. */
        return;
    }

    rc = xc_hvm_track_dirty_vram(xen_xc, xen_domid,
                                 start_addr >> TARGET_PAGE_BITS, npages,
                                 bitmap);
    if (rc < 0) {
        if (rc != -ENODATA) {
            fprintf(stderr, "xen: track_dirty_vram failed (0x" TARGET_FMT_plx
                    ", 0x" TARGET_FMT_plx "): %s\n",
                    start_addr, start_addr + size, strerror(-rc));
        }
        return;
    }

    for (i = 0; i < ARRAY_SIZE(bitmap); i++) {
        unsigned long map = bitmap[i];
        while (map != 0) {
            j = ffsl(map) - 1;
            map &= ~(1ul << j);
            memory_region_set_dirty(framebuffer,
                                    (i * width + j) * TARGET_PAGE_SIZE,
                                    TARGET_PAGE_SIZE);
        }
    }
}

static void xen_log_start(MemoryListener *listener,
                          MemoryRegionSection *section)
{
    XenIOState *state = container_of(listener, XenIOState, memory_listener);

    xen_sync_dirty_bitmap(state, section->offset_within_address_space,
                          section->size);
}

static void xen_log_stop(MemoryListener *listener, MemoryRegionSection *section)
{
    XenIOState *state = container_of(listener, XenIOState, memory_listener);

    state->log_for_dirtybit = NULL;
    /* Disable dirty bit tracking */
    xc_hvm_track_dirty_vram(xen_xc, xen_domid, 0, 0, NULL);
}

static void xen_log_sync(MemoryListener *listener, MemoryRegionSection *section)
{
    XenIOState *state = container_of(listener, XenIOState, memory_listener);

    xen_sync_dirty_bitmap(state, section->offset_within_address_space,
                          section->size);
}

static void xen_log_global_start(MemoryListener *listener)
{
}

static void xen_log_global_stop(MemoryListener *listener)
{
}

static MemoryListener xen_memory_listener = {
    .region_add = xen_region_add,
    .region_del = xen_region_del,
    .log_start = xen_log_start,
    .log_stop = xen_log_stop,
    .log_sync = xen_log_sync,
    .log_global_start = xen_log_global_start,
    .log_global_stop = xen_log_global_stop,
};

/* VCPU Operations, MMIO, IO ring ... */

static void xen_reset_vcpu(void *opaque)
{
    CPUState *env = opaque;

    env->halted = 1;
}

void xen_vcpu_init(void)
{
    CPUState *first_cpu;

    if ((first_cpu = qemu_get_cpu(0))) {
        qemu_register_reset(xen_reset_vcpu, first_cpu);
        xen_reset_vcpu(first_cpu);
    }
}

/* Get the ioreq packet from shared memory. */
static ioreq_t *cpu_get_ioreq_from_shared_memory(XenIOState *state, int vcpu)
{
    ioreq_t *req = xen_vcpu_ioreq(state->shared_page, vcpu);

    if (req->state != STATE_IOREQ_READY) {
        DPRINTF("I/O request not ready: "
                "%x, ptr: %x, port: %"PRIx64", "
                "data: %"PRIx64", count: %" FMT_ioreq_size ", size: %" FMT_ioreq_size "\n",
                req->state, req->data_is_ptr, req->addr,
                req->data, req->count, req->size);
        return NULL;
    }

    xen_rmb(); /* see IOREQ_READY /then/ read contents of ioreq */

    req->state = STATE_IOREQ_INPROCESS;
    return req;
}

/* Poll the event channel for a pending port notification and return the
 * corresponding vcpu's ioreq packet, or NULL if nothing is pending. */
static ioreq_t *cpu_get_ioreq(XenIOState *state)
{
    int i;
    evtchn_port_t port;

    port = xc_evtchn_pending(state->xce_handle);
    if (port != -1) {
        for (i = 0; i < smp_cpus; i++) {
            if (state->ioreq_local_port[i] == port) {
                break;
            }
        }

        if (i == smp_cpus) {
            hw_error("Fatal error while trying to get io event!\n");
        }

        /* unmask the wanted port again */
        xc_evtchn_unmask(state->xce_handle, port);

        /* get the io packet from shared memory */
        state->send_vcpu = i;
        return cpu_get_ioreq_from_shared_memory(state, i);
    }

    /* read error or read nothing */
    return NULL;
}

static uint32_t do_inp(pio_addr_t addr, unsigned long size) |
572 |
{ |
573 |
switch (size) {
|
574 |
case 1: |
575 |
return cpu_inb(addr);
|
576 |
case 2: |
577 |
return cpu_inw(addr);
|
578 |
case 4: |
579 |
return cpu_inl(addr);
|
580 |
default:
|
581 |
hw_error("inp: bad size: %04"FMT_pioaddr" %lx", addr, size); |
582 |
} |
583 |
} |
584 |
|
585 |
static void do_outp(pio_addr_t addr, |
586 |
unsigned long size, uint32_t val) |
587 |
{ |
588 |
switch (size) {
|
589 |
case 1: |
590 |
return cpu_outb(addr, val);
|
591 |
case 2: |
592 |
return cpu_outw(addr, val);
|
593 |
case 4: |
594 |
return cpu_outl(addr, val);
|
595 |
default:
|
596 |
hw_error("outp: bad size: %04"FMT_pioaddr" %lx", addr, size); |
597 |
} |
598 |
} |
599 |
|
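/*
 * ioreq_t fields as used by the two dispatch helpers below:
 *   dir         - IOREQ_READ or IOREQ_WRITE, from the guest's viewpoint
 *   df          - the rep instruction's direction flag; when set, the
 *                 effective address moves backwards (sign == -1)
 *   data_is_ptr - 'data' is a guest-physical address to copy through,
 *                 rather than an immediate value
 *   count, size - number of repetitions and bytes per access
 */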
static void cpu_ioreq_pio(ioreq_t *req)
{
    int i, sign;

    sign = req->df ? -1 : 1;

    if (req->dir == IOREQ_READ) {
        if (!req->data_is_ptr) {
            req->data = do_inp(req->addr, req->size);
        } else {
            uint32_t tmp;

            for (i = 0; i < req->count; i++) {
                tmp = do_inp(req->addr, req->size);
                cpu_physical_memory_write(req->data + (sign * i * req->size),
                                          (uint8_t *) &tmp, req->size);
            }
        }
    } else if (req->dir == IOREQ_WRITE) {
        if (!req->data_is_ptr) {
            do_outp(req->addr, req->size, req->data);
        } else {
            for (i = 0; i < req->count; i++) {
                uint32_t tmp = 0;

                cpu_physical_memory_read(req->data + (sign * i * req->size),
                                         (uint8_t *) &tmp, req->size);
                do_outp(req->addr, req->size, tmp);
            }
        }
    }
}

static void cpu_ioreq_move(ioreq_t *req)
{
    int i, sign;

    sign = req->df ? -1 : 1;

    if (!req->data_is_ptr) {
        if (req->dir == IOREQ_READ) {
            for (i = 0; i < req->count; i++) {
                cpu_physical_memory_read(req->addr + (sign * i * req->size),
                                         (uint8_t *) &req->data, req->size);
            }
        } else if (req->dir == IOREQ_WRITE) {
            for (i = 0; i < req->count; i++) {
                cpu_physical_memory_write(req->addr + (sign * i * req->size),
                                          (uint8_t *) &req->data, req->size);
            }
        }
    } else {
        uint64_t tmp;

        if (req->dir == IOREQ_READ) {
            for (i = 0; i < req->count; i++) {
                cpu_physical_memory_read(req->addr + (sign * i * req->size),
                                         (uint8_t *) &tmp, req->size);
                cpu_physical_memory_write(req->data + (sign * i * req->size),
                                          (uint8_t *) &tmp, req->size);
            }
        } else if (req->dir == IOREQ_WRITE) {
            for (i = 0; i < req->count; i++) {
                cpu_physical_memory_read(req->data + (sign * i * req->size),
                                         (uint8_t *) &tmp, req->size);
                cpu_physical_memory_write(req->addr + (sign * i * req->size),
                                          (uint8_t *) &tmp, req->size);
            }
        }
    }
}

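/*
 * handle_ioreq() first truncates sub-word write data to the request size
 * (for example, a 1-byte write keeps only the low 8 bits), then
 * dispatches on the request type: port I/O, memory moves, time-offset
 * updates (ignored here), and mapcache invalidation.
 */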
static void handle_ioreq(ioreq_t *req)
{
    if (!req->data_is_ptr && (req->dir == IOREQ_WRITE) &&
            (req->size < sizeof (target_ulong))) {
        req->data &= ((target_ulong) 1 << (8 * req->size)) - 1;
    }

    switch (req->type) {
        case IOREQ_TYPE_PIO:
            cpu_ioreq_pio(req);
            break;
        case IOREQ_TYPE_COPY:
            cpu_ioreq_move(req);
            break;
        case IOREQ_TYPE_TIMEOFFSET:
            break;
        case IOREQ_TYPE_INVALIDATE:
            xen_invalidate_map_cache();
            break;
        default:
            hw_error("Invalid ioreq type 0x%x\n", req->type);
    }
}

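/*
 * Buffered requests are posted writes, typically to VRAM: Xen queues
 * them in a ring of buf_ioreq_t slots and expects no response. A 64-bit
 * value occupies two consecutive slots, low 32 bits first, which is why
 * the read pointer advances by two for qword-sized entries.
 */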
static void handle_buffered_iopage(XenIOState *state)
{
    buf_ioreq_t *buf_req = NULL;
    ioreq_t req;
    int qw;

    if (!state->buffered_io_page) {
        return;
    }

    while (state->buffered_io_page->read_pointer != state->buffered_io_page->write_pointer) {
        buf_req = &state->buffered_io_page->buf_ioreq[
            state->buffered_io_page->read_pointer % IOREQ_BUFFER_SLOT_NUM];
        req.size = 1UL << buf_req->size;
        req.count = 1;
        req.addr = buf_req->addr;
        req.data = buf_req->data;
        req.state = STATE_IOREQ_READY;
        req.dir = buf_req->dir;
        req.df = 1;
        req.type = buf_req->type;
        req.data_is_ptr = 0;
        qw = (req.size == 8);
        if (qw) {
            buf_req = &state->buffered_io_page->buf_ioreq[
                (state->buffered_io_page->read_pointer + 1) % IOREQ_BUFFER_SLOT_NUM];
            req.data |= ((uint64_t)buf_req->data) << 32;
        }

        handle_ioreq(&req);

        xen_mb();
        state->buffered_io_page->read_pointer += qw ? 2 : 1;
    }
}

|
732 |
static void handle_buffered_io(void *opaque) |
733 |
{ |
734 |
XenIOState *state = opaque; |
735 |
|
736 |
handle_buffered_iopage(state); |
737 |
qemu_mod_timer(state->buffered_io_timer, |
738 |
BUFFER_IO_MAX_DELAY + qemu_get_clock_ms(rt_clock)); |
739 |
} |
740 |
|
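/*
 * Main event-channel handler: drains the buffered-io ring, then serves
 * the synchronous request, with a write barrier between filling in the
 * response data and flipping the state to STATE_IORESP_READY, so the
 * notified vcpu never sees a ready response with stale contents.
 */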
static void cpu_handle_ioreq(void *opaque)
{
    XenIOState *state = opaque;
    ioreq_t *req = cpu_get_ioreq(state);

    handle_buffered_iopage(state);
    if (req) {
        handle_ioreq(req);

        if (req->state != STATE_IOREQ_INPROCESS) {
            fprintf(stderr, "Badness in I/O request ... not in service?!: "
                    "%x, ptr: %x, port: %"PRIx64", "
                    "data: %"PRIx64", count: %" FMT_ioreq_size ", size: %" FMT_ioreq_size "\n",
                    req->state, req->data_is_ptr, req->addr,
                    req->data, req->count, req->size);
            destroy_hvm_domain();
            return;
        }

        xen_wmb(); /* Update ioreq contents /then/ update state. */

        /*
         * We do this before we send the response so that the tools
         * have the opportunity to pick up on the reset before the
         * guest resumes and does a hlt with interrupts disabled which
         * causes Xen to powerdown the domain.
         */
        if (runstate_is_running()) {
            if (qemu_shutdown_requested_get()) {
                destroy_hvm_domain();
            }
            if (qemu_reset_requested_get()) {
                qemu_system_reset(VMRESET_REPORT);
            }
        }

        req->state = STATE_IORESP_READY;
        xc_evtchn_notify(state->xce_handle, state->ioreq_local_port[state->send_vcpu]);
    }
}

static int store_dev_info(int domid, CharDriverState *cs, const char *string)
{
    struct xs_handle *xs = NULL;
    char *path = NULL;
    char *newpath = NULL;
    char *pts = NULL;
    int ret = -1;

    /* Only continue if we're talking to a pty. */
    if (strncmp(cs->filename, "pty:", 4)) {
        return 0;
    }
    pts = cs->filename + 4;

    /* We now have everything we need to set the xenstore entry. */
    xs = xs_open(0);
    if (xs == NULL) {
        fprintf(stderr, "Could not contact XenStore\n");
        goto out;
    }

    path = xs_get_domain_path(xs, domid);
    if (path == NULL) {
        fprintf(stderr, "xs_get_domain_path() error\n");
        goto out;
    }
    newpath = realloc(path, (strlen(path) + strlen(string) +
                             strlen("/tty") + 1));
    if (newpath == NULL) {
        fprintf(stderr, "realloc error\n");
        goto out;
    }
    path = newpath;

    strcat(path, string);
    strcat(path, "/tty");
    if (!xs_write(xs, XBT_NULL, path, pts, strlen(pts))) {
        fprintf(stderr, "xs_write for '%s' failed\n", string);
        goto out;
    }
    ret = 0;

out:
    free(path);
    if (xs != NULL) {
        xs_close(xs);
    }

    return ret;
}

void xenstore_store_pv_console_info(int i, CharDriverState *chr)
{
    if (i == 0) {
        store_dev_info(xen_domid, chr, "/console");
    } else {
        char buf[32];
        snprintf(buf, sizeof(buf), "/device/console/%d", i);
        store_dev_info(xen_domid, chr, buf);
    }
}

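/*
 * For console 0 the function above ends up writing the pty device path
 * to /local/domain/<domid>/console/tty; higher-numbered consoles land
 * under /local/domain/<domid>/device/console/<i>/tty.
 */
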
static void xenstore_record_dm_state(struct xs_handle *xs, const char *state)
{
    char path[50];

    if (xs == NULL) {
        fprintf(stderr, "xenstore connection not initialized\n");
        exit(1);
    }

    snprintf(path, sizeof (path), "/local/domain/0/device-model/%u/state", xen_domid);
    if (!xs_write(xs, XBT_NULL, path, state, strlen(state))) {
        fprintf(stderr, "error recording dm state\n");
        exit(1);
    }
}

static void xen_main_loop_prepare(XenIOState *state)
{
    int evtchn_fd = -1;

    if (state->xce_handle != XC_HANDLER_INITIAL_VALUE) {
        evtchn_fd = xc_evtchn_fd(state->xce_handle);
    }

    state->buffered_io_timer = qemu_new_timer_ms(rt_clock, handle_buffered_io,
                                                 state);
    qemu_mod_timer(state->buffered_io_timer, qemu_get_clock_ms(rt_clock));

    if (evtchn_fd != -1) {
        qemu_set_fd_handler(evtchn_fd, cpu_handle_ioreq, NULL, state);
    }
}

/* Initialise Xen */

static void xen_change_state_handler(void *opaque, int running,
                                     RunState state)
{
    if (running) {
        /* record state running */
        xenstore_record_dm_state(xenstore, "running");
    }
}

static void xen_hvm_change_state_handler(void *opaque, int running,
                                         RunState rstate)
{
    XenIOState *xstate = opaque;
    if (running) {
        xen_main_loop_prepare(xstate);
    }
}

static void xen_exit_notifier(Notifier *n, void *data)
{
    XenIOState *state = container_of(n, XenIOState, exit);

    xc_evtchn_close(state->xce_handle);
    xs_daemon_close(state->xenstore);
}

int xen_init(void)
{
    xen_xc = xen_xc_interface_open(0, 0, 0);
    if (xen_xc == XC_HANDLER_INITIAL_VALUE) {
        xen_be_printf(NULL, 0, "can't open xen interface\n");
        return -1;
    }
    qemu_add_vm_change_state_handler(xen_change_state_handler, NULL);

    return 0;
}

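/*
 * xen_hvm_init() wires QEMU up as the device model for an HVM guest: it
 * maps the shared ioreq page and the buffered-io page from the domain,
 * binds one local event-channel port per vcpu, sets up RAM and the map
 * cache, and registers the memory listener plus the Xen backend drivers
 * (console, vkbd, qdisk).
 */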
int xen_hvm_init(void)
{
    int i, rc;
    unsigned long ioreq_pfn;
    XenIOState *state;

    state = g_malloc0(sizeof (XenIOState));

    state->xce_handle = xen_xc_evtchn_open(NULL, 0);
    if (state->xce_handle == XC_HANDLER_INITIAL_VALUE) {
        perror("xen: event channel open");
        return -errno;
    }

    state->xenstore = xs_daemon_open();
    if (state->xenstore == NULL) {
        perror("xen: xenstore open");
        return -errno;
    }

    state->exit.notify = xen_exit_notifier;
    qemu_add_exit_notifier(&state->exit);

    xc_get_hvm_param(xen_xc, xen_domid, HVM_PARAM_IOREQ_PFN, &ioreq_pfn);
    DPRINTF("shared page at pfn %lx\n", ioreq_pfn);
    state->shared_page = xc_map_foreign_range(xen_xc, xen_domid, XC_PAGE_SIZE,
                                              PROT_READ|PROT_WRITE, ioreq_pfn);
    if (state->shared_page == NULL) {
        hw_error("map shared IO page returned error %d handle=" XC_INTERFACE_FMT,
                 errno, xen_xc);
    }

    xc_get_hvm_param(xen_xc, xen_domid, HVM_PARAM_BUFIOREQ_PFN, &ioreq_pfn);
    DPRINTF("buffered io page at pfn %lx\n", ioreq_pfn);
    state->buffered_io_page = xc_map_foreign_range(xen_xc, xen_domid, XC_PAGE_SIZE,
                                                   PROT_READ|PROT_WRITE, ioreq_pfn);
    if (state->buffered_io_page == NULL) {
        hw_error("map buffered IO page returned error %d", errno);
    }

    state->ioreq_local_port = g_malloc0(smp_cpus * sizeof (evtchn_port_t));

    /* FIXME: how about if we overflow the page here? */
    for (i = 0; i < smp_cpus; i++) {
        rc = xc_evtchn_bind_interdomain(state->xce_handle, xen_domid,
                                        xen_vcpu_eport(state->shared_page, i));
        if (rc == -1) {
            fprintf(stderr, "bind interdomain ioctl error %d\n", errno);
            return -1;
        }
        state->ioreq_local_port[i] = rc;
    }

    /* Init RAM management */
    xen_map_cache_init();
    xen_ram_init(ram_size);

    qemu_add_vm_change_state_handler(xen_hvm_change_state_handler, state);

    state->memory_listener = xen_memory_listener;
    QLIST_INIT(&state->physmap);
    memory_listener_register(&state->memory_listener);
    state->log_for_dirtybit = NULL;

    /* Initialize backend core & drivers */
    if (xen_be_init() != 0) {
        fprintf(stderr, "%s: xen backend core setup failed\n", __FUNCTION__);
        exit(1);
    }
    xen_be_register("console", &xen_console_ops);
    xen_be_register("vkbd", &xen_kbdmouse_ops);
    xen_be_register("qdisk", &xen_blkdev_ops);

    return 0;
}

void destroy_hvm_domain(void)
{
    XenXC xc_handle;
    int sts;

    xc_handle = xen_xc_interface_open(0, 0, 0);
    if (xc_handle == XC_HANDLER_INITIAL_VALUE) {
        fprintf(stderr, "Cannot acquire xenctrl handle\n");
    } else {
        sts = xc_domain_shutdown(xc_handle, xen_domid, SHUTDOWN_poweroff);
        if (sts != 0) {
            fprintf(stderr, "xc_domain_shutdown failed to issue poweroff, "
                    "sts %d, %s\n", sts, strerror(errno));
        } else {
            fprintf(stderr, "Issued domain %d poweroff\n", xen_domid);
        }
        xc_interface_close(xc_handle);
    }
}

void xen_register_framebuffer(MemoryRegion *mr)
{
    framebuffer = mr;
}