root / xen-all.c @ dbfe06c6
History | View | Annotate | Download (28.9 kB)
1 |
/*
|
---|---|
2 |
* Copyright (C) 2010 Citrix Ltd.
|
3 |
*
|
4 |
* This work is licensed under the terms of the GNU GPL, version 2. See
|
5 |
* the COPYING file in the top-level directory.
|
6 |
*
|
7 |
*/
|
8 |
|
9 |
#include <sys/mman.h> |
10 |
|
11 |
#include "hw/pci.h" |
12 |
#include "hw/pc.h" |
13 |
#include "hw/xen_common.h" |
14 |
#include "hw/xen_backend.h" |
15 |
|
16 |
#include "range.h" |
17 |
#include "xen-mapcache.h" |
18 |
#include "trace.h" |
19 |
#include "exec-memory.h" |
20 |
|
21 |
#include <xen/hvm/ioreq.h> |
22 |
#include <xen/hvm/params.h> |
23 |
#include <xen/hvm/e820.h> |
24 |
|
25 |
//#define DEBUG_XEN
|
26 |
|
27 |
#ifdef DEBUG_XEN
|
28 |
#define DPRINTF(fmt, ...) \
|
29 |
do { fprintf(stderr, "xen: " fmt, ## __VA_ARGS__); } while (0) |
30 |
#else
|
31 |
#define DPRINTF(fmt, ...) \
|
32 |
do { } while (0) |
33 |
#endif
|
34 |
|
35 |
static MemoryRegion ram_memory, ram_640k, ram_lo, ram_hi;
|
36 |
static MemoryRegion *framebuffer;
|
37 |
|
38 |
/* Compatibility with older version */
|
39 |
#if __XEN_LATEST_INTERFACE_VERSION__ < 0x0003020a |
40 |
static inline uint32_t xen_vcpu_eport(shared_iopage_t *shared_page, int i) |
41 |
{ |
42 |
return shared_page->vcpu_iodata[i].vp_eport;
|
43 |
} |
44 |
static inline ioreq_t *xen_vcpu_ioreq(shared_iopage_t *shared_page, int vcpu) |
45 |
{ |
46 |
return &shared_page->vcpu_iodata[vcpu].vp_ioreq;
|
47 |
} |
48 |
# define FMT_ioreq_size PRIx64
|
49 |
#else
|
50 |
static inline uint32_t xen_vcpu_eport(shared_iopage_t *shared_page, int i) |
51 |
{ |
52 |
return shared_page->vcpu_ioreq[i].vp_eport;
|
53 |
} |
54 |
static inline ioreq_t *xen_vcpu_ioreq(shared_iopage_t *shared_page, int vcpu) |
55 |
{ |
56 |
return &shared_page->vcpu_ioreq[vcpu];
|
57 |
} |
58 |
# define FMT_ioreq_size "u" |
59 |
#endif
|
60 |
|
61 |
#define BUFFER_IO_MAX_DELAY 100 |
62 |
|
63 |
typedef struct XenPhysmap { |
64 |
target_phys_addr_t start_addr; |
65 |
ram_addr_t size; |
66 |
MemoryRegion *mr; |
67 |
target_phys_addr_t phys_offset; |
68 |
|
69 |
QLIST_ENTRY(XenPhysmap) list; |
70 |
} XenPhysmap; |
71 |
|
72 |
typedef struct XenIOState { |
73 |
shared_iopage_t *shared_page; |
74 |
buffered_iopage_t *buffered_io_page; |
75 |
QEMUTimer *buffered_io_timer; |
76 |
/* the evtchn port for polling the notification, */
|
77 |
evtchn_port_t *ioreq_local_port; |
78 |
/* the evtchn fd for polling */
|
79 |
XenEvtchn xce_handle; |
80 |
/* which vcpu we are serving */
|
81 |
int send_vcpu;
|
82 |
|
83 |
struct xs_handle *xenstore;
|
84 |
MemoryListener memory_listener; |
85 |
QLIST_HEAD(, XenPhysmap) physmap; |
86 |
target_phys_addr_t free_phys_offset; |
87 |
const XenPhysmap *log_for_dirtybit;
|
88 |
|
89 |
Notifier exit; |
90 |
} XenIOState; |
91 |
|
92 |
/* Xen specific function for piix pci */
|
93 |
|
94 |
int xen_pci_slot_get_pirq(PCIDevice *pci_dev, int irq_num) |
95 |
{ |
96 |
return irq_num + ((pci_dev->devfn >> 3) << 2); |
97 |
} |
98 |
|
99 |
void xen_piix3_set_irq(void *opaque, int irq_num, int level) |
100 |
{ |
101 |
xc_hvm_set_pci_intx_level(xen_xc, xen_domid, 0, 0, irq_num >> 2, |
102 |
irq_num & 3, level);
|
103 |
} |
104 |
|
105 |
void xen_piix_pci_write_config_client(uint32_t address, uint32_t val, int len) |
106 |
{ |
107 |
int i;
|
108 |
|
109 |
/* Scan for updates to PCI link routes (0x60-0x63). */
|
110 |
for (i = 0; i < len; i++) { |
111 |
uint8_t v = (val >> (8 * i)) & 0xff; |
112 |
if (v & 0x80) { |
113 |
v = 0;
|
114 |
} |
115 |
v &= 0xf;
|
116 |
if (((address + i) >= 0x60) && ((address + i) <= 0x63)) { |
117 |
xc_hvm_set_pci_link_route(xen_xc, xen_domid, address + i - 0x60, v);
|
118 |
} |
119 |
} |
120 |
} |
121 |
|
122 |
void xen_cmos_set_s3_resume(void *opaque, int irq, int level) |
123 |
{ |
124 |
pc_cmos_set_s3_resume(opaque, irq, level); |
125 |
if (level) {
|
126 |
xc_set_hvm_param(xen_xc, xen_domid, HVM_PARAM_ACPI_S_STATE, 3);
|
127 |
} |
128 |
} |
129 |
|
130 |
/* Xen Interrupt Controller */
|
131 |
|
132 |
static void xen_set_irq(void *opaque, int irq, int level) |
133 |
{ |
134 |
xc_hvm_set_isa_irq_level(xen_xc, xen_domid, irq, level); |
135 |
} |
136 |
|
137 |
qemu_irq *xen_interrupt_controller_init(void)
|
138 |
{ |
139 |
return qemu_allocate_irqs(xen_set_irq, NULL, 16); |
140 |
} |
141 |
|
142 |
/* Memory Ops */
|
143 |
|
144 |
static void xen_ram_init(ram_addr_t ram_size) |
145 |
{ |
146 |
MemoryRegion *sysmem = get_system_memory(); |
147 |
ram_addr_t below_4g_mem_size, above_4g_mem_size = 0;
|
148 |
ram_addr_t block_len; |
149 |
|
150 |
block_len = ram_size; |
151 |
if (ram_size >= HVM_BELOW_4G_RAM_END) {
|
152 |
/* Xen does not allocate the memory continuously, and keep a hole at
|
153 |
* HVM_BELOW_4G_MMIO_START of HVM_BELOW_4G_MMIO_LENGTH
|
154 |
*/
|
155 |
block_len += HVM_BELOW_4G_MMIO_LENGTH; |
156 |
} |
157 |
memory_region_init_ram(&ram_memory, "xen.ram", block_len);
|
158 |
vmstate_register_ram_global(&ram_memory); |
159 |
|
160 |
if (ram_size >= HVM_BELOW_4G_RAM_END) {
|
161 |
above_4g_mem_size = ram_size - HVM_BELOW_4G_RAM_END; |
162 |
below_4g_mem_size = HVM_BELOW_4G_RAM_END; |
163 |
} else {
|
164 |
below_4g_mem_size = ram_size; |
165 |
} |
166 |
|
167 |
memory_region_init_alias(&ram_640k, "xen.ram.640k",
|
168 |
&ram_memory, 0, 0xa0000); |
169 |
memory_region_add_subregion(sysmem, 0, &ram_640k);
|
170 |
/* Skip of the VGA IO memory space, it will be registered later by the VGA
|
171 |
* emulated device.
|
172 |
*
|
173 |
* The area between 0xc0000 and 0x100000 will be used by SeaBIOS to load
|
174 |
* the Options ROM, so it is registered here as RAM.
|
175 |
*/
|
176 |
memory_region_init_alias(&ram_lo, "xen.ram.lo",
|
177 |
&ram_memory, 0xc0000, below_4g_mem_size - 0xc0000); |
178 |
memory_region_add_subregion(sysmem, 0xc0000, &ram_lo);
|
179 |
if (above_4g_mem_size > 0) { |
180 |
memory_region_init_alias(&ram_hi, "xen.ram.hi",
|
181 |
&ram_memory, 0x100000000ULL,
|
182 |
above_4g_mem_size); |
183 |
memory_region_add_subregion(sysmem, 0x100000000ULL, &ram_hi);
|
184 |
} |
185 |
} |
186 |
|
187 |
void xen_ram_alloc(ram_addr_t ram_addr, ram_addr_t size, MemoryRegion *mr)
|
188 |
{ |
189 |
unsigned long nr_pfn; |
190 |
xen_pfn_t *pfn_list; |
191 |
int i;
|
192 |
|
193 |
if (mr == &ram_memory) {
|
194 |
return;
|
195 |
} |
196 |
|
197 |
trace_xen_ram_alloc(ram_addr, size); |
198 |
|
199 |
nr_pfn = size >> TARGET_PAGE_BITS; |
200 |
pfn_list = g_malloc(sizeof (*pfn_list) * nr_pfn);
|
201 |
|
202 |
for (i = 0; i < nr_pfn; i++) { |
203 |
pfn_list[i] = (ram_addr >> TARGET_PAGE_BITS) + i; |
204 |
} |
205 |
|
206 |
if (xc_domain_populate_physmap_exact(xen_xc, xen_domid, nr_pfn, 0, 0, pfn_list)) { |
207 |
hw_error("xen: failed to populate ram at " RAM_ADDR_FMT, ram_addr);
|
208 |
} |
209 |
|
210 |
g_free(pfn_list); |
211 |
} |
212 |
|
213 |
static XenPhysmap *get_physmapping(XenIOState *state,
|
214 |
target_phys_addr_t start_addr, ram_addr_t size) |
215 |
{ |
216 |
XenPhysmap *physmap = NULL;
|
217 |
|
218 |
start_addr &= TARGET_PAGE_MASK; |
219 |
|
220 |
QLIST_FOREACH(physmap, &state->physmap, list) { |
221 |
if (range_covers_byte(physmap->start_addr, physmap->size, start_addr)) {
|
222 |
return physmap;
|
223 |
} |
224 |
} |
225 |
return NULL; |
226 |
} |
227 |
|
228 |
#if CONFIG_XEN_CTRL_INTERFACE_VERSION >= 340 |
229 |
static int xen_add_to_physmap(XenIOState *state, |
230 |
target_phys_addr_t start_addr, |
231 |
ram_addr_t size, |
232 |
MemoryRegion *mr, |
233 |
target_phys_addr_t offset_within_region) |
234 |
{ |
235 |
unsigned long i = 0; |
236 |
int rc = 0; |
237 |
XenPhysmap *physmap = NULL;
|
238 |
target_phys_addr_t pfn, start_gpfn; |
239 |
target_phys_addr_t phys_offset = memory_region_get_ram_addr(mr); |
240 |
|
241 |
if (get_physmapping(state, start_addr, size)) {
|
242 |
return 0; |
243 |
} |
244 |
if (size <= 0) { |
245 |
return -1; |
246 |
} |
247 |
|
248 |
/* Xen can only handle a single dirty log region for now and we want
|
249 |
* the linear framebuffer to be that region.
|
250 |
* Avoid tracking any regions that is not videoram and avoid tracking
|
251 |
* the legacy vga region. */
|
252 |
if (mr == framebuffer && start_addr > 0xbffff) { |
253 |
goto go_physmap;
|
254 |
} |
255 |
return -1; |
256 |
|
257 |
go_physmap:
|
258 |
DPRINTF("mapping vram to %llx - %llx\n", start_addr, start_addr + size);
|
259 |
|
260 |
pfn = phys_offset >> TARGET_PAGE_BITS; |
261 |
start_gpfn = start_addr >> TARGET_PAGE_BITS; |
262 |
for (i = 0; i < size >> TARGET_PAGE_BITS; i++) { |
263 |
unsigned long idx = pfn + i; |
264 |
xen_pfn_t gpfn = start_gpfn + i; |
265 |
|
266 |
rc = xc_domain_add_to_physmap(xen_xc, xen_domid, XENMAPSPACE_gmfn, idx, gpfn); |
267 |
if (rc) {
|
268 |
DPRINTF("add_to_physmap MFN %"PRI_xen_pfn" to PFN %" |
269 |
PRI_xen_pfn" failed: %d\n", idx, gpfn, rc);
|
270 |
return -rc;
|
271 |
} |
272 |
} |
273 |
|
274 |
physmap = g_malloc(sizeof (XenPhysmap));
|
275 |
|
276 |
physmap->start_addr = start_addr; |
277 |
physmap->size = size; |
278 |
physmap->phys_offset = phys_offset; |
279 |
|
280 |
QLIST_INSERT_HEAD(&state->physmap, physmap, list); |
281 |
|
282 |
xc_domain_pin_memory_cacheattr(xen_xc, xen_domid, |
283 |
start_addr >> TARGET_PAGE_BITS, |
284 |
(start_addr + size) >> TARGET_PAGE_BITS, |
285 |
XEN_DOMCTL_MEM_CACHEATTR_WB); |
286 |
return 0; |
287 |
} |
288 |
|
289 |
static int xen_remove_from_physmap(XenIOState *state, |
290 |
target_phys_addr_t start_addr, |
291 |
ram_addr_t size) |
292 |
{ |
293 |
unsigned long i = 0; |
294 |
int rc = 0; |
295 |
XenPhysmap *physmap = NULL;
|
296 |
target_phys_addr_t phys_offset = 0;
|
297 |
|
298 |
physmap = get_physmapping(state, start_addr, size); |
299 |
if (physmap == NULL) { |
300 |
return -1; |
301 |
} |
302 |
|
303 |
phys_offset = physmap->phys_offset; |
304 |
size = physmap->size; |
305 |
|
306 |
DPRINTF("unmapping vram to %llx - %llx, from %llx\n",
|
307 |
phys_offset, phys_offset + size, start_addr); |
308 |
|
309 |
size >>= TARGET_PAGE_BITS; |
310 |
start_addr >>= TARGET_PAGE_BITS; |
311 |
phys_offset >>= TARGET_PAGE_BITS; |
312 |
for (i = 0; i < size; i++) { |
313 |
unsigned long idx = start_addr + i; |
314 |
xen_pfn_t gpfn = phys_offset + i; |
315 |
|
316 |
rc = xc_domain_add_to_physmap(xen_xc, xen_domid, XENMAPSPACE_gmfn, idx, gpfn); |
317 |
if (rc) {
|
318 |
fprintf(stderr, "add_to_physmap MFN %"PRI_xen_pfn" to PFN %" |
319 |
PRI_xen_pfn" failed: %d\n", idx, gpfn, rc);
|
320 |
return -rc;
|
321 |
} |
322 |
} |
323 |
|
324 |
QLIST_REMOVE(physmap, list); |
325 |
if (state->log_for_dirtybit == physmap) {
|
326 |
state->log_for_dirtybit = NULL;
|
327 |
} |
328 |
free(physmap); |
329 |
|
330 |
return 0; |
331 |
} |
332 |
|
333 |
#else
|
334 |
static int xen_add_to_physmap(XenIOState *state, |
335 |
target_phys_addr_t start_addr, |
336 |
ram_addr_t size, |
337 |
MemoryRegion *mr, |
338 |
target_phys_addr_t offset_within_region) |
339 |
{ |
340 |
return -ENOSYS;
|
341 |
} |
342 |
|
343 |
static int xen_remove_from_physmap(XenIOState *state, |
344 |
target_phys_addr_t start_addr, |
345 |
ram_addr_t size) |
346 |
{ |
347 |
return -ENOSYS;
|
348 |
} |
349 |
#endif
|
350 |
|
351 |
static void xen_set_memory(struct MemoryListener *listener, |
352 |
MemoryRegionSection *section, |
353 |
bool add)
|
354 |
{ |
355 |
XenIOState *state = container_of(listener, XenIOState, memory_listener); |
356 |
target_phys_addr_t start_addr = section->offset_within_address_space; |
357 |
ram_addr_t size = section->size; |
358 |
bool log_dirty = memory_region_is_logging(section->mr);
|
359 |
hvmmem_type_t mem_type; |
360 |
|
361 |
if (!memory_region_is_ram(section->mr)) {
|
362 |
return;
|
363 |
} |
364 |
|
365 |
if (!(section->mr != &ram_memory
|
366 |
&& ( (log_dirty && add) || (!log_dirty && !add)))) { |
367 |
return;
|
368 |
} |
369 |
|
370 |
trace_xen_client_set_memory(start_addr, size, log_dirty); |
371 |
|
372 |
start_addr &= TARGET_PAGE_MASK; |
373 |
size = TARGET_PAGE_ALIGN(size); |
374 |
|
375 |
if (add) {
|
376 |
if (!memory_region_is_rom(section->mr)) {
|
377 |
xen_add_to_physmap(state, start_addr, size, |
378 |
section->mr, section->offset_within_region); |
379 |
} else {
|
380 |
mem_type = HVMMEM_ram_ro; |
381 |
if (xc_hvm_set_mem_type(xen_xc, xen_domid, mem_type,
|
382 |
start_addr >> TARGET_PAGE_BITS, |
383 |
size >> TARGET_PAGE_BITS)) { |
384 |
DPRINTF("xc_hvm_set_mem_type error, addr: "TARGET_FMT_plx"\n", |
385 |
start_addr); |
386 |
} |
387 |
} |
388 |
} else {
|
389 |
if (xen_remove_from_physmap(state, start_addr, size) < 0) { |
390 |
DPRINTF("physmapping does not exist at "TARGET_FMT_plx"\n", start_addr); |
391 |
} |
392 |
} |
393 |
} |
394 |
|
395 |
static void xen_region_add(MemoryListener *listener, |
396 |
MemoryRegionSection *section) |
397 |
{ |
398 |
xen_set_memory(listener, section, true);
|
399 |
} |
400 |
|
401 |
static void xen_region_del(MemoryListener *listener, |
402 |
MemoryRegionSection *section) |
403 |
{ |
404 |
xen_set_memory(listener, section, false);
|
405 |
} |
406 |
|
407 |
static void xen_sync_dirty_bitmap(XenIOState *state, |
408 |
target_phys_addr_t start_addr, |
409 |
ram_addr_t size) |
410 |
{ |
411 |
target_phys_addr_t npages = size >> TARGET_PAGE_BITS; |
412 |
const int width = sizeof(unsigned long) * 8; |
413 |
unsigned long bitmap[(npages + width - 1) / width]; |
414 |
int rc, i, j;
|
415 |
const XenPhysmap *physmap = NULL; |
416 |
|
417 |
physmap = get_physmapping(state, start_addr, size); |
418 |
if (physmap == NULL) { |
419 |
/* not handled */
|
420 |
return;
|
421 |
} |
422 |
|
423 |
if (state->log_for_dirtybit == NULL) { |
424 |
state->log_for_dirtybit = physmap; |
425 |
} else if (state->log_for_dirtybit != physmap) { |
426 |
/* Only one range for dirty bitmap can be tracked. */
|
427 |
return;
|
428 |
} |
429 |
|
430 |
rc = xc_hvm_track_dirty_vram(xen_xc, xen_domid, |
431 |
start_addr >> TARGET_PAGE_BITS, npages, |
432 |
bitmap); |
433 |
if (rc < 0) { |
434 |
if (rc != -ENODATA) {
|
435 |
fprintf(stderr, "xen: track_dirty_vram failed (0x" TARGET_FMT_plx
|
436 |
", 0x" TARGET_FMT_plx "): %s\n", |
437 |
start_addr, start_addr + size, strerror(-rc)); |
438 |
} |
439 |
return;
|
440 |
} |
441 |
|
442 |
for (i = 0; i < ARRAY_SIZE(bitmap); i++) { |
443 |
unsigned long map = bitmap[i]; |
444 |
while (map != 0) { |
445 |
j = ffsl(map) - 1;
|
446 |
map &= ~(1ul << j);
|
447 |
memory_region_set_dirty(framebuffer, |
448 |
(i * width + j) * TARGET_PAGE_SIZE); |
449 |
}; |
450 |
} |
451 |
} |
452 |
|
453 |
static void xen_log_start(MemoryListener *listener, |
454 |
MemoryRegionSection *section) |
455 |
{ |
456 |
XenIOState *state = container_of(listener, XenIOState, memory_listener); |
457 |
|
458 |
xen_sync_dirty_bitmap(state, section->offset_within_address_space, |
459 |
section->size); |
460 |
} |
461 |
|
462 |
static void xen_log_stop(MemoryListener *listener, MemoryRegionSection *section) |
463 |
{ |
464 |
XenIOState *state = container_of(listener, XenIOState, memory_listener); |
465 |
|
466 |
state->log_for_dirtybit = NULL;
|
467 |
/* Disable dirty bit tracking */
|
468 |
xc_hvm_track_dirty_vram(xen_xc, xen_domid, 0, 0, NULL); |
469 |
} |
470 |
|
471 |
static void xen_log_sync(MemoryListener *listener, MemoryRegionSection *section) |
472 |
{ |
473 |
XenIOState *state = container_of(listener, XenIOState, memory_listener); |
474 |
|
475 |
xen_sync_dirty_bitmap(state, section->offset_within_address_space, |
476 |
section->size); |
477 |
} |
478 |
|
479 |
static void xen_log_global_start(MemoryListener *listener) |
480 |
{ |
481 |
} |
482 |
|
483 |
static void xen_log_global_stop(MemoryListener *listener) |
484 |
{ |
485 |
} |
486 |
|
487 |
static MemoryListener xen_memory_listener = {
|
488 |
.region_add = xen_region_add, |
489 |
.region_del = xen_region_del, |
490 |
.log_start = xen_log_start, |
491 |
.log_stop = xen_log_stop, |
492 |
.log_sync = xen_log_sync, |
493 |
.log_global_start = xen_log_global_start, |
494 |
.log_global_stop = xen_log_global_stop, |
495 |
}; |
496 |
|
497 |
/* VCPU Operations, MMIO, IO ring ... */
|
498 |
|
499 |
static void xen_reset_vcpu(void *opaque) |
500 |
{ |
501 |
CPUState *env = opaque; |
502 |
|
503 |
env->halted = 1;
|
504 |
} |
505 |
|
506 |
void xen_vcpu_init(void) |
507 |
{ |
508 |
CPUState *first_cpu; |
509 |
|
510 |
if ((first_cpu = qemu_get_cpu(0))) { |
511 |
qemu_register_reset(xen_reset_vcpu, first_cpu); |
512 |
xen_reset_vcpu(first_cpu); |
513 |
} |
514 |
} |
515 |
|
516 |
/* get the ioreq packets from share mem */
|
517 |
static ioreq_t *cpu_get_ioreq_from_shared_memory(XenIOState *state, int vcpu) |
518 |
{ |
519 |
ioreq_t *req = xen_vcpu_ioreq(state->shared_page, vcpu); |
520 |
|
521 |
if (req->state != STATE_IOREQ_READY) {
|
522 |
DPRINTF("I/O request not ready: "
|
523 |
"%x, ptr: %x, port: %"PRIx64", " |
524 |
"data: %"PRIx64", count: %" FMT_ioreq_size ", size: %" FMT_ioreq_size "\n", |
525 |
req->state, req->data_is_ptr, req->addr, |
526 |
req->data, req->count, req->size); |
527 |
return NULL; |
528 |
} |
529 |
|
530 |
xen_rmb(); /* see IOREQ_READY /then/ read contents of ioreq */
|
531 |
|
532 |
req->state = STATE_IOREQ_INPROCESS; |
533 |
return req;
|
534 |
} |
535 |
|
536 |
/* use poll to get the port notification */
|
537 |
/* ioreq_vec--out,the */
|
538 |
/* retval--the number of ioreq packet */
|
539 |
static ioreq_t *cpu_get_ioreq(XenIOState *state)
|
540 |
{ |
541 |
int i;
|
542 |
evtchn_port_t port; |
543 |
|
544 |
port = xc_evtchn_pending(state->xce_handle); |
545 |
if (port != -1) { |
546 |
for (i = 0; i < smp_cpus; i++) { |
547 |
if (state->ioreq_local_port[i] == port) {
|
548 |
break;
|
549 |
} |
550 |
} |
551 |
|
552 |
if (i == smp_cpus) {
|
553 |
hw_error("Fatal error while trying to get io event!\n");
|
554 |
} |
555 |
|
556 |
/* unmask the wanted port again */
|
557 |
xc_evtchn_unmask(state->xce_handle, port); |
558 |
|
559 |
/* get the io packet from shared memory */
|
560 |
state->send_vcpu = i; |
561 |
return cpu_get_ioreq_from_shared_memory(state, i);
|
562 |
} |
563 |
|
564 |
/* read error or read nothing */
|
565 |
return NULL; |
566 |
} |
567 |
|
568 |
static uint32_t do_inp(pio_addr_t addr, unsigned long size) |
569 |
{ |
570 |
switch (size) {
|
571 |
case 1: |
572 |
return cpu_inb(addr);
|
573 |
case 2: |
574 |
return cpu_inw(addr);
|
575 |
case 4: |
576 |
return cpu_inl(addr);
|
577 |
default:
|
578 |
hw_error("inp: bad size: %04"FMT_pioaddr" %lx", addr, size); |
579 |
} |
580 |
} |
581 |
|
582 |
static void do_outp(pio_addr_t addr, |
583 |
unsigned long size, uint32_t val) |
584 |
{ |
585 |
switch (size) {
|
586 |
case 1: |
587 |
return cpu_outb(addr, val);
|
588 |
case 2: |
589 |
return cpu_outw(addr, val);
|
590 |
case 4: |
591 |
return cpu_outl(addr, val);
|
592 |
default:
|
593 |
hw_error("outp: bad size: %04"FMT_pioaddr" %lx", addr, size); |
594 |
} |
595 |
} |
596 |
|
597 |
static void cpu_ioreq_pio(ioreq_t *req) |
598 |
{ |
599 |
int i, sign;
|
600 |
|
601 |
sign = req->df ? -1 : 1; |
602 |
|
603 |
if (req->dir == IOREQ_READ) {
|
604 |
if (!req->data_is_ptr) {
|
605 |
req->data = do_inp(req->addr, req->size); |
606 |
} else {
|
607 |
uint32_t tmp; |
608 |
|
609 |
for (i = 0; i < req->count; i++) { |
610 |
tmp = do_inp(req->addr, req->size); |
611 |
cpu_physical_memory_write(req->data + (sign * i * req->size), |
612 |
(uint8_t *) &tmp, req->size); |
613 |
} |
614 |
} |
615 |
} else if (req->dir == IOREQ_WRITE) { |
616 |
if (!req->data_is_ptr) {
|
617 |
do_outp(req->addr, req->size, req->data); |
618 |
} else {
|
619 |
for (i = 0; i < req->count; i++) { |
620 |
uint32_t tmp = 0;
|
621 |
|
622 |
cpu_physical_memory_read(req->data + (sign * i * req->size), |
623 |
(uint8_t*) &tmp, req->size); |
624 |
do_outp(req->addr, req->size, tmp); |
625 |
} |
626 |
} |
627 |
} |
628 |
} |
629 |
|
630 |
static void cpu_ioreq_move(ioreq_t *req) |
631 |
{ |
632 |
int i, sign;
|
633 |
|
634 |
sign = req->df ? -1 : 1; |
635 |
|
636 |
if (!req->data_is_ptr) {
|
637 |
if (req->dir == IOREQ_READ) {
|
638 |
for (i = 0; i < req->count; i++) { |
639 |
cpu_physical_memory_read(req->addr + (sign * i * req->size), |
640 |
(uint8_t *) &req->data, req->size); |
641 |
} |
642 |
} else if (req->dir == IOREQ_WRITE) { |
643 |
for (i = 0; i < req->count; i++) { |
644 |
cpu_physical_memory_write(req->addr + (sign * i * req->size), |
645 |
(uint8_t *) &req->data, req->size); |
646 |
} |
647 |
} |
648 |
} else {
|
649 |
uint64_t tmp; |
650 |
|
651 |
if (req->dir == IOREQ_READ) {
|
652 |
for (i = 0; i < req->count; i++) { |
653 |
cpu_physical_memory_read(req->addr + (sign * i * req->size), |
654 |
(uint8_t*) &tmp, req->size); |
655 |
cpu_physical_memory_write(req->data + (sign * i * req->size), |
656 |
(uint8_t*) &tmp, req->size); |
657 |
} |
658 |
} else if (req->dir == IOREQ_WRITE) { |
659 |
for (i = 0; i < req->count; i++) { |
660 |
cpu_physical_memory_read(req->data + (sign * i * req->size), |
661 |
(uint8_t*) &tmp, req->size); |
662 |
cpu_physical_memory_write(req->addr + (sign * i * req->size), |
663 |
(uint8_t*) &tmp, req->size); |
664 |
} |
665 |
} |
666 |
} |
667 |
} |
668 |
|
669 |
static void handle_ioreq(ioreq_t *req) |
670 |
{ |
671 |
if (!req->data_is_ptr && (req->dir == IOREQ_WRITE) &&
|
672 |
(req->size < sizeof (target_ulong))) {
|
673 |
req->data &= ((target_ulong) 1 << (8 * req->size)) - 1; |
674 |
} |
675 |
|
676 |
switch (req->type) {
|
677 |
case IOREQ_TYPE_PIO:
|
678 |
cpu_ioreq_pio(req); |
679 |
break;
|
680 |
case IOREQ_TYPE_COPY:
|
681 |
cpu_ioreq_move(req); |
682 |
break;
|
683 |
case IOREQ_TYPE_TIMEOFFSET:
|
684 |
break;
|
685 |
case IOREQ_TYPE_INVALIDATE:
|
686 |
xen_invalidate_map_cache(); |
687 |
break;
|
688 |
default:
|
689 |
hw_error("Invalid ioreq type 0x%x\n", req->type);
|
690 |
} |
691 |
} |
692 |
|
693 |
static void handle_buffered_iopage(XenIOState *state) |
694 |
{ |
695 |
buf_ioreq_t *buf_req = NULL;
|
696 |
ioreq_t req; |
697 |
int qw;
|
698 |
|
699 |
if (!state->buffered_io_page) {
|
700 |
return;
|
701 |
} |
702 |
|
703 |
while (state->buffered_io_page->read_pointer != state->buffered_io_page->write_pointer) {
|
704 |
buf_req = &state->buffered_io_page->buf_ioreq[ |
705 |
state->buffered_io_page->read_pointer % IOREQ_BUFFER_SLOT_NUM]; |
706 |
req.size = 1UL << buf_req->size;
|
707 |
req.count = 1;
|
708 |
req.addr = buf_req->addr; |
709 |
req.data = buf_req->data; |
710 |
req.state = STATE_IOREQ_READY; |
711 |
req.dir = buf_req->dir; |
712 |
req.df = 1;
|
713 |
req.type = buf_req->type; |
714 |
req.data_is_ptr = 0;
|
715 |
qw = (req.size == 8);
|
716 |
if (qw) {
|
717 |
buf_req = &state->buffered_io_page->buf_ioreq[ |
718 |
(state->buffered_io_page->read_pointer + 1) % IOREQ_BUFFER_SLOT_NUM];
|
719 |
req.data |= ((uint64_t)buf_req->data) << 32;
|
720 |
} |
721 |
|
722 |
handle_ioreq(&req); |
723 |
|
724 |
xen_mb(); |
725 |
state->buffered_io_page->read_pointer += qw ? 2 : 1; |
726 |
} |
727 |
} |
728 |
|
729 |
static void handle_buffered_io(void *opaque) |
730 |
{ |
731 |
XenIOState *state = opaque; |
732 |
|
733 |
handle_buffered_iopage(state); |
734 |
qemu_mod_timer(state->buffered_io_timer, |
735 |
BUFFER_IO_MAX_DELAY + qemu_get_clock_ms(rt_clock)); |
736 |
} |
737 |
|
738 |
static void cpu_handle_ioreq(void *opaque) |
739 |
{ |
740 |
XenIOState *state = opaque; |
741 |
ioreq_t *req = cpu_get_ioreq(state); |
742 |
|
743 |
handle_buffered_iopage(state); |
744 |
if (req) {
|
745 |
handle_ioreq(req); |
746 |
|
747 |
if (req->state != STATE_IOREQ_INPROCESS) {
|
748 |
fprintf(stderr, "Badness in I/O request ... not in service?!: "
|
749 |
"%x, ptr: %x, port: %"PRIx64", " |
750 |
"data: %"PRIx64", count: %" FMT_ioreq_size ", size: %" FMT_ioreq_size "\n", |
751 |
req->state, req->data_is_ptr, req->addr, |
752 |
req->data, req->count, req->size); |
753 |
destroy_hvm_domain(); |
754 |
return;
|
755 |
} |
756 |
|
757 |
xen_wmb(); /* Update ioreq contents /then/ update state. */
|
758 |
|
759 |
/*
|
760 |
* We do this before we send the response so that the tools
|
761 |
* have the opportunity to pick up on the reset before the
|
762 |
* guest resumes and does a hlt with interrupts disabled which
|
763 |
* causes Xen to powerdown the domain.
|
764 |
*/
|
765 |
if (runstate_is_running()) {
|
766 |
if (qemu_shutdown_requested_get()) {
|
767 |
destroy_hvm_domain(); |
768 |
} |
769 |
if (qemu_reset_requested_get()) {
|
770 |
qemu_system_reset(VMRESET_REPORT); |
771 |
} |
772 |
} |
773 |
|
774 |
req->state = STATE_IORESP_READY; |
775 |
xc_evtchn_notify(state->xce_handle, state->ioreq_local_port[state->send_vcpu]); |
776 |
} |
777 |
} |
778 |
|
779 |
static int store_dev_info(int domid, CharDriverState *cs, const char *string) |
780 |
{ |
781 |
struct xs_handle *xs = NULL; |
782 |
char *path = NULL; |
783 |
char *newpath = NULL; |
784 |
char *pts = NULL; |
785 |
int ret = -1; |
786 |
|
787 |
/* Only continue if we're talking to a pty. */
|
788 |
if (strncmp(cs->filename, "pty:", 4)) { |
789 |
return 0; |
790 |
} |
791 |
pts = cs->filename + 4;
|
792 |
|
793 |
/* We now have everything we need to set the xenstore entry. */
|
794 |
xs = xs_open(0);
|
795 |
if (xs == NULL) { |
796 |
fprintf(stderr, "Could not contact XenStore\n");
|
797 |
goto out;
|
798 |
} |
799 |
|
800 |
path = xs_get_domain_path(xs, domid); |
801 |
if (path == NULL) { |
802 |
fprintf(stderr, "xs_get_domain_path() error\n");
|
803 |
goto out;
|
804 |
} |
805 |
newpath = realloc(path, (strlen(path) + strlen(string) + |
806 |
strlen("/tty") + 1)); |
807 |
if (newpath == NULL) { |
808 |
fprintf(stderr, "realloc error\n");
|
809 |
goto out;
|
810 |
} |
811 |
path = newpath; |
812 |
|
813 |
strcat(path, string); |
814 |
strcat(path, "/tty");
|
815 |
if (!xs_write(xs, XBT_NULL, path, pts, strlen(pts))) {
|
816 |
fprintf(stderr, "xs_write for '%s' fail", string);
|
817 |
goto out;
|
818 |
} |
819 |
ret = 0;
|
820 |
|
821 |
out:
|
822 |
free(path); |
823 |
xs_close(xs); |
824 |
|
825 |
return ret;
|
826 |
} |
827 |
|
828 |
void xenstore_store_pv_console_info(int i, CharDriverState *chr) |
829 |
{ |
830 |
if (i == 0) { |
831 |
store_dev_info(xen_domid, chr, "/console");
|
832 |
} else {
|
833 |
char buf[32]; |
834 |
snprintf(buf, sizeof(buf), "/device/console/%d", i); |
835 |
store_dev_info(xen_domid, chr, buf); |
836 |
} |
837 |
} |
838 |
|
839 |
static void xenstore_record_dm_state(struct xs_handle *xs, const char *state) |
840 |
{ |
841 |
char path[50]; |
842 |
|
843 |
if (xs == NULL) { |
844 |
fprintf(stderr, "xenstore connection not initialized\n");
|
845 |
exit(1);
|
846 |
} |
847 |
|
848 |
snprintf(path, sizeof (path), "/local/domain/0/device-model/%u/state", xen_domid); |
849 |
if (!xs_write(xs, XBT_NULL, path, state, strlen(state))) {
|
850 |
fprintf(stderr, "error recording dm state\n");
|
851 |
exit(1);
|
852 |
} |
853 |
} |
854 |
|
855 |
static void xen_main_loop_prepare(XenIOState *state) |
856 |
{ |
857 |
int evtchn_fd = -1; |
858 |
|
859 |
if (state->xce_handle != XC_HANDLER_INITIAL_VALUE) {
|
860 |
evtchn_fd = xc_evtchn_fd(state->xce_handle); |
861 |
} |
862 |
|
863 |
state->buffered_io_timer = qemu_new_timer_ms(rt_clock, handle_buffered_io, |
864 |
state); |
865 |
qemu_mod_timer(state->buffered_io_timer, qemu_get_clock_ms(rt_clock)); |
866 |
|
867 |
if (evtchn_fd != -1) { |
868 |
qemu_set_fd_handler(evtchn_fd, cpu_handle_ioreq, NULL, state);
|
869 |
} |
870 |
} |
871 |
|
872 |
|
873 |
/* Initialise Xen */
|
874 |
|
875 |
static void xen_change_state_handler(void *opaque, int running, |
876 |
RunState state) |
877 |
{ |
878 |
if (running) {
|
879 |
/* record state running */
|
880 |
xenstore_record_dm_state(xenstore, "running");
|
881 |
} |
882 |
} |
883 |
|
884 |
static void xen_hvm_change_state_handler(void *opaque, int running, |
885 |
RunState rstate) |
886 |
{ |
887 |
XenIOState *xstate = opaque; |
888 |
if (running) {
|
889 |
xen_main_loop_prepare(xstate); |
890 |
} |
891 |
} |
892 |
|
893 |
static void xen_exit_notifier(Notifier *n, void *data) |
894 |
{ |
895 |
XenIOState *state = container_of(n, XenIOState, exit); |
896 |
|
897 |
xc_evtchn_close(state->xce_handle); |
898 |
xs_daemon_close(state->xenstore); |
899 |
} |
900 |
|
901 |
int xen_init(void) |
902 |
{ |
903 |
xen_xc = xen_xc_interface_open(0, 0, 0); |
904 |
if (xen_xc == XC_HANDLER_INITIAL_VALUE) {
|
905 |
xen_be_printf(NULL, 0, "can't open xen interface\n"); |
906 |
return -1; |
907 |
} |
908 |
qemu_add_vm_change_state_handler(xen_change_state_handler, NULL);
|
909 |
|
910 |
return 0; |
911 |
} |
912 |
|
913 |
int xen_hvm_init(void) |
914 |
{ |
915 |
int i, rc;
|
916 |
unsigned long ioreq_pfn; |
917 |
XenIOState *state; |
918 |
|
919 |
state = g_malloc0(sizeof (XenIOState));
|
920 |
|
921 |
state->xce_handle = xen_xc_evtchn_open(NULL, 0); |
922 |
if (state->xce_handle == XC_HANDLER_INITIAL_VALUE) {
|
923 |
perror("xen: event channel open");
|
924 |
return -errno;
|
925 |
} |
926 |
|
927 |
state->xenstore = xs_daemon_open(); |
928 |
if (state->xenstore == NULL) { |
929 |
perror("xen: xenstore open");
|
930 |
return -errno;
|
931 |
} |
932 |
|
933 |
state->exit.notify = xen_exit_notifier; |
934 |
qemu_add_exit_notifier(&state->exit); |
935 |
|
936 |
xc_get_hvm_param(xen_xc, xen_domid, HVM_PARAM_IOREQ_PFN, &ioreq_pfn); |
937 |
DPRINTF("shared page at pfn %lx\n", ioreq_pfn);
|
938 |
state->shared_page = xc_map_foreign_range(xen_xc, xen_domid, XC_PAGE_SIZE, |
939 |
PROT_READ|PROT_WRITE, ioreq_pfn); |
940 |
if (state->shared_page == NULL) { |
941 |
hw_error("map shared IO page returned error %d handle=" XC_INTERFACE_FMT,
|
942 |
errno, xen_xc); |
943 |
} |
944 |
|
945 |
xc_get_hvm_param(xen_xc, xen_domid, HVM_PARAM_BUFIOREQ_PFN, &ioreq_pfn); |
946 |
DPRINTF("buffered io page at pfn %lx\n", ioreq_pfn);
|
947 |
state->buffered_io_page = xc_map_foreign_range(xen_xc, xen_domid, XC_PAGE_SIZE, |
948 |
PROT_READ|PROT_WRITE, ioreq_pfn); |
949 |
if (state->buffered_io_page == NULL) { |
950 |
hw_error("map buffered IO page returned error %d", errno);
|
951 |
} |
952 |
|
953 |
state->ioreq_local_port = g_malloc0(smp_cpus * sizeof (evtchn_port_t));
|
954 |
|
955 |
/* FIXME: how about if we overflow the page here? */
|
956 |
for (i = 0; i < smp_cpus; i++) { |
957 |
rc = xc_evtchn_bind_interdomain(state->xce_handle, xen_domid, |
958 |
xen_vcpu_eport(state->shared_page, i)); |
959 |
if (rc == -1) { |
960 |
fprintf(stderr, "bind interdomain ioctl error %d\n", errno);
|
961 |
return -1; |
962 |
} |
963 |
state->ioreq_local_port[i] = rc; |
964 |
} |
965 |
|
966 |
/* Init RAM management */
|
967 |
xen_map_cache_init(); |
968 |
xen_ram_init(ram_size); |
969 |
|
970 |
qemu_add_vm_change_state_handler(xen_hvm_change_state_handler, state); |
971 |
|
972 |
state->memory_listener = xen_memory_listener; |
973 |
QLIST_INIT(&state->physmap); |
974 |
memory_listener_register(&state->memory_listener); |
975 |
state->log_for_dirtybit = NULL;
|
976 |
|
977 |
/* Initialize backend core & drivers */
|
978 |
if (xen_be_init() != 0) { |
979 |
fprintf(stderr, "%s: xen backend core setup failed\n", __FUNCTION__);
|
980 |
exit(1);
|
981 |
} |
982 |
xen_be_register("console", &xen_console_ops);
|
983 |
xen_be_register("vkbd", &xen_kbdmouse_ops);
|
984 |
xen_be_register("qdisk", &xen_blkdev_ops);
|
985 |
|
986 |
return 0; |
987 |
} |
988 |
|
989 |
void destroy_hvm_domain(void) |
990 |
{ |
991 |
XenXC xc_handle; |
992 |
int sts;
|
993 |
|
994 |
xc_handle = xen_xc_interface_open(0, 0, 0); |
995 |
if (xc_handle == XC_HANDLER_INITIAL_VALUE) {
|
996 |
fprintf(stderr, "Cannot acquire xenctrl handle\n");
|
997 |
} else {
|
998 |
sts = xc_domain_shutdown(xc_handle, xen_domid, SHUTDOWN_poweroff); |
999 |
if (sts != 0) { |
1000 |
fprintf(stderr, "? xc_domain_shutdown failed to issue poweroff, "
|
1001 |
"sts %d, %s\n", sts, strerror(errno));
|
1002 |
} else {
|
1003 |
fprintf(stderr, "Issued domain %d poweroff\n", xen_domid);
|
1004 |
} |
1005 |
xc_interface_close(xc_handle); |
1006 |
} |
1007 |
} |
1008 |
|
1009 |
void xen_register_framebuffer(MemoryRegion *mr)
|
1010 |
{ |
1011 |
framebuffer = mr; |
1012 |
} |