xen-mapcache.c @ 7fc7e584
/*
 * Copyright (C) 2011 Citrix Ltd.
 *
 * This work is licensed under the terms of the GNU GPL, version 2. See
 * the COPYING file in the top-level directory.
 */

#include "config.h"

#include <sys/resource.h>

#include "hw/xen_backend.h"
#include "blockdev.h"
#include "bitmap.h"

#include <xen/hvm/params.h>
#include <sys/mman.h>

#include "xen-mapcache.h"
#include "trace.h"


//#define MAPCACHE_DEBUG

#ifdef MAPCACHE_DEBUG
#  define DPRINTF(fmt, ...) do { \
    fprintf(stderr, "xen_mapcache: " fmt, ## __VA_ARGS__); \
} while (0)
#else
#  define DPRINTF(fmt, ...) do { } while (0)
#endif

#if defined(__i386__)
#  define MCACHE_BUCKET_SHIFT 16
#  define MCACHE_MAX_SIZE     (1UL<<31) /* 2GB Cap */
#elif defined(__x86_64__)
#  define MCACHE_BUCKET_SHIFT 20
#  define MCACHE_MAX_SIZE     (1UL<<35) /* 32GB Cap */
#endif
#define MCACHE_BUCKET_SIZE (1UL << MCACHE_BUCKET_SHIFT)
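/* A bucket therefore spans 64KB (1UL << 16) of guest-physical address space
 * on i386 and 1MB (1UL << 20) on x86_64. */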

/* This is the size of the virtual address space reserved for QEMU that will
 * not be used by the mapcache.
 * Empirical tests show that QEMU uses about 75MB more than max_mcache_size.
 */
#define NON_MCACHE_MEMORY_SIZE (80 * 1024 * 1024)

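/* No-op locking macros: the cache is presumably only touched from a single
 * thread, but the call sites are kept so real locking could be dropped in. */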
#define mapcache_lock()   ((void)0)
#define mapcache_unlock() ((void)0)

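/* MapCacheEntry is one bucket of the cache, chained on hash collision via
 * next; valid_mapping has one bit per XC_PAGE-sized page that was actually
 * mapped.  MapCacheRev records a locked mapping for reverse (virtual ->
 * guest-physical) lookup.  The entry array is indexed by
 * paddr_index % nr_buckets. */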
typedef struct MapCacheEntry {
    target_phys_addr_t paddr_index;
    uint8_t *vaddr_base;
    unsigned long *valid_mapping;
    uint8_t lock;
    target_phys_addr_t size;
    struct MapCacheEntry *next;
} MapCacheEntry;

typedef struct MapCacheRev {
    uint8_t *vaddr_req;
    target_phys_addr_t paddr_index;
    target_phys_addr_t size;
    QTAILQ_ENTRY(MapCacheRev) next;
} MapCacheRev;

typedef struct MapCache {
    MapCacheEntry *entry;
    unsigned long nr_buckets;
    QTAILQ_HEAD(map_cache_head, MapCacheRev) locked_entries;

    /* For most cases (>99.9%), the page address is the same. */
    target_phys_addr_t last_address_index;
    uint8_t *last_address_vaddr;
    unsigned long max_mcache_size;
    unsigned int mcache_bucket_shift;
} MapCache;

static MapCache *mapcache;

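/* Return 1 if all bits in [nr, nr + size) of the bitmap are set, i.e. no
 * zero bit is found in that range; return 0 otherwise. */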
static inline int test_bits(int nr, int size, const unsigned long *addr)
{
    unsigned long res = find_next_zero_bit(addr, size + nr, nr);
    if (res >= nr + size) {
        return 1;
    } else {
        return 0;
    }
}

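/* Size the cache against RLIMIT_AS.  Running as root, the limit is lifted
 * and the full MCACHE_MAX_SIZE is used; otherwise the cache is capped so
 * that it plus NON_MCACHE_MEMORY_SIZE still fits under the hard limit.
 * nr_buckets is max_mcache_size rounded up to a whole number of buckets. */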
void xen_map_cache_init(void)
{
    unsigned long size;
    struct rlimit rlimit_as;

    mapcache = g_malloc0(sizeof (MapCache));

    QTAILQ_INIT(&mapcache->locked_entries);
    mapcache->last_address_index = -1;

    if (geteuid() == 0) {
        rlimit_as.rlim_cur = RLIM_INFINITY;
        rlimit_as.rlim_max = RLIM_INFINITY;
        mapcache->max_mcache_size = MCACHE_MAX_SIZE;
    } else {
        getrlimit(RLIMIT_AS, &rlimit_as);
        rlimit_as.rlim_cur = rlimit_as.rlim_max;

        if (rlimit_as.rlim_max != RLIM_INFINITY) {
            fprintf(stderr, "Warning: QEMU's maximum size of virtual"
                    " memory is not infinity.\n");
        }
        if (rlimit_as.rlim_max < MCACHE_MAX_SIZE + NON_MCACHE_MEMORY_SIZE) {
            mapcache->max_mcache_size = rlimit_as.rlim_max -
                NON_MCACHE_MEMORY_SIZE;
        } else {
            mapcache->max_mcache_size = MCACHE_MAX_SIZE;
        }
    }

    setrlimit(RLIMIT_AS, &rlimit_as);

    mapcache->nr_buckets =
        (((mapcache->max_mcache_size >> XC_PAGE_SHIFT) +
          (1UL << (MCACHE_BUCKET_SHIFT - XC_PAGE_SHIFT)) - 1) >>
         (MCACHE_BUCKET_SHIFT - XC_PAGE_SHIFT));

    size = mapcache->nr_buckets * sizeof (MapCacheEntry);
    size = (size + XC_PAGE_SIZE - 1) & ~(XC_PAGE_SIZE - 1);
    DPRINTF("%s, nr_buckets = %lx size %lu\n", __func__,
            mapcache->nr_buckets, size);
    mapcache->entry = g_malloc0(size);
}

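/* (Re)map the bucket for address_index: tear down any previous mapping,
 * then map all nb_pfn guest frames with a single xc_map_foreign_bulk()
 * call.  Frames that failed to map (err[i] != 0) are left as zero bits in
 * valid_mapping so callers can detect the holes. */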
static void xen_remap_bucket(MapCacheEntry *entry,
                             target_phys_addr_t size,
                             target_phys_addr_t address_index)
{
    uint8_t *vaddr_base;
    xen_pfn_t *pfns;
    int *err;
    unsigned int i;
    target_phys_addr_t nb_pfn = size >> XC_PAGE_SHIFT;

    trace_xen_remap_bucket(address_index);

    pfns = g_malloc0(nb_pfn * sizeof (xen_pfn_t));
    err = g_malloc0(nb_pfn * sizeof (int));

    if (entry->vaddr_base != NULL) {
        if (munmap(entry->vaddr_base, entry->size) != 0) {
            perror("unmap fails");
            exit(-1);
        }
    }
    if (entry->valid_mapping != NULL) {
        g_free(entry->valid_mapping);
        entry->valid_mapping = NULL;
    }

    for (i = 0; i < nb_pfn; i++) {
        pfns[i] = (address_index << (MCACHE_BUCKET_SHIFT-XC_PAGE_SHIFT)) + i;
    }

    vaddr_base = xc_map_foreign_bulk(xen_xc, xen_domid, PROT_READ|PROT_WRITE,
                                     pfns, err, nb_pfn);
    if (vaddr_base == NULL) {
        perror("xc_map_foreign_bulk");
        exit(-1);
    }

    entry->vaddr_base = vaddr_base;
    entry->paddr_index = address_index;
    entry->size = size;
    entry->valid_mapping = (unsigned long *) g_malloc0(sizeof(unsigned long) *
            BITS_TO_LONGS(size >> XC_PAGE_SHIFT));

    bitmap_zero(entry->valid_mapping, nb_pfn);
    for (i = 0; i < nb_pfn; i++) {
        if (!err[i]) {
            bitmap_set(entry->valid_mapping, i, 1);
        }
    }

    g_free(pfns);
    g_free(err);
}

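/* Return a pointer to the mapping of guest physical address phys_addr.
 * A hit on the single-entry last_address cache is returned immediately;
 * otherwise the bucket chain is searched and remapped as needed.  With
 * lock != 0 the entry is pinned and a MapCacheRev is queued so the mapping
 * can later be translated back or invalidated by pointer. */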
uint8_t *xen_map_cache(target_phys_addr_t phys_addr, target_phys_addr_t size,
                       uint8_t lock)
{
    MapCacheEntry *entry, *pentry = NULL;
    target_phys_addr_t address_index = phys_addr >> MCACHE_BUCKET_SHIFT;
    target_phys_addr_t address_offset = phys_addr & (MCACHE_BUCKET_SIZE - 1);
    target_phys_addr_t __size = size;

    trace_xen_map_cache(phys_addr);

    if (address_index == mapcache->last_address_index && !lock && !__size) {
        trace_xen_map_cache_return(mapcache->last_address_vaddr + address_offset);
        return mapcache->last_address_vaddr + address_offset;
    }

    /* Round __size up so it is always a multiple of MCACHE_BUCKET_SIZE
     * (a size of 0 maps one bucket). */
    if ((address_offset + (__size % MCACHE_BUCKET_SIZE)) > MCACHE_BUCKET_SIZE) {
        __size += MCACHE_BUCKET_SIZE;
    }
    if (__size % MCACHE_BUCKET_SIZE) {
        __size += MCACHE_BUCKET_SIZE - (__size % MCACHE_BUCKET_SIZE);
    }
    if (!__size) {
        __size = MCACHE_BUCKET_SIZE;
    }

    entry = &mapcache->entry[address_index % mapcache->nr_buckets];

    while (entry && entry->lock && entry->vaddr_base &&
            (entry->paddr_index != address_index || entry->size != __size ||
             !test_bits(address_offset >> XC_PAGE_SHIFT, size >> XC_PAGE_SHIFT,
                 entry->valid_mapping))) {
        pentry = entry;
        entry = entry->next;
    }
    if (!entry) {
        entry = g_malloc0(sizeof (MapCacheEntry));
        pentry->next = entry;
        xen_remap_bucket(entry, __size, address_index);
    } else if (!entry->lock) {
        if (!entry->vaddr_base || entry->paddr_index != address_index ||
                entry->size != __size ||
                !test_bits(address_offset >> XC_PAGE_SHIFT, size >> XC_PAGE_SHIFT,
                    entry->valid_mapping)) {
            xen_remap_bucket(entry, __size, address_index);
        }
    }

    if (!test_bits(address_offset >> XC_PAGE_SHIFT, size >> XC_PAGE_SHIFT,
                entry->valid_mapping)) {
        mapcache->last_address_index = -1;
        trace_xen_map_cache_return(NULL);
        return NULL;
    }

    mapcache->last_address_index = address_index;
    mapcache->last_address_vaddr = entry->vaddr_base;
    if (lock) {
        MapCacheRev *reventry = g_malloc0(sizeof(MapCacheRev));
        entry->lock++;
        reventry->vaddr_req = mapcache->last_address_vaddr + address_offset;
        reventry->paddr_index = mapcache->last_address_index;
        reventry->size = entry->size;
        QTAILQ_INSERT_HEAD(&mapcache->locked_entries, reventry, next);
    }

    trace_xen_map_cache_return(mapcache->last_address_vaddr + address_offset);
    return mapcache->last_address_vaddr + address_offset;
}

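/* Reverse lookup: translate a pointer returned by a locked xen_map_cache()
 * call back into a guest ram_addr_t.  Aborts if the pointer is not on the
 * locked_entries list. */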
ram_addr_t xen_ram_addr_from_mapcache(void *ptr)
{
    MapCacheEntry *entry = NULL;
    MapCacheRev *reventry;
    target_phys_addr_t paddr_index;
    target_phys_addr_t size;
    int found = 0;

    QTAILQ_FOREACH(reventry, &mapcache->locked_entries, next) {
        if (reventry->vaddr_req == ptr) {
            paddr_index = reventry->paddr_index;
            size = reventry->size;
            found = 1;
            break;
        }
    }
    if (!found) {
        fprintf(stderr, "%s, could not find %p\n", __func__, ptr);
        QTAILQ_FOREACH(reventry, &mapcache->locked_entries, next) {
            DPRINTF("   "TARGET_FMT_plx" -> %p is present\n", reventry->paddr_index,
                    reventry->vaddr_req);
        }
        abort();
        return 0;
    }

    entry = &mapcache->entry[paddr_index % mapcache->nr_buckets];
    while (entry && (entry->paddr_index != paddr_index || entry->size != size)) {
        entry = entry->next;
    }
    if (!entry) {
        DPRINTF("Trying to find address %p that is not in the mapcache!\n", ptr);
        return 0;
    }
    return (reventry->paddr_index << MCACHE_BUCKET_SHIFT) +
        ((unsigned long) ptr - (unsigned long) entry->vaddr_base);
}

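/* Drop one lock reference on the entry that maps buffer.  When the last
 * reference is gone the entry is unmapped and unlinked, except for the
 * first entry of a bucket (pentry == NULL), which stays in place. */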
void xen_invalidate_map_cache_entry(uint8_t *buffer)
{
    MapCacheEntry *entry = NULL, *pentry = NULL;
    MapCacheRev *reventry;
    target_phys_addr_t paddr_index;
    target_phys_addr_t size;
    int found = 0;

    if (mapcache->last_address_vaddr == buffer) {
        mapcache->last_address_index = -1;
    }

    QTAILQ_FOREACH(reventry, &mapcache->locked_entries, next) {
        if (reventry->vaddr_req == buffer) {
            paddr_index = reventry->paddr_index;
            size = reventry->size;
            found = 1;
            break;
        }
    }
    if (!found) {
        DPRINTF("%s, could not find %p\n", __func__, buffer);
        QTAILQ_FOREACH(reventry, &mapcache->locked_entries, next) {
            DPRINTF("   "TARGET_FMT_plx" -> %p is present\n", reventry->paddr_index, reventry->vaddr_req);
        }
        return;
    }
    QTAILQ_REMOVE(&mapcache->locked_entries, reventry, next);
    g_free(reventry);

    entry = &mapcache->entry[paddr_index % mapcache->nr_buckets];
    while (entry && (entry->paddr_index != paddr_index || entry->size != size)) {
        pentry = entry;
        entry = entry->next;
    }
    if (!entry) {
        DPRINTF("Trying to unmap address %p that is not in the mapcache!\n", buffer);
        return;
    }
    entry->lock--;
    if (entry->lock > 0 || pentry == NULL) {
        return;
    }

    pentry->next = entry->next;
    if (munmap(entry->vaddr_base, entry->size) != 0) {
        perror("unmap fails");
        exit(-1);
    }
    g_free(entry->valid_mapping);
    g_free(entry);
}

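/* Throw away the whole cache: flush pending AIO first, warn about any
 * mapping that is still locked, then unmap every bucket and reset the
 * cache to an empty state. */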
void xen_invalidate_map_cache(void)
{
    unsigned long i;
    MapCacheRev *reventry;

    /* Flush pending AIO before destroying the mapcache */
    qemu_aio_flush();

    QTAILQ_FOREACH(reventry, &mapcache->locked_entries, next) {
        DPRINTF("There should be no locked mappings at this time, "
                "but "TARGET_FMT_plx" -> %p is present\n",
                reventry->paddr_index, reventry->vaddr_req);
    }

    mapcache_lock();

    for (i = 0; i < mapcache->nr_buckets; i++) {
        MapCacheEntry *entry = &mapcache->entry[i];

        if (entry->vaddr_base == NULL) {
            continue;
        }

        if (munmap(entry->vaddr_base, entry->size) != 0) {
            perror("unmap fails");
            exit(-1);
        }

        entry->paddr_index = 0;
        entry->vaddr_base = NULL;
        entry->size = 0;
        g_free(entry->valid_mapping);
        entry->valid_mapping = NULL;
    }

    mapcache->last_address_index = -1;
    mapcache->last_address_vaddr = NULL;

    mapcache_unlock();
}