/*
 *  mmap support for qemu
 *
 *  Copyright (c) 2003 - 2008 Fabrice Bellard
 *
 *  This program is free software; you can redistribute it and/or modify
 *  it under the terms of the GNU General Public License as published by
 *  the Free Software Foundation; either version 2 of the License, or
 *  (at your option) any later version.
 *
 *  This program is distributed in the hope that it will be useful,
 *  but WITHOUT ANY WARRANTY; without even the implied warranty of
 *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 *  GNU General Public License for more details.
 *
 *  You should have received a copy of the GNU General Public License
 *  along with this program; if not, see <http://www.gnu.org/licenses/>.
 */
#include <stdlib.h>
#include <stdio.h>
#include <stdarg.h>
#include <string.h>
#include <unistd.h>
#include <errno.h>
#include <sys/mman.h>

#include "qemu.h"
#include "qemu-common.h"
#include "bsd-mman.h"

//#define DEBUG_MMAP

#if defined(CONFIG_USE_NPTL)
pthread_mutex_t mmap_mutex;
static int __thread mmap_lock_count;

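/* mmap_lock() nests: only the outermost call in a thread takes the
   mutex, and the matching outermost mmap_unlock() releases it.  The
   nesting depth lives in the thread-local mmap_lock_count, so each
   thread tracks its own balance. */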
void mmap_lock(void)
{
    if (mmap_lock_count++ == 0) {
        pthread_mutex_lock(&mmap_mutex);
    }
}

void mmap_unlock(void)
{
    if (--mmap_lock_count == 0) {
        pthread_mutex_unlock(&mmap_mutex);
    }
}

/* Grab lock to make sure things are in a consistent state after fork().  */
void mmap_fork_start(void)
{
    if (mmap_lock_count)
        abort();
    pthread_mutex_lock(&mmap_mutex);
}

void mmap_fork_end(int child)
{
    if (child)
        pthread_mutex_init(&mmap_mutex, NULL);
    else
        pthread_mutex_unlock(&mmap_mutex);
}
#else
/* We aren't threadsafe to start with, so no need to worry about locking.  */
void mmap_lock(void)
{
}

void mmap_unlock(void)
{
}
#endif

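/* Allocate page-aligned memory straight from the host mmap().  If the
   host kernel places the block inside the guest's address range, the
   corresponding guest pages are flagged PAGE_RESERVED so that later
   guest mappings will not land on top of it. */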
void *qemu_vmalloc(size_t size)
{
    void *p;
    mmap_lock();
    /* Use map and mark the pages as used. */
    p = mmap(NULL, size, PROT_READ | PROT_WRITE,
             MAP_PRIVATE | MAP_ANON, -1, 0);

    if (h2g_valid(p)) {
        /* Allocated region overlaps guest address space.
           This may recurse. */
        abi_ulong addr = h2g(p);
        page_set_flags(addr & TARGET_PAGE_MASK, TARGET_PAGE_ALIGN(addr + size),
                       PAGE_RESERVED);
    }

    mmap_unlock();
    return p;
}

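/* The total allocation size is stashed in a 16-byte header in front of
   the returned block so qemu_free()/qemu_realloc() can recover it.
   Using 16 bytes rather than sizeof(size_t) presumably keeps the
   returned pointer comfortably aligned. */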
void *qemu_malloc(size_t size)
{
    char *p;
    size += 16;
    p = qemu_vmalloc(size);
    *(size_t *)p = size;
    return p + 16;
}

/* We use map, which is always zero initialized.  */
void *qemu_mallocz(size_t size)
{
    return qemu_malloc(size);
}

void qemu_free(void *ptr)
{
    /* FIXME: We should unmark the reserved pages here.  However this gets
       complicated when one target page spans multiple host pages, so we
       don't bother.  */
    size_t *p;
    p = (size_t *)((char *)ptr - 16);
    munmap(p, *p);
}

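/* There is no mremap() path here: realloc is implemented as allocate,
   copy the smaller of the old and new usable sizes, free. */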
void *qemu_realloc(void *ptr, size_t size)
{
    size_t old_size, copy;
    void *new_ptr;

    if (!ptr)
        return qemu_malloc(size);
    /* The stored size includes the 16-byte header; subtract it so that
       we only copy the bytes the caller could actually use. */
    old_size = *(size_t *)((char *)ptr - 16) - 16;
    copy = old_size < size ? old_size : size;
    new_ptr = qemu_malloc(size);
    memcpy(new_ptr, ptr, copy);
    qemu_free(ptr);
    return new_ptr;
}

/* NOTE: all the constants are the HOST ones, but addresses are target. */
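/* A single host page can hold several target pages with different
   protections when qemu_host_page_size > TARGET_PAGE_SIZE.  The partial
   host page at each end therefore gets the union of the protections of
   all target pages it contains; only the host-page-aligned middle is
   mprotect()ed with exactly the requested protection. */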
int target_mprotect(abi_ulong start, abi_ulong len, int prot)
{
    abi_ulong end, host_start, host_end, addr;
    int prot1, ret;

#ifdef DEBUG_MMAP
    printf("mprotect: start=0x" TARGET_FMT_lx
           " len=0x" TARGET_FMT_lx " prot=%c%c%c\n", start, len,
           prot & PROT_READ ? 'r' : '-',
           prot & PROT_WRITE ? 'w' : '-',
           prot & PROT_EXEC ? 'x' : '-');
#endif

    if ((start & ~TARGET_PAGE_MASK) != 0)
        return -EINVAL;
    len = TARGET_PAGE_ALIGN(len);
    end = start + len;
    if (end < start)
        return -EINVAL;
    prot &= PROT_READ | PROT_WRITE | PROT_EXEC;
    if (len == 0)
        return 0;

    mmap_lock();
    host_start = start & qemu_host_page_mask;
    host_end = HOST_PAGE_ALIGN(end);
    if (start > host_start) {
        /* handle host page containing start */
        prot1 = prot;
        for(addr = host_start; addr < start; addr += TARGET_PAGE_SIZE) {
            prot1 |= page_get_flags(addr);
        }
        if (host_end == host_start + qemu_host_page_size) {
            for(addr = end; addr < host_end; addr += TARGET_PAGE_SIZE) {
                prot1 |= page_get_flags(addr);
            }
            end = host_end;
        }
        ret = mprotect(g2h(host_start), qemu_host_page_size, prot1 & PAGE_BITS);
        if (ret != 0)
            goto error;
        host_start += qemu_host_page_size;
    }
    if (end < host_end) {
        prot1 = prot;
        for(addr = end; addr < host_end; addr += TARGET_PAGE_SIZE) {
            prot1 |= page_get_flags(addr);
        }
        ret = mprotect(g2h(host_end - qemu_host_page_size), qemu_host_page_size,
                       prot1 & PAGE_BITS);
        if (ret != 0)
            goto error;
        host_end -= qemu_host_page_size;
    }

    /* handle the pages in the middle */
    if (host_start < host_end) {
        ret = mprotect(g2h(host_start), host_end - host_start, prot);
        if (ret != 0)
            goto error;
    }
    page_set_flags(start, start + len, prot | PAGE_VALID);
    mmap_unlock();
    return 0;
error:
    mmap_unlock();
    return ret;
}

/* map an incomplete host page */
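/* Three cases are handled below: no target page in the host page is
   mapped yet (allocate a fresh anonymous page), the fragment itself is
   anonymous (just widen the protection), or it is file-backed (emulate
   the mapping by pread()ing the file contents into the page, making the
   page temporarily writable if necessary). */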
static int mmap_frag(abi_ulong real_start,
                     abi_ulong start, abi_ulong end,
                     int prot, int flags, int fd, abi_ulong offset)
{
    abi_ulong real_end, addr;
    void *host_start;
    int prot1, prot_new;

    real_end = real_start + qemu_host_page_size;
    host_start = g2h(real_start);

    /* get the protection of the target pages outside the mapping */
    prot1 = 0;
    for(addr = real_start; addr < real_end; addr += TARGET_PAGE_SIZE) {
        if (addr < start || addr >= end)
            prot1 |= page_get_flags(addr);
    }

    if (prot1 == 0) {
        /* no page was there, so we allocate one */
        void *p = mmap(host_start, qemu_host_page_size, prot,
                       flags | MAP_ANON, -1, 0);
        if (p == MAP_FAILED)
            return -1;
        prot1 = prot;
    }
    prot1 &= PAGE_BITS;

    prot_new = prot | prot1;
    if (!(flags & MAP_ANON)) {
        /* msync() won't work here, so we return an error if write is
           possible while it is a shared mapping */
        if ((flags & TARGET_BSD_MAP_FLAGMASK) == MAP_SHARED &&
            (prot & PROT_WRITE))
            return -1;

        /* adjust protection to be able to read */
        if (!(prot1 & PROT_WRITE))
            mprotect(host_start, qemu_host_page_size, prot1 | PROT_WRITE);

        /* read the corresponding file data */
        pread(fd, g2h(start), end - start, offset);

        /* put final protection */
        if (prot_new != (prot1 | PROT_WRITE))
            mprotect(host_start, qemu_host_page_size, prot_new);
    } else {
        /* just update the protection */
        if (prot_new != prot1) {
            mprotect(host_start, qemu_host_page_size, prot_new);
        }
    }
    return 0;
}

#if defined(__CYGWIN__)
/* Cygwin doesn't have a whole lot of address space.  */
static abi_ulong mmap_next_start = 0x18000000;
#else
static abi_ulong mmap_next_start = 0x40000000;
#endif

unsigned long last_brk;

/* find a free memory area of size 'size'. The search starts at
   'start'. If 'start' == 0, then a default start address is used.
   Return -1 if error.
*/
/* page_init() marks pages used by the host as reserved to be sure not
   to use them. */
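/* The scan below is linear: advance one host page at a time until a
   run of 'size' bytes whose target pages all have no flags set is
   found.  If addr wraps all the way around to where the scan began,
   the address space is exhausted and (abi_ulong)-1 is returned. */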
static abi_ulong mmap_find_vma(abi_ulong start, abi_ulong size)
{
    abi_ulong addr, addr1, addr_start;
    int prot;
    unsigned long new_brk;

    new_brk = (unsigned long)sbrk(0);
    if (last_brk && last_brk < new_brk && last_brk == (target_ulong)last_brk) {
        /* This is a hack to catch the host allocating memory with brk().
           If it uses mmap then we lose.
           FIXME: We really want to avoid the host allocating memory in
           the first place, and maybe leave some slack to avoid switching
           to mmap.  */
        page_set_flags(last_brk & TARGET_PAGE_MASK,
                       TARGET_PAGE_ALIGN(new_brk),
                       PAGE_RESERVED);
    }
    last_brk = new_brk;

    size = HOST_PAGE_ALIGN(size);
    start = start & qemu_host_page_mask;
    addr = start;
    if (addr == 0)
        addr = mmap_next_start;
    addr_start = addr;
    for(;;) {
        prot = 0;
        for(addr1 = addr; addr1 < (addr + size); addr1 += TARGET_PAGE_SIZE) {
            prot |= page_get_flags(addr1);
        }
        if (prot == 0)
            break;
        addr += qemu_host_page_size;
        /* we found nothing */
        if (addr == addr_start)
            return (abi_ulong)-1;
    }
    if (start == 0)
        mmap_next_start = addr + size;
    return addr;
}

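/* target_mmap() reconciles target-page-granular requests with the
   host's coarser page size.  Non-fixed requests are placed by
   mmap_find_vma() and mapped in one go.  MAP_FIXED requests map the
   host-page-aligned middle directly and fall back to mmap_frag() for a
   partial host page at either end; if a file mapping's offset is not
   host-page aligned it cannot be mapped directly at all, so the region
   is mapped anonymous and filled in with pread() instead. */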
/* NOTE: all the constants are the HOST ones */
abi_long target_mmap(abi_ulong start, abi_ulong len, int prot,
                     int flags, int fd, abi_ulong offset)
{
    abi_ulong ret, end, real_start, real_end, retaddr, host_offset, host_len;
    unsigned long host_start;

    mmap_lock();
#ifdef DEBUG_MMAP
    {
        printf("mmap: start=0x" TARGET_FMT_lx
               " len=0x" TARGET_FMT_lx " prot=%c%c%c flags=",
               start, len,
               prot & PROT_READ ? 'r' : '-',
               prot & PROT_WRITE ? 'w' : '-',
               prot & PROT_EXEC ? 'x' : '-');
        if (flags & MAP_FIXED)
            printf("MAP_FIXED ");
        if (flags & MAP_ANON)
            printf("MAP_ANON ");
        switch(flags & TARGET_BSD_MAP_FLAGMASK) {
        case MAP_PRIVATE:
            printf("MAP_PRIVATE ");
            break;
        case MAP_SHARED:
            printf("MAP_SHARED ");
            break;
        default:
            printf("[MAP_FLAGMASK=0x%x] ", flags & TARGET_BSD_MAP_FLAGMASK);
            break;
        }
        printf("fd=%d offset=" TARGET_FMT_lx "\n", fd, offset);
    }
#endif

    if (offset & ~TARGET_PAGE_MASK) {
        errno = EINVAL;
        goto fail;
    }

    len = TARGET_PAGE_ALIGN(len);
    if (len == 0)
        goto the_end;
    real_start = start & qemu_host_page_mask;

    if (!(flags & MAP_FIXED)) {
        abi_ulong mmap_start;
        void *p;
        host_offset = offset & qemu_host_page_mask;
        host_len = len + offset - host_offset;
        host_len = HOST_PAGE_ALIGN(host_len);
        mmap_start = mmap_find_vma(real_start, host_len);
        if (mmap_start == (abi_ulong)-1) {
            errno = ENOMEM;
            goto fail;
        }
        /* Note: we prefer to control the mapping address. It is
           especially important if qemu_host_page_size >
           qemu_real_host_page_size */
        p = mmap(g2h(mmap_start),
                 host_len, prot, flags | MAP_FIXED, fd, host_offset);
        if (p == MAP_FAILED)
            goto fail;
        /* update start so that it points to the file position at 'offset' */
        host_start = (unsigned long)p;
        if (!(flags & MAP_ANON))
            host_start += offset - host_offset;
        start = h2g(host_start);
    } else {
        int flg;
        target_ulong addr;

        if (start & ~TARGET_PAGE_MASK) {
            errno = EINVAL;
            goto fail;
        }
        end = start + len;
        real_end = HOST_PAGE_ALIGN(end);

        for(addr = real_start; addr < real_end; addr += TARGET_PAGE_SIZE) {
            flg = page_get_flags(addr);
            if (flg & PAGE_RESERVED) {
                errno = ENXIO;
                goto fail;
            }
        }

        /* worst case: we cannot map the file because the offset is not
           aligned, so we read it */
        if (!(flags & MAP_ANON) &&
            (offset & ~qemu_host_page_mask) != (start & ~qemu_host_page_mask)) {
            /* msync() won't work here, so we return an error if write is
               possible while it is a shared mapping */
            if ((flags & TARGET_BSD_MAP_FLAGMASK) == MAP_SHARED &&
                (prot & PROT_WRITE)) {
                errno = EINVAL;
                goto fail;
            }
            retaddr = target_mmap(start, len, prot | PROT_WRITE,
                                  MAP_FIXED | MAP_PRIVATE | MAP_ANON,
                                  -1, 0);
            if (retaddr == -1)
                goto fail;
            pread(fd, g2h(start), len, offset);
            if (!(prot & PROT_WRITE)) {
                ret = target_mprotect(start, len, prot);
                if (ret != 0) {
                    start = ret;
                    goto the_end;
                }
            }
            goto the_end;
        }

        /* handle the start of the mapping */
        if (start > real_start) {
            if (real_end == real_start + qemu_host_page_size) {
                /* one single host page */
                ret = mmap_frag(real_start, start, end,
                                prot, flags, fd, offset);
                if (ret == -1)
                    goto fail;
                goto the_end1;
            }
            ret = mmap_frag(real_start, start, real_start + qemu_host_page_size,
                            prot, flags, fd, offset);
            if (ret == -1)
                goto fail;
            real_start += qemu_host_page_size;
        }
        /* handle the end of the mapping */
        if (end < real_end) {
            ret = mmap_frag(real_end - qemu_host_page_size,
                            real_end - qemu_host_page_size, real_end,
                            prot, flags, fd,
                            offset + real_end - qemu_host_page_size - start);
            if (ret == -1)
                goto fail;
            real_end -= qemu_host_page_size;
        }

        /* map the middle (easier) */
        if (real_start < real_end) {
            void *p;
            unsigned long offset1;
            if (flags & MAP_ANON)
                offset1 = 0;
            else
                offset1 = offset + real_start - start;
            p = mmap(g2h(real_start), real_end - real_start,
                     prot, flags, fd, offset1);
            if (p == MAP_FAILED)
                goto fail;
        }
    }
the_end1:
    page_set_flags(start, start + len, prot | PAGE_VALID);
the_end:
#ifdef DEBUG_MMAP
    printf("ret=0x" TARGET_FMT_lx "\n", start);
    page_dump(stdout);
    printf("\n");
#endif
    mmap_unlock();
    return start;
fail:
    mmap_unlock();
    return -1;
}

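/* Unmapping needs the same boundary care as mapping: a partial host
   page at either end is only released if no other target page within
   it is still in use; otherwise the host page is kept and only the
   target page flags are cleared. */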
int target_munmap(abi_ulong start, abi_ulong len)
{
    abi_ulong end, real_start, real_end, addr;
    int prot, ret;

#ifdef DEBUG_MMAP
    printf("munmap: start=0x" TARGET_FMT_lx " len=0x" TARGET_FMT_lx "\n",
           start, len);
#endif
    if (start & ~TARGET_PAGE_MASK)
        return -EINVAL;
    len = TARGET_PAGE_ALIGN(len);
    if (len == 0)
        return -EINVAL;
    mmap_lock();
    end = start + len;
    real_start = start & qemu_host_page_mask;
    real_end = HOST_PAGE_ALIGN(end);

    if (start > real_start) {
        /* handle host page containing start */
        prot = 0;
        for(addr = real_start; addr < start; addr += TARGET_PAGE_SIZE) {
            prot |= page_get_flags(addr);
        }
        if (real_end == real_start + qemu_host_page_size) {
            for(addr = end; addr < real_end; addr += TARGET_PAGE_SIZE) {
                prot |= page_get_flags(addr);
            }
            end = real_end;
        }
        if (prot != 0)
            real_start += qemu_host_page_size;
    }
    if (end < real_end) {
        prot = 0;
        for(addr = end; addr < real_end; addr += TARGET_PAGE_SIZE) {
            prot |= page_get_flags(addr);
        }
        if (prot != 0)
            real_end -= qemu_host_page_size;
    }

    ret = 0;
    /* unmap what we can */
    if (real_start < real_end) {
        ret = munmap(g2h(real_start), real_end - real_start);
    }

    if (ret == 0)
        page_set_flags(start, start + len, 0);
    mmap_unlock();
    return ret;
}

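/* msync() works on host pages, so round the start address down to a
   host page boundary before calling the host kernel. */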
int target_msync(abi_ulong start, abi_ulong len, int flags)
{
    abi_ulong end;

    if (start & ~TARGET_PAGE_MASK)
        return -EINVAL;
    len = TARGET_PAGE_ALIGN(len);
    end = start + len;
    if (end < start)
        return -EINVAL;
    if (end == start)
        return 0;

    start &= qemu_host_page_mask;
    return msync(g2h(start), end - start, flags);
}