/*
 *  virtual page mapping and translated block handling
 *
 *  Copyright (c) 2003 Fabrice Bellard
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, see <http://www.gnu.org/licenses/>.
 */
#include "config.h"
#ifdef _WIN32
#include <windows.h>
#else
#include <sys/types.h>
#include <sys/mman.h>
#endif

#include "qemu-common.h"
#include "cpu.h"
#include "tcg.h"
#include "hw/hw.h"
#include "hw/qdev.h"
#include "osdep.h"
#include "kvm.h"
#include "hw/xen.h"
#include "qemu-timer.h"
#include "memory.h"
#include "exec-memory.h"
#if defined(CONFIG_USER_ONLY)
#include <qemu.h>
#if defined(__FreeBSD__) || defined(__FreeBSD_kernel__)
#include <sys/param.h>
#if __FreeBSD_version >= 700104
#define HAVE_KINFO_GETVMMAP
#define sigqueue sigqueue_freebsd  /* avoid redefinition */
#include <sys/time.h>
#include <sys/proc.h>
#include <machine/profile.h>
#define _KERNEL
#include <sys/user.h>
#undef _KERNEL
#undef sigqueue
#include <libutil.h>
#endif
#endif
#else /* !CONFIG_USER_ONLY */
#include "xen-mapcache.h"
#include "trace.h"
#endif

//#define DEBUG_TB_INVALIDATE
//#define DEBUG_FLUSH
//#define DEBUG_TLB
//#define DEBUG_UNASSIGNED

/* make various TB consistency checks */
//#define DEBUG_TB_CHECK
//#define DEBUG_TLB_CHECK

//#define DEBUG_IOPORT
//#define DEBUG_SUBPAGE

#if !defined(CONFIG_USER_ONLY)
/* TB consistency checks only implemented for usermode emulation.  */
#undef DEBUG_TB_CHECK
#endif

#define SMC_BITMAP_USE_THRESHOLD 10

static TranslationBlock *tbs;
static int code_gen_max_blocks;
TranslationBlock *tb_phys_hash[CODE_GEN_PHYS_HASH_SIZE];
static int nb_tbs;
/* any access to the tbs or the page table must use this lock */
spinlock_t tb_lock = SPIN_LOCK_UNLOCKED;

#if defined(__arm__) || defined(__sparc_v9__)
/* The prologue must be reachable with a direct jump. ARM and Sparc64
   have limited branch ranges (possibly also PPC) so place it in a
   section close to code segment. */
#define code_gen_section                                \
    __attribute__((__section__(".gen_code")))           \
    __attribute__((aligned (32)))
#elif defined(_WIN32)
/* Maximum alignment for Win32 is 16. */
#define code_gen_section                                \
    __attribute__((aligned (16)))
#else
#define code_gen_section                                \
    __attribute__((aligned (32)))
#endif

uint8_t code_gen_prologue[1024] code_gen_section;
static uint8_t *code_gen_buffer;
static unsigned long code_gen_buffer_size;
/* threshold to flush the translated code buffer */
static unsigned long code_gen_buffer_max_size;
static uint8_t *code_gen_ptr;

#if !defined(CONFIG_USER_ONLY)
int phys_ram_fd;
static int in_migration;

RAMList ram_list = { .blocks = QLIST_HEAD_INITIALIZER(ram_list) };

static MemoryRegion *system_memory;

#endif

CPUState *first_cpu;
/* current CPU in the current thread. It is only valid inside
   cpu_exec() */
CPUState *cpu_single_env;
/* 0 = Do not count executed instructions.
   1 = Precise instruction counting.
   2 = Adaptive rate instruction counting.  */
int use_icount = 0;
/* Current instruction counter.  While executing translated code this may
   include some instructions that have not yet been executed.  */
int64_t qemu_icount;

typedef struct PageDesc {
    /* list of TBs intersecting this ram page */
    TranslationBlock *first_tb;
    /* in order to optimize self modifying code, we count the number
       of lookups we do to a given page to use a bitmap */
    unsigned int code_write_count;
    uint8_t *code_bitmap;
#if defined(CONFIG_USER_ONLY)
    unsigned long flags;
#endif
} PageDesc;

/* In system mode we want L1_MAP to be based on ram offsets,
   while in user mode we want it to be based on virtual addresses.  */
#if !defined(CONFIG_USER_ONLY)
#if HOST_LONG_BITS < TARGET_PHYS_ADDR_SPACE_BITS
# define L1_MAP_ADDR_SPACE_BITS  HOST_LONG_BITS
#else
# define L1_MAP_ADDR_SPACE_BITS  TARGET_PHYS_ADDR_SPACE_BITS
#endif
#else
# define L1_MAP_ADDR_SPACE_BITS  TARGET_VIRT_ADDR_SPACE_BITS
#endif

/* Size of the L2 (and L3, etc) page tables.  */
#define L2_BITS 10
#define L2_SIZE (1 << L2_BITS)

/* The bits remaining after N lower levels of page tables.  */
#define P_L1_BITS_REM \
    ((TARGET_PHYS_ADDR_SPACE_BITS - TARGET_PAGE_BITS) % L2_BITS)
#define V_L1_BITS_REM \
    ((L1_MAP_ADDR_SPACE_BITS - TARGET_PAGE_BITS) % L2_BITS)

/* Size of the L1 page table.  Avoid silly small sizes.  */
#if P_L1_BITS_REM < 4
#define P_L1_BITS  (P_L1_BITS_REM + L2_BITS)
#else
#define P_L1_BITS  P_L1_BITS_REM
#endif

#if V_L1_BITS_REM < 4
#define V_L1_BITS  (V_L1_BITS_REM + L2_BITS)
#else
#define V_L1_BITS  V_L1_BITS_REM
#endif

#define P_L1_SIZE  ((target_phys_addr_t)1 << P_L1_BITS)
#define V_L1_SIZE  ((target_ulong)1 << V_L1_BITS)

#define P_L1_SHIFT (TARGET_PHYS_ADDR_SPACE_BITS - TARGET_PAGE_BITS - P_L1_BITS)
#define V_L1_SHIFT (L1_MAP_ADDR_SPACE_BITS - TARGET_PAGE_BITS - V_L1_BITS)
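
/* Worked example (illustrative values only, not taken from any particular
   target): with TARGET_PHYS_ADDR_SPACE_BITS = 42, TARGET_PAGE_BITS = 12 and
   L2_BITS = 10, P_L1_BITS_REM = (42 - 12) % 10 = 0, which is below the
   "silly small" threshold, so P_L1_BITS becomes 0 + 10 = 10 and
   P_L1_SHIFT = 42 - 12 - 10 = 20.  A 30-bit physical page index is then
   split as: bits [29..20] select the L1 slot, and each remaining 10-bit
   group selects one slot per intermediate level down to the PhysPageDesc. */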

unsigned long qemu_real_host_page_size;
unsigned long qemu_host_page_bits;
unsigned long qemu_host_page_size;
unsigned long qemu_host_page_mask;

/* This is a multi-level map on the virtual address space.
   The bottom level has pointers to PageDesc.  */
static void *l1_map[V_L1_SIZE];

#if !defined(CONFIG_USER_ONLY)
typedef struct PhysPageDesc {
    /* offset in host memory of the page + io_index in the low bits */
    ram_addr_t phys_offset;
    ram_addr_t region_offset;
} PhysPageDesc;

/* This is a multi-level map on the physical address space.
   The bottom level has pointers to PhysPageDesc.  */
static void *l1_phys_map[P_L1_SIZE];

static void io_mem_init(void);
static void memory_map_init(void);

/* io memory support */
CPUWriteMemoryFunc *io_mem_write[IO_MEM_NB_ENTRIES][4];
CPUReadMemoryFunc *io_mem_read[IO_MEM_NB_ENTRIES][4];
void *io_mem_opaque[IO_MEM_NB_ENTRIES];
static char io_mem_used[IO_MEM_NB_ENTRIES];
static int io_mem_watch;
#endif

/* log support */
#ifdef WIN32
static const char *logfilename = "qemu.log";
#else
static const char *logfilename = "/tmp/qemu.log";
#endif
FILE *logfile;
int loglevel;
static int log_append = 0;

/* statistics */
#if !defined(CONFIG_USER_ONLY)
static int tlb_flush_count;
#endif
static int tb_flush_count;
static int tb_phys_invalidate_count;

#ifdef _WIN32
static void map_exec(void *addr, long size)
{
    DWORD old_protect;
    VirtualProtect(addr, size,
                   PAGE_EXECUTE_READWRITE, &old_protect);

}
#else
static void map_exec(void *addr, long size)
{
    unsigned long start, end, page_size;

    page_size = getpagesize();
    start = (unsigned long)addr;
    start &= ~(page_size - 1);

    end = (unsigned long)addr + size;
    end += page_size - 1;
    end &= ~(page_size - 1);

    mprotect((void *)start, end - start,
             PROT_READ | PROT_WRITE | PROT_EXEC);
}
#endif
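
/* Example of the alignment done by the POSIX map_exec() above (a sketch
   with an arbitrary address): for addr = 0x40071234, size = 0x100 and a
   4 KiB host page, start is rounded down to 0x40071000 and end is rounded
   up to 0x40072000, so mprotect() covers the whole host page containing
   the buffer rather than the unaligned byte range. */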

static void page_init(void)
{
    /* NOTE: we can always suppose that qemu_host_page_size >=
       TARGET_PAGE_SIZE */
#ifdef _WIN32
    {
        SYSTEM_INFO system_info;

        GetSystemInfo(&system_info);
        qemu_real_host_page_size = system_info.dwPageSize;
    }
#else
    qemu_real_host_page_size = getpagesize();
#endif
    if (qemu_host_page_size == 0)
        qemu_host_page_size = qemu_real_host_page_size;
    if (qemu_host_page_size < TARGET_PAGE_SIZE)
        qemu_host_page_size = TARGET_PAGE_SIZE;
    qemu_host_page_bits = 0;
    while ((1 << qemu_host_page_bits) < qemu_host_page_size)
        qemu_host_page_bits++;
    qemu_host_page_mask = ~(qemu_host_page_size - 1);

#if defined(CONFIG_BSD) && defined(CONFIG_USER_ONLY)
    {
#ifdef HAVE_KINFO_GETVMMAP
        struct kinfo_vmentry *freep;
        int i, cnt;

        freep = kinfo_getvmmap(getpid(), &cnt);
        if (freep) {
            mmap_lock();
            for (i = 0; i < cnt; i++) {
                unsigned long startaddr, endaddr;

                startaddr = freep[i].kve_start;
                endaddr = freep[i].kve_end;
                if (h2g_valid(startaddr)) {
                    startaddr = h2g(startaddr) & TARGET_PAGE_MASK;

                    if (h2g_valid(endaddr)) {
                        endaddr = h2g(endaddr);
                        page_set_flags(startaddr, endaddr, PAGE_RESERVED);
                    } else {
#if TARGET_ABI_BITS <= L1_MAP_ADDR_SPACE_BITS
                        endaddr = ~0ul;
                        page_set_flags(startaddr, endaddr, PAGE_RESERVED);
#endif
                    }
                }
            }
            free(freep);
            mmap_unlock();
        }
#else
        FILE *f;

        last_brk = (unsigned long)sbrk(0);

        f = fopen("/compat/linux/proc/self/maps", "r");
        if (f) {
            mmap_lock();

            do {
                unsigned long startaddr, endaddr;
                int n;

                n = fscanf (f, "%lx-%lx %*[^\n]\n", &startaddr, &endaddr);

                if (n == 2 && h2g_valid(startaddr)) {
                    startaddr = h2g(startaddr) & TARGET_PAGE_MASK;

                    if (h2g_valid(endaddr)) {
                        endaddr = h2g(endaddr);
                    } else {
                        endaddr = ~0ul;
                    }
                    page_set_flags(startaddr, endaddr, PAGE_RESERVED);
                }
            } while (!feof(f));

            fclose(f);
            mmap_unlock();
        }
#endif
    }
#endif
}
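
/* Illustration of the qemu_host_page_* values computed above (numbers are
   hypothetical): on a host with 4 KiB pages emulating a target with 8 KiB
   pages, qemu_real_host_page_size = 0x1000, qemu_host_page_size is raised
   to TARGET_PAGE_SIZE = 0x2000, qemu_host_page_bits = 13 and
   qemu_host_page_mask = ~0x1fff, so guest page protection is always applied
   in whole host-page-sized chunks. */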

static PageDesc *page_find_alloc(tb_page_addr_t index, int alloc)
{
    PageDesc *pd;
    void **lp;
    int i;

#if defined(CONFIG_USER_ONLY)
    /* We can't use qemu_malloc because it may recurse into a locked mutex. */
# define ALLOC(P, SIZE)                                 \
    do {                                                \
        P = mmap(NULL, SIZE, PROT_READ | PROT_WRITE,    \
                 MAP_PRIVATE | MAP_ANONYMOUS, -1, 0);   \
    } while (0)
#else
# define ALLOC(P, SIZE) \
    do { P = qemu_mallocz(SIZE); } while (0)
#endif

    /* Level 1.  Always allocated.  */
    lp = l1_map + ((index >> V_L1_SHIFT) & (V_L1_SIZE - 1));

    /* Level 2..N-1.  */
    for (i = V_L1_SHIFT / L2_BITS - 1; i > 0; i--) {
        void **p = *lp;

        if (p == NULL) {
            if (!alloc) {
                return NULL;
            }
            ALLOC(p, sizeof(void *) * L2_SIZE);
            *lp = p;
        }

        lp = p + ((index >> (i * L2_BITS)) & (L2_SIZE - 1));
    }

    pd = *lp;
    if (pd == NULL) {
        if (!alloc) {
            return NULL;
        }
        ALLOC(pd, sizeof(PageDesc) * L2_SIZE);
        *lp = pd;
    }

#undef ALLOC

    return pd + (index & (L2_SIZE - 1));
}

static inline PageDesc *page_find(tb_page_addr_t index)
{
    return page_find_alloc(index, 0);
}
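
/* Lookup sketch for the radix table above: page_find(index) walks from
   l1_map using the top V_L1_BITS of the page index, then one L2_BITS-wide
   slice per intermediate level, and finally indexes a leaf array of
   L2_SIZE PageDesc entries with the low bits.  With alloc == 0 a missing
   intermediate table makes the lookup return NULL instead of allocating,
   which is how callers probe for pages that have never held translated
   code. */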

#if !defined(CONFIG_USER_ONLY)
static PhysPageDesc *phys_page_find_alloc(target_phys_addr_t index, int alloc)
{
    PhysPageDesc *pd;
    void **lp;
    int i;

    /* Level 1.  Always allocated.  */
    lp = l1_phys_map + ((index >> P_L1_SHIFT) & (P_L1_SIZE - 1));

    /* Level 2..N-1.  */
    for (i = P_L1_SHIFT / L2_BITS - 1; i > 0; i--) {
        void **p = *lp;
        if (p == NULL) {
            if (!alloc) {
                return NULL;
            }
            *lp = p = qemu_mallocz(sizeof(void *) * L2_SIZE);
        }
        lp = p + ((index >> (i * L2_BITS)) & (L2_SIZE - 1));
    }

    pd = *lp;
    if (pd == NULL) {
        int i;

        if (!alloc) {
            return NULL;
        }

        *lp = pd = qemu_malloc(sizeof(PhysPageDesc) * L2_SIZE);

        for (i = 0; i < L2_SIZE; i++) {
            pd[i].phys_offset = IO_MEM_UNASSIGNED;
            pd[i].region_offset = (index + i) << TARGET_PAGE_BITS;
        }
    }

    return pd + (index & (L2_SIZE - 1));
}

static inline PhysPageDesc *phys_page_find(target_phys_addr_t index)
{
    return phys_page_find_alloc(index, 0);
}
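
/* Note on the physical map: freshly allocated leaf entries above are filled
   with IO_MEM_UNASSIGNED and a default region_offset, so phys_page_find()
   on an address that was never registered either returns NULL (missing
   intermediate level) or a descriptor that still reads as unassigned I/O;
   callers such as breakpoint_invalidate() below treat both cases the same
   way. */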

static void tlb_protect_code(ram_addr_t ram_addr);
static void tlb_unprotect_code_phys(CPUState *env, ram_addr_t ram_addr,
                                    target_ulong vaddr);
#define mmap_lock() do { } while(0)
#define mmap_unlock() do { } while(0)
#endif

#define DEFAULT_CODE_GEN_BUFFER_SIZE (32 * 1024 * 1024)

#if defined(CONFIG_USER_ONLY)
/* Currently it is not recommended to allocate big chunks of data in
   user mode. It will change when a dedicated libc will be used */
#define USE_STATIC_CODE_GEN_BUFFER
#endif

#ifdef USE_STATIC_CODE_GEN_BUFFER
static uint8_t static_code_gen_buffer[DEFAULT_CODE_GEN_BUFFER_SIZE]
               __attribute__((aligned (CODE_GEN_ALIGN)));
#endif

static void code_gen_alloc(unsigned long tb_size)
{
#ifdef USE_STATIC_CODE_GEN_BUFFER
    code_gen_buffer = static_code_gen_buffer;
    code_gen_buffer_size = DEFAULT_CODE_GEN_BUFFER_SIZE;
    map_exec(code_gen_buffer, code_gen_buffer_size);
#else
    code_gen_buffer_size = tb_size;
    if (code_gen_buffer_size == 0) {
#if defined(CONFIG_USER_ONLY)
        /* in user mode, phys_ram_size is not meaningful */
        code_gen_buffer_size = DEFAULT_CODE_GEN_BUFFER_SIZE;
#else
        /* XXX: needs adjustments */
        code_gen_buffer_size = (unsigned long)(ram_size / 4);
#endif
    }
    if (code_gen_buffer_size < MIN_CODE_GEN_BUFFER_SIZE)
        code_gen_buffer_size = MIN_CODE_GEN_BUFFER_SIZE;
    /* The code gen buffer location may have constraints depending on
       the host cpu and OS */
#if defined(__linux__)
    {
        int flags;
        void *start = NULL;

        flags = MAP_PRIVATE | MAP_ANONYMOUS;
#if defined(__x86_64__)
        flags |= MAP_32BIT;
        /* Cannot map more than that */
        if (code_gen_buffer_size > (800 * 1024 * 1024))
            code_gen_buffer_size = (800 * 1024 * 1024);
#elif defined(__sparc_v9__)
        // Map the buffer below 2G, so we can use direct calls and branches
        flags |= MAP_FIXED;
        start = (void *) 0x60000000UL;
        if (code_gen_buffer_size > (512 * 1024 * 1024))
            code_gen_buffer_size = (512 * 1024 * 1024);
#elif defined(__arm__)
        /* Map the buffer below 32M, so we can use direct calls and branches */
        flags |= MAP_FIXED;
        start = (void *) 0x01000000UL;
        if (code_gen_buffer_size > 16 * 1024 * 1024)
            code_gen_buffer_size = 16 * 1024 * 1024;
#elif defined(__s390x__)
        /* Map the buffer so that we can use direct calls and branches.  */
        /* We have a +- 4GB range on the branches; leave some slop.  */
        if (code_gen_buffer_size > (3ul * 1024 * 1024 * 1024)) {
            code_gen_buffer_size = 3ul * 1024 * 1024 * 1024;
        }
        start = (void *)0x90000000UL;
#endif
        code_gen_buffer = mmap(start, code_gen_buffer_size,
                               PROT_WRITE | PROT_READ | PROT_EXEC,
                               flags, -1, 0);
        if (code_gen_buffer == MAP_FAILED) {
            fprintf(stderr, "Could not allocate dynamic translator buffer\n");
            exit(1);
        }
    }
#elif defined(__FreeBSD__) || defined(__FreeBSD_kernel__) \
    || defined(__DragonFly__) || defined(__OpenBSD__) \
    || defined(__NetBSD__)
    {
        int flags;
        void *addr = NULL;
        flags = MAP_PRIVATE | MAP_ANONYMOUS;
#if defined(__x86_64__)
        /* FreeBSD doesn't have MAP_32BIT, use MAP_FIXED and assume
         * 0x40000000 is free */
        flags |= MAP_FIXED;
        addr = (void *)0x40000000;
        /* Cannot map more than that */
        if (code_gen_buffer_size > (800 * 1024 * 1024))
            code_gen_buffer_size = (800 * 1024 * 1024);
#elif defined(__sparc_v9__)
        // Map the buffer below 2G, so we can use direct calls and branches
        flags |= MAP_FIXED;
        addr = (void *) 0x60000000UL;
        if (code_gen_buffer_size > (512 * 1024 * 1024)) {
            code_gen_buffer_size = (512 * 1024 * 1024);
        }
#endif
        code_gen_buffer = mmap(addr, code_gen_buffer_size,
                               PROT_WRITE | PROT_READ | PROT_EXEC,
                               flags, -1, 0);
        if (code_gen_buffer == MAP_FAILED) {
            fprintf(stderr, "Could not allocate dynamic translator buffer\n");
            exit(1);
        }
    }
#else
    code_gen_buffer = qemu_malloc(code_gen_buffer_size);
    map_exec(code_gen_buffer, code_gen_buffer_size);
#endif
#endif /* !USE_STATIC_CODE_GEN_BUFFER */
    map_exec(code_gen_prologue, sizeof(code_gen_prologue));
    code_gen_buffer_max_size = code_gen_buffer_size -
        (TCG_MAX_OP_SIZE * OPC_BUF_SIZE);
    code_gen_max_blocks = code_gen_buffer_size / CODE_GEN_AVG_BLOCK_SIZE;
    tbs = qemu_malloc(code_gen_max_blocks * sizeof(TranslationBlock));
}
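
/* Sizing sketch for code_gen_alloc() (the 32 MB figure is just the
   user-mode default above): code_gen_buffer_max_size is the buffer size
   minus room for one worst-case translation (TCG_MAX_OP_SIZE *
   OPC_BUF_SIZE bytes), so a translation that starts below the threshold
   can never run off the end of the mapping, and code_gen_max_blocks is
   the buffer size divided by CODE_GEN_AVG_BLOCK_SIZE, which bounds the
   size of the tbs[] array allocated here. */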

/* Must be called before using the QEMU cpus. 'tb_size' is the size
   (in bytes) allocated to the translation buffer. Zero means default
   size. */
void tcg_exec_init(unsigned long tb_size)
{
    cpu_gen_init();
    code_gen_alloc(tb_size);
    code_gen_ptr = code_gen_buffer;
    page_init();
#if !defined(CONFIG_USER_ONLY) || !defined(CONFIG_USE_GUEST_BASE)
    /* There's no guest base to take into account, so go ahead and
       initialize the prologue now. */
    tcg_prologue_init(&tcg_ctx);
#endif
}

bool tcg_enabled(void)
{
    return code_gen_buffer != NULL;
}

void cpu_exec_init_all(void)
{
#if !defined(CONFIG_USER_ONLY)
    memory_map_init();
    io_mem_init();
#endif
}

#if defined(CPU_SAVE_VERSION) && !defined(CONFIG_USER_ONLY)

static int cpu_common_post_load(void *opaque, int version_id)
{
    CPUState *env = opaque;

    /* 0x01 was CPU_INTERRUPT_EXIT. This line can be removed when the
       version_id is increased. */
    env->interrupt_request &= ~0x01;
    tlb_flush(env, 1);

    return 0;
}

static const VMStateDescription vmstate_cpu_common = {
    .name = "cpu_common",
    .version_id = 1,
    .minimum_version_id = 1,
    .minimum_version_id_old = 1,
    .post_load = cpu_common_post_load,
    .fields = (VMStateField []) {
        VMSTATE_UINT32(halted, CPUState),
        VMSTATE_UINT32(interrupt_request, CPUState),
        VMSTATE_END_OF_LIST()
    }
};
#endif

CPUState *qemu_get_cpu(int cpu)
{
    CPUState *env = first_cpu;

    while (env) {
        if (env->cpu_index == cpu)
            break;
        env = env->next_cpu;
    }

    return env;
}

void cpu_exec_init(CPUState *env)
{
    CPUState **penv;
    int cpu_index;

#if defined(CONFIG_USER_ONLY)
    cpu_list_lock();
#endif
    env->next_cpu = NULL;
    penv = &first_cpu;
    cpu_index = 0;
    while (*penv != NULL) {
        penv = &(*penv)->next_cpu;
        cpu_index++;
    }
    env->cpu_index = cpu_index;
    env->numa_node = 0;
    QTAILQ_INIT(&env->breakpoints);
    QTAILQ_INIT(&env->watchpoints);
#ifndef CONFIG_USER_ONLY
    env->thread_id = qemu_get_thread_id();
#endif
    *penv = env;
#if defined(CONFIG_USER_ONLY)
    cpu_list_unlock();
#endif
#if defined(CPU_SAVE_VERSION) && !defined(CONFIG_USER_ONLY)
    vmstate_register(NULL, cpu_index, &vmstate_cpu_common, env);
    register_savevm(NULL, "cpu", cpu_index, CPU_SAVE_VERSION,
                    cpu_save, cpu_load, env);
#endif
}

/* Allocate a new translation block. Flush the translation buffer if
   too many translation blocks or too much generated code. */
static TranslationBlock *tb_alloc(target_ulong pc)
{
    TranslationBlock *tb;

    if (nb_tbs >= code_gen_max_blocks ||
        (code_gen_ptr - code_gen_buffer) >= code_gen_buffer_max_size)
        return NULL;
    tb = &tbs[nb_tbs++];
    tb->pc = pc;
    tb->cflags = 0;
    return tb;
}

void tb_free(TranslationBlock *tb)
{
    /* In practice this is mostly used for single use temporary TBs.
       Ignore the hard cases and just back up if this TB happens to
       be the last one generated.  */
    if (nb_tbs > 0 && tb == &tbs[nb_tbs - 1]) {
        code_gen_ptr = tb->tc_ptr;
        nb_tbs--;
    }
}
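
/* Usage sketch (hypothetical caller): tb_alloc() and tb_free() are meant
 * to be paired for short-lived blocks, following the same pattern used by
 * tb_gen_code() below:
 *
 *     TranslationBlock *tb = tb_alloc(pc);
 *     if (!tb) {
 *         tb_flush(env);          // make room; invalidates everything
 *         tb = tb_alloc(pc);      // cannot fail right after a flush
 *     }
 *     ...
 *     tb_free(tb);                // only reclaims the most recent block
 */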

static inline void invalidate_page_bitmap(PageDesc *p)
{
    if (p->code_bitmap) {
        qemu_free(p->code_bitmap);
        p->code_bitmap = NULL;
    }
    p->code_write_count = 0;
}

/* Set to NULL all the 'first_tb' fields in all PageDescs. */

static void page_flush_tb_1 (int level, void **lp)
{
    int i;

    if (*lp == NULL) {
        return;
    }
    if (level == 0) {
        PageDesc *pd = *lp;
        for (i = 0; i < L2_SIZE; ++i) {
            pd[i].first_tb = NULL;
            invalidate_page_bitmap(pd + i);
        }
    } else {
        void **pp = *lp;
        for (i = 0; i < L2_SIZE; ++i) {
            page_flush_tb_1 (level - 1, pp + i);
        }
    }
}

static void page_flush_tb(void)
{
    int i;
    for (i = 0; i < V_L1_SIZE; i++) {
        page_flush_tb_1(V_L1_SHIFT / L2_BITS - 1, l1_map + i);
    }
}

/* flush all the translation blocks */
/* XXX: tb_flush is currently not thread safe */
void tb_flush(CPUState *env1)
{
    CPUState *env;
#if defined(DEBUG_FLUSH)
    printf("qemu: flush code_size=%ld nb_tbs=%d avg_tb_size=%ld\n",
           (unsigned long)(code_gen_ptr - code_gen_buffer),
           nb_tbs, nb_tbs > 0 ?
           ((unsigned long)(code_gen_ptr - code_gen_buffer)) / nb_tbs : 0);
#endif
    if ((unsigned long)(code_gen_ptr - code_gen_buffer) > code_gen_buffer_size)
        cpu_abort(env1, "Internal error: code buffer overflow\n");

    nb_tbs = 0;

    for(env = first_cpu; env != NULL; env = env->next_cpu) {
        memset (env->tb_jmp_cache, 0, TB_JMP_CACHE_SIZE * sizeof (void *));
    }

    memset (tb_phys_hash, 0, CODE_GEN_PHYS_HASH_SIZE * sizeof (void *));
    page_flush_tb();

    code_gen_ptr = code_gen_buffer;
    /* XXX: flush processor icache at this point if cache flush is
       expensive */
    tb_flush_count++;
}

#ifdef DEBUG_TB_CHECK

static void tb_invalidate_check(target_ulong address)
{
    TranslationBlock *tb;
    int i;
    address &= TARGET_PAGE_MASK;
    for(i = 0;i < CODE_GEN_PHYS_HASH_SIZE; i++) {
        for(tb = tb_phys_hash[i]; tb != NULL; tb = tb->phys_hash_next) {
            if (!(address + TARGET_PAGE_SIZE <= tb->pc ||
                  address >= tb->pc + tb->size)) {
                printf("ERROR invalidate: address=" TARGET_FMT_lx
                       " PC=%08lx size=%04x\n",
                       address, (long)tb->pc, tb->size);
            }
        }
    }
}

/* verify that all the pages have correct rights for code */
static void tb_page_check(void)
{
    TranslationBlock *tb;
    int i, flags1, flags2;

    for(i = 0;i < CODE_GEN_PHYS_HASH_SIZE; i++) {
        for(tb = tb_phys_hash[i]; tb != NULL; tb = tb->phys_hash_next) {
            flags1 = page_get_flags(tb->pc);
            flags2 = page_get_flags(tb->pc + tb->size - 1);
            if ((flags1 & PAGE_WRITE) || (flags2 & PAGE_WRITE)) {
                printf("ERROR page flags: PC=%08lx size=%04x f1=%x f2=%x\n",
                       (long)tb->pc, tb->size, flags1, flags2);
            }
        }
    }
}

#endif

/* invalidate one TB */
static inline void tb_remove(TranslationBlock **ptb, TranslationBlock *tb,
                             int next_offset)
{
    TranslationBlock *tb1;
    for(;;) {
        tb1 = *ptb;
        if (tb1 == tb) {
            *ptb = *(TranslationBlock **)((char *)tb1 + next_offset);
            break;
        }
        ptb = (TranslationBlock **)((char *)tb1 + next_offset);
    }
}

static inline void tb_page_remove(TranslationBlock **ptb, TranslationBlock *tb)
{
    TranslationBlock *tb1;
    unsigned int n1;

    for(;;) {
        tb1 = *ptb;
        n1 = (long)tb1 & 3;
        tb1 = (TranslationBlock *)((long)tb1 & ~3);
        if (tb1 == tb) {
            *ptb = tb1->page_next[n1];
            break;
        }
        ptb = &tb1->page_next[n1];
    }
}

static inline void tb_jmp_remove(TranslationBlock *tb, int n)
{
    TranslationBlock *tb1, **ptb;
    unsigned int n1;

    ptb = &tb->jmp_next[n];
    tb1 = *ptb;
    if (tb1) {
        /* find tb(n) in circular list */
        for(;;) {
            tb1 = *ptb;
            n1 = (long)tb1 & 3;
            tb1 = (TranslationBlock *)((long)tb1 & ~3);
            if (n1 == n && tb1 == tb)
                break;
            if (n1 == 2) {
                ptb = &tb1->jmp_first;
            } else {
                ptb = &tb1->jmp_next[n1];
            }
        }
        /* now we can suppress tb(n) from the list */
        *ptb = tb->jmp_next[n];

        tb->jmp_next[n] = NULL;
    }
}

/* reset the jump entry 'n' of a TB so that it is not chained to
   another TB */
static inline void tb_reset_jump(TranslationBlock *tb, int n)
{
    tb_set_jmp_target(tb, n, (unsigned long)(tb->tc_ptr + tb->tb_next_offset[n]));
}

void tb_phys_invalidate(TranslationBlock *tb, tb_page_addr_t page_addr)
{
    CPUState *env;
    PageDesc *p;
    unsigned int h, n1;
    tb_page_addr_t phys_pc;
    TranslationBlock *tb1, *tb2;

    /* remove the TB from the hash list */
    phys_pc = tb->page_addr[0] + (tb->pc & ~TARGET_PAGE_MASK);
    h = tb_phys_hash_func(phys_pc);
    tb_remove(&tb_phys_hash[h], tb,
              offsetof(TranslationBlock, phys_hash_next));

    /* remove the TB from the page list */
    if (tb->page_addr[0] != page_addr) {
        p = page_find(tb->page_addr[0] >> TARGET_PAGE_BITS);
        tb_page_remove(&p->first_tb, tb);
        invalidate_page_bitmap(p);
    }
    if (tb->page_addr[1] != -1 && tb->page_addr[1] != page_addr) {
        p = page_find(tb->page_addr[1] >> TARGET_PAGE_BITS);
        tb_page_remove(&p->first_tb, tb);
        invalidate_page_bitmap(p);
    }

    tb_invalidated_flag = 1;

    /* remove the TB from the hash list */
    h = tb_jmp_cache_hash_func(tb->pc);
    for(env = first_cpu; env != NULL; env = env->next_cpu) {
        if (env->tb_jmp_cache[h] == tb)
            env->tb_jmp_cache[h] = NULL;
    }

    /* suppress this TB from the two jump lists */
    tb_jmp_remove(tb, 0);
    tb_jmp_remove(tb, 1);

    /* suppress any remaining jumps to this TB */
    tb1 = tb->jmp_first;
    for(;;) {
        n1 = (long)tb1 & 3;
        if (n1 == 2)
            break;
        tb1 = (TranslationBlock *)((long)tb1 & ~3);
        tb2 = tb1->jmp_next[n1];
        tb_reset_jump(tb1, n1);
        tb1->jmp_next[n1] = NULL;
        tb1 = tb2;
    }
    tb->jmp_first = (TranslationBlock *)((long)tb | 2); /* fail safe */

    tb_phys_invalidate_count++;
}

static inline void set_bits(uint8_t *tab, int start, int len)
{
    int end, mask, end1;

    end = start + len;
    tab += start >> 3;
    mask = 0xff << (start & 7);
    if ((start & ~7) == (end & ~7)) {
        if (start < end) {
            mask &= ~(0xff << (end & 7));
            *tab |= mask;
        }
    } else {
        *tab++ |= mask;
        start = (start + 8) & ~7;
        end1 = end & ~7;
        while (start < end1) {
            *tab++ = 0xff;
            start += 8;
        }
        if (start < end) {
            mask = ~(0xff << (end & 7));
            *tab |= mask;
        }
    }
}
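
/* Worked example for set_bits(): set_bits(bitmap, 5, 6) marks bits 5..10.
   start and end (11) fall in different bytes, so the first byte is OR-ed
   with 0xff << 5 = 0xe0 (bits 5-7), no full 0xff bytes are written because
   end & ~7 == 8, and the last byte is OR-ed with ~(0xff << 3) = 0x07,
   i.e. bits 8-10 of the overall bitmap. */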

static void build_page_bitmap(PageDesc *p)
{
    int n, tb_start, tb_end;
    TranslationBlock *tb;

    p->code_bitmap = qemu_mallocz(TARGET_PAGE_SIZE / 8);

    tb = p->first_tb;
    while (tb != NULL) {
        n = (long)tb & 3;
        tb = (TranslationBlock *)((long)tb & ~3);
        /* NOTE: this is subtle as a TB may span two physical pages */
        if (n == 0) {
            /* NOTE: tb_end may be after the end of the page, but
               it is not a problem */
            tb_start = tb->pc & ~TARGET_PAGE_MASK;
            tb_end = tb_start + tb->size;
            if (tb_end > TARGET_PAGE_SIZE)
                tb_end = TARGET_PAGE_SIZE;
        } else {
            tb_start = 0;
            tb_end = ((tb->pc + tb->size) & ~TARGET_PAGE_MASK);
        }
        set_bits(p->code_bitmap, tb_start, tb_end - tb_start);
        tb = tb->page_next[n];
    }
}

TranslationBlock *tb_gen_code(CPUState *env,
                              target_ulong pc, target_ulong cs_base,
                              int flags, int cflags)
{
    TranslationBlock *tb;
    uint8_t *tc_ptr;
    tb_page_addr_t phys_pc, phys_page2;
    target_ulong virt_page2;
    int code_gen_size;

    phys_pc = get_page_addr_code(env, pc);
    tb = tb_alloc(pc);
    if (!tb) {
        /* flush must be done */
        tb_flush(env);
        /* cannot fail at this point */
        tb = tb_alloc(pc);
        /* Don't forget to invalidate previous TB info. */
        tb_invalidated_flag = 1;
    }
    tc_ptr = code_gen_ptr;
    tb->tc_ptr = tc_ptr;
    tb->cs_base = cs_base;
    tb->flags = flags;
    tb->cflags = cflags;
    cpu_gen_code(env, tb, &code_gen_size);
    code_gen_ptr = (void *)(((unsigned long)code_gen_ptr + code_gen_size + CODE_GEN_ALIGN - 1) & ~(CODE_GEN_ALIGN - 1));

    /* check next page if needed */
    virt_page2 = (pc + tb->size - 1) & TARGET_PAGE_MASK;
    phys_page2 = -1;
    if ((pc & TARGET_PAGE_MASK) != virt_page2) {
        phys_page2 = get_page_addr_code(env, virt_page2);
    }
    tb_link_page(tb, phys_pc, phys_page2);
    return tb;
}
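
/* Page-crossing note for tb_gen_code(): if the guest code of the block
   spills past its first page (e.g. a block starting a few bytes before a
   TARGET_PAGE_SIZE boundary), virt_page2 differs from the start page and
   phys_page2 is resolved as well, so tb_link_page() registers the TB on
   both physical pages and invalidating either page will kill it. */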

/* invalidate all TBs which intersect with the target physical page
   starting in range [start;end[. NOTE: start and end must refer to
   the same physical page. 'is_cpu_write_access' should be true if called
   from a real cpu write access: the virtual CPU will exit the current
   TB if code is modified inside this TB. */
void tb_invalidate_phys_page_range(tb_page_addr_t start, tb_page_addr_t end,
                                   int is_cpu_write_access)
{
    TranslationBlock *tb, *tb_next, *saved_tb;
    CPUState *env = cpu_single_env;
    tb_page_addr_t tb_start, tb_end;
    PageDesc *p;
    int n;
#ifdef TARGET_HAS_PRECISE_SMC
    int current_tb_not_found = is_cpu_write_access;
    TranslationBlock *current_tb = NULL;
    int current_tb_modified = 0;
    target_ulong current_pc = 0;
    target_ulong current_cs_base = 0;
    int current_flags = 0;
#endif /* TARGET_HAS_PRECISE_SMC */

    p = page_find(start >> TARGET_PAGE_BITS);
    if (!p)
        return;
    if (!p->code_bitmap &&
        ++p->code_write_count >= SMC_BITMAP_USE_THRESHOLD &&
        is_cpu_write_access) {
        /* build code bitmap */
        build_page_bitmap(p);
    }

    /* we remove all the TBs in the range [start, end[ */
    /* XXX: see if in some cases it could be faster to invalidate all the code */
    tb = p->first_tb;
    while (tb != NULL) {
        n = (long)tb & 3;
        tb = (TranslationBlock *)((long)tb & ~3);
        tb_next = tb->page_next[n];
        /* NOTE: this is subtle as a TB may span two physical pages */
        if (n == 0) {
            /* NOTE: tb_end may be after the end of the page, but
               it is not a problem */
            tb_start = tb->page_addr[0] + (tb->pc & ~TARGET_PAGE_MASK);
            tb_end = tb_start + tb->size;
        } else {
            tb_start = tb->page_addr[1];
            tb_end = tb_start + ((tb->pc + tb->size) & ~TARGET_PAGE_MASK);
        }
        if (!(tb_end <= start || tb_start >= end)) {
#ifdef TARGET_HAS_PRECISE_SMC
            if (current_tb_not_found) {
                current_tb_not_found = 0;
                current_tb = NULL;
                if (env->mem_io_pc) {
                    /* now we have a real cpu fault */
                    current_tb = tb_find_pc(env->mem_io_pc);
                }
            }
            if (current_tb == tb &&
                (current_tb->cflags & CF_COUNT_MASK) != 1) {
                /* If we are modifying the current TB, we must stop
                   its execution. We could be more precise by checking
                   that the modification is after the current PC, but it
                   would require a specialized function to partially
                   restore the CPU state */

                current_tb_modified = 1;
                cpu_restore_state(current_tb, env, env->mem_io_pc);
                cpu_get_tb_cpu_state(env, &current_pc, &current_cs_base,
                                     &current_flags);
            }
#endif /* TARGET_HAS_PRECISE_SMC */
            /* we need to do that to handle the case where a signal
               occurs while doing tb_phys_invalidate() */
            saved_tb = NULL;
            if (env) {
                saved_tb = env->current_tb;
                env->current_tb = NULL;
            }
            tb_phys_invalidate(tb, -1);
            if (env) {
                env->current_tb = saved_tb;
                if (env->interrupt_request && env->current_tb)
                    cpu_interrupt(env, env->interrupt_request);
            }
        }
        tb = tb_next;
    }
#if !defined(CONFIG_USER_ONLY)
    /* if no code remaining, no need to continue to use slow writes */
    if (!p->first_tb) {
        invalidate_page_bitmap(p);
        if (is_cpu_write_access) {
            tlb_unprotect_code_phys(env, start, env->mem_io_vaddr);
        }
    }
#endif
#ifdef TARGET_HAS_PRECISE_SMC
    if (current_tb_modified) {
        /* we generate a block containing just the instruction
           modifying the memory. It will ensure that it cannot modify
           itself */
        env->current_tb = NULL;
        tb_gen_code(env, current_pc, current_cs_base, current_flags, 1);
        cpu_resume_from_signal(env, NULL);
    }
#endif
}

/* len must be <= 8 and start must be a multiple of len */
static inline void tb_invalidate_phys_page_fast(tb_page_addr_t start, int len)
{
    PageDesc *p;
    int offset, b;
#if 0
    if (1) {
        qemu_log("modifying code at 0x%x size=%d EIP=%x PC=%08x\n",
                  cpu_single_env->mem_io_vaddr, len,
                  cpu_single_env->eip,
                  cpu_single_env->eip + (long)cpu_single_env->segs[R_CS].base);
    }
#endif
    p = page_find(start >> TARGET_PAGE_BITS);
    if (!p)
        return;
    if (p->code_bitmap) {
        offset = start & ~TARGET_PAGE_MASK;
        b = p->code_bitmap[offset >> 3] >> (offset & 7);
        if (b & ((1 << len) - 1))
            goto do_invalidate;
    } else {
    do_invalidate:
        tb_invalidate_phys_page_range(start, start + len, 1);
    }
}

#if !defined(CONFIG_SOFTMMU)
static void tb_invalidate_phys_page(tb_page_addr_t addr,
                                    unsigned long pc, void *puc)
{
    TranslationBlock *tb;
    PageDesc *p;
    int n;
#ifdef TARGET_HAS_PRECISE_SMC
    TranslationBlock *current_tb = NULL;
    CPUState *env = cpu_single_env;
    int current_tb_modified = 0;
    target_ulong current_pc = 0;
    target_ulong current_cs_base = 0;
    int current_flags = 0;
#endif

    addr &= TARGET_PAGE_MASK;
    p = page_find(addr >> TARGET_PAGE_BITS);
    if (!p)
        return;
    tb = p->first_tb;
#ifdef TARGET_HAS_PRECISE_SMC
    if (tb && pc != 0) {
        current_tb = tb_find_pc(pc);
    }
#endif
    while (tb != NULL) {
        n = (long)tb & 3;
        tb = (TranslationBlock *)((long)tb & ~3);
#ifdef TARGET_HAS_PRECISE_SMC
        if (current_tb == tb &&
            (current_tb->cflags & CF_COUNT_MASK) != 1) {
            /* If we are modifying the current TB, we must stop
               its execution. We could be more precise by checking
               that the modification is after the current PC, but it
               would require a specialized function to partially
               restore the CPU state */

            current_tb_modified = 1;
            cpu_restore_state(current_tb, env, pc);
            cpu_get_tb_cpu_state(env, &current_pc, &current_cs_base,
                                 &current_flags);
        }
#endif /* TARGET_HAS_PRECISE_SMC */
        tb_phys_invalidate(tb, addr);
        tb = tb->page_next[n];
    }
    p->first_tb = NULL;
#ifdef TARGET_HAS_PRECISE_SMC
    if (current_tb_modified) {
        /* we generate a block containing just the instruction
           modifying the memory. It will ensure that it cannot modify
           itself */
        env->current_tb = NULL;
        tb_gen_code(env, current_pc, current_cs_base, current_flags, 1);
        cpu_resume_from_signal(env, puc);
    }
#endif
}
#endif

/* add the tb in the target page and protect it if necessary */
static inline void tb_alloc_page(TranslationBlock *tb,
                                 unsigned int n, tb_page_addr_t page_addr)
{
    PageDesc *p;
#ifndef CONFIG_USER_ONLY
    bool page_already_protected;
#endif

    tb->page_addr[n] = page_addr;
    p = page_find_alloc(page_addr >> TARGET_PAGE_BITS, 1);
    tb->page_next[n] = p->first_tb;
#ifndef CONFIG_USER_ONLY
    page_already_protected = p->first_tb != NULL;
#endif
    p->first_tb = (TranslationBlock *)((long)tb | n);
    invalidate_page_bitmap(p);

#if defined(TARGET_HAS_SMC) || 1

#if defined(CONFIG_USER_ONLY)
    if (p->flags & PAGE_WRITE) {
        target_ulong addr;
        PageDesc *p2;
        int prot;

        /* force the host page as non writable (writes will have a
           page fault + mprotect overhead) */
        page_addr &= qemu_host_page_mask;
        prot = 0;
        for(addr = page_addr; addr < page_addr + qemu_host_page_size;
            addr += TARGET_PAGE_SIZE) {

            p2 = page_find (addr >> TARGET_PAGE_BITS);
            if (!p2)
                continue;
            prot |= p2->flags;
            p2->flags &= ~PAGE_WRITE;
        }
        mprotect(g2h(page_addr), qemu_host_page_size,
                 (prot & PAGE_BITS) & ~PAGE_WRITE);
#ifdef DEBUG_TB_INVALIDATE
        printf("protecting code page: 0x" TARGET_FMT_lx "\n",
               page_addr);
#endif
    }
#else
    /* if some code is already present, then the pages are already
       protected. So we handle the case where only the first TB is
       allocated in a physical page */
    if (!page_already_protected) {
        tlb_protect_code(page_addr);
    }
#endif

#endif /* TARGET_HAS_SMC */
}

/* add a new TB and link it to the physical page tables. phys_page2 is
   (-1) to indicate that only one page contains the TB. */
void tb_link_page(TranslationBlock *tb,
                  tb_page_addr_t phys_pc, tb_page_addr_t phys_page2)
{
    unsigned int h;
    TranslationBlock **ptb;

    /* Grab the mmap lock to stop another thread invalidating this TB
       before we are done.  */
    mmap_lock();
    /* add in the physical hash table */
    h = tb_phys_hash_func(phys_pc);
    ptb = &tb_phys_hash[h];
    tb->phys_hash_next = *ptb;
    *ptb = tb;

    /* add in the page list */
    tb_alloc_page(tb, 0, phys_pc & TARGET_PAGE_MASK);
    if (phys_page2 != -1)
        tb_alloc_page(tb, 1, phys_page2);
    else
        tb->page_addr[1] = -1;

    tb->jmp_first = (TranslationBlock *)((long)tb | 2);
    tb->jmp_next[0] = NULL;
    tb->jmp_next[1] = NULL;

    /* init original jump addresses */
    if (tb->tb_next_offset[0] != 0xffff)
        tb_reset_jump(tb, 0);
    if (tb->tb_next_offset[1] != 0xffff)
        tb_reset_jump(tb, 1);

#ifdef DEBUG_TB_CHECK
    tb_page_check();
#endif
    mmap_unlock();
}
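
/* Concurrency note: tb_link_page() publishes the TB in tb_phys_hash and in
   the per-page lists while holding mmap_lock(), so a concurrent
   invalidation cannot observe a half-linked block; in system mode the
   mmap_lock()/mmap_unlock() macros defined earlier in this file are empty,
   so the call is effectively a no-op there. */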

/* find the TB 'tb' such that tb[0].tc_ptr <= tc_ptr <
   tb[1].tc_ptr. Return NULL if not found */
TranslationBlock *tb_find_pc(unsigned long tc_ptr)
{
    int m_min, m_max, m;
    unsigned long v;
    TranslationBlock *tb;

    if (nb_tbs <= 0)
        return NULL;
    if (tc_ptr < (unsigned long)code_gen_buffer ||
        tc_ptr >= (unsigned long)code_gen_ptr)
        return NULL;
    /* binary search (cf Knuth) */
    m_min = 0;
    m_max = nb_tbs - 1;
    while (m_min <= m_max) {
        m = (m_min + m_max) >> 1;
        tb = &tbs[m];
        v = (unsigned long)tb->tc_ptr;
        if (v == tc_ptr)
            return tb;
        else if (tc_ptr < v) {
            m_max = m - 1;
        } else {
            m_min = m + 1;
        }
    }
    return &tbs[m_max];
}
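
/* Search invariant for tb_find_pc(): tbs[] is filled in the order blocks
   are generated and code_gen_ptr only grows between flushes, so tc_ptr
   values are sorted by construction.  When the loop above exits without an
   exact hit, m_max indexes the last block whose tc_ptr lies below the
   searched host address, i.e. the block that contains it. */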

static void tb_reset_jump_recursive(TranslationBlock *tb);

static inline void tb_reset_jump_recursive2(TranslationBlock *tb, int n)
{
    TranslationBlock *tb1, *tb_next, **ptb;
    unsigned int n1;

    tb1 = tb->jmp_next[n];
    if (tb1 != NULL) {
        /* find head of list */
        for(;;) {
            n1 = (long)tb1 & 3;
            tb1 = (TranslationBlock *)((long)tb1 & ~3);
            if (n1 == 2)
                break;
            tb1 = tb1->jmp_next[n1];
        }
        /* we are now sure that tb jumps to tb1 */
        tb_next = tb1;

        /* remove tb from the jmp_first list */
        ptb = &tb_next->jmp_first;
        for(;;) {
            tb1 = *ptb;
            n1 = (long)tb1 & 3;
            tb1 = (TranslationBlock *)((long)tb1 & ~3);
            if (n1 == n && tb1 == tb)
                break;
            ptb = &tb1->jmp_next[n1];
        }
        *ptb = tb->jmp_next[n];
        tb->jmp_next[n] = NULL;

        /* suppress the jump to next tb in generated code */
        tb_reset_jump(tb, n);

        /* suppress jumps in the tb on which we could have jumped */
        tb_reset_jump_recursive(tb_next);
    }
}

static void tb_reset_jump_recursive(TranslationBlock *tb)
{
    tb_reset_jump_recursive2(tb, 0);
    tb_reset_jump_recursive2(tb, 1);
}

#if defined(TARGET_HAS_ICE)
#if defined(CONFIG_USER_ONLY)
static void breakpoint_invalidate(CPUState *env, target_ulong pc)
{
    tb_invalidate_phys_page_range(pc, pc + 1, 0);
}
#else
static void breakpoint_invalidate(CPUState *env, target_ulong pc)
{
    target_phys_addr_t addr;
    target_ulong pd;
    ram_addr_t ram_addr;
    PhysPageDesc *p;

    addr = cpu_get_phys_page_debug(env, pc);
    p = phys_page_find(addr >> TARGET_PAGE_BITS);
    if (!p) {
        pd = IO_MEM_UNASSIGNED;
    } else {
        pd = p->phys_offset;
    }
    ram_addr = (pd & TARGET_PAGE_MASK) | (pc & ~TARGET_PAGE_MASK);
    tb_invalidate_phys_page_range(ram_addr, ram_addr + 1, 0);
}
#endif
#endif /* TARGET_HAS_ICE */

#if defined(CONFIG_USER_ONLY)
void cpu_watchpoint_remove_all(CPUState *env, int mask)
{
}

int cpu_watchpoint_insert(CPUState *env, target_ulong addr, target_ulong len,
                          int flags, CPUWatchpoint **watchpoint)
{
    return -ENOSYS;
}
#else
/* Add a watchpoint.  */
int cpu_watchpoint_insert(CPUState *env, target_ulong addr, target_ulong len,
                          int flags, CPUWatchpoint **watchpoint)
{
    target_ulong len_mask = ~(len - 1);
    CPUWatchpoint *wp;

    /* sanity checks: allow power-of-2 lengths, deny unaligned watchpoints */
    if ((len != 1 && len != 2 && len != 4 && len != 8) || (addr & ~len_mask)) {
        fprintf(stderr, "qemu: tried to set invalid watchpoint at "
                TARGET_FMT_lx ", len=" TARGET_FMT_lu "\n", addr, len);
        return -EINVAL;
    }
    wp = qemu_malloc(sizeof(*wp));

    wp->vaddr = addr;
    wp->len_mask = len_mask;
    wp->flags = flags;

    /* keep all GDB-injected watchpoints in front */
    if (flags & BP_GDB)
        QTAILQ_INSERT_HEAD(&env->watchpoints, wp, entry);
    else
        QTAILQ_INSERT_TAIL(&env->watchpoints, wp, entry);

    tlb_flush_page(env, addr);

    if (watchpoint)
        *watchpoint = wp;
    return 0;
}
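
/* Usage sketch (hypothetical values): a debugger front end watching a
 * 4-byte, naturally aligned guest variable would do something like
 *
 *     CPUWatchpoint *wp;
 *     if (cpu_watchpoint_insert(env, addr, 4, BP_GDB, &wp) < 0) {
 *         // unsupported length or misaligned address
 *     }
 *
 * and later drop it with cpu_watchpoint_remove_by_ref(env, wp) or
 * cpu_watchpoint_remove(env, addr, 4, BP_GDB). */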

/* Remove a specific watchpoint.  */
int cpu_watchpoint_remove(CPUState *env, target_ulong addr, target_ulong len,
                          int flags)
{
    target_ulong len_mask = ~(len - 1);
    CPUWatchpoint *wp;

    QTAILQ_FOREACH(wp, &env->watchpoints, entry) {
        if (addr == wp->vaddr && len_mask == wp->len_mask
                && flags == (wp->flags & ~BP_WATCHPOINT_HIT)) {
            cpu_watchpoint_remove_by_ref(env, wp);
            return 0;
        }
    }
    return -ENOENT;
}

/* Remove a specific watchpoint by reference.  */
void cpu_watchpoint_remove_by_ref(CPUState *env, CPUWatchpoint *watchpoint)
{
    QTAILQ_REMOVE(&env->watchpoints, watchpoint, entry);

    tlb_flush_page(env, watchpoint->vaddr);

    qemu_free(watchpoint);
}

/* Remove all matching watchpoints.  */
void cpu_watchpoint_remove_all(CPUState *env, int mask)
{
    CPUWatchpoint *wp, *next;

    QTAILQ_FOREACH_SAFE(wp, &env->watchpoints, entry, next) {
        if (wp->flags & mask)
            cpu_watchpoint_remove_by_ref(env, wp);
    }
}
#endif

/* Add a breakpoint.  */
int cpu_breakpoint_insert(CPUState *env, target_ulong pc, int flags,
                          CPUBreakpoint **breakpoint)
{
#if defined(TARGET_HAS_ICE)
    CPUBreakpoint *bp;

    bp = qemu_malloc(sizeof(*bp));

    bp->pc = pc;
    bp->flags = flags;

    /* keep all GDB-injected breakpoints in front */
    if (flags & BP_GDB)
        QTAILQ_INSERT_HEAD(&env->breakpoints, bp, entry);
    else
        QTAILQ_INSERT_TAIL(&env->breakpoints, bp, entry);

    breakpoint_invalidate(env, pc);

    if (breakpoint)
        *breakpoint = bp;
    return 0;
#else
    return -ENOSYS;
#endif
}
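
/* Usage sketch (hypothetical caller): gdbstub-style code typically keeps
 * the returned handle only when it needs selective removal, e.g.
 *
 *     CPUBreakpoint *bp;
 *     if (cpu_breakpoint_insert(env, pc, BP_GDB, &bp) == 0) {
 *         ...
 *         cpu_breakpoint_remove_by_ref(env, bp);
 *     }
 *
 * On targets without TARGET_HAS_ICE, insert and cpu_breakpoint_remove()
 * simply return -ENOSYS. */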

/* Remove a specific breakpoint.  */
int cpu_breakpoint_remove(CPUState *env, target_ulong pc, int flags)
{
#if defined(TARGET_HAS_ICE)
    CPUBreakpoint *bp;

    QTAILQ_FOREACH(bp, &env->breakpoints, entry) {
        if (bp->pc == pc && bp->flags == flags) {
            cpu_breakpoint_remove_by_ref(env, bp);
            return 0;
        }
    }
    return -ENOENT;
#else
    return -ENOSYS;
#endif
}

/* Remove a specific breakpoint by reference.  */
void cpu_breakpoint_remove_by_ref(CPUState *env, CPUBreakpoint *breakpoint)
{
#if defined(TARGET_HAS_ICE)
    QTAILQ_REMOVE(&env->breakpoints, breakpoint, entry);

    breakpoint_invalidate(env, breakpoint->pc);

    qemu_free(breakpoint);
#endif
}

/* Remove all matching breakpoints. */
void cpu_breakpoint_remove_all(CPUState *env, int mask)
{
#if defined(TARGET_HAS_ICE)
    CPUBreakpoint *bp, *next;

    QTAILQ_FOREACH_SAFE(bp, &env->breakpoints, entry, next) {
        if (bp->flags & mask)
            cpu_breakpoint_remove_by_ref(env, bp);
    }
#endif
}

/* enable or disable single step mode. EXCP_DEBUG is returned by the
   CPU loop after each instruction */
void cpu_single_step(CPUState *env, int enabled)
{
#if defined(TARGET_HAS_ICE)
    if (env->singlestep_enabled != enabled) {
        env->singlestep_enabled = enabled;
        if (kvm_enabled())
            kvm_update_guest_debug(env, 0);
        else {
            /* must flush all the translated code to avoid inconsistencies */
            /* XXX: only flush what is necessary */
            tb_flush(env);
        }
    }
#endif
}

/* enable or disable low levels log */
void cpu_set_log(int log_flags)
{
    loglevel = log_flags;
    if (loglevel && !logfile) {
        logfile = fopen(logfilename, log_append ? "a" : "w");
        if (!logfile) {
            perror(logfilename);
            _exit(1);
        }
#if !defined(CONFIG_SOFTMMU)
        /* must avoid mmap() usage of glibc by setting a buffer "by hand" */
        {
            static char logfile_buf[4096];
            setvbuf(logfile, logfile_buf, _IOLBF, sizeof(logfile_buf));
        }
#elif !defined(_WIN32)
        /* Win32 doesn't support line-buffering and requires size >= 2 */
        setvbuf(logfile, NULL, _IOLBF, 0);
#endif
        log_append = 1;
    }
    if (!loglevel && logfile) {
        fclose(logfile);
        logfile = NULL;
    }
}

void cpu_set_log_filename(const char *filename)
{
    logfilename = strdup(filename);
    if (logfile) {
        fclose(logfile);
        logfile = NULL;
    }
    cpu_set_log(loglevel);
}
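
/* Usage sketch: the expected call order is filename first, then flags, e.g.
 *
 *     cpu_set_log_filename("/tmp/qemu.log");
 *     cpu_set_log(cpu_str_to_log_mask("in_asm,op"));
 *
 * cpu_set_log_filename() closes any open log and re-applies the current
 * loglevel, so changing the file at runtime also works.  (The mask string
 * parser is defined further below.) */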
c33a346e 1634
3098dba0 1635static void cpu_unlink_tb(CPUState *env)
ea041c0e 1636{
3098dba0
AJ
1637 /* FIXME: TB unchaining isn't SMP safe. For now just ignore the
1638 problem and hope the cpu will stop of its own accord. For userspace
1639 emulation this often isn't actually as bad as it sounds. Often
1640 signals are used primarily to interrupt blocking syscalls. */
ea041c0e 1641 TranslationBlock *tb;
c227f099 1642 static spinlock_t interrupt_lock = SPIN_LOCK_UNLOCKED;
59817ccb 1643
cab1b4bd 1644 spin_lock(&interrupt_lock);
3098dba0
AJ
1645 tb = env->current_tb;
1646 /* if the cpu is currently executing code, we must unlink it and
1647 all the potentially executing TB */
f76cfe56 1648 if (tb) {
3098dba0
AJ
1649 env->current_tb = NULL;
1650 tb_reset_jump_recursive(tb);
be214e6c 1651 }
cab1b4bd 1652 spin_unlock(&interrupt_lock);
3098dba0
AJ
1653}
1654
97ffbd8d 1655#ifndef CONFIG_USER_ONLY
3098dba0 1656/* mask must never be zero, except for A20 change call */
ec6959d0 1657static void tcg_handle_interrupt(CPUState *env, int mask)
3098dba0
AJ
1658{
1659 int old_mask;
be214e6c 1660
2e70f6ef 1661 old_mask = env->interrupt_request;
68a79315 1662 env->interrupt_request |= mask;
3098dba0 1663
8edac960
AL
1664 /*
1665 * If called from iothread context, wake the target cpu in
1666 * case its halted.
1667 */
b7680cb6 1668 if (!qemu_cpu_is_self(env)) {
8edac960
AL
1669 qemu_cpu_kick(env);
1670 return;
1671 }
8edac960 1672
2e70f6ef 1673 if (use_icount) {
266910c4 1674 env->icount_decr.u16.high = 0xffff;
2e70f6ef 1675 if (!can_do_io(env)
be214e6c 1676 && (mask & ~old_mask) != 0) {
2e70f6ef
PB
1677 cpu_abort(env, "Raised interrupt while not in I/O function");
1678 }
2e70f6ef 1679 } else {
3098dba0 1680 cpu_unlink_tb(env);
ea041c0e
FB
1681 }
1682}
1683
ec6959d0
JK
1684CPUInterruptHandler cpu_interrupt_handler = tcg_handle_interrupt;
1685
97ffbd8d
JK
1686#else /* CONFIG_USER_ONLY */
1687
1688void cpu_interrupt(CPUState *env, int mask)
1689{
1690 env->interrupt_request |= mask;
1691 cpu_unlink_tb(env);
1692}
1693#endif /* CONFIG_USER_ONLY */
1694
b54ad049
FB
1695void cpu_reset_interrupt(CPUState *env, int mask)
1696{
1697 env->interrupt_request &= ~mask;
1698}
1699
3098dba0
AJ
1700void cpu_exit(CPUState *env)
1701{
1702 env->exit_request = 1;
1703 cpu_unlink_tb(env);
1704}
1705
c7cd6a37 1706const CPULogItem cpu_log_items[] = {
5fafdf24 1707 { CPU_LOG_TB_OUT_ASM, "out_asm",
f193c797
FB
1708 "show generated host assembly code for each compiled TB" },
1709 { CPU_LOG_TB_IN_ASM, "in_asm",
1710 "show target assembly code for each compiled TB" },
5fafdf24 1711 { CPU_LOG_TB_OP, "op",
57fec1fe 1712 "show micro ops for each compiled TB" },
f193c797 1713 { CPU_LOG_TB_OP_OPT, "op_opt",
e01a1157
BS
1714 "show micro ops "
1715#ifdef TARGET_I386
1716 "before eflags optimization and "
f193c797 1717#endif
e01a1157 1718 "after liveness analysis" },
f193c797
FB
1719 { CPU_LOG_INT, "int",
1720 "show interrupts/exceptions in short format" },
1721 { CPU_LOG_EXEC, "exec",
1722 "show trace before each executed TB (lots of logs)" },
9fddaa0c 1723 { CPU_LOG_TB_CPU, "cpu",
e91c8a77 1724 "show CPU state before block translation" },
f193c797
FB
1725#ifdef TARGET_I386
1726 { CPU_LOG_PCALL, "pcall",
1727 "show protected mode far calls/returns/exceptions" },
eca1bdf4
AL
1728 { CPU_LOG_RESET, "cpu_reset",
1729 "show CPU state before CPU resets" },
f193c797 1730#endif
8e3a9fd2 1731#ifdef DEBUG_IOPORT
fd872598
FB
1732 { CPU_LOG_IOPORT, "ioport",
1733 "show all i/o ports accesses" },
8e3a9fd2 1734#endif
f193c797
FB
1735 { 0, NULL, NULL },
1736};
1737
f6f3fbca
MT
1738#ifndef CONFIG_USER_ONLY
1739static QLIST_HEAD(memory_client_list, CPUPhysMemoryClient) memory_client_list
1740 = QLIST_HEAD_INITIALIZER(memory_client_list);
1741
1742static void cpu_notify_set_memory(target_phys_addr_t start_addr,
9742bf26 1743 ram_addr_t size,
0fd542fb
MT
1744 ram_addr_t phys_offset,
1745 bool log_dirty)
f6f3fbca
MT
1746{
1747 CPUPhysMemoryClient *client;
1748 QLIST_FOREACH(client, &memory_client_list, list) {
0fd542fb 1749 client->set_memory(client, start_addr, size, phys_offset, log_dirty);
f6f3fbca
MT
1750 }
1751}
1752
1753static int cpu_notify_sync_dirty_bitmap(target_phys_addr_t start,
9742bf26 1754 target_phys_addr_t end)
f6f3fbca
MT
1755{
1756 CPUPhysMemoryClient *client;
1757 QLIST_FOREACH(client, &memory_client_list, list) {
1758 int r = client->sync_dirty_bitmap(client, start, end);
1759 if (r < 0)
1760 return r;
1761 }
1762 return 0;
1763}
1764
1765static int cpu_notify_migration_log(int enable)
1766{
1767 CPUPhysMemoryClient *client;
1768 QLIST_FOREACH(client, &memory_client_list, list) {
1769 int r = client->migration_log(client, enable);
1770 if (r < 0)
1771 return r;
1772 }
1773 return 0;
1774}
1775
2173a75f
AW
1776struct last_map {
1777 target_phys_addr_t start_addr;
1778 ram_addr_t size;
1779 ram_addr_t phys_offset;
1780};
1781
8d4c78e7
AW
1782/* The l1_phys_map provides the upper P_L1_BITs of the guest physical
1783 * address. Each intermediate table provides the next L2_BITs of guest
1784 physical address space. The number of levels varies based on host and
1785 * guest configuration, making it efficient to build the final guest
1786 * physical address by seeding the L1 offset and shifting and adding in
1787 * each L2 offset as we recurse through them. */
2173a75f
AW
1788static void phys_page_for_each_1(CPUPhysMemoryClient *client, int level,
1789 void **lp, target_phys_addr_t addr,
1790 struct last_map *map)
f6f3fbca 1791{
5cd2c5b6 1792 int i;
f6f3fbca 1793
5cd2c5b6
RH
1794 if (*lp == NULL) {
1795 return;
1796 }
1797 if (level == 0) {
1798 PhysPageDesc *pd = *lp;
8d4c78e7 1799 addr <<= L2_BITS + TARGET_PAGE_BITS;
7296abac 1800 for (i = 0; i < L2_SIZE; ++i) {
5cd2c5b6 1801 if (pd[i].phys_offset != IO_MEM_UNASSIGNED) {
2173a75f
AW
1802 target_phys_addr_t start_addr = addr | i << TARGET_PAGE_BITS;
1803
1804 if (map->size &&
1805 start_addr == map->start_addr + map->size &&
1806 pd[i].phys_offset == map->phys_offset + map->size) {
1807
1808 map->size += TARGET_PAGE_SIZE;
1809 continue;
1810 } else if (map->size) {
1811 client->set_memory(client, map->start_addr,
1812 map->size, map->phys_offset, false);
1813 }
1814
1815 map->start_addr = start_addr;
1816 map->size = TARGET_PAGE_SIZE;
1817 map->phys_offset = pd[i].phys_offset;
f6f3fbca 1818 }
5cd2c5b6
RH
1819 }
1820 } else {
1821 void **pp = *lp;
7296abac 1822 for (i = 0; i < L2_SIZE; ++i) {
8d4c78e7 1823 phys_page_for_each_1(client, level - 1, pp + i,
2173a75f 1824 (addr << L2_BITS) | i, map);
f6f3fbca
MT
1825 }
1826 }
1827}
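/* Illustrative sketch, not part of exec.c: how a guest physical address can
 * be rebuilt while recursing through a multi-level table, in the spirit of
 * the "seed the L1 index, then shift in each L2 index" scheme described
 * above for phys_page_for_each_1().  The level widths and page size below
 * are made-up example values, not the ones QEMU derives at build time. */
#include <stdio.h>

#define EX_PAGE_BITS 12                 /* assumed 4 KiB pages */
#define EX_L2_BITS   10                 /* assumed 1024 entries per level */

int main(void)
{
    /* Pretend the walk visited L1 slot 1, then L2 slots 2 and 3. */
    unsigned long long addr = 1;                 /* seeded with the L1 index */
    addr = (addr << EX_L2_BITS) | 2;             /* descend one level */
    addr = (addr << EX_L2_BITS) | 3;             /* reach the leaf level */
    addr <<= EX_PAGE_BITS;                       /* leaf entries cover whole pages */
    printf("reconstructed guest physical address: 0x%llx\n", addr);
    return 0;
}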
1828
1829static void phys_page_for_each(CPUPhysMemoryClient *client)
1830{
5cd2c5b6 1831 int i;
2173a75f
AW
1832 struct last_map map = { };
1833
5cd2c5b6
RH
1834 for (i = 0; i < P_L1_SIZE; ++i) {
1835 phys_page_for_each_1(client, P_L1_SHIFT / L2_BITS - 1,
2173a75f
AW
1836 l1_phys_map + i, i, &map);
1837 }
1838 if (map.size) {
1839 client->set_memory(client, map.start_addr, map.size, map.phys_offset,
1840 false);
f6f3fbca 1841 }
f6f3fbca
MT
1842}
1843
1844void cpu_register_phys_memory_client(CPUPhysMemoryClient *client)
1845{
1846 QLIST_INSERT_HEAD(&memory_client_list, client, list);
1847 phys_page_for_each(client);
1848}
1849
1850void cpu_unregister_phys_memory_client(CPUPhysMemoryClient *client)
1851{
1852 QLIST_REMOVE(client, list);
1853}
1854#endif
1855
f193c797
FB
1856static int cmp1(const char *s1, int n, const char *s2)
1857{
1858 if (strlen(s2) != n)
1859 return 0;
1860 return memcmp(s1, s2, n) == 0;
1861}
3b46e624 1862
f193c797
FB
1863/* takes a comma separated list of log masks. Return 0 if error. */
1864int cpu_str_to_log_mask(const char *str)
1865{
c7cd6a37 1866 const CPULogItem *item;
f193c797
FB
1867 int mask;
1868 const char *p, *p1;
1869
1870 p = str;
1871 mask = 0;
1872 for(;;) {
1873 p1 = strchr(p, ',');
1874 if (!p1)
1875 p1 = p + strlen(p);
9742bf26
YT
1876 if(cmp1(p,p1-p,"all")) {
1877 for(item = cpu_log_items; item->mask != 0; item++) {
1878 mask |= item->mask;
1879 }
1880 } else {
1881 for(item = cpu_log_items; item->mask != 0; item++) {
1882 if (cmp1(p, p1 - p, item->name))
1883 goto found;
1884 }
1885 return 0;
f193c797 1886 }
f193c797
FB
1887 found:
1888 mask |= item->mask;
1889 if (*p1 != ',')
1890 break;
1891 p = p1 + 1;
1892 }
1893 return mask;
1894}
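/* Illustrative sketch, not part of exec.c: the comma-separated flag parsing
 * that cpu_str_to_log_mask() performs above, reduced to a standalone program
 * with a made-up item table.  The names and mask values are examples only. */
#include <stdio.h>
#include <string.h>

struct item { int mask; const char *name; };

static const struct item items[] = {
    { 0x01, "in_asm" },
    { 0x02, "out_asm" },
    { 0x04, "exec" },
    { 0, NULL },
};

static int str_to_mask(const char *str)
{
    int mask = 0;
    const char *p = str;

    for (;;) {
        const char *p1 = strchr(p, ',');
        size_t n = p1 ? (size_t)(p1 - p) : strlen(p);
        const struct item *it;

        for (it = items; it->mask != 0; it++) {
            if (strlen(it->name) == n && memcmp(p, it->name, n) == 0) {
                mask |= it->mask;
                break;
            }
        }
        if (it->mask == 0) {
            return 0;                   /* unknown name: report failure */
        }
        if (!p1) {
            break;
        }
        p = p1 + 1;
    }
    return mask;
}

int main(void)
{
    printf("mask(\"in_asm,exec\") = 0x%x\n", str_to_mask("in_asm,exec"));
    return 0;
}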
ea041c0e 1895
7501267e
FB
1896void cpu_abort(CPUState *env, const char *fmt, ...)
1897{
1898 va_list ap;
493ae1f0 1899 va_list ap2;
7501267e
FB
1900
1901 va_start(ap, fmt);
493ae1f0 1902 va_copy(ap2, ap);
7501267e
FB
1903 fprintf(stderr, "qemu: fatal: ");
1904 vfprintf(stderr, fmt, ap);
1905 fprintf(stderr, "\n");
1906#ifdef TARGET_I386
7fe48483
FB
1907 cpu_dump_state(env, stderr, fprintf, X86_DUMP_FPU | X86_DUMP_CCOP);
1908#else
1909 cpu_dump_state(env, stderr, fprintf, 0);
7501267e 1910#endif
93fcfe39
AL
1911 if (qemu_log_enabled()) {
1912 qemu_log("qemu: fatal: ");
1913 qemu_log_vprintf(fmt, ap2);
1914 qemu_log("\n");
f9373291 1915#ifdef TARGET_I386
93fcfe39 1916 log_cpu_state(env, X86_DUMP_FPU | X86_DUMP_CCOP);
f9373291 1917#else
93fcfe39 1918 log_cpu_state(env, 0);
f9373291 1919#endif
31b1a7b4 1920 qemu_log_flush();
93fcfe39 1921 qemu_log_close();
924edcae 1922 }
493ae1f0 1923 va_end(ap2);
f9373291 1924 va_end(ap);
fd052bf6
RV
1925#if defined(CONFIG_USER_ONLY)
1926 {
1927 struct sigaction act;
1928 sigfillset(&act.sa_mask);
1929 act.sa_handler = SIG_DFL;
1930 sigaction(SIGABRT, &act, NULL);
1931 }
1932#endif
7501267e
FB
1933 abort();
1934}
1935
c5be9f08
TS
1936CPUState *cpu_copy(CPUState *env)
1937{
01ba9816 1938 CPUState *new_env = cpu_init(env->cpu_model_str);
c5be9f08
TS
1939 CPUState *next_cpu = new_env->next_cpu;
1940 int cpu_index = new_env->cpu_index;
5a38f081
AL
1941#if defined(TARGET_HAS_ICE)
1942 CPUBreakpoint *bp;
1943 CPUWatchpoint *wp;
1944#endif
1945
c5be9f08 1946 memcpy(new_env, env, sizeof(CPUState));
5a38f081
AL
1947
1948 /* Preserve chaining and index. */
c5be9f08
TS
1949 new_env->next_cpu = next_cpu;
1950 new_env->cpu_index = cpu_index;
5a38f081
AL
1951
1952 /* Clone all break/watchpoints.
1953 Note: Once we support ptrace with hw-debug register access, make sure
1954 BP_CPU break/watchpoints are handled correctly on clone. */
72cf2d4f
BS
1955 QTAILQ_INIT(&env->breakpoints);
1956 QTAILQ_INIT(&env->watchpoints);
5a38f081 1957#if defined(TARGET_HAS_ICE)
72cf2d4f 1958 QTAILQ_FOREACH(bp, &env->breakpoints, entry) {
5a38f081
AL
1959 cpu_breakpoint_insert(new_env, bp->pc, bp->flags, NULL);
1960 }
72cf2d4f 1961 QTAILQ_FOREACH(wp, &env->watchpoints, entry) {
5a38f081
AL
1962 cpu_watchpoint_insert(new_env, wp->vaddr, (~wp->len_mask) + 1,
1963 wp->flags, NULL);
1964 }
1965#endif
1966
c5be9f08
TS
1967 return new_env;
1968}
1969
0124311e
FB
1970#if !defined(CONFIG_USER_ONLY)
1971
5c751e99
EI
1972static inline void tlb_flush_jmp_cache(CPUState *env, target_ulong addr)
1973{
1974 unsigned int i;
1975
1976 /* Discard jump cache entries for any tb which might potentially
1977 overlap the flushed page. */
1978 i = tb_jmp_cache_hash_page(addr - TARGET_PAGE_SIZE);
1979 memset (&env->tb_jmp_cache[i], 0,
9742bf26 1980 TB_JMP_PAGE_SIZE * sizeof(TranslationBlock *));
5c751e99
EI
1981
1982 i = tb_jmp_cache_hash_page(addr);
1983 memset (&env->tb_jmp_cache[i], 0,
9742bf26 1984 TB_JMP_PAGE_SIZE * sizeof(TranslationBlock *));
5c751e99
EI
1985}
1986
08738984
IK
1987static CPUTLBEntry s_cputlb_empty_entry = {
1988 .addr_read = -1,
1989 .addr_write = -1,
1990 .addr_code = -1,
1991 .addend = -1,
1992};
1993
ee8b7021
FB
1994/* NOTE: if flush_global is true, also flush global entries (not
1995 implemented yet) */
1996void tlb_flush(CPUState *env, int flush_global)
33417e70 1997{
33417e70 1998 int i;
0124311e 1999
9fa3e853
FB
2000#if defined(DEBUG_TLB)
2001 printf("tlb_flush:\n");
2002#endif
0124311e
FB
2003 /* must reset current TB so that interrupts cannot modify the
2004 links while we are modifying them */
2005 env->current_tb = NULL;
2006
33417e70 2007 for(i = 0; i < CPU_TLB_SIZE; i++) {
cfde4bd9
IY
2008 int mmu_idx;
2009 for (mmu_idx = 0; mmu_idx < NB_MMU_MODES; mmu_idx++) {
08738984 2010 env->tlb_table[mmu_idx][i] = s_cputlb_empty_entry;
cfde4bd9 2011 }
33417e70 2012 }
9fa3e853 2013
8a40a180 2014 memset (env->tb_jmp_cache, 0, TB_JMP_CACHE_SIZE * sizeof (void *));
9fa3e853 2015
d4c430a8
PB
2016 env->tlb_flush_addr = -1;
2017 env->tlb_flush_mask = 0;
e3db7226 2018 tlb_flush_count++;
33417e70
FB
2019}
2020
274da6b2 2021static inline void tlb_flush_entry(CPUTLBEntry *tlb_entry, target_ulong addr)
61382a50 2022{
5fafdf24 2023 if (addr == (tlb_entry->addr_read &
84b7b8e7 2024 (TARGET_PAGE_MASK | TLB_INVALID_MASK)) ||
5fafdf24 2025 addr == (tlb_entry->addr_write &
84b7b8e7 2026 (TARGET_PAGE_MASK | TLB_INVALID_MASK)) ||
5fafdf24 2027 addr == (tlb_entry->addr_code &
84b7b8e7 2028 (TARGET_PAGE_MASK | TLB_INVALID_MASK))) {
08738984 2029 *tlb_entry = s_cputlb_empty_entry;
84b7b8e7 2030 }
61382a50
FB
2031}
2032
2e12669a 2033void tlb_flush_page(CPUState *env, target_ulong addr)
33417e70 2034{
8a40a180 2035 int i;
cfde4bd9 2036 int mmu_idx;
0124311e 2037
9fa3e853 2038#if defined(DEBUG_TLB)
108c49b8 2039 printf("tlb_flush_page: " TARGET_FMT_lx "\n", addr);
9fa3e853 2040#endif
d4c430a8
PB
2041 /* Check if we need to flush due to large pages. */
2042 if ((addr & env->tlb_flush_mask) == env->tlb_flush_addr) {
2043#if defined(DEBUG_TLB)
2044 printf("tlb_flush_page: forced full flush ("
2045 TARGET_FMT_lx "/" TARGET_FMT_lx ")\n",
2046 env->tlb_flush_addr, env->tlb_flush_mask);
2047#endif
2048 tlb_flush(env, 1);
2049 return;
2050 }
0124311e
FB
2051 /* must reset current TB so that interrupts cannot modify the
2052 links while we are modifying them */
2053 env->current_tb = NULL;
61382a50
FB
2054
2055 addr &= TARGET_PAGE_MASK;
2056 i = (addr >> TARGET_PAGE_BITS) & (CPU_TLB_SIZE - 1);
cfde4bd9
IY
2057 for (mmu_idx = 0; mmu_idx < NB_MMU_MODES; mmu_idx++)
2058 tlb_flush_entry(&env->tlb_table[mmu_idx][i], addr);
0124311e 2059
5c751e99 2060 tlb_flush_jmp_cache(env, addr);
9fa3e853
FB
2061}
2062
9fa3e853
FB
2063/* update the TLBs so that writes to code in the virtual page 'addr'
2064 can be detected */
c227f099 2065static void tlb_protect_code(ram_addr_t ram_addr)
9fa3e853 2066{
5fafdf24 2067 cpu_physical_memory_reset_dirty(ram_addr,
6a00d601
FB
2068 ram_addr + TARGET_PAGE_SIZE,
2069 CODE_DIRTY_FLAG);
9fa3e853
FB
2070}
2071
9fa3e853 2072/* update the TLB so that writes in physical page 'phys_addr' are no longer
3a7d929e 2073 tested for self modifying code */
c227f099 2074static void tlb_unprotect_code_phys(CPUState *env, ram_addr_t ram_addr,
3a7d929e 2075 target_ulong vaddr)
9fa3e853 2076{
f7c11b53 2077 cpu_physical_memory_set_dirty_flags(ram_addr, CODE_DIRTY_FLAG);
1ccde1cb
FB
2078}
2079
5fafdf24 2080static inline void tlb_reset_dirty_range(CPUTLBEntry *tlb_entry,
1ccde1cb
FB
2081 unsigned long start, unsigned long length)
2082{
2083 unsigned long addr;
84b7b8e7
FB
2084 if ((tlb_entry->addr_write & ~TARGET_PAGE_MASK) == IO_MEM_RAM) {
2085 addr = (tlb_entry->addr_write & TARGET_PAGE_MASK) + tlb_entry->addend;
1ccde1cb 2086 if ((addr - start) < length) {
0f459d16 2087 tlb_entry->addr_write = (tlb_entry->addr_write & TARGET_PAGE_MASK) | TLB_NOTDIRTY;
1ccde1cb
FB
2088 }
2089 }
2090}
2091
5579c7f3 2092/* Note: start and end must be within the same ram block. */
c227f099 2093void cpu_physical_memory_reset_dirty(ram_addr_t start, ram_addr_t end,
0a962c02 2094 int dirty_flags)
1ccde1cb
FB
2095{
2096 CPUState *env;
4f2ac237 2097 unsigned long length, start1;
f7c11b53 2098 int i;
1ccde1cb
FB
2099
2100 start &= TARGET_PAGE_MASK;
2101 end = TARGET_PAGE_ALIGN(end);
2102
2103 length = end - start;
2104 if (length == 0)
2105 return;
f7c11b53 2106 cpu_physical_memory_mask_dirty_range(start, length, dirty_flags);
f23db169 2107
1ccde1cb
FB
2108 /* we modify the TLB cache so that the dirty bit will be set again
2109 when accessing the range */
b2e0a138 2110 start1 = (unsigned long)qemu_safe_ram_ptr(start);
a57d23e4 2111 /* Check that we don't span multiple blocks - this breaks the
5579c7f3 2112 address comparisons below. */
b2e0a138 2113 if ((unsigned long)qemu_safe_ram_ptr(end - 1) - start1
5579c7f3
PB
2114 != (end - 1) - start) {
2115 abort();
2116 }
2117
6a00d601 2118 for(env = first_cpu; env != NULL; env = env->next_cpu) {
cfde4bd9
IY
2119 int mmu_idx;
2120 for (mmu_idx = 0; mmu_idx < NB_MMU_MODES; mmu_idx++) {
2121 for(i = 0; i < CPU_TLB_SIZE; i++)
2122 tlb_reset_dirty_range(&env->tlb_table[mmu_idx][i],
2123 start1, length);
2124 }
6a00d601 2125 }
1ccde1cb
FB
2126}
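/* Illustrative sketch, not part of exec.c: the idea behind
 * cpu_physical_memory_reset_dirty() above -- clear the dirty state for a page
 * range and poison the cached write entries so that the next store takes the
 * slow path and marks the page dirty again.  The toy structures below are
 * invented for the example and do not match QEMU's real layouts. */
#include <stdio.h>
#include <string.h>

#define TOY_PAGES    8
#define TOY_NOTDIRTY 0x1u               /* flag kept in the cached entry */

static unsigned char dirty[TOY_PAGES];
static unsigned long cached_write[TOY_PAGES];   /* toy "TLB" of write entries */

static void toy_store(int page)
{
    if (cached_write[page] & TOY_NOTDIRTY) {
        /* slow path: re-mark the page dirty, then drop the poison flag */
        dirty[page] = 0xff;
        cached_write[page] &= ~(unsigned long)TOY_NOTDIRTY;
    }
}

int main(void)
{
    int i;

    memset(dirty, 0xff, sizeof(dirty));
    /* reset the dirty state of pages 2..4 and poison their cached entries */
    for (i = 2; i <= 4; i++) {
        dirty[i] = 0;
        cached_write[i] |= TOY_NOTDIRTY;
    }
    toy_store(3);                       /* the guest writes to page 3 again */
    printf("page 3 dirty after store: %d\n", dirty[3] != 0);
    return 0;
}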
2127
74576198
AL
2128int cpu_physical_memory_set_dirty_tracking(int enable)
2129{
f6f3fbca 2130 int ret = 0;
74576198 2131 in_migration = enable;
f6f3fbca
MT
2132 ret = cpu_notify_migration_log(!!enable);
2133 return ret;
74576198
AL
2134}
2135
2136int cpu_physical_memory_get_dirty_tracking(void)
2137{
2138 return in_migration;
2139}
2140
c227f099
AL
2141int cpu_physical_sync_dirty_bitmap(target_phys_addr_t start_addr,
2142 target_phys_addr_t end_addr)
2bec46dc 2143{
7b8f3b78 2144 int ret;
151f7749 2145
f6f3fbca 2146 ret = cpu_notify_sync_dirty_bitmap(start_addr, end_addr);
151f7749 2147 return ret;
2bec46dc
AL
2148}
2149
e5896b12
AP
2150int cpu_physical_log_start(target_phys_addr_t start_addr,
2151 ram_addr_t size)
2152{
2153 CPUPhysMemoryClient *client;
2154 QLIST_FOREACH(client, &memory_client_list, list) {
2155 if (client->log_start) {
2156 int r = client->log_start(client, start_addr, size);
2157 if (r < 0) {
2158 return r;
2159 }
2160 }
2161 }
2162 return 0;
2163}
2164
2165int cpu_physical_log_stop(target_phys_addr_t start_addr,
2166 ram_addr_t size)
2167{
2168 CPUPhysMemoryClient *client;
2169 QLIST_FOREACH(client, &memory_client_list, list) {
2170 if (client->log_stop) {
2171 int r = client->log_stop(client, start_addr, size);
2172 if (r < 0) {
2173 return r;
2174 }
2175 }
2176 }
2177 return 0;
2178}
2179
3a7d929e
FB
2180static inline void tlb_update_dirty(CPUTLBEntry *tlb_entry)
2181{
c227f099 2182 ram_addr_t ram_addr;
5579c7f3 2183 void *p;
3a7d929e 2184
84b7b8e7 2185 if ((tlb_entry->addr_write & ~TARGET_PAGE_MASK) == IO_MEM_RAM) {
5579c7f3
PB
2186 p = (void *)(unsigned long)((tlb_entry->addr_write & TARGET_PAGE_MASK)
2187 + tlb_entry->addend);
e890261f 2188 ram_addr = qemu_ram_addr_from_host_nofail(p);
3a7d929e 2189 if (!cpu_physical_memory_is_dirty(ram_addr)) {
0f459d16 2190 tlb_entry->addr_write |= TLB_NOTDIRTY;
3a7d929e
FB
2191 }
2192 }
2193}
2194
2195/* update the TLB according to the current state of the dirty bits */
2196void cpu_tlb_update_dirty(CPUState *env)
2197{
2198 int i;
cfde4bd9
IY
2199 int mmu_idx;
2200 for (mmu_idx = 0; mmu_idx < NB_MMU_MODES; mmu_idx++) {
2201 for(i = 0; i < CPU_TLB_SIZE; i++)
2202 tlb_update_dirty(&env->tlb_table[mmu_idx][i]);
2203 }
3a7d929e
FB
2204}
2205
0f459d16 2206static inline void tlb_set_dirty1(CPUTLBEntry *tlb_entry, target_ulong vaddr)
1ccde1cb 2207{
0f459d16
PB
2208 if (tlb_entry->addr_write == (vaddr | TLB_NOTDIRTY))
2209 tlb_entry->addr_write = vaddr;
1ccde1cb
FB
2210}
2211
0f459d16
PB
2212/* update the TLB corresponding to virtual page vaddr
2213 so that it is no longer dirty */
2214static inline void tlb_set_dirty(CPUState *env, target_ulong vaddr)
1ccde1cb 2215{
1ccde1cb 2216 int i;
cfde4bd9 2217 int mmu_idx;
1ccde1cb 2218
0f459d16 2219 vaddr &= TARGET_PAGE_MASK;
1ccde1cb 2220 i = (vaddr >> TARGET_PAGE_BITS) & (CPU_TLB_SIZE - 1);
cfde4bd9
IY
2221 for (mmu_idx = 0; mmu_idx < NB_MMU_MODES; mmu_idx++)
2222 tlb_set_dirty1(&env->tlb_table[mmu_idx][i], vaddr);
9fa3e853
FB
2223}
2224
d4c430a8
PB
2225/* Our TLB does not support large pages, so remember the area covered by
2226 large pages and trigger a full TLB flush if these are invalidated. */
2227static void tlb_add_large_page(CPUState *env, target_ulong vaddr,
2228 target_ulong size)
2229{
2230 target_ulong mask = ~(size - 1);
2231
2232 if (env->tlb_flush_addr == (target_ulong)-1) {
2233 env->tlb_flush_addr = vaddr & mask;
2234 env->tlb_flush_mask = mask;
2235 return;
2236 }
2237 /* Extend the existing region to include the new page.
2238 This is a compromise between unnecessary flushes and the cost
2239 of maintaining a full variable size TLB. */
2240 mask &= env->tlb_flush_mask;
2241 while (((env->tlb_flush_addr ^ vaddr) & mask) != 0) {
2242 mask <<= 1;
2243 }
2244 env->tlb_flush_addr &= mask;
2245 env->tlb_flush_mask = mask;
2246}
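/* Illustrative sketch, not part of exec.c: the mask-widening loop used by
 * tlb_add_large_page() above.  The remembered (addr, mask) pair is widened
 * until the previously tracked region and the new large page fall inside one
 * aligned block, so a single pair conservatively covers both.  The 2 MiB page
 * size and the addresses are arbitrary example values. */
#include <stdio.h>

int main(void)
{
    unsigned long flush_addr = 0x00200000UL;        /* previously remembered page */
    unsigned long flush_mask = ~(0x200000UL - 1);   /* 2 MiB alignment mask */
    unsigned long vaddr      = 0x00a00000UL;        /* new large page being added */
    unsigned long mask       = ~(0x200000UL - 1) & flush_mask;

    while (((flush_addr ^ vaddr) & mask) != 0) {
        mask <<= 1;                                 /* widen until both fit */
    }
    flush_addr &= mask;
    printf("combined region: base=0x%lx mask=0x%lx\n", flush_addr, mask);
    return 0;
}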
2247
2248/* Add a new TLB entry. At most one entry for a given virtual address
2249 is permitted. Only a single TARGET_PAGE_SIZE region is mapped, the
2250 supplied size is only used by tlb_flush_page. */
2251void tlb_set_page(CPUState *env, target_ulong vaddr,
2252 target_phys_addr_t paddr, int prot,
2253 int mmu_idx, target_ulong size)
9fa3e853 2254{
92e873b9 2255 PhysPageDesc *p;
4f2ac237 2256 unsigned long pd;
9fa3e853 2257 unsigned int index;
4f2ac237 2258 target_ulong address;
0f459d16 2259 target_ulong code_address;
355b1943 2260 unsigned long addend;
84b7b8e7 2261 CPUTLBEntry *te;
a1d1bb31 2262 CPUWatchpoint *wp;
c227f099 2263 target_phys_addr_t iotlb;
9fa3e853 2264
d4c430a8
PB
2265 assert(size >= TARGET_PAGE_SIZE);
2266 if (size != TARGET_PAGE_SIZE) {
2267 tlb_add_large_page(env, vaddr, size);
2268 }
92e873b9 2269 p = phys_page_find(paddr >> TARGET_PAGE_BITS);
9fa3e853
FB
2270 if (!p) {
2271 pd = IO_MEM_UNASSIGNED;
9fa3e853
FB
2272 } else {
2273 pd = p->phys_offset;
9fa3e853
FB
2274 }
2275#if defined(DEBUG_TLB)
7fd3f494
SW
2276 printf("tlb_set_page: vaddr=" TARGET_FMT_lx " paddr=0x" TARGET_FMT_plx
2277 " prot=%x idx=%d pd=0x%08lx\n",
2278 vaddr, paddr, prot, mmu_idx, pd);
9fa3e853
FB
2279#endif
2280
0f459d16
PB
2281 address = vaddr;
2282 if ((pd & ~TARGET_PAGE_MASK) > IO_MEM_ROM && !(pd & IO_MEM_ROMD)) {
2283 /* IO memory case (romd handled later) */
2284 address |= TLB_MMIO;
2285 }
5579c7f3 2286 addend = (unsigned long)qemu_get_ram_ptr(pd & TARGET_PAGE_MASK);
0f459d16
PB
2287 if ((pd & ~TARGET_PAGE_MASK) <= IO_MEM_ROM) {
2288 /* Normal RAM. */
2289 iotlb = pd & TARGET_PAGE_MASK;
2290 if ((pd & ~TARGET_PAGE_MASK) == IO_MEM_RAM)
2291 iotlb |= IO_MEM_NOTDIRTY;
2292 else
2293 iotlb |= IO_MEM_ROM;
2294 } else {
ccbb4d44 2295 /* IO handlers are currently passed a physical address.
0f459d16
PB
2296 It would be nice to pass an offset from the base address
2297 of that region. This would avoid having to special case RAM,
2298 and avoid full address decoding in every device.
2299 We can't use the high bits of pd for this because
2300 IO_MEM_ROMD uses these as a ram address. */
8da3ff18
PB
2301 iotlb = (pd & ~TARGET_PAGE_MASK);
2302 if (p) {
8da3ff18
PB
2303 iotlb += p->region_offset;
2304 } else {
2305 iotlb += paddr;
2306 }
0f459d16
PB
2307 }
2308
2309 code_address = address;
2310 /* Make accesses to pages with watchpoints go via the
2311 watchpoint trap routines. */
72cf2d4f 2312 QTAILQ_FOREACH(wp, &env->watchpoints, entry) {
a1d1bb31 2313 if (vaddr == (wp->vaddr & TARGET_PAGE_MASK)) {
bf298f83
JK
2314 /* Avoid trapping reads of pages with a write breakpoint. */
2315 if ((prot & PAGE_WRITE) || (wp->flags & BP_MEM_READ)) {
2316 iotlb = io_mem_watch + paddr;
2317 address |= TLB_MMIO;
2318 break;
2319 }
6658ffb8 2320 }
0f459d16 2321 }
d79acba4 2322
0f459d16
PB
2323 index = (vaddr >> TARGET_PAGE_BITS) & (CPU_TLB_SIZE - 1);
2324 env->iotlb[mmu_idx][index] = iotlb - vaddr;
2325 te = &env->tlb_table[mmu_idx][index];
2326 te->addend = addend - vaddr;
2327 if (prot & PAGE_READ) {
2328 te->addr_read = address;
2329 } else {
2330 te->addr_read = -1;
2331 }
5c751e99 2332
0f459d16
PB
2333 if (prot & PAGE_EXEC) {
2334 te->addr_code = code_address;
2335 } else {
2336 te->addr_code = -1;
2337 }
2338 if (prot & PAGE_WRITE) {
2339 if ((pd & ~TARGET_PAGE_MASK) == IO_MEM_ROM ||
2340 (pd & IO_MEM_ROMD)) {
2341 /* Write access calls the I/O callback. */
2342 te->addr_write = address | TLB_MMIO;
2343 } else if ((pd & ~TARGET_PAGE_MASK) == IO_MEM_RAM &&
2344 !cpu_physical_memory_is_dirty(pd)) {
2345 te->addr_write = address | TLB_NOTDIRTY;
9fa3e853 2346 } else {
0f459d16 2347 te->addr_write = address;
9fa3e853 2348 }
0f459d16
PB
2349 } else {
2350 te->addr_write = -1;
9fa3e853 2351 }
9fa3e853
FB
2352}
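/* Illustrative sketch, not part of exec.c: a toy direct-mapped software TLB
 * using the same "addend" trick as tlb_set_page() above -- each entry stores
 * host_base minus the guest page address, so a hit turns into one addition.
 * The sizes, the guest address and the RAM buffer are example values. */
#include <stdio.h>
#include <stdint.h>
#include <string.h>

#define TOY_PAGE_BITS 12
#define TOY_PAGE_SIZE (1u << TOY_PAGE_BITS)
#define TOY_PAGE_MASK (~(uintptr_t)(TOY_PAGE_SIZE - 1))
#define TOY_TLB_SIZE  256

struct toy_tlb_entry {
    uintptr_t addr_read;        /* guest page address, or all-ones if invalid */
    uintptr_t addend;           /* host page base minus guest page address */
};

static struct toy_tlb_entry tlb[TOY_TLB_SIZE];
static unsigned char guest_ram[4 * TOY_PAGE_SIZE];

static void toy_tlb_set_page(uintptr_t vaddr, unsigned char *host_page)
{
    unsigned idx = (vaddr >> TOY_PAGE_BITS) & (TOY_TLB_SIZE - 1);
    tlb[idx].addr_read = vaddr & TOY_PAGE_MASK;
    tlb[idx].addend = (uintptr_t)host_page - (vaddr & TOY_PAGE_MASK);
}

static unsigned char toy_ldub(uintptr_t vaddr)
{
    unsigned idx = (vaddr >> TOY_PAGE_BITS) & (TOY_TLB_SIZE - 1);
    if (tlb[idx].addr_read == (vaddr & TOY_PAGE_MASK)) {
        return *(unsigned char *)(vaddr + tlb[idx].addend);  /* fast hit */
    }
    return 0;   /* a real implementation would refill the entry here */
}

int main(void)
{
    memset(tlb, 0xff, sizeof(tlb));             /* mark every entry invalid */
    guest_ram[2 * TOY_PAGE_SIZE + 5] = 42;      /* byte inside "guest page 2" */
    /* map the guest page at 0x40002000 onto the host page backing it */
    toy_tlb_set_page((uintptr_t)0x40002000u, &guest_ram[2 * TOY_PAGE_SIZE]);
    printf("loaded byte: %d\n", toy_ldub((uintptr_t)0x40002005u));
    return 0;
}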
2353
0124311e
FB
2354#else
2355
ee8b7021 2356void tlb_flush(CPUState *env, int flush_global)
0124311e
FB
2357{
2358}
2359
2e12669a 2360void tlb_flush_page(CPUState *env, target_ulong addr)
0124311e
FB
2361{
2362}
2363
edf8e2af
MW
2364/*
2365 * Walks guest process memory "regions" one by one
2366 * and calls callback function 'fn' for each region.
2367 */
5cd2c5b6
RH
2368
2369struct walk_memory_regions_data
2370{
2371 walk_memory_regions_fn fn;
2372 void *priv;
2373 unsigned long start;
2374 int prot;
2375};
2376
2377static int walk_memory_regions_end(struct walk_memory_regions_data *data,
b480d9b7 2378 abi_ulong end, int new_prot)
5cd2c5b6
RH
2379{
2380 if (data->start != -1ul) {
2381 int rc = data->fn(data->priv, data->start, end, data->prot);
2382 if (rc != 0) {
2383 return rc;
2384 }
2385 }
2386
2387 data->start = (new_prot ? end : -1ul);
2388 data->prot = new_prot;
2389
2390 return 0;
2391}
2392
2393static int walk_memory_regions_1(struct walk_memory_regions_data *data,
b480d9b7 2394 abi_ulong base, int level, void **lp)
5cd2c5b6 2395{
b480d9b7 2396 abi_ulong pa;
5cd2c5b6
RH
2397 int i, rc;
2398
2399 if (*lp == NULL) {
2400 return walk_memory_regions_end(data, base, 0);
2401 }
2402
2403 if (level == 0) {
2404 PageDesc *pd = *lp;
7296abac 2405 for (i = 0; i < L2_SIZE; ++i) {
5cd2c5b6
RH
2406 int prot = pd[i].flags;
2407
2408 pa = base | (i << TARGET_PAGE_BITS);
2409 if (prot != data->prot) {
2410 rc = walk_memory_regions_end(data, pa, prot);
2411 if (rc != 0) {
2412 return rc;
9fa3e853 2413 }
9fa3e853 2414 }
5cd2c5b6
RH
2415 }
2416 } else {
2417 void **pp = *lp;
7296abac 2418 for (i = 0; i < L2_SIZE; ++i) {
b480d9b7
PB
2419 pa = base | ((abi_ulong)i <<
2420 (TARGET_PAGE_BITS + L2_BITS * level));
5cd2c5b6
RH
2421 rc = walk_memory_regions_1(data, pa, level - 1, pp + i);
2422 if (rc != 0) {
2423 return rc;
2424 }
2425 }
2426 }
2427
2428 return 0;
2429}
2430
2431int walk_memory_regions(void *priv, walk_memory_regions_fn fn)
2432{
2433 struct walk_memory_regions_data data;
2434 unsigned long i;
2435
2436 data.fn = fn;
2437 data.priv = priv;
2438 data.start = -1ul;
2439 data.prot = 0;
2440
2441 for (i = 0; i < V_L1_SIZE; i++) {
b480d9b7 2442 int rc = walk_memory_regions_1(&data, (abi_ulong)i << V_L1_SHIFT,
5cd2c5b6
RH
2443 V_L1_SHIFT / L2_BITS - 1, l1_map + i);
2444 if (rc != 0) {
2445 return rc;
9fa3e853 2446 }
33417e70 2447 }
5cd2c5b6
RH
2448
2449 return walk_memory_regions_end(&data, 0, 0);
edf8e2af
MW
2450}
2451
b480d9b7
PB
2452static int dump_region(void *priv, abi_ulong start,
2453 abi_ulong end, unsigned long prot)
edf8e2af
MW
2454{
2455 FILE *f = (FILE *)priv;
2456
b480d9b7
PB
2457 (void) fprintf(f, TARGET_ABI_FMT_lx"-"TARGET_ABI_FMT_lx
2458 " "TARGET_ABI_FMT_lx" %c%c%c\n",
edf8e2af
MW
2459 start, end, end - start,
2460 ((prot & PAGE_READ) ? 'r' : '-'),
2461 ((prot & PAGE_WRITE) ? 'w' : '-'),
2462 ((prot & PAGE_EXEC) ? 'x' : '-'));
2463
2464 return (0);
2465}
2466
2467/* dump memory mappings */
2468void page_dump(FILE *f)
2469{
2470 (void) fprintf(f, "%-8s %-8s %-8s %s\n",
2471 "start", "end", "size", "prot");
2472 walk_memory_regions(f, dump_region);
33417e70
FB
2473}
2474
53a5960a 2475int page_get_flags(target_ulong address)
33417e70 2476{
9fa3e853
FB
2477 PageDesc *p;
2478
2479 p = page_find(address >> TARGET_PAGE_BITS);
33417e70 2480 if (!p)
9fa3e853
FB
2481 return 0;
2482 return p->flags;
2483}
2484
376a7909
RH
2485/* Modify the flags of a page and invalidate the code if necessary.
2486 The flag PAGE_WRITE_ORG is positioned automatically depending
2487 on PAGE_WRITE. The mmap_lock should already be held. */
53a5960a 2488void page_set_flags(target_ulong start, target_ulong end, int flags)
9fa3e853 2489{
376a7909
RH
2490 target_ulong addr, len;
2491
2492 /* This function should never be called with addresses outside the
2493 guest address space. If this assert fires, it probably indicates
2494 a missing call to h2g_valid. */
b480d9b7
PB
2495#if TARGET_ABI_BITS > L1_MAP_ADDR_SPACE_BITS
2496 assert(end < ((abi_ulong)1 << L1_MAP_ADDR_SPACE_BITS));
376a7909
RH
2497#endif
2498 assert(start < end);
9fa3e853
FB
2499
2500 start = start & TARGET_PAGE_MASK;
2501 end = TARGET_PAGE_ALIGN(end);
376a7909
RH
2502
2503 if (flags & PAGE_WRITE) {
9fa3e853 2504 flags |= PAGE_WRITE_ORG;
376a7909
RH
2505 }
2506
2507 for (addr = start, len = end - start;
2508 len != 0;
2509 len -= TARGET_PAGE_SIZE, addr += TARGET_PAGE_SIZE) {
2510 PageDesc *p = page_find_alloc(addr >> TARGET_PAGE_BITS, 1);
2511
2512 /* If the write protection bit is set, then we invalidate
2513 the code inside. */
5fafdf24 2514 if (!(p->flags & PAGE_WRITE) &&
9fa3e853
FB
2515 (flags & PAGE_WRITE) &&
2516 p->first_tb) {
d720b93d 2517 tb_invalidate_phys_page(addr, 0, NULL);
9fa3e853
FB
2518 }
2519 p->flags = flags;
2520 }
33417e70
FB
2521}
2522
3d97b40b
TS
2523int page_check_range(target_ulong start, target_ulong len, int flags)
2524{
2525 PageDesc *p;
2526 target_ulong end;
2527 target_ulong addr;
2528
376a7909
RH
2529 /* This function should never be called with addresses outside the
2530 guest address space. If this assert fires, it probably indicates
2531 a missing call to h2g_valid. */
338e9e6c
BS
2532#if TARGET_ABI_BITS > L1_MAP_ADDR_SPACE_BITS
2533 assert(start < ((abi_ulong)1 << L1_MAP_ADDR_SPACE_BITS));
376a7909
RH
2534#endif
2535
3e0650a9
RH
2536 if (len == 0) {
2537 return 0;
2538 }
376a7909
RH
2539 if (start + len - 1 < start) {
2540 /* We've wrapped around. */
55f280c9 2541 return -1;
376a7909 2542 }
55f280c9 2543
3d97b40b
TS
2544 end = TARGET_PAGE_ALIGN(start+len); /* must do before we lose bits in the next step */
2545 start = start & TARGET_PAGE_MASK;
2546
376a7909
RH
2547 for (addr = start, len = end - start;
2548 len != 0;
2549 len -= TARGET_PAGE_SIZE, addr += TARGET_PAGE_SIZE) {
3d97b40b
TS
2550 p = page_find(addr >> TARGET_PAGE_BITS);
2551 if( !p )
2552 return -1;
2553 if( !(p->flags & PAGE_VALID) )
2554 return -1;
2555
dae3270c 2556 if ((flags & PAGE_READ) && !(p->flags & PAGE_READ))
3d97b40b 2557 return -1;
dae3270c
FB
2558 if (flags & PAGE_WRITE) {
2559 if (!(p->flags & PAGE_WRITE_ORG))
2560 return -1;
2561 /* unprotect the page if it was put read-only because it
2562 contains translated code */
2563 if (!(p->flags & PAGE_WRITE)) {
2564 if (!page_unprotect(addr, 0, NULL))
2565 return -1;
2566 }
2567 return 0;
2568 }
3d97b40b
TS
2569 }
2570 return 0;
2571}
2572
9fa3e853 2573/* called from signal handler: invalidate the code and unprotect the
ccbb4d44 2574 page. Return TRUE if the fault was successfully handled. */
53a5960a 2575int page_unprotect(target_ulong address, unsigned long pc, void *puc)
9fa3e853 2576{
45d679d6
AJ
2577 unsigned int prot;
2578 PageDesc *p;
53a5960a 2579 target_ulong host_start, host_end, addr;
9fa3e853 2580
c8a706fe
PB
2581 /* Technically this isn't safe inside a signal handler. However we
2582 know this only ever happens in a synchronous SEGV handler, so in
2583 practice it seems to be ok. */
2584 mmap_lock();
2585
45d679d6
AJ
2586 p = page_find(address >> TARGET_PAGE_BITS);
2587 if (!p) {
c8a706fe 2588 mmap_unlock();
9fa3e853 2589 return 0;
c8a706fe 2590 }
45d679d6 2591
9fa3e853
FB
2592 /* if the page was really writable, then we change its
2593 protection back to writable */
45d679d6
AJ
2594 if ((p->flags & PAGE_WRITE_ORG) && !(p->flags & PAGE_WRITE)) {
2595 host_start = address & qemu_host_page_mask;
2596 host_end = host_start + qemu_host_page_size;
2597
2598 prot = 0;
2599 for (addr = host_start ; addr < host_end ; addr += TARGET_PAGE_SIZE) {
2600 p = page_find(addr >> TARGET_PAGE_BITS);
2601 p->flags |= PAGE_WRITE;
2602 prot |= p->flags;
2603
9fa3e853
FB
2604 /* and since the content will be modified, we must invalidate
2605 the corresponding translated code. */
45d679d6 2606 tb_invalidate_phys_page(addr, pc, puc);
9fa3e853 2607#ifdef DEBUG_TB_CHECK
45d679d6 2608 tb_invalidate_check(addr);
9fa3e853 2609#endif
9fa3e853 2610 }
45d679d6
AJ
2611 mprotect((void *)g2h(host_start), qemu_host_page_size,
2612 prot & PAGE_BITS);
2613
2614 mmap_unlock();
2615 return 1;
9fa3e853 2616 }
c8a706fe 2617 mmap_unlock();
9fa3e853
FB
2618 return 0;
2619}
2620
6a00d601
FB
2621static inline void tlb_set_dirty(CPUState *env,
2622 unsigned long addr, target_ulong vaddr)
1ccde1cb
FB
2623{
2624}
9fa3e853
FB
2625#endif /* defined(CONFIG_USER_ONLY) */
2626
e2eef170 2627#if !defined(CONFIG_USER_ONLY)
8da3ff18 2628
c04b2b78
PB
2629#define SUBPAGE_IDX(addr) ((addr) & ~TARGET_PAGE_MASK)
2630typedef struct subpage_t {
2631 target_phys_addr_t base;
f6405247
RH
2632 ram_addr_t sub_io_index[TARGET_PAGE_SIZE];
2633 ram_addr_t region_offset[TARGET_PAGE_SIZE];
c04b2b78
PB
2634} subpage_t;
2635
c227f099
AL
2636static int subpage_register (subpage_t *mmio, uint32_t start, uint32_t end,
2637 ram_addr_t memory, ram_addr_t region_offset);
f6405247
RH
2638static subpage_t *subpage_init (target_phys_addr_t base, ram_addr_t *phys,
2639 ram_addr_t orig_memory,
2640 ram_addr_t region_offset);
db7b5426
BS
2641#define CHECK_SUBPAGE(addr, start_addr, start_addr2, end_addr, end_addr2, \
2642 need_subpage) \
2643 do { \
2644 if (addr > start_addr) \
2645 start_addr2 = 0; \
2646 else { \
2647 start_addr2 = start_addr & ~TARGET_PAGE_MASK; \
2648 if (start_addr2 > 0) \
2649 need_subpage = 1; \
2650 } \
2651 \
49e9fba2 2652 if ((start_addr + orig_size) - addr >= TARGET_PAGE_SIZE) \
db7b5426
BS
2653 end_addr2 = TARGET_PAGE_SIZE - 1; \
2654 else { \
2655 end_addr2 = (start_addr + orig_size - 1) & ~TARGET_PAGE_MASK; \
2656 if (end_addr2 < TARGET_PAGE_SIZE - 1) \
2657 need_subpage = 1; \
2658 } \
2659 } while (0)
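/* Illustrative sketch, not part of exec.c: the arithmetic performed by the
 * CHECK_SUBPAGE macro above, worked for one region that covers only part of
 * a page.  The 4 KiB page size and the addresses are example values. */
#include <stdio.h>

#define EX_PAGE_SIZE 0x1000u
#define EX_PAGE_MASK (~(EX_PAGE_SIZE - 1))

int main(void)
{
    unsigned addr = 0x1000;             /* page currently being registered */
    unsigned start_addr = 0x1080;       /* region starts inside that page */
    unsigned orig_size = 0x500;
    unsigned start_addr2, end_addr2;
    int need_subpage = 0;

    if (addr > start_addr) {
        start_addr2 = 0;
    } else {
        start_addr2 = start_addr & ~EX_PAGE_MASK;
        if (start_addr2 > 0) {
            need_subpage = 1;
        }
    }
    if ((start_addr + orig_size) - addr >= EX_PAGE_SIZE) {
        end_addr2 = EX_PAGE_SIZE - 1;
    } else {
        end_addr2 = (start_addr + orig_size - 1) & ~EX_PAGE_MASK;
        if (end_addr2 < EX_PAGE_SIZE - 1) {
            need_subpage = 1;
        }
    }
    /* prints: subpage range 0x80..0x57f, need_subpage=1 */
    printf("subpage range 0x%x..0x%x, need_subpage=%d\n",
           start_addr2, end_addr2, need_subpage);
    return 0;
}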
2660
8f2498f9
MT
2661/* register physical memory.
2662 For RAM, 'size' must be a multiple of the target page size.
2663 If (phys_offset & ~TARGET_PAGE_MASK) != 0, then it is an
8da3ff18
PB
2664 io memory page. The address used when calling the IO function is
2665 the offset from the start of the region, plus region_offset. Both
ccbb4d44 2666 start_addr and region_offset are rounded down to a page boundary
8da3ff18
PB
2667 before calculating this offset. This should not be a problem unless
2668 the low bits of start_addr and region_offset differ. */
0fd542fb 2669void cpu_register_physical_memory_log(target_phys_addr_t start_addr,
c227f099
AL
2670 ram_addr_t size,
2671 ram_addr_t phys_offset,
0fd542fb
MT
2672 ram_addr_t region_offset,
2673 bool log_dirty)
33417e70 2674{
c227f099 2675 target_phys_addr_t addr, end_addr;
92e873b9 2676 PhysPageDesc *p;
9d42037b 2677 CPUState *env;
c227f099 2678 ram_addr_t orig_size = size;
f6405247 2679 subpage_t *subpage;
33417e70 2680
3b8e6a2d 2681 assert(size);
0fd542fb 2682 cpu_notify_set_memory(start_addr, size, phys_offset, log_dirty);
f6f3fbca 2683
67c4d23c
PB
2684 if (phys_offset == IO_MEM_UNASSIGNED) {
2685 region_offset = start_addr;
2686 }
8da3ff18 2687 region_offset &= TARGET_PAGE_MASK;
5fd386f6 2688 size = (size + TARGET_PAGE_SIZE - 1) & TARGET_PAGE_MASK;
c227f099 2689 end_addr = start_addr + (target_phys_addr_t)size;
3b8e6a2d
EI
2690
2691 addr = start_addr;
2692 do {
db7b5426
BS
2693 p = phys_page_find(addr >> TARGET_PAGE_BITS);
2694 if (p && p->phys_offset != IO_MEM_UNASSIGNED) {
c227f099
AL
2695 ram_addr_t orig_memory = p->phys_offset;
2696 target_phys_addr_t start_addr2, end_addr2;
db7b5426
BS
2697 int need_subpage = 0;
2698
2699 CHECK_SUBPAGE(addr, start_addr, start_addr2, end_addr, end_addr2,
2700 need_subpage);
f6405247 2701 if (need_subpage) {
db7b5426
BS
2702 if (!(orig_memory & IO_MEM_SUBPAGE)) {
2703 subpage = subpage_init((addr & TARGET_PAGE_MASK),
8da3ff18
PB
2704 &p->phys_offset, orig_memory,
2705 p->region_offset);
db7b5426
BS
2706 } else {
2707 subpage = io_mem_opaque[(orig_memory & ~TARGET_PAGE_MASK)
2708 >> IO_MEM_SHIFT];
2709 }
8da3ff18
PB
2710 subpage_register(subpage, start_addr2, end_addr2, phys_offset,
2711 region_offset);
2712 p->region_offset = 0;
db7b5426
BS
2713 } else {
2714 p->phys_offset = phys_offset;
2715 if ((phys_offset & ~TARGET_PAGE_MASK) <= IO_MEM_ROM ||
2716 (phys_offset & IO_MEM_ROMD))
2717 phys_offset += TARGET_PAGE_SIZE;
2718 }
2719 } else {
2720 p = phys_page_find_alloc(addr >> TARGET_PAGE_BITS, 1);
2721 p->phys_offset = phys_offset;
8da3ff18 2722 p->region_offset = region_offset;
db7b5426 2723 if ((phys_offset & ~TARGET_PAGE_MASK) <= IO_MEM_ROM ||
8da3ff18 2724 (phys_offset & IO_MEM_ROMD)) {
db7b5426 2725 phys_offset += TARGET_PAGE_SIZE;
0e8f0967 2726 } else {
c227f099 2727 target_phys_addr_t start_addr2, end_addr2;
db7b5426
BS
2728 int need_subpage = 0;
2729
2730 CHECK_SUBPAGE(addr, start_addr, start_addr2, end_addr,
2731 end_addr2, need_subpage);
2732
f6405247 2733 if (need_subpage) {
db7b5426 2734 subpage = subpage_init((addr & TARGET_PAGE_MASK),
8da3ff18 2735 &p->phys_offset, IO_MEM_UNASSIGNED,
67c4d23c 2736 addr & TARGET_PAGE_MASK);
db7b5426 2737 subpage_register(subpage, start_addr2, end_addr2,
8da3ff18
PB
2738 phys_offset, region_offset);
2739 p->region_offset = 0;
db7b5426
BS
2740 }
2741 }
2742 }
8da3ff18 2743 region_offset += TARGET_PAGE_SIZE;
3b8e6a2d
EI
2744 addr += TARGET_PAGE_SIZE;
2745 } while (addr != end_addr);
3b46e624 2746
9d42037b
FB
2747 /* since each CPU stores ram addresses in its TLB cache, we must
2748 reset the modified entries */
2749 /* XXX: slow ! */
2750 for(env = first_cpu; env != NULL; env = env->next_cpu) {
2751 tlb_flush(env, 1);
2752 }
33417e70
FB
2753}
2754
ba863458 2755/* XXX: temporary until new memory mapping API */
c227f099 2756ram_addr_t cpu_get_physical_page_desc(target_phys_addr_t addr)
ba863458
FB
2757{
2758 PhysPageDesc *p;
2759
2760 p = phys_page_find(addr >> TARGET_PAGE_BITS);
2761 if (!p)
2762 return IO_MEM_UNASSIGNED;
2763 return p->phys_offset;
2764}
2765
c227f099 2766void qemu_register_coalesced_mmio(target_phys_addr_t addr, ram_addr_t size)
f65ed4c1
AL
2767{
2768 if (kvm_enabled())
2769 kvm_coalesce_mmio_region(addr, size);
2770}
2771
c227f099 2772void qemu_unregister_coalesced_mmio(target_phys_addr_t addr, ram_addr_t size)
f65ed4c1
AL
2773{
2774 if (kvm_enabled())
2775 kvm_uncoalesce_mmio_region(addr, size);
2776}
2777
62a2744c
SY
2778void qemu_flush_coalesced_mmio_buffer(void)
2779{
2780 if (kvm_enabled())
2781 kvm_flush_coalesced_mmio_buffer();
2782}
2783
c902760f
MT
2784#if defined(__linux__) && !defined(TARGET_S390X)
2785
2786#include <sys/vfs.h>
2787
2788#define HUGETLBFS_MAGIC 0x958458f6
2789
2790static long gethugepagesize(const char *path)
2791{
2792 struct statfs fs;
2793 int ret;
2794
2795 do {
9742bf26 2796 ret = statfs(path, &fs);
c902760f
MT
2797 } while (ret != 0 && errno == EINTR);
2798
2799 if (ret != 0) {
9742bf26
YT
2800 perror(path);
2801 return 0;
c902760f
MT
2802 }
2803
2804 if (fs.f_type != HUGETLBFS_MAGIC)
9742bf26 2805 fprintf(stderr, "Warning: path not on HugeTLBFS: %s\n", path);
c902760f
MT
2806
2807 return fs.f_bsize;
2808}
2809
04b16653
AW
2810static void *file_ram_alloc(RAMBlock *block,
2811 ram_addr_t memory,
2812 const char *path)
c902760f
MT
2813{
2814 char *filename;
2815 void *area;
2816 int fd;
2817#ifdef MAP_POPULATE
2818 int flags;
2819#endif
2820 unsigned long hpagesize;
2821
2822 hpagesize = gethugepagesize(path);
2823 if (!hpagesize) {
9742bf26 2824 return NULL;
c902760f
MT
2825 }
2826
2827 if (memory < hpagesize) {
2828 return NULL;
2829 }
2830
2831 if (kvm_enabled() && !kvm_has_sync_mmu()) {
2832 fprintf(stderr, "host lacks kvm mmu notifiers, -mem-path unsupported\n");
2833 return NULL;
2834 }
2835
2836 if (asprintf(&filename, "%s/qemu_back_mem.XXXXXX", path) == -1) {
9742bf26 2837 return NULL;
c902760f
MT
2838 }
2839
2840 fd = mkstemp(filename);
2841 if (fd < 0) {
9742bf26
YT
2842 perror("unable to create backing store for hugepages");
2843 free(filename);
2844 return NULL;
c902760f
MT
2845 }
2846 unlink(filename);
2847 free(filename);
2848
2849 memory = (memory+hpagesize-1) & ~(hpagesize-1);
2850
2851 /*
2852 * ftruncate is not supported by hugetlbfs in older
2853 * hosts, so don't bother bailing out on errors.
2854 * If anything goes wrong with it under other filesystems,
2855 * mmap will fail.
2856 */
2857 if (ftruncate(fd, memory))
9742bf26 2858 perror("ftruncate");
c902760f
MT
2859
2860#ifdef MAP_POPULATE
2861 /* NB: MAP_POPULATE won't exhaustively alloc all phys pages in the case
2862 * MAP_PRIVATE is requested. For mem_prealloc we mmap as MAP_SHARED
2863 * to sidestep this quirk.
2864 */
2865 flags = mem_prealloc ? MAP_POPULATE | MAP_SHARED : MAP_PRIVATE;
2866 area = mmap(0, memory, PROT_READ | PROT_WRITE, flags, fd, 0);
2867#else
2868 area = mmap(0, memory, PROT_READ | PROT_WRITE, MAP_PRIVATE, fd, 0);
2869#endif
2870 if (area == MAP_FAILED) {
9742bf26
YT
2871 perror("file_ram_alloc: can't mmap RAM pages");
2872 close(fd);
2873 return (NULL);
c902760f 2874 }
04b16653 2875 block->fd = fd;
c902760f
MT
2876 return area;
2877}
2878#endif
2879
d17b5288 2880static ram_addr_t find_ram_offset(ram_addr_t size)
04b16653
AW
2881{
2882 RAMBlock *block, *next_block;
f15fbc4b 2883 ram_addr_t offset = 0, mingap = RAM_ADDR_MAX;
04b16653
AW
2884
2885 if (QLIST_EMPTY(&ram_list.blocks))
2886 return 0;
2887
2888 QLIST_FOREACH(block, &ram_list.blocks, next) {
f15fbc4b 2889 ram_addr_t end, next = RAM_ADDR_MAX;
04b16653
AW
2890
2891 end = block->offset + block->length;
2892
2893 QLIST_FOREACH(next_block, &ram_list.blocks, next) {
2894 if (next_block->offset >= end) {
2895 next = MIN(next, next_block->offset);
2896 }
2897 }
2898 if (next - end >= size && next - end < mingap) {
2899 offset = end;
2900 mingap = next - end;
2901 }
2902 }
2903 return offset;
2904}
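/* Illustrative sketch, not part of exec.c: the gap search performed by
 * find_ram_offset() above -- among the gaps between existing blocks, pick the
 * smallest one that still fits the requested size.  The block list below is a
 * plain array with made-up offsets, not QEMU's RAMBlock list. */
#include <stdio.h>

struct toy_block { unsigned long offset, length; };

int main(void)
{
    static const struct toy_block blocks[] = {
        { 0x0000, 0x2000 },             /* a 0x2000-byte gap follows */
        { 0x4000, 0x1000 },             /* a 0x3000-byte gap follows */
        { 0x8000, 0x1000 },
    };
    const int nb = sizeof(blocks) / sizeof(blocks[0]);
    unsigned long size = 0x1800;
    unsigned long offset = 0, mingap = (unsigned long)-1;
    int i, j;

    for (i = 0; i < nb; i++) {
        unsigned long end = blocks[i].offset + blocks[i].length;
        unsigned long next = (unsigned long)-1;

        for (j = 0; j < nb; j++) {
            if (blocks[j].offset >= end && blocks[j].offset < next) {
                next = blocks[j].offset;    /* nearest block above this one */
            }
        }
        if (next - end >= size && next - end < mingap) {
            offset = end;                   /* smallest fitting gap so far */
            mingap = next - end;
        }
    }
    printf("chosen offset: 0x%lx (gap 0x%lx)\n", offset, mingap);
    return 0;
}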
2905
2906static ram_addr_t last_ram_offset(void)
d17b5288
AW
2907{
2908 RAMBlock *block;
2909 ram_addr_t last = 0;
2910
2911 QLIST_FOREACH(block, &ram_list.blocks, next)
2912 last = MAX(last, block->offset + block->length);
2913
2914 return last;
2915}
2916
84b89d78 2917ram_addr_t qemu_ram_alloc_from_ptr(DeviceState *dev, const char *name,
6977dfe6 2918 ram_addr_t size, void *host)
84b89d78
CM
2919{
2920 RAMBlock *new_block, *block;
2921
2922 size = TARGET_PAGE_ALIGN(size);
2923 new_block = qemu_mallocz(sizeof(*new_block));
2924
2925 if (dev && dev->parent_bus && dev->parent_bus->info->get_dev_path) {
2926 char *id = dev->parent_bus->info->get_dev_path(dev);
2927 if (id) {
2928 snprintf(new_block->idstr, sizeof(new_block->idstr), "%s/", id);
2929 qemu_free(id);
2930 }
2931 }
2932 pstrcat(new_block->idstr, sizeof(new_block->idstr), name);
2933
2934 QLIST_FOREACH(block, &ram_list.blocks, next) {
2935 if (!strcmp(block->idstr, new_block->idstr)) {
2936 fprintf(stderr, "RAMBlock \"%s\" already registered, abort!\n",
2937 new_block->idstr);
2938 abort();
2939 }
2940 }
2941
432d268c 2942 new_block->offset = find_ram_offset(size);
6977dfe6
YT
2943 if (host) {
2944 new_block->host = host;
cd19cfa2 2945 new_block->flags |= RAM_PREALLOC_MASK;
6977dfe6
YT
2946 } else {
2947 if (mem_path) {
c902760f 2948#if defined (__linux__) && !defined(TARGET_S390X)
6977dfe6
YT
2949 new_block->host = file_ram_alloc(new_block, size, mem_path);
2950 if (!new_block->host) {
2951 new_block->host = qemu_vmalloc(size);
e78815a5 2952 qemu_madvise(new_block->host, size, QEMU_MADV_MERGEABLE);
6977dfe6 2953 }
c902760f 2954#else
6977dfe6
YT
2955 fprintf(stderr, "-mem-path option unsupported\n");
2956 exit(1);
c902760f 2957#endif
6977dfe6 2958 } else {
6b02494d 2959#if defined(TARGET_S390X) && defined(CONFIG_KVM)
ff83678a
CB
2960 /* S390 KVM requires the topmost vma of the RAM to be smaller than
2961 a system-defined value, which is at least 256GB. Larger systems
2962 have larger values. We put the guest between the end of data
2963 segment (system break) and this value. We use 32GB as a base to
2964 have enough room for the system break to grow. */
2965 new_block->host = mmap((void*)0x800000000, size,
6977dfe6 2966 PROT_EXEC|PROT_READ|PROT_WRITE,
ff83678a 2967 MAP_SHARED | MAP_ANONYMOUS | MAP_FIXED, -1, 0);
fb8b2735
AG
2968 if (new_block->host == MAP_FAILED) {
2969 fprintf(stderr, "Allocating RAM failed\n");
2970 abort();
2971 }
6b02494d 2972#else
868bb33f 2973 if (xen_enabled()) {
432d268c
JN
2974 xen_ram_alloc(new_block->offset, size);
2975 } else {
2976 new_block->host = qemu_vmalloc(size);
2977 }
6b02494d 2978#endif
e78815a5 2979 qemu_madvise(new_block->host, size, QEMU_MADV_MERGEABLE);
6977dfe6 2980 }
c902760f 2981 }
94a6b54f
PB
2982 new_block->length = size;
2983
f471a17e 2984 QLIST_INSERT_HEAD(&ram_list.blocks, new_block, next);
94a6b54f 2985
f471a17e 2986 ram_list.phys_dirty = qemu_realloc(ram_list.phys_dirty,
04b16653 2987 last_ram_offset() >> TARGET_PAGE_BITS);
d17b5288 2988 memset(ram_list.phys_dirty + (new_block->offset >> TARGET_PAGE_BITS),
94a6b54f
PB
2989 0xff, size >> TARGET_PAGE_BITS);
2990
6f0437e8
JK
2991 if (kvm_enabled())
2992 kvm_setup_guest_memory(new_block->host, size);
2993
94a6b54f
PB
2994 return new_block->offset;
2995}
e9a1ab19 2996
6977dfe6
YT
2997ram_addr_t qemu_ram_alloc(DeviceState *dev, const char *name, ram_addr_t size)
2998{
2999 return qemu_ram_alloc_from_ptr(dev, name, size, NULL);
3000}
3001
1f2e98b6
AW
3002void qemu_ram_free_from_ptr(ram_addr_t addr)
3003{
3004 RAMBlock *block;
3005
3006 QLIST_FOREACH(block, &ram_list.blocks, next) {
3007 if (addr == block->offset) {
3008 QLIST_REMOVE(block, next);
3009 qemu_free(block);
3010 return;
3011 }
3012 }
3013}
3014
c227f099 3015void qemu_ram_free(ram_addr_t addr)
e9a1ab19 3016{
04b16653
AW
3017 RAMBlock *block;
3018
3019 QLIST_FOREACH(block, &ram_list.blocks, next) {
3020 if (addr == block->offset) {
3021 QLIST_REMOVE(block, next);
cd19cfa2
HY
3022 if (block->flags & RAM_PREALLOC_MASK) {
3023 ;
3024 } else if (mem_path) {
04b16653
AW
3025#if defined (__linux__) && !defined(TARGET_S390X)
3026 if (block->fd) {
3027 munmap(block->host, block->length);
3028 close(block->fd);
3029 } else {
3030 qemu_vfree(block->host);
3031 }
fd28aa13
JK
3032#else
3033 abort();
04b16653
AW
3034#endif
3035 } else {
3036#if defined(TARGET_S390X) && defined(CONFIG_KVM)
3037 munmap(block->host, block->length);
3038#else
868bb33f 3039 if (xen_enabled()) {
e41d7c69 3040 xen_invalidate_map_cache_entry(block->host);
432d268c
JN
3041 } else {
3042 qemu_vfree(block->host);
3043 }
04b16653
AW
3044#endif
3045 }
3046 qemu_free(block);
3047 return;
3048 }
3049 }
3050
e9a1ab19
FB
3051}
3052
cd19cfa2
HY
3053#ifndef _WIN32
3054void qemu_ram_remap(ram_addr_t addr, ram_addr_t length)
3055{
3056 RAMBlock *block;
3057 ram_addr_t offset;
3058 int flags;
3059 void *area, *vaddr;
3060
3061 QLIST_FOREACH(block, &ram_list.blocks, next) {
3062 offset = addr - block->offset;
3063 if (offset < block->length) {
3064 vaddr = block->host + offset;
3065 if (block->flags & RAM_PREALLOC_MASK) {
3066 ;
3067 } else {
3068 flags = MAP_FIXED;
3069 munmap(vaddr, length);
3070 if (mem_path) {
3071#if defined(__linux__) && !defined(TARGET_S390X)
3072 if (block->fd) {
3073#ifdef MAP_POPULATE
3074 flags |= mem_prealloc ? MAP_POPULATE | MAP_SHARED :
3075 MAP_PRIVATE;
3076#else
3077 flags |= MAP_PRIVATE;
3078#endif
3079 area = mmap(vaddr, length, PROT_READ | PROT_WRITE,
3080 flags, block->fd, offset);
3081 } else {
3082 flags |= MAP_PRIVATE | MAP_ANONYMOUS;
3083 area = mmap(vaddr, length, PROT_READ | PROT_WRITE,
3084 flags, -1, 0);
3085 }
fd28aa13
JK
3086#else
3087 abort();
cd19cfa2
HY
3088#endif
3089 } else {
3090#if defined(TARGET_S390X) && defined(CONFIG_KVM)
3091 flags |= MAP_SHARED | MAP_ANONYMOUS;
3092 area = mmap(vaddr, length, PROT_EXEC|PROT_READ|PROT_WRITE,
3093 flags, -1, 0);
3094#else
3095 flags |= MAP_PRIVATE | MAP_ANONYMOUS;
3096 area = mmap(vaddr, length, PROT_READ | PROT_WRITE,
3097 flags, -1, 0);
3098#endif
3099 }
3100 if (area != vaddr) {
f15fbc4b
AP
3101 fprintf(stderr, "Could not remap addr: "
3102 RAM_ADDR_FMT "@" RAM_ADDR_FMT "\n",
cd19cfa2
HY
3103 length, addr);
3104 exit(1);
3105 }
3106 qemu_madvise(vaddr, length, QEMU_MADV_MERGEABLE);
3107 }
3108 return;
3109 }
3110 }
3111}
3112#endif /* !_WIN32 */
3113
dc828ca1 3114/* Return a host pointer to ram allocated with qemu_ram_alloc.
5579c7f3
PB
3115 With the exception of the softmmu code in this file, this should
3116 only be used for local memory (e.g. video ram) that the device owns,
3117 and knows it isn't going to access beyond the end of the block.
3118
3119 It should not be used for general purpose DMA.
3120 Use cpu_physical_memory_map/cpu_physical_memory_rw instead.
3121 */
c227f099 3122void *qemu_get_ram_ptr(ram_addr_t addr)
dc828ca1 3123{
94a6b54f
PB
3124 RAMBlock *block;
3125
f471a17e
AW
3126 QLIST_FOREACH(block, &ram_list.blocks, next) {
3127 if (addr - block->offset < block->length) {
7d82af38
VP
3128 /* Move this entry to the start of the list. */
3129 if (block != QLIST_FIRST(&ram_list.blocks)) {
3130 QLIST_REMOVE(block, next);
3131 QLIST_INSERT_HEAD(&ram_list.blocks, block, next);
3132 }
868bb33f 3133 if (xen_enabled()) {
432d268c
JN
3134 /* We need to check if the requested address is in the RAM
3135 * because we don't want to map the entire memory in QEMU.
712c2b41 3136 * In that case just map until the end of the page.
432d268c
JN
3137 */
3138 if (block->offset == 0) {
e41d7c69 3139 return xen_map_cache(addr, 0, 0);
432d268c 3140 } else if (block->host == NULL) {
e41d7c69
JK
3141 block->host =
3142 xen_map_cache(block->offset, block->length, 1);
432d268c
JN
3143 }
3144 }
f471a17e
AW
3145 return block->host + (addr - block->offset);
3146 }
94a6b54f 3147 }
f471a17e
AW
3148
3149 fprintf(stderr, "Bad ram offset %" PRIx64 "\n", (uint64_t)addr);
3150 abort();
3151
3152 return NULL;
dc828ca1
PB
3153}
3154
b2e0a138
MT
3155/* Return a host pointer to ram allocated with qemu_ram_alloc.
3156 * Same as qemu_get_ram_ptr but avoid reordering ramblocks.
3157 */
3158void *qemu_safe_ram_ptr(ram_addr_t addr)
3159{
3160 RAMBlock *block;
3161
3162 QLIST_FOREACH(block, &ram_list.blocks, next) {
3163 if (addr - block->offset < block->length) {
868bb33f 3164 if (xen_enabled()) {
432d268c
JN
3165 /* We need to check if the requested address is in the RAM
3166 * because we don't want to map the entire memory in QEMU.
712c2b41 3167 * In that case just map until the end of the page.
432d268c
JN
3168 */
3169 if (block->offset == 0) {
e41d7c69 3170 return xen_map_cache(addr, 0, 0);
432d268c 3171 } else if (block->host == NULL) {
e41d7c69
JK
3172 block->host =
3173 xen_map_cache(block->offset, block->length, 1);
432d268c
JN
3174 }
3175 }
b2e0a138
MT
3176 return block->host + (addr - block->offset);
3177 }
3178 }
3179
3180 fprintf(stderr, "Bad ram offset %" PRIx64 "\n", (uint64_t)addr);
3181 abort();
3182
3183 return NULL;
3184}
3185
38bee5dc
SS
3186/* Return a host pointer to guest's ram. Similar to qemu_get_ram_ptr
3187 * but takes a size argument */
8ab934f9 3188void *qemu_ram_ptr_length(ram_addr_t addr, ram_addr_t *size)
38bee5dc 3189{
8ab934f9
SS
3190 if (*size == 0) {
3191 return NULL;
3192 }
868bb33f 3193 if (xen_enabled()) {
e41d7c69 3194 return xen_map_cache(addr, *size, 1);
868bb33f 3195 } else {
38bee5dc
SS
3196 RAMBlock *block;
3197
3198 QLIST_FOREACH(block, &ram_list.blocks, next) {
3199 if (addr - block->offset < block->length) {
3200 if (addr - block->offset + *size > block->length)
3201 *size = block->length - addr + block->offset;
3202 return block->host + (addr - block->offset);
3203 }
3204 }
3205
3206 fprintf(stderr, "Bad ram offset %" PRIx64 "\n", (uint64_t)addr);
3207 abort();
38bee5dc
SS
3208 }
3209}
3210
050a0ddf
AP
3211void qemu_put_ram_ptr(void *addr)
3212{
3213 trace_qemu_put_ram_ptr(addr);
050a0ddf
AP
3214}
3215
e890261f 3216int qemu_ram_addr_from_host(void *ptr, ram_addr_t *ram_addr)
5579c7f3 3217{
94a6b54f
PB
3218 RAMBlock *block;
3219 uint8_t *host = ptr;
3220
868bb33f 3221 if (xen_enabled()) {
e41d7c69 3222 *ram_addr = xen_ram_addr_from_mapcache(ptr);
712c2b41
SS
3223 return 0;
3224 }
3225
f471a17e 3226 QLIST_FOREACH(block, &ram_list.blocks, next) {
432d268c
JN
3227 /* This case happens when the block is not mapped. */
3228 if (block->host == NULL) {
3229 continue;
3230 }
f471a17e 3231 if (host - block->host < block->length) {
e890261f
MT
3232 *ram_addr = block->offset + (host - block->host);
3233 return 0;
f471a17e 3234 }
94a6b54f 3235 }
432d268c 3236
e890261f
MT
3237 return -1;
3238}
f471a17e 3239
e890261f
MT
3240/* Some of the softmmu routines need to translate from a host pointer
3241 (typically a TLB entry) back to a ram offset. */
3242ram_addr_t qemu_ram_addr_from_host_nofail(void *ptr)
3243{
3244 ram_addr_t ram_addr;
f471a17e 3245
e890261f
MT
3246 if (qemu_ram_addr_from_host(ptr, &ram_addr)) {
3247 fprintf(stderr, "Bad ram pointer %p\n", ptr);
3248 abort();
3249 }
3250 return ram_addr;
5579c7f3
PB
3251}
3252
c227f099 3253static uint32_t unassigned_mem_readb(void *opaque, target_phys_addr_t addr)
33417e70 3254{
67d3b957 3255#ifdef DEBUG_UNASSIGNED
ab3d1727 3256 printf("Unassigned mem read " TARGET_FMT_plx "\n", addr);
b4f0a316 3257#endif
5b450407 3258#if defined(TARGET_ALPHA) || defined(TARGET_SPARC) || defined(TARGET_MICROBLAZE)
b14ef7c9 3259 cpu_unassigned_access(cpu_single_env, addr, 0, 0, 0, 1);
e18231a3
BS
3260#endif
3261 return 0;
3262}
3263
c227f099 3264static uint32_t unassigned_mem_readw(void *opaque, target_phys_addr_t addr)
e18231a3
BS
3265{
3266#ifdef DEBUG_UNASSIGNED
3267 printf("Unassigned mem read " TARGET_FMT_plx "\n", addr);
3268#endif
5b450407 3269#if defined(TARGET_ALPHA) || defined(TARGET_SPARC) || defined(TARGET_MICROBLAZE)
b14ef7c9 3270 cpu_unassigned_access(cpu_single_env, addr, 0, 0, 0, 2);
e18231a3
BS
3271#endif
3272 return 0;
3273}
3274
c227f099 3275static uint32_t unassigned_mem_readl(void *opaque, target_phys_addr_t addr)
e18231a3
BS
3276{
3277#ifdef DEBUG_UNASSIGNED
3278 printf("Unassigned mem read " TARGET_FMT_plx "\n", addr);
3279#endif
5b450407 3280#if defined(TARGET_ALPHA) || defined(TARGET_SPARC) || defined(TARGET_MICROBLAZE)
b14ef7c9 3281 cpu_unassigned_access(cpu_single_env, addr, 0, 0, 0, 4);
67d3b957 3282#endif
33417e70
FB
3283 return 0;
3284}
3285
c227f099 3286static void unassigned_mem_writeb(void *opaque, target_phys_addr_t addr, uint32_t val)
33417e70 3287{
67d3b957 3288#ifdef DEBUG_UNASSIGNED
ab3d1727 3289 printf("Unassigned mem write " TARGET_FMT_plx " = 0x%x\n", addr, val);
67d3b957 3290#endif
5b450407 3291#if defined(TARGET_ALPHA) || defined(TARGET_SPARC) || defined(TARGET_MICROBLAZE)
b14ef7c9 3292 cpu_unassigned_access(cpu_single_env, addr, 1, 0, 0, 1);
e18231a3
BS
3293#endif
3294}
3295
c227f099 3296static void unassigned_mem_writew(void *opaque, target_phys_addr_t addr, uint32_t val)
e18231a3
BS
3297{
3298#ifdef DEBUG_UNASSIGNED
3299 printf("Unassigned mem write " TARGET_FMT_plx " = 0x%x\n", addr, val);
3300#endif
5b450407 3301#if defined(TARGET_ALPHA) || defined(TARGET_SPARC) || defined(TARGET_MICROBLAZE)
b14ef7c9 3302 cpu_unassigned_access(cpu_single_env, addr, 1, 0, 0, 2);
e18231a3
BS
3303#endif
3304}
3305
c227f099 3306static void unassigned_mem_writel(void *opaque, target_phys_addr_t addr, uint32_t val)
e18231a3
BS
3307{
3308#ifdef DEBUG_UNASSIGNED
3309 printf("Unassigned mem write " TARGET_FMT_plx " = 0x%x\n", addr, val);
3310#endif
5b450407 3311#if defined(TARGET_ALPHA) || defined(TARGET_SPARC) || defined(TARGET_MICROBLAZE)
b14ef7c9 3312 cpu_unassigned_access(cpu_single_env, addr, 1, 0, 0, 4);
b4f0a316 3313#endif
33417e70
FB
3314}
3315
d60efc6b 3316static CPUReadMemoryFunc * const unassigned_mem_read[3] = {
33417e70 3317 unassigned_mem_readb,
e18231a3
BS
3318 unassigned_mem_readw,
3319 unassigned_mem_readl,
33417e70
FB
3320};
3321
d60efc6b 3322static CPUWriteMemoryFunc * const unassigned_mem_write[3] = {
33417e70 3323 unassigned_mem_writeb,
e18231a3
BS
3324 unassigned_mem_writew,
3325 unassigned_mem_writel,
33417e70
FB
3326};
3327
c227f099 3328static void notdirty_mem_writeb(void *opaque, target_phys_addr_t ram_addr,
0f459d16 3329 uint32_t val)
9fa3e853 3330{
3a7d929e 3331 int dirty_flags;
f7c11b53 3332 dirty_flags = cpu_physical_memory_get_dirty_flags(ram_addr);
3a7d929e 3333 if (!(dirty_flags & CODE_DIRTY_FLAG)) {
9fa3e853 3334#if !defined(CONFIG_USER_ONLY)
3a7d929e 3335 tb_invalidate_phys_page_fast(ram_addr, 1);
f7c11b53 3336 dirty_flags = cpu_physical_memory_get_dirty_flags(ram_addr);
9fa3e853 3337#endif
3a7d929e 3338 }
5579c7f3 3339 stb_p(qemu_get_ram_ptr(ram_addr), val);
f23db169 3340 dirty_flags |= (0xff & ~CODE_DIRTY_FLAG);
f7c11b53 3341 cpu_physical_memory_set_dirty_flags(ram_addr, dirty_flags);
f23db169
FB
3342 /* we remove the notdirty callback only if the code has been
3343 flushed */
3344 if (dirty_flags == 0xff)
2e70f6ef 3345 tlb_set_dirty(cpu_single_env, cpu_single_env->mem_io_vaddr);
9fa3e853
FB
3346}
3347
c227f099 3348static void notdirty_mem_writew(void *opaque, target_phys_addr_t ram_addr,
0f459d16 3349 uint32_t val)
9fa3e853 3350{
3a7d929e 3351 int dirty_flags;
f7c11b53 3352 dirty_flags = cpu_physical_memory_get_dirty_flags(ram_addr);
3a7d929e 3353 if (!(dirty_flags & CODE_DIRTY_FLAG)) {
9fa3e853 3354#if !defined(CONFIG_USER_ONLY)
3a7d929e 3355 tb_invalidate_phys_page_fast(ram_addr, 2);
f7c11b53 3356 dirty_flags = cpu_physical_memory_get_dirty_flags(ram_addr);
9fa3e853 3357#endif
3a7d929e 3358 }
5579c7f3 3359 stw_p(qemu_get_ram_ptr(ram_addr), val);
f23db169 3360 dirty_flags |= (0xff & ~CODE_DIRTY_FLAG);
f7c11b53 3361 cpu_physical_memory_set_dirty_flags(ram_addr, dirty_flags);
f23db169
FB
3362 /* we remove the notdirty callback only if the code has been
3363 flushed */
3364 if (dirty_flags == 0xff)
2e70f6ef 3365 tlb_set_dirty(cpu_single_env, cpu_single_env->mem_io_vaddr);
9fa3e853
FB
3366}
3367
c227f099 3368static void notdirty_mem_writel(void *opaque, target_phys_addr_t ram_addr,
0f459d16 3369 uint32_t val)
9fa3e853 3370{
3a7d929e 3371 int dirty_flags;
f7c11b53 3372 dirty_flags = cpu_physical_memory_get_dirty_flags(ram_addr);
3a7d929e 3373 if (!(dirty_flags & CODE_DIRTY_FLAG)) {
9fa3e853 3374#if !defined(CONFIG_USER_ONLY)
3a7d929e 3375 tb_invalidate_phys_page_fast(ram_addr, 4);
f7c11b53 3376 dirty_flags = cpu_physical_memory_get_dirty_flags(ram_addr);
9fa3e853 3377#endif
3a7d929e 3378 }
5579c7f3 3379 stl_p(qemu_get_ram_ptr(ram_addr), val);
f23db169 3380 dirty_flags |= (0xff & ~CODE_DIRTY_FLAG);
f7c11b53 3381 cpu_physical_memory_set_dirty_flags(ram_addr, dirty_flags);
f23db169
FB
3382 /* we remove the notdirty callback only if the code has been
3383 flushed */
3384 if (dirty_flags == 0xff)
2e70f6ef 3385 tlb_set_dirty(cpu_single_env, cpu_single_env->mem_io_vaddr);
9fa3e853
FB
3386}
3387
d60efc6b 3388static CPUReadMemoryFunc * const error_mem_read[3] = {
9fa3e853
FB
3389 NULL, /* never used */
3390 NULL, /* never used */
3391 NULL, /* never used */
3392};
3393
d60efc6b 3394static CPUWriteMemoryFunc * const notdirty_mem_write[3] = {
1ccde1cb
FB
3395 notdirty_mem_writeb,
3396 notdirty_mem_writew,
3397 notdirty_mem_writel,
3398};
3399
0f459d16 3400/* Generate a debug exception if a watchpoint has been hit. */
b4051334 3401static void check_watchpoint(int offset, int len_mask, int flags)
0f459d16
PB
3402{
3403 CPUState *env = cpu_single_env;
06d55cc1
AL
3404 target_ulong pc, cs_base;
3405 TranslationBlock *tb;
0f459d16 3406 target_ulong vaddr;
a1d1bb31 3407 CPUWatchpoint *wp;
06d55cc1 3408 int cpu_flags;
0f459d16 3409
06d55cc1
AL
3410 if (env->watchpoint_hit) {
3411 /* We re-entered the check after replacing the TB. Now raise
3412 * the debug interrupt so that it will trigger after the
3413 * current instruction. */
3414 cpu_interrupt(env, CPU_INTERRUPT_DEBUG);
3415 return;
3416 }
2e70f6ef 3417 vaddr = (env->mem_io_vaddr & TARGET_PAGE_MASK) + offset;
72cf2d4f 3418 QTAILQ_FOREACH(wp, &env->watchpoints, entry) {
b4051334
AL
3419 if ((vaddr == (wp->vaddr & len_mask) ||
3420 (vaddr & wp->len_mask) == wp->vaddr) && (wp->flags & flags)) {
6e140f28
AL
3421 wp->flags |= BP_WATCHPOINT_HIT;
3422 if (!env->watchpoint_hit) {
3423 env->watchpoint_hit = wp;
3424 tb = tb_find_pc(env->mem_io_pc);
3425 if (!tb) {
3426 cpu_abort(env, "check_watchpoint: could not find TB for "
3427 "pc=%p", (void *)env->mem_io_pc);
3428 }
618ba8e6 3429 cpu_restore_state(tb, env, env->mem_io_pc);
6e140f28
AL
3430 tb_phys_invalidate(tb, -1);
3431 if (wp->flags & BP_STOP_BEFORE_ACCESS) {
3432 env->exception_index = EXCP_DEBUG;
3433 } else {
3434 cpu_get_tb_cpu_state(env, &pc, &cs_base, &cpu_flags);
3435 tb_gen_code(env, pc, cs_base, cpu_flags, 1);
3436 }
3437 cpu_resume_from_signal(env, NULL);
06d55cc1 3438 }
6e140f28
AL
3439 } else {
3440 wp->flags &= ~BP_WATCHPOINT_HIT;
0f459d16
PB
3441 }
3442 }
3443}
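/* Illustrative sketch, not part of exec.c: how the two masked comparisons in
 * check_watchpoint() above detect overlap between an aligned access and an
 * aligned watchpoint range.  The access below is an assumed 4-byte load and
 * the watchpoint an assumed 8-byte range at 0x1008; only accesses touching
 * 0x1008..0x100f report a hit. */
#include <stdio.h>

int main(void)
{
    unsigned long wp_vaddr = 0x1008;                      /* watchpoint start */
    unsigned long wp_len_mask = ~(unsigned long)0x7;      /* 8-byte watchpoint */
    unsigned long access_len_mask = ~(unsigned long)0x3;  /* 4-byte access */
    unsigned long vaddr;

    for (vaddr = 0x1000; vaddr <= 0x1010; vaddr += 4) {
        int hit = (vaddr == (wp_vaddr & access_len_mask)) ||
                  ((vaddr & wp_len_mask) == wp_vaddr);
        printf("access at 0x%lx: %s\n", vaddr, hit ? "hit" : "miss");
    }
    return 0;
}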
3444
6658ffb8
PB
3445/* Watchpoint access routines. Watchpoints are inserted using TLB tricks,
3446 so these check for a hit then pass through to the normal out-of-line
3447 phys routines. */
c227f099 3448static uint32_t watch_mem_readb(void *opaque, target_phys_addr_t addr)
6658ffb8 3449{
b4051334 3450 check_watchpoint(addr & ~TARGET_PAGE_MASK, ~0x0, BP_MEM_READ);
6658ffb8
PB
3451 return ldub_phys(addr);
3452}
3453
c227f099 3454static uint32_t watch_mem_readw(void *opaque, target_phys_addr_t addr)
6658ffb8 3455{
b4051334 3456 check_watchpoint(addr & ~TARGET_PAGE_MASK, ~0x1, BP_MEM_READ);
6658ffb8
PB
3457 return lduw_phys(addr);
3458}
3459
c227f099 3460static uint32_t watch_mem_readl(void *opaque, target_phys_addr_t addr)
6658ffb8 3461{
b4051334 3462 check_watchpoint(addr & ~TARGET_PAGE_MASK, ~0x3, BP_MEM_READ);
6658ffb8
PB
3463 return ldl_phys(addr);
3464}
3465
c227f099 3466static void watch_mem_writeb(void *opaque, target_phys_addr_t addr,
6658ffb8
PB
3467 uint32_t val)
3468{
b4051334 3469 check_watchpoint(addr & ~TARGET_PAGE_MASK, ~0x0, BP_MEM_WRITE);
6658ffb8
PB
3470 stb_phys(addr, val);
3471}
3472
c227f099 3473static void watch_mem_writew(void *opaque, target_phys_addr_t addr,
6658ffb8
PB
3474 uint32_t val)
3475{
b4051334 3476 check_watchpoint(addr & ~TARGET_PAGE_MASK, ~0x1, BP_MEM_WRITE);
6658ffb8
PB
3477 stw_phys(addr, val);
3478}
3479
c227f099 3480static void watch_mem_writel(void *opaque, target_phys_addr_t addr,
6658ffb8
PB
3481 uint32_t val)
3482{
b4051334 3483 check_watchpoint(addr & ~TARGET_PAGE_MASK, ~0x3, BP_MEM_WRITE);
6658ffb8
PB
3484 stl_phys(addr, val);
3485}
3486
d60efc6b 3487static CPUReadMemoryFunc * const watch_mem_read[3] = {
6658ffb8
PB
3488 watch_mem_readb,
3489 watch_mem_readw,
3490 watch_mem_readl,
3491};
3492
d60efc6b 3493static CPUWriteMemoryFunc * const watch_mem_write[3] = {
6658ffb8
PB
3494 watch_mem_writeb,
3495 watch_mem_writew,
3496 watch_mem_writel,
3497};
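/* Editor's note (illustrative sketch, not part of the original file): the
 * len_mask argument used in the handlers above encodes the access size as
 * ~(size - 1), i.e. ~0x0 for byte, ~0x1 for word and ~0x3 for longword
 * accesses. */
#if 0
    /* e.g. a 4-byte guest read at vaddr 0x1002 inside the current page: */
    check_watchpoint(0x1002 & ~TARGET_PAGE_MASK, ~0x3, BP_MEM_READ);
#endif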
6658ffb8 3498
f6405247
RH
3499static inline uint32_t subpage_readlen (subpage_t *mmio,
3500 target_phys_addr_t addr,
3501 unsigned int len)
db7b5426 3502{
f6405247 3503 unsigned int idx = SUBPAGE_IDX(addr);
db7b5426
BS
3504#if defined(DEBUG_SUBPAGE)
3505 printf("%s: subpage %p len %d addr " TARGET_FMT_plx " idx %d\n", __func__,
3506 mmio, len, addr, idx);
3507#endif
db7b5426 3508
f6405247
RH
3509 addr += mmio->region_offset[idx];
3510 idx = mmio->sub_io_index[idx];
3511 return io_mem_read[idx][len](io_mem_opaque[idx], addr);
db7b5426
BS
3512}
3513
c227f099 3514static inline void subpage_writelen (subpage_t *mmio, target_phys_addr_t addr,
f6405247 3515 uint32_t value, unsigned int len)
db7b5426 3516{
f6405247 3517 unsigned int idx = SUBPAGE_IDX(addr);
db7b5426 3518#if defined(DEBUG_SUBPAGE)
f6405247
RH
3519 printf("%s: subpage %p len %d addr " TARGET_FMT_plx " idx %d value %08x\n",
3520 __func__, mmio, len, addr, idx, value);
db7b5426 3521#endif
f6405247
RH
3522
3523 addr += mmio->region_offset[idx];
3524 idx = mmio->sub_io_index[idx];
3525 io_mem_write[idx][len](io_mem_opaque[idx], addr, value);
db7b5426
BS
3526}
3527
c227f099 3528static uint32_t subpage_readb (void *opaque, target_phys_addr_t addr)
db7b5426 3529{
db7b5426
BS
3530 return subpage_readlen(opaque, addr, 0);
3531}
3532
c227f099 3533static void subpage_writeb (void *opaque, target_phys_addr_t addr,
db7b5426
BS
3534 uint32_t value)
3535{
db7b5426
BS
3536 subpage_writelen(opaque, addr, value, 0);
3537}
3538
c227f099 3539static uint32_t subpage_readw (void *opaque, target_phys_addr_t addr)
db7b5426 3540{
db7b5426
BS
3541 return subpage_readlen(opaque, addr, 1);
3542}
3543
c227f099 3544static void subpage_writew (void *opaque, target_phys_addr_t addr,
db7b5426
BS
3545 uint32_t value)
3546{
db7b5426
BS
3547 subpage_writelen(opaque, addr, value, 1);
3548}
3549
c227f099 3550static uint32_t subpage_readl (void *opaque, target_phys_addr_t addr)
db7b5426 3551{
db7b5426
BS
3552 return subpage_readlen(opaque, addr, 2);
3553}
3554
f6405247
RH
3555static void subpage_writel (void *opaque, target_phys_addr_t addr,
3556 uint32_t value)
db7b5426 3557{
db7b5426
BS
3558 subpage_writelen(opaque, addr, value, 2);
3559}
3560
d60efc6b 3561static CPUReadMemoryFunc * const subpage_read[] = {
db7b5426
BS
3562 &subpage_readb,
3563 &subpage_readw,
3564 &subpage_readl,
3565};
3566
d60efc6b 3567static CPUWriteMemoryFunc * const subpage_write[] = {
db7b5426
BS
3568 &subpage_writeb,
3569 &subpage_writew,
3570 &subpage_writel,
3571};
3572
c227f099
AL
3573static int subpage_register (subpage_t *mmio, uint32_t start, uint32_t end,
3574 ram_addr_t memory, ram_addr_t region_offset)
db7b5426
BS
3575{
3576 int idx, eidx;
3577
3578 if (start >= TARGET_PAGE_SIZE || end >= TARGET_PAGE_SIZE)
3579 return -1;
3580 idx = SUBPAGE_IDX(start);
3581 eidx = SUBPAGE_IDX(end);
3582#if defined(DEBUG_SUBPAGE)
0bf9e31a 3583 printf("%s: %p start %08x end %08x idx %08x eidx %08x mem %ld\n", __func__,
db7b5426
BS
3584 mmio, start, end, idx, eidx, memory);
3585#endif
95c318f5
GN
3586 if ((memory & ~TARGET_PAGE_MASK) == IO_MEM_RAM)
3587 memory = IO_MEM_UNASSIGNED;
f6405247 3588 memory = (memory >> IO_MEM_SHIFT) & (IO_MEM_NB_ENTRIES - 1);
db7b5426 3589 for (; idx <= eidx; idx++) {
f6405247
RH
3590 mmio->sub_io_index[idx] = memory;
3591 mmio->region_offset[idx] = region_offset;
db7b5426
BS
3592 }
3593
3594 return 0;
3595}
3596
f6405247
RH
3597static subpage_t *subpage_init (target_phys_addr_t base, ram_addr_t *phys,
3598 ram_addr_t orig_memory,
3599 ram_addr_t region_offset)
db7b5426 3600{
c227f099 3601 subpage_t *mmio;
db7b5426
BS
3602 int subpage_memory;
3603
c227f099 3604 mmio = qemu_mallocz(sizeof(subpage_t));
1eec614b
AL
3605
3606 mmio->base = base;
2507c12a
AG
3607 subpage_memory = cpu_register_io_memory(subpage_read, subpage_write, mmio,
3608 DEVICE_NATIVE_ENDIAN);
db7b5426 3609#if defined(DEBUG_SUBPAGE)
1eec614b
AL
3610 printf("%s: %p base " TARGET_FMT_plx " len %08x %d\n", __func__,
3611 mmio, base, TARGET_PAGE_SIZE, subpage_memory);
db7b5426 3612#endif
1eec614b 3613 *phys = subpage_memory | IO_MEM_SUBPAGE;
f6405247 3614 subpage_register(mmio, 0, TARGET_PAGE_SIZE-1, orig_memory, region_offset);
db7b5426
BS
3615
3616 return mmio;
3617}
3618
88715657
AL
3619static int get_free_io_mem_idx(void)
3620{
3621 int i;
3622
3623 for (i = 0; i<IO_MEM_NB_ENTRIES; i++)
3624 if (!io_mem_used[i]) {
3625 io_mem_used[i] = 1;
3626 return i;
3627 }
c6703b47 3628 fprintf(stderr, "Ran out of io_mem_idx, max %d!\n", IO_MEM_NB_ENTRIES);
88715657
AL
3629 return -1;
3630}
3631
dd310534
AG
3632/*
3633 * Usually, devices operate in little endian mode. There are devices out
 3634 * there that operate in big endian too. Each device gets byte-swapped
 3635 * mmio if plugged onto a CPU that uses the other endianness.
3636 *
3637 * CPU Device swap?
3638 *
3639 * little little no
3640 * little big yes
3641 * big little yes
3642 * big big no
3643 */
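/* Editor's illustrative example (not from the original source): with a
 * little-endian CPU and a big-endian device, a 16-bit device register
 * holding 0x1234 is presented as the bytes 12 34; read raw by the CPU that
 * is 0x3412, so the wrappers below undo it with bswap16()/bswap32(). */
#if 0
    uint16_t raw   = 0x3412;          /* what an unswapped read would see */
    uint16_t fixed = bswap16(raw);    /* == 0x1234, the device's value */
#endif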
3644
3645typedef struct SwapEndianContainer {
3646 CPUReadMemoryFunc *read[3];
3647 CPUWriteMemoryFunc *write[3];
3648 void *opaque;
3649} SwapEndianContainer;
3650
3651static uint32_t swapendian_mem_readb (void *opaque, target_phys_addr_t addr)
3652{
3653 uint32_t val;
3654 SwapEndianContainer *c = opaque;
3655 val = c->read[0](c->opaque, addr);
3656 return val;
3657}
3658
3659static uint32_t swapendian_mem_readw(void *opaque, target_phys_addr_t addr)
3660{
3661 uint32_t val;
3662 SwapEndianContainer *c = opaque;
3663 val = bswap16(c->read[1](c->opaque, addr));
3664 return val;
3665}
3666
3667static uint32_t swapendian_mem_readl(void *opaque, target_phys_addr_t addr)
3668{
3669 uint32_t val;
3670 SwapEndianContainer *c = opaque;
3671 val = bswap32(c->read[2](c->opaque, addr));
3672 return val;
3673}
3674
3675static CPUReadMemoryFunc * const swapendian_readfn[3]={
3676 swapendian_mem_readb,
3677 swapendian_mem_readw,
3678 swapendian_mem_readl
3679};
3680
3681static void swapendian_mem_writeb(void *opaque, target_phys_addr_t addr,
3682 uint32_t val)
3683{
3684 SwapEndianContainer *c = opaque;
3685 c->write[0](c->opaque, addr, val);
3686}
3687
3688static void swapendian_mem_writew(void *opaque, target_phys_addr_t addr,
3689 uint32_t val)
3690{
3691 SwapEndianContainer *c = opaque;
3692 c->write[1](c->opaque, addr, bswap16(val));
3693}
3694
3695static void swapendian_mem_writel(void *opaque, target_phys_addr_t addr,
3696 uint32_t val)
3697{
3698 SwapEndianContainer *c = opaque;
3699 c->write[2](c->opaque, addr, bswap32(val));
3700}
3701
3702static CPUWriteMemoryFunc * const swapendian_writefn[3]={
3703 swapendian_mem_writeb,
3704 swapendian_mem_writew,
3705 swapendian_mem_writel
3706};
3707
3708static void swapendian_init(int io_index)
3709{
3710 SwapEndianContainer *c = qemu_malloc(sizeof(SwapEndianContainer));
3711 int i;
3712
3713 /* Swap mmio for big endian targets */
3714 c->opaque = io_mem_opaque[io_index];
3715 for (i = 0; i < 3; i++) {
3716 c->read[i] = io_mem_read[io_index][i];
3717 c->write[i] = io_mem_write[io_index][i];
3718
3719 io_mem_read[io_index][i] = swapendian_readfn[i];
3720 io_mem_write[io_index][i] = swapendian_writefn[i];
3721 }
3722 io_mem_opaque[io_index] = c;
3723}
3724
3725static void swapendian_del(int io_index)
3726{
3727 if (io_mem_read[io_index][0] == swapendian_readfn[0]) {
3728 qemu_free(io_mem_opaque[io_index]);
3729 }
3730}
3731
33417e70
FB
3732/* mem_read and mem_write are arrays of functions containing the
3733 function to access byte (index 0), word (index 1) and dword (index
0b4e6e3e 3734 2). Functions can be omitted with a NULL function pointer.
3ee89922 3735 If io_index is non-zero, the corresponding io zone is
4254fab8
BS
3736 modified. If it is zero, a new io zone is allocated. The return
 3737 value can be used with cpu_register_physical_memory(). -1 is
 3738 returned on error. */
1eed09cb 3739static int cpu_register_io_memory_fixed(int io_index,
d60efc6b
BS
3740 CPUReadMemoryFunc * const *mem_read,
3741 CPUWriteMemoryFunc * const *mem_write,
dd310534 3742 void *opaque, enum device_endian endian)
33417e70 3743{
3cab721d
RH
3744 int i;
3745
33417e70 3746 if (io_index <= 0) {
88715657
AL
3747 io_index = get_free_io_mem_idx();
3748 if (io_index == -1)
3749 return io_index;
33417e70 3750 } else {
1eed09cb 3751 io_index >>= IO_MEM_SHIFT;
33417e70
FB
3752 if (io_index >= IO_MEM_NB_ENTRIES)
3753 return -1;
3754 }
b5ff1b31 3755
3cab721d
RH
3756 for (i = 0; i < 3; ++i) {
3757 io_mem_read[io_index][i]
3758 = (mem_read[i] ? mem_read[i] : unassigned_mem_read[i]);
3759 }
3760 for (i = 0; i < 3; ++i) {
3761 io_mem_write[io_index][i]
3762 = (mem_write[i] ? mem_write[i] : unassigned_mem_write[i]);
3763 }
a4193c8a 3764 io_mem_opaque[io_index] = opaque;
f6405247 3765
dd310534
AG
3766 switch (endian) {
3767 case DEVICE_BIG_ENDIAN:
3768#ifndef TARGET_WORDS_BIGENDIAN
3769 swapendian_init(io_index);
3770#endif
3771 break;
3772 case DEVICE_LITTLE_ENDIAN:
3773#ifdef TARGET_WORDS_BIGENDIAN
3774 swapendian_init(io_index);
3775#endif
3776 break;
3777 case DEVICE_NATIVE_ENDIAN:
3778 default:
3779 break;
3780 }
3781
f6405247 3782 return (io_index << IO_MEM_SHIFT);
33417e70 3783}
61382a50 3784
d60efc6b
BS
3785int cpu_register_io_memory(CPUReadMemoryFunc * const *mem_read,
3786 CPUWriteMemoryFunc * const *mem_write,
dd310534 3787 void *opaque, enum device_endian endian)
1eed09cb 3788{
2507c12a 3789 return cpu_register_io_memory_fixed(0, mem_read, mem_write, opaque, endian);
1eed09cb
AK
3790}
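/* Editor's usage sketch (hypothetical device, not part of exec.c): a device
 * model registers its callback tables and then maps them at a guest
 * physical address; the MY_DEV_* constants and my_dev_* callbacks are
 * invented for illustration. */
#if 0
static CPUReadMemoryFunc * const my_dev_read[3] = {
    my_dev_readb, my_dev_readw, my_dev_readl,
};
static CPUWriteMemoryFunc * const my_dev_write[3] = {
    my_dev_writeb, my_dev_writew, my_dev_writel,
};

static void my_dev_map(void *opaque)
{
    int iomemtype = cpu_register_io_memory(my_dev_read, my_dev_write,
                                           opaque, DEVICE_NATIVE_ENDIAN);
    cpu_register_physical_memory(MY_DEV_BASE, TARGET_PAGE_SIZE, iomemtype);
}
#endif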
3791
88715657
AL
3792void cpu_unregister_io_memory(int io_table_address)
3793{
3794 int i;
3795 int io_index = io_table_address >> IO_MEM_SHIFT;
3796
dd310534
AG
3797 swapendian_del(io_index);
3798
88715657
AL
3799 for (i=0;i < 3; i++) {
3800 io_mem_read[io_index][i] = unassigned_mem_read[i];
3801 io_mem_write[io_index][i] = unassigned_mem_write[i];
3802 }
3803 io_mem_opaque[io_index] = NULL;
3804 io_mem_used[io_index] = 0;
3805}
3806
e9179ce1
AK
3807static void io_mem_init(void)
3808{
3809 int i;
3810
2507c12a
AG
3811 cpu_register_io_memory_fixed(IO_MEM_ROM, error_mem_read,
3812 unassigned_mem_write, NULL,
3813 DEVICE_NATIVE_ENDIAN);
3814 cpu_register_io_memory_fixed(IO_MEM_UNASSIGNED, unassigned_mem_read,
3815 unassigned_mem_write, NULL,
3816 DEVICE_NATIVE_ENDIAN);
3817 cpu_register_io_memory_fixed(IO_MEM_NOTDIRTY, error_mem_read,
3818 notdirty_mem_write, NULL,
3819 DEVICE_NATIVE_ENDIAN);
e9179ce1
AK
3820 for (i=0; i<5; i++)
3821 io_mem_used[i] = 1;
3822
3823 io_mem_watch = cpu_register_io_memory(watch_mem_read,
2507c12a
AG
3824 watch_mem_write, NULL,
3825 DEVICE_NATIVE_ENDIAN);
e9179ce1
AK
3826}
3827
62152b8a
AK
3828static void memory_map_init(void)
3829{
3830 system_memory = qemu_malloc(sizeof(*system_memory));
8417cebf 3831 memory_region_init(system_memory, "system", INT64_MAX);
62152b8a
AK
3832 set_system_memory_map(system_memory);
3833}
3834
3835MemoryRegion *get_system_memory(void)
3836{
3837 return system_memory;
3838}
3839
e2eef170
PB
3840#endif /* !defined(CONFIG_USER_ONLY) */
3841
13eb76e0
FB
3842/* physical memory access (slow version, mainly for debug) */
3843#if defined(CONFIG_USER_ONLY)
a68fe89c
PB
3844int cpu_memory_rw_debug(CPUState *env, target_ulong addr,
3845 uint8_t *buf, int len, int is_write)
13eb76e0
FB
3846{
3847 int l, flags;
3848 target_ulong page;
53a5960a 3849 void * p;
13eb76e0
FB
3850
3851 while (len > 0) {
3852 page = addr & TARGET_PAGE_MASK;
3853 l = (page + TARGET_PAGE_SIZE) - addr;
3854 if (l > len)
3855 l = len;
3856 flags = page_get_flags(page);
3857 if (!(flags & PAGE_VALID))
a68fe89c 3858 return -1;
13eb76e0
FB
3859 if (is_write) {
3860 if (!(flags & PAGE_WRITE))
a68fe89c 3861 return -1;
579a97f7 3862 /* XXX: this code should not depend on lock_user */
72fb7daa 3863 if (!(p = lock_user(VERIFY_WRITE, addr, l, 0)))
a68fe89c 3864 return -1;
72fb7daa
AJ
3865 memcpy(p, buf, l);
3866 unlock_user(p, addr, l);
13eb76e0
FB
3867 } else {
3868 if (!(flags & PAGE_READ))
a68fe89c 3869 return -1;
579a97f7 3870 /* XXX: this code should not depend on lock_user */
72fb7daa 3871 if (!(p = lock_user(VERIFY_READ, addr, l, 1)))
a68fe89c 3872 return -1;
72fb7daa 3873 memcpy(buf, p, l);
5b257578 3874 unlock_user(p, addr, 0);
13eb76e0
FB
3875 }
3876 len -= l;
3877 buf += l;
3878 addr += l;
3879 }
a68fe89c 3880 return 0;
13eb76e0 3881}
8df1cd07 3882
13eb76e0 3883#else
c227f099 3884void cpu_physical_memory_rw(target_phys_addr_t addr, uint8_t *buf,
13eb76e0
FB
3885 int len, int is_write)
3886{
3887 int l, io_index;
3888 uint8_t *ptr;
3889 uint32_t val;
c227f099 3890 target_phys_addr_t page;
8ca5692d 3891 ram_addr_t pd;
92e873b9 3892 PhysPageDesc *p;
3b46e624 3893
13eb76e0
FB
3894 while (len > 0) {
3895 page = addr & TARGET_PAGE_MASK;
3896 l = (page + TARGET_PAGE_SIZE) - addr;
3897 if (l > len)
3898 l = len;
92e873b9 3899 p = phys_page_find(page >> TARGET_PAGE_BITS);
13eb76e0
FB
3900 if (!p) {
3901 pd = IO_MEM_UNASSIGNED;
3902 } else {
3903 pd = p->phys_offset;
3904 }
3b46e624 3905
13eb76e0 3906 if (is_write) {
3a7d929e 3907 if ((pd & ~TARGET_PAGE_MASK) != IO_MEM_RAM) {
c227f099 3908 target_phys_addr_t addr1 = addr;
13eb76e0 3909 io_index = (pd >> IO_MEM_SHIFT) & (IO_MEM_NB_ENTRIES - 1);
8da3ff18 3910 if (p)
6c2934db 3911 addr1 = (addr & ~TARGET_PAGE_MASK) + p->region_offset;
6a00d601
FB
3912 /* XXX: could force cpu_single_env to NULL to avoid
3913 potential bugs */
6c2934db 3914 if (l >= 4 && ((addr1 & 3) == 0)) {
1c213d19 3915 /* 32 bit write access */
c27004ec 3916 val = ldl_p(buf);
6c2934db 3917 io_mem_write[io_index][2](io_mem_opaque[io_index], addr1, val);
13eb76e0 3918 l = 4;
6c2934db 3919 } else if (l >= 2 && ((addr1 & 1) == 0)) {
1c213d19 3920 /* 16 bit write access */
c27004ec 3921 val = lduw_p(buf);
6c2934db 3922 io_mem_write[io_index][1](io_mem_opaque[io_index], addr1, val);
13eb76e0
FB
3923 l = 2;
3924 } else {
1c213d19 3925 /* 8 bit write access */
c27004ec 3926 val = ldub_p(buf);
6c2934db 3927 io_mem_write[io_index][0](io_mem_opaque[io_index], addr1, val);
13eb76e0
FB
3928 l = 1;
3929 }
3930 } else {
8ca5692d 3931 ram_addr_t addr1;
b448f2f3 3932 addr1 = (pd & TARGET_PAGE_MASK) + (addr & ~TARGET_PAGE_MASK);
13eb76e0 3933 /* RAM case */
5579c7f3 3934 ptr = qemu_get_ram_ptr(addr1);
13eb76e0 3935 memcpy(ptr, buf, l);
3a7d929e
FB
3936 if (!cpu_physical_memory_is_dirty(addr1)) {
3937 /* invalidate code */
3938 tb_invalidate_phys_page_range(addr1, addr1 + l, 0);
3939 /* set dirty bit */
f7c11b53
YT
3940 cpu_physical_memory_set_dirty_flags(
3941 addr1, (0xff & ~CODE_DIRTY_FLAG));
3a7d929e 3942 }
050a0ddf 3943 qemu_put_ram_ptr(ptr);
13eb76e0
FB
3944 }
3945 } else {
5fafdf24 3946 if ((pd & ~TARGET_PAGE_MASK) > IO_MEM_ROM &&
2a4188a3 3947 !(pd & IO_MEM_ROMD)) {
c227f099 3948 target_phys_addr_t addr1 = addr;
13eb76e0
FB
3949 /* I/O case */
3950 io_index = (pd >> IO_MEM_SHIFT) & (IO_MEM_NB_ENTRIES - 1);
8da3ff18 3951 if (p)
6c2934db
AJ
3952 addr1 = (addr & ~TARGET_PAGE_MASK) + p->region_offset;
3953 if (l >= 4 && ((addr1 & 3) == 0)) {
13eb76e0 3954 /* 32 bit read access */
6c2934db 3955 val = io_mem_read[io_index][2](io_mem_opaque[io_index], addr1);
c27004ec 3956 stl_p(buf, val);
13eb76e0 3957 l = 4;
6c2934db 3958 } else if (l >= 2 && ((addr1 & 1) == 0)) {
13eb76e0 3959 /* 16 bit read access */
6c2934db 3960 val = io_mem_read[io_index][1](io_mem_opaque[io_index], addr1);
c27004ec 3961 stw_p(buf, val);
13eb76e0
FB
3962 l = 2;
3963 } else {
1c213d19 3964 /* 8 bit read access */
6c2934db 3965 val = io_mem_read[io_index][0](io_mem_opaque[io_index], addr1);
c27004ec 3966 stb_p(buf, val);
13eb76e0
FB
3967 l = 1;
3968 }
3969 } else {
3970 /* RAM case */
050a0ddf
AP
3971 ptr = qemu_get_ram_ptr(pd & TARGET_PAGE_MASK);
3972 memcpy(buf, ptr + (addr & ~TARGET_PAGE_MASK), l);
3973 qemu_put_ram_ptr(ptr);
13eb76e0
FB
3974 }
3975 }
3976 len -= l;
3977 buf += l;
3978 addr += l;
3979 }
3980}
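/* Editor's usage sketch (not part of the original file): callers usually go
 * through the cpu_physical_memory_read()/write() wrappers, which expand to
 * cpu_physical_memory_rw(); "gpa" is a hypothetical guest physical
 * address. */
#if 0
    uint32_t scratch[4];
    cpu_physical_memory_read(gpa, (uint8_t *)scratch, sizeof(scratch));
    scratch[0] = cpu_to_le32(0xdeadbeef);
    cpu_physical_memory_write(gpa, (uint8_t *)scratch, sizeof(scratch));
#endif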
8df1cd07 3981
d0ecd2aa 3982/* used for ROM loading : can write in RAM and ROM */
c227f099 3983void cpu_physical_memory_write_rom(target_phys_addr_t addr,
d0ecd2aa
FB
3984 const uint8_t *buf, int len)
3985{
3986 int l;
3987 uint8_t *ptr;
c227f099 3988 target_phys_addr_t page;
d0ecd2aa
FB
3989 unsigned long pd;
3990 PhysPageDesc *p;
3b46e624 3991
d0ecd2aa
FB
3992 while (len > 0) {
3993 page = addr & TARGET_PAGE_MASK;
3994 l = (page + TARGET_PAGE_SIZE) - addr;
3995 if (l > len)
3996 l = len;
3997 p = phys_page_find(page >> TARGET_PAGE_BITS);
3998 if (!p) {
3999 pd = IO_MEM_UNASSIGNED;
4000 } else {
4001 pd = p->phys_offset;
4002 }
3b46e624 4003
d0ecd2aa 4004 if ((pd & ~TARGET_PAGE_MASK) != IO_MEM_RAM &&
2a4188a3
FB
4005 (pd & ~TARGET_PAGE_MASK) != IO_MEM_ROM &&
4006 !(pd & IO_MEM_ROMD)) {
d0ecd2aa
FB
4007 /* do nothing */
4008 } else {
4009 unsigned long addr1;
4010 addr1 = (pd & TARGET_PAGE_MASK) + (addr & ~TARGET_PAGE_MASK);
4011 /* ROM/RAM case */
5579c7f3 4012 ptr = qemu_get_ram_ptr(addr1);
d0ecd2aa 4013 memcpy(ptr, buf, l);
050a0ddf 4014 qemu_put_ram_ptr(ptr);
d0ecd2aa
FB
4015 }
4016 len -= l;
4017 buf += l;
4018 addr += l;
4019 }
4020}
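/* Editor's usage sketch (hypothetical firmware loader, not part of exec.c):
 * copying a boot blob into guest memory regardless of whether the target
 * area is RAM or ROM; "ROM_BASE", "blob" and "blob_len" are invented
 * names. */
#if 0
    cpu_physical_memory_write_rom(ROM_BASE, blob, blob_len);
#endif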
4021
6d16c2f8
AL
4022typedef struct {
4023 void *buffer;
c227f099
AL
4024 target_phys_addr_t addr;
4025 target_phys_addr_t len;
6d16c2f8
AL
4026} BounceBuffer;
4027
4028static BounceBuffer bounce;
4029
ba223c29
AL
4030typedef struct MapClient {
4031 void *opaque;
4032 void (*callback)(void *opaque);
72cf2d4f 4033 QLIST_ENTRY(MapClient) link;
ba223c29
AL
4034} MapClient;
4035
72cf2d4f
BS
4036static QLIST_HEAD(map_client_list, MapClient) map_client_list
4037 = QLIST_HEAD_INITIALIZER(map_client_list);
ba223c29
AL
4038
4039void *cpu_register_map_client(void *opaque, void (*callback)(void *opaque))
4040{
4041 MapClient *client = qemu_malloc(sizeof(*client));
4042
4043 client->opaque = opaque;
4044 client->callback = callback;
72cf2d4f 4045 QLIST_INSERT_HEAD(&map_client_list, client, link);
ba223c29
AL
4046 return client;
4047}
4048
4049void cpu_unregister_map_client(void *_client)
4050{
4051 MapClient *client = (MapClient *)_client;
4052
72cf2d4f 4053 QLIST_REMOVE(client, link);
34d5e948 4054 qemu_free(client);
ba223c29
AL
4055}
4056
4057static void cpu_notify_map_clients(void)
4058{
4059 MapClient *client;
4060
72cf2d4f
BS
4061 while (!QLIST_EMPTY(&map_client_list)) {
4062 client = QLIST_FIRST(&map_client_list);
ba223c29 4063 client->callback(client->opaque);
34d5e948 4064 cpu_unregister_map_client(client);
ba223c29
AL
4065 }
4066}
4067
6d16c2f8
AL
4068/* Map a physical memory region into a host virtual address.
4069 * May map a subset of the requested range, given by and returned in *plen.
4070 * May return NULL if resources needed to perform the mapping are exhausted.
4071 * Use only for reads OR writes - not for read-modify-write operations.
ba223c29
AL
4072 * Use cpu_register_map_client() to know when retrying the map operation is
4073 * likely to succeed.
6d16c2f8 4074 */
c227f099
AL
4075void *cpu_physical_memory_map(target_phys_addr_t addr,
4076 target_phys_addr_t *plen,
6d16c2f8
AL
4077 int is_write)
4078{
c227f099 4079 target_phys_addr_t len = *plen;
38bee5dc 4080 target_phys_addr_t todo = 0;
6d16c2f8 4081 int l;
c227f099 4082 target_phys_addr_t page;
6d16c2f8
AL
4083 unsigned long pd;
4084 PhysPageDesc *p;
f15fbc4b 4085 ram_addr_t raddr = RAM_ADDR_MAX;
8ab934f9
SS
4086 ram_addr_t rlen;
4087 void *ret;
6d16c2f8
AL
4088
4089 while (len > 0) {
4090 page = addr & TARGET_PAGE_MASK;
4091 l = (page + TARGET_PAGE_SIZE) - addr;
4092 if (l > len)
4093 l = len;
4094 p = phys_page_find(page >> TARGET_PAGE_BITS);
4095 if (!p) {
4096 pd = IO_MEM_UNASSIGNED;
4097 } else {
4098 pd = p->phys_offset;
4099 }
4100
4101 if ((pd & ~TARGET_PAGE_MASK) != IO_MEM_RAM) {
38bee5dc 4102 if (todo || bounce.buffer) {
6d16c2f8
AL
4103 break;
4104 }
4105 bounce.buffer = qemu_memalign(TARGET_PAGE_SIZE, TARGET_PAGE_SIZE);
4106 bounce.addr = addr;
4107 bounce.len = l;
4108 if (!is_write) {
54f7b4a3 4109 cpu_physical_memory_read(addr, bounce.buffer, l);
6d16c2f8 4110 }
38bee5dc
SS
4111
4112 *plen = l;
4113 return bounce.buffer;
6d16c2f8 4114 }
8ab934f9
SS
4115 if (!todo) {
4116 raddr = (pd & TARGET_PAGE_MASK) + (addr & ~TARGET_PAGE_MASK);
4117 }
6d16c2f8
AL
4118
4119 len -= l;
4120 addr += l;
38bee5dc 4121 todo += l;
6d16c2f8 4122 }
8ab934f9
SS
4123 rlen = todo;
4124 ret = qemu_ram_ptr_length(raddr, &rlen);
4125 *plen = rlen;
4126 return ret;
6d16c2f8
AL
4127}
4128
4129/* Unmaps a memory region previously mapped by cpu_physical_memory_map().
4130 * Will also mark the memory as dirty if is_write == 1. access_len gives
4131 * the amount of memory that was actually read or written by the caller.
4132 */
c227f099
AL
4133void cpu_physical_memory_unmap(void *buffer, target_phys_addr_t len,
4134 int is_write, target_phys_addr_t access_len)
6d16c2f8
AL
4135{
4136 if (buffer != bounce.buffer) {
4137 if (is_write) {
e890261f 4138 ram_addr_t addr1 = qemu_ram_addr_from_host_nofail(buffer);
6d16c2f8
AL
4139 while (access_len) {
4140 unsigned l;
4141 l = TARGET_PAGE_SIZE;
4142 if (l > access_len)
4143 l = access_len;
4144 if (!cpu_physical_memory_is_dirty(addr1)) {
4145 /* invalidate code */
4146 tb_invalidate_phys_page_range(addr1, addr1 + l, 0);
4147 /* set dirty bit */
f7c11b53
YT
4148 cpu_physical_memory_set_dirty_flags(
4149 addr1, (0xff & ~CODE_DIRTY_FLAG));
6d16c2f8
AL
4150 }
4151 addr1 += l;
4152 access_len -= l;
4153 }
4154 }
868bb33f 4155 if (xen_enabled()) {
e41d7c69 4156 xen_invalidate_map_cache_entry(buffer);
050a0ddf 4157 }
6d16c2f8
AL
4158 return;
4159 }
4160 if (is_write) {
4161 cpu_physical_memory_write(bounce.addr, bounce.buffer, access_len);
4162 }
f8a83245 4163 qemu_vfree(bounce.buffer);
6d16c2f8 4164 bounce.buffer = NULL;
ba223c29 4165 cpu_notify_map_clients();
6d16c2f8 4166}
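/* Editor's usage sketch (hypothetical DMA helper, not part of exec.c): the
 * usual pairing of map and unmap described in the comments above;
 * "dma_addr", "dma_len", "opaque" and "retry_cb" are invented names. */
#if 0
    target_phys_addr_t plen = dma_len;
    uint8_t *host = cpu_physical_memory_map(dma_addr, &plen, 1 /* write */);
    if (host) {
        memset(host, 0, plen);              /* only 'plen' bytes were mapped */
        cpu_physical_memory_unmap(host, plen, 1, plen);
    } else {
        /* resources exhausted: register a callback and retry later */
        cpu_register_map_client(opaque, retry_cb);
    }
#endif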
d0ecd2aa 4167
8df1cd07 4168/* warning: addr must be aligned */
1e78bcc1
AG
4169static inline uint32_t ldl_phys_internal(target_phys_addr_t addr,
4170 enum device_endian endian)
8df1cd07
FB
4171{
4172 int io_index;
4173 uint8_t *ptr;
4174 uint32_t val;
4175 unsigned long pd;
4176 PhysPageDesc *p;
4177
4178 p = phys_page_find(addr >> TARGET_PAGE_BITS);
4179 if (!p) {
4180 pd = IO_MEM_UNASSIGNED;
4181 } else {
4182 pd = p->phys_offset;
4183 }
3b46e624 4184
5fafdf24 4185 if ((pd & ~TARGET_PAGE_MASK) > IO_MEM_ROM &&
2a4188a3 4186 !(pd & IO_MEM_ROMD)) {
8df1cd07
FB
4187 /* I/O case */
4188 io_index = (pd >> IO_MEM_SHIFT) & (IO_MEM_NB_ENTRIES - 1);
8da3ff18
PB
4189 if (p)
4190 addr = (addr & ~TARGET_PAGE_MASK) + p->region_offset;
8df1cd07 4191 val = io_mem_read[io_index][2](io_mem_opaque[io_index], addr);
1e78bcc1
AG
4192#if defined(TARGET_WORDS_BIGENDIAN)
4193 if (endian == DEVICE_LITTLE_ENDIAN) {
4194 val = bswap32(val);
4195 }
4196#else
4197 if (endian == DEVICE_BIG_ENDIAN) {
4198 val = bswap32(val);
4199 }
4200#endif
8df1cd07
FB
4201 } else {
4202 /* RAM case */
5579c7f3 4203 ptr = qemu_get_ram_ptr(pd & TARGET_PAGE_MASK) +
8df1cd07 4204 (addr & ~TARGET_PAGE_MASK);
1e78bcc1
AG
4205 switch (endian) {
4206 case DEVICE_LITTLE_ENDIAN:
4207 val = ldl_le_p(ptr);
4208 break;
4209 case DEVICE_BIG_ENDIAN:
4210 val = ldl_be_p(ptr);
4211 break;
4212 default:
4213 val = ldl_p(ptr);
4214 break;
4215 }
8df1cd07
FB
4216 }
4217 return val;
4218}
4219
1e78bcc1
AG
4220uint32_t ldl_phys(target_phys_addr_t addr)
4221{
4222 return ldl_phys_internal(addr, DEVICE_NATIVE_ENDIAN);
4223}
4224
4225uint32_t ldl_le_phys(target_phys_addr_t addr)
4226{
4227 return ldl_phys_internal(addr, DEVICE_LITTLE_ENDIAN);
4228}
4229
4230uint32_t ldl_be_phys(target_phys_addr_t addr)
4231{
4232 return ldl_phys_internal(addr, DEVICE_BIG_ENDIAN);
4233}
4234
84b7b8e7 4235/* warning: addr must be aligned */
1e78bcc1
AG
4236static inline uint64_t ldq_phys_internal(target_phys_addr_t addr,
4237 enum device_endian endian)
84b7b8e7
FB
4238{
4239 int io_index;
4240 uint8_t *ptr;
4241 uint64_t val;
4242 unsigned long pd;
4243 PhysPageDesc *p;
4244
4245 p = phys_page_find(addr >> TARGET_PAGE_BITS);
4246 if (!p) {
4247 pd = IO_MEM_UNASSIGNED;
4248 } else {
4249 pd = p->phys_offset;
4250 }
3b46e624 4251
2a4188a3
FB
4252 if ((pd & ~TARGET_PAGE_MASK) > IO_MEM_ROM &&
4253 !(pd & IO_MEM_ROMD)) {
84b7b8e7
FB
4254 /* I/O case */
4255 io_index = (pd >> IO_MEM_SHIFT) & (IO_MEM_NB_ENTRIES - 1);
8da3ff18
PB
4256 if (p)
4257 addr = (addr & ~TARGET_PAGE_MASK) + p->region_offset;
1e78bcc1
AG
4258
4259 /* XXX This is broken when device endian != cpu endian.
4260 Fix and add "endian" variable check */
84b7b8e7
FB
4261#ifdef TARGET_WORDS_BIGENDIAN
4262 val = (uint64_t)io_mem_read[io_index][2](io_mem_opaque[io_index], addr) << 32;
4263 val |= io_mem_read[io_index][2](io_mem_opaque[io_index], addr + 4);
4264#else
4265 val = io_mem_read[io_index][2](io_mem_opaque[io_index], addr);
4266 val |= (uint64_t)io_mem_read[io_index][2](io_mem_opaque[io_index], addr + 4) << 32;
4267#endif
4268 } else {
4269 /* RAM case */
5579c7f3 4270 ptr = qemu_get_ram_ptr(pd & TARGET_PAGE_MASK) +
84b7b8e7 4271 (addr & ~TARGET_PAGE_MASK);
1e78bcc1
AG
4272 switch (endian) {
4273 case DEVICE_LITTLE_ENDIAN:
4274 val = ldq_le_p(ptr);
4275 break;
4276 case DEVICE_BIG_ENDIAN:
4277 val = ldq_be_p(ptr);
4278 break;
4279 default:
4280 val = ldq_p(ptr);
4281 break;
4282 }
84b7b8e7
FB
4283 }
4284 return val;
4285}
4286
1e78bcc1
AG
4287uint64_t ldq_phys(target_phys_addr_t addr)
4288{
4289 return ldq_phys_internal(addr, DEVICE_NATIVE_ENDIAN);
4290}
4291
4292uint64_t ldq_le_phys(target_phys_addr_t addr)
4293{
4294 return ldq_phys_internal(addr, DEVICE_LITTLE_ENDIAN);
4295}
4296
4297uint64_t ldq_be_phys(target_phys_addr_t addr)
4298{
4299 return ldq_phys_internal(addr, DEVICE_BIG_ENDIAN);
4300}
4301
aab33094 4302/* XXX: optimize */
c227f099 4303uint32_t ldub_phys(target_phys_addr_t addr)
aab33094
FB
4304{
4305 uint8_t val;
4306 cpu_physical_memory_read(addr, &val, 1);
4307 return val;
4308}
4309
733f0b02 4310/* warning: addr must be aligned */
1e78bcc1
AG
4311static inline uint32_t lduw_phys_internal(target_phys_addr_t addr,
4312 enum device_endian endian)
aab33094 4313{
733f0b02
MT
4314 int io_index;
4315 uint8_t *ptr;
4316 uint64_t val;
4317 unsigned long pd;
4318 PhysPageDesc *p;
4319
4320 p = phys_page_find(addr >> TARGET_PAGE_BITS);
4321 if (!p) {
4322 pd = IO_MEM_UNASSIGNED;
4323 } else {
4324 pd = p->phys_offset;
4325 }
4326
4327 if ((pd & ~TARGET_PAGE_MASK) > IO_MEM_ROM &&
4328 !(pd & IO_MEM_ROMD)) {
4329 /* I/O case */
4330 io_index = (pd >> IO_MEM_SHIFT) & (IO_MEM_NB_ENTRIES - 1);
4331 if (p)
4332 addr = (addr & ~TARGET_PAGE_MASK) + p->region_offset;
4333 val = io_mem_read[io_index][1](io_mem_opaque[io_index], addr);
1e78bcc1
AG
4334#if defined(TARGET_WORDS_BIGENDIAN)
4335 if (endian == DEVICE_LITTLE_ENDIAN) {
4336 val = bswap16(val);
4337 }
4338#else
4339 if (endian == DEVICE_BIG_ENDIAN) {
4340 val = bswap16(val);
4341 }
4342#endif
733f0b02
MT
4343 } else {
4344 /* RAM case */
4345 ptr = qemu_get_ram_ptr(pd & TARGET_PAGE_MASK) +
4346 (addr & ~TARGET_PAGE_MASK);
1e78bcc1
AG
4347 switch (endian) {
4348 case DEVICE_LITTLE_ENDIAN:
4349 val = lduw_le_p(ptr);
4350 break;
4351 case DEVICE_BIG_ENDIAN:
4352 val = lduw_be_p(ptr);
4353 break;
4354 default:
4355 val = lduw_p(ptr);
4356 break;
4357 }
733f0b02
MT
4358 }
4359 return val;
aab33094
FB
4360}
4361
1e78bcc1
AG
4362uint32_t lduw_phys(target_phys_addr_t addr)
4363{
4364 return lduw_phys_internal(addr, DEVICE_NATIVE_ENDIAN);
4365}
4366
4367uint32_t lduw_le_phys(target_phys_addr_t addr)
4368{
4369 return lduw_phys_internal(addr, DEVICE_LITTLE_ENDIAN);
4370}
4371
4372uint32_t lduw_be_phys(target_phys_addr_t addr)
4373{
4374 return lduw_phys_internal(addr, DEVICE_BIG_ENDIAN);
4375}
4376
8df1cd07
FB
4377/* warning: addr must be aligned. The ram page is not masked as dirty
4378 and the code inside is not invalidated. It is useful if the dirty
4379 bits are used to track modified PTEs */
c227f099 4380void stl_phys_notdirty(target_phys_addr_t addr, uint32_t val)
8df1cd07
FB
4381{
4382 int io_index;
4383 uint8_t *ptr;
4384 unsigned long pd;
4385 PhysPageDesc *p;
4386
4387 p = phys_page_find(addr >> TARGET_PAGE_BITS);
4388 if (!p) {
4389 pd = IO_MEM_UNASSIGNED;
4390 } else {
4391 pd = p->phys_offset;
4392 }
3b46e624 4393
3a7d929e 4394 if ((pd & ~TARGET_PAGE_MASK) != IO_MEM_RAM) {
8df1cd07 4395 io_index = (pd >> IO_MEM_SHIFT) & (IO_MEM_NB_ENTRIES - 1);
8da3ff18
PB
4396 if (p)
4397 addr = (addr & ~TARGET_PAGE_MASK) + p->region_offset;
8df1cd07
FB
4398 io_mem_write[io_index][2](io_mem_opaque[io_index], addr, val);
4399 } else {
74576198 4400 unsigned long addr1 = (pd & TARGET_PAGE_MASK) + (addr & ~TARGET_PAGE_MASK);
5579c7f3 4401 ptr = qemu_get_ram_ptr(addr1);
8df1cd07 4402 stl_p(ptr, val);
74576198
AL
4403
4404 if (unlikely(in_migration)) {
4405 if (!cpu_physical_memory_is_dirty(addr1)) {
4406 /* invalidate code */
4407 tb_invalidate_phys_page_range(addr1, addr1 + 4, 0);
4408 /* set dirty bit */
f7c11b53
YT
4409 cpu_physical_memory_set_dirty_flags(
4410 addr1, (0xff & ~CODE_DIRTY_FLAG));
74576198
AL
4411 }
4412 }
8df1cd07
FB
4413 }
4414}
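/* Editor's sketch (illustrative, not from the original source): a target
 * MMU fault handler updating accessed/dirty bits in a guest page-table
 * entry without invalidating translated code; "pte_addr", "pte" and the
 * PG_* masks are stand-ins for target-specific names. */
#if 0
    pte |= PG_ACCESSED_MASK | PG_DIRTY_MASK;
    stl_phys_notdirty(pte_addr, pte);
#endif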
4415
c227f099 4416void stq_phys_notdirty(target_phys_addr_t addr, uint64_t val)
bc98a7ef
JM
4417{
4418 int io_index;
4419 uint8_t *ptr;
4420 unsigned long pd;
4421 PhysPageDesc *p;
4422
4423 p = phys_page_find(addr >> TARGET_PAGE_BITS);
4424 if (!p) {
4425 pd = IO_MEM_UNASSIGNED;
4426 } else {
4427 pd = p->phys_offset;
4428 }
3b46e624 4429
bc98a7ef
JM
4430 if ((pd & ~TARGET_PAGE_MASK) != IO_MEM_RAM) {
4431 io_index = (pd >> IO_MEM_SHIFT) & (IO_MEM_NB_ENTRIES - 1);
8da3ff18
PB
4432 if (p)
4433 addr = (addr & ~TARGET_PAGE_MASK) + p->region_offset;
bc98a7ef
JM
4434#ifdef TARGET_WORDS_BIGENDIAN
4435 io_mem_write[io_index][2](io_mem_opaque[io_index], addr, val >> 32);
4436 io_mem_write[io_index][2](io_mem_opaque[io_index], addr + 4, val);
4437#else
4438 io_mem_write[io_index][2](io_mem_opaque[io_index], addr, val);
4439 io_mem_write[io_index][2](io_mem_opaque[io_index], addr + 4, val >> 32);
4440#endif
4441 } else {
5579c7f3 4442 ptr = qemu_get_ram_ptr(pd & TARGET_PAGE_MASK) +
bc98a7ef
JM
4443 (addr & ~TARGET_PAGE_MASK);
4444 stq_p(ptr, val);
4445 }
4446}
4447
8df1cd07 4448/* warning: addr must be aligned */
1e78bcc1
AG
4449static inline void stl_phys_internal(target_phys_addr_t addr, uint32_t val,
4450 enum device_endian endian)
8df1cd07
FB
4451{
4452 int io_index;
4453 uint8_t *ptr;
4454 unsigned long pd;
4455 PhysPageDesc *p;
4456
4457 p = phys_page_find(addr >> TARGET_PAGE_BITS);
4458 if (!p) {
4459 pd = IO_MEM_UNASSIGNED;
4460 } else {
4461 pd = p->phys_offset;
4462 }
3b46e624 4463
3a7d929e 4464 if ((pd & ~TARGET_PAGE_MASK) != IO_MEM_RAM) {
8df1cd07 4465 io_index = (pd >> IO_MEM_SHIFT) & (IO_MEM_NB_ENTRIES - 1);
8da3ff18
PB
4466 if (p)
4467 addr = (addr & ~TARGET_PAGE_MASK) + p->region_offset;
1e78bcc1
AG
4468#if defined(TARGET_WORDS_BIGENDIAN)
4469 if (endian == DEVICE_LITTLE_ENDIAN) {
4470 val = bswap32(val);
4471 }
4472#else
4473 if (endian == DEVICE_BIG_ENDIAN) {
4474 val = bswap32(val);
4475 }
4476#endif
8df1cd07
FB
4477 io_mem_write[io_index][2](io_mem_opaque[io_index], addr, val);
4478 } else {
4479 unsigned long addr1;
4480 addr1 = (pd & TARGET_PAGE_MASK) + (addr & ~TARGET_PAGE_MASK);
4481 /* RAM case */
5579c7f3 4482 ptr = qemu_get_ram_ptr(addr1);
1e78bcc1
AG
4483 switch (endian) {
4484 case DEVICE_LITTLE_ENDIAN:
4485 stl_le_p(ptr, val);
4486 break;
4487 case DEVICE_BIG_ENDIAN:
4488 stl_be_p(ptr, val);
4489 break;
4490 default:
4491 stl_p(ptr, val);
4492 break;
4493 }
3a7d929e
FB
4494 if (!cpu_physical_memory_is_dirty(addr1)) {
4495 /* invalidate code */
4496 tb_invalidate_phys_page_range(addr1, addr1 + 4, 0);
4497 /* set dirty bit */
f7c11b53
YT
4498 cpu_physical_memory_set_dirty_flags(addr1,
4499 (0xff & ~CODE_DIRTY_FLAG));
3a7d929e 4500 }
8df1cd07
FB
4501 }
4502}
4503
1e78bcc1
AG
4504void stl_phys(target_phys_addr_t addr, uint32_t val)
4505{
4506 stl_phys_internal(addr, val, DEVICE_NATIVE_ENDIAN);
4507}
4508
4509void stl_le_phys(target_phys_addr_t addr, uint32_t val)
4510{
4511 stl_phys_internal(addr, val, DEVICE_LITTLE_ENDIAN);
4512}
4513
4514void stl_be_phys(target_phys_addr_t addr, uint32_t val)
4515{
4516 stl_phys_internal(addr, val, DEVICE_BIG_ENDIAN);
4517}
4518
aab33094 4519/* XXX: optimize */
c227f099 4520void stb_phys(target_phys_addr_t addr, uint32_t val)
aab33094
FB
4521{
4522 uint8_t v = val;
4523 cpu_physical_memory_write(addr, &v, 1);
4524}
4525
733f0b02 4526/* warning: addr must be aligned */
1e78bcc1
AG
4527static inline void stw_phys_internal(target_phys_addr_t addr, uint32_t val,
4528 enum device_endian endian)
aab33094 4529{
733f0b02
MT
4530 int io_index;
4531 uint8_t *ptr;
4532 unsigned long pd;
4533 PhysPageDesc *p;
4534
4535 p = phys_page_find(addr >> TARGET_PAGE_BITS);
4536 if (!p) {
4537 pd = IO_MEM_UNASSIGNED;
4538 } else {
4539 pd = p->phys_offset;
4540 }
4541
4542 if ((pd & ~TARGET_PAGE_MASK) != IO_MEM_RAM) {
4543 io_index = (pd >> IO_MEM_SHIFT) & (IO_MEM_NB_ENTRIES - 1);
4544 if (p)
4545 addr = (addr & ~TARGET_PAGE_MASK) + p->region_offset;
1e78bcc1
AG
4546#if defined(TARGET_WORDS_BIGENDIAN)
4547 if (endian == DEVICE_LITTLE_ENDIAN) {
4548 val = bswap16(val);
4549 }
4550#else
4551 if (endian == DEVICE_BIG_ENDIAN) {
4552 val = bswap16(val);
4553 }
4554#endif
733f0b02
MT
4555 io_mem_write[io_index][1](io_mem_opaque[io_index], addr, val);
4556 } else {
4557 unsigned long addr1;
4558 addr1 = (pd & TARGET_PAGE_MASK) + (addr & ~TARGET_PAGE_MASK);
4559 /* RAM case */
4560 ptr = qemu_get_ram_ptr(addr1);
1e78bcc1
AG
4561 switch (endian) {
4562 case DEVICE_LITTLE_ENDIAN:
4563 stw_le_p(ptr, val);
4564 break;
4565 case DEVICE_BIG_ENDIAN:
4566 stw_be_p(ptr, val);
4567 break;
4568 default:
4569 stw_p(ptr, val);
4570 break;
4571 }
733f0b02
MT
4572 if (!cpu_physical_memory_is_dirty(addr1)) {
4573 /* invalidate code */
4574 tb_invalidate_phys_page_range(addr1, addr1 + 2, 0);
4575 /* set dirty bit */
4576 cpu_physical_memory_set_dirty_flags(addr1,
4577 (0xff & ~CODE_DIRTY_FLAG));
4578 }
4579 }
aab33094
FB
4580}
4581
1e78bcc1
AG
4582void stw_phys(target_phys_addr_t addr, uint32_t val)
4583{
4584 stw_phys_internal(addr, val, DEVICE_NATIVE_ENDIAN);
4585}
4586
4587void stw_le_phys(target_phys_addr_t addr, uint32_t val)
4588{
4589 stw_phys_internal(addr, val, DEVICE_LITTLE_ENDIAN);
4590}
4591
4592void stw_be_phys(target_phys_addr_t addr, uint32_t val)
4593{
4594 stw_phys_internal(addr, val, DEVICE_BIG_ENDIAN);
4595}
4596
aab33094 4597/* XXX: optimize */
c227f099 4598void stq_phys(target_phys_addr_t addr, uint64_t val)
aab33094
FB
4599{
4600 val = tswap64(val);
71d2b725 4601 cpu_physical_memory_write(addr, &val, 8);
aab33094
FB
4602}
4603
1e78bcc1
AG
4604void stq_le_phys(target_phys_addr_t addr, uint64_t val)
4605{
4606 val = cpu_to_le64(val);
4607 cpu_physical_memory_write(addr, &val, 8);
4608}
4609
4610void stq_be_phys(target_phys_addr_t addr, uint64_t val)
4611{
4612 val = cpu_to_be64(val);
4613 cpu_physical_memory_write(addr, &val, 8);
4614}
4615
5e2972fd 4616/* virtual memory access for debug (includes writing to ROM) */
5fafdf24 4617int cpu_memory_rw_debug(CPUState *env, target_ulong addr,
b448f2f3 4618 uint8_t *buf, int len, int is_write)
13eb76e0
FB
4619{
4620 int l;
c227f099 4621 target_phys_addr_t phys_addr;
9b3c35e0 4622 target_ulong page;
13eb76e0
FB
4623
4624 while (len > 0) {
4625 page = addr & TARGET_PAGE_MASK;
4626 phys_addr = cpu_get_phys_page_debug(env, page);
4627 /* if no physical page mapped, return an error */
4628 if (phys_addr == -1)
4629 return -1;
4630 l = (page + TARGET_PAGE_SIZE) - addr;
4631 if (l > len)
4632 l = len;
5e2972fd 4633 phys_addr += (addr & ~TARGET_PAGE_MASK);
5e2972fd
AL
4634 if (is_write)
4635 cpu_physical_memory_write_rom(phys_addr, buf, l);
4636 else
5e2972fd 4637 cpu_physical_memory_rw(phys_addr, buf, l, is_write);
13eb76e0
FB
4638 len -= l;
4639 buf += l;
4640 addr += l;
4641 }
4642 return 0;
4643}
a68fe89c 4644#endif
13eb76e0 4645
2e70f6ef
PB
 4646/* in deterministic execution mode, instructions doing device I/O
4647 must be at the end of the TB */
4648void cpu_io_recompile(CPUState *env, void *retaddr)
4649{
4650 TranslationBlock *tb;
4651 uint32_t n, cflags;
4652 target_ulong pc, cs_base;
4653 uint64_t flags;
4654
4655 tb = tb_find_pc((unsigned long)retaddr);
4656 if (!tb) {
4657 cpu_abort(env, "cpu_io_recompile: could not find TB for pc=%p",
4658 retaddr);
4659 }
4660 n = env->icount_decr.u16.low + tb->icount;
618ba8e6 4661 cpu_restore_state(tb, env, (unsigned long)retaddr);
2e70f6ef 4662 /* Calculate how many instructions had been executed before the fault
bf20dc07 4663 occurred. */
2e70f6ef
PB
4664 n = n - env->icount_decr.u16.low;
4665 /* Generate a new TB ending on the I/O insn. */
4666 n++;
4667 /* On MIPS and SH, delay slot instructions can only be restarted if
4668 they were already the first instruction in the TB. If this is not
bf20dc07 4669 the first instruction in a TB then re-execute the preceding
2e70f6ef
PB
4670 branch. */
4671#if defined(TARGET_MIPS)
4672 if ((env->hflags & MIPS_HFLAG_BMASK) != 0 && n > 1) {
4673 env->active_tc.PC -= 4;
4674 env->icount_decr.u16.low++;
4675 env->hflags &= ~MIPS_HFLAG_BMASK;
4676 }
4677#elif defined(TARGET_SH4)
4678 if ((env->flags & ((DELAY_SLOT | DELAY_SLOT_CONDITIONAL))) != 0
4679 && n > 1) {
4680 env->pc -= 2;
4681 env->icount_decr.u16.low++;
4682 env->flags &= ~(DELAY_SLOT | DELAY_SLOT_CONDITIONAL);
4683 }
4684#endif
4685 /* This should never happen. */
4686 if (n > CF_COUNT_MASK)
4687 cpu_abort(env, "TB too big during recompile");
4688
4689 cflags = n | CF_LAST_IO;
4690 pc = tb->pc;
4691 cs_base = tb->cs_base;
4692 flags = tb->flags;
4693 tb_phys_invalidate(tb, -1);
4694 /* FIXME: In theory this could raise an exception. In practice
4695 we have already translated the block once so it's probably ok. */
4696 tb_gen_code(env, pc, cs_base, flags, cflags);
bf20dc07 4697 /* TODO: If env->pc != tb->pc (i.e. the faulting instruction was not
2e70f6ef
PB
4698 the first in the TB) then we end up generating a whole new TB and
4699 repeating the fault, which is horribly inefficient.
4700 Better would be to execute just this insn uncached, or generate a
4701 second new TB. */
4702 cpu_resume_from_signal(env, NULL);
4703}
4704
b3755a91
PB
4705#if !defined(CONFIG_USER_ONLY)
4706
055403b2 4707void dump_exec_info(FILE *f, fprintf_function cpu_fprintf)
e3db7226
FB
4708{
4709 int i, target_code_size, max_target_code_size;
4710 int direct_jmp_count, direct_jmp2_count, cross_page;
4711 TranslationBlock *tb;
3b46e624 4712
e3db7226
FB
4713 target_code_size = 0;
4714 max_target_code_size = 0;
4715 cross_page = 0;
4716 direct_jmp_count = 0;
4717 direct_jmp2_count = 0;
4718 for(i = 0; i < nb_tbs; i++) {
4719 tb = &tbs[i];
4720 target_code_size += tb->size;
4721 if (tb->size > max_target_code_size)
4722 max_target_code_size = tb->size;
4723 if (tb->page_addr[1] != -1)
4724 cross_page++;
4725 if (tb->tb_next_offset[0] != 0xffff) {
4726 direct_jmp_count++;
4727 if (tb->tb_next_offset[1] != 0xffff) {
4728 direct_jmp2_count++;
4729 }
4730 }
4731 }
4732 /* XXX: avoid using doubles ? */
57fec1fe 4733 cpu_fprintf(f, "Translation buffer state:\n");
055403b2 4734 cpu_fprintf(f, "gen code size %td/%ld\n",
26a5f13b
FB
4735 code_gen_ptr - code_gen_buffer, code_gen_buffer_max_size);
4736 cpu_fprintf(f, "TB count %d/%d\n",
4737 nb_tbs, code_gen_max_blocks);
5fafdf24 4738 cpu_fprintf(f, "TB avg target size %d max=%d bytes\n",
e3db7226
FB
4739 nb_tbs ? target_code_size / nb_tbs : 0,
4740 max_target_code_size);
055403b2 4741 cpu_fprintf(f, "TB avg host size %td bytes (expansion ratio: %0.1f)\n",
e3db7226
FB
4742 nb_tbs ? (code_gen_ptr - code_gen_buffer) / nb_tbs : 0,
4743 target_code_size ? (double) (code_gen_ptr - code_gen_buffer) / target_code_size : 0);
5fafdf24
TS
4744 cpu_fprintf(f, "cross page TB count %d (%d%%)\n",
4745 cross_page,
e3db7226
FB
4746 nb_tbs ? (cross_page * 100) / nb_tbs : 0);
4747 cpu_fprintf(f, "direct jump count %d (%d%%) (2 jumps=%d %d%%)\n",
5fafdf24 4748 direct_jmp_count,
e3db7226
FB
4749 nb_tbs ? (direct_jmp_count * 100) / nb_tbs : 0,
4750 direct_jmp2_count,
4751 nb_tbs ? (direct_jmp2_count * 100) / nb_tbs : 0);
57fec1fe 4752 cpu_fprintf(f, "\nStatistics:\n");
e3db7226
FB
4753 cpu_fprintf(f, "TB flush count %d\n", tb_flush_count);
4754 cpu_fprintf(f, "TB invalidate count %d\n", tb_phys_invalidate_count);
4755 cpu_fprintf(f, "TLB flush count %d\n", tlb_flush_count);
b67d9a52 4756 tcg_dump_info(f, cpu_fprintf);
e3db7226
FB
4757}
4758
61382a50
FB
4759#define MMUSUFFIX _cmmu
4760#define GETPC() NULL
4761#define env cpu_single_env
b769d8fe 4762#define SOFTMMU_CODE_ACCESS
61382a50
FB
4763
4764#define SHIFT 0
4765#include "softmmu_template.h"
4766
4767#define SHIFT 1
4768#include "softmmu_template.h"
4769
4770#define SHIFT 2
4771#include "softmmu_template.h"
4772
4773#define SHIFT 3
4774#include "softmmu_template.h"
4775
4776#undef env
4777
4778#endif