/*
 *  virtual page mapping and translated block handling
 *
 *  Copyright (c) 2003 Fabrice Bellard
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, see <http://www.gnu.org/licenses/>.
 */
#include "config.h"
#ifdef _WIN32
#include <windows.h>
#else
#include <sys/types.h>
#include <sys/mman.h>
#endif

#include "qemu-common.h"
#include "cpu.h"
#include "exec-all.h"
#include "tcg.h"
#include "hw/hw.h"
#include "hw/qdev.h"
#include "osdep.h"
#include "kvm.h"
#include "hw/xen.h"
#include "qemu-timer.h"
#if defined(CONFIG_USER_ONLY)
#include <qemu.h>
#include <signal.h>
#if defined(__FreeBSD__) || defined(__FreeBSD_kernel__)
#include <sys/param.h>
#if __FreeBSD_version >= 700104
#define HAVE_KINFO_GETVMMAP
#define sigqueue sigqueue_freebsd  /* avoid redefinition */
#include <sys/time.h>
#include <sys/proc.h>
#include <machine/profile.h>
#define _KERNEL
#include <sys/user.h>
#undef _KERNEL
#undef sigqueue
#include <libutil.h>
#endif
#endif
#else /* !CONFIG_USER_ONLY */
#include "xen-mapcache.h"
#endif

//#define DEBUG_TB_INVALIDATE
//#define DEBUG_FLUSH
//#define DEBUG_TLB
//#define DEBUG_UNASSIGNED

/* make various TB consistency checks */
//#define DEBUG_TB_CHECK
//#define DEBUG_TLB_CHECK

//#define DEBUG_IOPORT
//#define DEBUG_SUBPAGE

#if !defined(CONFIG_USER_ONLY)
/* TB consistency checks only implemented for usermode emulation.  */
#undef DEBUG_TB_CHECK
#endif

#define SMC_BITMAP_USE_THRESHOLD 10

static TranslationBlock *tbs;
static int code_gen_max_blocks;
TranslationBlock *tb_phys_hash[CODE_GEN_PHYS_HASH_SIZE];
static int nb_tbs;
/* any access to the tbs or the page table must use this lock */
spinlock_t tb_lock = SPIN_LOCK_UNLOCKED;

#if defined(__arm__) || defined(__sparc_v9__)
/* The prologue must be reachable with a direct jump.  ARM and Sparc64
   have limited branch ranges (possibly also PPC), so place it in a
   section close to the code segment. */
#define code_gen_section                                \
    __attribute__((__section__(".gen_code")))           \
    __attribute__((aligned (32)))
#elif defined(_WIN32)
/* Maximum alignment for Win32 is 16. */
#define code_gen_section                                \
    __attribute__((aligned (16)))
#else
#define code_gen_section                                \
    __attribute__((aligned (32)))
#endif

uint8_t code_gen_prologue[1024] code_gen_section;
static uint8_t *code_gen_buffer;
static unsigned long code_gen_buffer_size;
/* threshold to flush the translated code buffer */
static unsigned long code_gen_buffer_max_size;
static uint8_t *code_gen_ptr;

#if !defined(CONFIG_USER_ONLY)
int phys_ram_fd;
static int in_migration;

RAMList ram_list = { .blocks = QLIST_HEAD_INITIALIZER(ram_list) };
#endif

CPUState *first_cpu;
/* current CPU in the current thread. It is only valid inside
   cpu_exec() */
CPUState *cpu_single_env;
/* 0 = Do not count executed instructions.
   1 = Precise instruction counting.
   2 = Adaptive rate instruction counting.  */
int use_icount = 0;
/* Current instruction counter.  While executing translated code this may
   include some instructions that have not yet been executed. */
int64_t qemu_icount;

typedef struct PageDesc {
    /* list of TBs intersecting this ram page */
    TranslationBlock *first_tb;
    /* to optimize self-modifying code, we count the number of write
       lookups to a given page; past a threshold a bitmap is used */
    unsigned int code_write_count;
    uint8_t *code_bitmap;
#if defined(CONFIG_USER_ONLY)
    unsigned long flags;
#endif
} PageDesc;

/* In system mode we want L1_MAP to be based on ram offsets,
   while in user mode we want it to be based on virtual addresses.  */
#if !defined(CONFIG_USER_ONLY)
#if HOST_LONG_BITS < TARGET_PHYS_ADDR_SPACE_BITS
# define L1_MAP_ADDR_SPACE_BITS  HOST_LONG_BITS
#else
# define L1_MAP_ADDR_SPACE_BITS  TARGET_PHYS_ADDR_SPACE_BITS
#endif
#else
# define L1_MAP_ADDR_SPACE_BITS  TARGET_VIRT_ADDR_SPACE_BITS
#endif

/* Size of the L2 (and L3, etc) page tables.  */
#define L2_BITS 10
#define L2_SIZE (1 << L2_BITS)

/* The bits remaining after N lower levels of page tables.  */
#define P_L1_BITS_REM \
    ((TARGET_PHYS_ADDR_SPACE_BITS - TARGET_PAGE_BITS) % L2_BITS)
#define V_L1_BITS_REM \
    ((L1_MAP_ADDR_SPACE_BITS - TARGET_PAGE_BITS) % L2_BITS)

/* Size of the L1 page table.  Avoid silly small sizes.  */
#if P_L1_BITS_REM < 4
#define P_L1_BITS  (P_L1_BITS_REM + L2_BITS)
#else
#define P_L1_BITS  P_L1_BITS_REM
#endif

#if V_L1_BITS_REM < 4
#define V_L1_BITS  (V_L1_BITS_REM + L2_BITS)
#else
#define V_L1_BITS  V_L1_BITS_REM
#endif

#define P_L1_SIZE  ((target_phys_addr_t)1 << P_L1_BITS)
#define V_L1_SIZE  ((target_ulong)1 << V_L1_BITS)

#define P_L1_SHIFT (TARGET_PHYS_ADDR_SPACE_BITS - TARGET_PAGE_BITS - P_L1_BITS)
#define V_L1_SHIFT (L1_MAP_ADDR_SPACE_BITS - TARGET_PAGE_BITS - V_L1_BITS)

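/* Worked example (the exact values vary by target): with
   TARGET_PHYS_ADDR_SPACE_BITS = 36 and TARGET_PAGE_BITS = 12, 24 bits of
   page index remain.  24 % 10 leaves P_L1_BITS_REM = 4, which is not
   "silly small", so P_L1_BITS = 4: a 16-entry L1 table followed by two
   1024-entry levels (P_L1_SHIFT = 20), 4 + 10 + 10 = 24 index bits in
   total.  */
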
unsigned long qemu_real_host_page_size;
unsigned long qemu_host_page_bits;
unsigned long qemu_host_page_size;
unsigned long qemu_host_page_mask;

/* This is a multi-level map on the virtual address space.
   The bottom level has pointers to PageDesc.  */
static void *l1_map[V_L1_SIZE];

#if !defined(CONFIG_USER_ONLY)
typedef struct PhysPageDesc {
    /* offset in host memory of the page + io_index in the low bits */
    ram_addr_t phys_offset;
    ram_addr_t region_offset;
} PhysPageDesc;

/* This is a multi-level map on the physical address space.
   The bottom level has pointers to PhysPageDesc.  */
static void *l1_phys_map[P_L1_SIZE];

static void io_mem_init(void);

/* io memory support */
CPUWriteMemoryFunc *io_mem_write[IO_MEM_NB_ENTRIES][4];
CPUReadMemoryFunc *io_mem_read[IO_MEM_NB_ENTRIES][4];
void *io_mem_opaque[IO_MEM_NB_ENTRIES];
static char io_mem_used[IO_MEM_NB_ENTRIES];
static int io_mem_watch;
#endif

/* log support */
#ifdef WIN32
static const char *logfilename = "qemu.log";
#else
static const char *logfilename = "/tmp/qemu.log";
#endif
FILE *logfile;
int loglevel;
static int log_append = 0;

/* statistics */
#if !defined(CONFIG_USER_ONLY)
static int tlb_flush_count;
#endif
static int tb_flush_count;
static int tb_phys_invalidate_count;

#ifdef _WIN32
static void map_exec(void *addr, long size)
{
    DWORD old_protect;
    VirtualProtect(addr, size,
                   PAGE_EXECUTE_READWRITE, &old_protect);
}
#else
static void map_exec(void *addr, long size)
{
    unsigned long start, end, page_size;

    page_size = getpagesize();
    start = (unsigned long)addr;
    start &= ~(page_size - 1);

    end = (unsigned long)addr + size;
    end += page_size - 1;
    end &= ~(page_size - 1);

    mprotect((void *)start, end - start,
             PROT_READ | PROT_WRITE | PROT_EXEC);
}
#endif

static void page_init(void)
{
    /* NOTE: we can always suppose that qemu_host_page_size >=
       TARGET_PAGE_SIZE */
#ifdef _WIN32
    {
        SYSTEM_INFO system_info;

        GetSystemInfo(&system_info);
        qemu_real_host_page_size = system_info.dwPageSize;
    }
#else
    qemu_real_host_page_size = getpagesize();
#endif
    if (qemu_host_page_size == 0)
        qemu_host_page_size = qemu_real_host_page_size;
    if (qemu_host_page_size < TARGET_PAGE_SIZE)
        qemu_host_page_size = TARGET_PAGE_SIZE;
    qemu_host_page_bits = 0;
    while ((1 << qemu_host_page_bits) < qemu_host_page_size)
        qemu_host_page_bits++;
    qemu_host_page_mask = ~(qemu_host_page_size - 1);

#if defined(CONFIG_BSD) && defined(CONFIG_USER_ONLY)
    {
#ifdef HAVE_KINFO_GETVMMAP
        struct kinfo_vmentry *freep;
        int i, cnt;

        freep = kinfo_getvmmap(getpid(), &cnt);
        if (freep) {
            mmap_lock();
            for (i = 0; i < cnt; i++) {
                unsigned long startaddr, endaddr;

                startaddr = freep[i].kve_start;
                endaddr = freep[i].kve_end;
                if (h2g_valid(startaddr)) {
                    startaddr = h2g(startaddr) & TARGET_PAGE_MASK;

                    if (h2g_valid(endaddr)) {
                        endaddr = h2g(endaddr);
                        page_set_flags(startaddr, endaddr, PAGE_RESERVED);
                    } else {
#if TARGET_ABI_BITS <= L1_MAP_ADDR_SPACE_BITS
                        endaddr = ~0ul;
                        page_set_flags(startaddr, endaddr, PAGE_RESERVED);
#endif
                    }
                }
            }
            free(freep);
            mmap_unlock();
        }
#else
        FILE *f;

        last_brk = (unsigned long)sbrk(0);

        f = fopen("/compat/linux/proc/self/maps", "r");
        if (f) {
            mmap_lock();

            do {
                unsigned long startaddr, endaddr;
                int n;

                n = fscanf (f, "%lx-%lx %*[^\n]\n", &startaddr, &endaddr);

                if (n == 2 && h2g_valid(startaddr)) {
                    startaddr = h2g(startaddr) & TARGET_PAGE_MASK;

                    if (h2g_valid(endaddr)) {
                        endaddr = h2g(endaddr);
                    } else {
                        endaddr = ~0ul;
                    }
                    page_set_flags(startaddr, endaddr, PAGE_RESERVED);
                }
            } while (!feof(f));

            fclose(f);
            mmap_unlock();
        }
#endif
    }
#endif
}

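/* For illustration: on a typical 4 KiB host page, page_init() above leaves
   qemu_host_page_size = 0x1000, qemu_host_page_bits = 12 and
   qemu_host_page_mask = ~0xfffUL; when the target page is larger than the
   host page, the host values are rounded up to the target page size.  */
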
static PageDesc *page_find_alloc(tb_page_addr_t index, int alloc)
{
    PageDesc *pd;
    void **lp;
    int i;

#if defined(CONFIG_USER_ONLY)
    /* We can't use qemu_malloc because it may recurse into a locked mutex. */
# define ALLOC(P, SIZE)                                 \
    do {                                                \
        P = mmap(NULL, SIZE, PROT_READ | PROT_WRITE,    \
                 MAP_PRIVATE | MAP_ANONYMOUS, -1, 0);   \
    } while (0)
#else
# define ALLOC(P, SIZE) \
    do { P = qemu_mallocz(SIZE); } while (0)
#endif

    /* Level 1.  Always allocated.  */
    lp = l1_map + ((index >> V_L1_SHIFT) & (V_L1_SIZE - 1));

    /* Level 2..N-1.  */
    for (i = V_L1_SHIFT / L2_BITS - 1; i > 0; i--) {
        void **p = *lp;

        if (p == NULL) {
            if (!alloc) {
                return NULL;
            }
            ALLOC(p, sizeof(void *) * L2_SIZE);
            *lp = p;
        }

        lp = p + ((index >> (i * L2_BITS)) & (L2_SIZE - 1));
    }

    pd = *lp;
    if (pd == NULL) {
        if (!alloc) {
            return NULL;
        }
        ALLOC(pd, sizeof(PageDesc) * L2_SIZE);
        *lp = pd;
    }

#undef ALLOC

    return pd + (index & (L2_SIZE - 1));
}

static inline PageDesc *page_find(tb_page_addr_t index)
{
    return page_find_alloc(index, 0);
}

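/* Sketch of the lookup above: 'index' is a page number (callers pass
   addr >> TARGET_PAGE_BITS) whose top V_L1_BITS select the l1_map slot,
   each middle level consumes L2_BITS more, and the low L2_BITS index the
   leaf PageDesc array.  Intermediate tables are allocated lazily, so an
   unused address range costs no memory until it is first touched with
   alloc != 0.  */
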
#if !defined(CONFIG_USER_ONLY)
static PhysPageDesc *phys_page_find_alloc(target_phys_addr_t index, int alloc)
{
    PhysPageDesc *pd;
    void **lp;
    int i;

    /* Level 1.  Always allocated.  */
    lp = l1_phys_map + ((index >> P_L1_SHIFT) & (P_L1_SIZE - 1));

    /* Level 2..N-1.  */
    for (i = P_L1_SHIFT / L2_BITS - 1; i > 0; i--) {
        void **p = *lp;
        if (p == NULL) {
            if (!alloc) {
                return NULL;
            }
            *lp = p = qemu_mallocz(sizeof(void *) * L2_SIZE);
        }
        lp = p + ((index >> (i * L2_BITS)) & (L2_SIZE - 1));
    }

    pd = *lp;
    if (pd == NULL) {
        int i;

        if (!alloc) {
            return NULL;
        }

        *lp = pd = qemu_malloc(sizeof(PhysPageDesc) * L2_SIZE);

        for (i = 0; i < L2_SIZE; i++) {
            pd[i].phys_offset = IO_MEM_UNASSIGNED;
            pd[i].region_offset = (index + i) << TARGET_PAGE_BITS;
        }
    }

    return pd + (index & (L2_SIZE - 1));
}

static inline PhysPageDesc *phys_page_find(target_phys_addr_t index)
{
    return phys_page_find_alloc(index, 0);
}

static void tlb_protect_code(ram_addr_t ram_addr);
static void tlb_unprotect_code_phys(CPUState *env, ram_addr_t ram_addr,
                                    target_ulong vaddr);
#define mmap_lock() do { } while(0)
#define mmap_unlock() do { } while(0)
#endif

#define DEFAULT_CODE_GEN_BUFFER_SIZE (32 * 1024 * 1024)

#if defined(CONFIG_USER_ONLY)
/* Currently it is not recommended to allocate big chunks of data in
   user mode.  It will change when a dedicated libc is used.  */
#define USE_STATIC_CODE_GEN_BUFFER
#endif

#ifdef USE_STATIC_CODE_GEN_BUFFER
static uint8_t static_code_gen_buffer[DEFAULT_CODE_GEN_BUFFER_SIZE]
               __attribute__((aligned (CODE_GEN_ALIGN)));
#endif

static void code_gen_alloc(unsigned long tb_size)
{
#ifdef USE_STATIC_CODE_GEN_BUFFER
    code_gen_buffer = static_code_gen_buffer;
    code_gen_buffer_size = DEFAULT_CODE_GEN_BUFFER_SIZE;
    map_exec(code_gen_buffer, code_gen_buffer_size);
#else
    code_gen_buffer_size = tb_size;
    if (code_gen_buffer_size == 0) {
#if defined(CONFIG_USER_ONLY)
        /* in user mode, phys_ram_size is not meaningful */
        code_gen_buffer_size = DEFAULT_CODE_GEN_BUFFER_SIZE;
#else
        /* XXX: needs adjustments */
        code_gen_buffer_size = (unsigned long)(ram_size / 4);
#endif
    }
    if (code_gen_buffer_size < MIN_CODE_GEN_BUFFER_SIZE)
        code_gen_buffer_size = MIN_CODE_GEN_BUFFER_SIZE;
    /* The code gen buffer location may have constraints depending on
       the host cpu and OS */
#if defined(__linux__)
    {
        int flags;
        void *start = NULL;

        flags = MAP_PRIVATE | MAP_ANONYMOUS;
#if defined(__x86_64__)
        flags |= MAP_32BIT;
        /* Cannot map more than that */
        if (code_gen_buffer_size > (800 * 1024 * 1024))
            code_gen_buffer_size = (800 * 1024 * 1024);
#elif defined(__sparc_v9__)
        // Map the buffer below 2G, so we can use direct calls and branches
        flags |= MAP_FIXED;
        start = (void *) 0x60000000UL;
        if (code_gen_buffer_size > (512 * 1024 * 1024))
            code_gen_buffer_size = (512 * 1024 * 1024);
#elif defined(__arm__)
        /* Map the buffer below 32M, so we can use direct calls and branches */
        flags |= MAP_FIXED;
        start = (void *) 0x01000000UL;
        if (code_gen_buffer_size > 16 * 1024 * 1024)
            code_gen_buffer_size = 16 * 1024 * 1024;
#elif defined(__s390x__)
        /* Map the buffer so that we can use direct calls and branches.  */
        /* We have a +- 4GB range on the branches; leave some slop.  */
        if (code_gen_buffer_size > (3ul * 1024 * 1024 * 1024)) {
            code_gen_buffer_size = 3ul * 1024 * 1024 * 1024;
        }
        start = (void *)0x90000000UL;
#endif
        code_gen_buffer = mmap(start, code_gen_buffer_size,
                               PROT_WRITE | PROT_READ | PROT_EXEC,
                               flags, -1, 0);
        if (code_gen_buffer == MAP_FAILED) {
            fprintf(stderr, "Could not allocate dynamic translator buffer\n");
            exit(1);
        }
    }
#elif defined(__FreeBSD__) || defined(__FreeBSD_kernel__) \
    || defined(__DragonFly__) || defined(__OpenBSD__)
    {
        int flags;
        void *addr = NULL;
        flags = MAP_PRIVATE | MAP_ANONYMOUS;
#if defined(__x86_64__)
        /* FreeBSD doesn't have MAP_32BIT, use MAP_FIXED and assume
         * 0x40000000 is free */
        flags |= MAP_FIXED;
        addr = (void *)0x40000000;
        /* Cannot map more than that */
        if (code_gen_buffer_size > (800 * 1024 * 1024))
            code_gen_buffer_size = (800 * 1024 * 1024);
#elif defined(__sparc_v9__)
        // Map the buffer below 2G, so we can use direct calls and branches
        flags |= MAP_FIXED;
        addr = (void *) 0x60000000UL;
        if (code_gen_buffer_size > (512 * 1024 * 1024)) {
            code_gen_buffer_size = (512 * 1024 * 1024);
        }
#endif
        code_gen_buffer = mmap(addr, code_gen_buffer_size,
                               PROT_WRITE | PROT_READ | PROT_EXEC,
                               flags, -1, 0);
        if (code_gen_buffer == MAP_FAILED) {
            fprintf(stderr, "Could not allocate dynamic translator buffer\n");
            exit(1);
        }
    }
#else
    code_gen_buffer = qemu_malloc(code_gen_buffer_size);
    map_exec(code_gen_buffer, code_gen_buffer_size);
#endif
#endif /* !USE_STATIC_CODE_GEN_BUFFER */
    map_exec(code_gen_prologue, sizeof(code_gen_prologue));
    code_gen_buffer_max_size = code_gen_buffer_size -
        (TCG_MAX_OP_SIZE * OPC_MAX_SIZE);
    code_gen_max_blocks = code_gen_buffer_size / CODE_GEN_AVG_BLOCK_SIZE;
    tbs = qemu_malloc(code_gen_max_blocks * sizeof(TranslationBlock));
}
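
/* Sizing note (illustrative): in system mode the buffer defaults to
   ram_size / 4, capped per host architecture above, and
   code_gen_max_blocks is derived from the same size via
   CODE_GEN_AVG_BLOCK_SIZE, so the TB array and the code buffer tend to
   fill up at roughly the same rate before tb_flush() resets both.  */
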
/* Must be called before using the QEMU cpus. 'tb_size' is the size
   (in bytes) allocated to the translation buffer. Zero means default
   size. */
void cpu_exec_init_all(unsigned long tb_size)
{
    cpu_gen_init();
    code_gen_alloc(tb_size);
    code_gen_ptr = code_gen_buffer;
    page_init();
#if !defined(CONFIG_USER_ONLY)
    io_mem_init();
#endif
#if !defined(CONFIG_USER_ONLY) || !defined(CONFIG_USE_GUEST_BASE)
    /* There's no guest base to take into account, so go ahead and
       initialize the prologue now. */
    tcg_prologue_init(&tcg_ctx);
#endif
}

#if defined(CPU_SAVE_VERSION) && !defined(CONFIG_USER_ONLY)

static int cpu_common_post_load(void *opaque, int version_id)
{
    CPUState *env = opaque;

    /* 0x01 was CPU_INTERRUPT_EXIT. This line can be removed when the
       version_id is increased. */
    env->interrupt_request &= ~0x01;
    tlb_flush(env, 1);

    return 0;
}

static const VMStateDescription vmstate_cpu_common = {
    .name = "cpu_common",
    .version_id = 1,
    .minimum_version_id = 1,
    .minimum_version_id_old = 1,
    .post_load = cpu_common_post_load,
    .fields = (VMStateField []) {
        VMSTATE_UINT32(halted, CPUState),
        VMSTATE_UINT32(interrupt_request, CPUState),
        VMSTATE_END_OF_LIST()
    }
};
#endif

CPUState *qemu_get_cpu(int cpu)
{
    CPUState *env = first_cpu;

    while (env) {
        if (env->cpu_index == cpu)
            break;
        env = env->next_cpu;
    }

    return env;
}

void cpu_exec_init(CPUState *env)
{
    CPUState **penv;
    int cpu_index;

#if defined(CONFIG_USER_ONLY)
    cpu_list_lock();
#endif
    env->next_cpu = NULL;
    penv = &first_cpu;
    cpu_index = 0;
    while (*penv != NULL) {
        penv = &(*penv)->next_cpu;
        cpu_index++;
    }
    env->cpu_index = cpu_index;
    env->numa_node = 0;
    QTAILQ_INIT(&env->breakpoints);
    QTAILQ_INIT(&env->watchpoints);
#ifndef CONFIG_USER_ONLY
    env->thread_id = qemu_get_thread_id();
#endif
    *penv = env;
#if defined(CONFIG_USER_ONLY)
    cpu_list_unlock();
#endif
#if defined(CPU_SAVE_VERSION) && !defined(CONFIG_USER_ONLY)
    vmstate_register(NULL, cpu_index, &vmstate_cpu_common, env);
    register_savevm(NULL, "cpu", cpu_index, CPU_SAVE_VERSION,
                    cpu_save, cpu_load, env);
#endif
}

/* Allocate a new translation block. Flush the translation buffer if
   too many translation blocks or too much generated code. */
static TranslationBlock *tb_alloc(target_ulong pc)
{
    TranslationBlock *tb;

    if (nb_tbs >= code_gen_max_blocks ||
        (code_gen_ptr - code_gen_buffer) >= code_gen_buffer_max_size)
        return NULL;
    tb = &tbs[nb_tbs++];
    tb->pc = pc;
    tb->cflags = 0;
    return tb;
}

void tb_free(TranslationBlock *tb)
{
    /* In practice this is mostly used for single-use temporary TBs.
       Ignore the hard cases and just back up if this TB happens to
       be the last one generated.  */
    if (nb_tbs > 0 && tb == &tbs[nb_tbs - 1]) {
        code_gen_ptr = tb->tc_ptr;
        nb_tbs--;
    }
}

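/* Note: tbs[] is a simple bump allocator; there is no per-TB free list.
   tb_free() can only reclaim the most recently allocated block, and
   everything else is recycled wholesale by tb_flush().  */
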
static inline void invalidate_page_bitmap(PageDesc *p)
{
    if (p->code_bitmap) {
        qemu_free(p->code_bitmap);
        p->code_bitmap = NULL;
    }
    p->code_write_count = 0;
}

/* Set to NULL all the 'first_tb' fields in all PageDescs. */

static void page_flush_tb_1 (int level, void **lp)
{
    int i;

    if (*lp == NULL) {
        return;
    }
    if (level == 0) {
        PageDesc *pd = *lp;
        for (i = 0; i < L2_SIZE; ++i) {
            pd[i].first_tb = NULL;
            invalidate_page_bitmap(pd + i);
        }
    } else {
        void **pp = *lp;
        for (i = 0; i < L2_SIZE; ++i) {
            page_flush_tb_1 (level - 1, pp + i);
        }
    }
}

static void page_flush_tb(void)
{
    int i;
    for (i = 0; i < V_L1_SIZE; i++) {
        page_flush_tb_1(V_L1_SHIFT / L2_BITS - 1, l1_map + i);
    }
}

/* flush all the translation blocks */
/* XXX: tb_flush is currently not thread safe */
void tb_flush(CPUState *env1)
{
    CPUState *env;
#if defined(DEBUG_FLUSH)
    printf("qemu: flush code_size=%ld nb_tbs=%d avg_tb_size=%ld\n",
           (unsigned long)(code_gen_ptr - code_gen_buffer),
           nb_tbs, nb_tbs > 0 ?
           ((unsigned long)(code_gen_ptr - code_gen_buffer)) / nb_tbs : 0);
#endif
    if ((unsigned long)(code_gen_ptr - code_gen_buffer) > code_gen_buffer_size)
        cpu_abort(env1, "Internal error: code buffer overflow\n");

    nb_tbs = 0;

    for(env = first_cpu; env != NULL; env = env->next_cpu) {
        memset (env->tb_jmp_cache, 0, TB_JMP_CACHE_SIZE * sizeof (void *));
    }

    memset (tb_phys_hash, 0, CODE_GEN_PHYS_HASH_SIZE * sizeof (void *));
    page_flush_tb();

    code_gen_ptr = code_gen_buffer;
    /* XXX: flush processor icache at this point if cache flush is
       expensive */
    tb_flush_count++;
}

#ifdef DEBUG_TB_CHECK

static void tb_invalidate_check(target_ulong address)
{
    TranslationBlock *tb;
    int i;
    address &= TARGET_PAGE_MASK;
    for(i = 0;i < CODE_GEN_PHYS_HASH_SIZE; i++) {
        for(tb = tb_phys_hash[i]; tb != NULL; tb = tb->phys_hash_next) {
            if (!(address + TARGET_PAGE_SIZE <= tb->pc ||
                  address >= tb->pc + tb->size)) {
                printf("ERROR invalidate: address=" TARGET_FMT_lx
                       " PC=%08lx size=%04x\n",
                       address, (long)tb->pc, tb->size);
            }
        }
    }
}

/* verify that all the pages have correct rights for code */
static void tb_page_check(void)
{
    TranslationBlock *tb;
    int i, flags1, flags2;

    for(i = 0;i < CODE_GEN_PHYS_HASH_SIZE; i++) {
        for(tb = tb_phys_hash[i]; tb != NULL; tb = tb->phys_hash_next) {
            flags1 = page_get_flags(tb->pc);
            flags2 = page_get_flags(tb->pc + tb->size - 1);
            if ((flags1 & PAGE_WRITE) || (flags2 & PAGE_WRITE)) {
                printf("ERROR page flags: PC=%08lx size=%04x f1=%x f2=%x\n",
                       (long)tb->pc, tb->size, flags1, flags2);
            }
        }
    }
}

#endif

/* invalidate one TB */
static inline void tb_remove(TranslationBlock **ptb, TranslationBlock *tb,
                             int next_offset)
{
    TranslationBlock *tb1;
    for(;;) {
        tb1 = *ptb;
        if (tb1 == tb) {
            *ptb = *(TranslationBlock **)((char *)tb1 + next_offset);
            break;
        }
        ptb = (TranslationBlock **)((char *)tb1 + next_offset);
    }
}

static inline void tb_page_remove(TranslationBlock **ptb, TranslationBlock *tb)
{
    TranslationBlock *tb1;
    unsigned int n1;

    for(;;) {
        tb1 = *ptb;
        n1 = (long)tb1 & 3;
        tb1 = (TranslationBlock *)((long)tb1 & ~3);
        if (tb1 == tb) {
            *ptb = tb1->page_next[n1];
            break;
        }
        ptb = &tb1->page_next[n1];
    }
}

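/* Note on the '& 3' dance above and below: per-page TB list pointers are
   tagged in their two low bits with the page slot (0 or 1) that the TB
   occupies in that list, and jmp_first uses tag 2 as the end-of-list
   sentinel.  TBs are at least pointer-aligned, so the low bits are free
   to carry the tag.  */
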
static inline void tb_jmp_remove(TranslationBlock *tb, int n)
{
    TranslationBlock *tb1, **ptb;
    unsigned int n1;

    ptb = &tb->jmp_next[n];
    tb1 = *ptb;
    if (tb1) {
        /* find tb(n) in circular list */
        for(;;) {
            tb1 = *ptb;
            n1 = (long)tb1 & 3;
            tb1 = (TranslationBlock *)((long)tb1 & ~3);
            if (n1 == n && tb1 == tb)
                break;
            if (n1 == 2) {
                ptb = &tb1->jmp_first;
            } else {
                ptb = &tb1->jmp_next[n1];
            }
        }
        /* now we can suppress tb(n) from the list */
        *ptb = tb->jmp_next[n];

        tb->jmp_next[n] = NULL;
    }
}

/* reset the jump entry 'n' of a TB so that it is not chained to
   another TB */
static inline void tb_reset_jump(TranslationBlock *tb, int n)
{
    tb_set_jmp_target(tb, n, (unsigned long)(tb->tc_ptr + tb->tb_next_offset[n]));
}

void tb_phys_invalidate(TranslationBlock *tb, tb_page_addr_t page_addr)
{
    CPUState *env;
    PageDesc *p;
    unsigned int h, n1;
    tb_page_addr_t phys_pc;
    TranslationBlock *tb1, *tb2;

    /* remove the TB from the hash list */
    phys_pc = tb->page_addr[0] + (tb->pc & ~TARGET_PAGE_MASK);
    h = tb_phys_hash_func(phys_pc);
    tb_remove(&tb_phys_hash[h], tb,
              offsetof(TranslationBlock, phys_hash_next));

    /* remove the TB from the page list */
    if (tb->page_addr[0] != page_addr) {
        p = page_find(tb->page_addr[0] >> TARGET_PAGE_BITS);
        tb_page_remove(&p->first_tb, tb);
        invalidate_page_bitmap(p);
    }
    if (tb->page_addr[1] != -1 && tb->page_addr[1] != page_addr) {
        p = page_find(tb->page_addr[1] >> TARGET_PAGE_BITS);
        tb_page_remove(&p->first_tb, tb);
        invalidate_page_bitmap(p);
    }

    tb_invalidated_flag = 1;

    /* remove the TB from the hash list */
    h = tb_jmp_cache_hash_func(tb->pc);
    for(env = first_cpu; env != NULL; env = env->next_cpu) {
        if (env->tb_jmp_cache[h] == tb)
            env->tb_jmp_cache[h] = NULL;
    }

    /* suppress this TB from the two jump lists */
    tb_jmp_remove(tb, 0);
    tb_jmp_remove(tb, 1);

    /* suppress any remaining jumps to this TB */
    tb1 = tb->jmp_first;
    for(;;) {
        n1 = (long)tb1 & 3;
        if (n1 == 2)
            break;
        tb1 = (TranslationBlock *)((long)tb1 & ~3);
        tb2 = tb1->jmp_next[n1];
        tb_reset_jump(tb1, n1);
        tb1->jmp_next[n1] = NULL;
        tb1 = tb2;
    }
    tb->jmp_first = (TranslationBlock *)((long)tb | 2); /* fail safe */

    tb_phys_invalidate_count++;
}

static inline void set_bits(uint8_t *tab, int start, int len)
{
    int end, mask, end1;

    end = start + len;
    tab += start >> 3;
    mask = 0xff << (start & 7);
    if ((start & ~7) == (end & ~7)) {
        if (start < end) {
            mask &= ~(0xff << (end & 7));
            *tab |= mask;
        }
    } else {
        *tab++ |= mask;
        start = (start + 8) & ~7;
        end1 = end & ~7;
        while (start < end1) {
            *tab++ = 0xff;
            start += 8;
        }
        if (start < end) {
            mask = ~(0xff << (end & 7));
            *tab |= mask;
        }
    }
}

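/* For example, set_bits(tab, 3, 6) sets bits 3..8: the first byte gets
   mask 0xf8 (bits 3-7), the second byte gets bit 0, and any whole bytes
   in between would be filled with 0xff.  */
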
static void build_page_bitmap(PageDesc *p)
{
    int n, tb_start, tb_end;
    TranslationBlock *tb;

    p->code_bitmap = qemu_mallocz(TARGET_PAGE_SIZE / 8);

    tb = p->first_tb;
    while (tb != NULL) {
        n = (long)tb & 3;
        tb = (TranslationBlock *)((long)tb & ~3);
        /* NOTE: this is subtle as a TB may span two physical pages */
        if (n == 0) {
            /* NOTE: tb_end may be after the end of the page, but
               it is not a problem */
            tb_start = tb->pc & ~TARGET_PAGE_MASK;
            tb_end = tb_start + tb->size;
            if (tb_end > TARGET_PAGE_SIZE)
                tb_end = TARGET_PAGE_SIZE;
        } else {
            tb_start = 0;
            tb_end = ((tb->pc + tb->size) & ~TARGET_PAGE_MASK);
        }
        set_bits(p->code_bitmap, tb_start, tb_end - tb_start);
        tb = tb->page_next[n];
    }
}

TranslationBlock *tb_gen_code(CPUState *env,
                              target_ulong pc, target_ulong cs_base,
                              int flags, int cflags)
{
    TranslationBlock *tb;
    uint8_t *tc_ptr;
    tb_page_addr_t phys_pc, phys_page2;
    target_ulong virt_page2;
    int code_gen_size;

    phys_pc = get_page_addr_code(env, pc);
    tb = tb_alloc(pc);
    if (!tb) {
        /* flush must be done */
        tb_flush(env);
        /* cannot fail at this point */
        tb = tb_alloc(pc);
        /* Don't forget to invalidate previous TB info. */
        tb_invalidated_flag = 1;
    }
    tc_ptr = code_gen_ptr;
    tb->tc_ptr = tc_ptr;
    tb->cs_base = cs_base;
    tb->flags = flags;
    tb->cflags = cflags;
    cpu_gen_code(env, tb, &code_gen_size);
    code_gen_ptr = (void *)(((unsigned long)code_gen_ptr + code_gen_size + CODE_GEN_ALIGN - 1) & ~(CODE_GEN_ALIGN - 1));

    /* check next page if needed */
    virt_page2 = (pc + tb->size - 1) & TARGET_PAGE_MASK;
    phys_page2 = -1;
    if ((pc & TARGET_PAGE_MASK) != virt_page2) {
        phys_page2 = get_page_addr_code(env, virt_page2);
    }
    tb_link_page(tb, phys_pc, phys_page2);
    return tb;
}

/* invalidate all TBs which intersect with the target physical page
   starting in range [start;end[. NOTE: start and end must refer to
   the same physical page. 'is_cpu_write_access' should be true if called
   from a real cpu write access: the virtual CPU will exit the current
   TB if code is modified inside this TB. */
void tb_invalidate_phys_page_range(tb_page_addr_t start, tb_page_addr_t end,
                                   int is_cpu_write_access)
{
    TranslationBlock *tb, *tb_next, *saved_tb;
    CPUState *env = cpu_single_env;
    tb_page_addr_t tb_start, tb_end;
    PageDesc *p;
    int n;
#ifdef TARGET_HAS_PRECISE_SMC
    int current_tb_not_found = is_cpu_write_access;
    TranslationBlock *current_tb = NULL;
    int current_tb_modified = 0;
    target_ulong current_pc = 0;
    target_ulong current_cs_base = 0;
    int current_flags = 0;
#endif /* TARGET_HAS_PRECISE_SMC */

    p = page_find(start >> TARGET_PAGE_BITS);
    if (!p)
        return;
    if (!p->code_bitmap &&
        ++p->code_write_count >= SMC_BITMAP_USE_THRESHOLD &&
        is_cpu_write_access) {
        /* build code bitmap */
        build_page_bitmap(p);
    }

    /* we remove all the TBs in the range [start, end[ */
    /* XXX: see if in some cases it could be faster to invalidate all the code */
    tb = p->first_tb;
    while (tb != NULL) {
        n = (long)tb & 3;
        tb = (TranslationBlock *)((long)tb & ~3);
        tb_next = tb->page_next[n];
        /* NOTE: this is subtle as a TB may span two physical pages */
        if (n == 0) {
            /* NOTE: tb_end may be after the end of the page, but
               it is not a problem */
            tb_start = tb->page_addr[0] + (tb->pc & ~TARGET_PAGE_MASK);
            tb_end = tb_start + tb->size;
        } else {
            tb_start = tb->page_addr[1];
            tb_end = tb_start + ((tb->pc + tb->size) & ~TARGET_PAGE_MASK);
        }
        if (!(tb_end <= start || tb_start >= end)) {
#ifdef TARGET_HAS_PRECISE_SMC
            if (current_tb_not_found) {
                current_tb_not_found = 0;
                current_tb = NULL;
                if (env->mem_io_pc) {
                    /* now we have a real cpu fault */
                    current_tb = tb_find_pc(env->mem_io_pc);
                }
            }
            if (current_tb == tb &&
                (current_tb->cflags & CF_COUNT_MASK) != 1) {
                /* If we are modifying the current TB, we must stop
                   its execution. We could be more precise by checking
                   that the modification is after the current PC, but it
                   would require a specialized function to partially
                   restore the CPU state */

                current_tb_modified = 1;
                cpu_restore_state(current_tb, env, env->mem_io_pc);
                cpu_get_tb_cpu_state(env, &current_pc, &current_cs_base,
                                     &current_flags);
            }
#endif /* TARGET_HAS_PRECISE_SMC */
            /* we need to do that to handle the case where a signal
               occurs while doing tb_phys_invalidate() */
            saved_tb = NULL;
            if (env) {
                saved_tb = env->current_tb;
                env->current_tb = NULL;
            }
            tb_phys_invalidate(tb, -1);
            if (env) {
                env->current_tb = saved_tb;
                if (env->interrupt_request && env->current_tb)
                    cpu_interrupt(env, env->interrupt_request);
            }
        }
        tb = tb_next;
    }
#if !defined(CONFIG_USER_ONLY)
    /* if no code remaining, no need to continue to use slow writes */
    if (!p->first_tb) {
        invalidate_page_bitmap(p);
        if (is_cpu_write_access) {
            tlb_unprotect_code_phys(env, start, env->mem_io_vaddr);
        }
    }
#endif
#ifdef TARGET_HAS_PRECISE_SMC
    if (current_tb_modified) {
        /* we generate a block containing just the instruction
           modifying the memory. It will ensure that it cannot modify
           itself */
        env->current_tb = NULL;
        tb_gen_code(env, current_pc, current_cs_base, current_flags, 1);
        cpu_resume_from_signal(env, NULL);
    }
#endif
}

/* len must be <= 8 and start must be a multiple of len */
static inline void tb_invalidate_phys_page_fast(tb_page_addr_t start, int len)
{
    PageDesc *p;
    int offset, b;
#if 0
    if (1) {
        qemu_log("modifying code at 0x%x size=%d EIP=%x PC=%08x\n",
                  cpu_single_env->mem_io_vaddr, len,
                  cpu_single_env->eip,
                  cpu_single_env->eip + (long)cpu_single_env->segs[R_CS].base);
    }
#endif
    p = page_find(start >> TARGET_PAGE_BITS);
    if (!p)
        return;
    if (p->code_bitmap) {
        offset = start & ~TARGET_PAGE_MASK;
        b = p->code_bitmap[offset >> 3] >> (offset & 7);
        if (b & ((1 << len) - 1))
            goto do_invalidate;
    } else {
    do_invalidate:
        tb_invalidate_phys_page_range(start, start + len, 1);
    }
}

#if !defined(CONFIG_SOFTMMU)
static void tb_invalidate_phys_page(tb_page_addr_t addr,
                                    unsigned long pc, void *puc)
{
    TranslationBlock *tb;
    PageDesc *p;
    int n;
#ifdef TARGET_HAS_PRECISE_SMC
    TranslationBlock *current_tb = NULL;
    CPUState *env = cpu_single_env;
    int current_tb_modified = 0;
    target_ulong current_pc = 0;
    target_ulong current_cs_base = 0;
    int current_flags = 0;
#endif

    addr &= TARGET_PAGE_MASK;
    p = page_find(addr >> TARGET_PAGE_BITS);
    if (!p)
        return;
    tb = p->first_tb;
#ifdef TARGET_HAS_PRECISE_SMC
    if (tb && pc != 0) {
        current_tb = tb_find_pc(pc);
    }
#endif
    while (tb != NULL) {
        n = (long)tb & 3;
        tb = (TranslationBlock *)((long)tb & ~3);
#ifdef TARGET_HAS_PRECISE_SMC
        if (current_tb == tb &&
            (current_tb->cflags & CF_COUNT_MASK) != 1) {
            /* If we are modifying the current TB, we must stop
               its execution. We could be more precise by checking
               that the modification is after the current PC, but it
               would require a specialized function to partially
               restore the CPU state */

            current_tb_modified = 1;
            cpu_restore_state(current_tb, env, pc);
            cpu_get_tb_cpu_state(env, &current_pc, &current_cs_base,
                                 &current_flags);
        }
#endif /* TARGET_HAS_PRECISE_SMC */
        tb_phys_invalidate(tb, addr);
        tb = tb->page_next[n];
    }
    p->first_tb = NULL;
#ifdef TARGET_HAS_PRECISE_SMC
    if (current_tb_modified) {
        /* we generate a block containing just the instruction
           modifying the memory. It will ensure that it cannot modify
           itself */
        env->current_tb = NULL;
        tb_gen_code(env, current_pc, current_cs_base, current_flags, 1);
        cpu_resume_from_signal(env, puc);
    }
#endif
}
#endif

/* add the tb in the target page and protect it if necessary */
static inline void tb_alloc_page(TranslationBlock *tb,
                                 unsigned int n, tb_page_addr_t page_addr)
{
    PageDesc *p;
    TranslationBlock *last_first_tb;

    tb->page_addr[n] = page_addr;
    p = page_find_alloc(page_addr >> TARGET_PAGE_BITS, 1);
    tb->page_next[n] = p->first_tb;
    last_first_tb = p->first_tb;
    p->first_tb = (TranslationBlock *)((long)tb | n);
    invalidate_page_bitmap(p);

#if defined(TARGET_HAS_SMC) || 1

#if defined(CONFIG_USER_ONLY)
    if (p->flags & PAGE_WRITE) {
        target_ulong addr;
        PageDesc *p2;
        int prot;

        /* force the host page as non writable (writes will have a
           page fault + mprotect overhead) */
        page_addr &= qemu_host_page_mask;
        prot = 0;
        for(addr = page_addr; addr < page_addr + qemu_host_page_size;
            addr += TARGET_PAGE_SIZE) {

            p2 = page_find (addr >> TARGET_PAGE_BITS);
            if (!p2)
                continue;
            prot |= p2->flags;
            p2->flags &= ~PAGE_WRITE;
        }
        mprotect(g2h(page_addr), qemu_host_page_size,
                 (prot & PAGE_BITS) & ~PAGE_WRITE);
#ifdef DEBUG_TB_INVALIDATE
        printf("protecting code page: 0x" TARGET_FMT_lx "\n",
               page_addr);
#endif
    }
#else
    /* if some code is already present, then the pages are already
       protected. So we handle the case where only the first TB is
       allocated in a physical page */
    if (!last_first_tb) {
        tlb_protect_code(page_addr);
    }
#endif

#endif /* TARGET_HAS_SMC */
}

/* add a new TB and link it to the physical page tables. phys_page2 is
   (-1) to indicate that only one page contains the TB. */
void tb_link_page(TranslationBlock *tb,
                  tb_page_addr_t phys_pc, tb_page_addr_t phys_page2)
{
    unsigned int h;
    TranslationBlock **ptb;

    /* Grab the mmap lock to stop another thread invalidating this TB
       before we are done.  */
    mmap_lock();
    /* add in the physical hash table */
    h = tb_phys_hash_func(phys_pc);
    ptb = &tb_phys_hash[h];
    tb->phys_hash_next = *ptb;
    *ptb = tb;

    /* add in the page list */
    tb_alloc_page(tb, 0, phys_pc & TARGET_PAGE_MASK);
    if (phys_page2 != -1)
        tb_alloc_page(tb, 1, phys_page2);
    else
        tb->page_addr[1] = -1;

    tb->jmp_first = (TranslationBlock *)((long)tb | 2);
    tb->jmp_next[0] = NULL;
    tb->jmp_next[1] = NULL;

    /* init original jump addresses */
    if (tb->tb_next_offset[0] != 0xffff)
        tb_reset_jump(tb, 0);
    if (tb->tb_next_offset[1] != 0xffff)
        tb_reset_jump(tb, 1);

#ifdef DEBUG_TB_CHECK
    tb_page_check();
#endif
    mmap_unlock();
}

/* find the TB 'tb' such that tb[0].tc_ptr <= tc_ptr <
   tb[1].tc_ptr. Return NULL if not found */
TranslationBlock *tb_find_pc(unsigned long tc_ptr)
{
    int m_min, m_max, m;
    unsigned long v;
    TranslationBlock *tb;

    if (nb_tbs <= 0)
        return NULL;
    if (tc_ptr < (unsigned long)code_gen_buffer ||
        tc_ptr >= (unsigned long)code_gen_ptr)
        return NULL;
    /* binary search (cf Knuth) */
    m_min = 0;
    m_max = nb_tbs - 1;
    while (m_min <= m_max) {
        m = (m_min + m_max) >> 1;
        tb = &tbs[m];
        v = (unsigned long)tb->tc_ptr;
        if (v == tc_ptr)
            return tb;
        else if (tc_ptr < v) {
            m_max = m - 1;
        } else {
            m_min = m + 1;
        }
    }
    return &tbs[m_max];
}

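/* The binary search works because tbs[] is filled in generation order and
   code_gen_ptr only grows between flushes, so tc_ptr values increase with
   the index.  When no exact match is found, &tbs[m_max] is the last TB
   starting at or below tc_ptr, i.e. the one containing it.  */
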
static void tb_reset_jump_recursive(TranslationBlock *tb);

static inline void tb_reset_jump_recursive2(TranslationBlock *tb, int n)
{
    TranslationBlock *tb1, *tb_next, **ptb;
    unsigned int n1;

    tb1 = tb->jmp_next[n];
    if (tb1 != NULL) {
        /* find head of list */
        for(;;) {
            n1 = (long)tb1 & 3;
            tb1 = (TranslationBlock *)((long)tb1 & ~3);
            if (n1 == 2)
                break;
            tb1 = tb1->jmp_next[n1];
        }
        /* we are now sure that tb jumps to tb1 */
        tb_next = tb1;

        /* remove tb from the jmp_first list */
        ptb = &tb_next->jmp_first;
        for(;;) {
            tb1 = *ptb;
            n1 = (long)tb1 & 3;
            tb1 = (TranslationBlock *)((long)tb1 & ~3);
            if (n1 == n && tb1 == tb)
                break;
            ptb = &tb1->jmp_next[n1];
        }
        *ptb = tb->jmp_next[n];
        tb->jmp_next[n] = NULL;

        /* suppress the jump to next tb in generated code */
        tb_reset_jump(tb, n);

        /* suppress jumps in the tb on which we could have jumped */
        tb_reset_jump_recursive(tb_next);
    }
}

static void tb_reset_jump_recursive(TranslationBlock *tb)
{
    tb_reset_jump_recursive2(tb, 0);
    tb_reset_jump_recursive2(tb, 1);
}

#if defined(TARGET_HAS_ICE)
#if defined(CONFIG_USER_ONLY)
static void breakpoint_invalidate(CPUState *env, target_ulong pc)
{
    tb_invalidate_phys_page_range(pc, pc + 1, 0);
}
#else
static void breakpoint_invalidate(CPUState *env, target_ulong pc)
{
    target_phys_addr_t addr;
    target_ulong pd;
    ram_addr_t ram_addr;
    PhysPageDesc *p;

    addr = cpu_get_phys_page_debug(env, pc);
    p = phys_page_find(addr >> TARGET_PAGE_BITS);
    if (!p) {
        pd = IO_MEM_UNASSIGNED;
    } else {
        pd = p->phys_offset;
    }
    ram_addr = (pd & TARGET_PAGE_MASK) | (pc & ~TARGET_PAGE_MASK);
    tb_invalidate_phys_page_range(ram_addr, ram_addr + 1, 0);
}
#endif
#endif /* TARGET_HAS_ICE */

#if defined(CONFIG_USER_ONLY)
void cpu_watchpoint_remove_all(CPUState *env, int mask)
{
}

int cpu_watchpoint_insert(CPUState *env, target_ulong addr, target_ulong len,
                          int flags, CPUWatchpoint **watchpoint)
{
    return -ENOSYS;
}
#else
/* Add a watchpoint.  */
int cpu_watchpoint_insert(CPUState *env, target_ulong addr, target_ulong len,
                          int flags, CPUWatchpoint **watchpoint)
{
    target_ulong len_mask = ~(len - 1);
    CPUWatchpoint *wp;

    /* sanity checks: allow power-of-2 lengths, deny unaligned watchpoints */
    if ((len != 1 && len != 2 && len != 4 && len != 8) || (addr & ~len_mask)) {
        fprintf(stderr, "qemu: tried to set invalid watchpoint at "
                TARGET_FMT_lx ", len=" TARGET_FMT_lu "\n", addr, len);
        return -EINVAL;
    }
    wp = qemu_malloc(sizeof(*wp));

    wp->vaddr = addr;
    wp->len_mask = len_mask;
    wp->flags = flags;

    /* keep all GDB-injected watchpoints in front */
    if (flags & BP_GDB)
        QTAILQ_INSERT_HEAD(&env->watchpoints, wp, entry);
    else
        QTAILQ_INSERT_TAIL(&env->watchpoints, wp, entry);

    tlb_flush_page(env, addr);

    if (watchpoint)
        *watchpoint = wp;
    return 0;
}

/* Remove a specific watchpoint.  */
int cpu_watchpoint_remove(CPUState *env, target_ulong addr, target_ulong len,
                          int flags)
{
    target_ulong len_mask = ~(len - 1);
    CPUWatchpoint *wp;

    QTAILQ_FOREACH(wp, &env->watchpoints, entry) {
        if (addr == wp->vaddr && len_mask == wp->len_mask
                && flags == (wp->flags & ~BP_WATCHPOINT_HIT)) {
            cpu_watchpoint_remove_by_ref(env, wp);
            return 0;
        }
    }
    return -ENOENT;
}

/* Remove a specific watchpoint by reference.  */
void cpu_watchpoint_remove_by_ref(CPUState *env, CPUWatchpoint *watchpoint)
{
    QTAILQ_REMOVE(&env->watchpoints, watchpoint, entry);

    tlb_flush_page(env, watchpoint->vaddr);

    qemu_free(watchpoint);
}

/* Remove all matching watchpoints.  */
void cpu_watchpoint_remove_all(CPUState *env, int mask)
{
    CPUWatchpoint *wp, *next;

    QTAILQ_FOREACH_SAFE(wp, &env->watchpoints, entry, next) {
        if (wp->flags & mask)
            cpu_watchpoint_remove_by_ref(env, wp);
    }
}
#endif

/* Add a breakpoint.  */
int cpu_breakpoint_insert(CPUState *env, target_ulong pc, int flags,
                          CPUBreakpoint **breakpoint)
{
#if defined(TARGET_HAS_ICE)
    CPUBreakpoint *bp;

    bp = qemu_malloc(sizeof(*bp));

    bp->pc = pc;
    bp->flags = flags;

    /* keep all GDB-injected breakpoints in front */
    if (flags & BP_GDB)
        QTAILQ_INSERT_HEAD(&env->breakpoints, bp, entry);
    else
        QTAILQ_INSERT_TAIL(&env->breakpoints, bp, entry);

    breakpoint_invalidate(env, pc);

    if (breakpoint)
        *breakpoint = bp;
    return 0;
#else
    return -ENOSYS;
#endif
}

/* Remove a specific breakpoint.  */
int cpu_breakpoint_remove(CPUState *env, target_ulong pc, int flags)
{
#if defined(TARGET_HAS_ICE)
    CPUBreakpoint *bp;

    QTAILQ_FOREACH(bp, &env->breakpoints, entry) {
        if (bp->pc == pc && bp->flags == flags) {
            cpu_breakpoint_remove_by_ref(env, bp);
            return 0;
        }
    }
    return -ENOENT;
#else
    return -ENOSYS;
#endif
}

/* Remove a specific breakpoint by reference.  */
void cpu_breakpoint_remove_by_ref(CPUState *env, CPUBreakpoint *breakpoint)
{
#if defined(TARGET_HAS_ICE)
    QTAILQ_REMOVE(&env->breakpoints, breakpoint, entry);

    breakpoint_invalidate(env, breakpoint->pc);

    qemu_free(breakpoint);
#endif
}

/* Remove all matching breakpoints. */
void cpu_breakpoint_remove_all(CPUState *env, int mask)
{
#if defined(TARGET_HAS_ICE)
    CPUBreakpoint *bp, *next;

    QTAILQ_FOREACH_SAFE(bp, &env->breakpoints, entry, next) {
        if (bp->flags & mask)
            cpu_breakpoint_remove_by_ref(env, bp);
    }
#endif
}

/* enable or disable single step mode. EXCP_DEBUG is returned by the
   CPU loop after each instruction */
void cpu_single_step(CPUState *env, int enabled)
{
#if defined(TARGET_HAS_ICE)
    if (env->singlestep_enabled != enabled) {
        env->singlestep_enabled = enabled;
        if (kvm_enabled())
            kvm_update_guest_debug(env, 0);
        else {
            /* must flush all the translated code to avoid inconsistencies */
            /* XXX: only flush what is necessary */
            tb_flush(env);
        }
    }
#endif
}

/* enable or disable low level logs */
void cpu_set_log(int log_flags)
{
    loglevel = log_flags;
    if (loglevel && !logfile) {
        logfile = fopen(logfilename, log_append ? "a" : "w");
        if (!logfile) {
            perror(logfilename);
            _exit(1);
        }
#if !defined(CONFIG_SOFTMMU)
        /* must avoid mmap() usage of glibc by setting a buffer "by hand" */
        {
            static char logfile_buf[4096];
            setvbuf(logfile, logfile_buf, _IOLBF, sizeof(logfile_buf));
        }
#elif !defined(_WIN32)
        /* Win32 doesn't support line-buffering and requires size >= 2 */
        setvbuf(logfile, NULL, _IOLBF, 0);
#endif
        log_append = 1;
    }
    if (!loglevel && logfile) {
        fclose(logfile);
        logfile = NULL;
    }
}

void cpu_set_log_filename(const char *filename)
{
    logfilename = strdup(filename);
    if (logfile) {
        fclose(logfile);
        logfile = NULL;
    }
    cpu_set_log(loglevel);
}

static void cpu_unlink_tb(CPUState *env)
{
    /* FIXME: TB unchaining isn't SMP safe.  For now just ignore the
       problem and hope the cpu will stop of its own accord.  For userspace
       emulation this often isn't actually as bad as it sounds.  Often
       signals are used primarily to interrupt blocking syscalls.  */
    TranslationBlock *tb;
    static spinlock_t interrupt_lock = SPIN_LOCK_UNLOCKED;

    spin_lock(&interrupt_lock);
    tb = env->current_tb;
    /* if the cpu is currently executing code, we must unlink it and
       all the potentially executing TB */
    if (tb) {
        env->current_tb = NULL;
        tb_reset_jump_recursive(tb);
    }
    spin_unlock(&interrupt_lock);
}

#ifndef CONFIG_USER_ONLY
/* mask must never be zero, except for A20 change call */
static void tcg_handle_interrupt(CPUState *env, int mask)
{
    int old_mask;

    old_mask = env->interrupt_request;
    env->interrupt_request |= mask;

    /*
     * If called from iothread context, wake the target cpu in
     * case it's halted.
     */
    if (!qemu_cpu_is_self(env)) {
        qemu_cpu_kick(env);
        return;
    }

    if (use_icount) {
        env->icount_decr.u16.high = 0xffff;
        if (!can_do_io(env)
            && (mask & ~old_mask) != 0) {
            cpu_abort(env, "Raised interrupt while not in I/O function");
        }
    } else {
        cpu_unlink_tb(env);
    }
}

CPUInterruptHandler cpu_interrupt_handler = tcg_handle_interrupt;

#else /* CONFIG_USER_ONLY */

void cpu_interrupt(CPUState *env, int mask)
{
    env->interrupt_request |= mask;
    cpu_unlink_tb(env);
}
#endif /* CONFIG_USER_ONLY */

void cpu_reset_interrupt(CPUState *env, int mask)
{
    env->interrupt_request &= ~mask;
}

void cpu_exit(CPUState *env)
{
    env->exit_request = 1;
    cpu_unlink_tb(env);
}

const CPULogItem cpu_log_items[] = {
    { CPU_LOG_TB_OUT_ASM, "out_asm",
      "show generated host assembly code for each compiled TB" },
    { CPU_LOG_TB_IN_ASM, "in_asm",
      "show target assembly code for each compiled TB" },
    { CPU_LOG_TB_OP, "op",
      "show micro ops for each compiled TB" },
    { CPU_LOG_TB_OP_OPT, "op_opt",
      "show micro ops "
#ifdef TARGET_I386
      "before eflags optimization and "
#endif
      "after liveness analysis" },
    { CPU_LOG_INT, "int",
      "show interrupts/exceptions in short format" },
    { CPU_LOG_EXEC, "exec",
      "show trace before each executed TB (lots of logs)" },
    { CPU_LOG_TB_CPU, "cpu",
      "show CPU state before block translation" },
#ifdef TARGET_I386
    { CPU_LOG_PCALL, "pcall",
      "show protected mode far calls/returns/exceptions" },
    { CPU_LOG_RESET, "cpu_reset",
      "show CPU state before CPU resets" },
#endif
#ifdef DEBUG_IOPORT
    { CPU_LOG_IOPORT, "ioport",
      "show all i/o ports accesses" },
#endif
    { 0, NULL, NULL },
};

f6f3fbca
MT
1718#ifndef CONFIG_USER_ONLY
1719static QLIST_HEAD(memory_client_list, CPUPhysMemoryClient) memory_client_list
1720 = QLIST_HEAD_INITIALIZER(memory_client_list);
1721
1722static void cpu_notify_set_memory(target_phys_addr_t start_addr,
9742bf26 1723 ram_addr_t size,
0fd542fb
MT
1724 ram_addr_t phys_offset,
1725 bool log_dirty)
f6f3fbca
MT
1726{
1727 CPUPhysMemoryClient *client;
1728 QLIST_FOREACH(client, &memory_client_list, list) {
0fd542fb 1729 client->set_memory(client, start_addr, size, phys_offset, log_dirty);
f6f3fbca
MT
1730 }
1731}
1732
1733static int cpu_notify_sync_dirty_bitmap(target_phys_addr_t start,
9742bf26 1734 target_phys_addr_t end)
f6f3fbca
MT
1735{
1736 CPUPhysMemoryClient *client;
1737 QLIST_FOREACH(client, &memory_client_list, list) {
1738 int r = client->sync_dirty_bitmap(client, start, end);
1739 if (r < 0)
1740 return r;
1741 }
1742 return 0;
1743}
1744
1745static int cpu_notify_migration_log(int enable)
1746{
1747 CPUPhysMemoryClient *client;
1748 QLIST_FOREACH(client, &memory_client_list, list) {
1749 int r = client->migration_log(client, enable);
1750 if (r < 0)
1751 return r;
1752 }
1753 return 0;
1754}
1755
8d4c78e7
AW
1756/* The l1_phys_map provides the upper P_L1_BITs of the guest physical
1757 * address. Each intermediate table provides the next L2_BITs of guest
 1758 * physical address space. The number of levels varies based on host and
1759 * guest configuration, making it efficient to build the final guest
1760 * physical address by seeding the L1 offset and shifting and adding in
1761 * each L2 offset as we recurse through them. */
5cd2c5b6 1762static void phys_page_for_each_1(CPUPhysMemoryClient *client,
8d4c78e7 1763 int level, void **lp, target_phys_addr_t addr)
f6f3fbca 1764{
5cd2c5b6 1765 int i;
f6f3fbca 1766
5cd2c5b6
RH
1767 if (*lp == NULL) {
1768 return;
1769 }
1770 if (level == 0) {
1771 PhysPageDesc *pd = *lp;
8d4c78e7 1772 addr <<= L2_BITS + TARGET_PAGE_BITS;
7296abac 1773 for (i = 0; i < L2_SIZE; ++i) {
5cd2c5b6 1774 if (pd[i].phys_offset != IO_MEM_UNASSIGNED) {
8d4c78e7 1775 client->set_memory(client, addr | i << TARGET_PAGE_BITS,
0fd542fb 1776 TARGET_PAGE_SIZE, pd[i].phys_offset, false);
f6f3fbca 1777 }
5cd2c5b6
RH
1778 }
1779 } else {
1780 void **pp = *lp;
7296abac 1781 for (i = 0; i < L2_SIZE; ++i) {
8d4c78e7
AW
1782 phys_page_for_each_1(client, level - 1, pp + i,
1783 (addr << L2_BITS) | i);
f6f3fbca
MT
1784 }
1785 }
1786}
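/* Worked example (assumed values: a two-level table with L2_BITS == 10):
 * starting the recursion with L1 index 3, taking intermediate entry 7 and
 * leaf entry i == 5 accumulates
 *     intermediate: addr = (3 << 10) | 7
 *     leaf:         addr <<= 10 + TARGET_PAGE_BITS;
 *                   guest physical = addr | (5 << TARGET_PAGE_BITS)
 * i.e. the per-level indices are concatenated above the page offset, as the
 * comment before phys_page_for_each_1() describes.
 */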
1787
1788static void phys_page_for_each(CPUPhysMemoryClient *client)
1789{
5cd2c5b6
RH
1790 int i;
1791 for (i = 0; i < P_L1_SIZE; ++i) {
1792 phys_page_for_each_1(client, P_L1_SHIFT / L2_BITS - 1,
8d4c78e7 1793 l1_phys_map + i, i);
f6f3fbca 1794 }
f6f3fbca
MT
1795}
1796
1797void cpu_register_phys_memory_client(CPUPhysMemoryClient *client)
1798{
1799 QLIST_INSERT_HEAD(&memory_client_list, client, list);
1800 phys_page_for_each(client);
1801}
1802
1803void cpu_unregister_phys_memory_client(CPUPhysMemoryClient *client)
1804{
1805 QLIST_REMOVE(client, list);
1806}
1807#endif
1808
f193c797
FB
1809static int cmp1(const char *s1, int n, const char *s2)
1810{
1811 if (strlen(s2) != n)
1812 return 0;
1813 return memcmp(s1, s2, n) == 0;
1814}
3b46e624 1815
f193c797
FB
1816/* takes a comma separated list of log masks. Return 0 if error. */
1817int cpu_str_to_log_mask(const char *str)
1818{
c7cd6a37 1819 const CPULogItem *item;
f193c797
FB
1820 int mask;
1821 const char *p, *p1;
1822
1823 p = str;
1824 mask = 0;
1825 for(;;) {
1826 p1 = strchr(p, ',');
1827 if (!p1)
1828 p1 = p + strlen(p);
9742bf26
YT
1829 if(cmp1(p,p1-p,"all")) {
1830 for(item = cpu_log_items; item->mask != 0; item++) {
1831 mask |= item->mask;
1832 }
1833 } else {
1834 for(item = cpu_log_items; item->mask != 0; item++) {
1835 if (cmp1(p, p1 - p, item->name))
1836 goto found;
1837 }
1838 return 0;
f193c797 1839 }
f193c797
FB
1840 found:
1841 mask |= item->mask;
1842 if (*p1 != ',')
1843 break;
1844 p = p1 + 1;
1845 }
1846 return mask;
1847}
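/* Example (hypothetical input): cpu_str_to_log_mask("in_asm,exec") returns
 * CPU_LOG_TB_IN_ASM | CPU_LOG_EXEC; "all" ORs in every mask from
 * cpu_log_items; any unrecognized name makes the whole call return 0.
 */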
ea041c0e 1848
7501267e
FB
1849void cpu_abort(CPUState *env, const char *fmt, ...)
1850{
1851 va_list ap;
493ae1f0 1852 va_list ap2;
7501267e
FB
1853
1854 va_start(ap, fmt);
493ae1f0 1855 va_copy(ap2, ap);
7501267e
FB
1856 fprintf(stderr, "qemu: fatal: ");
1857 vfprintf(stderr, fmt, ap);
1858 fprintf(stderr, "\n");
1859#ifdef TARGET_I386
7fe48483
FB
1860 cpu_dump_state(env, stderr, fprintf, X86_DUMP_FPU | X86_DUMP_CCOP);
1861#else
1862 cpu_dump_state(env, stderr, fprintf, 0);
7501267e 1863#endif
93fcfe39
AL
1864 if (qemu_log_enabled()) {
1865 qemu_log("qemu: fatal: ");
1866 qemu_log_vprintf(fmt, ap2);
1867 qemu_log("\n");
f9373291 1868#ifdef TARGET_I386
93fcfe39 1869 log_cpu_state(env, X86_DUMP_FPU | X86_DUMP_CCOP);
f9373291 1870#else
93fcfe39 1871 log_cpu_state(env, 0);
f9373291 1872#endif
31b1a7b4 1873 qemu_log_flush();
93fcfe39 1874 qemu_log_close();
924edcae 1875 }
493ae1f0 1876 va_end(ap2);
f9373291 1877 va_end(ap);
fd052bf6
RV
1878#if defined(CONFIG_USER_ONLY)
1879 {
1880 struct sigaction act;
1881 sigfillset(&act.sa_mask);
1882 act.sa_handler = SIG_DFL;
1883 sigaction(SIGABRT, &act, NULL);
1884 }
1885#endif
7501267e
FB
1886 abort();
1887}
1888
c5be9f08
TS
1889CPUState *cpu_copy(CPUState *env)
1890{
01ba9816 1891 CPUState *new_env = cpu_init(env->cpu_model_str);
c5be9f08
TS
1892 CPUState *next_cpu = new_env->next_cpu;
1893 int cpu_index = new_env->cpu_index;
5a38f081
AL
1894#if defined(TARGET_HAS_ICE)
1895 CPUBreakpoint *bp;
1896 CPUWatchpoint *wp;
1897#endif
1898
c5be9f08 1899 memcpy(new_env, env, sizeof(CPUState));
5a38f081
AL
1900
1901 /* Preserve chaining and index. */
c5be9f08
TS
1902 new_env->next_cpu = next_cpu;
1903 new_env->cpu_index = cpu_index;
5a38f081
AL
1904
1905 /* Clone all break/watchpoints.
1906 Note: Once we support ptrace with hw-debug register access, make sure
1907 BP_CPU break/watchpoints are handled correctly on clone. */
72cf2d4f
BS
1908 QTAILQ_INIT(&env->breakpoints);
1909 QTAILQ_INIT(&env->watchpoints);
5a38f081 1910#if defined(TARGET_HAS_ICE)
72cf2d4f 1911 QTAILQ_FOREACH(bp, &env->breakpoints, entry) {
5a38f081
AL
1912 cpu_breakpoint_insert(new_env, bp->pc, bp->flags, NULL);
1913 }
72cf2d4f 1914 QTAILQ_FOREACH(wp, &env->watchpoints, entry) {
5a38f081
AL
1915 cpu_watchpoint_insert(new_env, wp->vaddr, (~wp->len_mask) + 1,
1916 wp->flags, NULL);
1917 }
1918#endif
1919
c5be9f08
TS
1920 return new_env;
1921}
1922
0124311e
FB
1923#if !defined(CONFIG_USER_ONLY)
1924
5c751e99
EI
1925static inline void tlb_flush_jmp_cache(CPUState *env, target_ulong addr)
1926{
1927 unsigned int i;
1928
1929 /* Discard jump cache entries for any tb which might potentially
1930 overlap the flushed page. */
1931 i = tb_jmp_cache_hash_page(addr - TARGET_PAGE_SIZE);
1932 memset (&env->tb_jmp_cache[i], 0,
9742bf26 1933 TB_JMP_PAGE_SIZE * sizeof(TranslationBlock *));
5c751e99
EI
1934
1935 i = tb_jmp_cache_hash_page(addr);
1936 memset (&env->tb_jmp_cache[i], 0,
9742bf26 1937 TB_JMP_PAGE_SIZE * sizeof(TranslationBlock *));
5c751e99
EI
1938}
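/* Note: two page-sized runs of tb_jmp_cache are cleared above because a TB
 * may start on the page preceding 'addr' and extend into the flushed page,
 * so entries hashed under either page could still reference invalidated
 * code.
 */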
1939
08738984
IK
1940static CPUTLBEntry s_cputlb_empty_entry = {
1941 .addr_read = -1,
1942 .addr_write = -1,
1943 .addr_code = -1,
1944 .addend = -1,
1945};
1946
ee8b7021
FB
1947/* NOTE: if flush_global is true, also flush global entries (not
1948 implemented yet) */
1949void tlb_flush(CPUState *env, int flush_global)
33417e70 1950{
33417e70 1951 int i;
0124311e 1952
9fa3e853
FB
1953#if defined(DEBUG_TLB)
1954 printf("tlb_flush:\n");
1955#endif
0124311e
FB
1956 /* must reset current TB so that interrupts cannot modify the
1957 links while we are modifying them */
1958 env->current_tb = NULL;
1959
33417e70 1960 for(i = 0; i < CPU_TLB_SIZE; i++) {
cfde4bd9
IY
1961 int mmu_idx;
1962 for (mmu_idx = 0; mmu_idx < NB_MMU_MODES; mmu_idx++) {
08738984 1963 env->tlb_table[mmu_idx][i] = s_cputlb_empty_entry;
cfde4bd9 1964 }
33417e70 1965 }
9fa3e853 1966
8a40a180 1967 memset (env->tb_jmp_cache, 0, TB_JMP_CACHE_SIZE * sizeof (void *));
9fa3e853 1968
d4c430a8
PB
1969 env->tlb_flush_addr = -1;
1970 env->tlb_flush_mask = 0;
e3db7226 1971 tlb_flush_count++;
33417e70
FB
1972}
1973
274da6b2 1974static inline void tlb_flush_entry(CPUTLBEntry *tlb_entry, target_ulong addr)
61382a50 1975{
5fafdf24 1976 if (addr == (tlb_entry->addr_read &
84b7b8e7 1977 (TARGET_PAGE_MASK | TLB_INVALID_MASK)) ||
5fafdf24 1978 addr == (tlb_entry->addr_write &
84b7b8e7 1979 (TARGET_PAGE_MASK | TLB_INVALID_MASK)) ||
5fafdf24 1980 addr == (tlb_entry->addr_code &
84b7b8e7 1981 (TARGET_PAGE_MASK | TLB_INVALID_MASK))) {
08738984 1982 *tlb_entry = s_cputlb_empty_entry;
84b7b8e7 1983 }
61382a50
FB
1984}
1985
2e12669a 1986void tlb_flush_page(CPUState *env, target_ulong addr)
33417e70 1987{
8a40a180 1988 int i;
cfde4bd9 1989 int mmu_idx;
0124311e 1990
9fa3e853 1991#if defined(DEBUG_TLB)
108c49b8 1992 printf("tlb_flush_page: " TARGET_FMT_lx "\n", addr);
9fa3e853 1993#endif
d4c430a8
PB
1994 /* Check if we need to flush due to large pages. */
1995 if ((addr & env->tlb_flush_mask) == env->tlb_flush_addr) {
1996#if defined(DEBUG_TLB)
1997 printf("tlb_flush_page: forced full flush ("
1998 TARGET_FMT_lx "/" TARGET_FMT_lx ")\n",
1999 env->tlb_flush_addr, env->tlb_flush_mask);
2000#endif
2001 tlb_flush(env, 1);
2002 return;
2003 }
0124311e
FB
2004 /* must reset current TB so that interrupts cannot modify the
2005 links while we are modifying them */
2006 env->current_tb = NULL;
61382a50
FB
2007
2008 addr &= TARGET_PAGE_MASK;
2009 i = (addr >> TARGET_PAGE_BITS) & (CPU_TLB_SIZE - 1);
cfde4bd9
IY
2010 for (mmu_idx = 0; mmu_idx < NB_MMU_MODES; mmu_idx++)
2011 tlb_flush_entry(&env->tlb_table[mmu_idx][i], addr);
0124311e 2012
5c751e99 2013 tlb_flush_jmp_cache(env, addr);
9fa3e853
FB
2014}
2015
9fa3e853
FB
2016/* update the TLBs so that writes to code in the virtual page 'addr'
2017 can be detected */
c227f099 2018static void tlb_protect_code(ram_addr_t ram_addr)
9fa3e853 2019{
5fafdf24 2020 cpu_physical_memory_reset_dirty(ram_addr,
6a00d601
FB
2021 ram_addr + TARGET_PAGE_SIZE,
2022 CODE_DIRTY_FLAG);
9fa3e853
FB
2023}
2024
9fa3e853 2025/* update the TLB so that writes in physical page 'phys_addr' are no longer
3a7d929e 2026 tested for self-modifying code */
c227f099 2027static void tlb_unprotect_code_phys(CPUState *env, ram_addr_t ram_addr,
3a7d929e 2028 target_ulong vaddr)
9fa3e853 2029{
f7c11b53 2030 cpu_physical_memory_set_dirty_flags(ram_addr, CODE_DIRTY_FLAG);
1ccde1cb
FB
2031}
2032
5fafdf24 2033static inline void tlb_reset_dirty_range(CPUTLBEntry *tlb_entry,
1ccde1cb
FB
2034 unsigned long start, unsigned long length)
2035{
2036 unsigned long addr;
84b7b8e7
FB
2037 if ((tlb_entry->addr_write & ~TARGET_PAGE_MASK) == IO_MEM_RAM) {
2038 addr = (tlb_entry->addr_write & TARGET_PAGE_MASK) + tlb_entry->addend;
1ccde1cb 2039 if ((addr - start) < length) {
0f459d16 2040 tlb_entry->addr_write = (tlb_entry->addr_write & TARGET_PAGE_MASK) | TLB_NOTDIRTY;
1ccde1cb
FB
2041 }
2042 }
2043}
2044
5579c7f3 2045/* Note: start and end must be within the same ram block. */
c227f099 2046void cpu_physical_memory_reset_dirty(ram_addr_t start, ram_addr_t end,
0a962c02 2047 int dirty_flags)
1ccde1cb
FB
2048{
2049 CPUState *env;
4f2ac237 2050 unsigned long length, start1;
f7c11b53 2051 int i;
1ccde1cb
FB
2052
2053 start &= TARGET_PAGE_MASK;
2054 end = TARGET_PAGE_ALIGN(end);
2055
2056 length = end - start;
2057 if (length == 0)
2058 return;
f7c11b53 2059 cpu_physical_memory_mask_dirty_range(start, length, dirty_flags);
f23db169 2060
1ccde1cb
FB
2061 /* we modify the TLB cache so that the dirty bit will be set again
2062 when accessing the range */
b2e0a138 2063 start1 = (unsigned long)qemu_safe_ram_ptr(start);
5579c7f3
PB
 2064 /* Check that we don't span multiple blocks - this breaks the
2065 address comparisons below. */
b2e0a138 2066 if ((unsigned long)qemu_safe_ram_ptr(end - 1) - start1
5579c7f3
PB
2067 != (end - 1) - start) {
2068 abort();
2069 }
2070
6a00d601 2071 for(env = first_cpu; env != NULL; env = env->next_cpu) {
cfde4bd9
IY
2072 int mmu_idx;
2073 for (mmu_idx = 0; mmu_idx < NB_MMU_MODES; mmu_idx++) {
2074 for(i = 0; i < CPU_TLB_SIZE; i++)
2075 tlb_reset_dirty_range(&env->tlb_table[mmu_idx][i],
2076 start1, length);
2077 }
6a00d601 2078 }
1ccde1cb
FB
2079}
2080
74576198
AL
2081int cpu_physical_memory_set_dirty_tracking(int enable)
2082{
f6f3fbca 2083 int ret = 0;
74576198 2084 in_migration = enable;
f6f3fbca
MT
2085 ret = cpu_notify_migration_log(!!enable);
2086 return ret;
74576198
AL
2087}
2088
2089int cpu_physical_memory_get_dirty_tracking(void)
2090{
2091 return in_migration;
2092}
2093
c227f099
AL
2094int cpu_physical_sync_dirty_bitmap(target_phys_addr_t start_addr,
2095 target_phys_addr_t end_addr)
2bec46dc 2096{
7b8f3b78 2097 int ret;
151f7749 2098
f6f3fbca 2099 ret = cpu_notify_sync_dirty_bitmap(start_addr, end_addr);
151f7749 2100 return ret;
2bec46dc
AL
2101}
2102
e5896b12
AP
2103int cpu_physical_log_start(target_phys_addr_t start_addr,
2104 ram_addr_t size)
2105{
2106 CPUPhysMemoryClient *client;
2107 QLIST_FOREACH(client, &memory_client_list, list) {
2108 if (client->log_start) {
2109 int r = client->log_start(client, start_addr, size);
2110 if (r < 0) {
2111 return r;
2112 }
2113 }
2114 }
2115 return 0;
2116}
2117
2118int cpu_physical_log_stop(target_phys_addr_t start_addr,
2119 ram_addr_t size)
2120{
2121 CPUPhysMemoryClient *client;
2122 QLIST_FOREACH(client, &memory_client_list, list) {
2123 if (client->log_stop) {
2124 int r = client->log_stop(client, start_addr, size);
2125 if (r < 0) {
2126 return r;
2127 }
2128 }
2129 }
2130 return 0;
2131}
2132
3a7d929e
FB
2133static inline void tlb_update_dirty(CPUTLBEntry *tlb_entry)
2134{
c227f099 2135 ram_addr_t ram_addr;
5579c7f3 2136 void *p;
3a7d929e 2137
84b7b8e7 2138 if ((tlb_entry->addr_write & ~TARGET_PAGE_MASK) == IO_MEM_RAM) {
5579c7f3
PB
2139 p = (void *)(unsigned long)((tlb_entry->addr_write & TARGET_PAGE_MASK)
2140 + tlb_entry->addend);
e890261f 2141 ram_addr = qemu_ram_addr_from_host_nofail(p);
3a7d929e 2142 if (!cpu_physical_memory_is_dirty(ram_addr)) {
0f459d16 2143 tlb_entry->addr_write |= TLB_NOTDIRTY;
3a7d929e
FB
2144 }
2145 }
2146}
2147
2148/* update the TLB according to the current state of the dirty bits */
2149void cpu_tlb_update_dirty(CPUState *env)
2150{
2151 int i;
cfde4bd9
IY
2152 int mmu_idx;
2153 for (mmu_idx = 0; mmu_idx < NB_MMU_MODES; mmu_idx++) {
2154 for(i = 0; i < CPU_TLB_SIZE; i++)
2155 tlb_update_dirty(&env->tlb_table[mmu_idx][i]);
2156 }
3a7d929e
FB
2157}
2158
0f459d16 2159static inline void tlb_set_dirty1(CPUTLBEntry *tlb_entry, target_ulong vaddr)
1ccde1cb 2160{
0f459d16
PB
2161 if (tlb_entry->addr_write == (vaddr | TLB_NOTDIRTY))
2162 tlb_entry->addr_write = vaddr;
1ccde1cb
FB
2163}
2164
0f459d16
PB
2165/* update the TLB corresponding to virtual page vaddr
2166 so that it is no longer dirty */
2167static inline void tlb_set_dirty(CPUState *env, target_ulong vaddr)
1ccde1cb 2168{
1ccde1cb 2169 int i;
cfde4bd9 2170 int mmu_idx;
1ccde1cb 2171
0f459d16 2172 vaddr &= TARGET_PAGE_MASK;
1ccde1cb 2173 i = (vaddr >> TARGET_PAGE_BITS) & (CPU_TLB_SIZE - 1);
cfde4bd9
IY
2174 for (mmu_idx = 0; mmu_idx < NB_MMU_MODES; mmu_idx++)
2175 tlb_set_dirty1(&env->tlb_table[mmu_idx][i], vaddr);
9fa3e853
FB
2176}
2177
d4c430a8
PB
2178/* Our TLB does not support large pages, so remember the area covered by
2179 large pages and trigger a full TLB flush if these are invalidated. */
2180static void tlb_add_large_page(CPUState *env, target_ulong vaddr,
2181 target_ulong size)
2182{
2183 target_ulong mask = ~(size - 1);
2184
2185 if (env->tlb_flush_addr == (target_ulong)-1) {
2186 env->tlb_flush_addr = vaddr & mask;
2187 env->tlb_flush_mask = mask;
2188 return;
2189 }
2190 /* Extend the existing region to include the new page.
2191 This is a compromise between unnecessary flushes and the cost
2192 of maintaining a full variable size TLB. */
2193 mask &= env->tlb_flush_mask;
2194 while (((env->tlb_flush_addr ^ vaddr) & mask) != 0) {
2195 mask <<= 1;
2196 }
2197 env->tlb_flush_addr &= mask;
2198 env->tlb_flush_mask = mask;
2199}
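/* Worked example (assumed values): with an existing 4 MB region recorded at
 * tlb_flush_addr 0x400000 (mask ~0x3fffff), adding another 4 MB page at
 * vaddr 0xc00000 shifts the mask left twice until
 * ((0x400000 ^ 0xc00000) & mask) == 0, giving mask ~0xffffff and
 * tlb_flush_addr 0x000000: a single 16 MB region now covers both pages.
 */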
2200
2201/* Add a new TLB entry. At most one entry for a given virtual address
 2202 is permitted. Only a single TARGET_PAGE_SIZE region is mapped; the
 2203 supplied size is only used by tlb_flush_page. */
2204void tlb_set_page(CPUState *env, target_ulong vaddr,
2205 target_phys_addr_t paddr, int prot,
2206 int mmu_idx, target_ulong size)
9fa3e853 2207{
92e873b9 2208 PhysPageDesc *p;
4f2ac237 2209 unsigned long pd;
9fa3e853 2210 unsigned int index;
4f2ac237 2211 target_ulong address;
0f459d16 2212 target_ulong code_address;
355b1943 2213 unsigned long addend;
84b7b8e7 2214 CPUTLBEntry *te;
a1d1bb31 2215 CPUWatchpoint *wp;
c227f099 2216 target_phys_addr_t iotlb;
9fa3e853 2217
d4c430a8
PB
2218 assert(size >= TARGET_PAGE_SIZE);
2219 if (size != TARGET_PAGE_SIZE) {
2220 tlb_add_large_page(env, vaddr, size);
2221 }
92e873b9 2222 p = phys_page_find(paddr >> TARGET_PAGE_BITS);
9fa3e853
FB
2223 if (!p) {
2224 pd = IO_MEM_UNASSIGNED;
9fa3e853
FB
2225 } else {
2226 pd = p->phys_offset;
9fa3e853
FB
2227 }
2228#if defined(DEBUG_TLB)
7fd3f494
SW
2229 printf("tlb_set_page: vaddr=" TARGET_FMT_lx " paddr=0x" TARGET_FMT_plx
2230 " prot=%x idx=%d pd=0x%08lx\n",
2231 vaddr, paddr, prot, mmu_idx, pd);
9fa3e853
FB
2232#endif
2233
0f459d16
PB
2234 address = vaddr;
2235 if ((pd & ~TARGET_PAGE_MASK) > IO_MEM_ROM && !(pd & IO_MEM_ROMD)) {
2236 /* IO memory case (romd handled later) */
2237 address |= TLB_MMIO;
2238 }
5579c7f3 2239 addend = (unsigned long)qemu_get_ram_ptr(pd & TARGET_PAGE_MASK);
0f459d16
PB
2240 if ((pd & ~TARGET_PAGE_MASK) <= IO_MEM_ROM) {
2241 /* Normal RAM. */
2242 iotlb = pd & TARGET_PAGE_MASK;
2243 if ((pd & ~TARGET_PAGE_MASK) == IO_MEM_RAM)
2244 iotlb |= IO_MEM_NOTDIRTY;
2245 else
2246 iotlb |= IO_MEM_ROM;
2247 } else {
ccbb4d44 2248 /* IO handlers are currently passed a physical address.
0f459d16
PB
2249 It would be nice to pass an offset from the base address
2250 of that region. This would avoid having to special case RAM,
2251 and avoid full address decoding in every device.
2252 We can't use the high bits of pd for this because
2253 IO_MEM_ROMD uses these as a ram address. */
8da3ff18
PB
2254 iotlb = (pd & ~TARGET_PAGE_MASK);
2255 if (p) {
8da3ff18
PB
2256 iotlb += p->region_offset;
2257 } else {
2258 iotlb += paddr;
2259 }
0f459d16
PB
2260 }
2261
2262 code_address = address;
2263 /* Make accesses to pages with watchpoints go via the
2264 watchpoint trap routines. */
72cf2d4f 2265 QTAILQ_FOREACH(wp, &env->watchpoints, entry) {
a1d1bb31 2266 if (vaddr == (wp->vaddr & TARGET_PAGE_MASK)) {
bf298f83
JK
2267 /* Avoid trapping reads of pages with a write breakpoint. */
2268 if ((prot & PAGE_WRITE) || (wp->flags & BP_MEM_READ)) {
2269 iotlb = io_mem_watch + paddr;
2270 address |= TLB_MMIO;
2271 break;
2272 }
6658ffb8 2273 }
0f459d16 2274 }
d79acba4 2275
0f459d16
PB
2276 index = (vaddr >> TARGET_PAGE_BITS) & (CPU_TLB_SIZE - 1);
2277 env->iotlb[mmu_idx][index] = iotlb - vaddr;
2278 te = &env->tlb_table[mmu_idx][index];
2279 te->addend = addend - vaddr;
2280 if (prot & PAGE_READ) {
2281 te->addr_read = address;
2282 } else {
2283 te->addr_read = -1;
2284 }
5c751e99 2285
0f459d16
PB
2286 if (prot & PAGE_EXEC) {
2287 te->addr_code = code_address;
2288 } else {
2289 te->addr_code = -1;
2290 }
2291 if (prot & PAGE_WRITE) {
2292 if ((pd & ~TARGET_PAGE_MASK) == IO_MEM_ROM ||
2293 (pd & IO_MEM_ROMD)) {
2294 /* Write access calls the I/O callback. */
2295 te->addr_write = address | TLB_MMIO;
2296 } else if ((pd & ~TARGET_PAGE_MASK) == IO_MEM_RAM &&
2297 !cpu_physical_memory_is_dirty(pd)) {
2298 te->addr_write = address | TLB_NOTDIRTY;
9fa3e853 2299 } else {
0f459d16 2300 te->addr_write = address;
9fa3e853 2301 }
0f459d16
PB
2302 } else {
2303 te->addr_write = -1;
9fa3e853 2304 }
9fa3e853
FB
2305}
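/* Resulting entry for a clean, dirty-tracked RAM page (assumed values):
 * vaddr 0x1000 backed by IO_MEM_RAM that is not yet dirty gives
 *     te->addr_read  = 0x1000;
 *     te->addr_write = 0x1000 | TLB_NOTDIRTY;   first store traps
 *     te->addend     = host_ptr - 0x1000;       guest va + addend = host va
 * so reads go straight to RAM while the first write is routed through the
 * notdirty handlers to update the dirty bits.
 */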
2306
0124311e
FB
2307#else
2308
ee8b7021 2309void tlb_flush(CPUState *env, int flush_global)
0124311e
FB
2310{
2311}
2312
2e12669a 2313void tlb_flush_page(CPUState *env, target_ulong addr)
0124311e
FB
2314{
2315}
2316
edf8e2af
MW
2317/*
2318 * Walks guest process memory "regions" one by one
2319 * and calls callback function 'fn' for each region.
2320 */
5cd2c5b6
RH
2321
2322struct walk_memory_regions_data
2323{
2324 walk_memory_regions_fn fn;
2325 void *priv;
2326 unsigned long start;
2327 int prot;
2328};
2329
2330static int walk_memory_regions_end(struct walk_memory_regions_data *data,
b480d9b7 2331 abi_ulong end, int new_prot)
5cd2c5b6
RH
2332{
2333 if (data->start != -1ul) {
2334 int rc = data->fn(data->priv, data->start, end, data->prot);
2335 if (rc != 0) {
2336 return rc;
2337 }
2338 }
2339
2340 data->start = (new_prot ? end : -1ul);
2341 data->prot = new_prot;
2342
2343 return 0;
2344}
2345
2346static int walk_memory_regions_1(struct walk_memory_regions_data *data,
b480d9b7 2347 abi_ulong base, int level, void **lp)
5cd2c5b6 2348{
b480d9b7 2349 abi_ulong pa;
5cd2c5b6
RH
2350 int i, rc;
2351
2352 if (*lp == NULL) {
2353 return walk_memory_regions_end(data, base, 0);
2354 }
2355
2356 if (level == 0) {
2357 PageDesc *pd = *lp;
7296abac 2358 for (i = 0; i < L2_SIZE; ++i) {
5cd2c5b6
RH
2359 int prot = pd[i].flags;
2360
2361 pa = base | (i << TARGET_PAGE_BITS);
2362 if (prot != data->prot) {
2363 rc = walk_memory_regions_end(data, pa, prot);
2364 if (rc != 0) {
2365 return rc;
9fa3e853 2366 }
9fa3e853 2367 }
5cd2c5b6
RH
2368 }
2369 } else {
2370 void **pp = *lp;
7296abac 2371 for (i = 0; i < L2_SIZE; ++i) {
b480d9b7
PB
2372 pa = base | ((abi_ulong)i <<
2373 (TARGET_PAGE_BITS + L2_BITS * level));
5cd2c5b6
RH
2374 rc = walk_memory_regions_1(data, pa, level - 1, pp + i);
2375 if (rc != 0) {
2376 return rc;
2377 }
2378 }
2379 }
2380
2381 return 0;
2382}
2383
2384int walk_memory_regions(void *priv, walk_memory_regions_fn fn)
2385{
2386 struct walk_memory_regions_data data;
2387 unsigned long i;
2388
2389 data.fn = fn;
2390 data.priv = priv;
2391 data.start = -1ul;
2392 data.prot = 0;
2393
2394 for (i = 0; i < V_L1_SIZE; i++) {
b480d9b7 2395 int rc = walk_memory_regions_1(&data, (abi_ulong)i << V_L1_SHIFT,
5cd2c5b6
RH
2396 V_L1_SHIFT / L2_BITS - 1, l1_map + i);
2397 if (rc != 0) {
2398 return rc;
9fa3e853 2399 }
33417e70 2400 }
5cd2c5b6
RH
2401
2402 return walk_memory_regions_end(&data, 0, 0);
edf8e2af
MW
2403}
2404
b480d9b7
PB
2405static int dump_region(void *priv, abi_ulong start,
2406 abi_ulong end, unsigned long prot)
edf8e2af
MW
2407{
2408 FILE *f = (FILE *)priv;
2409
b480d9b7
PB
2410 (void) fprintf(f, TARGET_ABI_FMT_lx"-"TARGET_ABI_FMT_lx
2411 " "TARGET_ABI_FMT_lx" %c%c%c\n",
edf8e2af
MW
2412 start, end, end - start,
2413 ((prot & PAGE_READ) ? 'r' : '-'),
2414 ((prot & PAGE_WRITE) ? 'w' : '-'),
2415 ((prot & PAGE_EXEC) ? 'x' : '-'));
2416
2417 return (0);
2418}
2419
2420/* dump memory mappings */
2421void page_dump(FILE *f)
2422{
2423 (void) fprintf(f, "%-8s %-8s %-8s %s\n",
2424 "start", "end", "size", "prot");
2425 walk_memory_regions(f, dump_region);
33417e70
FB
2426}
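/* Example output (made-up guest mappings, 32-bit ABI):
 * start    end      size     prot
 * 00400000-00402000 00002000 r-x
 * 00402000-00404000 00002000 rw-
 */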
2427
53a5960a 2428int page_get_flags(target_ulong address)
33417e70 2429{
9fa3e853
FB
2430 PageDesc *p;
2431
2432 p = page_find(address >> TARGET_PAGE_BITS);
33417e70 2433 if (!p)
9fa3e853
FB
2434 return 0;
2435 return p->flags;
2436}
2437
376a7909
RH
2438/* Modify the flags of a page and invalidate the code if necessary.
2439 The flag PAGE_WRITE_ORG is positioned automatically depending
2440 on PAGE_WRITE. The mmap_lock should already be held. */
53a5960a 2441void page_set_flags(target_ulong start, target_ulong end, int flags)
9fa3e853 2442{
376a7909
RH
2443 target_ulong addr, len;
2444
2445 /* This function should never be called with addresses outside the
2446 guest address space. If this assert fires, it probably indicates
2447 a missing call to h2g_valid. */
b480d9b7
PB
2448#if TARGET_ABI_BITS > L1_MAP_ADDR_SPACE_BITS
2449 assert(end < ((abi_ulong)1 << L1_MAP_ADDR_SPACE_BITS));
376a7909
RH
2450#endif
2451 assert(start < end);
9fa3e853
FB
2452
2453 start = start & TARGET_PAGE_MASK;
2454 end = TARGET_PAGE_ALIGN(end);
376a7909
RH
2455
2456 if (flags & PAGE_WRITE) {
9fa3e853 2457 flags |= PAGE_WRITE_ORG;
376a7909
RH
2458 }
2459
2460 for (addr = start, len = end - start;
2461 len != 0;
2462 len -= TARGET_PAGE_SIZE, addr += TARGET_PAGE_SIZE) {
2463 PageDesc *p = page_find_alloc(addr >> TARGET_PAGE_BITS, 1);
2464
2465 /* If the write protection bit is set, then we invalidate
2466 the code inside. */
5fafdf24 2467 if (!(p->flags & PAGE_WRITE) &&
9fa3e853
FB
2468 (flags & PAGE_WRITE) &&
2469 p->first_tb) {
d720b93d 2470 tb_invalidate_phys_page(addr, 0, NULL);
9fa3e853
FB
2471 }
2472 p->flags = flags;
2473 }
33417e70
FB
2474}
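/* Hypothetical call (assumed 4 KiB target pages): page_set_flags(0x20000,
 * 0x22000, PAGE_VALID | PAGE_READ | PAGE_WRITE) visits the two target
 * pages, ORs in PAGE_WRITE_ORG, and invalidates translated code on any
 * page that was read-only but still holds TBs (p->first_tb != NULL).
 */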
2475
3d97b40b
TS
2476int page_check_range(target_ulong start, target_ulong len, int flags)
2477{
2478 PageDesc *p;
2479 target_ulong end;
2480 target_ulong addr;
2481
376a7909
RH
2482 /* This function should never be called with addresses outside the
2483 guest address space. If this assert fires, it probably indicates
2484 a missing call to h2g_valid. */
338e9e6c
BS
2485#if TARGET_ABI_BITS > L1_MAP_ADDR_SPACE_BITS
2486 assert(start < ((abi_ulong)1 << L1_MAP_ADDR_SPACE_BITS));
376a7909
RH
2487#endif
2488
3e0650a9
RH
2489 if (len == 0) {
2490 return 0;
2491 }
376a7909
RH
2492 if (start + len - 1 < start) {
2493 /* We've wrapped around. */
55f280c9 2494 return -1;
376a7909 2495 }
55f280c9 2496
3d97b40b
TS
 2497 end = TARGET_PAGE_ALIGN(start+len); /* must do before we lose bits in the next step */
2498 start = start & TARGET_PAGE_MASK;
2499
376a7909
RH
2500 for (addr = start, len = end - start;
2501 len != 0;
2502 len -= TARGET_PAGE_SIZE, addr += TARGET_PAGE_SIZE) {
3d97b40b
TS
2503 p = page_find(addr >> TARGET_PAGE_BITS);
2504 if( !p )
2505 return -1;
2506 if( !(p->flags & PAGE_VALID) )
2507 return -1;
2508
dae3270c 2509 if ((flags & PAGE_READ) && !(p->flags & PAGE_READ))
3d97b40b 2510 return -1;
dae3270c
FB
2511 if (flags & PAGE_WRITE) {
2512 if (!(p->flags & PAGE_WRITE_ORG))
2513 return -1;
2514 /* unprotect the page if it was put read-only because it
2515 contains translated code */
2516 if (!(p->flags & PAGE_WRITE)) {
2517 if (!page_unprotect(addr, 0, NULL))
2518 return -1;
2519 }
2520 return 0;
2521 }
3d97b40b
TS
2522 }
2523 return 0;
2524}
2525
9fa3e853 2526/* called from signal handler: invalidate the code and unprotect the
ccbb4d44 2527 page. Return TRUE if the fault was successfully handled. */
53a5960a 2528int page_unprotect(target_ulong address, unsigned long pc, void *puc)
9fa3e853 2529{
45d679d6
AJ
2530 unsigned int prot;
2531 PageDesc *p;
53a5960a 2532 target_ulong host_start, host_end, addr;
9fa3e853 2533
c8a706fe
PB
2534 /* Technically this isn't safe inside a signal handler. However we
2535 know this only ever happens in a synchronous SEGV handler, so in
2536 practice it seems to be ok. */
2537 mmap_lock();
2538
45d679d6
AJ
2539 p = page_find(address >> TARGET_PAGE_BITS);
2540 if (!p) {
c8a706fe 2541 mmap_unlock();
9fa3e853 2542 return 0;
c8a706fe 2543 }
45d679d6 2544
9fa3e853
FB
2545 /* if the page was really writable, then we change its
2546 protection back to writable */
45d679d6
AJ
2547 if ((p->flags & PAGE_WRITE_ORG) && !(p->flags & PAGE_WRITE)) {
2548 host_start = address & qemu_host_page_mask;
2549 host_end = host_start + qemu_host_page_size;
2550
2551 prot = 0;
2552 for (addr = host_start ; addr < host_end ; addr += TARGET_PAGE_SIZE) {
2553 p = page_find(addr >> TARGET_PAGE_BITS);
2554 p->flags |= PAGE_WRITE;
2555 prot |= p->flags;
2556
9fa3e853
FB
2557 /* and since the content will be modified, we must invalidate
2558 the corresponding translated code. */
45d679d6 2559 tb_invalidate_phys_page(addr, pc, puc);
9fa3e853 2560#ifdef DEBUG_TB_CHECK
45d679d6 2561 tb_invalidate_check(addr);
9fa3e853 2562#endif
9fa3e853 2563 }
45d679d6
AJ
2564 mprotect((void *)g2h(host_start), qemu_host_page_size,
2565 prot & PAGE_BITS);
2566
2567 mmap_unlock();
2568 return 1;
9fa3e853 2569 }
c8a706fe 2570 mmap_unlock();
9fa3e853
FB
2571 return 0;
2572}
2573
6a00d601
FB
2574static inline void tlb_set_dirty(CPUState *env,
2575 unsigned long addr, target_ulong vaddr)
1ccde1cb
FB
2576{
2577}
9fa3e853
FB
2578#endif /* defined(CONFIG_USER_ONLY) */
2579
e2eef170 2580#if !defined(CONFIG_USER_ONLY)
8da3ff18 2581
c04b2b78
PB
2582#define SUBPAGE_IDX(addr) ((addr) & ~TARGET_PAGE_MASK)
2583typedef struct subpage_t {
2584 target_phys_addr_t base;
f6405247
RH
2585 ram_addr_t sub_io_index[TARGET_PAGE_SIZE];
2586 ram_addr_t region_offset[TARGET_PAGE_SIZE];
c04b2b78
PB
2587} subpage_t;
2588
c227f099
AL
2589static int subpage_register (subpage_t *mmio, uint32_t start, uint32_t end,
2590 ram_addr_t memory, ram_addr_t region_offset);
f6405247
RH
2591static subpage_t *subpage_init (target_phys_addr_t base, ram_addr_t *phys,
2592 ram_addr_t orig_memory,
2593 ram_addr_t region_offset);
db7b5426
BS
2594#define CHECK_SUBPAGE(addr, start_addr, start_addr2, end_addr, end_addr2, \
2595 need_subpage) \
2596 do { \
2597 if (addr > start_addr) \
2598 start_addr2 = 0; \
2599 else { \
2600 start_addr2 = start_addr & ~TARGET_PAGE_MASK; \
2601 if (start_addr2 > 0) \
2602 need_subpage = 1; \
2603 } \
2604 \
49e9fba2 2605 if ((start_addr + orig_size) - addr >= TARGET_PAGE_SIZE) \
db7b5426
BS
2606 end_addr2 = TARGET_PAGE_SIZE - 1; \
2607 else { \
2608 end_addr2 = (start_addr + orig_size - 1) & ~TARGET_PAGE_MASK; \
2609 if (end_addr2 < TARGET_PAGE_SIZE - 1) \
2610 need_subpage = 1; \
2611 } \
2612 } while (0)
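/* Worked example (assumed 4 KiB pages): for the page at addr 0x1000 and a
 * registration with start_addr 0x1100, orig_size 0x200, the macro yields
 * start_addr2 = 0x100, end_addr2 = 0x2ff and need_subpage = 1, since the
 * region neither starts nor ends on a page boundary.
 */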
2613
8f2498f9
MT
2614/* register physical memory.
2615 For RAM, 'size' must be a multiple of the target page size.
2616 If (phys_offset & ~TARGET_PAGE_MASK) != 0, then it is an
8da3ff18
PB
2617 io memory page. The address used when calling the IO function is
2618 the offset from the start of the region, plus region_offset. Both
ccbb4d44 2619 start_addr and region_offset are rounded down to a page boundary
8da3ff18
PB
2620 before calculating this offset. This should not be a problem unless
2621 the low bits of start_addr and region_offset differ. */
0fd542fb 2622void cpu_register_physical_memory_log(target_phys_addr_t start_addr,
c227f099
AL
2623 ram_addr_t size,
2624 ram_addr_t phys_offset,
0fd542fb
MT
2625 ram_addr_t region_offset,
2626 bool log_dirty)
33417e70 2627{
c227f099 2628 target_phys_addr_t addr, end_addr;
92e873b9 2629 PhysPageDesc *p;
9d42037b 2630 CPUState *env;
c227f099 2631 ram_addr_t orig_size = size;
f6405247 2632 subpage_t *subpage;
33417e70 2633
3b8e6a2d 2634 assert(size);
0fd542fb 2635 cpu_notify_set_memory(start_addr, size, phys_offset, log_dirty);
f6f3fbca 2636
67c4d23c
PB
2637 if (phys_offset == IO_MEM_UNASSIGNED) {
2638 region_offset = start_addr;
2639 }
8da3ff18 2640 region_offset &= TARGET_PAGE_MASK;
5fd386f6 2641 size = (size + TARGET_PAGE_SIZE - 1) & TARGET_PAGE_MASK;
c227f099 2642 end_addr = start_addr + (target_phys_addr_t)size;
3b8e6a2d
EI
2643
2644 addr = start_addr;
2645 do {
db7b5426
BS
2646 p = phys_page_find(addr >> TARGET_PAGE_BITS);
2647 if (p && p->phys_offset != IO_MEM_UNASSIGNED) {
c227f099
AL
2648 ram_addr_t orig_memory = p->phys_offset;
2649 target_phys_addr_t start_addr2, end_addr2;
db7b5426
BS
2650 int need_subpage = 0;
2651
2652 CHECK_SUBPAGE(addr, start_addr, start_addr2, end_addr, end_addr2,
2653 need_subpage);
f6405247 2654 if (need_subpage) {
db7b5426
BS
2655 if (!(orig_memory & IO_MEM_SUBPAGE)) {
2656 subpage = subpage_init((addr & TARGET_PAGE_MASK),
8da3ff18
PB
2657 &p->phys_offset, orig_memory,
2658 p->region_offset);
db7b5426
BS
2659 } else {
2660 subpage = io_mem_opaque[(orig_memory & ~TARGET_PAGE_MASK)
2661 >> IO_MEM_SHIFT];
2662 }
8da3ff18
PB
2663 subpage_register(subpage, start_addr2, end_addr2, phys_offset,
2664 region_offset);
2665 p->region_offset = 0;
db7b5426
BS
2666 } else {
2667 p->phys_offset = phys_offset;
2668 if ((phys_offset & ~TARGET_PAGE_MASK) <= IO_MEM_ROM ||
2669 (phys_offset & IO_MEM_ROMD))
2670 phys_offset += TARGET_PAGE_SIZE;
2671 }
2672 } else {
2673 p = phys_page_find_alloc(addr >> TARGET_PAGE_BITS, 1);
2674 p->phys_offset = phys_offset;
8da3ff18 2675 p->region_offset = region_offset;
db7b5426 2676 if ((phys_offset & ~TARGET_PAGE_MASK) <= IO_MEM_ROM ||
8da3ff18 2677 (phys_offset & IO_MEM_ROMD)) {
db7b5426 2678 phys_offset += TARGET_PAGE_SIZE;
0e8f0967 2679 } else {
c227f099 2680 target_phys_addr_t start_addr2, end_addr2;
db7b5426
BS
2681 int need_subpage = 0;
2682
2683 CHECK_SUBPAGE(addr, start_addr, start_addr2, end_addr,
2684 end_addr2, need_subpage);
2685
f6405247 2686 if (need_subpage) {
db7b5426 2687 subpage = subpage_init((addr & TARGET_PAGE_MASK),
8da3ff18 2688 &p->phys_offset, IO_MEM_UNASSIGNED,
67c4d23c 2689 addr & TARGET_PAGE_MASK);
db7b5426 2690 subpage_register(subpage, start_addr2, end_addr2,
8da3ff18
PB
2691 phys_offset, region_offset);
2692 p->region_offset = 0;
db7b5426
BS
2693 }
2694 }
2695 }
8da3ff18 2696 region_offset += TARGET_PAGE_SIZE;
3b8e6a2d
EI
2697 addr += TARGET_PAGE_SIZE;
2698 } while (addr != end_addr);
3b46e624 2699
9d42037b
FB
2700 /* since each CPU stores ram addresses in its TLB cache, we must
2701 reset the modified entries */
2702 /* XXX: slow ! */
2703 for(env = first_cpu; env != NULL; env = env->next_cpu) {
2704 tlb_flush(env, 1);
2705 }
33417e70
FB
2706}
2707
ba863458 2708/* XXX: temporary until new memory mapping API */
c227f099 2709ram_addr_t cpu_get_physical_page_desc(target_phys_addr_t addr)
ba863458
FB
2710{
2711 PhysPageDesc *p;
2712
2713 p = phys_page_find(addr >> TARGET_PAGE_BITS);
2714 if (!p)
2715 return IO_MEM_UNASSIGNED;
2716 return p->phys_offset;
2717}
2718
c227f099 2719void qemu_register_coalesced_mmio(target_phys_addr_t addr, ram_addr_t size)
f65ed4c1
AL
2720{
2721 if (kvm_enabled())
2722 kvm_coalesce_mmio_region(addr, size);
2723}
2724
c227f099 2725void qemu_unregister_coalesced_mmio(target_phys_addr_t addr, ram_addr_t size)
f65ed4c1
AL
2726{
2727 if (kvm_enabled())
2728 kvm_uncoalesce_mmio_region(addr, size);
2729}
2730
62a2744c
SY
2731void qemu_flush_coalesced_mmio_buffer(void)
2732{
2733 if (kvm_enabled())
2734 kvm_flush_coalesced_mmio_buffer();
2735}
2736
c902760f
MT
2737#if defined(__linux__) && !defined(TARGET_S390X)
2738
2739#include <sys/vfs.h>
2740
2741#define HUGETLBFS_MAGIC 0x958458f6
2742
2743static long gethugepagesize(const char *path)
2744{
2745 struct statfs fs;
2746 int ret;
2747
2748 do {
9742bf26 2749 ret = statfs(path, &fs);
c902760f
MT
2750 } while (ret != 0 && errno == EINTR);
2751
2752 if (ret != 0) {
9742bf26
YT
2753 perror(path);
2754 return 0;
c902760f
MT
2755 }
2756
2757 if (fs.f_type != HUGETLBFS_MAGIC)
9742bf26 2758 fprintf(stderr, "Warning: path not on HugeTLBFS: %s\n", path);
c902760f
MT
2759
2760 return fs.f_bsize;
2761}
2762
04b16653
AW
2763static void *file_ram_alloc(RAMBlock *block,
2764 ram_addr_t memory,
2765 const char *path)
c902760f
MT
2766{
2767 char *filename;
2768 void *area;
2769 int fd;
2770#ifdef MAP_POPULATE
2771 int flags;
2772#endif
2773 unsigned long hpagesize;
2774
2775 hpagesize = gethugepagesize(path);
2776 if (!hpagesize) {
9742bf26 2777 return NULL;
c902760f
MT
2778 }
2779
2780 if (memory < hpagesize) {
2781 return NULL;
2782 }
2783
2784 if (kvm_enabled() && !kvm_has_sync_mmu()) {
2785 fprintf(stderr, "host lacks kvm mmu notifiers, -mem-path unsupported\n");
2786 return NULL;
2787 }
2788
2789 if (asprintf(&filename, "%s/qemu_back_mem.XXXXXX", path) == -1) {
9742bf26 2790 return NULL;
c902760f
MT
2791 }
2792
2793 fd = mkstemp(filename);
2794 if (fd < 0) {
9742bf26
YT
2795 perror("unable to create backing store for hugepages");
2796 free(filename);
2797 return NULL;
c902760f
MT
2798 }
2799 unlink(filename);
2800 free(filename);
2801
2802 memory = (memory+hpagesize-1) & ~(hpagesize-1);
2803
2804 /*
2805 * ftruncate is not supported by hugetlbfs in older
2806 * hosts, so don't bother bailing out on errors.
2807 * If anything goes wrong with it under other filesystems,
2808 * mmap will fail.
2809 */
2810 if (ftruncate(fd, memory))
9742bf26 2811 perror("ftruncate");
c902760f
MT
2812
2813#ifdef MAP_POPULATE
 2814 /* NB: MAP_POPULATE won't exhaustively allocate all physical pages when
 2815 * MAP_PRIVATE is requested. For mem_prealloc we mmap as MAP_SHARED
2816 * to sidestep this quirk.
2817 */
2818 flags = mem_prealloc ? MAP_POPULATE | MAP_SHARED : MAP_PRIVATE;
2819 area = mmap(0, memory, PROT_READ | PROT_WRITE, flags, fd, 0);
2820#else
2821 area = mmap(0, memory, PROT_READ | PROT_WRITE, MAP_PRIVATE, fd, 0);
2822#endif
2823 if (area == MAP_FAILED) {
9742bf26
YT
2824 perror("file_ram_alloc: can't mmap RAM pages");
2825 close(fd);
2826 return (NULL);
c902760f 2827 }
04b16653 2828 block->fd = fd;
c902760f
MT
2829 return area;
2830}
2831#endif
2832
d17b5288 2833static ram_addr_t find_ram_offset(ram_addr_t size)
04b16653
AW
2834{
2835 RAMBlock *block, *next_block;
09d7ae90 2836 ram_addr_t offset = 0, mingap = ULONG_MAX;
04b16653
AW
2837
2838 if (QLIST_EMPTY(&ram_list.blocks))
2839 return 0;
2840
2841 QLIST_FOREACH(block, &ram_list.blocks, next) {
2842 ram_addr_t end, next = ULONG_MAX;
2843
2844 end = block->offset + block->length;
2845
2846 QLIST_FOREACH(next_block, &ram_list.blocks, next) {
2847 if (next_block->offset >= end) {
2848 next = MIN(next, next_block->offset);
2849 }
2850 }
2851 if (next - end >= size && next - end < mingap) {
2852 offset = end;
2853 mingap = next - end;
2854 }
2855 }
2856 return offset;
2857}
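/* Worked example (assumed block list): with blocks at [0, 0x4000000) and
 * [0x8000000, 0xa000000), a request for size 0x2000000 measures the gap
 * after each block and picks the smallest one that fits, so the new block
 * is placed at offset 0x4000000 (best fit keeps offsets densely packed).
 */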
2858
2859static ram_addr_t last_ram_offset(void)
d17b5288
AW
2860{
2861 RAMBlock *block;
2862 ram_addr_t last = 0;
2863
2864 QLIST_FOREACH(block, &ram_list.blocks, next)
2865 last = MAX(last, block->offset + block->length);
2866
2867 return last;
2868}
2869
84b89d78 2870ram_addr_t qemu_ram_alloc_from_ptr(DeviceState *dev, const char *name,
6977dfe6 2871 ram_addr_t size, void *host)
84b89d78
CM
2872{
2873 RAMBlock *new_block, *block;
2874
2875 size = TARGET_PAGE_ALIGN(size);
2876 new_block = qemu_mallocz(sizeof(*new_block));
2877
2878 if (dev && dev->parent_bus && dev->parent_bus->info->get_dev_path) {
2879 char *id = dev->parent_bus->info->get_dev_path(dev);
2880 if (id) {
2881 snprintf(new_block->idstr, sizeof(new_block->idstr), "%s/", id);
2882 qemu_free(id);
2883 }
2884 }
2885 pstrcat(new_block->idstr, sizeof(new_block->idstr), name);
2886
2887 QLIST_FOREACH(block, &ram_list.blocks, next) {
2888 if (!strcmp(block->idstr, new_block->idstr)) {
2889 fprintf(stderr, "RAMBlock \"%s\" already registered, abort!\n",
2890 new_block->idstr);
2891 abort();
2892 }
2893 }
2894
432d268c 2895 new_block->offset = find_ram_offset(size);
6977dfe6
YT
2896 if (host) {
2897 new_block->host = host;
cd19cfa2 2898 new_block->flags |= RAM_PREALLOC_MASK;
6977dfe6
YT
2899 } else {
2900 if (mem_path) {
c902760f 2901#if defined (__linux__) && !defined(TARGET_S390X)
6977dfe6
YT
2902 new_block->host = file_ram_alloc(new_block, size, mem_path);
2903 if (!new_block->host) {
2904 new_block->host = qemu_vmalloc(size);
e78815a5 2905 qemu_madvise(new_block->host, size, QEMU_MADV_MERGEABLE);
6977dfe6 2906 }
c902760f 2907#else
6977dfe6
YT
2908 fprintf(stderr, "-mem-path option unsupported\n");
2909 exit(1);
c902760f 2910#endif
6977dfe6 2911 } else {
6b02494d 2912#if defined(TARGET_S390X) && defined(CONFIG_KVM)
ff83678a
CB
2913 /* S390 KVM requires the topmost vma of the RAM to be smaller than
 2914 a system-defined value, which is at least 256GB. Larger systems
2915 have larger values. We put the guest between the end of data
2916 segment (system break) and this value. We use 32GB as a base to
2917 have enough room for the system break to grow. */
2918 new_block->host = mmap((void*)0x800000000, size,
6977dfe6 2919 PROT_EXEC|PROT_READ|PROT_WRITE,
ff83678a 2920 MAP_SHARED | MAP_ANONYMOUS | MAP_FIXED, -1, 0);
6b02494d 2921#else
432d268c
JN
2922 if (xen_mapcache_enabled()) {
2923 xen_ram_alloc(new_block->offset, size);
2924 } else {
2925 new_block->host = qemu_vmalloc(size);
2926 }
6b02494d 2927#endif
e78815a5 2928 qemu_madvise(new_block->host, size, QEMU_MADV_MERGEABLE);
6977dfe6 2929 }
c902760f 2930 }
94a6b54f
PB
2931 new_block->length = size;
2932
f471a17e 2933 QLIST_INSERT_HEAD(&ram_list.blocks, new_block, next);
94a6b54f 2934
f471a17e 2935 ram_list.phys_dirty = qemu_realloc(ram_list.phys_dirty,
04b16653 2936 last_ram_offset() >> TARGET_PAGE_BITS);
d17b5288 2937 memset(ram_list.phys_dirty + (new_block->offset >> TARGET_PAGE_BITS),
94a6b54f
PB
2938 0xff, size >> TARGET_PAGE_BITS);
2939
6f0437e8
JK
2940 if (kvm_enabled())
2941 kvm_setup_guest_memory(new_block->host, size);
2942
94a6b54f
PB
2943 return new_block->offset;
2944}
e9a1ab19 2945
6977dfe6
YT
2946ram_addr_t qemu_ram_alloc(DeviceState *dev, const char *name, ram_addr_t size)
2947{
2948 return qemu_ram_alloc_from_ptr(dev, name, size, NULL);
2949}
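/* Typical use (hypothetical caller):
 *     ram_addr_t off = qemu_ram_alloc(NULL, "vga.vram", 8 * 1024 * 1024);
 *     uint8_t *p = qemu_get_ram_ptr(off);
 * The returned value is a ram_addr_t offset into the global RAM space,
 * not a host pointer.
 */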
2950
c227f099 2951void qemu_ram_free(ram_addr_t addr)
e9a1ab19 2952{
04b16653
AW
2953 RAMBlock *block;
2954
2955 QLIST_FOREACH(block, &ram_list.blocks, next) {
2956 if (addr == block->offset) {
2957 QLIST_REMOVE(block, next);
cd19cfa2
HY
2958 if (block->flags & RAM_PREALLOC_MASK) {
2959 ;
2960 } else if (mem_path) {
04b16653
AW
2961#if defined (__linux__) && !defined(TARGET_S390X)
2962 if (block->fd) {
2963 munmap(block->host, block->length);
2964 close(block->fd);
2965 } else {
2966 qemu_vfree(block->host);
2967 }
fd28aa13
JK
2968#else
2969 abort();
04b16653
AW
2970#endif
2971 } else {
2972#if defined(TARGET_S390X) && defined(CONFIG_KVM)
2973 munmap(block->host, block->length);
2974#else
432d268c
JN
2975 if (xen_mapcache_enabled()) {
2976 qemu_invalidate_entry(block->host);
2977 } else {
2978 qemu_vfree(block->host);
2979 }
04b16653
AW
2980#endif
2981 }
2982 qemu_free(block);
2983 return;
2984 }
2985 }
2986
e9a1ab19
FB
2987}
2988
cd19cfa2
HY
2989#ifndef _WIN32
2990void qemu_ram_remap(ram_addr_t addr, ram_addr_t length)
2991{
2992 RAMBlock *block;
2993 ram_addr_t offset;
2994 int flags;
2995 void *area, *vaddr;
2996
2997 QLIST_FOREACH(block, &ram_list.blocks, next) {
2998 offset = addr - block->offset;
2999 if (offset < block->length) {
3000 vaddr = block->host + offset;
3001 if (block->flags & RAM_PREALLOC_MASK) {
3002 ;
3003 } else {
3004 flags = MAP_FIXED;
3005 munmap(vaddr, length);
3006 if (mem_path) {
3007#if defined(__linux__) && !defined(TARGET_S390X)
3008 if (block->fd) {
3009#ifdef MAP_POPULATE
3010 flags |= mem_prealloc ? MAP_POPULATE | MAP_SHARED :
3011 MAP_PRIVATE;
3012#else
3013 flags |= MAP_PRIVATE;
3014#endif
3015 area = mmap(vaddr, length, PROT_READ | PROT_WRITE,
3016 flags, block->fd, offset);
3017 } else {
3018 flags |= MAP_PRIVATE | MAP_ANONYMOUS;
3019 area = mmap(vaddr, length, PROT_READ | PROT_WRITE,
3020 flags, -1, 0);
3021 }
fd28aa13
JK
3022#else
3023 abort();
cd19cfa2
HY
3024#endif
3025 } else {
3026#if defined(TARGET_S390X) && defined(CONFIG_KVM)
3027 flags |= MAP_SHARED | MAP_ANONYMOUS;
3028 area = mmap(vaddr, length, PROT_EXEC|PROT_READ|PROT_WRITE,
3029 flags, -1, 0);
3030#else
3031 flags |= MAP_PRIVATE | MAP_ANONYMOUS;
3032 area = mmap(vaddr, length, PROT_READ | PROT_WRITE,
3033 flags, -1, 0);
3034#endif
3035 }
3036 if (area != vaddr) {
3037 fprintf(stderr, "Could not remap addr: %lx@%lx\n",
3038 length, addr);
3039 exit(1);
3040 }
3041 qemu_madvise(vaddr, length, QEMU_MADV_MERGEABLE);
3042 }
3043 return;
3044 }
3045 }
3046}
3047#endif /* !_WIN32 */
3048
dc828ca1 3049/* Return a host pointer to ram allocated with qemu_ram_alloc.
5579c7f3
PB
3050 With the exception of the softmmu code in this file, this should
3051 only be used for local memory (e.g. video ram) that the device owns,
3052 and knows it isn't going to access beyond the end of the block.
3053
3054 It should not be used for general purpose DMA.
3055 Use cpu_physical_memory_map/cpu_physical_memory_rw instead.
3056 */
c227f099 3057void *qemu_get_ram_ptr(ram_addr_t addr)
dc828ca1 3058{
94a6b54f
PB
3059 RAMBlock *block;
3060
f471a17e
AW
3061 QLIST_FOREACH(block, &ram_list.blocks, next) {
3062 if (addr - block->offset < block->length) {
7d82af38
VP
 3063 /* Move this entry to the start of the list. */
3064 if (block != QLIST_FIRST(&ram_list.blocks)) {
3065 QLIST_REMOVE(block, next);
3066 QLIST_INSERT_HEAD(&ram_list.blocks, block, next);
3067 }
432d268c
JN
3068 if (xen_mapcache_enabled()) {
 3069 /* We need to check whether the requested address is in RAM
3070 * because we don't want to map the entire memory in QEMU.
3071 */
3072 if (block->offset == 0) {
3073 return qemu_map_cache(addr, 0, 1);
3074 } else if (block->host == NULL) {
3075 block->host = xen_map_block(block->offset, block->length);
3076 }
3077 }
f471a17e
AW
3078 return block->host + (addr - block->offset);
3079 }
94a6b54f 3080 }
f471a17e
AW
3081
3082 fprintf(stderr, "Bad ram offset %" PRIx64 "\n", (uint64_t)addr);
3083 abort();
3084
3085 return NULL;
dc828ca1
PB
3086}
3087
b2e0a138
MT
3088/* Return a host pointer to ram allocated with qemu_ram_alloc.
3089 * Same as qemu_get_ram_ptr but avoid reordering ramblocks.
3090 */
3091void *qemu_safe_ram_ptr(ram_addr_t addr)
3092{
3093 RAMBlock *block;
3094
3095 QLIST_FOREACH(block, &ram_list.blocks, next) {
3096 if (addr - block->offset < block->length) {
432d268c
JN
3097 if (xen_mapcache_enabled()) {
 3098 /* We need to check whether the requested address is in RAM
3099 * because we don't want to map the entire memory in QEMU.
3100 */
3101 if (block->offset == 0) {
3102 return qemu_map_cache(addr, 0, 1);
3103 } else if (block->host == NULL) {
3104 block->host = xen_map_block(block->offset, block->length);
3105 }
3106 }
b2e0a138
MT
3107 return block->host + (addr - block->offset);
3108 }
3109 }
3110
3111 fprintf(stderr, "Bad ram offset %" PRIx64 "\n", (uint64_t)addr);
3112 abort();
3113
3114 return NULL;
3115}
3116
050a0ddf
AP
3117void qemu_put_ram_ptr(void *addr)
3118{
3119 trace_qemu_put_ram_ptr(addr);
3120
3121 if (xen_mapcache_enabled()) {
3122 RAMBlock *block;
3123
3124 QLIST_FOREACH(block, &ram_list.blocks, next) {
3125 if (addr == block->host) {
3126 break;
3127 }
3128 }
3129 if (block && block->host) {
3130 xen_unmap_block(block->host, block->length);
3131 block->host = NULL;
3132 } else {
3133 qemu_map_cache_unlock(addr);
3134 }
3135 }
3136}
3137
e890261f 3138int qemu_ram_addr_from_host(void *ptr, ram_addr_t *ram_addr)
5579c7f3 3139{
94a6b54f
PB
3140 RAMBlock *block;
3141 uint8_t *host = ptr;
3142
f471a17e 3143 QLIST_FOREACH(block, &ram_list.blocks, next) {
432d268c
JN
 3144 /* This case happens when the block is not mapped. */
3145 if (block->host == NULL) {
3146 continue;
3147 }
f471a17e 3148 if (host - block->host < block->length) {
e890261f
MT
3149 *ram_addr = block->offset + (host - block->host);
3150 return 0;
f471a17e 3151 }
94a6b54f 3152 }
432d268c
JN
3153
3154 if (xen_mapcache_enabled()) {
3155 *ram_addr = qemu_ram_addr_from_mapcache(ptr);
3156 return 0;
3157 }
3158
e890261f
MT
3159 return -1;
3160}
f471a17e 3161
e890261f
MT
3162/* Some of the softmmu routines need to translate from a host pointer
3163 (typically a TLB entry) back to a ram offset. */
3164ram_addr_t qemu_ram_addr_from_host_nofail(void *ptr)
3165{
3166 ram_addr_t ram_addr;
f471a17e 3167
e890261f
MT
3168 if (qemu_ram_addr_from_host(ptr, &ram_addr)) {
3169 fprintf(stderr, "Bad ram pointer %p\n", ptr);
3170 abort();
3171 }
3172 return ram_addr;
5579c7f3
PB
3173}
3174
c227f099 3175static uint32_t unassigned_mem_readb(void *opaque, target_phys_addr_t addr)
33417e70 3176{
67d3b957 3177#ifdef DEBUG_UNASSIGNED
ab3d1727 3178 printf("Unassigned mem read " TARGET_FMT_plx "\n", addr);
b4f0a316 3179#endif
faed1c2a 3180#if defined(TARGET_SPARC) || defined(TARGET_MICROBLAZE)
e18231a3
BS
3181 do_unassigned_access(addr, 0, 0, 0, 1);
3182#endif
3183 return 0;
3184}
3185
c227f099 3186static uint32_t unassigned_mem_readw(void *opaque, target_phys_addr_t addr)
e18231a3
BS
3187{
3188#ifdef DEBUG_UNASSIGNED
3189 printf("Unassigned mem read " TARGET_FMT_plx "\n", addr);
3190#endif
faed1c2a 3191#if defined(TARGET_SPARC) || defined(TARGET_MICROBLAZE)
e18231a3
BS
3192 do_unassigned_access(addr, 0, 0, 0, 2);
3193#endif
3194 return 0;
3195}
3196
c227f099 3197static uint32_t unassigned_mem_readl(void *opaque, target_phys_addr_t addr)
e18231a3
BS
3198{
3199#ifdef DEBUG_UNASSIGNED
3200 printf("Unassigned mem read " TARGET_FMT_plx "\n", addr);
3201#endif
faed1c2a 3202#if defined(TARGET_SPARC) || defined(TARGET_MICROBLAZE)
e18231a3 3203 do_unassigned_access(addr, 0, 0, 0, 4);
67d3b957 3204#endif
33417e70
FB
3205 return 0;
3206}
3207
c227f099 3208static void unassigned_mem_writeb(void *opaque, target_phys_addr_t addr, uint32_t val)
33417e70 3209{
67d3b957 3210#ifdef DEBUG_UNASSIGNED
ab3d1727 3211 printf("Unassigned mem write " TARGET_FMT_plx " = 0x%x\n", addr, val);
67d3b957 3212#endif
faed1c2a 3213#if defined(TARGET_SPARC) || defined(TARGET_MICROBLAZE)
e18231a3
BS
3214 do_unassigned_access(addr, 1, 0, 0, 1);
3215#endif
3216}
3217
c227f099 3218static void unassigned_mem_writew(void *opaque, target_phys_addr_t addr, uint32_t val)
e18231a3
BS
3219{
3220#ifdef DEBUG_UNASSIGNED
3221 printf("Unassigned mem write " TARGET_FMT_plx " = 0x%x\n", addr, val);
3222#endif
faed1c2a 3223#if defined(TARGET_SPARC) || defined(TARGET_MICROBLAZE)
e18231a3
BS
3224 do_unassigned_access(addr, 1, 0, 0, 2);
3225#endif
3226}
3227
c227f099 3228static void unassigned_mem_writel(void *opaque, target_phys_addr_t addr, uint32_t val)
e18231a3
BS
3229{
3230#ifdef DEBUG_UNASSIGNED
3231 printf("Unassigned mem write " TARGET_FMT_plx " = 0x%x\n", addr, val);
3232#endif
faed1c2a 3233#if defined(TARGET_SPARC) || defined(TARGET_MICROBLAZE)
e18231a3 3234 do_unassigned_access(addr, 1, 0, 0, 4);
b4f0a316 3235#endif
33417e70
FB
3236}
3237
d60efc6b 3238static CPUReadMemoryFunc * const unassigned_mem_read[3] = {
33417e70 3239 unassigned_mem_readb,
e18231a3
BS
3240 unassigned_mem_readw,
3241 unassigned_mem_readl,
33417e70
FB
3242};
3243
d60efc6b 3244static CPUWriteMemoryFunc * const unassigned_mem_write[3] = {
33417e70 3245 unassigned_mem_writeb,
e18231a3
BS
3246 unassigned_mem_writew,
3247 unassigned_mem_writel,
33417e70
FB
3248};
3249
c227f099 3250static void notdirty_mem_writeb(void *opaque, target_phys_addr_t ram_addr,
0f459d16 3251 uint32_t val)
9fa3e853 3252{
3a7d929e 3253 int dirty_flags;
f7c11b53 3254 dirty_flags = cpu_physical_memory_get_dirty_flags(ram_addr);
3a7d929e 3255 if (!(dirty_flags & CODE_DIRTY_FLAG)) {
9fa3e853 3256#if !defined(CONFIG_USER_ONLY)
3a7d929e 3257 tb_invalidate_phys_page_fast(ram_addr, 1);
f7c11b53 3258 dirty_flags = cpu_physical_memory_get_dirty_flags(ram_addr);
9fa3e853 3259#endif
3a7d929e 3260 }
5579c7f3 3261 stb_p(qemu_get_ram_ptr(ram_addr), val);
f23db169 3262 dirty_flags |= (0xff & ~CODE_DIRTY_FLAG);
f7c11b53 3263 cpu_physical_memory_set_dirty_flags(ram_addr, dirty_flags);
f23db169
FB
3264 /* we remove the notdirty callback only if the code has been
3265 flushed */
3266 if (dirty_flags == 0xff)
2e70f6ef 3267 tlb_set_dirty(cpu_single_env, cpu_single_env->mem_io_vaddr);
9fa3e853
FB
3268}
3269
c227f099 3270static void notdirty_mem_writew(void *opaque, target_phys_addr_t ram_addr,
0f459d16 3271 uint32_t val)
9fa3e853 3272{
3a7d929e 3273 int dirty_flags;
f7c11b53 3274 dirty_flags = cpu_physical_memory_get_dirty_flags(ram_addr);
3a7d929e 3275 if (!(dirty_flags & CODE_DIRTY_FLAG)) {
9fa3e853 3276#if !defined(CONFIG_USER_ONLY)
3a7d929e 3277 tb_invalidate_phys_page_fast(ram_addr, 2);
f7c11b53 3278 dirty_flags = cpu_physical_memory_get_dirty_flags(ram_addr);
9fa3e853 3279#endif
3a7d929e 3280 }
5579c7f3 3281 stw_p(qemu_get_ram_ptr(ram_addr), val);
f23db169 3282 dirty_flags |= (0xff & ~CODE_DIRTY_FLAG);
f7c11b53 3283 cpu_physical_memory_set_dirty_flags(ram_addr, dirty_flags);
f23db169
FB
3284 /* we remove the notdirty callback only if the code has been
3285 flushed */
3286 if (dirty_flags == 0xff)
2e70f6ef 3287 tlb_set_dirty(cpu_single_env, cpu_single_env->mem_io_vaddr);
9fa3e853
FB
3288}
3289
c227f099 3290static void notdirty_mem_writel(void *opaque, target_phys_addr_t ram_addr,
0f459d16 3291 uint32_t val)
9fa3e853 3292{
3a7d929e 3293 int dirty_flags;
f7c11b53 3294 dirty_flags = cpu_physical_memory_get_dirty_flags(ram_addr);
3a7d929e 3295 if (!(dirty_flags & CODE_DIRTY_FLAG)) {
9fa3e853 3296#if !defined(CONFIG_USER_ONLY)
3a7d929e 3297 tb_invalidate_phys_page_fast(ram_addr, 4);
f7c11b53 3298 dirty_flags = cpu_physical_memory_get_dirty_flags(ram_addr);
9fa3e853 3299#endif
3a7d929e 3300 }
5579c7f3 3301 stl_p(qemu_get_ram_ptr(ram_addr), val);
f23db169 3302 dirty_flags |= (0xff & ~CODE_DIRTY_FLAG);
f7c11b53 3303 cpu_physical_memory_set_dirty_flags(ram_addr, dirty_flags);
f23db169
FB
3304 /* we remove the notdirty callback only if the code has been
3305 flushed */
3306 if (dirty_flags == 0xff)
2e70f6ef 3307 tlb_set_dirty(cpu_single_env, cpu_single_env->mem_io_vaddr);
9fa3e853
FB
3308}
3309
d60efc6b 3310static CPUReadMemoryFunc * const error_mem_read[3] = {
9fa3e853
FB
3311 NULL, /* never used */
3312 NULL, /* never used */
3313 NULL, /* never used */
3314};
3315
d60efc6b 3316static CPUWriteMemoryFunc * const notdirty_mem_write[3] = {
1ccde1cb
FB
3317 notdirty_mem_writeb,
3318 notdirty_mem_writew,
3319 notdirty_mem_writel,
3320};
3321
0f459d16 3322/* Generate a debug exception if a watchpoint has been hit. */
b4051334 3323static void check_watchpoint(int offset, int len_mask, int flags)
0f459d16
PB
3324{
3325 CPUState *env = cpu_single_env;
06d55cc1
AL
3326 target_ulong pc, cs_base;
3327 TranslationBlock *tb;
0f459d16 3328 target_ulong vaddr;
a1d1bb31 3329 CPUWatchpoint *wp;
06d55cc1 3330 int cpu_flags;
0f459d16 3331
06d55cc1
AL
3332 if (env->watchpoint_hit) {
3333 /* We re-entered the check after replacing the TB. Now raise
 3334 * the debug interrupt so that it will trigger after the
3335 * current instruction. */
3336 cpu_interrupt(env, CPU_INTERRUPT_DEBUG);
3337 return;
3338 }
2e70f6ef 3339 vaddr = (env->mem_io_vaddr & TARGET_PAGE_MASK) + offset;
72cf2d4f 3340 QTAILQ_FOREACH(wp, &env->watchpoints, entry) {
b4051334
AL
3341 if ((vaddr == (wp->vaddr & len_mask) ||
3342 (vaddr & wp->len_mask) == wp->vaddr) && (wp->flags & flags)) {
6e140f28
AL
3343 wp->flags |= BP_WATCHPOINT_HIT;
3344 if (!env->watchpoint_hit) {
3345 env->watchpoint_hit = wp;
3346 tb = tb_find_pc(env->mem_io_pc);
3347 if (!tb) {
3348 cpu_abort(env, "check_watchpoint: could not find TB for "
3349 "pc=%p", (void *)env->mem_io_pc);
3350 }
618ba8e6 3351 cpu_restore_state(tb, env, env->mem_io_pc);
6e140f28
AL
3352 tb_phys_invalidate(tb, -1);
3353 if (wp->flags & BP_STOP_BEFORE_ACCESS) {
3354 env->exception_index = EXCP_DEBUG;
3355 } else {
3356 cpu_get_tb_cpu_state(env, &pc, &cs_base, &cpu_flags);
3357 tb_gen_code(env, pc, cs_base, cpu_flags, 1);
3358 }
3359 cpu_resume_from_signal(env, NULL);
06d55cc1 3360 }
6e140f28
AL
3361 } else {
3362 wp->flags &= ~BP_WATCHPOINT_HIT;
0f459d16
PB
3363 }
3364 }
3365}
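/* Matching example (assumed watchpoint): for wp->vaddr 0x1004 with
 * wp->len_mask ~0x3 (a 4-byte watchpoint), a 4-byte access at 0x1004 hits
 * via the first test (0x1004 == (0x1004 & ~0x3)), and a 1-byte access at
 * 0x1006 hits via the second ((0x1006 & ~0x3) == 0x1004).
 */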
3366
6658ffb8
PB
3367/* Watchpoint access routines. Watchpoints are inserted using TLB tricks,
3368 so these check for a hit then pass through to the normal out-of-line
3369 phys routines. */
c227f099 3370static uint32_t watch_mem_readb(void *opaque, target_phys_addr_t addr)
6658ffb8 3371{
b4051334 3372 check_watchpoint(addr & ~TARGET_PAGE_MASK, ~0x0, BP_MEM_READ);
6658ffb8
PB
3373 return ldub_phys(addr);
3374}
3375
c227f099 3376static uint32_t watch_mem_readw(void *opaque, target_phys_addr_t addr)
6658ffb8 3377{
b4051334 3378 check_watchpoint(addr & ~TARGET_PAGE_MASK, ~0x1, BP_MEM_READ);
6658ffb8
PB
3379 return lduw_phys(addr);
3380}
3381
c227f099 3382static uint32_t watch_mem_readl(void *opaque, target_phys_addr_t addr)
6658ffb8 3383{
b4051334 3384 check_watchpoint(addr & ~TARGET_PAGE_MASK, ~0x3, BP_MEM_READ);
6658ffb8
PB
3385 return ldl_phys(addr);
3386}
3387
c227f099 3388static void watch_mem_writeb(void *opaque, target_phys_addr_t addr,
6658ffb8
PB
3389 uint32_t val)
3390{
b4051334 3391 check_watchpoint(addr & ~TARGET_PAGE_MASK, ~0x0, BP_MEM_WRITE);
6658ffb8
PB
3392 stb_phys(addr, val);
3393}
3394
c227f099 3395static void watch_mem_writew(void *opaque, target_phys_addr_t addr,
6658ffb8
PB
3396 uint32_t val)
3397{
b4051334 3398 check_watchpoint(addr & ~TARGET_PAGE_MASK, ~0x1, BP_MEM_WRITE);
6658ffb8
PB
3399 stw_phys(addr, val);
3400}
3401
c227f099 3402static void watch_mem_writel(void *opaque, target_phys_addr_t addr,
6658ffb8
PB
3403 uint32_t val)
3404{
b4051334 3405 check_watchpoint(addr & ~TARGET_PAGE_MASK, ~0x3, BP_MEM_WRITE);
6658ffb8
PB
3406 stl_phys(addr, val);
3407}
3408
d60efc6b 3409static CPUReadMemoryFunc * const watch_mem_read[3] = {
6658ffb8
PB
3410 watch_mem_readb,
3411 watch_mem_readw,
3412 watch_mem_readl,
3413};
3414
d60efc6b 3415static CPUWriteMemoryFunc * const watch_mem_write[3] = {
6658ffb8
PB
3416 watch_mem_writeb,
3417 watch_mem_writew,
3418 watch_mem_writel,
3419};
6658ffb8 3420
f6405247
RH
3421static inline uint32_t subpage_readlen (subpage_t *mmio,
3422 target_phys_addr_t addr,
3423 unsigned int len)
db7b5426 3424{
f6405247 3425 unsigned int idx = SUBPAGE_IDX(addr);
db7b5426
BS
3426#if defined(DEBUG_SUBPAGE)
3427 printf("%s: subpage %p len %d addr " TARGET_FMT_plx " idx %d\n", __func__,
3428 mmio, len, addr, idx);
3429#endif
db7b5426 3430
f6405247
RH
3431 addr += mmio->region_offset[idx];
3432 idx = mmio->sub_io_index[idx];
3433 return io_mem_read[idx][len](io_mem_opaque[idx], addr);
db7b5426
BS
3434}
3435
c227f099 3436static inline void subpage_writelen (subpage_t *mmio, target_phys_addr_t addr,
f6405247 3437 uint32_t value, unsigned int len)
db7b5426 3438{
f6405247 3439 unsigned int idx = SUBPAGE_IDX(addr);
db7b5426 3440#if defined(DEBUG_SUBPAGE)
f6405247
RH
3441 printf("%s: subpage %p len %d addr " TARGET_FMT_plx " idx %d value %08x\n",
3442 __func__, mmio, len, addr, idx, value);
db7b5426 3443#endif
f6405247
RH
3444
3445 addr += mmio->region_offset[idx];
3446 idx = mmio->sub_io_index[idx];
3447 io_mem_write[idx][len](io_mem_opaque[idx], addr, value);
db7b5426
BS
3448}
3449
c227f099 3450static uint32_t subpage_readb (void *opaque, target_phys_addr_t addr)
db7b5426 3451{
db7b5426
BS
3452 return subpage_readlen(opaque, addr, 0);
3453}
3454
c227f099 3455static void subpage_writeb (void *opaque, target_phys_addr_t addr,
db7b5426
BS
3456 uint32_t value)
3457{
db7b5426
BS
3458 subpage_writelen(opaque, addr, value, 0);
3459}
3460
c227f099 3461static uint32_t subpage_readw (void *opaque, target_phys_addr_t addr)
db7b5426 3462{
db7b5426
BS
3463 return subpage_readlen(opaque, addr, 1);
3464}
3465
c227f099 3466static void subpage_writew (void *opaque, target_phys_addr_t addr,
db7b5426
BS
3467 uint32_t value)
3468{
db7b5426
BS
3469 subpage_writelen(opaque, addr, value, 1);
3470}
3471
c227f099 3472static uint32_t subpage_readl (void *opaque, target_phys_addr_t addr)
db7b5426 3473{
db7b5426
BS
3474 return subpage_readlen(opaque, addr, 2);
3475}
3476
f6405247
RH
3477static void subpage_writel (void *opaque, target_phys_addr_t addr,
3478 uint32_t value)
db7b5426 3479{
db7b5426
BS
3480 subpage_writelen(opaque, addr, value, 2);
3481}
3482
d60efc6b 3483static CPUReadMemoryFunc * const subpage_read[] = {
db7b5426
BS
3484 &subpage_readb,
3485 &subpage_readw,
3486 &subpage_readl,
3487};
3488
d60efc6b 3489static CPUWriteMemoryFunc * const subpage_write[] = {
db7b5426
BS
3490 &subpage_writeb,
3491 &subpage_writew,
3492 &subpage_writel,
3493};
3494
c227f099
AL
3495static int subpage_register (subpage_t *mmio, uint32_t start, uint32_t end,
3496 ram_addr_t memory, ram_addr_t region_offset)
db7b5426
BS
3497{
3498 int idx, eidx;
3499
3500 if (start >= TARGET_PAGE_SIZE || end >= TARGET_PAGE_SIZE)
3501 return -1;
3502 idx = SUBPAGE_IDX(start);
3503 eidx = SUBPAGE_IDX(end);
3504#if defined(DEBUG_SUBPAGE)
0bf9e31a 3505 printf("%s: %p start %08x end %08x idx %08x eidx %08x mem %ld\n", __func__,
db7b5426
BS
3506 mmio, start, end, idx, eidx, memory);
3507#endif
95c318f5
GN
3508 if ((memory & ~TARGET_PAGE_MASK) == IO_MEM_RAM)
3509 memory = IO_MEM_UNASSIGNED;
f6405247 3510 memory = (memory >> IO_MEM_SHIFT) & (IO_MEM_NB_ENTRIES - 1);
db7b5426 3511 for (; idx <= eidx; idx++) {
f6405247
RH
3512 mmio->sub_io_index[idx] = memory;
3513 mmio->region_offset[idx] = region_offset;
db7b5426
BS
3514 }
3515
3516 return 0;
3517}
3518
f6405247
RH
3519static subpage_t *subpage_init (target_phys_addr_t base, ram_addr_t *phys,
3520 ram_addr_t orig_memory,
3521 ram_addr_t region_offset)
db7b5426 3522{
c227f099 3523 subpage_t *mmio;
db7b5426
BS
3524 int subpage_memory;
3525
c227f099 3526 mmio = qemu_mallocz(sizeof(subpage_t));
1eec614b
AL
3527
3528 mmio->base = base;
2507c12a
AG
3529 subpage_memory = cpu_register_io_memory(subpage_read, subpage_write, mmio,
3530 DEVICE_NATIVE_ENDIAN);
db7b5426 3531#if defined(DEBUG_SUBPAGE)
1eec614b
AL
3532 printf("%s: %p base " TARGET_FMT_plx " len %08x %d\n", __func__,
3533 mmio, base, TARGET_PAGE_SIZE, subpage_memory);
db7b5426 3534#endif
1eec614b 3535 *phys = subpage_memory | IO_MEM_SUBPAGE;
f6405247 3536 subpage_register(mmio, 0, TARGET_PAGE_SIZE-1, orig_memory, region_offset);
db7b5426
BS
3537
3538 return mmio;
3539}
3540
88715657
AL
3541static int get_free_io_mem_idx(void)
3542{
3543 int i;
3544
3545 for (i = 0; i<IO_MEM_NB_ENTRIES; i++)
3546 if (!io_mem_used[i]) {
3547 io_mem_used[i] = 1;
3548 return i;
3549 }
c6703b47 3550 fprintf(stderr, "Ran out of io_mem_idx entries, max %d!\n", IO_MEM_NB_ENTRIES);
88715657
AL
3551 return -1;
3552}
3553
dd310534
AG
3554/*
 3555 * Most devices operate in little-endian mode, but big-endian devices
 3556 * exist as well. A device gets byte-swapped MMIO if it is plugged
 3557 * into a CPU of the opposite endianness.
3558 *
3559 * CPU Device swap?
3560 *
3561 * little little no
3562 * little big yes
3563 * big little yes
3564 * big big no
3565 */
3566
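/* A compact restatement of the table above (illustrative sketch only;
   mmio_needs_bswap is a hypothetical helper, not part of this file, and
   assumes the device_endian enum from the headers): a byte swap is
   needed exactly when device and target byte order differ, mirroring
   the switch in cpu_register_io_memory_fixed() further down. */
static inline int mmio_needs_bswap(enum device_endian endian)
{
#ifdef TARGET_WORDS_BIGENDIAN
    return endian == DEVICE_LITTLE_ENDIAN;  /* big-endian target */
#else
    return endian == DEVICE_BIG_ENDIAN;     /* little-endian target */
#endif
}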
3567typedef struct SwapEndianContainer {
3568 CPUReadMemoryFunc *read[3];
3569 CPUWriteMemoryFunc *write[3];
3570 void *opaque;
3571} SwapEndianContainer;
3572
3573static uint32_t swapendian_mem_readb (void *opaque, target_phys_addr_t addr)
3574{
3575 uint32_t val;
3576 SwapEndianContainer *c = opaque;
3577 val = c->read[0](c->opaque, addr);
3578 return val;
3579}
3580
3581static uint32_t swapendian_mem_readw(void *opaque, target_phys_addr_t addr)
3582{
3583 uint32_t val;
3584 SwapEndianContainer *c = opaque;
3585 val = bswap16(c->read[1](c->opaque, addr));
3586 return val;
3587}
3588
3589static uint32_t swapendian_mem_readl(void *opaque, target_phys_addr_t addr)
3590{
3591 uint32_t val;
3592 SwapEndianContainer *c = opaque;
3593 val = bswap32(c->read[2](c->opaque, addr));
3594 return val;
3595}
3596
3597static CPUReadMemoryFunc * const swapendian_readfn[3]={
3598 swapendian_mem_readb,
3599 swapendian_mem_readw,
3600 swapendian_mem_readl
3601};
3602
3603static void swapendian_mem_writeb(void *opaque, target_phys_addr_t addr,
3604 uint32_t val)
3605{
3606 SwapEndianContainer *c = opaque;
3607 c->write[0](c->opaque, addr, val);
3608}
3609
3610static void swapendian_mem_writew(void *opaque, target_phys_addr_t addr,
3611 uint32_t val)
3612{
3613 SwapEndianContainer *c = opaque;
3614 c->write[1](c->opaque, addr, bswap16(val));
3615}
3616
3617static void swapendian_mem_writel(void *opaque, target_phys_addr_t addr,
3618 uint32_t val)
3619{
3620 SwapEndianContainer *c = opaque;
3621 c->write[2](c->opaque, addr, bswap32(val));
3622}
3623
3624static CPUWriteMemoryFunc * const swapendian_writefn[3]={
3625 swapendian_mem_writeb,
3626 swapendian_mem_writew,
3627 swapendian_mem_writel
3628};
3629
3630static void swapendian_init(int io_index)
3631{
3632 SwapEndianContainer *c = qemu_malloc(sizeof(SwapEndianContainer));
3633 int i;
3634
3635 /* Swap mmio for big endian targets */
3636 c->opaque = io_mem_opaque[io_index];
3637 for (i = 0; i < 3; i++) {
3638 c->read[i] = io_mem_read[io_index][i];
3639 c->write[i] = io_mem_write[io_index][i];
3640
3641 io_mem_read[io_index][i] = swapendian_readfn[i];
3642 io_mem_write[io_index][i] = swapendian_writefn[i];
3643 }
3644 io_mem_opaque[io_index] = c;
3645}
3646
3647static void swapendian_del(int io_index)
3648{
3649 if (io_mem_read[io_index][0] == swapendian_readfn[0]) {
3650 qemu_free(io_mem_opaque[io_index]);
3651 }
3652}
3653
33417e70
FB
 3654/* mem_read and mem_write are arrays of functions that access a byte
 3655 (index 0), a word (index 1) and a dword (index
0b4e6e3e 3656 2); a NULL pointer falls back to the unassigned handlers.
3ee89922 3657 If io_index is non-zero, the corresponding I/O zone is
4254fab8
BS
 3658 modified; if it is zero, a new I/O zone is allocated. The return
 3659 value can be used with cpu_register_physical_memory(); -1 is
 3660 returned on error. See the usage sketch below. */
1eed09cb 3661static int cpu_register_io_memory_fixed(int io_index,
d60efc6b
BS
3662 CPUReadMemoryFunc * const *mem_read,
3663 CPUWriteMemoryFunc * const *mem_write,
dd310534 3664 void *opaque, enum device_endian endian)
33417e70 3665{
3cab721d
RH
3666 int i;
3667
33417e70 3668 if (io_index <= 0) {
88715657
AL
3669 io_index = get_free_io_mem_idx();
3670 if (io_index == -1)
3671 return io_index;
33417e70 3672 } else {
1eed09cb 3673 io_index >>= IO_MEM_SHIFT;
33417e70
FB
3674 if (io_index >= IO_MEM_NB_ENTRIES)
3675 return -1;
3676 }
b5ff1b31 3677
3cab721d
RH
3678 for (i = 0; i < 3; ++i) {
3679 io_mem_read[io_index][i]
3680 = (mem_read[i] ? mem_read[i] : unassigned_mem_read[i]);
3681 }
3682 for (i = 0; i < 3; ++i) {
3683 io_mem_write[io_index][i]
3684 = (mem_write[i] ? mem_write[i] : unassigned_mem_write[i]);
3685 }
a4193c8a 3686 io_mem_opaque[io_index] = opaque;
f6405247 3687
dd310534
AG
3688 switch (endian) {
3689 case DEVICE_BIG_ENDIAN:
3690#ifndef TARGET_WORDS_BIGENDIAN
3691 swapendian_init(io_index);
3692#endif
3693 break;
3694 case DEVICE_LITTLE_ENDIAN:
3695#ifdef TARGET_WORDS_BIGENDIAN
3696 swapendian_init(io_index);
3697#endif
3698 break;
3699 case DEVICE_NATIVE_ENDIAN:
3700 default:
3701 break;
3702 }
3703
f6405247 3704 return (io_index << IO_MEM_SHIFT);
33417e70 3705}
61382a50 3706
d60efc6b
BS
3707int cpu_register_io_memory(CPUReadMemoryFunc * const *mem_read,
3708 CPUWriteMemoryFunc * const *mem_write,
dd310534 3709 void *opaque, enum device_endian endian)
1eed09cb 3710{
2507c12a 3711 return cpu_register_io_memory_fixed(0, mem_read, mem_write, opaque, endian);
1eed09cb
AK
3712}
3713
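/* Usage sketch (hedged; MyDevState, the mydev_* names and the 0xfe000000
   address are hypothetical, not from this file): registering a device
   MMIO region and mapping it into the physical address space. NULL
   entries in the function tables fall back to the unassigned handlers,
   as described in the comment above cpu_register_io_memory_fixed(). */
typedef struct MyDevState {
    uint32_t reg;                            /* a single 32-bit register */
} MyDevState;

static uint32_t mydev_readl(void *opaque, target_phys_addr_t addr)
{
    MyDevState *s = opaque;
    return s->reg;
}

static void mydev_writel(void *opaque, target_phys_addr_t addr, uint32_t val)
{
    MyDevState *s = opaque;
    s->reg = val;
}

static CPUReadMemoryFunc * const mydev_read[3] = {
    NULL, NULL, mydev_readl,                 /* dword access only */
};

static CPUWriteMemoryFunc * const mydev_write[3] = {
    NULL, NULL, mydev_writel,
};

static void mydev_map(MyDevState *s)
{
    int io = cpu_register_io_memory(mydev_read, mydev_write, s,
                                    DEVICE_LITTLE_ENDIAN);
    cpu_register_physical_memory(0xfe000000, TARGET_PAGE_SIZE, io);
}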
88715657
AL
3714void cpu_unregister_io_memory(int io_table_address)
3715{
3716 int i;
3717 int io_index = io_table_address >> IO_MEM_SHIFT;
3718
dd310534
AG
3719 swapendian_del(io_index);
3720
88715657
AL
3721 for (i=0;i < 3; i++) {
3722 io_mem_read[io_index][i] = unassigned_mem_read[i];
3723 io_mem_write[io_index][i] = unassigned_mem_write[i];
3724 }
3725 io_mem_opaque[io_index] = NULL;
3726 io_mem_used[io_index] = 0;
3727}
3728
e9179ce1
AK
3729static void io_mem_init(void)
3730{
3731 int i;
3732
2507c12a
AG
3733 cpu_register_io_memory_fixed(IO_MEM_ROM, error_mem_read,
3734 unassigned_mem_write, NULL,
3735 DEVICE_NATIVE_ENDIAN);
3736 cpu_register_io_memory_fixed(IO_MEM_UNASSIGNED, unassigned_mem_read,
3737 unassigned_mem_write, NULL,
3738 DEVICE_NATIVE_ENDIAN);
3739 cpu_register_io_memory_fixed(IO_MEM_NOTDIRTY, error_mem_read,
3740 notdirty_mem_write, NULL,
3741 DEVICE_NATIVE_ENDIAN);
e9179ce1
AK
3742 for (i=0; i<5; i++)
3743 io_mem_used[i] = 1;
3744
3745 io_mem_watch = cpu_register_io_memory(watch_mem_read,
2507c12a
AG
3746 watch_mem_write, NULL,
3747 DEVICE_NATIVE_ENDIAN);
e9179ce1
AK
3748}
3749
e2eef170
PB
3750#endif /* !defined(CONFIG_USER_ONLY) */
3751
13eb76e0
FB
3752/* physical memory access (slow version, mainly for debug) */
3753#if defined(CONFIG_USER_ONLY)
a68fe89c
PB
3754int cpu_memory_rw_debug(CPUState *env, target_ulong addr,
3755 uint8_t *buf, int len, int is_write)
13eb76e0
FB
3756{
3757 int l, flags;
3758 target_ulong page;
53a5960a 3759 void * p;
13eb76e0
FB
3760
3761 while (len > 0) {
3762 page = addr & TARGET_PAGE_MASK;
3763 l = (page + TARGET_PAGE_SIZE) - addr;
3764 if (l > len)
3765 l = len;
3766 flags = page_get_flags(page);
3767 if (!(flags & PAGE_VALID))
a68fe89c 3768 return -1;
13eb76e0
FB
3769 if (is_write) {
3770 if (!(flags & PAGE_WRITE))
a68fe89c 3771 return -1;
579a97f7 3772 /* XXX: this code should not depend on lock_user */
72fb7daa 3773 if (!(p = lock_user(VERIFY_WRITE, addr, l, 0)))
a68fe89c 3774 return -1;
72fb7daa
AJ
3775 memcpy(p, buf, l);
3776 unlock_user(p, addr, l);
13eb76e0
FB
3777 } else {
3778 if (!(flags & PAGE_READ))
a68fe89c 3779 return -1;
579a97f7 3780 /* XXX: this code should not depend on lock_user */
72fb7daa 3781 if (!(p = lock_user(VERIFY_READ, addr, l, 1)))
a68fe89c 3782 return -1;
72fb7daa 3783 memcpy(buf, p, l);
5b257578 3784 unlock_user(p, addr, 0);
13eb76e0
FB
3785 }
3786 len -= l;
3787 buf += l;
3788 addr += l;
3789 }
a68fe89c 3790 return 0;
13eb76e0 3791}
8df1cd07 3792
13eb76e0 3793#else
c227f099 3794void cpu_physical_memory_rw(target_phys_addr_t addr, uint8_t *buf,
13eb76e0
FB
3795 int len, int is_write)
3796{
3797 int l, io_index;
3798 uint8_t *ptr;
3799 uint32_t val;
c227f099 3800 target_phys_addr_t page;
2e12669a 3801 unsigned long pd;
92e873b9 3802 PhysPageDesc *p;
3b46e624 3803
13eb76e0
FB
3804 while (len > 0) {
3805 page = addr & TARGET_PAGE_MASK;
3806 l = (page + TARGET_PAGE_SIZE) - addr;
3807 if (l > len)
3808 l = len;
92e873b9 3809 p = phys_page_find(page >> TARGET_PAGE_BITS);
13eb76e0
FB
3810 if (!p) {
3811 pd = IO_MEM_UNASSIGNED;
3812 } else {
3813 pd = p->phys_offset;
3814 }
3b46e624 3815
13eb76e0 3816 if (is_write) {
3a7d929e 3817 if ((pd & ~TARGET_PAGE_MASK) != IO_MEM_RAM) {
c227f099 3818 target_phys_addr_t addr1 = addr;
13eb76e0 3819 io_index = (pd >> IO_MEM_SHIFT) & (IO_MEM_NB_ENTRIES - 1);
8da3ff18 3820 if (p)
6c2934db 3821 addr1 = (addr & ~TARGET_PAGE_MASK) + p->region_offset;
6a00d601
FB
3822 /* XXX: could force cpu_single_env to NULL to avoid
3823 potential bugs */
6c2934db 3824 if (l >= 4 && ((addr1 & 3) == 0)) {
1c213d19 3825 /* 32 bit write access */
c27004ec 3826 val = ldl_p(buf);
6c2934db 3827 io_mem_write[io_index][2](io_mem_opaque[io_index], addr1, val);
13eb76e0 3828 l = 4;
6c2934db 3829 } else if (l >= 2 && ((addr1 & 1) == 0)) {
1c213d19 3830 /* 16 bit write access */
c27004ec 3831 val = lduw_p(buf);
6c2934db 3832 io_mem_write[io_index][1](io_mem_opaque[io_index], addr1, val);
13eb76e0
FB
3833 l = 2;
3834 } else {
1c213d19 3835 /* 8 bit write access */
c27004ec 3836 val = ldub_p(buf);
6c2934db 3837 io_mem_write[io_index][0](io_mem_opaque[io_index], addr1, val);
13eb76e0
FB
3838 l = 1;
3839 }
3840 } else {
b448f2f3
FB
3841 unsigned long addr1;
3842 addr1 = (pd & TARGET_PAGE_MASK) + (addr & ~TARGET_PAGE_MASK);
13eb76e0 3843 /* RAM case */
5579c7f3 3844 ptr = qemu_get_ram_ptr(addr1);
13eb76e0 3845 memcpy(ptr, buf, l);
3a7d929e
FB
3846 if (!cpu_physical_memory_is_dirty(addr1)) {
3847 /* invalidate code */
3848 tb_invalidate_phys_page_range(addr1, addr1 + l, 0);
3849 /* set dirty bit */
f7c11b53
YT
3850 cpu_physical_memory_set_dirty_flags(
3851 addr1, (0xff & ~CODE_DIRTY_FLAG));
3a7d929e 3852 }
050a0ddf 3853 qemu_put_ram_ptr(ptr);
13eb76e0
FB
3854 }
3855 } else {
5fafdf24 3856 if ((pd & ~TARGET_PAGE_MASK) > IO_MEM_ROM &&
2a4188a3 3857 !(pd & IO_MEM_ROMD)) {
c227f099 3858 target_phys_addr_t addr1 = addr;
13eb76e0
FB
3859 /* I/O case */
3860 io_index = (pd >> IO_MEM_SHIFT) & (IO_MEM_NB_ENTRIES - 1);
8da3ff18 3861 if (p)
6c2934db
AJ
3862 addr1 = (addr & ~TARGET_PAGE_MASK) + p->region_offset;
3863 if (l >= 4 && ((addr1 & 3) == 0)) {
13eb76e0 3864 /* 32 bit read access */
6c2934db 3865 val = io_mem_read[io_index][2](io_mem_opaque[io_index], addr1);
c27004ec 3866 stl_p(buf, val);
13eb76e0 3867 l = 4;
6c2934db 3868 } else if (l >= 2 && ((addr1 & 1) == 0)) {
13eb76e0 3869 /* 16 bit read access */
6c2934db 3870 val = io_mem_read[io_index][1](io_mem_opaque[io_index], addr1);
c27004ec 3871 stw_p(buf, val);
13eb76e0
FB
3872 l = 2;
3873 } else {
1c213d19 3874 /* 8 bit read access */
6c2934db 3875 val = io_mem_read[io_index][0](io_mem_opaque[io_index], addr1);
c27004ec 3876 stb_p(buf, val);
13eb76e0
FB
3877 l = 1;
3878 }
3879 } else {
3880 /* RAM case */
050a0ddf
AP
3881 ptr = qemu_get_ram_ptr(pd & TARGET_PAGE_MASK);
3882 memcpy(buf, ptr + (addr & ~TARGET_PAGE_MASK), l);
3883 qemu_put_ram_ptr(ptr);
13eb76e0
FB
3884 }
3885 }
3886 len -= l;
3887 buf += l;
3888 addr += l;
3889 }
3890}
8df1cd07 3891
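/* Usage sketch (illustrative; read_guest_u32 is a hypothetical helper):
   callers normally go through the cpu_physical_memory_read()/write()
   wrappers used elsewhere in this file rather than calling _rw()
   directly. */
static uint32_t read_guest_u32(target_phys_addr_t addr)
{
    uint8_t buf[4];

    cpu_physical_memory_read(addr, buf, sizeof(buf));
    return ldl_p(buf);                       /* decode in target byte order */
}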
d0ecd2aa 3892/* used for ROM loading: can write to RAM and ROM */
c227f099 3893void cpu_physical_memory_write_rom(target_phys_addr_t addr,
d0ecd2aa
FB
3894 const uint8_t *buf, int len)
3895{
3896 int l;
3897 uint8_t *ptr;
c227f099 3898 target_phys_addr_t page;
d0ecd2aa
FB
3899 unsigned long pd;
3900 PhysPageDesc *p;
3b46e624 3901
d0ecd2aa
FB
3902 while (len > 0) {
3903 page = addr & TARGET_PAGE_MASK;
3904 l = (page + TARGET_PAGE_SIZE) - addr;
3905 if (l > len)
3906 l = len;
3907 p = phys_page_find(page >> TARGET_PAGE_BITS);
3908 if (!p) {
3909 pd = IO_MEM_UNASSIGNED;
3910 } else {
3911 pd = p->phys_offset;
3912 }
3b46e624 3913
d0ecd2aa 3914 if ((pd & ~TARGET_PAGE_MASK) != IO_MEM_RAM &&
2a4188a3
FB
3915 (pd & ~TARGET_PAGE_MASK) != IO_MEM_ROM &&
3916 !(pd & IO_MEM_ROMD)) {
d0ecd2aa
FB
3917 /* do nothing */
3918 } else {
3919 unsigned long addr1;
3920 addr1 = (pd & TARGET_PAGE_MASK) + (addr & ~TARGET_PAGE_MASK);
3921 /* ROM/RAM case */
5579c7f3 3922 ptr = qemu_get_ram_ptr(addr1);
d0ecd2aa 3923 memcpy(ptr, buf, l);
050a0ddf 3924 qemu_put_ram_ptr(ptr);
d0ecd2aa
FB
3925 }
3926 len -= l;
3927 buf += l;
3928 addr += l;
3929 }
3930}
3931
6d16c2f8
AL
3932typedef struct {
3933 void *buffer;
c227f099
AL
3934 target_phys_addr_t addr;
3935 target_phys_addr_t len;
6d16c2f8
AL
3936} BounceBuffer;
3937
3938static BounceBuffer bounce;
3939
ba223c29
AL
3940typedef struct MapClient {
3941 void *opaque;
3942 void (*callback)(void *opaque);
72cf2d4f 3943 QLIST_ENTRY(MapClient) link;
ba223c29
AL
3944} MapClient;
3945
72cf2d4f
BS
3946static QLIST_HEAD(map_client_list, MapClient) map_client_list
3947 = QLIST_HEAD_INITIALIZER(map_client_list);
ba223c29
AL
3948
3949void *cpu_register_map_client(void *opaque, void (*callback)(void *opaque))
3950{
3951 MapClient *client = qemu_malloc(sizeof(*client));
3952
3953 client->opaque = opaque;
3954 client->callback = callback;
72cf2d4f 3955 QLIST_INSERT_HEAD(&map_client_list, client, link);
ba223c29
AL
3956 return client;
3957}
3958
3959void cpu_unregister_map_client(void *_client)
3960{
3961 MapClient *client = (MapClient *)_client;
3962
72cf2d4f 3963 QLIST_REMOVE(client, link);
34d5e948 3964 qemu_free(client);
ba223c29
AL
3965}
3966
3967static void cpu_notify_map_clients(void)
3968{
3969 MapClient *client;
3970
72cf2d4f
BS
3971 while (!QLIST_EMPTY(&map_client_list)) {
3972 client = QLIST_FIRST(&map_client_list);
ba223c29 3973 client->callback(client->opaque);
34d5e948 3974 cpu_unregister_map_client(client);
ba223c29
AL
3975 }
3976}
3977
6d16c2f8
AL
3978/* Map a physical memory region into a host virtual address.
3979 * May map a subset of the requested range, given by and returned in *plen.
3980 * May return NULL if resources needed to perform the mapping are exhausted.
3981 * Use only for reads OR writes - not for read-modify-write operations.
ba223c29
AL
3982 * Use cpu_register_map_client() to know when retrying the map operation is
3983 * likely to succeed.
6d16c2f8 3984 */
c227f099
AL
3985void *cpu_physical_memory_map(target_phys_addr_t addr,
3986 target_phys_addr_t *plen,
6d16c2f8
AL
3987 int is_write)
3988{
c227f099
AL
3989 target_phys_addr_t len = *plen;
3990 target_phys_addr_t done = 0;
6d16c2f8
AL
3991 int l;
3992 uint8_t *ret = NULL;
3993 uint8_t *ptr;
c227f099 3994 target_phys_addr_t page;
6d16c2f8
AL
3995 unsigned long pd;
3996 PhysPageDesc *p;
3997 unsigned long addr1;
3998
3999 while (len > 0) {
4000 page = addr & TARGET_PAGE_MASK;
4001 l = (page + TARGET_PAGE_SIZE) - addr;
4002 if (l > len)
4003 l = len;
4004 p = phys_page_find(page >> TARGET_PAGE_BITS);
4005 if (!p) {
4006 pd = IO_MEM_UNASSIGNED;
4007 } else {
4008 pd = p->phys_offset;
4009 }
4010
4011 if ((pd & ~TARGET_PAGE_MASK) != IO_MEM_RAM) {
4012 if (done || bounce.buffer) {
4013 break;
4014 }
4015 bounce.buffer = qemu_memalign(TARGET_PAGE_SIZE, TARGET_PAGE_SIZE);
4016 bounce.addr = addr;
4017 bounce.len = l;
4018 if (!is_write) {
54f7b4a3 4019 cpu_physical_memory_read(addr, bounce.buffer, l);
6d16c2f8
AL
4020 }
4021 ptr = bounce.buffer;
4022 } else {
4023 addr1 = (pd & TARGET_PAGE_MASK) + (addr & ~TARGET_PAGE_MASK);
5579c7f3 4024 ptr = qemu_get_ram_ptr(addr1);
6d16c2f8
AL
4025 }
4026 if (!done) {
4027 ret = ptr;
4028 } else if (ret + done != ptr) {
4029 break;
4030 }
4031
4032 len -= l;
4033 addr += l;
4034 done += l;
4035 }
4036 *plen = done;
4037 return ret;
4038}
4039
4040/* Unmaps a memory region previously mapped by cpu_physical_memory_map().
4041 * Will also mark the memory as dirty if is_write == 1. access_len gives
4042 * the amount of memory that was actually read or written by the caller.
4043 */
c227f099
AL
4044void cpu_physical_memory_unmap(void *buffer, target_phys_addr_t len,
4045 int is_write, target_phys_addr_t access_len)
6d16c2f8
AL
4046{
4047 if (buffer != bounce.buffer) {
4048 if (is_write) {
e890261f 4049 ram_addr_t addr1 = qemu_ram_addr_from_host_nofail(buffer);
6d16c2f8
AL
4050 while (access_len) {
4051 unsigned l;
4052 l = TARGET_PAGE_SIZE;
4053 if (l > access_len)
4054 l = access_len;
4055 if (!cpu_physical_memory_is_dirty(addr1)) {
4056 /* invalidate code */
4057 tb_invalidate_phys_page_range(addr1, addr1 + l, 0);
4058 /* set dirty bit */
f7c11b53
YT
4059 cpu_physical_memory_set_dirty_flags(
4060 addr1, (0xff & ~CODE_DIRTY_FLAG));
6d16c2f8
AL
4061 }
4062 addr1 += l;
4063 access_len -= l;
4064 }
4065 }
050a0ddf
AP
4066 if (xen_mapcache_enabled()) {
4067 uint8_t *buffer1 = buffer;
4068 uint8_t *end_buffer = buffer + len;
4069
4070 while (buffer1 < end_buffer) {
4071 qemu_put_ram_ptr(buffer1);
4072 buffer1 += TARGET_PAGE_SIZE;
4073 }
4074 }
6d16c2f8
AL
4075 return;
4076 }
4077 if (is_write) {
4078 cpu_physical_memory_write(bounce.addr, bounce.buffer, access_len);
4079 }
f8a83245 4080 qemu_vfree(bounce.buffer);
6d16c2f8 4081 bounce.buffer = NULL;
ba223c29 4082 cpu_notify_map_clients();
6d16c2f8 4083}
d0ecd2aa 4084
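/* Usage sketch (hedged; mydev_dma_read is hypothetical): the typical
   map/access/unmap pattern described above. The mapping may come back
   shorter than requested or fail entirely; real callers fall back to
   cpu_physical_memory_rw() or use cpu_register_map_client() to retry
   once the bounce buffer is free. */
static void mydev_dma_read(target_phys_addr_t guest_addr, uint8_t *dst,
                           target_phys_addr_t size)
{
    target_phys_addr_t plen = size;
    void *host = cpu_physical_memory_map(guest_addr, &plen, 0);

    if (!host) {
        /* bounce buffer busy: take the slow path instead of retrying */
        cpu_physical_memory_read(guest_addr, dst, size);
        return;
    }
    memcpy(dst, host, plen);                 /* plen may be < size */
    cpu_physical_memory_unmap(host, plen, 0, plen);
}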
8df1cd07 4085/* warning: addr must be aligned */
c227f099 4086uint32_t ldl_phys(target_phys_addr_t addr)
8df1cd07
FB
4087{
4088 int io_index;
4089 uint8_t *ptr;
4090 uint32_t val;
4091 unsigned long pd;
4092 PhysPageDesc *p;
4093
4094 p = phys_page_find(addr >> TARGET_PAGE_BITS);
4095 if (!p) {
4096 pd = IO_MEM_UNASSIGNED;
4097 } else {
4098 pd = p->phys_offset;
4099 }
3b46e624 4100
5fafdf24 4101 if ((pd & ~TARGET_PAGE_MASK) > IO_MEM_ROM &&
2a4188a3 4102 !(pd & IO_MEM_ROMD)) {
8df1cd07
FB
4103 /* I/O case */
4104 io_index = (pd >> IO_MEM_SHIFT) & (IO_MEM_NB_ENTRIES - 1);
8da3ff18
PB
4105 if (p)
4106 addr = (addr & ~TARGET_PAGE_MASK) + p->region_offset;
8df1cd07
FB
4107 val = io_mem_read[io_index][2](io_mem_opaque[io_index], addr);
4108 } else {
4109 /* RAM case */
5579c7f3 4110 ptr = qemu_get_ram_ptr(pd & TARGET_PAGE_MASK) +
8df1cd07
FB
4111 (addr & ~TARGET_PAGE_MASK);
4112 val = ldl_p(ptr);
4113 }
4114 return val;
4115}
4116
84b7b8e7 4117/* warning: addr must be aligned */
c227f099 4118uint64_t ldq_phys(target_phys_addr_t addr)
84b7b8e7
FB
4119{
4120 int io_index;
4121 uint8_t *ptr;
4122 uint64_t val;
4123 unsigned long pd;
4124 PhysPageDesc *p;
4125
4126 p = phys_page_find(addr >> TARGET_PAGE_BITS);
4127 if (!p) {
4128 pd = IO_MEM_UNASSIGNED;
4129 } else {
4130 pd = p->phys_offset;
4131 }
3b46e624 4132
2a4188a3
FB
4133 if ((pd & ~TARGET_PAGE_MASK) > IO_MEM_ROM &&
4134 !(pd & IO_MEM_ROMD)) {
84b7b8e7
FB
4135 /* I/O case */
4136 io_index = (pd >> IO_MEM_SHIFT) & (IO_MEM_NB_ENTRIES - 1);
8da3ff18
PB
4137 if (p)
4138 addr = (addr & ~TARGET_PAGE_MASK) + p->region_offset;
84b7b8e7
FB
4139#ifdef TARGET_WORDS_BIGENDIAN
4140 val = (uint64_t)io_mem_read[io_index][2](io_mem_opaque[io_index], addr) << 32;
4141 val |= io_mem_read[io_index][2](io_mem_opaque[io_index], addr + 4);
4142#else
4143 val = io_mem_read[io_index][2](io_mem_opaque[io_index], addr);
4144 val |= (uint64_t)io_mem_read[io_index][2](io_mem_opaque[io_index], addr + 4) << 32;
4145#endif
4146 } else {
4147 /* RAM case */
5579c7f3 4148 ptr = qemu_get_ram_ptr(pd & TARGET_PAGE_MASK) +
84b7b8e7
FB
4149 (addr & ~TARGET_PAGE_MASK);
4150 val = ldq_p(ptr);
4151 }
4152 return val;
4153}
4154
aab33094 4155/* XXX: optimize */
c227f099 4156uint32_t ldub_phys(target_phys_addr_t addr)
aab33094
FB
4157{
4158 uint8_t val;
4159 cpu_physical_memory_read(addr, &val, 1);
4160 return val;
4161}
4162
733f0b02 4163/* warning: addr must be aligned */
c227f099 4164uint32_t lduw_phys(target_phys_addr_t addr)
aab33094 4165{
733f0b02
MT
4166 int io_index;
4167 uint8_t *ptr;
4168 uint64_t val;
4169 unsigned long pd;
4170 PhysPageDesc *p;
4171
4172 p = phys_page_find(addr >> TARGET_PAGE_BITS);
4173 if (!p) {
4174 pd = IO_MEM_UNASSIGNED;
4175 } else {
4176 pd = p->phys_offset;
4177 }
4178
4179 if ((pd & ~TARGET_PAGE_MASK) > IO_MEM_ROM &&
4180 !(pd & IO_MEM_ROMD)) {
4181 /* I/O case */
4182 io_index = (pd >> IO_MEM_SHIFT) & (IO_MEM_NB_ENTRIES - 1);
4183 if (p)
4184 addr = (addr & ~TARGET_PAGE_MASK) + p->region_offset;
4185 val = io_mem_read[io_index][1](io_mem_opaque[io_index], addr);
4186 } else {
4187 /* RAM case */
4188 ptr = qemu_get_ram_ptr(pd & TARGET_PAGE_MASK) +
4189 (addr & ~TARGET_PAGE_MASK);
4190 val = lduw_p(ptr);
4191 }
4192 return val;
aab33094
FB
4193}
4194
8df1cd07
FB
 4195/* warning: addr must be aligned. The ram page is not marked dirty
 4196 and the code inside is not invalidated. This is useful if the dirty
 4197 bits are used to track modified PTEs (see the sketch below). */
c227f099 4198void stl_phys_notdirty(target_phys_addr_t addr, uint32_t val)
8df1cd07
FB
4199{
4200 int io_index;
4201 uint8_t *ptr;
4202 unsigned long pd;
4203 PhysPageDesc *p;
4204
4205 p = phys_page_find(addr >> TARGET_PAGE_BITS);
4206 if (!p) {
4207 pd = IO_MEM_UNASSIGNED;
4208 } else {
4209 pd = p->phys_offset;
4210 }
3b46e624 4211
3a7d929e 4212 if ((pd & ~TARGET_PAGE_MASK) != IO_MEM_RAM) {
8df1cd07 4213 io_index = (pd >> IO_MEM_SHIFT) & (IO_MEM_NB_ENTRIES - 1);
8da3ff18
PB
4214 if (p)
4215 addr = (addr & ~TARGET_PAGE_MASK) + p->region_offset;
8df1cd07
FB
4216 io_mem_write[io_index][2](io_mem_opaque[io_index], addr, val);
4217 } else {
74576198 4218 unsigned long addr1 = (pd & TARGET_PAGE_MASK) + (addr & ~TARGET_PAGE_MASK);
5579c7f3 4219 ptr = qemu_get_ram_ptr(addr1);
8df1cd07 4220 stl_p(ptr, val);
74576198
AL
4221
4222 if (unlikely(in_migration)) {
4223 if (!cpu_physical_memory_is_dirty(addr1)) {
4224 /* invalidate code */
4225 tb_invalidate_phys_page_range(addr1, addr1 + 4, 0);
4226 /* set dirty bit */
f7c11b53
YT
4227 cpu_physical_memory_set_dirty_flags(
4228 addr1, (0xff & ~CODE_DIRTY_FLAG));
74576198
AL
4229 }
4230 }
8df1cd07
FB
4231 }
4232}
4233
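/* Sketch of the intended use (mark_pte_accessed is a hypothetical
   helper; 0x20 is the x86 PG_ACCESSED_MASK value, shown only as an
   example): target mmu code updates guest PTE accessed/dirty bits with
   the _notdirty variant so that the store itself does not perturb
   QEMU's dirty tracking for the page. */
static void mark_pte_accessed(target_phys_addr_t pte_addr)
{
    uint32_t pte = ldl_phys(pte_addr);

    stl_phys_notdirty(pte_addr, pte | 0x20 /* accessed bit */);
}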
c227f099 4234void stq_phys_notdirty(target_phys_addr_t addr, uint64_t val)
bc98a7ef
JM
4235{
4236 int io_index;
4237 uint8_t *ptr;
4238 unsigned long pd;
4239 PhysPageDesc *p;
4240
4241 p = phys_page_find(addr >> TARGET_PAGE_BITS);
4242 if (!p) {
4243 pd = IO_MEM_UNASSIGNED;
4244 } else {
4245 pd = p->phys_offset;
4246 }
3b46e624 4247
bc98a7ef
JM
4248 if ((pd & ~TARGET_PAGE_MASK) != IO_MEM_RAM) {
4249 io_index = (pd >> IO_MEM_SHIFT) & (IO_MEM_NB_ENTRIES - 1);
8da3ff18
PB
4250 if (p)
4251 addr = (addr & ~TARGET_PAGE_MASK) + p->region_offset;
bc98a7ef
JM
4252#ifdef TARGET_WORDS_BIGENDIAN
4253 io_mem_write[io_index][2](io_mem_opaque[io_index], addr, val >> 32);
4254 io_mem_write[io_index][2](io_mem_opaque[io_index], addr + 4, val);
4255#else
4256 io_mem_write[io_index][2](io_mem_opaque[io_index], addr, val);
4257 io_mem_write[io_index][2](io_mem_opaque[io_index], addr + 4, val >> 32);
4258#endif
4259 } else {
5579c7f3 4260 ptr = qemu_get_ram_ptr(pd & TARGET_PAGE_MASK) +
bc98a7ef
JM
4261 (addr & ~TARGET_PAGE_MASK);
4262 stq_p(ptr, val);
4263 }
4264}
4265
8df1cd07 4266/* warning: addr must be aligned */
c227f099 4267void stl_phys(target_phys_addr_t addr, uint32_t val)
8df1cd07
FB
4268{
4269 int io_index;
4270 uint8_t *ptr;
4271 unsigned long pd;
4272 PhysPageDesc *p;
4273
4274 p = phys_page_find(addr >> TARGET_PAGE_BITS);
4275 if (!p) {
4276 pd = IO_MEM_UNASSIGNED;
4277 } else {
4278 pd = p->phys_offset;
4279 }
3b46e624 4280
3a7d929e 4281 if ((pd & ~TARGET_PAGE_MASK) != IO_MEM_RAM) {
8df1cd07 4282 io_index = (pd >> IO_MEM_SHIFT) & (IO_MEM_NB_ENTRIES - 1);
8da3ff18
PB
4283 if (p)
4284 addr = (addr & ~TARGET_PAGE_MASK) + p->region_offset;
8df1cd07
FB
4285 io_mem_write[io_index][2](io_mem_opaque[io_index], addr, val);
4286 } else {
4287 unsigned long addr1;
4288 addr1 = (pd & TARGET_PAGE_MASK) + (addr & ~TARGET_PAGE_MASK);
4289 /* RAM case */
5579c7f3 4290 ptr = qemu_get_ram_ptr(addr1);
8df1cd07 4291 stl_p(ptr, val);
3a7d929e
FB
4292 if (!cpu_physical_memory_is_dirty(addr1)) {
4293 /* invalidate code */
4294 tb_invalidate_phys_page_range(addr1, addr1 + 4, 0);
4295 /* set dirty bit */
f7c11b53
YT
4296 cpu_physical_memory_set_dirty_flags(addr1,
4297 (0xff & ~CODE_DIRTY_FLAG));
3a7d929e 4298 }
8df1cd07
FB
4299 }
4300}
4301
aab33094 4302/* XXX: optimize */
c227f099 4303void stb_phys(target_phys_addr_t addr, uint32_t val)
aab33094
FB
4304{
4305 uint8_t v = val;
4306 cpu_physical_memory_write(addr, &v, 1);
4307}
4308
733f0b02 4309/* warning: addr must be aligned */
c227f099 4310void stw_phys(target_phys_addr_t addr, uint32_t val)
aab33094 4311{
733f0b02
MT
4312 int io_index;
4313 uint8_t *ptr;
4314 unsigned long pd;
4315 PhysPageDesc *p;
4316
4317 p = phys_page_find(addr >> TARGET_PAGE_BITS);
4318 if (!p) {
4319 pd = IO_MEM_UNASSIGNED;
4320 } else {
4321 pd = p->phys_offset;
4322 }
4323
4324 if ((pd & ~TARGET_PAGE_MASK) != IO_MEM_RAM) {
4325 io_index = (pd >> IO_MEM_SHIFT) & (IO_MEM_NB_ENTRIES - 1);
4326 if (p)
4327 addr = (addr & ~TARGET_PAGE_MASK) + p->region_offset;
4328 io_mem_write[io_index][1](io_mem_opaque[io_index], addr, val);
4329 } else {
4330 unsigned long addr1;
4331 addr1 = (pd & TARGET_PAGE_MASK) + (addr & ~TARGET_PAGE_MASK);
4332 /* RAM case */
4333 ptr = qemu_get_ram_ptr(addr1);
4334 stw_p(ptr, val);
4335 if (!cpu_physical_memory_is_dirty(addr1)) {
4336 /* invalidate code */
4337 tb_invalidate_phys_page_range(addr1, addr1 + 2, 0);
4338 /* set dirty bit */
4339 cpu_physical_memory_set_dirty_flags(addr1,
4340 (0xff & ~CODE_DIRTY_FLAG));
4341 }
4342 }
aab33094
FB
4343}
4344
4345/* XXX: optimize */
c227f099 4346void stq_phys(target_phys_addr_t addr, uint64_t val)
aab33094
FB
4347{
4348 val = tswap64(val);
71d2b725 4349 cpu_physical_memory_write(addr, &val, 8);
aab33094
FB
4350}
4351
5e2972fd 4352/* virtual memory access for debug (includes writing to ROM) */
5fafdf24 4353int cpu_memory_rw_debug(CPUState *env, target_ulong addr,
b448f2f3 4354 uint8_t *buf, int len, int is_write)
13eb76e0
FB
4355{
4356 int l;
c227f099 4357 target_phys_addr_t phys_addr;
9b3c35e0 4358 target_ulong page;
13eb76e0
FB
4359
4360 while (len > 0) {
4361 page = addr & TARGET_PAGE_MASK;
4362 phys_addr = cpu_get_phys_page_debug(env, page);
4363 /* if no physical page mapped, return an error */
4364 if (phys_addr == -1)
4365 return -1;
4366 l = (page + TARGET_PAGE_SIZE) - addr;
4367 if (l > len)
4368 l = len;
5e2972fd 4369 phys_addr += (addr & ~TARGET_PAGE_MASK);
5e2972fd
AL
4370 if (is_write)
4371 cpu_physical_memory_write_rom(phys_addr, buf, l);
4372 else
5e2972fd 4373 cpu_physical_memory_rw(phys_addr, buf, l, is_write);
13eb76e0
FB
4374 len -= l;
4375 buf += l;
4376 addr += l;
4377 }
4378 return 0;
4379}
a68fe89c 4380#endif
13eb76e0 4381
2e70f6ef
PB
 4382/* in deterministic execution mode, instructions performing device I/O
 4383 must be at the end of the TB */
4384void cpu_io_recompile(CPUState *env, void *retaddr)
4385{
4386 TranslationBlock *tb;
4387 uint32_t n, cflags;
4388 target_ulong pc, cs_base;
4389 uint64_t flags;
4390
4391 tb = tb_find_pc((unsigned long)retaddr);
4392 if (!tb) {
4393 cpu_abort(env, "cpu_io_recompile: could not find TB for pc=%p",
4394 retaddr);
4395 }
4396 n = env->icount_decr.u16.low + tb->icount;
618ba8e6 4397 cpu_restore_state(tb, env, (unsigned long)retaddr);
2e70f6ef 4398 /* Calculate how many instructions had been executed before the fault
bf20dc07 4399 occurred. */
2e70f6ef
PB
4400 n = n - env->icount_decr.u16.low;
4401 /* Generate a new TB ending on the I/O insn. */
4402 n++;
4403 /* On MIPS and SH, delay slot instructions can only be restarted if
4404 they were already the first instruction in the TB. If this is not
bf20dc07 4405 the first instruction in a TB then re-execute the preceding
2e70f6ef
PB
4406 branch. */
4407#if defined(TARGET_MIPS)
4408 if ((env->hflags & MIPS_HFLAG_BMASK) != 0 && n > 1) {
4409 env->active_tc.PC -= 4;
4410 env->icount_decr.u16.low++;
4411 env->hflags &= ~MIPS_HFLAG_BMASK;
4412 }
4413#elif defined(TARGET_SH4)
4414 if ((env->flags & ((DELAY_SLOT | DELAY_SLOT_CONDITIONAL))) != 0
4415 && n > 1) {
4416 env->pc -= 2;
4417 env->icount_decr.u16.low++;
4418 env->flags &= ~(DELAY_SLOT | DELAY_SLOT_CONDITIONAL);
4419 }
4420#endif
4421 /* This should never happen. */
4422 if (n > CF_COUNT_MASK)
4423 cpu_abort(env, "TB too big during recompile");
4424
4425 cflags = n | CF_LAST_IO;
4426 pc = tb->pc;
4427 cs_base = tb->cs_base;
4428 flags = tb->flags;
4429 tb_phys_invalidate(tb, -1);
4430 /* FIXME: In theory this could raise an exception. In practice
4431 we have already translated the block once so it's probably ok. */
4432 tb_gen_code(env, pc, cs_base, flags, cflags);
bf20dc07 4433 /* TODO: If env->pc != tb->pc (i.e. the faulting instruction was not
2e70f6ef
PB
4434 the first in the TB) then we end up generating a whole new TB and
4435 repeating the fault, which is horribly inefficient.
4436 Better would be to execute just this insn uncached, or generate a
4437 second new TB. */
4438 cpu_resume_from_signal(env, NULL);
4439}
4440
b3755a91
PB
4441#if !defined(CONFIG_USER_ONLY)
4442
055403b2 4443void dump_exec_info(FILE *f, fprintf_function cpu_fprintf)
e3db7226
FB
4444{
4445 int i, target_code_size, max_target_code_size;
4446 int direct_jmp_count, direct_jmp2_count, cross_page;
4447 TranslationBlock *tb;
3b46e624 4448
e3db7226
FB
4449 target_code_size = 0;
4450 max_target_code_size = 0;
4451 cross_page = 0;
4452 direct_jmp_count = 0;
4453 direct_jmp2_count = 0;
4454 for(i = 0; i < nb_tbs; i++) {
4455 tb = &tbs[i];
4456 target_code_size += tb->size;
4457 if (tb->size > max_target_code_size)
4458 max_target_code_size = tb->size;
4459 if (tb->page_addr[1] != -1)
4460 cross_page++;
4461 if (tb->tb_next_offset[0] != 0xffff) {
4462 direct_jmp_count++;
4463 if (tb->tb_next_offset[1] != 0xffff) {
4464 direct_jmp2_count++;
4465 }
4466 }
4467 }
4468 /* XXX: avoid using doubles ? */
57fec1fe 4469 cpu_fprintf(f, "Translation buffer state:\n");
055403b2 4470 cpu_fprintf(f, "gen code size %td/%ld\n",
26a5f13b
FB
4471 code_gen_ptr - code_gen_buffer, code_gen_buffer_max_size);
4472 cpu_fprintf(f, "TB count %d/%d\n",
4473 nb_tbs, code_gen_max_blocks);
5fafdf24 4474 cpu_fprintf(f, "TB avg target size %d max=%d bytes\n",
e3db7226
FB
4475 nb_tbs ? target_code_size / nb_tbs : 0,
4476 max_target_code_size);
055403b2 4477 cpu_fprintf(f, "TB avg host size %td bytes (expansion ratio: %0.1f)\n",
e3db7226
FB
4478 nb_tbs ? (code_gen_ptr - code_gen_buffer) / nb_tbs : 0,
4479 target_code_size ? (double) (code_gen_ptr - code_gen_buffer) / target_code_size : 0);
5fafdf24
TS
4480 cpu_fprintf(f, "cross page TB count %d (%d%%)\n",
4481 cross_page,
e3db7226
FB
4482 nb_tbs ? (cross_page * 100) / nb_tbs : 0);
4483 cpu_fprintf(f, "direct jump count %d (%d%%) (2 jumps=%d %d%%)\n",
5fafdf24 4484 direct_jmp_count,
e3db7226
FB
4485 nb_tbs ? (direct_jmp_count * 100) / nb_tbs : 0,
4486 direct_jmp2_count,
4487 nb_tbs ? (direct_jmp2_count * 100) / nb_tbs : 0);
57fec1fe 4488 cpu_fprintf(f, "\nStatistics:\n");
e3db7226
FB
4489 cpu_fprintf(f, "TB flush count %d\n", tb_flush_count);
4490 cpu_fprintf(f, "TB invalidate count %d\n", tb_phys_invalidate_count);
4491 cpu_fprintf(f, "TLB flush count %d\n", tlb_flush_count);
b67d9a52 4492 tcg_dump_info(f, cpu_fprintf);
e3db7226
FB
4493}
4494
61382a50
FB
4495#define MMUSUFFIX _cmmu
4496#define GETPC() NULL
4497#define env cpu_single_env
b769d8fe 4498#define SOFTMMU_CODE_ACCESS
61382a50
FB
4499
4500#define SHIFT 0
4501#include "softmmu_template.h"
4502
4503#define SHIFT 1
4504#include "softmmu_template.h"
4505
4506#define SHIFT 2
4507#include "softmmu_template.h"
4508
4509#define SHIFT 3
4510#include "softmmu_template.h"
4511
4512#undef env
4513
4514#endif