git.proxmox.com Git - mirror_qemu.git/blame - exec.c
54936004 1/*
fd6ce8f6 2 * virtual page mapping and translated block handling
5fafdf24 3 *
54936004
FB
4 * Copyright (c) 2003 Fabrice Bellard
5 *
6 * This library is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2 of the License, or (at your option) any later version.
10 *
11 * This library is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
15 *
16 * You should have received a copy of the GNU Lesser General Public
8167ee88 17 * License along with this library; if not, see <http://www.gnu.org/licenses/>.
54936004 18 */
67b915a5 19#include "config.h"
d5a8f07c
FB
20#ifdef _WIN32
21#include <windows.h>
22#else
a98d49b1 23#include <sys/types.h>
d5a8f07c
FB
24#include <sys/mman.h>
25#endif
54936004 26
055403b2 27#include "qemu-common.h"
6180a181 28#include "cpu.h"
b67d9a52 29#include "tcg.h"
b3c7724c 30#include "hw/hw.h"
cc9e98cb 31#include "hw/qdev.h"
74576198 32#include "osdep.h"
7ba1e619 33#include "kvm.h"
432d268c 34#include "hw/xen.h"
29e922b6 35#include "qemu-timer.h"
62152b8a
AK
36#include "memory.h"
37#include "exec-memory.h"
53a5960a
PB
38#if defined(CONFIG_USER_ONLY)
39#include <qemu.h>
f01576f1
JL
40#if defined(__FreeBSD__) || defined(__FreeBSD_kernel__)
41#include <sys/param.h>
42#if __FreeBSD_version >= 700104
43#define HAVE_KINFO_GETVMMAP
44#define sigqueue sigqueue_freebsd /* avoid redefinition */
45#include <sys/time.h>
46#include <sys/proc.h>
47#include <machine/profile.h>
48#define _KERNEL
49#include <sys/user.h>
50#undef _KERNEL
51#undef sigqueue
52#include <libutil.h>
53#endif
54#endif
432d268c
JN
55#else /* !CONFIG_USER_ONLY */
56#include "xen-mapcache.h"
6506e4f9 57#include "trace.h"
53a5960a 58#endif
54936004 59
fd6ce8f6 60//#define DEBUG_TB_INVALIDATE
66e85a21 61//#define DEBUG_FLUSH
9fa3e853 62//#define DEBUG_TLB
67d3b957 63//#define DEBUG_UNASSIGNED
fd6ce8f6
FB
64
65/* make various TB consistency checks */
5fafdf24
TS
66//#define DEBUG_TB_CHECK
67//#define DEBUG_TLB_CHECK
fd6ce8f6 68
1196be37 69//#define DEBUG_IOPORT
db7b5426 70//#define DEBUG_SUBPAGE
1196be37 71
99773bd4
PB
72#if !defined(CONFIG_USER_ONLY)
73/* TB consistency checks only implemented for usermode emulation. */
74#undef DEBUG_TB_CHECK
75#endif
76
9fa3e853
FB
77#define SMC_BITMAP_USE_THRESHOLD 10
78
bdaf78e0 79static TranslationBlock *tbs;
24ab68ac 80static int code_gen_max_blocks;
9fa3e853 81TranslationBlock *tb_phys_hash[CODE_GEN_PHYS_HASH_SIZE];
bdaf78e0 82static int nb_tbs;
eb51d102 83/* any access to the tbs or the page table must use this lock */
c227f099 84spinlock_t tb_lock = SPIN_LOCK_UNLOCKED;
fd6ce8f6 85
141ac468
BS
86#if defined(__arm__) || defined(__sparc_v9__)
87/* The prologue must be reachable with a direct jump. ARM and Sparc64
88 have limited branch ranges (possibly also PPC) so place it in a
d03d860b
BS
89 section close to code segment. */
90#define code_gen_section \
91 __attribute__((__section__(".gen_code"))) \
92 __attribute__((aligned (32)))
f8e2af11
SW
93#elif defined(_WIN32)
94/* Maximum alignment for Win32 is 16. */
95#define code_gen_section \
96 __attribute__((aligned (16)))
d03d860b
BS
97#else
98#define code_gen_section \
99 __attribute__((aligned (32)))
100#endif
101
102uint8_t code_gen_prologue[1024] code_gen_section;
bdaf78e0
BS
103static uint8_t *code_gen_buffer;
104static unsigned long code_gen_buffer_size;
26a5f13b 105/* threshold to flush the translated code buffer */
bdaf78e0 106static unsigned long code_gen_buffer_max_size;
24ab68ac 107static uint8_t *code_gen_ptr;
fd6ce8f6 108
e2eef170 109#if !defined(CONFIG_USER_ONLY)
9fa3e853 110int phys_ram_fd;
74576198 111static int in_migration;
94a6b54f 112
f471a17e 113RAMList ram_list = { .blocks = QLIST_HEAD_INITIALIZER(ram_list) };
62152b8a
AK
114
115static MemoryRegion *system_memory;
116
e2eef170 117#endif
9fa3e853 118
6a00d601
FB
119CPUState *first_cpu;
120/* current CPU in the current thread. It is only valid inside
121 cpu_exec() */
5fafdf24 122CPUState *cpu_single_env;
2e70f6ef 123/* 0 = Do not count executed instructions.
bf20dc07 124 1 = Precise instruction counting.
2e70f6ef
PB
125 2 = Adaptive rate instruction counting. */
126int use_icount = 0;
127/* Current instruction counter. While executing translated code this may
128 include some instructions that have not yet been executed. */
129int64_t qemu_icount;
6a00d601 130
54936004 131typedef struct PageDesc {
92e873b9 132 /* list of TBs intersecting this ram page */
fd6ce8f6 133 TranslationBlock *first_tb;
9fa3e853
FB
 134 /* in order to optimize self modifying code, we count the number
 135 of code write accesses to a given page and switch to a bitmap once a threshold is reached */
136 unsigned int code_write_count;
137 uint8_t *code_bitmap;
138#if defined(CONFIG_USER_ONLY)
139 unsigned long flags;
140#endif
54936004
FB
141} PageDesc;
142
41c1b1c9 143/* In system mode we want L1_MAP to be based on ram offsets,
5cd2c5b6
RH
144 while in user mode we want it to be based on virtual addresses. */
145#if !defined(CONFIG_USER_ONLY)
41c1b1c9
PB
146#if HOST_LONG_BITS < TARGET_PHYS_ADDR_SPACE_BITS
147# define L1_MAP_ADDR_SPACE_BITS HOST_LONG_BITS
148#else
5cd2c5b6 149# define L1_MAP_ADDR_SPACE_BITS TARGET_PHYS_ADDR_SPACE_BITS
41c1b1c9 150#endif
bedb69ea 151#else
5cd2c5b6 152# define L1_MAP_ADDR_SPACE_BITS TARGET_VIRT_ADDR_SPACE_BITS
bedb69ea 153#endif
54936004 154
5cd2c5b6
RH
155/* Size of the L2 (and L3, etc) page tables. */
156#define L2_BITS 10
54936004
FB
157#define L2_SIZE (1 << L2_BITS)
158
5cd2c5b6
RH
159/* The bits remaining after N lower levels of page tables. */
160#define P_L1_BITS_REM \
161 ((TARGET_PHYS_ADDR_SPACE_BITS - TARGET_PAGE_BITS) % L2_BITS)
162#define V_L1_BITS_REM \
163 ((L1_MAP_ADDR_SPACE_BITS - TARGET_PAGE_BITS) % L2_BITS)
164
165/* Size of the L1 page table. Avoid silly small sizes. */
166#if P_L1_BITS_REM < 4
167#define P_L1_BITS (P_L1_BITS_REM + L2_BITS)
168#else
169#define P_L1_BITS P_L1_BITS_REM
170#endif
171
172#if V_L1_BITS_REM < 4
173#define V_L1_BITS (V_L1_BITS_REM + L2_BITS)
174#else
175#define V_L1_BITS V_L1_BITS_REM
176#endif
177
178#define P_L1_SIZE ((target_phys_addr_t)1 << P_L1_BITS)
179#define V_L1_SIZE ((target_ulong)1 << V_L1_BITS)
180
181#define P_L1_SHIFT (TARGET_PHYS_ADDR_SPACE_BITS - TARGET_PAGE_BITS - P_L1_BITS)
182#define V_L1_SHIFT (L1_MAP_ADDR_SPACE_BITS - TARGET_PAGE_BITS - V_L1_BITS)
183
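/* Worked example (an illustration, assuming a 32-bit guest virtual address
   space and TARGET_PAGE_BITS == 12): V_L1_BITS_REM = (32 - 12) % 10 == 0,
   so V_L1_BITS is widened to 10 and V_L1_SHIFT is 10.  l1_map is then a
   1024-entry table indexed by address bits [31..22], and each entry points
   directly to a 1024-entry PageDesc array covering bits [21..12]. */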
83fb7adf
FB
184unsigned long qemu_real_host_page_size;
185unsigned long qemu_host_page_bits;
186unsigned long qemu_host_page_size;
187unsigned long qemu_host_page_mask;
54936004 188
5cd2c5b6
RH
189/* This is a multi-level map on the virtual address space.
190 The bottom level has pointers to PageDesc. */
191static void *l1_map[V_L1_SIZE];
54936004 192
e2eef170 193#if !defined(CONFIG_USER_ONLY)
41c1b1c9
PB
194typedef struct PhysPageDesc {
195 /* offset in host memory of the page + io_index in the low bits */
196 ram_addr_t phys_offset;
197 ram_addr_t region_offset;
198} PhysPageDesc;
199
5cd2c5b6
RH
200/* This is a multi-level map on the physical address space.
201 The bottom level has pointers to PhysPageDesc. */
202static void *l1_phys_map[P_L1_SIZE];
6d9a1304 203
e2eef170 204static void io_mem_init(void);
62152b8a 205static void memory_map_init(void);
e2eef170 206
33417e70 207/* io memory support */
33417e70
FB
208CPUWriteMemoryFunc *io_mem_write[IO_MEM_NB_ENTRIES][4];
209CPUReadMemoryFunc *io_mem_read[IO_MEM_NB_ENTRIES][4];
a4193c8a 210void *io_mem_opaque[IO_MEM_NB_ENTRIES];
511d2b14 211static char io_mem_used[IO_MEM_NB_ENTRIES];
6658ffb8
PB
212static int io_mem_watch;
213#endif
33417e70 214
34865134 215/* log support */
1e8b27ca
JR
216#ifdef WIN32
217static const char *logfilename = "qemu.log";
218#else
d9b630fd 219static const char *logfilename = "/tmp/qemu.log";
1e8b27ca 220#endif
34865134
FB
221FILE *logfile;
222int loglevel;
e735b91c 223static int log_append = 0;
34865134 224
e3db7226 225/* statistics */
b3755a91 226#if !defined(CONFIG_USER_ONLY)
e3db7226 227static int tlb_flush_count;
b3755a91 228#endif
e3db7226
FB
229static int tb_flush_count;
230static int tb_phys_invalidate_count;
231
7cb69cae
FB
232#ifdef _WIN32
233static void map_exec(void *addr, long size)
234{
235 DWORD old_protect;
236 VirtualProtect(addr, size,
237 PAGE_EXECUTE_READWRITE, &old_protect);
238
239}
240#else
241static void map_exec(void *addr, long size)
242{
4369415f 243 unsigned long start, end, page_size;
7cb69cae 244
4369415f 245 page_size = getpagesize();
7cb69cae 246 start = (unsigned long)addr;
4369415f 247 start &= ~(page_size - 1);
7cb69cae
FB
248
249 end = (unsigned long)addr + size;
4369415f
FB
250 end += page_size - 1;
251 end &= ~(page_size - 1);
7cb69cae
FB
252
253 mprotect((void *)start, end - start,
254 PROT_READ | PROT_WRITE | PROT_EXEC);
255}
256#endif
257
b346ff46 258static void page_init(void)
54936004 259{
83fb7adf 260 /* NOTE: we can always suppose that qemu_host_page_size >=
54936004 261 TARGET_PAGE_SIZE */
c2b48b69
AL
262#ifdef _WIN32
263 {
264 SYSTEM_INFO system_info;
265
266 GetSystemInfo(&system_info);
267 qemu_real_host_page_size = system_info.dwPageSize;
268 }
269#else
270 qemu_real_host_page_size = getpagesize();
271#endif
83fb7adf
FB
272 if (qemu_host_page_size == 0)
273 qemu_host_page_size = qemu_real_host_page_size;
274 if (qemu_host_page_size < TARGET_PAGE_SIZE)
275 qemu_host_page_size = TARGET_PAGE_SIZE;
276 qemu_host_page_bits = 0;
277 while ((1 << qemu_host_page_bits) < qemu_host_page_size)
278 qemu_host_page_bits++;
279 qemu_host_page_mask = ~(qemu_host_page_size - 1);
50a9569b 280
2e9a5713 281#if defined(CONFIG_BSD) && defined(CONFIG_USER_ONLY)
50a9569b 282 {
f01576f1
JL
283#ifdef HAVE_KINFO_GETVMMAP
284 struct kinfo_vmentry *freep;
285 int i, cnt;
286
287 freep = kinfo_getvmmap(getpid(), &cnt);
288 if (freep) {
289 mmap_lock();
290 for (i = 0; i < cnt; i++) {
291 unsigned long startaddr, endaddr;
292
293 startaddr = freep[i].kve_start;
294 endaddr = freep[i].kve_end;
295 if (h2g_valid(startaddr)) {
296 startaddr = h2g(startaddr) & TARGET_PAGE_MASK;
297
298 if (h2g_valid(endaddr)) {
299 endaddr = h2g(endaddr);
fd436907 300 page_set_flags(startaddr, endaddr, PAGE_RESERVED);
f01576f1
JL
301 } else {
302#if TARGET_ABI_BITS <= L1_MAP_ADDR_SPACE_BITS
303 endaddr = ~0ul;
fd436907 304 page_set_flags(startaddr, endaddr, PAGE_RESERVED);
f01576f1
JL
305#endif
306 }
307 }
308 }
309 free(freep);
310 mmap_unlock();
311 }
312#else
50a9569b 313 FILE *f;
50a9569b 314
0776590d 315 last_brk = (unsigned long)sbrk(0);
5cd2c5b6 316
fd436907 317 f = fopen("/compat/linux/proc/self/maps", "r");
50a9569b 318 if (f) {
5cd2c5b6
RH
319 mmap_lock();
320
50a9569b 321 do {
5cd2c5b6
RH
322 unsigned long startaddr, endaddr;
323 int n;
324
325 n = fscanf (f, "%lx-%lx %*[^\n]\n", &startaddr, &endaddr);
326
327 if (n == 2 && h2g_valid(startaddr)) {
328 startaddr = h2g(startaddr) & TARGET_PAGE_MASK;
329
330 if (h2g_valid(endaddr)) {
331 endaddr = h2g(endaddr);
332 } else {
333 endaddr = ~0ul;
334 }
335 page_set_flags(startaddr, endaddr, PAGE_RESERVED);
50a9569b
AZ
336 }
337 } while (!feof(f));
5cd2c5b6 338
50a9569b 339 fclose(f);
5cd2c5b6 340 mmap_unlock();
50a9569b 341 }
f01576f1 342#endif
50a9569b
AZ
343 }
344#endif
54936004
FB
345}
346
41c1b1c9 347static PageDesc *page_find_alloc(tb_page_addr_t index, int alloc)
54936004 348{
41c1b1c9
PB
349 PageDesc *pd;
350 void **lp;
351 int i;
352
5cd2c5b6 353#if defined(CONFIG_USER_ONLY)
2e9a5713 354 /* We can't use qemu_malloc because it may recurse into a locked mutex. */
5cd2c5b6
RH
355# define ALLOC(P, SIZE) \
356 do { \
357 P = mmap(NULL, SIZE, PROT_READ | PROT_WRITE, \
358 MAP_PRIVATE | MAP_ANONYMOUS, -1, 0); \
5cd2c5b6
RH
359 } while (0)
360#else
361# define ALLOC(P, SIZE) \
362 do { P = qemu_mallocz(SIZE); } while (0)
17e2377a 363#endif
434929bf 364
5cd2c5b6
RH
365 /* Level 1. Always allocated. */
366 lp = l1_map + ((index >> V_L1_SHIFT) & (V_L1_SIZE - 1));
367
368 /* Level 2..N-1. */
369 for (i = V_L1_SHIFT / L2_BITS - 1; i > 0; i--) {
370 void **p = *lp;
371
372 if (p == NULL) {
373 if (!alloc) {
374 return NULL;
375 }
376 ALLOC(p, sizeof(void *) * L2_SIZE);
377 *lp = p;
17e2377a 378 }
5cd2c5b6
RH
379
380 lp = p + ((index >> (i * L2_BITS)) & (L2_SIZE - 1));
381 }
382
383 pd = *lp;
384 if (pd == NULL) {
385 if (!alloc) {
386 return NULL;
387 }
388 ALLOC(pd, sizeof(PageDesc) * L2_SIZE);
389 *lp = pd;
54936004 390 }
5cd2c5b6
RH
391
392#undef ALLOC
5cd2c5b6
RH
393
394 return pd + (index & (L2_SIZE - 1));
54936004
FB
395}
396
41c1b1c9 397static inline PageDesc *page_find(tb_page_addr_t index)
54936004 398{
5cd2c5b6 399 return page_find_alloc(index, 0);
fd6ce8f6
FB
400}
401
6d9a1304 402#if !defined(CONFIG_USER_ONLY)
c227f099 403static PhysPageDesc *phys_page_find_alloc(target_phys_addr_t index, int alloc)
92e873b9 404{
e3f4e2a4 405 PhysPageDesc *pd;
5cd2c5b6
RH
406 void **lp;
407 int i;
92e873b9 408
5cd2c5b6
RH
409 /* Level 1. Always allocated. */
410 lp = l1_phys_map + ((index >> P_L1_SHIFT) & (P_L1_SIZE - 1));
108c49b8 411
5cd2c5b6
RH
412 /* Level 2..N-1. */
413 for (i = P_L1_SHIFT / L2_BITS - 1; i > 0; i--) {
414 void **p = *lp;
415 if (p == NULL) {
416 if (!alloc) {
417 return NULL;
418 }
419 *lp = p = qemu_mallocz(sizeof(void *) * L2_SIZE);
420 }
421 lp = p + ((index >> (i * L2_BITS)) & (L2_SIZE - 1));
108c49b8 422 }
5cd2c5b6 423
e3f4e2a4 424 pd = *lp;
5cd2c5b6 425 if (pd == NULL) {
e3f4e2a4 426 int i;
5cd2c5b6
RH
427
428 if (!alloc) {
108c49b8 429 return NULL;
5cd2c5b6
RH
430 }
431
432 *lp = pd = qemu_malloc(sizeof(PhysPageDesc) * L2_SIZE);
433
67c4d23c 434 for (i = 0; i < L2_SIZE; i++) {
5cd2c5b6
RH
435 pd[i].phys_offset = IO_MEM_UNASSIGNED;
436 pd[i].region_offset = (index + i) << TARGET_PAGE_BITS;
67c4d23c 437 }
92e873b9 438 }
5cd2c5b6
RH
439
440 return pd + (index & (L2_SIZE - 1));
92e873b9
FB
441}
442
c227f099 443static inline PhysPageDesc *phys_page_find(target_phys_addr_t index)
92e873b9 444{
108c49b8 445 return phys_page_find_alloc(index, 0);
92e873b9
FB
446}
447
c227f099
AL
448static void tlb_protect_code(ram_addr_t ram_addr);
449static void tlb_unprotect_code_phys(CPUState *env, ram_addr_t ram_addr,
3a7d929e 450 target_ulong vaddr);
c8a706fe
PB
451#define mmap_lock() do { } while(0)
452#define mmap_unlock() do { } while(0)
9fa3e853 453#endif
fd6ce8f6 454
4369415f
FB
455#define DEFAULT_CODE_GEN_BUFFER_SIZE (32 * 1024 * 1024)
456
457#if defined(CONFIG_USER_ONLY)
ccbb4d44 458/* Currently it is not recommended to allocate big chunks of data in
4369415f
FB
 459 user mode. It will change when a dedicated libc is used */
460#define USE_STATIC_CODE_GEN_BUFFER
461#endif
462
463#ifdef USE_STATIC_CODE_GEN_BUFFER
ebf50fb3
AJ
464static uint8_t static_code_gen_buffer[DEFAULT_CODE_GEN_BUFFER_SIZE]
465 __attribute__((aligned (CODE_GEN_ALIGN)));
4369415f
FB
466#endif
467
8fcd3692 468static void code_gen_alloc(unsigned long tb_size)
26a5f13b 469{
4369415f
FB
470#ifdef USE_STATIC_CODE_GEN_BUFFER
471 code_gen_buffer = static_code_gen_buffer;
472 code_gen_buffer_size = DEFAULT_CODE_GEN_BUFFER_SIZE;
473 map_exec(code_gen_buffer, code_gen_buffer_size);
474#else
26a5f13b
FB
475 code_gen_buffer_size = tb_size;
476 if (code_gen_buffer_size == 0) {
4369415f
FB
477#if defined(CONFIG_USER_ONLY)
478 /* in user mode, phys_ram_size is not meaningful */
479 code_gen_buffer_size = DEFAULT_CODE_GEN_BUFFER_SIZE;
480#else
ccbb4d44 481 /* XXX: needs adjustments */
94a6b54f 482 code_gen_buffer_size = (unsigned long)(ram_size / 4);
4369415f 483#endif
26a5f13b
FB
484 }
485 if (code_gen_buffer_size < MIN_CODE_GEN_BUFFER_SIZE)
486 code_gen_buffer_size = MIN_CODE_GEN_BUFFER_SIZE;
487 /* The code gen buffer location may have constraints depending on
488 the host cpu and OS */
489#if defined(__linux__)
490 {
491 int flags;
141ac468
BS
492 void *start = NULL;
493
26a5f13b
FB
494 flags = MAP_PRIVATE | MAP_ANONYMOUS;
495#if defined(__x86_64__)
496 flags |= MAP_32BIT;
497 /* Cannot map more than that */
498 if (code_gen_buffer_size > (800 * 1024 * 1024))
499 code_gen_buffer_size = (800 * 1024 * 1024);
141ac468
BS
500#elif defined(__sparc_v9__)
501 // Map the buffer below 2G, so we can use direct calls and branches
502 flags |= MAP_FIXED;
503 start = (void *) 0x60000000UL;
504 if (code_gen_buffer_size > (512 * 1024 * 1024))
505 code_gen_buffer_size = (512 * 1024 * 1024);
1cb0661e 506#elif defined(__arm__)
63d41246 507 /* Map the buffer below 32M, so we can use direct calls and branches */
1cb0661e
AZ
508 flags |= MAP_FIXED;
509 start = (void *) 0x01000000UL;
510 if (code_gen_buffer_size > 16 * 1024 * 1024)
511 code_gen_buffer_size = 16 * 1024 * 1024;
eba0b893
RH
512#elif defined(__s390x__)
513 /* Map the buffer so that we can use direct calls and branches. */
514 /* We have a +- 4GB range on the branches; leave some slop. */
515 if (code_gen_buffer_size > (3ul * 1024 * 1024 * 1024)) {
516 code_gen_buffer_size = 3ul * 1024 * 1024 * 1024;
517 }
518 start = (void *)0x90000000UL;
26a5f13b 519#endif
141ac468
BS
520 code_gen_buffer = mmap(start, code_gen_buffer_size,
521 PROT_WRITE | PROT_READ | PROT_EXEC,
26a5f13b
FB
522 flags, -1, 0);
523 if (code_gen_buffer == MAP_FAILED) {
524 fprintf(stderr, "Could not allocate dynamic translator buffer\n");
525 exit(1);
526 }
527 }
cbb608a5
BS
528#elif defined(__FreeBSD__) || defined(__FreeBSD_kernel__) \
529 || defined(__DragonFly__) || defined(__OpenBSD__)
06e67a82
AL
530 {
531 int flags;
532 void *addr = NULL;
533 flags = MAP_PRIVATE | MAP_ANONYMOUS;
534#if defined(__x86_64__)
535 /* FreeBSD doesn't have MAP_32BIT, use MAP_FIXED and assume
536 * 0x40000000 is free */
537 flags |= MAP_FIXED;
538 addr = (void *)0x40000000;
539 /* Cannot map more than that */
540 if (code_gen_buffer_size > (800 * 1024 * 1024))
541 code_gen_buffer_size = (800 * 1024 * 1024);
4cd31ad2
BS
542#elif defined(__sparc_v9__)
543 // Map the buffer below 2G, so we can use direct calls and branches
544 flags |= MAP_FIXED;
545 addr = (void *) 0x60000000UL;
546 if (code_gen_buffer_size > (512 * 1024 * 1024)) {
547 code_gen_buffer_size = (512 * 1024 * 1024);
548 }
06e67a82
AL
549#endif
550 code_gen_buffer = mmap(addr, code_gen_buffer_size,
551 PROT_WRITE | PROT_READ | PROT_EXEC,
552 flags, -1, 0);
553 if (code_gen_buffer == MAP_FAILED) {
554 fprintf(stderr, "Could not allocate dynamic translator buffer\n");
555 exit(1);
556 }
557 }
26a5f13b
FB
558#else
559 code_gen_buffer = qemu_malloc(code_gen_buffer_size);
26a5f13b
FB
560 map_exec(code_gen_buffer, code_gen_buffer_size);
561#endif
4369415f 562#endif /* !USE_STATIC_CODE_GEN_BUFFER */
26a5f13b 563 map_exec(code_gen_prologue, sizeof(code_gen_prologue));
a884da8a
PM
564 code_gen_buffer_max_size = code_gen_buffer_size -
565 (TCG_MAX_OP_SIZE * OPC_BUF_SIZE);
26a5f13b
FB
566 code_gen_max_blocks = code_gen_buffer_size / CODE_GEN_AVG_BLOCK_SIZE;
567 tbs = qemu_malloc(code_gen_max_blocks * sizeof(TranslationBlock));
568}
569
570/* Must be called before using the QEMU cpus. 'tb_size' is the size
571 (in bytes) allocated to the translation buffer. Zero means default
572 size. */
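/* For example, tcg_exec_init(0) keeps the default size: the 32 MB static
   buffer when USE_STATIC_CODE_GEN_BUFFER is defined, otherwise ram_size / 4
   (clamped to the per-host limits above) for the mmap'd buffer. */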
d5ab9713 573void tcg_exec_init(unsigned long tb_size)
26a5f13b 574{
26a5f13b
FB
575 cpu_gen_init();
576 code_gen_alloc(tb_size);
577 code_gen_ptr = code_gen_buffer;
4369415f 578 page_init();
9002ec79
RH
579#if !defined(CONFIG_USER_ONLY) || !defined(CONFIG_USE_GUEST_BASE)
580 /* There's no guest base to take into account, so go ahead and
581 initialize the prologue now. */
582 tcg_prologue_init(&tcg_ctx);
583#endif
26a5f13b
FB
584}
585
d5ab9713
JK
586bool tcg_enabled(void)
587{
588 return code_gen_buffer != NULL;
589}
590
591void cpu_exec_init_all(void)
592{
593#if !defined(CONFIG_USER_ONLY)
594 memory_map_init();
595 io_mem_init();
596#endif
597}
598
9656f324
PB
599#if defined(CPU_SAVE_VERSION) && !defined(CONFIG_USER_ONLY)
600
e59fb374 601static int cpu_common_post_load(void *opaque, int version_id)
e7f4eff7
JQ
602{
603 CPUState *env = opaque;
9656f324 604
3098dba0
AJ
605 /* 0x01 was CPU_INTERRUPT_EXIT. This line can be removed when the
606 version_id is increased. */
607 env->interrupt_request &= ~0x01;
9656f324
PB
608 tlb_flush(env, 1);
609
610 return 0;
611}
e7f4eff7
JQ
612
613static const VMStateDescription vmstate_cpu_common = {
614 .name = "cpu_common",
615 .version_id = 1,
616 .minimum_version_id = 1,
617 .minimum_version_id_old = 1,
e7f4eff7
JQ
618 .post_load = cpu_common_post_load,
619 .fields = (VMStateField []) {
620 VMSTATE_UINT32(halted, CPUState),
621 VMSTATE_UINT32(interrupt_request, CPUState),
622 VMSTATE_END_OF_LIST()
623 }
624};
9656f324
PB
625#endif
626
950f1472
GC
627CPUState *qemu_get_cpu(int cpu)
628{
629 CPUState *env = first_cpu;
630
631 while (env) {
632 if (env->cpu_index == cpu)
633 break;
634 env = env->next_cpu;
635 }
636
637 return env;
638}
639
6a00d601 640void cpu_exec_init(CPUState *env)
fd6ce8f6 641{
6a00d601
FB
642 CPUState **penv;
643 int cpu_index;
644
c2764719
PB
645#if defined(CONFIG_USER_ONLY)
646 cpu_list_lock();
647#endif
6a00d601
FB
648 env->next_cpu = NULL;
649 penv = &first_cpu;
650 cpu_index = 0;
651 while (*penv != NULL) {
1e9fa730 652 penv = &(*penv)->next_cpu;
6a00d601
FB
653 cpu_index++;
654 }
655 env->cpu_index = cpu_index;
268a362c 656 env->numa_node = 0;
72cf2d4f
BS
657 QTAILQ_INIT(&env->breakpoints);
658 QTAILQ_INIT(&env->watchpoints);
dc7a09cf
JK
659#ifndef CONFIG_USER_ONLY
660 env->thread_id = qemu_get_thread_id();
661#endif
6a00d601 662 *penv = env;
c2764719
PB
663#if defined(CONFIG_USER_ONLY)
664 cpu_list_unlock();
665#endif
b3c7724c 666#if defined(CPU_SAVE_VERSION) && !defined(CONFIG_USER_ONLY)
0be71e32
AW
667 vmstate_register(NULL, cpu_index, &vmstate_cpu_common, env);
668 register_savevm(NULL, "cpu", cpu_index, CPU_SAVE_VERSION,
b3c7724c
PB
669 cpu_save, cpu_load, env);
670#endif
fd6ce8f6
FB
671}
672
d1a1eb74
TG
673/* Allocate a new translation block. Flush the translation buffer if
674 too many translation blocks or too much generated code. */
675static TranslationBlock *tb_alloc(target_ulong pc)
676{
677 TranslationBlock *tb;
678
679 if (nb_tbs >= code_gen_max_blocks ||
680 (code_gen_ptr - code_gen_buffer) >= code_gen_buffer_max_size)
681 return NULL;
682 tb = &tbs[nb_tbs++];
683 tb->pc = pc;
684 tb->cflags = 0;
685 return tb;
686}
687
688void tb_free(TranslationBlock *tb)
689{
 690 /* In practice this is mostly used for single-use temporary TBs.
691 Ignore the hard cases and just back up if this TB happens to
692 be the last one generated. */
693 if (nb_tbs > 0 && tb == &tbs[nb_tbs - 1]) {
694 code_gen_ptr = tb->tc_ptr;
695 nb_tbs--;
696 }
697}
698
9fa3e853
FB
699static inline void invalidate_page_bitmap(PageDesc *p)
700{
701 if (p->code_bitmap) {
59817ccb 702 qemu_free(p->code_bitmap);
9fa3e853
FB
703 p->code_bitmap = NULL;
704 }
705 p->code_write_count = 0;
706}
707
5cd2c5b6
RH
708/* Set to NULL all the 'first_tb' fields in all PageDescs. */
709
710static void page_flush_tb_1 (int level, void **lp)
fd6ce8f6 711{
5cd2c5b6 712 int i;
fd6ce8f6 713
5cd2c5b6
RH
714 if (*lp == NULL) {
715 return;
716 }
717 if (level == 0) {
718 PageDesc *pd = *lp;
7296abac 719 for (i = 0; i < L2_SIZE; ++i) {
5cd2c5b6
RH
720 pd[i].first_tb = NULL;
721 invalidate_page_bitmap(pd + i);
fd6ce8f6 722 }
5cd2c5b6
RH
723 } else {
724 void **pp = *lp;
7296abac 725 for (i = 0; i < L2_SIZE; ++i) {
5cd2c5b6
RH
726 page_flush_tb_1 (level - 1, pp + i);
727 }
728 }
729}
730
731static void page_flush_tb(void)
732{
733 int i;
734 for (i = 0; i < V_L1_SIZE; i++) {
735 page_flush_tb_1(V_L1_SHIFT / L2_BITS - 1, l1_map + i);
fd6ce8f6
FB
736 }
737}
738
739/* flush all the translation blocks */
d4e8164f 740/* XXX: tb_flush is currently not thread safe */
6a00d601 741void tb_flush(CPUState *env1)
fd6ce8f6 742{
6a00d601 743 CPUState *env;
0124311e 744#if defined(DEBUG_FLUSH)
ab3d1727
BS
745 printf("qemu: flush code_size=%ld nb_tbs=%d avg_tb_size=%ld\n",
746 (unsigned long)(code_gen_ptr - code_gen_buffer),
747 nb_tbs, nb_tbs > 0 ?
748 ((unsigned long)(code_gen_ptr - code_gen_buffer)) / nb_tbs : 0);
fd6ce8f6 749#endif
26a5f13b 750 if ((unsigned long)(code_gen_ptr - code_gen_buffer) > code_gen_buffer_size)
a208e54a
PB
751 cpu_abort(env1, "Internal error: code buffer overflow\n");
752
fd6ce8f6 753 nb_tbs = 0;
3b46e624 754
6a00d601
FB
755 for(env = first_cpu; env != NULL; env = env->next_cpu) {
756 memset (env->tb_jmp_cache, 0, TB_JMP_CACHE_SIZE * sizeof (void *));
757 }
9fa3e853 758
8a8a608f 759 memset (tb_phys_hash, 0, CODE_GEN_PHYS_HASH_SIZE * sizeof (void *));
fd6ce8f6 760 page_flush_tb();
9fa3e853 761
fd6ce8f6 762 code_gen_ptr = code_gen_buffer;
d4e8164f
FB
763 /* XXX: flush processor icache at this point if cache flush is
764 expensive */
e3db7226 765 tb_flush_count++;
fd6ce8f6
FB
766}
767
768#ifdef DEBUG_TB_CHECK
769
bc98a7ef 770static void tb_invalidate_check(target_ulong address)
fd6ce8f6
FB
771{
772 TranslationBlock *tb;
773 int i;
774 address &= TARGET_PAGE_MASK;
99773bd4
PB
775 for(i = 0;i < CODE_GEN_PHYS_HASH_SIZE; i++) {
776 for(tb = tb_phys_hash[i]; tb != NULL; tb = tb->phys_hash_next) {
fd6ce8f6
FB
777 if (!(address + TARGET_PAGE_SIZE <= tb->pc ||
778 address >= tb->pc + tb->size)) {
0bf9e31a
BS
779 printf("ERROR invalidate: address=" TARGET_FMT_lx
780 " PC=%08lx size=%04x\n",
99773bd4 781 address, (long)tb->pc, tb->size);
fd6ce8f6
FB
782 }
783 }
784 }
785}
786
787/* verify that all the pages have correct rights for code */
788static void tb_page_check(void)
789{
790 TranslationBlock *tb;
791 int i, flags1, flags2;
3b46e624 792
99773bd4
PB
793 for(i = 0;i < CODE_GEN_PHYS_HASH_SIZE; i++) {
794 for(tb = tb_phys_hash[i]; tb != NULL; tb = tb->phys_hash_next) {
fd6ce8f6
FB
795 flags1 = page_get_flags(tb->pc);
796 flags2 = page_get_flags(tb->pc + tb->size - 1);
797 if ((flags1 & PAGE_WRITE) || (flags2 & PAGE_WRITE)) {
798 printf("ERROR page flags: PC=%08lx size=%04x f1=%x f2=%x\n",
99773bd4 799 (long)tb->pc, tb->size, flags1, flags2);
fd6ce8f6
FB
800 }
801 }
802 }
803}
804
805#endif
806
807/* invalidate one TB */
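/* Unlink 'tb' from a singly linked list whose 'next' pointer lives at byte
   offset 'next_offset' inside each TranslationBlock. */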
808static inline void tb_remove(TranslationBlock **ptb, TranslationBlock *tb,
809 int next_offset)
810{
811 TranslationBlock *tb1;
812 for(;;) {
813 tb1 = *ptb;
814 if (tb1 == tb) {
815 *ptb = *(TranslationBlock **)((char *)tb1 + next_offset);
816 break;
817 }
818 ptb = (TranslationBlock **)((char *)tb1 + next_offset);
819 }
820}
821
9fa3e853
FB
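/* Unlink 'tb' from a page's TB list; the list pointers carry the TB's page
   slot index (0 or 1) in their two low bits. */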
822static inline void tb_page_remove(TranslationBlock **ptb, TranslationBlock *tb)
823{
824 TranslationBlock *tb1;
825 unsigned int n1;
826
827 for(;;) {
828 tb1 = *ptb;
829 n1 = (long)tb1 & 3;
830 tb1 = (TranslationBlock *)((long)tb1 & ~3);
831 if (tb1 == tb) {
832 *ptb = tb1->page_next[n1];
833 break;
834 }
835 ptb = &tb1->page_next[n1];
836 }
837}
838
d4e8164f
FB
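/* Remove 'tb' from the circular list of TBs that jump to the TB it is
   chained to through jmp_next[n]. */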
839static inline void tb_jmp_remove(TranslationBlock *tb, int n)
840{
841 TranslationBlock *tb1, **ptb;
842 unsigned int n1;
843
844 ptb = &tb->jmp_next[n];
845 tb1 = *ptb;
846 if (tb1) {
847 /* find tb(n) in circular list */
848 for(;;) {
849 tb1 = *ptb;
850 n1 = (long)tb1 & 3;
851 tb1 = (TranslationBlock *)((long)tb1 & ~3);
852 if (n1 == n && tb1 == tb)
853 break;
854 if (n1 == 2) {
855 ptb = &tb1->jmp_first;
856 } else {
857 ptb = &tb1->jmp_next[n1];
858 }
859 }
860 /* now we can suppress tb(n) from the list */
861 *ptb = tb->jmp_next[n];
862
863 tb->jmp_next[n] = NULL;
864 }
865}
866
867/* reset the jump entry 'n' of a TB so that it is not chained to
868 another TB */
869static inline void tb_reset_jump(TranslationBlock *tb, int n)
870{
871 tb_set_jmp_target(tb, n, (unsigned long)(tb->tc_ptr + tb->tb_next_offset[n]));
872}
873
41c1b1c9 874void tb_phys_invalidate(TranslationBlock *tb, tb_page_addr_t page_addr)
fd6ce8f6 875{
6a00d601 876 CPUState *env;
8a40a180 877 PageDesc *p;
d4e8164f 878 unsigned int h, n1;
41c1b1c9 879 tb_page_addr_t phys_pc;
8a40a180 880 TranslationBlock *tb1, *tb2;
3b46e624 881
8a40a180
FB
882 /* remove the TB from the hash list */
883 phys_pc = tb->page_addr[0] + (tb->pc & ~TARGET_PAGE_MASK);
884 h = tb_phys_hash_func(phys_pc);
5fafdf24 885 tb_remove(&tb_phys_hash[h], tb,
8a40a180
FB
886 offsetof(TranslationBlock, phys_hash_next));
887
888 /* remove the TB from the page list */
889 if (tb->page_addr[0] != page_addr) {
890 p = page_find(tb->page_addr[0] >> TARGET_PAGE_BITS);
891 tb_page_remove(&p->first_tb, tb);
892 invalidate_page_bitmap(p);
893 }
894 if (tb->page_addr[1] != -1 && tb->page_addr[1] != page_addr) {
895 p = page_find(tb->page_addr[1] >> TARGET_PAGE_BITS);
896 tb_page_remove(&p->first_tb, tb);
897 invalidate_page_bitmap(p);
898 }
899
36bdbe54 900 tb_invalidated_flag = 1;
59817ccb 901
fd6ce8f6 902 /* remove the TB from the hash list */
8a40a180 903 h = tb_jmp_cache_hash_func(tb->pc);
6a00d601
FB
904 for(env = first_cpu; env != NULL; env = env->next_cpu) {
905 if (env->tb_jmp_cache[h] == tb)
906 env->tb_jmp_cache[h] = NULL;
907 }
d4e8164f
FB
908
909 /* suppress this TB from the two jump lists */
910 tb_jmp_remove(tb, 0);
911 tb_jmp_remove(tb, 1);
912
913 /* suppress any remaining jumps to this TB */
914 tb1 = tb->jmp_first;
915 for(;;) {
916 n1 = (long)tb1 & 3;
917 if (n1 == 2)
918 break;
919 tb1 = (TranslationBlock *)((long)tb1 & ~3);
920 tb2 = tb1->jmp_next[n1];
921 tb_reset_jump(tb1, n1);
922 tb1->jmp_next[n1] = NULL;
923 tb1 = tb2;
924 }
925 tb->jmp_first = (TranslationBlock *)((long)tb | 2); /* fail safe */
9fa3e853 926
e3db7226 927 tb_phys_invalidate_count++;
9fa3e853
FB
928}
929
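/* Set 'len' consecutive bits starting at bit index 'start' in the
   bitmap 'tab'. */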
930static inline void set_bits(uint8_t *tab, int start, int len)
931{
932 int end, mask, end1;
933
934 end = start + len;
935 tab += start >> 3;
936 mask = 0xff << (start & 7);
937 if ((start & ~7) == (end & ~7)) {
938 if (start < end) {
939 mask &= ~(0xff << (end & 7));
940 *tab |= mask;
941 }
942 } else {
943 *tab++ |= mask;
944 start = (start + 8) & ~7;
945 end1 = end & ~7;
946 while (start < end1) {
947 *tab++ = 0xff;
948 start += 8;
949 }
950 if (start < end) {
951 mask = ~(0xff << (end & 7));
952 *tab |= mask;
953 }
954 }
955}
956
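/* Build the page's code bitmap by marking the byte range covered by every
   TB that intersects this page. */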
957static void build_page_bitmap(PageDesc *p)
958{
959 int n, tb_start, tb_end;
960 TranslationBlock *tb;
3b46e624 961
b2a7081a 962 p->code_bitmap = qemu_mallocz(TARGET_PAGE_SIZE / 8);
9fa3e853
FB
963
964 tb = p->first_tb;
965 while (tb != NULL) {
966 n = (long)tb & 3;
967 tb = (TranslationBlock *)((long)tb & ~3);
968 /* NOTE: this is subtle as a TB may span two physical pages */
969 if (n == 0) {
970 /* NOTE: tb_end may be after the end of the page, but
971 it is not a problem */
972 tb_start = tb->pc & ~TARGET_PAGE_MASK;
973 tb_end = tb_start + tb->size;
974 if (tb_end > TARGET_PAGE_SIZE)
975 tb_end = TARGET_PAGE_SIZE;
976 } else {
977 tb_start = 0;
978 tb_end = ((tb->pc + tb->size) & ~TARGET_PAGE_MASK);
979 }
980 set_bits(p->code_bitmap, tb_start, tb_end - tb_start);
981 tb = tb->page_next[n];
982 }
983}
984
2e70f6ef
PB
985TranslationBlock *tb_gen_code(CPUState *env,
986 target_ulong pc, target_ulong cs_base,
987 int flags, int cflags)
d720b93d
FB
988{
989 TranslationBlock *tb;
990 uint8_t *tc_ptr;
41c1b1c9
PB
991 tb_page_addr_t phys_pc, phys_page2;
992 target_ulong virt_page2;
d720b93d
FB
993 int code_gen_size;
994
41c1b1c9 995 phys_pc = get_page_addr_code(env, pc);
c27004ec 996 tb = tb_alloc(pc);
d720b93d
FB
997 if (!tb) {
998 /* flush must be done */
999 tb_flush(env);
1000 /* cannot fail at this point */
c27004ec 1001 tb = tb_alloc(pc);
2e70f6ef
PB
1002 /* Don't forget to invalidate previous TB info. */
1003 tb_invalidated_flag = 1;
d720b93d
FB
1004 }
1005 tc_ptr = code_gen_ptr;
1006 tb->tc_ptr = tc_ptr;
1007 tb->cs_base = cs_base;
1008 tb->flags = flags;
1009 tb->cflags = cflags;
d07bde88 1010 cpu_gen_code(env, tb, &code_gen_size);
d720b93d 1011 code_gen_ptr = (void *)(((unsigned long)code_gen_ptr + code_gen_size + CODE_GEN_ALIGN - 1) & ~(CODE_GEN_ALIGN - 1));
3b46e624 1012
d720b93d 1013 /* check next page if needed */
c27004ec 1014 virt_page2 = (pc + tb->size - 1) & TARGET_PAGE_MASK;
d720b93d 1015 phys_page2 = -1;
c27004ec 1016 if ((pc & TARGET_PAGE_MASK) != virt_page2) {
41c1b1c9 1017 phys_page2 = get_page_addr_code(env, virt_page2);
d720b93d 1018 }
41c1b1c9 1019 tb_link_page(tb, phys_pc, phys_page2);
2e70f6ef 1020 return tb;
d720b93d 1021}
3b46e624 1022
9fa3e853
FB
1023/* invalidate all TBs which intersect with the target physical page
1024 starting in range [start;end[. NOTE: start and end must refer to
d720b93d
FB
1025 the same physical page. 'is_cpu_write_access' should be true if called
1026 from a real cpu write access: the virtual CPU will exit the current
1027 TB if code is modified inside this TB. */
41c1b1c9 1028void tb_invalidate_phys_page_range(tb_page_addr_t start, tb_page_addr_t end,
d720b93d
FB
1029 int is_cpu_write_access)
1030{
6b917547 1031 TranslationBlock *tb, *tb_next, *saved_tb;
d720b93d 1032 CPUState *env = cpu_single_env;
41c1b1c9 1033 tb_page_addr_t tb_start, tb_end;
6b917547
AL
1034 PageDesc *p;
1035 int n;
1036#ifdef TARGET_HAS_PRECISE_SMC
1037 int current_tb_not_found = is_cpu_write_access;
1038 TranslationBlock *current_tb = NULL;
1039 int current_tb_modified = 0;
1040 target_ulong current_pc = 0;
1041 target_ulong current_cs_base = 0;
1042 int current_flags = 0;
1043#endif /* TARGET_HAS_PRECISE_SMC */
9fa3e853
FB
1044
1045 p = page_find(start >> TARGET_PAGE_BITS);
5fafdf24 1046 if (!p)
9fa3e853 1047 return;
5fafdf24 1048 if (!p->code_bitmap &&
d720b93d
FB
1049 ++p->code_write_count >= SMC_BITMAP_USE_THRESHOLD &&
1050 is_cpu_write_access) {
9fa3e853
FB
1051 /* build code bitmap */
1052 build_page_bitmap(p);
1053 }
1054
1055 /* we remove all the TBs in the range [start, end[ */
1056 /* XXX: see if in some cases it could be faster to invalidate all the code */
1057 tb = p->first_tb;
1058 while (tb != NULL) {
1059 n = (long)tb & 3;
1060 tb = (TranslationBlock *)((long)tb & ~3);
1061 tb_next = tb->page_next[n];
1062 /* NOTE: this is subtle as a TB may span two physical pages */
1063 if (n == 0) {
1064 /* NOTE: tb_end may be after the end of the page, but
1065 it is not a problem */
1066 tb_start = tb->page_addr[0] + (tb->pc & ~TARGET_PAGE_MASK);
1067 tb_end = tb_start + tb->size;
1068 } else {
1069 tb_start = tb->page_addr[1];
1070 tb_end = tb_start + ((tb->pc + tb->size) & ~TARGET_PAGE_MASK);
1071 }
1072 if (!(tb_end <= start || tb_start >= end)) {
d720b93d
FB
1073#ifdef TARGET_HAS_PRECISE_SMC
1074 if (current_tb_not_found) {
1075 current_tb_not_found = 0;
1076 current_tb = NULL;
2e70f6ef 1077 if (env->mem_io_pc) {
d720b93d 1078 /* now we have a real cpu fault */
2e70f6ef 1079 current_tb = tb_find_pc(env->mem_io_pc);
d720b93d
FB
1080 }
1081 }
1082 if (current_tb == tb &&
2e70f6ef 1083 (current_tb->cflags & CF_COUNT_MASK) != 1) {
d720b93d
FB
1084 /* If we are modifying the current TB, we must stop
1085 its execution. We could be more precise by checking
1086 that the modification is after the current PC, but it
1087 would require a specialized function to partially
1088 restore the CPU state */
3b46e624 1089
d720b93d 1090 current_tb_modified = 1;
618ba8e6 1091 cpu_restore_state(current_tb, env, env->mem_io_pc);
6b917547
AL
1092 cpu_get_tb_cpu_state(env, &current_pc, &current_cs_base,
1093 &current_flags);
d720b93d
FB
1094 }
1095#endif /* TARGET_HAS_PRECISE_SMC */
6f5a9f7e
FB
1096 /* we need to do that to handle the case where a signal
1097 occurs while doing tb_phys_invalidate() */
1098 saved_tb = NULL;
1099 if (env) {
1100 saved_tb = env->current_tb;
1101 env->current_tb = NULL;
1102 }
9fa3e853 1103 tb_phys_invalidate(tb, -1);
6f5a9f7e
FB
1104 if (env) {
1105 env->current_tb = saved_tb;
1106 if (env->interrupt_request && env->current_tb)
1107 cpu_interrupt(env, env->interrupt_request);
1108 }
9fa3e853
FB
1109 }
1110 tb = tb_next;
1111 }
1112#if !defined(CONFIG_USER_ONLY)
1113 /* if no code remaining, no need to continue to use slow writes */
1114 if (!p->first_tb) {
1115 invalidate_page_bitmap(p);
d720b93d 1116 if (is_cpu_write_access) {
2e70f6ef 1117 tlb_unprotect_code_phys(env, start, env->mem_io_vaddr);
d720b93d
FB
1118 }
1119 }
1120#endif
1121#ifdef TARGET_HAS_PRECISE_SMC
1122 if (current_tb_modified) {
1123 /* we generate a block containing just the instruction
1124 modifying the memory. It will ensure that it cannot modify
1125 itself */
ea1c1802 1126 env->current_tb = NULL;
2e70f6ef 1127 tb_gen_code(env, current_pc, current_cs_base, current_flags, 1);
d720b93d 1128 cpu_resume_from_signal(env, NULL);
9fa3e853 1129 }
fd6ce8f6 1130#endif
9fa3e853 1131}
fd6ce8f6 1132
9fa3e853 1133/* len must be <= 8 and start must be a multiple of len */
41c1b1c9 1134static inline void tb_invalidate_phys_page_fast(tb_page_addr_t start, int len)
9fa3e853
FB
1135{
1136 PageDesc *p;
1137 int offset, b;
59817ccb 1138#if 0
a4193c8a 1139 if (1) {
93fcfe39
AL
1140 qemu_log("modifying code at 0x%x size=%d EIP=%x PC=%08x\n",
1141 cpu_single_env->mem_io_vaddr, len,
1142 cpu_single_env->eip,
1143 cpu_single_env->eip + (long)cpu_single_env->segs[R_CS].base);
59817ccb
FB
1144 }
1145#endif
9fa3e853 1146 p = page_find(start >> TARGET_PAGE_BITS);
5fafdf24 1147 if (!p)
9fa3e853
FB
1148 return;
1149 if (p->code_bitmap) {
1150 offset = start & ~TARGET_PAGE_MASK;
1151 b = p->code_bitmap[offset >> 3] >> (offset & 7);
1152 if (b & ((1 << len) - 1))
1153 goto do_invalidate;
1154 } else {
1155 do_invalidate:
d720b93d 1156 tb_invalidate_phys_page_range(start, start + len, 1);
9fa3e853
FB
1157 }
1158}
1159
9fa3e853 1160#if !defined(CONFIG_SOFTMMU)
41c1b1c9 1161static void tb_invalidate_phys_page(tb_page_addr_t addr,
d720b93d 1162 unsigned long pc, void *puc)
9fa3e853 1163{
6b917547 1164 TranslationBlock *tb;
9fa3e853 1165 PageDesc *p;
6b917547 1166 int n;
d720b93d 1167#ifdef TARGET_HAS_PRECISE_SMC
6b917547 1168 TranslationBlock *current_tb = NULL;
d720b93d 1169 CPUState *env = cpu_single_env;
6b917547
AL
1170 int current_tb_modified = 0;
1171 target_ulong current_pc = 0;
1172 target_ulong current_cs_base = 0;
1173 int current_flags = 0;
d720b93d 1174#endif
9fa3e853
FB
1175
1176 addr &= TARGET_PAGE_MASK;
1177 p = page_find(addr >> TARGET_PAGE_BITS);
5fafdf24 1178 if (!p)
9fa3e853
FB
1179 return;
1180 tb = p->first_tb;
d720b93d
FB
1181#ifdef TARGET_HAS_PRECISE_SMC
1182 if (tb && pc != 0) {
1183 current_tb = tb_find_pc(pc);
1184 }
1185#endif
9fa3e853
FB
1186 while (tb != NULL) {
1187 n = (long)tb & 3;
1188 tb = (TranslationBlock *)((long)tb & ~3);
d720b93d
FB
1189#ifdef TARGET_HAS_PRECISE_SMC
1190 if (current_tb == tb &&
2e70f6ef 1191 (current_tb->cflags & CF_COUNT_MASK) != 1) {
d720b93d
FB
1192 /* If we are modifying the current TB, we must stop
1193 its execution. We could be more precise by checking
1194 that the modification is after the current PC, but it
1195 would require a specialized function to partially
1196 restore the CPU state */
3b46e624 1197
d720b93d 1198 current_tb_modified = 1;
618ba8e6 1199 cpu_restore_state(current_tb, env, pc);
6b917547
AL
1200 cpu_get_tb_cpu_state(env, &current_pc, &current_cs_base,
1201 &current_flags);
d720b93d
FB
1202 }
1203#endif /* TARGET_HAS_PRECISE_SMC */
9fa3e853
FB
1204 tb_phys_invalidate(tb, addr);
1205 tb = tb->page_next[n];
1206 }
fd6ce8f6 1207 p->first_tb = NULL;
d720b93d
FB
1208#ifdef TARGET_HAS_PRECISE_SMC
1209 if (current_tb_modified) {
1210 /* we generate a block containing just the instruction
1211 modifying the memory. It will ensure that it cannot modify
1212 itself */
ea1c1802 1213 env->current_tb = NULL;
2e70f6ef 1214 tb_gen_code(env, current_pc, current_cs_base, current_flags, 1);
d720b93d
FB
1215 cpu_resume_from_signal(env, puc);
1216 }
1217#endif
fd6ce8f6 1218}
9fa3e853 1219#endif
fd6ce8f6
FB
1220
1221/* add the tb in the target page and protect it if necessary */
5fafdf24 1222static inline void tb_alloc_page(TranslationBlock *tb,
41c1b1c9 1223 unsigned int n, tb_page_addr_t page_addr)
fd6ce8f6
FB
1224{
1225 PageDesc *p;
4429ab44
JQ
1226#ifndef CONFIG_USER_ONLY
1227 bool page_already_protected;
1228#endif
9fa3e853
FB
1229
1230 tb->page_addr[n] = page_addr;
5cd2c5b6 1231 p = page_find_alloc(page_addr >> TARGET_PAGE_BITS, 1);
9fa3e853 1232 tb->page_next[n] = p->first_tb;
4429ab44
JQ
1233#ifndef CONFIG_USER_ONLY
1234 page_already_protected = p->first_tb != NULL;
1235#endif
9fa3e853
FB
1236 p->first_tb = (TranslationBlock *)((long)tb | n);
1237 invalidate_page_bitmap(p);
fd6ce8f6 1238
107db443 1239#if defined(TARGET_HAS_SMC) || 1
d720b93d 1240
9fa3e853 1241#if defined(CONFIG_USER_ONLY)
fd6ce8f6 1242 if (p->flags & PAGE_WRITE) {
53a5960a
PB
1243 target_ulong addr;
1244 PageDesc *p2;
9fa3e853
FB
1245 int prot;
1246
fd6ce8f6
FB
1247 /* force the host page as non writable (writes will have a
1248 page fault + mprotect overhead) */
53a5960a 1249 page_addr &= qemu_host_page_mask;
fd6ce8f6 1250 prot = 0;
53a5960a
PB
1251 for(addr = page_addr; addr < page_addr + qemu_host_page_size;
1252 addr += TARGET_PAGE_SIZE) {
1253
1254 p2 = page_find (addr >> TARGET_PAGE_BITS);
1255 if (!p2)
1256 continue;
1257 prot |= p2->flags;
1258 p2->flags &= ~PAGE_WRITE;
53a5960a 1259 }
5fafdf24 1260 mprotect(g2h(page_addr), qemu_host_page_size,
fd6ce8f6
FB
1261 (prot & PAGE_BITS) & ~PAGE_WRITE);
1262#ifdef DEBUG_TB_INVALIDATE
ab3d1727 1263 printf("protecting code page: 0x" TARGET_FMT_lx "\n",
53a5960a 1264 page_addr);
fd6ce8f6 1265#endif
fd6ce8f6 1266 }
9fa3e853
FB
1267#else
1268 /* if some code is already present, then the pages are already
1269 protected. So we handle the case where only the first TB is
1270 allocated in a physical page */
4429ab44 1271 if (!page_already_protected) {
6a00d601 1272 tlb_protect_code(page_addr);
9fa3e853
FB
1273 }
1274#endif
d720b93d
FB
1275
1276#endif /* TARGET_HAS_SMC */
fd6ce8f6
FB
1277}
1278
9fa3e853
FB
1279/* add a new TB and link it to the physical page tables. phys_page2 is
1280 (-1) to indicate that only one page contains the TB. */
41c1b1c9
PB
1281void tb_link_page(TranslationBlock *tb,
1282 tb_page_addr_t phys_pc, tb_page_addr_t phys_page2)
d4e8164f 1283{
9fa3e853
FB
1284 unsigned int h;
1285 TranslationBlock **ptb;
1286
c8a706fe
PB
1287 /* Grab the mmap lock to stop another thread invalidating this TB
1288 before we are done. */
1289 mmap_lock();
9fa3e853
FB
1290 /* add in the physical hash table */
1291 h = tb_phys_hash_func(phys_pc);
1292 ptb = &tb_phys_hash[h];
1293 tb->phys_hash_next = *ptb;
1294 *ptb = tb;
fd6ce8f6
FB
1295
1296 /* add in the page list */
9fa3e853
FB
1297 tb_alloc_page(tb, 0, phys_pc & TARGET_PAGE_MASK);
1298 if (phys_page2 != -1)
1299 tb_alloc_page(tb, 1, phys_page2);
1300 else
1301 tb->page_addr[1] = -1;
9fa3e853 1302
d4e8164f
FB
1303 tb->jmp_first = (TranslationBlock *)((long)tb | 2);
1304 tb->jmp_next[0] = NULL;
1305 tb->jmp_next[1] = NULL;
1306
1307 /* init original jump addresses */
1308 if (tb->tb_next_offset[0] != 0xffff)
1309 tb_reset_jump(tb, 0);
1310 if (tb->tb_next_offset[1] != 0xffff)
1311 tb_reset_jump(tb, 1);
8a40a180
FB
1312
1313#ifdef DEBUG_TB_CHECK
1314 tb_page_check();
1315#endif
c8a706fe 1316 mmap_unlock();
fd6ce8f6
FB
1317}
1318
9fa3e853
FB
1319/* find the TB 'tb' such that tb[0].tc_ptr <= tc_ptr <
1320 tb[1].tc_ptr. Return NULL if not found */
1321TranslationBlock *tb_find_pc(unsigned long tc_ptr)
fd6ce8f6 1322{
9fa3e853
FB
1323 int m_min, m_max, m;
1324 unsigned long v;
1325 TranslationBlock *tb;
a513fe19
FB
1326
1327 if (nb_tbs <= 0)
1328 return NULL;
1329 if (tc_ptr < (unsigned long)code_gen_buffer ||
1330 tc_ptr >= (unsigned long)code_gen_ptr)
1331 return NULL;
1332 /* binary search (cf Knuth) */
1333 m_min = 0;
1334 m_max = nb_tbs - 1;
1335 while (m_min <= m_max) {
1336 m = (m_min + m_max) >> 1;
1337 tb = &tbs[m];
1338 v = (unsigned long)tb->tc_ptr;
1339 if (v == tc_ptr)
1340 return tb;
1341 else if (tc_ptr < v) {
1342 m_max = m - 1;
1343 } else {
1344 m_min = m + 1;
1345 }
5fafdf24 1346 }
a513fe19
FB
1347 return &tbs[m_max];
1348}
7501267e 1349
ea041c0e
FB
1350static void tb_reset_jump_recursive(TranslationBlock *tb);
1351
1352static inline void tb_reset_jump_recursive2(TranslationBlock *tb, int n)
1353{
1354 TranslationBlock *tb1, *tb_next, **ptb;
1355 unsigned int n1;
1356
1357 tb1 = tb->jmp_next[n];
1358 if (tb1 != NULL) {
1359 /* find head of list */
1360 for(;;) {
1361 n1 = (long)tb1 & 3;
1362 tb1 = (TranslationBlock *)((long)tb1 & ~3);
1363 if (n1 == 2)
1364 break;
1365 tb1 = tb1->jmp_next[n1];
1366 }
 1367 /* we are now sure that tb jumps to tb1 */
1368 tb_next = tb1;
1369
1370 /* remove tb from the jmp_first list */
1371 ptb = &tb_next->jmp_first;
1372 for(;;) {
1373 tb1 = *ptb;
1374 n1 = (long)tb1 & 3;
1375 tb1 = (TranslationBlock *)((long)tb1 & ~3);
1376 if (n1 == n && tb1 == tb)
1377 break;
1378 ptb = &tb1->jmp_next[n1];
1379 }
1380 *ptb = tb->jmp_next[n];
1381 tb->jmp_next[n] = NULL;
3b46e624 1382
ea041c0e
FB
1383 /* suppress the jump to next tb in generated code */
1384 tb_reset_jump(tb, n);
1385
0124311e 1386 /* suppress jumps in the tb on which we could have jumped */
ea041c0e
FB
1387 tb_reset_jump_recursive(tb_next);
1388 }
1389}
1390
1391static void tb_reset_jump_recursive(TranslationBlock *tb)
1392{
1393 tb_reset_jump_recursive2(tb, 0);
1394 tb_reset_jump_recursive2(tb, 1);
1395}
1396
1fddef4b 1397#if defined(TARGET_HAS_ICE)
94df27fd
PB
1398#if defined(CONFIG_USER_ONLY)
1399static void breakpoint_invalidate(CPUState *env, target_ulong pc)
1400{
1401 tb_invalidate_phys_page_range(pc, pc + 1, 0);
1402}
1403#else
d720b93d
FB
1404static void breakpoint_invalidate(CPUState *env, target_ulong pc)
1405{
c227f099 1406 target_phys_addr_t addr;
9b3c35e0 1407 target_ulong pd;
c227f099 1408 ram_addr_t ram_addr;
c2f07f81 1409 PhysPageDesc *p;
d720b93d 1410
c2f07f81
PB
1411 addr = cpu_get_phys_page_debug(env, pc);
1412 p = phys_page_find(addr >> TARGET_PAGE_BITS);
1413 if (!p) {
1414 pd = IO_MEM_UNASSIGNED;
1415 } else {
1416 pd = p->phys_offset;
1417 }
1418 ram_addr = (pd & TARGET_PAGE_MASK) | (pc & ~TARGET_PAGE_MASK);
706cd4b5 1419 tb_invalidate_phys_page_range(ram_addr, ram_addr + 1, 0);
d720b93d 1420}
c27004ec 1421#endif
94df27fd 1422#endif /* TARGET_HAS_ICE */
d720b93d 1423
c527ee8f
PB
1424#if defined(CONFIG_USER_ONLY)
1425void cpu_watchpoint_remove_all(CPUState *env, int mask)
1426
1427{
1428}
1429
1430int cpu_watchpoint_insert(CPUState *env, target_ulong addr, target_ulong len,
1431 int flags, CPUWatchpoint **watchpoint)
1432{
1433 return -ENOSYS;
1434}
1435#else
6658ffb8 1436/* Add a watchpoint. */
a1d1bb31
AL
1437int cpu_watchpoint_insert(CPUState *env, target_ulong addr, target_ulong len,
1438 int flags, CPUWatchpoint **watchpoint)
6658ffb8 1439{
b4051334 1440 target_ulong len_mask = ~(len - 1);
c0ce998e 1441 CPUWatchpoint *wp;
6658ffb8 1442
b4051334
AL
1443 /* sanity checks: allow power-of-2 lengths, deny unaligned watchpoints */
1444 if ((len != 1 && len != 2 && len != 4 && len != 8) || (addr & ~len_mask)) {
1445 fprintf(stderr, "qemu: tried to set invalid watchpoint at "
1446 TARGET_FMT_lx ", len=" TARGET_FMT_lu "\n", addr, len);
1447 return -EINVAL;
1448 }
a1d1bb31 1449 wp = qemu_malloc(sizeof(*wp));
a1d1bb31
AL
1450
1451 wp->vaddr = addr;
b4051334 1452 wp->len_mask = len_mask;
a1d1bb31
AL
1453 wp->flags = flags;
1454
2dc9f411 1455 /* keep all GDB-injected watchpoints in front */
c0ce998e 1456 if (flags & BP_GDB)
72cf2d4f 1457 QTAILQ_INSERT_HEAD(&env->watchpoints, wp, entry);
c0ce998e 1458 else
72cf2d4f 1459 QTAILQ_INSERT_TAIL(&env->watchpoints, wp, entry);
6658ffb8 1460
6658ffb8 1461 tlb_flush_page(env, addr);
a1d1bb31
AL
1462
1463 if (watchpoint)
1464 *watchpoint = wp;
1465 return 0;
6658ffb8
PB
1466}
1467
a1d1bb31
AL
1468/* Remove a specific watchpoint. */
1469int cpu_watchpoint_remove(CPUState *env, target_ulong addr, target_ulong len,
1470 int flags)
6658ffb8 1471{
b4051334 1472 target_ulong len_mask = ~(len - 1);
a1d1bb31 1473 CPUWatchpoint *wp;
6658ffb8 1474
72cf2d4f 1475 QTAILQ_FOREACH(wp, &env->watchpoints, entry) {
b4051334 1476 if (addr == wp->vaddr && len_mask == wp->len_mask
6e140f28 1477 && flags == (wp->flags & ~BP_WATCHPOINT_HIT)) {
a1d1bb31 1478 cpu_watchpoint_remove_by_ref(env, wp);
6658ffb8
PB
1479 return 0;
1480 }
1481 }
a1d1bb31 1482 return -ENOENT;
6658ffb8
PB
1483}
1484
a1d1bb31
AL
1485/* Remove a specific watchpoint by reference. */
1486void cpu_watchpoint_remove_by_ref(CPUState *env, CPUWatchpoint *watchpoint)
1487{
72cf2d4f 1488 QTAILQ_REMOVE(&env->watchpoints, watchpoint, entry);
7d03f82f 1489
a1d1bb31
AL
1490 tlb_flush_page(env, watchpoint->vaddr);
1491
1492 qemu_free(watchpoint);
1493}
1494
1495/* Remove all matching watchpoints. */
1496void cpu_watchpoint_remove_all(CPUState *env, int mask)
1497{
c0ce998e 1498 CPUWatchpoint *wp, *next;
a1d1bb31 1499
72cf2d4f 1500 QTAILQ_FOREACH_SAFE(wp, &env->watchpoints, entry, next) {
a1d1bb31
AL
1501 if (wp->flags & mask)
1502 cpu_watchpoint_remove_by_ref(env, wp);
c0ce998e 1503 }
7d03f82f 1504}
c527ee8f 1505#endif
7d03f82f 1506
a1d1bb31
AL
1507/* Add a breakpoint. */
1508int cpu_breakpoint_insert(CPUState *env, target_ulong pc, int flags,
1509 CPUBreakpoint **breakpoint)
4c3a88a2 1510{
1fddef4b 1511#if defined(TARGET_HAS_ICE)
c0ce998e 1512 CPUBreakpoint *bp;
3b46e624 1513
a1d1bb31 1514 bp = qemu_malloc(sizeof(*bp));
4c3a88a2 1515
a1d1bb31
AL
1516 bp->pc = pc;
1517 bp->flags = flags;
1518
2dc9f411 1519 /* keep all GDB-injected breakpoints in front */
c0ce998e 1520 if (flags & BP_GDB)
72cf2d4f 1521 QTAILQ_INSERT_HEAD(&env->breakpoints, bp, entry);
c0ce998e 1522 else
72cf2d4f 1523 QTAILQ_INSERT_TAIL(&env->breakpoints, bp, entry);
3b46e624 1524
d720b93d 1525 breakpoint_invalidate(env, pc);
a1d1bb31
AL
1526
1527 if (breakpoint)
1528 *breakpoint = bp;
4c3a88a2
FB
1529 return 0;
1530#else
a1d1bb31 1531 return -ENOSYS;
4c3a88a2
FB
1532#endif
1533}
1534
a1d1bb31
AL
1535/* Remove a specific breakpoint. */
1536int cpu_breakpoint_remove(CPUState *env, target_ulong pc, int flags)
1537{
7d03f82f 1538#if defined(TARGET_HAS_ICE)
a1d1bb31
AL
1539 CPUBreakpoint *bp;
1540
72cf2d4f 1541 QTAILQ_FOREACH(bp, &env->breakpoints, entry) {
a1d1bb31
AL
1542 if (bp->pc == pc && bp->flags == flags) {
1543 cpu_breakpoint_remove_by_ref(env, bp);
1544 return 0;
1545 }
7d03f82f 1546 }
a1d1bb31
AL
1547 return -ENOENT;
1548#else
1549 return -ENOSYS;
7d03f82f
EI
1550#endif
1551}
1552
a1d1bb31
AL
1553/* Remove a specific breakpoint by reference. */
1554void cpu_breakpoint_remove_by_ref(CPUState *env, CPUBreakpoint *breakpoint)
4c3a88a2 1555{
1fddef4b 1556#if defined(TARGET_HAS_ICE)
72cf2d4f 1557 QTAILQ_REMOVE(&env->breakpoints, breakpoint, entry);
d720b93d 1558
a1d1bb31
AL
1559 breakpoint_invalidate(env, breakpoint->pc);
1560
1561 qemu_free(breakpoint);
1562#endif
1563}
1564
1565/* Remove all matching breakpoints. */
1566void cpu_breakpoint_remove_all(CPUState *env, int mask)
1567{
1568#if defined(TARGET_HAS_ICE)
c0ce998e 1569 CPUBreakpoint *bp, *next;
a1d1bb31 1570
72cf2d4f 1571 QTAILQ_FOREACH_SAFE(bp, &env->breakpoints, entry, next) {
a1d1bb31
AL
1572 if (bp->flags & mask)
1573 cpu_breakpoint_remove_by_ref(env, bp);
c0ce998e 1574 }
4c3a88a2
FB
1575#endif
1576}
1577
c33a346e
FB
1578/* enable or disable single step mode. EXCP_DEBUG is returned by the
1579 CPU loop after each instruction */
1580void cpu_single_step(CPUState *env, int enabled)
1581{
1fddef4b 1582#if defined(TARGET_HAS_ICE)
c33a346e
FB
1583 if (env->singlestep_enabled != enabled) {
1584 env->singlestep_enabled = enabled;
e22a25c9
AL
1585 if (kvm_enabled())
1586 kvm_update_guest_debug(env, 0);
1587 else {
ccbb4d44 1588 /* must flush all the translated code to avoid inconsistencies */
e22a25c9
AL
1589 /* XXX: only flush what is necessary */
1590 tb_flush(env);
1591 }
c33a346e
FB
1592 }
1593#endif
1594}
1595
34865134
FB
 1596/* enable or disable low-level logging */
1597void cpu_set_log(int log_flags)
1598{
1599 loglevel = log_flags;
1600 if (loglevel && !logfile) {
11fcfab4 1601 logfile = fopen(logfilename, log_append ? "a" : "w");
34865134
FB
1602 if (!logfile) {
1603 perror(logfilename);
1604 _exit(1);
1605 }
9fa3e853
FB
1606#if !defined(CONFIG_SOFTMMU)
1607 /* must avoid mmap() usage of glibc by setting a buffer "by hand" */
1608 {
b55266b5 1609 static char logfile_buf[4096];
9fa3e853
FB
1610 setvbuf(logfile, logfile_buf, _IOLBF, sizeof(logfile_buf));
1611 }
bf65f53f
FN
1612#elif !defined(_WIN32)
1613 /* Win32 doesn't support line-buffering and requires size >= 2 */
34865134 1614 setvbuf(logfile, NULL, _IOLBF, 0);
9fa3e853 1615#endif
e735b91c
PB
1616 log_append = 1;
1617 }
1618 if (!loglevel && logfile) {
1619 fclose(logfile);
1620 logfile = NULL;
34865134
FB
1621 }
1622}
1623
1624void cpu_set_log_filename(const char *filename)
1625{
1626 logfilename = strdup(filename);
e735b91c
PB
1627 if (logfile) {
1628 fclose(logfile);
1629 logfile = NULL;
1630 }
1631 cpu_set_log(loglevel);
34865134 1632}
c33a346e 1633
3098dba0 1634static void cpu_unlink_tb(CPUState *env)
ea041c0e 1635{
3098dba0
AJ
1636 /* FIXME: TB unchaining isn't SMP safe. For now just ignore the
1637 problem and hope the cpu will stop of its own accord. For userspace
1638 emulation this often isn't actually as bad as it sounds. Often
1639 signals are used primarily to interrupt blocking syscalls. */
ea041c0e 1640 TranslationBlock *tb;
c227f099 1641 static spinlock_t interrupt_lock = SPIN_LOCK_UNLOCKED;
59817ccb 1642
cab1b4bd 1643 spin_lock(&interrupt_lock);
3098dba0
AJ
1644 tb = env->current_tb;
1645 /* if the cpu is currently executing code, we must unlink it and
 1646 all the potentially executing TBs */
f76cfe56 1647 if (tb) {
3098dba0
AJ
1648 env->current_tb = NULL;
1649 tb_reset_jump_recursive(tb);
be214e6c 1650 }
cab1b4bd 1651 spin_unlock(&interrupt_lock);
3098dba0
AJ
1652}
1653
97ffbd8d 1654#ifndef CONFIG_USER_ONLY
3098dba0 1655/* mask must never be zero, except for A20 change call */
ec6959d0 1656static void tcg_handle_interrupt(CPUState *env, int mask)
3098dba0
AJ
1657{
1658 int old_mask;
be214e6c 1659
2e70f6ef 1660 old_mask = env->interrupt_request;
68a79315 1661 env->interrupt_request |= mask;
3098dba0 1662
8edac960
AL
1663 /*
1664 * If called from iothread context, wake the target cpu in
 1665 * case it's halted.
1666 */
b7680cb6 1667 if (!qemu_cpu_is_self(env)) {
8edac960
AL
1668 qemu_cpu_kick(env);
1669 return;
1670 }
8edac960 1671
2e70f6ef 1672 if (use_icount) {
266910c4 1673 env->icount_decr.u16.high = 0xffff;
2e70f6ef 1674 if (!can_do_io(env)
be214e6c 1675 && (mask & ~old_mask) != 0) {
2e70f6ef
PB
1676 cpu_abort(env, "Raised interrupt while not in I/O function");
1677 }
2e70f6ef 1678 } else {
3098dba0 1679 cpu_unlink_tb(env);
ea041c0e
FB
1680 }
1681}
1682
ec6959d0
JK
1683CPUInterruptHandler cpu_interrupt_handler = tcg_handle_interrupt;
1684
97ffbd8d
JK
1685#else /* CONFIG_USER_ONLY */
1686
1687void cpu_interrupt(CPUState *env, int mask)
1688{
1689 env->interrupt_request |= mask;
1690 cpu_unlink_tb(env);
1691}
1692#endif /* CONFIG_USER_ONLY */
1693
b54ad049
FB
1694void cpu_reset_interrupt(CPUState *env, int mask)
1695{
1696 env->interrupt_request &= ~mask;
1697}
1698
3098dba0
AJ
1699void cpu_exit(CPUState *env)
1700{
1701 env->exit_request = 1;
1702 cpu_unlink_tb(env);
1703}
1704
c7cd6a37 1705const CPULogItem cpu_log_items[] = {
5fafdf24 1706 { CPU_LOG_TB_OUT_ASM, "out_asm",
f193c797
FB
1707 "show generated host assembly code for each compiled TB" },
1708 { CPU_LOG_TB_IN_ASM, "in_asm",
1709 "show target assembly code for each compiled TB" },
5fafdf24 1710 { CPU_LOG_TB_OP, "op",
57fec1fe 1711 "show micro ops for each compiled TB" },
f193c797 1712 { CPU_LOG_TB_OP_OPT, "op_opt",
e01a1157
BS
1713 "show micro ops "
1714#ifdef TARGET_I386
1715 "before eflags optimization and "
f193c797 1716#endif
e01a1157 1717 "after liveness analysis" },
f193c797
FB
1718 { CPU_LOG_INT, "int",
1719 "show interrupts/exceptions in short format" },
1720 { CPU_LOG_EXEC, "exec",
1721 "show trace before each executed TB (lots of logs)" },
9fddaa0c 1722 { CPU_LOG_TB_CPU, "cpu",
e91c8a77 1723 "show CPU state before block translation" },
f193c797
FB
1724#ifdef TARGET_I386
1725 { CPU_LOG_PCALL, "pcall",
1726 "show protected mode far calls/returns/exceptions" },
eca1bdf4
AL
1727 { CPU_LOG_RESET, "cpu_reset",
1728 "show CPU state before CPU resets" },
f193c797 1729#endif
8e3a9fd2 1730#ifdef DEBUG_IOPORT
fd872598
FB
1731 { CPU_LOG_IOPORT, "ioport",
1732 "show all i/o ports accesses" },
8e3a9fd2 1733#endif
f193c797
FB
1734 { 0, NULL, NULL },
1735};
1736
f6f3fbca
MT
1737#ifndef CONFIG_USER_ONLY
1738static QLIST_HEAD(memory_client_list, CPUPhysMemoryClient) memory_client_list
1739 = QLIST_HEAD_INITIALIZER(memory_client_list);
1740
1741static void cpu_notify_set_memory(target_phys_addr_t start_addr,
9742bf26 1742 ram_addr_t size,
0fd542fb
MT
1743 ram_addr_t phys_offset,
1744 bool log_dirty)
f6f3fbca
MT
1745{
1746 CPUPhysMemoryClient *client;
1747 QLIST_FOREACH(client, &memory_client_list, list) {
0fd542fb 1748 client->set_memory(client, start_addr, size, phys_offset, log_dirty);
f6f3fbca
MT
1749 }
1750}
1751
1752static int cpu_notify_sync_dirty_bitmap(target_phys_addr_t start,
9742bf26 1753 target_phys_addr_t end)
f6f3fbca
MT
1754{
1755 CPUPhysMemoryClient *client;
1756 QLIST_FOREACH(client, &memory_client_list, list) {
1757 int r = client->sync_dirty_bitmap(client, start, end);
1758 if (r < 0)
1759 return r;
1760 }
1761 return 0;
1762}
1763
1764static int cpu_notify_migration_log(int enable)
1765{
1766 CPUPhysMemoryClient *client;
1767 QLIST_FOREACH(client, &memory_client_list, list) {
1768 int r = client->migration_log(client, enable);
1769 if (r < 0)
1770 return r;
1771 }
1772 return 0;
1773}
1774
2173a75f
AW
1775struct last_map {
1776 target_phys_addr_t start_addr;
1777 ram_addr_t size;
1778 ram_addr_t phys_offset;
1779};
1780
8d4c78e7
AW
1781/* The l1_phys_map provides the upper P_L1_BITs of the guest physical
1782 * address. Each intermediate table provides the next L2_BITs of guest
 1783 * physical address space. The number of levels varies based on host and
1784 * guest configuration, making it efficient to build the final guest
1785 * physical address by seeding the L1 offset and shifting and adding in
1786 * each L2 offset as we recurse through them. */
2173a75f
AW
1787static void phys_page_for_each_1(CPUPhysMemoryClient *client, int level,
1788 void **lp, target_phys_addr_t addr,
1789 struct last_map *map)
f6f3fbca 1790{
5cd2c5b6 1791 int i;
f6f3fbca 1792
5cd2c5b6
RH
1793 if (*lp == NULL) {
1794 return;
1795 }
1796 if (level == 0) {
1797 PhysPageDesc *pd = *lp;
8d4c78e7 1798 addr <<= L2_BITS + TARGET_PAGE_BITS;
7296abac 1799 for (i = 0; i < L2_SIZE; ++i) {
5cd2c5b6 1800 if (pd[i].phys_offset != IO_MEM_UNASSIGNED) {
2173a75f
AW
1801 target_phys_addr_t start_addr = addr | i << TARGET_PAGE_BITS;
1802
1803 if (map->size &&
1804 start_addr == map->start_addr + map->size &&
1805 pd[i].phys_offset == map->phys_offset + map->size) {
1806
1807 map->size += TARGET_PAGE_SIZE;
1808 continue;
1809 } else if (map->size) {
1810 client->set_memory(client, map->start_addr,
1811 map->size, map->phys_offset, false);
1812 }
1813
1814 map->start_addr = start_addr;
1815 map->size = TARGET_PAGE_SIZE;
1816 map->phys_offset = pd[i].phys_offset;
f6f3fbca 1817 }
5cd2c5b6
RH
1818 }
1819 } else {
1820 void **pp = *lp;
7296abac 1821 for (i = 0; i < L2_SIZE; ++i) {
8d4c78e7 1822 phys_page_for_each_1(client, level - 1, pp + i,
2173a75f 1823 (addr << L2_BITS) | i, map);
f6f3fbca
MT
1824 }
1825 }
1826}
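/* Illustrative note (not part of the original file): assuming one
 * intermediate level below the L1 table, the leaf case above ends up
 * reporting
 *
 *     start_addr = (((l1_idx << L2_BITS) | mid_idx)
 *                       << (L2_BITS + TARGET_PAGE_BITS))
 *                  | (leaf_idx << TARGET_PAGE_BITS);
 *
 * i.e. every level contributes L2_BITS of the guest physical page number and
 * the leaf index supplies the lowest page-number bits, exactly as the comment
 * before phys_page_for_each_1() describes.  The l1_idx/mid_idx/leaf_idx
 * names are made up for this example. */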
1827
1828static void phys_page_for_each(CPUPhysMemoryClient *client)
1829{
5cd2c5b6 1830 int i;
2173a75f
AW
1831 struct last_map map = { };
1832
5cd2c5b6
RH
1833 for (i = 0; i < P_L1_SIZE; ++i) {
1834 phys_page_for_each_1(client, P_L1_SHIFT / L2_BITS - 1,
2173a75f
AW
1835 l1_phys_map + i, i, &map);
1836 }
1837 if (map.size) {
1838 client->set_memory(client, map.start_addr, map.size, map.phys_offset,
1839 false);
f6f3fbca 1840 }
f6f3fbca
MT
1841}
1842
1843void cpu_register_phys_memory_client(CPUPhysMemoryClient *client)
1844{
1845 QLIST_INSERT_HEAD(&memory_client_list, client, list);
1846 phys_page_for_each(client);
1847}
1848
1849void cpu_unregister_phys_memory_client(CPUPhysMemoryClient *client)
1850{
1851 QLIST_REMOVE(client, list);
1852}
1853#endif
1854
f193c797
FB
1855static int cmp1(const char *s1, int n, const char *s2)
1856{
1857 if (strlen(s2) != n)
1858 return 0;
1859 return memcmp(s1, s2, n) == 0;
1860}
3b46e624 1861
f193c797
FB
1862/* takes a comma separated list of log masks. Return 0 if error. */
1863int cpu_str_to_log_mask(const char *str)
1864{
c7cd6a37 1865 const CPULogItem *item;
f193c797
FB
1866 int mask;
1867 const char *p, *p1;
1868
1869 p = str;
1870 mask = 0;
1871 for(;;) {
1872 p1 = strchr(p, ',');
1873 if (!p1)
1874 p1 = p + strlen(p);
9742bf26
YT
1875 if(cmp1(p,p1-p,"all")) {
1876 for(item = cpu_log_items; item->mask != 0; item++) {
1877 mask |= item->mask;
1878 }
1879 } else {
1880 for(item = cpu_log_items; item->mask != 0; item++) {
1881 if (cmp1(p, p1 - p, item->name))
1882 goto found;
1883 }
1884 return 0;
f193c797 1885 }
f193c797
FB
1886 found:
1887 mask |= item->mask;
1888 if (*p1 != ',')
1889 break;
1890 p = p1 + 1;
1891 }
1892 return mask;
1893}
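/* Illustrative sketch (not part of the original file): how a caller might
 * turn a user-supplied "-d"-style option string into a log mask with the
 * parser above.  The option string is hypothetical; cpu_set_log() is assumed
 * to be the usual logging helper. */
#if 0   /* example only */
static void example_enable_logging(const char *opt)
{
    int mask = cpu_str_to_log_mask(opt);      /* e.g. opt = "in_asm,exec" */
    if (mask == 0) {
        fprintf(stderr, "unknown log option: %s\n", opt);
        return;
    }
    cpu_set_log(mask);
}
#endif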
ea041c0e 1894
7501267e
FB
1895void cpu_abort(CPUState *env, const char *fmt, ...)
1896{
1897 va_list ap;
493ae1f0 1898 va_list ap2;
7501267e
FB
1899
1900 va_start(ap, fmt);
493ae1f0 1901 va_copy(ap2, ap);
7501267e
FB
1902 fprintf(stderr, "qemu: fatal: ");
1903 vfprintf(stderr, fmt, ap);
1904 fprintf(stderr, "\n");
1905#ifdef TARGET_I386
7fe48483
FB
1906 cpu_dump_state(env, stderr, fprintf, X86_DUMP_FPU | X86_DUMP_CCOP);
1907#else
1908 cpu_dump_state(env, stderr, fprintf, 0);
7501267e 1909#endif
93fcfe39
AL
1910 if (qemu_log_enabled()) {
1911 qemu_log("qemu: fatal: ");
1912 qemu_log_vprintf(fmt, ap2);
1913 qemu_log("\n");
f9373291 1914#ifdef TARGET_I386
93fcfe39 1915 log_cpu_state(env, X86_DUMP_FPU | X86_DUMP_CCOP);
f9373291 1916#else
93fcfe39 1917 log_cpu_state(env, 0);
f9373291 1918#endif
31b1a7b4 1919 qemu_log_flush();
93fcfe39 1920 qemu_log_close();
924edcae 1921 }
493ae1f0 1922 va_end(ap2);
f9373291 1923 va_end(ap);
fd052bf6
RV
1924#if defined(CONFIG_USER_ONLY)
1925 {
1926 struct sigaction act;
1927 sigfillset(&act.sa_mask);
1928 act.sa_handler = SIG_DFL;
1929 sigaction(SIGABRT, &act, NULL);
1930 }
1931#endif
7501267e
FB
1932 abort();
1933}
1934
c5be9f08
TS
1935CPUState *cpu_copy(CPUState *env)
1936{
01ba9816 1937 CPUState *new_env = cpu_init(env->cpu_model_str);
c5be9f08
TS
1938 CPUState *next_cpu = new_env->next_cpu;
1939 int cpu_index = new_env->cpu_index;
5a38f081
AL
1940#if defined(TARGET_HAS_ICE)
1941 CPUBreakpoint *bp;
1942 CPUWatchpoint *wp;
1943#endif
1944
c5be9f08 1945 memcpy(new_env, env, sizeof(CPUState));
5a38f081
AL
1946
1947 /* Preserve chaining and index. */
c5be9f08
TS
1948 new_env->next_cpu = next_cpu;
1949 new_env->cpu_index = cpu_index;
5a38f081
AL
1950
1951 /* Clone all break/watchpoints.
1952 Note: Once we support ptrace with hw-debug register access, make sure
1953 BP_CPU break/watchpoints are handled correctly on clone. */
72cf2d4f
BS
1954 QTAILQ_INIT(&env->breakpoints);
1955 QTAILQ_INIT(&env->watchpoints);
5a38f081 1956#if defined(TARGET_HAS_ICE)
72cf2d4f 1957 QTAILQ_FOREACH(bp, &env->breakpoints, entry) {
5a38f081
AL
1958 cpu_breakpoint_insert(new_env, bp->pc, bp->flags, NULL);
1959 }
72cf2d4f 1960 QTAILQ_FOREACH(wp, &env->watchpoints, entry) {
5a38f081
AL
1961 cpu_watchpoint_insert(new_env, wp->vaddr, (~wp->len_mask) + 1,
1962 wp->flags, NULL);
1963 }
1964#endif
1965
c5be9f08
TS
1966 return new_env;
1967}
1968
0124311e
FB
1969#if !defined(CONFIG_USER_ONLY)
1970
5c751e99
EI
1971static inline void tlb_flush_jmp_cache(CPUState *env, target_ulong addr)
1972{
1973 unsigned int i;
1974
1975 /* Discard jump cache entries for any tb which might potentially
1976 overlap the flushed page. */
1977 i = tb_jmp_cache_hash_page(addr - TARGET_PAGE_SIZE);
1978 memset (&env->tb_jmp_cache[i], 0,
9742bf26 1979 TB_JMP_PAGE_SIZE * sizeof(TranslationBlock *));
5c751e99
EI
1980
1981 i = tb_jmp_cache_hash_page(addr);
1982 memset (&env->tb_jmp_cache[i], 0,
9742bf26 1983 TB_JMP_PAGE_SIZE * sizeof(TranslationBlock *));
5c751e99
EI
1984}
1985
08738984
IK
1986static CPUTLBEntry s_cputlb_empty_entry = {
1987 .addr_read = -1,
1988 .addr_write = -1,
1989 .addr_code = -1,
1990 .addend = -1,
1991};
1992
ee8b7021
FB
1993/* NOTE: if flush_global is true, also flush global entries (not
1994 implemented yet) */
1995void tlb_flush(CPUState *env, int flush_global)
33417e70 1996{
33417e70 1997 int i;
0124311e 1998
9fa3e853
FB
1999#if defined(DEBUG_TLB)
2000 printf("tlb_flush:\n");
2001#endif
0124311e
FB
2002 /* must reset current TB so that interrupts cannot modify the
2003 links while we are modifying them */
2004 env->current_tb = NULL;
2005
33417e70 2006 for(i = 0; i < CPU_TLB_SIZE; i++) {
cfde4bd9
IY
2007 int mmu_idx;
2008 for (mmu_idx = 0; mmu_idx < NB_MMU_MODES; mmu_idx++) {
08738984 2009 env->tlb_table[mmu_idx][i] = s_cputlb_empty_entry;
cfde4bd9 2010 }
33417e70 2011 }
9fa3e853 2012
8a40a180 2013 memset (env->tb_jmp_cache, 0, TB_JMP_CACHE_SIZE * sizeof (void *));
9fa3e853 2014
d4c430a8
PB
2015 env->tlb_flush_addr = -1;
2016 env->tlb_flush_mask = 0;
e3db7226 2017 tlb_flush_count++;
33417e70
FB
2018}
2019
274da6b2 2020static inline void tlb_flush_entry(CPUTLBEntry *tlb_entry, target_ulong addr)
61382a50 2021{
5fafdf24 2022 if (addr == (tlb_entry->addr_read &
84b7b8e7 2023 (TARGET_PAGE_MASK | TLB_INVALID_MASK)) ||
5fafdf24 2024 addr == (tlb_entry->addr_write &
84b7b8e7 2025 (TARGET_PAGE_MASK | TLB_INVALID_MASK)) ||
5fafdf24 2026 addr == (tlb_entry->addr_code &
84b7b8e7 2027 (TARGET_PAGE_MASK | TLB_INVALID_MASK))) {
08738984 2028 *tlb_entry = s_cputlb_empty_entry;
84b7b8e7 2029 }
61382a50
FB
2030}
2031
2e12669a 2032void tlb_flush_page(CPUState *env, target_ulong addr)
33417e70 2033{
8a40a180 2034 int i;
cfde4bd9 2035 int mmu_idx;
0124311e 2036
9fa3e853 2037#if defined(DEBUG_TLB)
108c49b8 2038 printf("tlb_flush_page: " TARGET_FMT_lx "\n", addr);
9fa3e853 2039#endif
d4c430a8
PB
2040 /* Check if we need to flush due to large pages. */
2041 if ((addr & env->tlb_flush_mask) == env->tlb_flush_addr) {
2042#if defined(DEBUG_TLB)
2043 printf("tlb_flush_page: forced full flush ("
2044 TARGET_FMT_lx "/" TARGET_FMT_lx ")\n",
2045 env->tlb_flush_addr, env->tlb_flush_mask);
2046#endif
2047 tlb_flush(env, 1);
2048 return;
2049 }
0124311e
FB
2050 /* must reset current TB so that interrupts cannot modify the
2051 links while we are modifying them */
2052 env->current_tb = NULL;
61382a50
FB
2053
2054 addr &= TARGET_PAGE_MASK;
2055 i = (addr >> TARGET_PAGE_BITS) & (CPU_TLB_SIZE - 1);
cfde4bd9
IY
2056 for (mmu_idx = 0; mmu_idx < NB_MMU_MODES; mmu_idx++)
2057 tlb_flush_entry(&env->tlb_table[mmu_idx][i], addr);
0124311e 2058
5c751e99 2059 tlb_flush_jmp_cache(env, addr);
9fa3e853
FB
2060}
2061
9fa3e853
FB
2062/* update the TLBs so that writes to code in the virtual page 'addr'
2063 can be detected */
c227f099 2064static void tlb_protect_code(ram_addr_t ram_addr)
9fa3e853 2065{
5fafdf24 2066 cpu_physical_memory_reset_dirty(ram_addr,
6a00d601
FB
2067 ram_addr + TARGET_PAGE_SIZE,
2068 CODE_DIRTY_FLAG);
9fa3e853
FB
2069}
2070
9fa3e853 2071/* update the TLB so that writes in physical page 'phys_addr' are no longer
3a7d929e 2072 tested for self modifying code */
c227f099 2073static void tlb_unprotect_code_phys(CPUState *env, ram_addr_t ram_addr,
3a7d929e 2074 target_ulong vaddr)
9fa3e853 2075{
f7c11b53 2076 cpu_physical_memory_set_dirty_flags(ram_addr, CODE_DIRTY_FLAG);
1ccde1cb
FB
2077}
2078
5fafdf24 2079static inline void tlb_reset_dirty_range(CPUTLBEntry *tlb_entry,
1ccde1cb
FB
2080 unsigned long start, unsigned long length)
2081{
2082 unsigned long addr;
84b7b8e7
FB
2083 if ((tlb_entry->addr_write & ~TARGET_PAGE_MASK) == IO_MEM_RAM) {
2084 addr = (tlb_entry->addr_write & TARGET_PAGE_MASK) + tlb_entry->addend;
1ccde1cb 2085 if ((addr - start) < length) {
0f459d16 2086 tlb_entry->addr_write = (tlb_entry->addr_write & TARGET_PAGE_MASK) | TLB_NOTDIRTY;
1ccde1cb
FB
2087 }
2088 }
2089}
2090
5579c7f3 2091/* Note: start and end must be within the same ram block. */
c227f099 2092void cpu_physical_memory_reset_dirty(ram_addr_t start, ram_addr_t end,
0a962c02 2093 int dirty_flags)
1ccde1cb
FB
2094{
2095 CPUState *env;
4f2ac237 2096 unsigned long length, start1;
f7c11b53 2097 int i;
1ccde1cb
FB
2098
2099 start &= TARGET_PAGE_MASK;
2100 end = TARGET_PAGE_ALIGN(end);
2101
2102 length = end - start;
2103 if (length == 0)
2104 return;
f7c11b53 2105 cpu_physical_memory_mask_dirty_range(start, length, dirty_flags);
f23db169 2106
1ccde1cb
FB
2107 /* we modify the TLB cache so that the dirty bit will be set again
2108 when accessing the range */
b2e0a138 2109 start1 = (unsigned long)qemu_safe_ram_ptr(start);
a57d23e4 2110 /* Check that we don't span multiple blocks - this breaks the
5579c7f3 2111 address comparisons below. */
b2e0a138 2112 if ((unsigned long)qemu_safe_ram_ptr(end - 1) - start1
5579c7f3
PB
2113 != (end - 1) - start) {
2114 abort();
2115 }
2116
6a00d601 2117 for(env = first_cpu; env != NULL; env = env->next_cpu) {
cfde4bd9
IY
2118 int mmu_idx;
2119 for (mmu_idx = 0; mmu_idx < NB_MMU_MODES; mmu_idx++) {
2120 for(i = 0; i < CPU_TLB_SIZE; i++)
2121 tlb_reset_dirty_range(&env->tlb_table[mmu_idx][i],
2122 start1, length);
2123 }
6a00d601 2124 }
1ccde1cb
FB
2125}
2126
74576198
AL
2127int cpu_physical_memory_set_dirty_tracking(int enable)
2128{
f6f3fbca 2129 int ret = 0;
74576198 2130 in_migration = enable;
f6f3fbca
MT
2131 ret = cpu_notify_migration_log(!!enable);
2132 return ret;
74576198
AL
2133}
2134
2135int cpu_physical_memory_get_dirty_tracking(void)
2136{
2137 return in_migration;
2138}
2139
c227f099
AL
2140int cpu_physical_sync_dirty_bitmap(target_phys_addr_t start_addr,
2141 target_phys_addr_t end_addr)
2bec46dc 2142{
7b8f3b78 2143 int ret;
151f7749 2144
f6f3fbca 2145 ret = cpu_notify_sync_dirty_bitmap(start_addr, end_addr);
151f7749 2146 return ret;
2bec46dc
AL
2147}
2148
e5896b12
AP
2149int cpu_physical_log_start(target_phys_addr_t start_addr,
2150 ram_addr_t size)
2151{
2152 CPUPhysMemoryClient *client;
2153 QLIST_FOREACH(client, &memory_client_list, list) {
2154 if (client->log_start) {
2155 int r = client->log_start(client, start_addr, size);
2156 if (r < 0) {
2157 return r;
2158 }
2159 }
2160 }
2161 return 0;
2162}
2163
2164int cpu_physical_log_stop(target_phys_addr_t start_addr,
2165 ram_addr_t size)
2166{
2167 CPUPhysMemoryClient *client;
2168 QLIST_FOREACH(client, &memory_client_list, list) {
2169 if (client->log_stop) {
2170 int r = client->log_stop(client, start_addr, size);
2171 if (r < 0) {
2172 return r;
2173 }
2174 }
2175 }
2176 return 0;
2177}
2178
3a7d929e
FB
2179static inline void tlb_update_dirty(CPUTLBEntry *tlb_entry)
2180{
c227f099 2181 ram_addr_t ram_addr;
5579c7f3 2182 void *p;
3a7d929e 2183
84b7b8e7 2184 if ((tlb_entry->addr_write & ~TARGET_PAGE_MASK) == IO_MEM_RAM) {
5579c7f3
PB
2185 p = (void *)(unsigned long)((tlb_entry->addr_write & TARGET_PAGE_MASK)
2186 + tlb_entry->addend);
e890261f 2187 ram_addr = qemu_ram_addr_from_host_nofail(p);
3a7d929e 2188 if (!cpu_physical_memory_is_dirty(ram_addr)) {
0f459d16 2189 tlb_entry->addr_write |= TLB_NOTDIRTY;
3a7d929e
FB
2190 }
2191 }
2192}
2193
2194/* update the TLB according to the current state of the dirty bits */
2195void cpu_tlb_update_dirty(CPUState *env)
2196{
2197 int i;
cfde4bd9
IY
2198 int mmu_idx;
2199 for (mmu_idx = 0; mmu_idx < NB_MMU_MODES; mmu_idx++) {
2200 for(i = 0; i < CPU_TLB_SIZE; i++)
2201 tlb_update_dirty(&env->tlb_table[mmu_idx][i]);
2202 }
3a7d929e
FB
2203}
2204
0f459d16 2205static inline void tlb_set_dirty1(CPUTLBEntry *tlb_entry, target_ulong vaddr)
1ccde1cb 2206{
0f459d16
PB
2207 if (tlb_entry->addr_write == (vaddr | TLB_NOTDIRTY))
2208 tlb_entry->addr_write = vaddr;
1ccde1cb
FB
2209}
2210
0f459d16
PB
2211/* update the TLB corresponding to virtual page vaddr
2212 so that it is no longer dirty */
2213static inline void tlb_set_dirty(CPUState *env, target_ulong vaddr)
1ccde1cb 2214{
1ccde1cb 2215 int i;
cfde4bd9 2216 int mmu_idx;
1ccde1cb 2217
0f459d16 2218 vaddr &= TARGET_PAGE_MASK;
1ccde1cb 2219 i = (vaddr >> TARGET_PAGE_BITS) & (CPU_TLB_SIZE - 1);
cfde4bd9
IY
2220 for (mmu_idx = 0; mmu_idx < NB_MMU_MODES; mmu_idx++)
2221 tlb_set_dirty1(&env->tlb_table[mmu_idx][i], vaddr);
9fa3e853
FB
2222}
2223
d4c430a8
PB
2224/* Our TLB does not support large pages, so remember the area covered by
2225 large pages and trigger a full TLB flush if these are invalidated. */
2226static void tlb_add_large_page(CPUState *env, target_ulong vaddr,
2227 target_ulong size)
2228{
2229 target_ulong mask = ~(size - 1);
2230
2231 if (env->tlb_flush_addr == (target_ulong)-1) {
2232 env->tlb_flush_addr = vaddr & mask;
2233 env->tlb_flush_mask = mask;
2234 return;
2235 }
2236 /* Extend the existing region to include the new page.
2237 This is a compromise between unnecessary flushes and the cost
2238 of maintaining a full variable size TLB. */
2239 mask &= env->tlb_flush_mask;
2240 while (((env->tlb_flush_addr ^ vaddr) & mask) != 0) {
2241 mask <<= 1;
2242 }
2243 env->tlb_flush_addr &= mask;
2244 env->tlb_flush_mask = mask;
2245}
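/* Illustrative worked example (not part of the original file): suppose a
 * 2MB page was recorded at 0x00200000 (tlb_flush_addr = 0x00200000,
 * tlb_flush_mask = ~0x1fffff) and a second 2MB page is added at 0x00600000.
 * The xor of the two addresses is 0x00400000, so the loop above widens the
 * mask twice (~0x1fffff -> ~0x3fffff -> ~0x7fffff) until the differing bit
 * is covered, and the tracked region becomes the 8MB block
 * 0x00000000-0x007fffff.  A later tlb_flush_page() anywhere in that block
 * then forces a full TLB flush.  The addresses are made up for this
 * example. */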
2246
2247/* Add a new TLB entry. At most one entry for a given virtual address
2248 is permitted. Only a single TARGET_PAGE_SIZE region is mapped, the
2249 supplied size is only used by tlb_flush_page. */
2250void tlb_set_page(CPUState *env, target_ulong vaddr,
2251 target_phys_addr_t paddr, int prot,
2252 int mmu_idx, target_ulong size)
9fa3e853 2253{
92e873b9 2254 PhysPageDesc *p;
4f2ac237 2255 unsigned long pd;
9fa3e853 2256 unsigned int index;
4f2ac237 2257 target_ulong address;
0f459d16 2258 target_ulong code_address;
355b1943 2259 unsigned long addend;
84b7b8e7 2260 CPUTLBEntry *te;
a1d1bb31 2261 CPUWatchpoint *wp;
c227f099 2262 target_phys_addr_t iotlb;
9fa3e853 2263
d4c430a8
PB
2264 assert(size >= TARGET_PAGE_SIZE);
2265 if (size != TARGET_PAGE_SIZE) {
2266 tlb_add_large_page(env, vaddr, size);
2267 }
92e873b9 2268 p = phys_page_find(paddr >> TARGET_PAGE_BITS);
9fa3e853
FB
2269 if (!p) {
2270 pd = IO_MEM_UNASSIGNED;
9fa3e853
FB
2271 } else {
2272 pd = p->phys_offset;
9fa3e853
FB
2273 }
2274#if defined(DEBUG_TLB)
7fd3f494
SW
2275 printf("tlb_set_page: vaddr=" TARGET_FMT_lx " paddr=0x" TARGET_FMT_plx
2276 " prot=%x idx=%d pd=0x%08lx\n",
2277 vaddr, paddr, prot, mmu_idx, pd);
9fa3e853
FB
2278#endif
2279
0f459d16
PB
2280 address = vaddr;
2281 if ((pd & ~TARGET_PAGE_MASK) > IO_MEM_ROM && !(pd & IO_MEM_ROMD)) {
2282 /* IO memory case (romd handled later) */
2283 address |= TLB_MMIO;
2284 }
5579c7f3 2285 addend = (unsigned long)qemu_get_ram_ptr(pd & TARGET_PAGE_MASK);
0f459d16
PB
2286 if ((pd & ~TARGET_PAGE_MASK) <= IO_MEM_ROM) {
2287 /* Normal RAM. */
2288 iotlb = pd & TARGET_PAGE_MASK;
2289 if ((pd & ~TARGET_PAGE_MASK) == IO_MEM_RAM)
2290 iotlb |= IO_MEM_NOTDIRTY;
2291 else
2292 iotlb |= IO_MEM_ROM;
2293 } else {
ccbb4d44 2294 /* IO handlers are currently passed a physical address.
0f459d16
PB
2295 It would be nice to pass an offset from the base address
2296 of that region. This would avoid having to special case RAM,
2297 and avoid full address decoding in every device.
2298 We can't use the high bits of pd for this because
2299 IO_MEM_ROMD uses these as a ram address. */
8da3ff18
PB
2300 iotlb = (pd & ~TARGET_PAGE_MASK);
2301 if (p) {
8da3ff18
PB
2302 iotlb += p->region_offset;
2303 } else {
2304 iotlb += paddr;
2305 }
0f459d16
PB
2306 }
2307
2308 code_address = address;
2309 /* Make accesses to pages with watchpoints go via the
2310 watchpoint trap routines. */
72cf2d4f 2311 QTAILQ_FOREACH(wp, &env->watchpoints, entry) {
a1d1bb31 2312 if (vaddr == (wp->vaddr & TARGET_PAGE_MASK)) {
bf298f83
JK
2313 /* Avoid trapping reads of pages with a write breakpoint. */
2314 if ((prot & PAGE_WRITE) || (wp->flags & BP_MEM_READ)) {
2315 iotlb = io_mem_watch + paddr;
2316 address |= TLB_MMIO;
2317 break;
2318 }
6658ffb8 2319 }
0f459d16 2320 }
d79acba4 2321
0f459d16
PB
2322 index = (vaddr >> TARGET_PAGE_BITS) & (CPU_TLB_SIZE - 1);
2323 env->iotlb[mmu_idx][index] = iotlb - vaddr;
2324 te = &env->tlb_table[mmu_idx][index];
2325 te->addend = addend - vaddr;
2326 if (prot & PAGE_READ) {
2327 te->addr_read = address;
2328 } else {
2329 te->addr_read = -1;
2330 }
5c751e99 2331
0f459d16
PB
2332 if (prot & PAGE_EXEC) {
2333 te->addr_code = code_address;
2334 } else {
2335 te->addr_code = -1;
2336 }
2337 if (prot & PAGE_WRITE) {
2338 if ((pd & ~TARGET_PAGE_MASK) == IO_MEM_ROM ||
2339 (pd & IO_MEM_ROMD)) {
2340 /* Write access calls the I/O callback. */
2341 te->addr_write = address | TLB_MMIO;
2342 } else if ((pd & ~TARGET_PAGE_MASK) == IO_MEM_RAM &&
2343 !cpu_physical_memory_is_dirty(pd)) {
2344 te->addr_write = address | TLB_NOTDIRTY;
9fa3e853 2345 } else {
0f459d16 2346 te->addr_write = address;
9fa3e853 2347 }
0f459d16
PB
2348 } else {
2349 te->addr_write = -1;
9fa3e853 2350 }
9fa3e853
FB
2351}
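/* Illustrative sketch (not part of the original file): conceptually, the
 * softmmu fast path that consumes the entry installed above looks like the
 * code below.  The real lookup lives in the generated code and the softmmu
 * templates; the function and variable names are made up and details
 * (alignment checks, access size) are omitted. */
#if 0   /* example only */
static void *example_tlb_lookup_read(CPUState *env, target_ulong vaddr,
                                     int mmu_idx)
{
    unsigned int index = (vaddr >> TARGET_PAGE_BITS) & (CPU_TLB_SIZE - 1);
    CPUTLBEntry *te = &env->tlb_table[mmu_idx][index];

    if ((vaddr & TARGET_PAGE_MASK) ==
        (te->addr_read & (TARGET_PAGE_MASK | TLB_INVALID_MASK))) {
        if (te->addr_read & ~TARGET_PAGE_MASK) {
            /* TLB_MMIO etc.: the access goes through io_mem_read[]. */
            return NULL;
        }
        /* RAM fast path: addend converts a guest virtual address into a
           host pointer. */
        return (void *)(unsigned long)(vaddr + te->addend);
    }
    /* Miss: refill via tlb_fill() -> tlb_set_page() and retry. */
    return NULL;
}
#endif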
2352
0124311e
FB
2353#else
2354
ee8b7021 2355void tlb_flush(CPUState *env, int flush_global)
0124311e
FB
2356{
2357}
2358
2e12669a 2359void tlb_flush_page(CPUState *env, target_ulong addr)
0124311e
FB
2360{
2361}
2362
edf8e2af
MW
2363/*
2364 * Walks guest process memory "regions" one by one
2365 * and calls callback function 'fn' for each region.
2366 */
5cd2c5b6
RH
2367
2368struct walk_memory_regions_data
2369{
2370 walk_memory_regions_fn fn;
2371 void *priv;
2372 unsigned long start;
2373 int prot;
2374};
2375
2376static int walk_memory_regions_end(struct walk_memory_regions_data *data,
b480d9b7 2377 abi_ulong end, int new_prot)
5cd2c5b6
RH
2378{
2379 if (data->start != -1ul) {
2380 int rc = data->fn(data->priv, data->start, end, data->prot);
2381 if (rc != 0) {
2382 return rc;
2383 }
2384 }
2385
2386 data->start = (new_prot ? end : -1ul);
2387 data->prot = new_prot;
2388
2389 return 0;
2390}
2391
2392static int walk_memory_regions_1(struct walk_memory_regions_data *data,
b480d9b7 2393 abi_ulong base, int level, void **lp)
5cd2c5b6 2394{
b480d9b7 2395 abi_ulong pa;
5cd2c5b6
RH
2396 int i, rc;
2397
2398 if (*lp == NULL) {
2399 return walk_memory_regions_end(data, base, 0);
2400 }
2401
2402 if (level == 0) {
2403 PageDesc *pd = *lp;
7296abac 2404 for (i = 0; i < L2_SIZE; ++i) {
5cd2c5b6
RH
2405 int prot = pd[i].flags;
2406
2407 pa = base | (i << TARGET_PAGE_BITS);
2408 if (prot != data->prot) {
2409 rc = walk_memory_regions_end(data, pa, prot);
2410 if (rc != 0) {
2411 return rc;
9fa3e853 2412 }
9fa3e853 2413 }
5cd2c5b6
RH
2414 }
2415 } else {
2416 void **pp = *lp;
7296abac 2417 for (i = 0; i < L2_SIZE; ++i) {
b480d9b7
PB
2418 pa = base | ((abi_ulong)i <<
2419 (TARGET_PAGE_BITS + L2_BITS * level));
5cd2c5b6
RH
2420 rc = walk_memory_regions_1(data, pa, level - 1, pp + i);
2421 if (rc != 0) {
2422 return rc;
2423 }
2424 }
2425 }
2426
2427 return 0;
2428}
2429
2430int walk_memory_regions(void *priv, walk_memory_regions_fn fn)
2431{
2432 struct walk_memory_regions_data data;
2433 unsigned long i;
2434
2435 data.fn = fn;
2436 data.priv = priv;
2437 data.start = -1ul;
2438 data.prot = 0;
2439
2440 for (i = 0; i < V_L1_SIZE; i++) {
b480d9b7 2441 int rc = walk_memory_regions_1(&data, (abi_ulong)i << V_L1_SHIFT,
5cd2c5b6
RH
2442 V_L1_SHIFT / L2_BITS - 1, l1_map + i);
2443 if (rc != 0) {
2444 return rc;
9fa3e853 2445 }
33417e70 2446 }
5cd2c5b6
RH
2447
2448 return walk_memory_regions_end(&data, 0, 0);
edf8e2af
MW
2449}
2450
b480d9b7
PB
2451static int dump_region(void *priv, abi_ulong start,
2452 abi_ulong end, unsigned long prot)
edf8e2af
MW
2453{
2454 FILE *f = (FILE *)priv;
2455
b480d9b7
PB
2456 (void) fprintf(f, TARGET_ABI_FMT_lx"-"TARGET_ABI_FMT_lx
2457 " "TARGET_ABI_FMT_lx" %c%c%c\n",
edf8e2af
MW
2458 start, end, end - start,
2459 ((prot & PAGE_READ) ? 'r' : '-'),
2460 ((prot & PAGE_WRITE) ? 'w' : '-'),
2461 ((prot & PAGE_EXEC) ? 'x' : '-'));
2462
2463 return (0);
2464}
2465
2466/* dump memory mappings */
2467void page_dump(FILE *f)
2468{
2469 (void) fprintf(f, "%-8s %-8s %-8s %s\n",
2470 "start", "end", "size", "prot");
2471 walk_memory_regions(f, dump_region);
33417e70
FB
2472}
2473
53a5960a 2474int page_get_flags(target_ulong address)
33417e70 2475{
9fa3e853
FB
2476 PageDesc *p;
2477
2478 p = page_find(address >> TARGET_PAGE_BITS);
33417e70 2479 if (!p)
9fa3e853
FB
2480 return 0;
2481 return p->flags;
2482}
2483
376a7909
RH
2484/* Modify the flags of a page and invalidate the code if necessary.
 2485 The flag PAGE_WRITE_ORG is set automatically depending
2486 on PAGE_WRITE. The mmap_lock should already be held. */
53a5960a 2487void page_set_flags(target_ulong start, target_ulong end, int flags)
9fa3e853 2488{
376a7909
RH
2489 target_ulong addr, len;
2490
2491 /* This function should never be called with addresses outside the
2492 guest address space. If this assert fires, it probably indicates
2493 a missing call to h2g_valid. */
b480d9b7
PB
2494#if TARGET_ABI_BITS > L1_MAP_ADDR_SPACE_BITS
2495 assert(end < ((abi_ulong)1 << L1_MAP_ADDR_SPACE_BITS));
376a7909
RH
2496#endif
2497 assert(start < end);
9fa3e853
FB
2498
2499 start = start & TARGET_PAGE_MASK;
2500 end = TARGET_PAGE_ALIGN(end);
376a7909
RH
2501
2502 if (flags & PAGE_WRITE) {
9fa3e853 2503 flags |= PAGE_WRITE_ORG;
376a7909
RH
2504 }
2505
2506 for (addr = start, len = end - start;
2507 len != 0;
2508 len -= TARGET_PAGE_SIZE, addr += TARGET_PAGE_SIZE) {
2509 PageDesc *p = page_find_alloc(addr >> TARGET_PAGE_BITS, 1);
2510
2511 /* If the write protection bit is set, then we invalidate
2512 the code inside. */
5fafdf24 2513 if (!(p->flags & PAGE_WRITE) &&
9fa3e853
FB
2514 (flags & PAGE_WRITE) &&
2515 p->first_tb) {
d720b93d 2516 tb_invalidate_phys_page(addr, 0, NULL);
9fa3e853
FB
2517 }
2518 p->flags = flags;
2519 }
33417e70
FB
2520}
2521
3d97b40b
TS
2522int page_check_range(target_ulong start, target_ulong len, int flags)
2523{
2524 PageDesc *p;
2525 target_ulong end;
2526 target_ulong addr;
2527
376a7909
RH
2528 /* This function should never be called with addresses outside the
2529 guest address space. If this assert fires, it probably indicates
2530 a missing call to h2g_valid. */
338e9e6c
BS
2531#if TARGET_ABI_BITS > L1_MAP_ADDR_SPACE_BITS
2532 assert(start < ((abi_ulong)1 << L1_MAP_ADDR_SPACE_BITS));
376a7909
RH
2533#endif
2534
3e0650a9
RH
2535 if (len == 0) {
2536 return 0;
2537 }
376a7909
RH
2538 if (start + len - 1 < start) {
2539 /* We've wrapped around. */
55f280c9 2540 return -1;
376a7909 2541 }
55f280c9 2542
3d97b40b
TS
 2543 end = TARGET_PAGE_ALIGN(start+len); /* must do before we lose bits in the next step */
2544 start = start & TARGET_PAGE_MASK;
2545
376a7909
RH
2546 for (addr = start, len = end - start;
2547 len != 0;
2548 len -= TARGET_PAGE_SIZE, addr += TARGET_PAGE_SIZE) {
3d97b40b
TS
2549 p = page_find(addr >> TARGET_PAGE_BITS);
2550 if( !p )
2551 return -1;
2552 if( !(p->flags & PAGE_VALID) )
2553 return -1;
2554
dae3270c 2555 if ((flags & PAGE_READ) && !(p->flags & PAGE_READ))
3d97b40b 2556 return -1;
dae3270c
FB
2557 if (flags & PAGE_WRITE) {
2558 if (!(p->flags & PAGE_WRITE_ORG))
2559 return -1;
2560 /* unprotect the page if it was put read-only because it
2561 contains translated code */
2562 if (!(p->flags & PAGE_WRITE)) {
2563 if (!page_unprotect(addr, 0, NULL))
2564 return -1;
2565 }
2566 return 0;
2567 }
3d97b40b
TS
2568 }
2569 return 0;
2570}
2571
9fa3e853 2572/* called from signal handler: invalidate the code and unprotect the
ccbb4d44 2573 page. Return TRUE if the fault was successfully handled. */
53a5960a 2574int page_unprotect(target_ulong address, unsigned long pc, void *puc)
9fa3e853 2575{
45d679d6
AJ
2576 unsigned int prot;
2577 PageDesc *p;
53a5960a 2578 target_ulong host_start, host_end, addr;
9fa3e853 2579
c8a706fe
PB
2580 /* Technically this isn't safe inside a signal handler. However we
2581 know this only ever happens in a synchronous SEGV handler, so in
2582 practice it seems to be ok. */
2583 mmap_lock();
2584
45d679d6
AJ
2585 p = page_find(address >> TARGET_PAGE_BITS);
2586 if (!p) {
c8a706fe 2587 mmap_unlock();
9fa3e853 2588 return 0;
c8a706fe 2589 }
45d679d6 2590
9fa3e853
FB
2591 /* if the page was really writable, then we change its
2592 protection back to writable */
45d679d6
AJ
2593 if ((p->flags & PAGE_WRITE_ORG) && !(p->flags & PAGE_WRITE)) {
2594 host_start = address & qemu_host_page_mask;
2595 host_end = host_start + qemu_host_page_size;
2596
2597 prot = 0;
2598 for (addr = host_start ; addr < host_end ; addr += TARGET_PAGE_SIZE) {
2599 p = page_find(addr >> TARGET_PAGE_BITS);
2600 p->flags |= PAGE_WRITE;
2601 prot |= p->flags;
2602
9fa3e853
FB
2603 /* and since the content will be modified, we must invalidate
2604 the corresponding translated code. */
45d679d6 2605 tb_invalidate_phys_page(addr, pc, puc);
9fa3e853 2606#ifdef DEBUG_TB_CHECK
45d679d6 2607 tb_invalidate_check(addr);
9fa3e853 2608#endif
9fa3e853 2609 }
45d679d6
AJ
2610 mprotect((void *)g2h(host_start), qemu_host_page_size,
2611 prot & PAGE_BITS);
2612
2613 mmap_unlock();
2614 return 1;
9fa3e853 2615 }
c8a706fe 2616 mmap_unlock();
9fa3e853
FB
2617 return 0;
2618}
2619
6a00d601
FB
2620static inline void tlb_set_dirty(CPUState *env,
2621 unsigned long addr, target_ulong vaddr)
1ccde1cb
FB
2622{
2623}
9fa3e853
FB
2624#endif /* defined(CONFIG_USER_ONLY) */
2625
e2eef170 2626#if !defined(CONFIG_USER_ONLY)
8da3ff18 2627
c04b2b78
PB
2628#define SUBPAGE_IDX(addr) ((addr) & ~TARGET_PAGE_MASK)
2629typedef struct subpage_t {
2630 target_phys_addr_t base;
f6405247
RH
2631 ram_addr_t sub_io_index[TARGET_PAGE_SIZE];
2632 ram_addr_t region_offset[TARGET_PAGE_SIZE];
c04b2b78
PB
2633} subpage_t;
2634
c227f099
AL
2635static int subpage_register (subpage_t *mmio, uint32_t start, uint32_t end,
2636 ram_addr_t memory, ram_addr_t region_offset);
f6405247
RH
2637static subpage_t *subpage_init (target_phys_addr_t base, ram_addr_t *phys,
2638 ram_addr_t orig_memory,
2639 ram_addr_t region_offset);
db7b5426
BS
2640#define CHECK_SUBPAGE(addr, start_addr, start_addr2, end_addr, end_addr2, \
2641 need_subpage) \
2642 do { \
2643 if (addr > start_addr) \
2644 start_addr2 = 0; \
2645 else { \
2646 start_addr2 = start_addr & ~TARGET_PAGE_MASK; \
2647 if (start_addr2 > 0) \
2648 need_subpage = 1; \
2649 } \
2650 \
49e9fba2 2651 if ((start_addr + orig_size) - addr >= TARGET_PAGE_SIZE) \
db7b5426
BS
2652 end_addr2 = TARGET_PAGE_SIZE - 1; \
2653 else { \
2654 end_addr2 = (start_addr + orig_size - 1) & ~TARGET_PAGE_MASK; \
2655 if (end_addr2 < TARGET_PAGE_SIZE - 1) \
2656 need_subpage = 1; \
2657 } \
2658 } while (0)
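/* Illustrative worked example (not part of the original file): with
 * TARGET_PAGE_SIZE = 0x1000, registering start_addr = 0x10000200 with
 * orig_size = 0x100 visits the single page containing it.  Since
 * addr == start_addr, start_addr2 = 0x200 (> 0) and, because the region ends
 * inside the page, end_addr2 = 0x2ff (< 0xfff); both set need_subpage, so
 * only bytes 0x200-0x2ff of that target page are routed to the new handler
 * through a subpage_t while the rest of the page keeps its previous mapping.
 * The addresses are made up for this example. */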
2659
8f2498f9
MT
2660/* register physical memory.
2661 For RAM, 'size' must be a multiple of the target page size.
2662 If (phys_offset & ~TARGET_PAGE_MASK) != 0, then it is an
8da3ff18
PB
2663 io memory page. The address used when calling the IO function is
2664 the offset from the start of the region, plus region_offset. Both
ccbb4d44 2665 start_addr and region_offset are rounded down to a page boundary
8da3ff18
PB
2666 before calculating this offset. This should not be a problem unless
2667 the low bits of start_addr and region_offset differ. */
0fd542fb 2668void cpu_register_physical_memory_log(target_phys_addr_t start_addr,
c227f099
AL
2669 ram_addr_t size,
2670 ram_addr_t phys_offset,
0fd542fb
MT
2671 ram_addr_t region_offset,
2672 bool log_dirty)
33417e70 2673{
c227f099 2674 target_phys_addr_t addr, end_addr;
92e873b9 2675 PhysPageDesc *p;
9d42037b 2676 CPUState *env;
c227f099 2677 ram_addr_t orig_size = size;
f6405247 2678 subpage_t *subpage;
33417e70 2679
3b8e6a2d 2680 assert(size);
0fd542fb 2681 cpu_notify_set_memory(start_addr, size, phys_offset, log_dirty);
f6f3fbca 2682
67c4d23c
PB
2683 if (phys_offset == IO_MEM_UNASSIGNED) {
2684 region_offset = start_addr;
2685 }
8da3ff18 2686 region_offset &= TARGET_PAGE_MASK;
5fd386f6 2687 size = (size + TARGET_PAGE_SIZE - 1) & TARGET_PAGE_MASK;
c227f099 2688 end_addr = start_addr + (target_phys_addr_t)size;
3b8e6a2d
EI
2689
2690 addr = start_addr;
2691 do {
db7b5426
BS
2692 p = phys_page_find(addr >> TARGET_PAGE_BITS);
2693 if (p && p->phys_offset != IO_MEM_UNASSIGNED) {
c227f099
AL
2694 ram_addr_t orig_memory = p->phys_offset;
2695 target_phys_addr_t start_addr2, end_addr2;
db7b5426
BS
2696 int need_subpage = 0;
2697
2698 CHECK_SUBPAGE(addr, start_addr, start_addr2, end_addr, end_addr2,
2699 need_subpage);
f6405247 2700 if (need_subpage) {
db7b5426
BS
2701 if (!(orig_memory & IO_MEM_SUBPAGE)) {
2702 subpage = subpage_init((addr & TARGET_PAGE_MASK),
8da3ff18
PB
2703 &p->phys_offset, orig_memory,
2704 p->region_offset);
db7b5426
BS
2705 } else {
2706 subpage = io_mem_opaque[(orig_memory & ~TARGET_PAGE_MASK)
2707 >> IO_MEM_SHIFT];
2708 }
8da3ff18
PB
2709 subpage_register(subpage, start_addr2, end_addr2, phys_offset,
2710 region_offset);
2711 p->region_offset = 0;
db7b5426
BS
2712 } else {
2713 p->phys_offset = phys_offset;
2714 if ((phys_offset & ~TARGET_PAGE_MASK) <= IO_MEM_ROM ||
2715 (phys_offset & IO_MEM_ROMD))
2716 phys_offset += TARGET_PAGE_SIZE;
2717 }
2718 } else {
2719 p = phys_page_find_alloc(addr >> TARGET_PAGE_BITS, 1);
2720 p->phys_offset = phys_offset;
8da3ff18 2721 p->region_offset = region_offset;
db7b5426 2722 if ((phys_offset & ~TARGET_PAGE_MASK) <= IO_MEM_ROM ||
8da3ff18 2723 (phys_offset & IO_MEM_ROMD)) {
db7b5426 2724 phys_offset += TARGET_PAGE_SIZE;
0e8f0967 2725 } else {
c227f099 2726 target_phys_addr_t start_addr2, end_addr2;
db7b5426
BS
2727 int need_subpage = 0;
2728
2729 CHECK_SUBPAGE(addr, start_addr, start_addr2, end_addr,
2730 end_addr2, need_subpage);
2731
f6405247 2732 if (need_subpage) {
db7b5426 2733 subpage = subpage_init((addr & TARGET_PAGE_MASK),
8da3ff18 2734 &p->phys_offset, IO_MEM_UNASSIGNED,
67c4d23c 2735 addr & TARGET_PAGE_MASK);
db7b5426 2736 subpage_register(subpage, start_addr2, end_addr2,
8da3ff18
PB
2737 phys_offset, region_offset);
2738 p->region_offset = 0;
db7b5426
BS
2739 }
2740 }
2741 }
8da3ff18 2742 region_offset += TARGET_PAGE_SIZE;
3b8e6a2d
EI
2743 addr += TARGET_PAGE_SIZE;
2744 } while (addr != end_addr);
3b46e624 2745
9d42037b
FB
2746 /* since each CPU stores ram addresses in its TLB cache, we must
2747 reset the modified entries */
2748 /* XXX: slow ! */
2749 for(env = first_cpu; env != NULL; env = env->next_cpu) {
2750 tlb_flush(env, 1);
2751 }
33417e70
FB
2752}
2753
ba863458 2754/* XXX: temporary until new memory mapping API */
c227f099 2755ram_addr_t cpu_get_physical_page_desc(target_phys_addr_t addr)
ba863458
FB
2756{
2757 PhysPageDesc *p;
2758
2759 p = phys_page_find(addr >> TARGET_PAGE_BITS);
2760 if (!p)
2761 return IO_MEM_UNASSIGNED;
2762 return p->phys_offset;
2763}
2764
c227f099 2765void qemu_register_coalesced_mmio(target_phys_addr_t addr, ram_addr_t size)
f65ed4c1
AL
2766{
2767 if (kvm_enabled())
2768 kvm_coalesce_mmio_region(addr, size);
2769}
2770
c227f099 2771void qemu_unregister_coalesced_mmio(target_phys_addr_t addr, ram_addr_t size)
f65ed4c1
AL
2772{
2773 if (kvm_enabled())
2774 kvm_uncoalesce_mmio_region(addr, size);
2775}
2776
62a2744c
SY
2777void qemu_flush_coalesced_mmio_buffer(void)
2778{
2779 if (kvm_enabled())
2780 kvm_flush_coalesced_mmio_buffer();
2781}
2782
c902760f
MT
2783#if defined(__linux__) && !defined(TARGET_S390X)
2784
2785#include <sys/vfs.h>
2786
2787#define HUGETLBFS_MAGIC 0x958458f6
2788
2789static long gethugepagesize(const char *path)
2790{
2791 struct statfs fs;
2792 int ret;
2793
2794 do {
9742bf26 2795 ret = statfs(path, &fs);
c902760f
MT
2796 } while (ret != 0 && errno == EINTR);
2797
2798 if (ret != 0) {
9742bf26
YT
2799 perror(path);
2800 return 0;
c902760f
MT
2801 }
2802
2803 if (fs.f_type != HUGETLBFS_MAGIC)
9742bf26 2804 fprintf(stderr, "Warning: path not on HugeTLBFS: %s\n", path);
c902760f
MT
2805
2806 return fs.f_bsize;
2807}
2808
04b16653
AW
2809static void *file_ram_alloc(RAMBlock *block,
2810 ram_addr_t memory,
2811 const char *path)
c902760f
MT
2812{
2813 char *filename;
2814 void *area;
2815 int fd;
2816#ifdef MAP_POPULATE
2817 int flags;
2818#endif
2819 unsigned long hpagesize;
2820
2821 hpagesize = gethugepagesize(path);
2822 if (!hpagesize) {
9742bf26 2823 return NULL;
c902760f
MT
2824 }
2825
2826 if (memory < hpagesize) {
2827 return NULL;
2828 }
2829
2830 if (kvm_enabled() && !kvm_has_sync_mmu()) {
2831 fprintf(stderr, "host lacks kvm mmu notifiers, -mem-path unsupported\n");
2832 return NULL;
2833 }
2834
2835 if (asprintf(&filename, "%s/qemu_back_mem.XXXXXX", path) == -1) {
9742bf26 2836 return NULL;
c902760f
MT
2837 }
2838
2839 fd = mkstemp(filename);
2840 if (fd < 0) {
9742bf26
YT
2841 perror("unable to create backing store for hugepages");
2842 free(filename);
2843 return NULL;
c902760f
MT
2844 }
2845 unlink(filename);
2846 free(filename);
2847
2848 memory = (memory+hpagesize-1) & ~(hpagesize-1);
2849
2850 /*
2851 * ftruncate is not supported by hugetlbfs in older
2852 * hosts, so don't bother bailing out on errors.
2853 * If anything goes wrong with it under other filesystems,
2854 * mmap will fail.
2855 */
2856 if (ftruncate(fd, memory))
9742bf26 2857 perror("ftruncate");
c902760f
MT
2858
2859#ifdef MAP_POPULATE
2860 /* NB: MAP_POPULATE won't exhaustively alloc all phys pages in the case
2861 * MAP_PRIVATE is requested. For mem_prealloc we mmap as MAP_SHARED
2862 * to sidestep this quirk.
2863 */
2864 flags = mem_prealloc ? MAP_POPULATE | MAP_SHARED : MAP_PRIVATE;
2865 area = mmap(0, memory, PROT_READ | PROT_WRITE, flags, fd, 0);
2866#else
2867 area = mmap(0, memory, PROT_READ | PROT_WRITE, MAP_PRIVATE, fd, 0);
2868#endif
2869 if (area == MAP_FAILED) {
9742bf26
YT
2870 perror("file_ram_alloc: can't mmap RAM pages");
2871 close(fd);
2872 return (NULL);
c902760f 2873 }
04b16653 2874 block->fd = fd;
c902760f
MT
2875 return area;
2876}
2877#endif
2878
d17b5288 2879static ram_addr_t find_ram_offset(ram_addr_t size)
04b16653
AW
2880{
2881 RAMBlock *block, *next_block;
f15fbc4b 2882 ram_addr_t offset = 0, mingap = RAM_ADDR_MAX;
04b16653
AW
2883
2884 if (QLIST_EMPTY(&ram_list.blocks))
2885 return 0;
2886
2887 QLIST_FOREACH(block, &ram_list.blocks, next) {
f15fbc4b 2888 ram_addr_t end, next = RAM_ADDR_MAX;
04b16653
AW
2889
2890 end = block->offset + block->length;
2891
2892 QLIST_FOREACH(next_block, &ram_list.blocks, next) {
2893 if (next_block->offset >= end) {
2894 next = MIN(next, next_block->offset);
2895 }
2896 }
2897 if (next - end >= size && next - end < mingap) {
2898 offset = end;
2899 mingap = next - end;
2900 }
2901 }
2902 return offset;
2903}
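/* Illustrative worked example (not part of the original file): assume
 * existing blocks at [0, 4MB), [8MB, 12MB) and [32MB, 64MB) and a request
 * for size = 2MB.  The gaps following the blocks are 4MB, 20MB and "open
 * ended" (next stays RAM_ADDR_MAX); the loop above keeps the smallest gap
 * that still fits, so the new block is placed at offset 4MB, keeping RAM
 * offsets tightly packed.  The sizes are made up for this example. */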
2904
2905static ram_addr_t last_ram_offset(void)
d17b5288
AW
2906{
2907 RAMBlock *block;
2908 ram_addr_t last = 0;
2909
2910 QLIST_FOREACH(block, &ram_list.blocks, next)
2911 last = MAX(last, block->offset + block->length);
2912
2913 return last;
2914}
2915
84b89d78 2916ram_addr_t qemu_ram_alloc_from_ptr(DeviceState *dev, const char *name,
6977dfe6 2917 ram_addr_t size, void *host)
84b89d78
CM
2918{
2919 RAMBlock *new_block, *block;
2920
2921 size = TARGET_PAGE_ALIGN(size);
2922 new_block = qemu_mallocz(sizeof(*new_block));
2923
2924 if (dev && dev->parent_bus && dev->parent_bus->info->get_dev_path) {
2925 char *id = dev->parent_bus->info->get_dev_path(dev);
2926 if (id) {
2927 snprintf(new_block->idstr, sizeof(new_block->idstr), "%s/", id);
2928 qemu_free(id);
2929 }
2930 }
2931 pstrcat(new_block->idstr, sizeof(new_block->idstr), name);
2932
2933 QLIST_FOREACH(block, &ram_list.blocks, next) {
2934 if (!strcmp(block->idstr, new_block->idstr)) {
2935 fprintf(stderr, "RAMBlock \"%s\" already registered, abort!\n",
2936 new_block->idstr);
2937 abort();
2938 }
2939 }
2940
432d268c 2941 new_block->offset = find_ram_offset(size);
6977dfe6
YT
2942 if (host) {
2943 new_block->host = host;
cd19cfa2 2944 new_block->flags |= RAM_PREALLOC_MASK;
6977dfe6
YT
2945 } else {
2946 if (mem_path) {
c902760f 2947#if defined (__linux__) && !defined(TARGET_S390X)
6977dfe6
YT
2948 new_block->host = file_ram_alloc(new_block, size, mem_path);
2949 if (!new_block->host) {
2950 new_block->host = qemu_vmalloc(size);
e78815a5 2951 qemu_madvise(new_block->host, size, QEMU_MADV_MERGEABLE);
6977dfe6 2952 }
c902760f 2953#else
6977dfe6
YT
2954 fprintf(stderr, "-mem-path option unsupported\n");
2955 exit(1);
c902760f 2956#endif
6977dfe6 2957 } else {
6b02494d 2958#if defined(TARGET_S390X) && defined(CONFIG_KVM)
ff83678a
CB
2959 /* S390 KVM requires the topmost vma of the RAM to be smaller than
 2960 a system-defined value, which is at least 256GB. Larger systems
2961 have larger values. We put the guest between the end of data
2962 segment (system break) and this value. We use 32GB as a base to
2963 have enough room for the system break to grow. */
2964 new_block->host = mmap((void*)0x800000000, size,
6977dfe6 2965 PROT_EXEC|PROT_READ|PROT_WRITE,
ff83678a 2966 MAP_SHARED | MAP_ANONYMOUS | MAP_FIXED, -1, 0);
fb8b2735
AG
2967 if (new_block->host == MAP_FAILED) {
2968 fprintf(stderr, "Allocating RAM failed\n");
2969 abort();
2970 }
6b02494d 2971#else
868bb33f 2972 if (xen_enabled()) {
432d268c
JN
2973 xen_ram_alloc(new_block->offset, size);
2974 } else {
2975 new_block->host = qemu_vmalloc(size);
2976 }
6b02494d 2977#endif
e78815a5 2978 qemu_madvise(new_block->host, size, QEMU_MADV_MERGEABLE);
6977dfe6 2979 }
c902760f 2980 }
94a6b54f
PB
2981 new_block->length = size;
2982
f471a17e 2983 QLIST_INSERT_HEAD(&ram_list.blocks, new_block, next);
94a6b54f 2984
f471a17e 2985 ram_list.phys_dirty = qemu_realloc(ram_list.phys_dirty,
04b16653 2986 last_ram_offset() >> TARGET_PAGE_BITS);
d17b5288 2987 memset(ram_list.phys_dirty + (new_block->offset >> TARGET_PAGE_BITS),
94a6b54f
PB
2988 0xff, size >> TARGET_PAGE_BITS);
2989
6f0437e8
JK
2990 if (kvm_enabled())
2991 kvm_setup_guest_memory(new_block->host, size);
2992
94a6b54f
PB
2993 return new_block->offset;
2994}
e9a1ab19 2995
6977dfe6
YT
2996ram_addr_t qemu_ram_alloc(DeviceState *dev, const char *name, ram_addr_t size)
2997{
2998 return qemu_ram_alloc_from_ptr(dev, name, size, NULL);
2999}
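/* Illustrative sketch (not part of the original file): a board or device
 * model typically allocates guest RAM and then maps it into the physical
 * address space, along the lines of the snippet below.  The name, address
 * and size are made up; cpu_register_physical_memory() is assumed to be the
 * usual wrapper around cpu_register_physical_memory_log(). */
#if 0   /* example only */
static void example_map_vram(DeviceState *dev)
{
    ram_addr_t off = qemu_ram_alloc(dev, "example.vram", 8 * 1024 * 1024);
    cpu_register_physical_memory(0xe0000000, 8 * 1024 * 1024,
                                 off | IO_MEM_RAM);
}
#endif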
3000
1f2e98b6
AW
3001void qemu_ram_free_from_ptr(ram_addr_t addr)
3002{
3003 RAMBlock *block;
3004
3005 QLIST_FOREACH(block, &ram_list.blocks, next) {
3006 if (addr == block->offset) {
3007 QLIST_REMOVE(block, next);
3008 qemu_free(block);
3009 return;
3010 }
3011 }
3012}
3013
c227f099 3014void qemu_ram_free(ram_addr_t addr)
e9a1ab19 3015{
04b16653
AW
3016 RAMBlock *block;
3017
3018 QLIST_FOREACH(block, &ram_list.blocks, next) {
3019 if (addr == block->offset) {
3020 QLIST_REMOVE(block, next);
cd19cfa2
HY
3021 if (block->flags & RAM_PREALLOC_MASK) {
3022 ;
3023 } else if (mem_path) {
04b16653
AW
3024#if defined (__linux__) && !defined(TARGET_S390X)
3025 if (block->fd) {
3026 munmap(block->host, block->length);
3027 close(block->fd);
3028 } else {
3029 qemu_vfree(block->host);
3030 }
fd28aa13
JK
3031#else
3032 abort();
04b16653
AW
3033#endif
3034 } else {
3035#if defined(TARGET_S390X) && defined(CONFIG_KVM)
3036 munmap(block->host, block->length);
3037#else
868bb33f 3038 if (xen_enabled()) {
e41d7c69 3039 xen_invalidate_map_cache_entry(block->host);
432d268c
JN
3040 } else {
3041 qemu_vfree(block->host);
3042 }
04b16653
AW
3043#endif
3044 }
3045 qemu_free(block);
3046 return;
3047 }
3048 }
3049
e9a1ab19
FB
3050}
3051
cd19cfa2
HY
3052#ifndef _WIN32
3053void qemu_ram_remap(ram_addr_t addr, ram_addr_t length)
3054{
3055 RAMBlock *block;
3056 ram_addr_t offset;
3057 int flags;
3058 void *area, *vaddr;
3059
3060 QLIST_FOREACH(block, &ram_list.blocks, next) {
3061 offset = addr - block->offset;
3062 if (offset < block->length) {
3063 vaddr = block->host + offset;
3064 if (block->flags & RAM_PREALLOC_MASK) {
3065 ;
3066 } else {
3067 flags = MAP_FIXED;
3068 munmap(vaddr, length);
3069 if (mem_path) {
3070#if defined(__linux__) && !defined(TARGET_S390X)
3071 if (block->fd) {
3072#ifdef MAP_POPULATE
3073 flags |= mem_prealloc ? MAP_POPULATE | MAP_SHARED :
3074 MAP_PRIVATE;
3075#else
3076 flags |= MAP_PRIVATE;
3077#endif
3078 area = mmap(vaddr, length, PROT_READ | PROT_WRITE,
3079 flags, block->fd, offset);
3080 } else {
3081 flags |= MAP_PRIVATE | MAP_ANONYMOUS;
3082 area = mmap(vaddr, length, PROT_READ | PROT_WRITE,
3083 flags, -1, 0);
3084 }
fd28aa13
JK
3085#else
3086 abort();
cd19cfa2
HY
3087#endif
3088 } else {
3089#if defined(TARGET_S390X) && defined(CONFIG_KVM)
3090 flags |= MAP_SHARED | MAP_ANONYMOUS;
3091 area = mmap(vaddr, length, PROT_EXEC|PROT_READ|PROT_WRITE,
3092 flags, -1, 0);
3093#else
3094 flags |= MAP_PRIVATE | MAP_ANONYMOUS;
3095 area = mmap(vaddr, length, PROT_READ | PROT_WRITE,
3096 flags, -1, 0);
3097#endif
3098 }
3099 if (area != vaddr) {
f15fbc4b
AP
3100 fprintf(stderr, "Could not remap addr: "
3101 RAM_ADDR_FMT "@" RAM_ADDR_FMT "\n",
cd19cfa2
HY
3102 length, addr);
3103 exit(1);
3104 }
3105 qemu_madvise(vaddr, length, QEMU_MADV_MERGEABLE);
3106 }
3107 return;
3108 }
3109 }
3110}
3111#endif /* !_WIN32 */
3112
dc828ca1 3113/* Return a host pointer to ram allocated with qemu_ram_alloc.
5579c7f3
PB
3114 With the exception of the softmmu code in this file, this should
3115 only be used for local memory (e.g. video ram) that the device owns,
3116 and knows it isn't going to access beyond the end of the block.
3117
3118 It should not be used for general purpose DMA.
3119 Use cpu_physical_memory_map/cpu_physical_memory_rw instead.
3120 */
c227f099 3121void *qemu_get_ram_ptr(ram_addr_t addr)
dc828ca1 3122{
94a6b54f
PB
3123 RAMBlock *block;
3124
f471a17e
AW
3125 QLIST_FOREACH(block, &ram_list.blocks, next) {
3126 if (addr - block->offset < block->length) {
7d82af38
VP
 3127 /* Move this entry to the start of the list. */
3128 if (block != QLIST_FIRST(&ram_list.blocks)) {
3129 QLIST_REMOVE(block, next);
3130 QLIST_INSERT_HEAD(&ram_list.blocks, block, next);
3131 }
868bb33f 3132 if (xen_enabled()) {
432d268c
JN
3133 /* We need to check if the requested address is in the RAM
3134 * because we don't want to map the entire memory in QEMU.
712c2b41 3135 * In that case just map until the end of the page.
432d268c
JN
3136 */
3137 if (block->offset == 0) {
e41d7c69 3138 return xen_map_cache(addr, 0, 0);
432d268c 3139 } else if (block->host == NULL) {
e41d7c69
JK
3140 block->host =
3141 xen_map_cache(block->offset, block->length, 1);
432d268c
JN
3142 }
3143 }
f471a17e
AW
3144 return block->host + (addr - block->offset);
3145 }
94a6b54f 3146 }
f471a17e
AW
3147
3148 fprintf(stderr, "Bad ram offset %" PRIx64 "\n", (uint64_t)addr);
3149 abort();
3150
3151 return NULL;
dc828ca1
PB
3152}
3153
b2e0a138
MT
3154/* Return a host pointer to ram allocated with qemu_ram_alloc.
3155 * Same as qemu_get_ram_ptr but avoid reordering ramblocks.
3156 */
3157void *qemu_safe_ram_ptr(ram_addr_t addr)
3158{
3159 RAMBlock *block;
3160
3161 QLIST_FOREACH(block, &ram_list.blocks, next) {
3162 if (addr - block->offset < block->length) {
868bb33f 3163 if (xen_enabled()) {
432d268c
JN
3164 /* We need to check if the requested address is in the RAM
3165 * because we don't want to map the entire memory in QEMU.
712c2b41 3166 * In that case just map until the end of the page.
432d268c
JN
3167 */
3168 if (block->offset == 0) {
e41d7c69 3169 return xen_map_cache(addr, 0, 0);
432d268c 3170 } else if (block->host == NULL) {
e41d7c69
JK
3171 block->host =
3172 xen_map_cache(block->offset, block->length, 1);
432d268c
JN
3173 }
3174 }
b2e0a138
MT
3175 return block->host + (addr - block->offset);
3176 }
3177 }
3178
3179 fprintf(stderr, "Bad ram offset %" PRIx64 "\n", (uint64_t)addr);
3180 abort();
3181
3182 return NULL;
3183}
3184
38bee5dc
SS
3185/* Return a host pointer to guest's ram. Similar to qemu_get_ram_ptr
3186 * but takes a size argument */
8ab934f9 3187void *qemu_ram_ptr_length(ram_addr_t addr, ram_addr_t *size)
38bee5dc 3188{
8ab934f9
SS
3189 if (*size == 0) {
3190 return NULL;
3191 }
868bb33f 3192 if (xen_enabled()) {
e41d7c69 3193 return xen_map_cache(addr, *size, 1);
868bb33f 3194 } else {
38bee5dc
SS
3195 RAMBlock *block;
3196
3197 QLIST_FOREACH(block, &ram_list.blocks, next) {
3198 if (addr - block->offset < block->length) {
3199 if (addr - block->offset + *size > block->length)
3200 *size = block->length - addr + block->offset;
3201 return block->host + (addr - block->offset);
3202 }
3203 }
3204
3205 fprintf(stderr, "Bad ram offset %" PRIx64 "\n", (uint64_t)addr);
3206 abort();
38bee5dc
SS
3207 }
3208}
3209
050a0ddf
AP
3210void qemu_put_ram_ptr(void *addr)
3211{
3212 trace_qemu_put_ram_ptr(addr);
050a0ddf
AP
3213}
3214
e890261f 3215int qemu_ram_addr_from_host(void *ptr, ram_addr_t *ram_addr)
5579c7f3 3216{
94a6b54f
PB
3217 RAMBlock *block;
3218 uint8_t *host = ptr;
3219
868bb33f 3220 if (xen_enabled()) {
e41d7c69 3221 *ram_addr = xen_ram_addr_from_mapcache(ptr);
712c2b41
SS
3222 return 0;
3223 }
3224
f471a17e 3225 QLIST_FOREACH(block, &ram_list.blocks, next) {
432d268c
JN
 3226 /* This case happens when the block is not mapped. */
3227 if (block->host == NULL) {
3228 continue;
3229 }
f471a17e 3230 if (host - block->host < block->length) {
e890261f
MT
3231 *ram_addr = block->offset + (host - block->host);
3232 return 0;
f471a17e 3233 }
94a6b54f 3234 }
432d268c 3235
e890261f
MT
3236 return -1;
3237}
f471a17e 3238
e890261f
MT
3239/* Some of the softmmu routines need to translate from a host pointer
3240 (typically a TLB entry) back to a ram offset. */
3241ram_addr_t qemu_ram_addr_from_host_nofail(void *ptr)
3242{
3243 ram_addr_t ram_addr;
f471a17e 3244
e890261f
MT
3245 if (qemu_ram_addr_from_host(ptr, &ram_addr)) {
3246 fprintf(stderr, "Bad ram pointer %p\n", ptr);
3247 abort();
3248 }
3249 return ram_addr;
5579c7f3
PB
3250}
3251
c227f099 3252static uint32_t unassigned_mem_readb(void *opaque, target_phys_addr_t addr)
33417e70 3253{
67d3b957 3254#ifdef DEBUG_UNASSIGNED
ab3d1727 3255 printf("Unassigned mem read " TARGET_FMT_plx "\n", addr);
b4f0a316 3256#endif
5b450407 3257#if defined(TARGET_ALPHA) || defined(TARGET_SPARC) || defined(TARGET_MICROBLAZE)
b14ef7c9 3258 cpu_unassigned_access(cpu_single_env, addr, 0, 0, 0, 1);
e18231a3
BS
3259#endif
3260 return 0;
3261}
3262
c227f099 3263static uint32_t unassigned_mem_readw(void *opaque, target_phys_addr_t addr)
e18231a3
BS
3264{
3265#ifdef DEBUG_UNASSIGNED
3266 printf("Unassigned mem read " TARGET_FMT_plx "\n", addr);
3267#endif
5b450407 3268#if defined(TARGET_ALPHA) || defined(TARGET_SPARC) || defined(TARGET_MICROBLAZE)
b14ef7c9 3269 cpu_unassigned_access(cpu_single_env, addr, 0, 0, 0, 2);
e18231a3
BS
3270#endif
3271 return 0;
3272}
3273
c227f099 3274static uint32_t unassigned_mem_readl(void *opaque, target_phys_addr_t addr)
e18231a3
BS
3275{
3276#ifdef DEBUG_UNASSIGNED
3277 printf("Unassigned mem read " TARGET_FMT_plx "\n", addr);
3278#endif
5b450407 3279#if defined(TARGET_ALPHA) || defined(TARGET_SPARC) || defined(TARGET_MICROBLAZE)
b14ef7c9 3280 cpu_unassigned_access(cpu_single_env, addr, 0, 0, 0, 4);
67d3b957 3281#endif
33417e70
FB
3282 return 0;
3283}
3284
c227f099 3285static void unassigned_mem_writeb(void *opaque, target_phys_addr_t addr, uint32_t val)
33417e70 3286{
67d3b957 3287#ifdef DEBUG_UNASSIGNED
ab3d1727 3288 printf("Unassigned mem write " TARGET_FMT_plx " = 0x%x\n", addr, val);
67d3b957 3289#endif
5b450407 3290#if defined(TARGET_ALPHA) || defined(TARGET_SPARC) || defined(TARGET_MICROBLAZE)
b14ef7c9 3291 cpu_unassigned_access(cpu_single_env, addr, 1, 0, 0, 1);
e18231a3
BS
3292#endif
3293}
3294
c227f099 3295static void unassigned_mem_writew(void *opaque, target_phys_addr_t addr, uint32_t val)
e18231a3
BS
3296{
3297#ifdef DEBUG_UNASSIGNED
3298 printf("Unassigned mem write " TARGET_FMT_plx " = 0x%x\n", addr, val);
3299#endif
5b450407 3300#if defined(TARGET_ALPHA) || defined(TARGET_SPARC) || defined(TARGET_MICROBLAZE)
b14ef7c9 3301 cpu_unassigned_access(cpu_single_env, addr, 1, 0, 0, 2);
e18231a3
BS
3302#endif
3303}
3304
c227f099 3305static void unassigned_mem_writel(void *opaque, target_phys_addr_t addr, uint32_t val)
e18231a3
BS
3306{
3307#ifdef DEBUG_UNASSIGNED
3308 printf("Unassigned mem write " TARGET_FMT_plx " = 0x%x\n", addr, val);
3309#endif
5b450407 3310#if defined(TARGET_ALPHA) || defined(TARGET_SPARC) || defined(TARGET_MICROBLAZE)
b14ef7c9 3311 cpu_unassigned_access(cpu_single_env, addr, 1, 0, 0, 4);
b4f0a316 3312#endif
33417e70
FB
3313}
3314
d60efc6b 3315static CPUReadMemoryFunc * const unassigned_mem_read[3] = {
33417e70 3316 unassigned_mem_readb,
e18231a3
BS
3317 unassigned_mem_readw,
3318 unassigned_mem_readl,
33417e70
FB
3319};
3320
d60efc6b 3321static CPUWriteMemoryFunc * const unassigned_mem_write[3] = {
33417e70 3322 unassigned_mem_writeb,
e18231a3
BS
3323 unassigned_mem_writew,
3324 unassigned_mem_writel,
33417e70
FB
3325};
3326
c227f099 3327static void notdirty_mem_writeb(void *opaque, target_phys_addr_t ram_addr,
0f459d16 3328 uint32_t val)
9fa3e853 3329{
3a7d929e 3330 int dirty_flags;
f7c11b53 3331 dirty_flags = cpu_physical_memory_get_dirty_flags(ram_addr);
3a7d929e 3332 if (!(dirty_flags & CODE_DIRTY_FLAG)) {
9fa3e853 3333#if !defined(CONFIG_USER_ONLY)
3a7d929e 3334 tb_invalidate_phys_page_fast(ram_addr, 1);
f7c11b53 3335 dirty_flags = cpu_physical_memory_get_dirty_flags(ram_addr);
9fa3e853 3336#endif
3a7d929e 3337 }
5579c7f3 3338 stb_p(qemu_get_ram_ptr(ram_addr), val);
f23db169 3339 dirty_flags |= (0xff & ~CODE_DIRTY_FLAG);
f7c11b53 3340 cpu_physical_memory_set_dirty_flags(ram_addr, dirty_flags);
f23db169
FB
3341 /* we remove the notdirty callback only if the code has been
3342 flushed */
3343 if (dirty_flags == 0xff)
2e70f6ef 3344 tlb_set_dirty(cpu_single_env, cpu_single_env->mem_io_vaddr);
9fa3e853
FB
3345}
3346
c227f099 3347static void notdirty_mem_writew(void *opaque, target_phys_addr_t ram_addr,
0f459d16 3348 uint32_t val)
9fa3e853 3349{
3a7d929e 3350 int dirty_flags;
f7c11b53 3351 dirty_flags = cpu_physical_memory_get_dirty_flags(ram_addr);
3a7d929e 3352 if (!(dirty_flags & CODE_DIRTY_FLAG)) {
9fa3e853 3353#if !defined(CONFIG_USER_ONLY)
3a7d929e 3354 tb_invalidate_phys_page_fast(ram_addr, 2);
f7c11b53 3355 dirty_flags = cpu_physical_memory_get_dirty_flags(ram_addr);
9fa3e853 3356#endif
3a7d929e 3357 }
5579c7f3 3358 stw_p(qemu_get_ram_ptr(ram_addr), val);
f23db169 3359 dirty_flags |= (0xff & ~CODE_DIRTY_FLAG);
f7c11b53 3360 cpu_physical_memory_set_dirty_flags(ram_addr, dirty_flags);
f23db169
FB
3361 /* we remove the notdirty callback only if the code has been
3362 flushed */
3363 if (dirty_flags == 0xff)
2e70f6ef 3364 tlb_set_dirty(cpu_single_env, cpu_single_env->mem_io_vaddr);
9fa3e853
FB
3365}
3366
c227f099 3367static void notdirty_mem_writel(void *opaque, target_phys_addr_t ram_addr,
0f459d16 3368 uint32_t val)
9fa3e853 3369{
3a7d929e 3370 int dirty_flags;
f7c11b53 3371 dirty_flags = cpu_physical_memory_get_dirty_flags(ram_addr);
3a7d929e 3372 if (!(dirty_flags & CODE_DIRTY_FLAG)) {
9fa3e853 3373#if !defined(CONFIG_USER_ONLY)
3a7d929e 3374 tb_invalidate_phys_page_fast(ram_addr, 4);
f7c11b53 3375 dirty_flags = cpu_physical_memory_get_dirty_flags(ram_addr);
9fa3e853 3376#endif
3a7d929e 3377 }
5579c7f3 3378 stl_p(qemu_get_ram_ptr(ram_addr), val);
f23db169 3379 dirty_flags |= (0xff & ~CODE_DIRTY_FLAG);
f7c11b53 3380 cpu_physical_memory_set_dirty_flags(ram_addr, dirty_flags);
f23db169
FB
3381 /* we remove the notdirty callback only if the code has been
3382 flushed */
3383 if (dirty_flags == 0xff)
2e70f6ef 3384 tlb_set_dirty(cpu_single_env, cpu_single_env->mem_io_vaddr);
9fa3e853
FB
3385}
3386
d60efc6b 3387static CPUReadMemoryFunc * const error_mem_read[3] = {
9fa3e853
FB
3388 NULL, /* never used */
3389 NULL, /* never used */
3390 NULL, /* never used */
3391};
3392
d60efc6b 3393static CPUWriteMemoryFunc * const notdirty_mem_write[3] = {
1ccde1cb
FB
3394 notdirty_mem_writeb,
3395 notdirty_mem_writew,
3396 notdirty_mem_writel,
3397};
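/* Illustrative note (not part of the original file): the three handlers
 * above implement the dirty-tracking write path.  A RAM page whose dirty
 * bits are clear is mapped with TLB_NOTDIRTY, so the first write lands
 * here: the handler invalidates any translated code on the page, performs
 * the store, sets the dirty bits and, once all bits (including
 * CODE_DIRTY_FLAG) are set again, calls tlb_set_dirty() so that later
 * writes to the same virtual page take the normal fast path. */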
3398
0f459d16 3399/* Generate a debug exception if a watchpoint has been hit. */
b4051334 3400static void check_watchpoint(int offset, int len_mask, int flags)
0f459d16
PB
3401{
3402 CPUState *env = cpu_single_env;
06d55cc1
AL
3403 target_ulong pc, cs_base;
3404 TranslationBlock *tb;
0f459d16 3405 target_ulong vaddr;
a1d1bb31 3406 CPUWatchpoint *wp;
06d55cc1 3407 int cpu_flags;
0f459d16 3408
06d55cc1
AL
3409 if (env->watchpoint_hit) {
3410 /* We re-entered the check after replacing the TB. Now raise
 3411 * the debug interrupt so that it will trigger after the
3412 * current instruction. */
3413 cpu_interrupt(env, CPU_INTERRUPT_DEBUG);
3414 return;
3415 }
2e70f6ef 3416 vaddr = (env->mem_io_vaddr & TARGET_PAGE_MASK) + offset;
72cf2d4f 3417 QTAILQ_FOREACH(wp, &env->watchpoints, entry) {
b4051334
AL
3418 if ((vaddr == (wp->vaddr & len_mask) ||
3419 (vaddr & wp->len_mask) == wp->vaddr) && (wp->flags & flags)) {
6e140f28
AL
3420 wp->flags |= BP_WATCHPOINT_HIT;
3421 if (!env->watchpoint_hit) {
3422 env->watchpoint_hit = wp;
3423 tb = tb_find_pc(env->mem_io_pc);
3424 if (!tb) {
3425 cpu_abort(env, "check_watchpoint: could not find TB for "
3426 "pc=%p", (void *)env->mem_io_pc);
3427 }
618ba8e6 3428 cpu_restore_state(tb, env, env->mem_io_pc);
6e140f28
AL
3429 tb_phys_invalidate(tb, -1);
3430 if (wp->flags & BP_STOP_BEFORE_ACCESS) {
3431 env->exception_index = EXCP_DEBUG;
3432 } else {
3433 cpu_get_tb_cpu_state(env, &pc, &cs_base, &cpu_flags);
3434 tb_gen_code(env, pc, cs_base, cpu_flags, 1);
3435 }
3436 cpu_resume_from_signal(env, NULL);
06d55cc1 3437 }
6e140f28
AL
3438 } else {
3439 wp->flags &= ~BP_WATCHPOINT_HIT;
0f459d16
PB
3440 }
3441 }
3442}
3443
6658ffb8
PB
3444/* Watchpoint access routines. Watchpoints are inserted using TLB tricks,
3445 so these check for a hit then pass through to the normal out-of-line
3446 phys routines. */
c227f099 3447static uint32_t watch_mem_readb(void *opaque, target_phys_addr_t addr)
6658ffb8 3448{
b4051334 3449 check_watchpoint(addr & ~TARGET_PAGE_MASK, ~0x0, BP_MEM_READ);
6658ffb8
PB
3450 return ldub_phys(addr);
3451}
3452
c227f099 3453static uint32_t watch_mem_readw(void *opaque, target_phys_addr_t addr)
6658ffb8 3454{
b4051334 3455 check_watchpoint(addr & ~TARGET_PAGE_MASK, ~0x1, BP_MEM_READ);
6658ffb8
PB
3456 return lduw_phys(addr);
3457}
3458
c227f099 3459static uint32_t watch_mem_readl(void *opaque, target_phys_addr_t addr)
6658ffb8 3460{
b4051334 3461 check_watchpoint(addr & ~TARGET_PAGE_MASK, ~0x3, BP_MEM_READ);
6658ffb8
PB
3462 return ldl_phys(addr);
3463}
3464
c227f099 3465static void watch_mem_writeb(void *opaque, target_phys_addr_t addr,
6658ffb8
PB
3466 uint32_t val)
3467{
b4051334 3468 check_watchpoint(addr & ~TARGET_PAGE_MASK, ~0x0, BP_MEM_WRITE);
6658ffb8
PB
3469 stb_phys(addr, val);
3470}
3471
c227f099 3472static void watch_mem_writew(void *opaque, target_phys_addr_t addr,
6658ffb8
PB
3473 uint32_t val)
3474{
b4051334 3475 check_watchpoint(addr & ~TARGET_PAGE_MASK, ~0x1, BP_MEM_WRITE);
6658ffb8
PB
3476 stw_phys(addr, val);
3477}
3478
c227f099 3479static void watch_mem_writel(void *opaque, target_phys_addr_t addr,
6658ffb8
PB
3480 uint32_t val)
3481{
b4051334 3482 check_watchpoint(addr & ~TARGET_PAGE_MASK, ~0x3, BP_MEM_WRITE);
6658ffb8
PB
3483 stl_phys(addr, val);
3484}
3485
d60efc6b 3486static CPUReadMemoryFunc * const watch_mem_read[3] = {
6658ffb8
PB
3487 watch_mem_readb,
3488 watch_mem_readw,
3489 watch_mem_readl,
3490};
3491
d60efc6b 3492static CPUWriteMemoryFunc * const watch_mem_write[3] = {
6658ffb8
PB
3493 watch_mem_writeb,
3494 watch_mem_writew,
3495 watch_mem_writel,
3496};
6658ffb8 3497
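/* Illustrative sketch, not part of exec.c: how the watch_mem_* handlers
   above are reached.  cpu_watchpoint_insert() (defined earlier in this
   file) flushes the page's TLB entry, and on refill the page is routed
   through io_mem_watch, so every access first runs check_watchpoint().
   The wrapper below and 'vaddr' are hypothetical; vaddr is assumed to be
   4-byte aligned, as required for a 4-byte watchpoint. */
static void example_watch_word_writes(CPUState *env, target_ulong vaddr)
{
    CPUWatchpoint *wp;

    /* stop with EXCP_DEBUG before any 4-byte write to vaddr */
    cpu_watchpoint_insert(env, vaddr, 4,
                          BP_MEM_WRITE | BP_STOP_BEFORE_ACCESS, &wp);
    /* ... guest writes to vaddr now funnel through watch_mem_writel() ... */
    cpu_watchpoint_remove_by_ref(env, wp);
}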
f6405247
RH
3498static inline uint32_t subpage_readlen (subpage_t *mmio,
3499 target_phys_addr_t addr,
3500 unsigned int len)
db7b5426 3501{
f6405247 3502 unsigned int idx = SUBPAGE_IDX(addr);
db7b5426
BS
3503#if defined(DEBUG_SUBPAGE)
3504 printf("%s: subpage %p len %d addr " TARGET_FMT_plx " idx %d\n", __func__,
3505 mmio, len, addr, idx);
3506#endif
db7b5426 3507
f6405247
RH
3508 addr += mmio->region_offset[idx];
3509 idx = mmio->sub_io_index[idx];
3510 return io_mem_read[idx][len](io_mem_opaque[idx], addr);
db7b5426
BS
3511}
3512
c227f099 3513static inline void subpage_writelen (subpage_t *mmio, target_phys_addr_t addr,
f6405247 3514 uint32_t value, unsigned int len)
db7b5426 3515{
f6405247 3516 unsigned int idx = SUBPAGE_IDX(addr);
db7b5426 3517#if defined(DEBUG_SUBPAGE)
f6405247
RH
3518 printf("%s: subpage %p len %d addr " TARGET_FMT_plx " idx %d value %08x\n",
3519 __func__, mmio, len, addr, idx, value);
db7b5426 3520#endif
f6405247
RH
3521
3522 addr += mmio->region_offset[idx];
3523 idx = mmio->sub_io_index[idx];
3524 io_mem_write[idx][len](io_mem_opaque[idx], addr, value);
db7b5426
BS
3525}
3526
c227f099 3527static uint32_t subpage_readb (void *opaque, target_phys_addr_t addr)
db7b5426 3528{
db7b5426
BS
3529 return subpage_readlen(opaque, addr, 0);
3530}
3531
c227f099 3532static void subpage_writeb (void *opaque, target_phys_addr_t addr,
db7b5426
BS
3533 uint32_t value)
3534{
db7b5426
BS
3535 subpage_writelen(opaque, addr, value, 0);
3536}
3537
c227f099 3538static uint32_t subpage_readw (void *opaque, target_phys_addr_t addr)
db7b5426 3539{
db7b5426
BS
3540 return subpage_readlen(opaque, addr, 1);
3541}
3542
c227f099 3543static void subpage_writew (void *opaque, target_phys_addr_t addr,
db7b5426
BS
3544 uint32_t value)
3545{
db7b5426
BS
3546 subpage_writelen(opaque, addr, value, 1);
3547}
3548
c227f099 3549static uint32_t subpage_readl (void *opaque, target_phys_addr_t addr)
db7b5426 3550{
db7b5426
BS
3551 return subpage_readlen(opaque, addr, 2);
3552}
3553
f6405247
RH
3554static void subpage_writel (void *opaque, target_phys_addr_t addr,
3555 uint32_t value)
db7b5426 3556{
db7b5426
BS
3557 subpage_writelen(opaque, addr, value, 2);
3558}
3559
d60efc6b 3560static CPUReadMemoryFunc * const subpage_read[] = {
db7b5426
BS
3561 &subpage_readb,
3562 &subpage_readw,
3563 &subpage_readl,
3564};
3565
d60efc6b 3566static CPUWriteMemoryFunc * const subpage_write[] = {
db7b5426
BS
3567 &subpage_writeb,
3568 &subpage_writew,
3569 &subpage_writel,
3570};
3571
c227f099
AL
3572static int subpage_register (subpage_t *mmio, uint32_t start, uint32_t end,
3573 ram_addr_t memory, ram_addr_t region_offset)
db7b5426
BS
3574{
3575 int idx, eidx;
3576
3577 if (start >= TARGET_PAGE_SIZE || end >= TARGET_PAGE_SIZE)
3578 return -1;
3579 idx = SUBPAGE_IDX(start);
3580 eidx = SUBPAGE_IDX(end);
3581#if defined(DEBUG_SUBPAGE)
0bf9e31a 3582 printf("%s: %p start %08x end %08x idx %08x eidx %08x mem %ld\n", __func__,
db7b5426
BS
3583 mmio, start, end, idx, eidx, memory);
3584#endif
95c318f5
GN
3585 if ((memory & ~TARGET_PAGE_MASK) == IO_MEM_RAM)
3586 memory = IO_MEM_UNASSIGNED;
f6405247 3587 memory = (memory >> IO_MEM_SHIFT) & (IO_MEM_NB_ENTRIES - 1);
db7b5426 3588 for (; idx <= eidx; idx++) {
f6405247
RH
3589 mmio->sub_io_index[idx] = memory;
3590 mmio->region_offset[idx] = region_offset;
db7b5426
BS
3591 }
3592
3593 return 0;
3594}
3595
f6405247
RH
3596static subpage_t *subpage_init (target_phys_addr_t base, ram_addr_t *phys,
3597 ram_addr_t orig_memory,
3598 ram_addr_t region_offset)
db7b5426 3599{
c227f099 3600 subpage_t *mmio;
db7b5426
BS
3601 int subpage_memory;
3602
c227f099 3603 mmio = qemu_mallocz(sizeof(subpage_t));
1eec614b
AL
3604
3605 mmio->base = base;
2507c12a
AG
3606 subpage_memory = cpu_register_io_memory(subpage_read, subpage_write, mmio,
3607 DEVICE_NATIVE_ENDIAN);
db7b5426 3608#if defined(DEBUG_SUBPAGE)
1eec614b
AL
3609 printf("%s: %p base " TARGET_FMT_plx " len %08x %d\n", __func__,
3610 mmio, base, TARGET_PAGE_SIZE, subpage_memory);
db7b5426 3611#endif
1eec614b 3612 *phys = subpage_memory | IO_MEM_SUBPAGE;
f6405247 3613 subpage_register(mmio, 0, TARGET_PAGE_SIZE-1, orig_memory, region_offset);
db7b5426
BS
3614
3615 return mmio;
3616}
3617
88715657
AL
3618static int get_free_io_mem_idx(void)
3619{
3620 int i;
3621
3622 for (i = 0; i<IO_MEM_NB_ENTRIES; i++)
3623 if (!io_mem_used[i]) {
3624 io_mem_used[i] = 1;
3625 return i;
3626 }
c6703b47 3627 fprintf(stderr, "Ran out of io_mem_idx, max %d!\n", IO_MEM_NB_ENTRIES);
88715657
AL
3628 return -1;
3629}
3630
dd310534
AG
3631/*
3632 * Usually, devices operate in little endian mode. There are devices out
3633 * there that operate in big endian too. Each device gets byte swapped
3634 * mmio if plugged onto a CPU of the other endianness.
3635 *
3636 * CPU Device swap?
3637 *
3638 * little little no
3639 * little big yes
3640 * big little yes
3641 * big big no
3642 */
3643
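/* Illustrative sketch, not part of exec.c: the table above boils down to
   "swap exactly when the target CPU and the device disagree".  As a
   predicate (hypothetical helper, not used by this file): */
static inline int mmio_needs_bswap(enum device_endian endian)
{
#ifdef TARGET_WORDS_BIGENDIAN
    return endian == DEVICE_LITTLE_ENDIAN;
#else
    return endian == DEVICE_BIG_ENDIAN;
#endif
}
/* cpu_register_io_memory_fixed() below applies the same rule through its
   switch on 'endian' and swapendian_init(). */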
3644typedef struct SwapEndianContainer {
3645 CPUReadMemoryFunc *read[3];
3646 CPUWriteMemoryFunc *write[3];
3647 void *opaque;
3648} SwapEndianContainer;
3649
3650static uint32_t swapendian_mem_readb (void *opaque, target_phys_addr_t addr)
3651{
3652 uint32_t val;
3653 SwapEndianContainer *c = opaque;
3654 val = c->read[0](c->opaque, addr);
3655 return val;
3656}
3657
3658static uint32_t swapendian_mem_readw(void *opaque, target_phys_addr_t addr)
3659{
3660 uint32_t val;
3661 SwapEndianContainer *c = opaque;
3662 val = bswap16(c->read[1](c->opaque, addr));
3663 return val;
3664}
3665
3666static uint32_t swapendian_mem_readl(void *opaque, target_phys_addr_t addr)
3667{
3668 uint32_t val;
3669 SwapEndianContainer *c = opaque;
3670 val = bswap32(c->read[2](c->opaque, addr));
3671 return val;
3672}
3673
3674static CPUReadMemoryFunc * const swapendian_readfn[3]={
3675 swapendian_mem_readb,
3676 swapendian_mem_readw,
3677 swapendian_mem_readl
3678};
3679
3680static void swapendian_mem_writeb(void *opaque, target_phys_addr_t addr,
3681 uint32_t val)
3682{
3683 SwapEndianContainer *c = opaque;
3684 c->write[0](c->opaque, addr, val);
3685}
3686
3687static void swapendian_mem_writew(void *opaque, target_phys_addr_t addr,
3688 uint32_t val)
3689{
3690 SwapEndianContainer *c = opaque;
3691 c->write[1](c->opaque, addr, bswap16(val));
3692}
3693
3694static void swapendian_mem_writel(void *opaque, target_phys_addr_t addr,
3695 uint32_t val)
3696{
3697 SwapEndianContainer *c = opaque;
3698 c->write[2](c->opaque, addr, bswap32(val));
3699}
3700
3701static CPUWriteMemoryFunc * const swapendian_writefn[3]={
3702 swapendian_mem_writeb,
3703 swapendian_mem_writew,
3704 swapendian_mem_writel
3705};
3706
3707static void swapendian_init(int io_index)
3708{
3709 SwapEndianContainer *c = qemu_malloc(sizeof(SwapEndianContainer));
3710 int i;
3711
3712 /* Swap mmio for big endian targets */
3713 c->opaque = io_mem_opaque[io_index];
3714 for (i = 0; i < 3; i++) {
3715 c->read[i] = io_mem_read[io_index][i];
3716 c->write[i] = io_mem_write[io_index][i];
3717
3718 io_mem_read[io_index][i] = swapendian_readfn[i];
3719 io_mem_write[io_index][i] = swapendian_writefn[i];
3720 }
3721 io_mem_opaque[io_index] = c;
3722}
3723
3724static void swapendian_del(int io_index)
3725{
3726 if (io_mem_read[io_index][0] == swapendian_readfn[0]) {
3727 qemu_free(io_mem_opaque[io_index]);
3728 }
3729}
3730
33417e70
FB
3731/* mem_read and mem_write are arrays of functions containing the
3732 function to access byte (index 0), word (index 1) and dword (index
0b4e6e3e 3733 2). Functions can be omitted with a NULL function pointer.
3ee89922 3734 If io_index is non-zero, the corresponding io zone is
4254fab8
BS
3735 modified. If it is zero, a new io zone is allocated. The return
3736 value can be used with cpu_register_physical_memory(). (-1) is
3737 returned on error. */
1eed09cb 3738static int cpu_register_io_memory_fixed(int io_index,
d60efc6b
BS
3739 CPUReadMemoryFunc * const *mem_read,
3740 CPUWriteMemoryFunc * const *mem_write,
dd310534 3741 void *opaque, enum device_endian endian)
33417e70 3742{
3cab721d
RH
3743 int i;
3744
33417e70 3745 if (io_index <= 0) {
88715657
AL
3746 io_index = get_free_io_mem_idx();
3747 if (io_index == -1)
3748 return io_index;
33417e70 3749 } else {
1eed09cb 3750 io_index >>= IO_MEM_SHIFT;
33417e70
FB
3751 if (io_index >= IO_MEM_NB_ENTRIES)
3752 return -1;
3753 }
b5ff1b31 3754
3cab721d
RH
3755 for (i = 0; i < 3; ++i) {
3756 io_mem_read[io_index][i]
3757 = (mem_read[i] ? mem_read[i] : unassigned_mem_read[i]);
3758 }
3759 for (i = 0; i < 3; ++i) {
3760 io_mem_write[io_index][i]
3761 = (mem_write[i] ? mem_write[i] : unassigned_mem_write[i]);
3762 }
a4193c8a 3763 io_mem_opaque[io_index] = opaque;
f6405247 3764
dd310534
AG
3765 switch (endian) {
3766 case DEVICE_BIG_ENDIAN:
3767#ifndef TARGET_WORDS_BIGENDIAN
3768 swapendian_init(io_index);
3769#endif
3770 break;
3771 case DEVICE_LITTLE_ENDIAN:
3772#ifdef TARGET_WORDS_BIGENDIAN
3773 swapendian_init(io_index);
3774#endif
3775 break;
3776 case DEVICE_NATIVE_ENDIAN:
3777 default:
3778 break;
3779 }
3780
f6405247 3781 return (io_index << IO_MEM_SHIFT);
33417e70 3782}
61382a50 3783
d60efc6b
BS
3784int cpu_register_io_memory(CPUReadMemoryFunc * const *mem_read,
3785 CPUWriteMemoryFunc * const *mem_write,
dd310534 3786 void *opaque, enum device_endian endian)
1eed09cb 3787{
2507c12a 3788 return cpu_register_io_memory_fixed(0, mem_read, mem_write, opaque, endian);
1eed09cb
AK
3789}
3790
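/* Illustrative sketch, not part of exec.c: how a device typically uses the
   registration API above.  The device state, handlers, base address and
   size are hypothetical; cpu_register_io_memory() and
   cpu_register_physical_memory() are the real entry points. */
typedef struct ExampleDevState {
    uint32_t reg;
} ExampleDevState;

static uint32_t example_dev_readl(void *opaque, target_phys_addr_t addr)
{
    ExampleDevState *s = opaque;
    return s->reg;                      /* same value for every offset */
}

static void example_dev_writel(void *opaque, target_phys_addr_t addr,
                               uint32_t val)
{
    ExampleDevState *s = opaque;
    s->reg = val;
}

static CPUReadMemoryFunc * const example_dev_read[3] = {
    NULL, NULL, example_dev_readl,      /* NULL entries fall back to
                                           unassigned_mem_read */
};

static CPUWriteMemoryFunc * const example_dev_write[3] = {
    NULL, NULL, example_dev_writel,
};

static void example_dev_map(ExampleDevState *s, target_phys_addr_t base)
{
    int io = cpu_register_io_memory(example_dev_read, example_dev_write, s,
                                    DEVICE_NATIVE_ENDIAN);
    /* the return value already carries the IO_MEM_SHIFT encoding */
    cpu_register_physical_memory(base, TARGET_PAGE_SIZE, io);
}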
88715657
AL
3791void cpu_unregister_io_memory(int io_table_address)
3792{
3793 int i;
3794 int io_index = io_table_address >> IO_MEM_SHIFT;
3795
dd310534
AG
3796 swapendian_del(io_index);
3797
88715657
AL
3798 for (i=0;i < 3; i++) {
3799 io_mem_read[io_index][i] = unassigned_mem_read[i];
3800 io_mem_write[io_index][i] = unassigned_mem_write[i];
3801 }
3802 io_mem_opaque[io_index] = NULL;
3803 io_mem_used[io_index] = 0;
3804}
3805
e9179ce1
AK
3806static void io_mem_init(void)
3807{
3808 int i;
3809
2507c12a
AG
3810 cpu_register_io_memory_fixed(IO_MEM_ROM, error_mem_read,
3811 unassigned_mem_write, NULL,
3812 DEVICE_NATIVE_ENDIAN);
3813 cpu_register_io_memory_fixed(IO_MEM_UNASSIGNED, unassigned_mem_read,
3814 unassigned_mem_write, NULL,
3815 DEVICE_NATIVE_ENDIAN);
3816 cpu_register_io_memory_fixed(IO_MEM_NOTDIRTY, error_mem_read,
3817 notdirty_mem_write, NULL,
3818 DEVICE_NATIVE_ENDIAN);
e9179ce1
AK
3819 for (i=0; i<5; i++)
3820 io_mem_used[i] = 1;
3821
3822 io_mem_watch = cpu_register_io_memory(watch_mem_read,
2507c12a
AG
3823 watch_mem_write, NULL,
3824 DEVICE_NATIVE_ENDIAN);
e9179ce1
AK
3825}
3826
62152b8a
AK
3827static void memory_map_init(void)
3828{
3829 system_memory = qemu_malloc(sizeof(*system_memory));
8417cebf 3830 memory_region_init(system_memory, "system", INT64_MAX);
62152b8a
AK
3831 set_system_memory_map(system_memory);
3832}
3833
3834MemoryRegion *get_system_memory(void)
3835{
3836 return system_memory;
3837}
3838
e2eef170
PB
3839#endif /* !defined(CONFIG_USER_ONLY) */
3840
13eb76e0
FB
3841/* physical memory access (slow version, mainly for debug) */
3842#if defined(CONFIG_USER_ONLY)
a68fe89c
PB
3843int cpu_memory_rw_debug(CPUState *env, target_ulong addr,
3844 uint8_t *buf, int len, int is_write)
13eb76e0
FB
3845{
3846 int l, flags;
3847 target_ulong page;
53a5960a 3848 void * p;
13eb76e0
FB
3849
3850 while (len > 0) {
3851 page = addr & TARGET_PAGE_MASK;
3852 l = (page + TARGET_PAGE_SIZE) - addr;
3853 if (l > len)
3854 l = len;
3855 flags = page_get_flags(page);
3856 if (!(flags & PAGE_VALID))
a68fe89c 3857 return -1;
13eb76e0
FB
3858 if (is_write) {
3859 if (!(flags & PAGE_WRITE))
a68fe89c 3860 return -1;
579a97f7 3861 /* XXX: this code should not depend on lock_user */
72fb7daa 3862 if (!(p = lock_user(VERIFY_WRITE, addr, l, 0)))
a68fe89c 3863 return -1;
72fb7daa
AJ
3864 memcpy(p, buf, l);
3865 unlock_user(p, addr, l);
13eb76e0
FB
3866 } else {
3867 if (!(flags & PAGE_READ))
a68fe89c 3868 return -1;
579a97f7 3869 /* XXX: this code should not depend on lock_user */
72fb7daa 3870 if (!(p = lock_user(VERIFY_READ, addr, l, 1)))
a68fe89c 3871 return -1;
72fb7daa 3872 memcpy(buf, p, l);
5b257578 3873 unlock_user(p, addr, 0);
13eb76e0
FB
3874 }
3875 len -= l;
3876 buf += l;
3877 addr += l;
3878 }
a68fe89c 3879 return 0;
13eb76e0 3880}
8df1cd07 3881
13eb76e0 3882#else
c227f099 3883void cpu_physical_memory_rw(target_phys_addr_t addr, uint8_t *buf,
13eb76e0
FB
3884 int len, int is_write)
3885{
3886 int l, io_index;
3887 uint8_t *ptr;
3888 uint32_t val;
c227f099 3889 target_phys_addr_t page;
8ca5692d 3890 ram_addr_t pd;
92e873b9 3891 PhysPageDesc *p;
3b46e624 3892
13eb76e0
FB
3893 while (len > 0) {
3894 page = addr & TARGET_PAGE_MASK;
3895 l = (page + TARGET_PAGE_SIZE) - addr;
3896 if (l > len)
3897 l = len;
92e873b9 3898 p = phys_page_find(page >> TARGET_PAGE_BITS);
13eb76e0
FB
3899 if (!p) {
3900 pd = IO_MEM_UNASSIGNED;
3901 } else {
3902 pd = p->phys_offset;
3903 }
3b46e624 3904
13eb76e0 3905 if (is_write) {
3a7d929e 3906 if ((pd & ~TARGET_PAGE_MASK) != IO_MEM_RAM) {
c227f099 3907 target_phys_addr_t addr1 = addr;
13eb76e0 3908 io_index = (pd >> IO_MEM_SHIFT) & (IO_MEM_NB_ENTRIES - 1);
8da3ff18 3909 if (p)
6c2934db 3910 addr1 = (addr & ~TARGET_PAGE_MASK) + p->region_offset;
6a00d601
FB
3911 /* XXX: could force cpu_single_env to NULL to avoid
3912 potential bugs */
6c2934db 3913 if (l >= 4 && ((addr1 & 3) == 0)) {
1c213d19 3914 /* 32 bit write access */
c27004ec 3915 val = ldl_p(buf);
6c2934db 3916 io_mem_write[io_index][2](io_mem_opaque[io_index], addr1, val);
13eb76e0 3917 l = 4;
6c2934db 3918 } else if (l >= 2 && ((addr1 & 1) == 0)) {
1c213d19 3919 /* 16 bit write access */
c27004ec 3920 val = lduw_p(buf);
6c2934db 3921 io_mem_write[io_index][1](io_mem_opaque[io_index], addr1, val);
13eb76e0
FB
3922 l = 2;
3923 } else {
1c213d19 3924 /* 8 bit write access */
c27004ec 3925 val = ldub_p(buf);
6c2934db 3926 io_mem_write[io_index][0](io_mem_opaque[io_index], addr1, val);
13eb76e0
FB
3927 l = 1;
3928 }
3929 } else {
8ca5692d 3930 ram_addr_t addr1;
b448f2f3 3931 addr1 = (pd & TARGET_PAGE_MASK) + (addr & ~TARGET_PAGE_MASK);
13eb76e0 3932 /* RAM case */
5579c7f3 3933 ptr = qemu_get_ram_ptr(addr1);
13eb76e0 3934 memcpy(ptr, buf, l);
3a7d929e
FB
3935 if (!cpu_physical_memory_is_dirty(addr1)) {
3936 /* invalidate code */
3937 tb_invalidate_phys_page_range(addr1, addr1 + l, 0);
3938 /* set dirty bit */
f7c11b53
YT
3939 cpu_physical_memory_set_dirty_flags(
3940 addr1, (0xff & ~CODE_DIRTY_FLAG));
3a7d929e 3941 }
050a0ddf 3942 qemu_put_ram_ptr(ptr);
13eb76e0
FB
3943 }
3944 } else {
5fafdf24 3945 if ((pd & ~TARGET_PAGE_MASK) > IO_MEM_ROM &&
2a4188a3 3946 !(pd & IO_MEM_ROMD)) {
c227f099 3947 target_phys_addr_t addr1 = addr;
13eb76e0
FB
3948 /* I/O case */
3949 io_index = (pd >> IO_MEM_SHIFT) & (IO_MEM_NB_ENTRIES - 1);
8da3ff18 3950 if (p)
6c2934db
AJ
3951 addr1 = (addr & ~TARGET_PAGE_MASK) + p->region_offset;
3952 if (l >= 4 && ((addr1 & 3) == 0)) {
13eb76e0 3953 /* 32 bit read access */
6c2934db 3954 val = io_mem_read[io_index][2](io_mem_opaque[io_index], addr1);
c27004ec 3955 stl_p(buf, val);
13eb76e0 3956 l = 4;
6c2934db 3957 } else if (l >= 2 && ((addr1 & 1) == 0)) {
13eb76e0 3958 /* 16 bit read access */
6c2934db 3959 val = io_mem_read[io_index][1](io_mem_opaque[io_index], addr1);
c27004ec 3960 stw_p(buf, val);
13eb76e0
FB
3961 l = 2;
3962 } else {
1c213d19 3963 /* 8 bit read access */
6c2934db 3964 val = io_mem_read[io_index][0](io_mem_opaque[io_index], addr1);
c27004ec 3965 stb_p(buf, val);
13eb76e0
FB
3966 l = 1;
3967 }
3968 } else {
3969 /* RAM case */
050a0ddf
AP
3970 ptr = qemu_get_ram_ptr(pd & TARGET_PAGE_MASK);
3971 memcpy(buf, ptr + (addr & ~TARGET_PAGE_MASK), l);
3972 qemu_put_ram_ptr(ptr);
13eb76e0
FB
3973 }
3974 }
3975 len -= l;
3976 buf += l;
3977 addr += l;
3978 }
3979}
8df1cd07 3980
d0ecd2aa 3981/* used for ROM loading : can write in RAM and ROM */
c227f099 3982void cpu_physical_memory_write_rom(target_phys_addr_t addr,
d0ecd2aa
FB
3983 const uint8_t *buf, int len)
3984{
3985 int l;
3986 uint8_t *ptr;
c227f099 3987 target_phys_addr_t page;
d0ecd2aa
FB
3988 unsigned long pd;
3989 PhysPageDesc *p;
3b46e624 3990
d0ecd2aa
FB
3991 while (len > 0) {
3992 page = addr & TARGET_PAGE_MASK;
3993 l = (page + TARGET_PAGE_SIZE) - addr;
3994 if (l > len)
3995 l = len;
3996 p = phys_page_find(page >> TARGET_PAGE_BITS);
3997 if (!p) {
3998 pd = IO_MEM_UNASSIGNED;
3999 } else {
4000 pd = p->phys_offset;
4001 }
3b46e624 4002
d0ecd2aa 4003 if ((pd & ~TARGET_PAGE_MASK) != IO_MEM_RAM &&
2a4188a3
FB
4004 (pd & ~TARGET_PAGE_MASK) != IO_MEM_ROM &&
4005 !(pd & IO_MEM_ROMD)) {
d0ecd2aa
FB
4006 /* do nothing */
4007 } else {
4008 unsigned long addr1;
4009 addr1 = (pd & TARGET_PAGE_MASK) + (addr & ~TARGET_PAGE_MASK);
4010 /* ROM/RAM case */
5579c7f3 4011 ptr = qemu_get_ram_ptr(addr1);
d0ecd2aa 4012 memcpy(ptr, buf, l);
050a0ddf 4013 qemu_put_ram_ptr(ptr);
d0ecd2aa
FB
4014 }
4015 len -= l;
4016 buf += l;
4017 addr += l;
4018 }
4019}
4020
6d16c2f8
AL
4021typedef struct {
4022 void *buffer;
c227f099
AL
4023 target_phys_addr_t addr;
4024 target_phys_addr_t len;
6d16c2f8
AL
4025} BounceBuffer;
4026
4027static BounceBuffer bounce;
4028
ba223c29
AL
4029typedef struct MapClient {
4030 void *opaque;
4031 void (*callback)(void *opaque);
72cf2d4f 4032 QLIST_ENTRY(MapClient) link;
ba223c29
AL
4033} MapClient;
4034
72cf2d4f
BS
4035static QLIST_HEAD(map_client_list, MapClient) map_client_list
4036 = QLIST_HEAD_INITIALIZER(map_client_list);
ba223c29
AL
4037
4038void *cpu_register_map_client(void *opaque, void (*callback)(void *opaque))
4039{
4040 MapClient *client = qemu_malloc(sizeof(*client));
4041
4042 client->opaque = opaque;
4043 client->callback = callback;
72cf2d4f 4044 QLIST_INSERT_HEAD(&map_client_list, client, link);
ba223c29
AL
4045 return client;
4046}
4047
4048void cpu_unregister_map_client(void *_client)
4049{
4050 MapClient *client = (MapClient *)_client;
4051
72cf2d4f 4052 QLIST_REMOVE(client, link);
34d5e948 4053 qemu_free(client);
ba223c29
AL
4054}
4055
4056static void cpu_notify_map_clients(void)
4057{
4058 MapClient *client;
4059
72cf2d4f
BS
4060 while (!QLIST_EMPTY(&map_client_list)) {
4061 client = QLIST_FIRST(&map_client_list);
ba223c29 4062 client->callback(client->opaque);
34d5e948 4063 cpu_unregister_map_client(client);
ba223c29
AL
4064 }
4065}
4066
6d16c2f8
AL
4067/* Map a physical memory region into a host virtual address.
4068 * May map a subset of the requested range, given by and returned in *plen.
4069 * May return NULL if resources needed to perform the mapping are exhausted.
4070 * Use only for reads OR writes - not for read-modify-write operations.
ba223c29
AL
4071 * Use cpu_register_map_client() to know when retrying the map operation is
4072 * likely to succeed.
6d16c2f8 4073 */
c227f099
AL
4074void *cpu_physical_memory_map(target_phys_addr_t addr,
4075 target_phys_addr_t *plen,
6d16c2f8
AL
4076 int is_write)
4077{
c227f099 4078 target_phys_addr_t len = *plen;
38bee5dc 4079 target_phys_addr_t todo = 0;
6d16c2f8 4080 int l;
c227f099 4081 target_phys_addr_t page;
6d16c2f8
AL
4082 unsigned long pd;
4083 PhysPageDesc *p;
f15fbc4b 4084 ram_addr_t raddr = RAM_ADDR_MAX;
8ab934f9
SS
4085 ram_addr_t rlen;
4086 void *ret;
6d16c2f8
AL
4087
4088 while (len > 0) {
4089 page = addr & TARGET_PAGE_MASK;
4090 l = (page + TARGET_PAGE_SIZE) - addr;
4091 if (l > len)
4092 l = len;
4093 p = phys_page_find(page >> TARGET_PAGE_BITS);
4094 if (!p) {
4095 pd = IO_MEM_UNASSIGNED;
4096 } else {
4097 pd = p->phys_offset;
4098 }
4099
4100 if ((pd & ~TARGET_PAGE_MASK) != IO_MEM_RAM) {
38bee5dc 4101 if (todo || bounce.buffer) {
6d16c2f8
AL
4102 break;
4103 }
4104 bounce.buffer = qemu_memalign(TARGET_PAGE_SIZE, TARGET_PAGE_SIZE);
4105 bounce.addr = addr;
4106 bounce.len = l;
4107 if (!is_write) {
54f7b4a3 4108 cpu_physical_memory_read(addr, bounce.buffer, l);
6d16c2f8 4109 }
38bee5dc
SS
4110
4111 *plen = l;
4112 return bounce.buffer;
6d16c2f8 4113 }
8ab934f9
SS
4114 if (!todo) {
4115 raddr = (pd & TARGET_PAGE_MASK) + (addr & ~TARGET_PAGE_MASK);
4116 }
6d16c2f8
AL
4117
4118 len -= l;
4119 addr += l;
38bee5dc 4120 todo += l;
6d16c2f8 4121 }
8ab934f9
SS
4122 rlen = todo;
4123 ret = qemu_ram_ptr_length(raddr, &rlen);
4124 *plen = rlen;
4125 return ret;
6d16c2f8
AL
4126}
4127
4128/* Unmaps a memory region previously mapped by cpu_physical_memory_map().
4129 * Will also mark the memory as dirty if is_write == 1. access_len gives
4130 * the amount of memory that was actually read or written by the caller.
4131 */
c227f099
AL
4132void cpu_physical_memory_unmap(void *buffer, target_phys_addr_t len,
4133 int is_write, target_phys_addr_t access_len)
6d16c2f8
AL
4134{
4135 if (buffer != bounce.buffer) {
4136 if (is_write) {
e890261f 4137 ram_addr_t addr1 = qemu_ram_addr_from_host_nofail(buffer);
6d16c2f8
AL
4138 while (access_len) {
4139 unsigned l;
4140 l = TARGET_PAGE_SIZE;
4141 if (l > access_len)
4142 l = access_len;
4143 if (!cpu_physical_memory_is_dirty(addr1)) {
4144 /* invalidate code */
4145 tb_invalidate_phys_page_range(addr1, addr1 + l, 0);
4146 /* set dirty bit */
f7c11b53
YT
4147 cpu_physical_memory_set_dirty_flags(
4148 addr1, (0xff & ~CODE_DIRTY_FLAG));
6d16c2f8
AL
4149 }
4150 addr1 += l;
4151 access_len -= l;
4152 }
4153 }
868bb33f 4154 if (xen_enabled()) {
e41d7c69 4155 xen_invalidate_map_cache_entry(buffer);
050a0ddf 4156 }
6d16c2f8
AL
4157 return;
4158 }
4159 if (is_write) {
4160 cpu_physical_memory_write(bounce.addr, bounce.buffer, access_len);
4161 }
f8a83245 4162 qemu_vfree(bounce.buffer);
6d16c2f8 4163 bounce.buffer = NULL;
ba223c29 4164 cpu_notify_map_clients();
6d16c2f8 4165}
d0ecd2aa 4166
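/* Illustrative sketch, not part of exec.c: the intended calling pattern for
   cpu_physical_memory_map()/unmap() above, including the bounce-buffer
   retry path.  The helper names and the retry bookkeeping are hypothetical;
   only the map/unmap/register_map_client calls are the real API. */
static void example_dma_retry(void *opaque)
{
    /* a previously exhausted mapping (the bounce buffer) was released;
       the caller would normally restart its transfer here */
}

static void example_dma_write(target_phys_addr_t addr, const uint8_t *buf,
                              target_phys_addr_t len)
{
    target_phys_addr_t plen = len;
    void *p = cpu_physical_memory_map(addr, &plen, 1 /* is_write */);

    if (!p) {
        /* resources exhausted: be notified when a retry is likely to work */
        cpu_register_map_client(NULL, example_dma_retry);
        return;
    }
    /* plen may come back smaller than len; only that much is mapped */
    memcpy(p, buf, plen);
    cpu_physical_memory_unmap(p, plen, 1 /* is_write */, plen);
}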
8df1cd07 4167/* warning: addr must be aligned */
1e78bcc1
AG
4168static inline uint32_t ldl_phys_internal(target_phys_addr_t addr,
4169 enum device_endian endian)
8df1cd07
FB
4170{
4171 int io_index;
4172 uint8_t *ptr;
4173 uint32_t val;
4174 unsigned long pd;
4175 PhysPageDesc *p;
4176
4177 p = phys_page_find(addr >> TARGET_PAGE_BITS);
4178 if (!p) {
4179 pd = IO_MEM_UNASSIGNED;
4180 } else {
4181 pd = p->phys_offset;
4182 }
3b46e624 4183
5fafdf24 4184 if ((pd & ~TARGET_PAGE_MASK) > IO_MEM_ROM &&
2a4188a3 4185 !(pd & IO_MEM_ROMD)) {
8df1cd07
FB
4186 /* I/O case */
4187 io_index = (pd >> IO_MEM_SHIFT) & (IO_MEM_NB_ENTRIES - 1);
8da3ff18
PB
4188 if (p)
4189 addr = (addr & ~TARGET_PAGE_MASK) + p->region_offset;
8df1cd07 4190 val = io_mem_read[io_index][2](io_mem_opaque[io_index], addr);
1e78bcc1
AG
4191#if defined(TARGET_WORDS_BIGENDIAN)
4192 if (endian == DEVICE_LITTLE_ENDIAN) {
4193 val = bswap32(val);
4194 }
4195#else
4196 if (endian == DEVICE_BIG_ENDIAN) {
4197 val = bswap32(val);
4198 }
4199#endif
8df1cd07
FB
4200 } else {
4201 /* RAM case */
5579c7f3 4202 ptr = qemu_get_ram_ptr(pd & TARGET_PAGE_MASK) +
8df1cd07 4203 (addr & ~TARGET_PAGE_MASK);
1e78bcc1
AG
4204 switch (endian) {
4205 case DEVICE_LITTLE_ENDIAN:
4206 val = ldl_le_p(ptr);
4207 break;
4208 case DEVICE_BIG_ENDIAN:
4209 val = ldl_be_p(ptr);
4210 break;
4211 default:
4212 val = ldl_p(ptr);
4213 break;
4214 }
8df1cd07
FB
4215 }
4216 return val;
4217}
4218
1e78bcc1
AG
4219uint32_t ldl_phys(target_phys_addr_t addr)
4220{
4221 return ldl_phys_internal(addr, DEVICE_NATIVE_ENDIAN);
4222}
4223
4224uint32_t ldl_le_phys(target_phys_addr_t addr)
4225{
4226 return ldl_phys_internal(addr, DEVICE_LITTLE_ENDIAN);
4227}
4228
4229uint32_t ldl_be_phys(target_phys_addr_t addr)
4230{
4231 return ldl_phys_internal(addr, DEVICE_BIG_ENDIAN);
4232}
4233
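/* Illustrative sketch, not part of exec.c: the _le/_be variants above read
   data whose byte order is fixed by a device or descriptor format rather
   than by the guest CPU.  The descriptor layout and address are
   hypothetical. */
static uint64_t example_read_le_descriptor(target_phys_addr_t desc_addr)
{
    /* a 4-byte length followed by a 4-byte flags word, both little endian
       regardless of TARGET_WORDS_BIGENDIAN */
    uint32_t len   = ldl_le_phys(desc_addr);
    uint32_t flags = ldl_le_phys(desc_addr + 4);

    return ((uint64_t)flags << 32) | len;
}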
84b7b8e7 4234/* warning: addr must be aligned */
1e78bcc1
AG
4235static inline uint64_t ldq_phys_internal(target_phys_addr_t addr,
4236 enum device_endian endian)
84b7b8e7
FB
4237{
4238 int io_index;
4239 uint8_t *ptr;
4240 uint64_t val;
4241 unsigned long pd;
4242 PhysPageDesc *p;
4243
4244 p = phys_page_find(addr >> TARGET_PAGE_BITS);
4245 if (!p) {
4246 pd = IO_MEM_UNASSIGNED;
4247 } else {
4248 pd = p->phys_offset;
4249 }
3b46e624 4250
2a4188a3
FB
4251 if ((pd & ~TARGET_PAGE_MASK) > IO_MEM_ROM &&
4252 !(pd & IO_MEM_ROMD)) {
84b7b8e7
FB
4253 /* I/O case */
4254 io_index = (pd >> IO_MEM_SHIFT) & (IO_MEM_NB_ENTRIES - 1);
8da3ff18
PB
4255 if (p)
4256 addr = (addr & ~TARGET_PAGE_MASK) + p->region_offset;
1e78bcc1
AG
4257
4258 /* XXX This is broken when device endian != cpu endian.
4259 Fix and add "endian" variable check */
84b7b8e7
FB
4260#ifdef TARGET_WORDS_BIGENDIAN
4261 val = (uint64_t)io_mem_read[io_index][2](io_mem_opaque[io_index], addr) << 32;
4262 val |= io_mem_read[io_index][2](io_mem_opaque[io_index], addr + 4);
4263#else
4264 val = io_mem_read[io_index][2](io_mem_opaque[io_index], addr);
4265 val |= (uint64_t)io_mem_read[io_index][2](io_mem_opaque[io_index], addr + 4) << 32;
4266#endif
4267 } else {
4268 /* RAM case */
5579c7f3 4269 ptr = qemu_get_ram_ptr(pd & TARGET_PAGE_MASK) +
84b7b8e7 4270 (addr & ~TARGET_PAGE_MASK);
1e78bcc1
AG
4271 switch (endian) {
4272 case DEVICE_LITTLE_ENDIAN:
4273 val = ldq_le_p(ptr);
4274 break;
4275 case DEVICE_BIG_ENDIAN:
4276 val = ldq_be_p(ptr);
4277 break;
4278 default:
4279 val = ldq_p(ptr);
4280 break;
4281 }
84b7b8e7
FB
4282 }
4283 return val;
4284}
4285
1e78bcc1
AG
4286uint64_t ldq_phys(target_phys_addr_t addr)
4287{
4288 return ldq_phys_internal(addr, DEVICE_NATIVE_ENDIAN);
4289}
4290
4291uint64_t ldq_le_phys(target_phys_addr_t addr)
4292{
4293 return ldq_phys_internal(addr, DEVICE_LITTLE_ENDIAN);
4294}
4295
4296uint64_t ldq_be_phys(target_phys_addr_t addr)
4297{
4298 return ldq_phys_internal(addr, DEVICE_BIG_ENDIAN);
4299}
4300
aab33094 4301/* XXX: optimize */
c227f099 4302uint32_t ldub_phys(target_phys_addr_t addr)
aab33094
FB
4303{
4304 uint8_t val;
4305 cpu_physical_memory_read(addr, &val, 1);
4306 return val;
4307}
4308
733f0b02 4309/* warning: addr must be aligned */
1e78bcc1
AG
4310static inline uint32_t lduw_phys_internal(target_phys_addr_t addr,
4311 enum device_endian endian)
aab33094 4312{
733f0b02
MT
4313 int io_index;
4314 uint8_t *ptr;
4315 uint64_t val;
4316 unsigned long pd;
4317 PhysPageDesc *p;
4318
4319 p = phys_page_find(addr >> TARGET_PAGE_BITS);
4320 if (!p) {
4321 pd = IO_MEM_UNASSIGNED;
4322 } else {
4323 pd = p->phys_offset;
4324 }
4325
4326 if ((pd & ~TARGET_PAGE_MASK) > IO_MEM_ROM &&
4327 !(pd & IO_MEM_ROMD)) {
4328 /* I/O case */
4329 io_index = (pd >> IO_MEM_SHIFT) & (IO_MEM_NB_ENTRIES - 1);
4330 if (p)
4331 addr = (addr & ~TARGET_PAGE_MASK) + p->region_offset;
4332 val = io_mem_read[io_index][1](io_mem_opaque[io_index], addr);
1e78bcc1
AG
4333#if defined(TARGET_WORDS_BIGENDIAN)
4334 if (endian == DEVICE_LITTLE_ENDIAN) {
4335 val = bswap16(val);
4336 }
4337#else
4338 if (endian == DEVICE_BIG_ENDIAN) {
4339 val = bswap16(val);
4340 }
4341#endif
733f0b02
MT
4342 } else {
4343 /* RAM case */
4344 ptr = qemu_get_ram_ptr(pd & TARGET_PAGE_MASK) +
4345 (addr & ~TARGET_PAGE_MASK);
1e78bcc1
AG
4346 switch (endian) {
4347 case DEVICE_LITTLE_ENDIAN:
4348 val = lduw_le_p(ptr);
4349 break;
4350 case DEVICE_BIG_ENDIAN:
4351 val = lduw_be_p(ptr);
4352 break;
4353 default:
4354 val = lduw_p(ptr);
4355 break;
4356 }
733f0b02
MT
4357 }
4358 return val;
aab33094
FB
4359}
4360
1e78bcc1
AG
4361uint32_t lduw_phys(target_phys_addr_t addr)
4362{
4363 return lduw_phys_internal(addr, DEVICE_NATIVE_ENDIAN);
4364}
4365
4366uint32_t lduw_le_phys(target_phys_addr_t addr)
4367{
4368 return lduw_phys_internal(addr, DEVICE_LITTLE_ENDIAN);
4369}
4370
4371uint32_t lduw_be_phys(target_phys_addr_t addr)
4372{
4373 return lduw_phys_internal(addr, DEVICE_BIG_ENDIAN);
4374}
4375
8df1cd07
FB
4376/* warning: addr must be aligned. The ram page is not marked as dirty
4377 and the code inside is not invalidated. It is useful if the dirty
4378 bits are used to track modified PTEs */
c227f099 4379void stl_phys_notdirty(target_phys_addr_t addr, uint32_t val)
8df1cd07
FB
4380{
4381 int io_index;
4382 uint8_t *ptr;
4383 unsigned long pd;
4384 PhysPageDesc *p;
4385
4386 p = phys_page_find(addr >> TARGET_PAGE_BITS);
4387 if (!p) {
4388 pd = IO_MEM_UNASSIGNED;
4389 } else {
4390 pd = p->phys_offset;
4391 }
3b46e624 4392
3a7d929e 4393 if ((pd & ~TARGET_PAGE_MASK) != IO_MEM_RAM) {
8df1cd07 4394 io_index = (pd >> IO_MEM_SHIFT) & (IO_MEM_NB_ENTRIES - 1);
8da3ff18
PB
4395 if (p)
4396 addr = (addr & ~TARGET_PAGE_MASK) + p->region_offset;
8df1cd07
FB
4397 io_mem_write[io_index][2](io_mem_opaque[io_index], addr, val);
4398 } else {
74576198 4399 unsigned long addr1 = (pd & TARGET_PAGE_MASK) + (addr & ~TARGET_PAGE_MASK);
5579c7f3 4400 ptr = qemu_get_ram_ptr(addr1);
8df1cd07 4401 stl_p(ptr, val);
74576198
AL
4402
4403 if (unlikely(in_migration)) {
4404 if (!cpu_physical_memory_is_dirty(addr1)) {
4405 /* invalidate code */
4406 tb_invalidate_phys_page_range(addr1, addr1 + 4, 0);
4407 /* set dirty bit */
f7c11b53
YT
4408 cpu_physical_memory_set_dirty_flags(
4409 addr1, (0xff & ~CODE_DIRTY_FLAG));
74576198
AL
4410 }
4411 }
8df1cd07
FB
4412 }
4413}
4414
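/* Illustrative sketch, not part of exec.c: the typical caller of
   stl_phys_notdirty() above is a target MMU walk updating accessed/dirty
   bits in a guest PTE.  The address and bit values are hypothetical
   (0x20/0x40 are merely example flag bits). */
static void example_set_pte_accessed_dirty(target_phys_addr_t pte_addr)
{
    uint32_t pte = ldl_phys(pte_addr);

    pte |= 0x20 | 0x40;                 /* e.g. accessed + dirty bits */
    /* deliberately skips dirty-bit tracking and TB invalidation for the
       page holding the PTE itself */
    stl_phys_notdirty(pte_addr, pte);
}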
c227f099 4415void stq_phys_notdirty(target_phys_addr_t addr, uint64_t val)
bc98a7ef
JM
4416{
4417 int io_index;
4418 uint8_t *ptr;
4419 unsigned long pd;
4420 PhysPageDesc *p;
4421
4422 p = phys_page_find(addr >> TARGET_PAGE_BITS);
4423 if (!p) {
4424 pd = IO_MEM_UNASSIGNED;
4425 } else {
4426 pd = p->phys_offset;
4427 }
3b46e624 4428
bc98a7ef
JM
4429 if ((pd & ~TARGET_PAGE_MASK) != IO_MEM_RAM) {
4430 io_index = (pd >> IO_MEM_SHIFT) & (IO_MEM_NB_ENTRIES - 1);
8da3ff18
PB
4431 if (p)
4432 addr = (addr & ~TARGET_PAGE_MASK) + p->region_offset;
bc98a7ef
JM
4433#ifdef TARGET_WORDS_BIGENDIAN
4434 io_mem_write[io_index][2](io_mem_opaque[io_index], addr, val >> 32);
4435 io_mem_write[io_index][2](io_mem_opaque[io_index], addr + 4, val);
4436#else
4437 io_mem_write[io_index][2](io_mem_opaque[io_index], addr, val);
4438 io_mem_write[io_index][2](io_mem_opaque[io_index], addr + 4, val >> 32);
4439#endif
4440 } else {
5579c7f3 4441 ptr = qemu_get_ram_ptr(pd & TARGET_PAGE_MASK) +
bc98a7ef
JM
4442 (addr & ~TARGET_PAGE_MASK);
4443 stq_p(ptr, val);
4444 }
4445}
4446
8df1cd07 4447/* warning: addr must be aligned */
1e78bcc1
AG
4448static inline void stl_phys_internal(target_phys_addr_t addr, uint32_t val,
4449 enum device_endian endian)
8df1cd07
FB
4450{
4451 int io_index;
4452 uint8_t *ptr;
4453 unsigned long pd;
4454 PhysPageDesc *p;
4455
4456 p = phys_page_find(addr >> TARGET_PAGE_BITS);
4457 if (!p) {
4458 pd = IO_MEM_UNASSIGNED;
4459 } else {
4460 pd = p->phys_offset;
4461 }
3b46e624 4462
3a7d929e 4463 if ((pd & ~TARGET_PAGE_MASK) != IO_MEM_RAM) {
8df1cd07 4464 io_index = (pd >> IO_MEM_SHIFT) & (IO_MEM_NB_ENTRIES - 1);
8da3ff18
PB
4465 if (p)
4466 addr = (addr & ~TARGET_PAGE_MASK) + p->region_offset;
1e78bcc1
AG
4467#if defined(TARGET_WORDS_BIGENDIAN)
4468 if (endian == DEVICE_LITTLE_ENDIAN) {
4469 val = bswap32(val);
4470 }
4471#else
4472 if (endian == DEVICE_BIG_ENDIAN) {
4473 val = bswap32(val);
4474 }
4475#endif
8df1cd07
FB
4476 io_mem_write[io_index][2](io_mem_opaque[io_index], addr, val);
4477 } else {
4478 unsigned long addr1;
4479 addr1 = (pd & TARGET_PAGE_MASK) + (addr & ~TARGET_PAGE_MASK);
4480 /* RAM case */
5579c7f3 4481 ptr = qemu_get_ram_ptr(addr1);
1e78bcc1
AG
4482 switch (endian) {
4483 case DEVICE_LITTLE_ENDIAN:
4484 stl_le_p(ptr, val);
4485 break;
4486 case DEVICE_BIG_ENDIAN:
4487 stl_be_p(ptr, val);
4488 break;
4489 default:
4490 stl_p(ptr, val);
4491 break;
4492 }
3a7d929e
FB
4493 if (!cpu_physical_memory_is_dirty(addr1)) {
4494 /* invalidate code */
4495 tb_invalidate_phys_page_range(addr1, addr1 + 4, 0);
4496 /* set dirty bit */
f7c11b53
YT
4497 cpu_physical_memory_set_dirty_flags(addr1,
4498 (0xff & ~CODE_DIRTY_FLAG));
3a7d929e 4499 }
8df1cd07
FB
4500 }
4501}
4502
1e78bcc1
AG
4503void stl_phys(target_phys_addr_t addr, uint32_t val)
4504{
4505 stl_phys_internal(addr, val, DEVICE_NATIVE_ENDIAN);
4506}
4507
4508void stl_le_phys(target_phys_addr_t addr, uint32_t val)
4509{
4510 stl_phys_internal(addr, val, DEVICE_LITTLE_ENDIAN);
4511}
4512
4513void stl_be_phys(target_phys_addr_t addr, uint32_t val)
4514{
4515 stl_phys_internal(addr, val, DEVICE_BIG_ENDIAN);
4516}
4517
aab33094 4518/* XXX: optimize */
c227f099 4519void stb_phys(target_phys_addr_t addr, uint32_t val)
aab33094
FB
4520{
4521 uint8_t v = val;
4522 cpu_physical_memory_write(addr, &v, 1);
4523}
4524
733f0b02 4525/* warning: addr must be aligned */
1e78bcc1
AG
4526static inline void stw_phys_internal(target_phys_addr_t addr, uint32_t val,
4527 enum device_endian endian)
aab33094 4528{
733f0b02
MT
4529 int io_index;
4530 uint8_t *ptr;
4531 unsigned long pd;
4532 PhysPageDesc *p;
4533
4534 p = phys_page_find(addr >> TARGET_PAGE_BITS);
4535 if (!p) {
4536 pd = IO_MEM_UNASSIGNED;
4537 } else {
4538 pd = p->phys_offset;
4539 }
4540
4541 if ((pd & ~TARGET_PAGE_MASK) != IO_MEM_RAM) {
4542 io_index = (pd >> IO_MEM_SHIFT) & (IO_MEM_NB_ENTRIES - 1);
4543 if (p)
4544 addr = (addr & ~TARGET_PAGE_MASK) + p->region_offset;
1e78bcc1
AG
4545#if defined(TARGET_WORDS_BIGENDIAN)
4546 if (endian == DEVICE_LITTLE_ENDIAN) {
4547 val = bswap16(val);
4548 }
4549#else
4550 if (endian == DEVICE_BIG_ENDIAN) {
4551 val = bswap16(val);
4552 }
4553#endif
733f0b02
MT
4554 io_mem_write[io_index][1](io_mem_opaque[io_index], addr, val);
4555 } else {
4556 unsigned long addr1;
4557 addr1 = (pd & TARGET_PAGE_MASK) + (addr & ~TARGET_PAGE_MASK);
4558 /* RAM case */
4559 ptr = qemu_get_ram_ptr(addr1);
1e78bcc1
AG
4560 switch (endian) {
4561 case DEVICE_LITTLE_ENDIAN:
4562 stw_le_p(ptr, val);
4563 break;
4564 case DEVICE_BIG_ENDIAN:
4565 stw_be_p(ptr, val);
4566 break;
4567 default:
4568 stw_p(ptr, val);
4569 break;
4570 }
733f0b02
MT
4571 if (!cpu_physical_memory_is_dirty(addr1)) {
4572 /* invalidate code */
4573 tb_invalidate_phys_page_range(addr1, addr1 + 2, 0);
4574 /* set dirty bit */
4575 cpu_physical_memory_set_dirty_flags(addr1,
4576 (0xff & ~CODE_DIRTY_FLAG));
4577 }
4578 }
aab33094
FB
4579}
4580
1e78bcc1
AG
4581void stw_phys(target_phys_addr_t addr, uint32_t val)
4582{
4583 stw_phys_internal(addr, val, DEVICE_NATIVE_ENDIAN);
4584}
4585
4586void stw_le_phys(target_phys_addr_t addr, uint32_t val)
4587{
4588 stw_phys_internal(addr, val, DEVICE_LITTLE_ENDIAN);
4589}
4590
4591void stw_be_phys(target_phys_addr_t addr, uint32_t val)
4592{
4593 stw_phys_internal(addr, val, DEVICE_BIG_ENDIAN);
4594}
4595
aab33094 4596/* XXX: optimize */
c227f099 4597void stq_phys(target_phys_addr_t addr, uint64_t val)
aab33094
FB
4598{
4599 val = tswap64(val);
71d2b725 4600 cpu_physical_memory_write(addr, &val, 8);
aab33094
FB
4601}
4602
1e78bcc1
AG
4603void stq_le_phys(target_phys_addr_t addr, uint64_t val)
4604{
4605 val = cpu_to_le64(val);
4606 cpu_physical_memory_write(addr, &val, 8);
4607}
4608
4609void stq_be_phys(target_phys_addr_t addr, uint64_t val)
4610{
4611 val = cpu_to_be64(val);
4612 cpu_physical_memory_write(addr, &val, 8);
4613}
4614
5e2972fd 4615/* virtual memory access for debug (includes writing to ROM) */
5fafdf24 4616int cpu_memory_rw_debug(CPUState *env, target_ulong addr,
b448f2f3 4617 uint8_t *buf, int len, int is_write)
13eb76e0
FB
4618{
4619 int l;
c227f099 4620 target_phys_addr_t phys_addr;
9b3c35e0 4621 target_ulong page;
13eb76e0
FB
4622
4623 while (len > 0) {
4624 page = addr & TARGET_PAGE_MASK;
4625 phys_addr = cpu_get_phys_page_debug(env, page);
4626 /* if no physical page mapped, return an error */
4627 if (phys_addr == -1)
4628 return -1;
4629 l = (page + TARGET_PAGE_SIZE) - addr;
4630 if (l > len)
4631 l = len;
5e2972fd 4632 phys_addr += (addr & ~TARGET_PAGE_MASK);
5e2972fd
AL
4633 if (is_write)
4634 cpu_physical_memory_write_rom(phys_addr, buf, l);
4635 else
5e2972fd 4636 cpu_physical_memory_rw(phys_addr, buf, l, is_write);
13eb76e0
FB
4637 len -= l;
4638 buf += l;
4639 addr += l;
4640 }
4641 return 0;
4642}
a68fe89c 4643#endif
13eb76e0 4644
2e70f6ef
PB
4645/* in deterministic execution mode, instructions doing device I/Os
4646 must be at the end of the TB */
4647void cpu_io_recompile(CPUState *env, void *retaddr)
4648{
4649 TranslationBlock *tb;
4650 uint32_t n, cflags;
4651 target_ulong pc, cs_base;
4652 uint64_t flags;
4653
4654 tb = tb_find_pc((unsigned long)retaddr);
4655 if (!tb) {
4656 cpu_abort(env, "cpu_io_recompile: could not find TB for pc=%p",
4657 retaddr);
4658 }
4659 n = env->icount_decr.u16.low + tb->icount;
618ba8e6 4660 cpu_restore_state(tb, env, (unsigned long)retaddr);
2e70f6ef 4661 /* Calculate how many instructions had been executed before the fault
bf20dc07 4662 occurred. */
2e70f6ef
PB
4663 n = n - env->icount_decr.u16.low;
4664 /* Generate a new TB ending on the I/O insn. */
4665 n++;
4666 /* On MIPS and SH, delay slot instructions can only be restarted if
4667 they were already the first instruction in the TB. If this is not
bf20dc07 4668 the first instruction in a TB then re-execute the preceding
2e70f6ef
PB
4669 branch. */
4670#if defined(TARGET_MIPS)
4671 if ((env->hflags & MIPS_HFLAG_BMASK) != 0 && n > 1) {
4672 env->active_tc.PC -= 4;
4673 env->icount_decr.u16.low++;
4674 env->hflags &= ~MIPS_HFLAG_BMASK;
4675 }
4676#elif defined(TARGET_SH4)
4677 if ((env->flags & ((DELAY_SLOT | DELAY_SLOT_CONDITIONAL))) != 0
4678 && n > 1) {
4679 env->pc -= 2;
4680 env->icount_decr.u16.low++;
4681 env->flags &= ~(DELAY_SLOT | DELAY_SLOT_CONDITIONAL);
4682 }
4683#endif
4684 /* This should never happen. */
4685 if (n > CF_COUNT_MASK)
4686 cpu_abort(env, "TB too big during recompile");
4687
4688 cflags = n | CF_LAST_IO;
4689 pc = tb->pc;
4690 cs_base = tb->cs_base;
4691 flags = tb->flags;
4692 tb_phys_invalidate(tb, -1);
4693 /* FIXME: In theory this could raise an exception. In practice
4694 we have already translated the block once so it's probably ok. */
4695 tb_gen_code(env, pc, cs_base, flags, cflags);
bf20dc07 4696 /* TODO: If env->pc != tb->pc (i.e. the faulting instruction was not
2e70f6ef
PB
4697 the first in the TB) then we end up generating a whole new TB and
4698 repeating the fault, which is horribly inefficient.
4699 Better would be to execute just this insn uncached, or generate a
4700 second new TB. */
4701 cpu_resume_from_signal(env, NULL);
4702}
4703
b3755a91
PB
4704#if !defined(CONFIG_USER_ONLY)
4705
055403b2 4706void dump_exec_info(FILE *f, fprintf_function cpu_fprintf)
e3db7226
FB
4707{
4708 int i, target_code_size, max_target_code_size;
4709 int direct_jmp_count, direct_jmp2_count, cross_page;
4710 TranslationBlock *tb;
3b46e624 4711
e3db7226
FB
4712 target_code_size = 0;
4713 max_target_code_size = 0;
4714 cross_page = 0;
4715 direct_jmp_count = 0;
4716 direct_jmp2_count = 0;
4717 for(i = 0; i < nb_tbs; i++) {
4718 tb = &tbs[i];
4719 target_code_size += tb->size;
4720 if (tb->size > max_target_code_size)
4721 max_target_code_size = tb->size;
4722 if (tb->page_addr[1] != -1)
4723 cross_page++;
4724 if (tb->tb_next_offset[0] != 0xffff) {
4725 direct_jmp_count++;
4726 if (tb->tb_next_offset[1] != 0xffff) {
4727 direct_jmp2_count++;
4728 }
4729 }
4730 }
4731 /* XXX: avoid using doubles ? */
57fec1fe 4732 cpu_fprintf(f, "Translation buffer state:\n");
055403b2 4733 cpu_fprintf(f, "gen code size %td/%ld\n",
26a5f13b
FB
4734 code_gen_ptr - code_gen_buffer, code_gen_buffer_max_size);
4735 cpu_fprintf(f, "TB count %d/%d\n",
4736 nb_tbs, code_gen_max_blocks);
5fafdf24 4737 cpu_fprintf(f, "TB avg target size %d max=%d bytes\n",
e3db7226
FB
4738 nb_tbs ? target_code_size / nb_tbs : 0,
4739 max_target_code_size);
055403b2 4740 cpu_fprintf(f, "TB avg host size %td bytes (expansion ratio: %0.1f)\n",
e3db7226
FB
4741 nb_tbs ? (code_gen_ptr - code_gen_buffer) / nb_tbs : 0,
4742 target_code_size ? (double) (code_gen_ptr - code_gen_buffer) / target_code_size : 0);
5fafdf24
TS
4743 cpu_fprintf(f, "cross page TB count %d (%d%%)\n",
4744 cross_page,
e3db7226
FB
4745 nb_tbs ? (cross_page * 100) / nb_tbs : 0);
4746 cpu_fprintf(f, "direct jump count %d (%d%%) (2 jumps=%d %d%%)\n",
5fafdf24 4747 direct_jmp_count,
e3db7226
FB
4748 nb_tbs ? (direct_jmp_count * 100) / nb_tbs : 0,
4749 direct_jmp2_count,
4750 nb_tbs ? (direct_jmp2_count * 100) / nb_tbs : 0);
57fec1fe 4751 cpu_fprintf(f, "\nStatistics:\n");
e3db7226
FB
4752 cpu_fprintf(f, "TB flush count %d\n", tb_flush_count);
4753 cpu_fprintf(f, "TB invalidate count %d\n", tb_phys_invalidate_count);
4754 cpu_fprintf(f, "TLB flush count %d\n", tlb_flush_count);
b67d9a52 4755 tcg_dump_info(f, cpu_fprintf);
e3db7226
FB
4756}
4757
61382a50
FB
4758#define MMUSUFFIX _cmmu
4759#define GETPC() NULL
4760#define env cpu_single_env
b769d8fe 4761#define SOFTMMU_CODE_ACCESS
61382a50
FB
4762
4763#define SHIFT 0
4764#include "softmmu_template.h"
4765
4766#define SHIFT 1
4767#include "softmmu_template.h"
4768
4769#define SHIFT 2
4770#include "softmmu_template.h"
4771
4772#define SHIFT 3
4773#include "softmmu_template.h"
4774
4775#undef env
4776
4777#endif