]> git.proxmox.com Git - mirror_qemu.git/blob - translate-all.c
char: remove chr_free
[mirror_qemu.git] / translate-all.c
1 /*
2 * Host code generation
3 *
4 * Copyright (c) 2003 Fabrice Bellard
5 *
6 * This library is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2 of the License, or (at your option) any later version.
10 *
11 * This library is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
15 *
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with this library; if not, see <http://www.gnu.org/licenses/>.
18 */
19 #ifdef _WIN32
20 #include <windows.h>
21 #endif
22 #include "qemu/osdep.h"
23
24
25 #include "qemu-common.h"
26 #define NO_CPU_IO_DEFS
27 #include "cpu.h"
28 #include "trace.h"
29 #include "disas/disas.h"
30 #include "exec/exec-all.h"
31 #include "tcg.h"
32 #if defined(CONFIG_USER_ONLY)
33 #include "qemu.h"
34 #include "exec/exec-all.h"
35 #if defined(__FreeBSD__) || defined(__FreeBSD_kernel__)
36 #include <sys/param.h>
37 #if __FreeBSD_version >= 700104
38 #define HAVE_KINFO_GETVMMAP
39 #define sigqueue sigqueue_freebsd /* avoid redefinition */
40 #include <sys/proc.h>
41 #include <machine/profile.h>
42 #define _KERNEL
43 #include <sys/user.h>
44 #undef _KERNEL
45 #undef sigqueue
46 #include <libutil.h>
47 #endif
48 #endif
49 #else
50 #include "exec/address-spaces.h"
51 #endif
52
53 #include "exec/cputlb.h"
54 #include "exec/tb-hash.h"
55 #include "translate-all.h"
56 #include "qemu/bitmap.h"
57 #include "qemu/timer.h"
58 #include "exec/log.h"
59
60 /* #define DEBUG_TB_INVALIDATE */
61 /* #define DEBUG_TB_FLUSH */
62 /* #define DEBUG_LOCKING */
63 /* make various TB consistency checks */
64 /* #define DEBUG_TB_CHECK */
65
66 #if !defined(CONFIG_USER_ONLY)
67 /* TB consistency checks only implemented for usermode emulation. */
68 #undef DEBUG_TB_CHECK
69 #endif
70
71 /* Access to the various translations structures need to be serialised via locks
72 * for consistency. This is automatic for SoftMMU based system
73 * emulation due to its single threaded nature. In user-mode emulation
74 * access to the memory related structures are protected with the
75 * mmap_lock.
76 */
77 #ifdef DEBUG_LOCKING
78 #define DEBUG_MEM_LOCKS 1
79 #else
80 #define DEBUG_MEM_LOCKS 0
81 #endif
82
83 #ifdef CONFIG_SOFTMMU
84 #define assert_memory_lock() do { /* nothing */ } while (0)
85 #else
86 #define assert_memory_lock() do { \
87 if (DEBUG_MEM_LOCKS) { \
88 g_assert(have_mmap_lock()); \
89 } \
90 } while (0)
91 #endif
92
93 #define SMC_BITMAP_USE_THRESHOLD 10
94
95 typedef struct PageDesc {
96 /* list of TBs intersecting this ram page */
97 TranslationBlock *first_tb;
98 #ifdef CONFIG_SOFTMMU
99 /* in order to optimize self modifying code, we count the number
100 of lookups we do to a given page to use a bitmap */
101 unsigned int code_write_count;
102 unsigned long *code_bitmap;
103 #else
104 unsigned long flags;
105 #endif
106 } PageDesc;
107
108 /* In system mode we want L1_MAP to be based on ram offsets,
109 while in user mode we want it to be based on virtual addresses. */
110 #if !defined(CONFIG_USER_ONLY)
111 #if HOST_LONG_BITS < TARGET_PHYS_ADDR_SPACE_BITS
112 # define L1_MAP_ADDR_SPACE_BITS HOST_LONG_BITS
113 #else
114 # define L1_MAP_ADDR_SPACE_BITS TARGET_PHYS_ADDR_SPACE_BITS
115 #endif
116 #else
117 # define L1_MAP_ADDR_SPACE_BITS TARGET_VIRT_ADDR_SPACE_BITS
118 #endif
119
120 /* Size of the L2 (and L3, etc) page tables. */
121 #define V_L2_BITS 10
122 #define V_L2_SIZE (1 << V_L2_BITS)
123
124 uintptr_t qemu_host_page_size;
125 intptr_t qemu_host_page_mask;
126
127 /*
128 * L1 Mapping properties
129 */
130 static int v_l1_size;
131 static int v_l1_shift;
132 static int v_l2_levels;
133
134 /* The bottom level has pointers to PageDesc, and is indexed by
135 * anything from 4 to (V_L2_BITS + 3) bits, depending on target page size.
136 */
137 #define V_L1_MIN_BITS 4
138 #define V_L1_MAX_BITS (V_L2_BITS + 3)
139 #define V_L1_MAX_SIZE (1 << V_L1_MAX_BITS)
140
141 static void *l1_map[V_L1_MAX_SIZE];
142
143 /* code generation context */
144 TCGContext tcg_ctx;
145 bool parallel_cpus;
146
147 /* translation block context */
148 #ifdef CONFIG_USER_ONLY
149 __thread int have_tb_lock;
150 #endif
151
152 static void page_table_config_init(void)
153 {
154 uint32_t v_l1_bits;
155
156 assert(TARGET_PAGE_BITS);
157 /* The bits remaining after N lower levels of page tables. */
158 v_l1_bits = (L1_MAP_ADDR_SPACE_BITS - TARGET_PAGE_BITS) % V_L2_BITS;
159 if (v_l1_bits < V_L1_MIN_BITS) {
160 v_l1_bits += V_L2_BITS;
161 }
162
163 v_l1_size = 1 << v_l1_bits;
164 v_l1_shift = L1_MAP_ADDR_SPACE_BITS - TARGET_PAGE_BITS - v_l1_bits;
165 v_l2_levels = v_l1_shift / V_L2_BITS - 1;
166
167 assert(v_l1_bits <= V_L1_MAX_BITS);
168 assert(v_l1_shift % V_L2_BITS == 0);
169 assert(v_l2_levels >= 0);
170 }
171
172 void tb_lock(void)
173 {
174 #ifdef CONFIG_USER_ONLY
175 assert(!have_tb_lock);
176 qemu_mutex_lock(&tcg_ctx.tb_ctx.tb_lock);
177 have_tb_lock++;
178 #endif
179 }
180
181 void tb_unlock(void)
182 {
183 #ifdef CONFIG_USER_ONLY
184 assert(have_tb_lock);
185 have_tb_lock--;
186 qemu_mutex_unlock(&tcg_ctx.tb_ctx.tb_lock);
187 #endif
188 }
189
190 void tb_lock_reset(void)
191 {
192 #ifdef CONFIG_USER_ONLY
193 if (have_tb_lock) {
194 qemu_mutex_unlock(&tcg_ctx.tb_ctx.tb_lock);
195 have_tb_lock = 0;
196 }
197 #endif
198 }
199
200 #ifdef DEBUG_LOCKING
201 #define DEBUG_TB_LOCKS 1
202 #else
203 #define DEBUG_TB_LOCKS 0
204 #endif
205
206 #ifdef CONFIG_SOFTMMU
207 #define assert_tb_lock() do { /* nothing */ } while (0)
208 #else
209 #define assert_tb_lock() do { \
210 if (DEBUG_TB_LOCKS) { \
211 g_assert(have_tb_lock); \
212 } \
213 } while (0)
214 #endif
215
216
217 static TranslationBlock *tb_find_pc(uintptr_t tc_ptr);
218
219 void cpu_gen_init(void)
220 {
221 tcg_context_init(&tcg_ctx);
222 }
223
224 /* Encode VAL as a signed leb128 sequence at P.
225 Return P incremented past the encoded value. */
226 static uint8_t *encode_sleb128(uint8_t *p, target_long val)
227 {
228 int more, byte;
229
230 do {
231 byte = val & 0x7f;
232 val >>= 7;
233 more = !((val == 0 && (byte & 0x40) == 0)
234 || (val == -1 && (byte & 0x40) != 0));
235 if (more) {
236 byte |= 0x80;
237 }
238 *p++ = byte;
239 } while (more);
240
241 return p;
242 }
243
244 /* Decode a signed leb128 sequence at *PP; increment *PP past the
245 decoded value. Return the decoded value. */
246 static target_long decode_sleb128(uint8_t **pp)
247 {
248 uint8_t *p = *pp;
249 target_long val = 0;
250 int byte, shift = 0;
251
252 do {
253 byte = *p++;
254 val |= (target_ulong)(byte & 0x7f) << shift;
255 shift += 7;
256 } while (byte & 0x80);
257 if (shift < TARGET_LONG_BITS && (byte & 0x40)) {
258 val |= -(target_ulong)1 << shift;
259 }
260
261 *pp = p;
262 return val;
263 }
264
265 /* Encode the data collected about the instructions while compiling TB.
266 Place the data at BLOCK, and return the number of bytes consumed.
267
268 The logical table consisits of TARGET_INSN_START_WORDS target_ulong's,
269 which come from the target's insn_start data, followed by a uintptr_t
270 which comes from the host pc of the end of the code implementing the insn.
271
272 Each line of the table is encoded as sleb128 deltas from the previous
273 line. The seed for the first line is { tb->pc, 0..., tb->tc_ptr }.
274 That is, the first column is seeded with the guest pc, the last column
275 with the host pc, and the middle columns with zeros. */
276
277 static int encode_search(TranslationBlock *tb, uint8_t *block)
278 {
279 uint8_t *highwater = tcg_ctx.code_gen_highwater;
280 uint8_t *p = block;
281 int i, j, n;
282
283 tb->tc_search = block;
284
285 for (i = 0, n = tb->icount; i < n; ++i) {
286 target_ulong prev;
287
288 for (j = 0; j < TARGET_INSN_START_WORDS; ++j) {
289 if (i == 0) {
290 prev = (j == 0 ? tb->pc : 0);
291 } else {
292 prev = tcg_ctx.gen_insn_data[i - 1][j];
293 }
294 p = encode_sleb128(p, tcg_ctx.gen_insn_data[i][j] - prev);
295 }
296 prev = (i == 0 ? 0 : tcg_ctx.gen_insn_end_off[i - 1]);
297 p = encode_sleb128(p, tcg_ctx.gen_insn_end_off[i] - prev);
298
299 /* Test for (pending) buffer overflow. The assumption is that any
300 one row beginning below the high water mark cannot overrun
301 the buffer completely. Thus we can test for overflow after
302 encoding a row without having to check during encoding. */
303 if (unlikely(p > highwater)) {
304 return -1;
305 }
306 }
307
308 return p - block;
309 }
310
311 /* The cpu state corresponding to 'searched_pc' is restored.
312 * Called with tb_lock held.
313 */
314 static int cpu_restore_state_from_tb(CPUState *cpu, TranslationBlock *tb,
315 uintptr_t searched_pc)
316 {
317 target_ulong data[TARGET_INSN_START_WORDS] = { tb->pc };
318 uintptr_t host_pc = (uintptr_t)tb->tc_ptr;
319 CPUArchState *env = cpu->env_ptr;
320 uint8_t *p = tb->tc_search;
321 int i, j, num_insns = tb->icount;
322 #ifdef CONFIG_PROFILER
323 int64_t ti = profile_getclock();
324 #endif
325
326 searched_pc -= GETPC_ADJ;
327
328 if (searched_pc < host_pc) {
329 return -1;
330 }
331
332 /* Reconstruct the stored insn data while looking for the point at
333 which the end of the insn exceeds the searched_pc. */
334 for (i = 0; i < num_insns; ++i) {
335 for (j = 0; j < TARGET_INSN_START_WORDS; ++j) {
336 data[j] += decode_sleb128(&p);
337 }
338 host_pc += decode_sleb128(&p);
339 if (host_pc > searched_pc) {
340 goto found;
341 }
342 }
343 return -1;
344
345 found:
346 if (tb->cflags & CF_USE_ICOUNT) {
347 assert(use_icount);
348 /* Reset the cycle counter to the start of the block. */
349 cpu->icount_decr.u16.low += num_insns;
350 /* Clear the IO flag. */
351 cpu->can_do_io = 0;
352 }
353 cpu->icount_decr.u16.low -= i;
354 restore_state_to_opc(env, tb, data);
355
356 #ifdef CONFIG_PROFILER
357 tcg_ctx.restore_time += profile_getclock() - ti;
358 tcg_ctx.restore_count++;
359 #endif
360 return 0;
361 }
362
363 bool cpu_restore_state(CPUState *cpu, uintptr_t retaddr)
364 {
365 TranslationBlock *tb;
366 bool r = false;
367
368 tb_lock();
369 tb = tb_find_pc(retaddr);
370 if (tb) {
371 cpu_restore_state_from_tb(cpu, tb, retaddr);
372 if (tb->cflags & CF_NOCACHE) {
373 /* one-shot translation, invalidate it immediately */
374 tb_phys_invalidate(tb, -1);
375 tb_free(tb);
376 }
377 r = true;
378 }
379 tb_unlock();
380
381 return r;
382 }
383
384 void page_size_init(void)
385 {
386 /* NOTE: we can always suppose that qemu_host_page_size >=
387 TARGET_PAGE_SIZE */
388 qemu_real_host_page_size = getpagesize();
389 qemu_real_host_page_mask = -(intptr_t)qemu_real_host_page_size;
390 if (qemu_host_page_size == 0) {
391 qemu_host_page_size = qemu_real_host_page_size;
392 }
393 if (qemu_host_page_size < TARGET_PAGE_SIZE) {
394 qemu_host_page_size = TARGET_PAGE_SIZE;
395 }
396 qemu_host_page_mask = -(intptr_t)qemu_host_page_size;
397 }
398
399 static void page_init(void)
400 {
401 page_size_init();
402 page_table_config_init();
403
404 #if defined(CONFIG_BSD) && defined(CONFIG_USER_ONLY)
405 {
406 #ifdef HAVE_KINFO_GETVMMAP
407 struct kinfo_vmentry *freep;
408 int i, cnt;
409
410 freep = kinfo_getvmmap(getpid(), &cnt);
411 if (freep) {
412 mmap_lock();
413 for (i = 0; i < cnt; i++) {
414 unsigned long startaddr, endaddr;
415
416 startaddr = freep[i].kve_start;
417 endaddr = freep[i].kve_end;
418 if (h2g_valid(startaddr)) {
419 startaddr = h2g(startaddr) & TARGET_PAGE_MASK;
420
421 if (h2g_valid(endaddr)) {
422 endaddr = h2g(endaddr);
423 page_set_flags(startaddr, endaddr, PAGE_RESERVED);
424 } else {
425 #if TARGET_ABI_BITS <= L1_MAP_ADDR_SPACE_BITS
426 endaddr = ~0ul;
427 page_set_flags(startaddr, endaddr, PAGE_RESERVED);
428 #endif
429 }
430 }
431 }
432 free(freep);
433 mmap_unlock();
434 }
435 #else
436 FILE *f;
437
438 last_brk = (unsigned long)sbrk(0);
439
440 f = fopen("/compat/linux/proc/self/maps", "r");
441 if (f) {
442 mmap_lock();
443
444 do {
445 unsigned long startaddr, endaddr;
446 int n;
447
448 n = fscanf(f, "%lx-%lx %*[^\n]\n", &startaddr, &endaddr);
449
450 if (n == 2 && h2g_valid(startaddr)) {
451 startaddr = h2g(startaddr) & TARGET_PAGE_MASK;
452
453 if (h2g_valid(endaddr)) {
454 endaddr = h2g(endaddr);
455 } else {
456 endaddr = ~0ul;
457 }
458 page_set_flags(startaddr, endaddr, PAGE_RESERVED);
459 }
460 } while (!feof(f));
461
462 fclose(f);
463 mmap_unlock();
464 }
465 #endif
466 }
467 #endif
468 }
469
470 /* If alloc=1:
471 * Called with tb_lock held for system emulation.
472 * Called with mmap_lock held for user-mode emulation.
473 */
474 static PageDesc *page_find_alloc(tb_page_addr_t index, int alloc)
475 {
476 PageDesc *pd;
477 void **lp;
478 int i;
479
480 if (alloc) {
481 assert_memory_lock();
482 }
483
484 /* Level 1. Always allocated. */
485 lp = l1_map + ((index >> v_l1_shift) & (v_l1_size - 1));
486
487 /* Level 2..N-1. */
488 for (i = v_l2_levels; i > 0; i--) {
489 void **p = atomic_rcu_read(lp);
490
491 if (p == NULL) {
492 if (!alloc) {
493 return NULL;
494 }
495 p = g_new0(void *, V_L2_SIZE);
496 atomic_rcu_set(lp, p);
497 }
498
499 lp = p + ((index >> (i * V_L2_BITS)) & (V_L2_SIZE - 1));
500 }
501
502 pd = atomic_rcu_read(lp);
503 if (pd == NULL) {
504 if (!alloc) {
505 return NULL;
506 }
507 pd = g_new0(PageDesc, V_L2_SIZE);
508 atomic_rcu_set(lp, pd);
509 }
510
511 return pd + (index & (V_L2_SIZE - 1));
512 }
513
514 static inline PageDesc *page_find(tb_page_addr_t index)
515 {
516 return page_find_alloc(index, 0);
517 }
518
519 #if defined(CONFIG_USER_ONLY)
520 /* Currently it is not recommended to allocate big chunks of data in
521 user mode. It will change when a dedicated libc will be used. */
522 /* ??? 64-bit hosts ought to have no problem mmaping data outside the
523 region in which the guest needs to run. Revisit this. */
524 #define USE_STATIC_CODE_GEN_BUFFER
525 #endif
526
527 /* Minimum size of the code gen buffer. This number is randomly chosen,
528 but not so small that we can't have a fair number of TB's live. */
529 #define MIN_CODE_GEN_BUFFER_SIZE (1024u * 1024)
530
531 /* Maximum size of the code gen buffer we'd like to use. Unless otherwise
532 indicated, this is constrained by the range of direct branches on the
533 host cpu, as used by the TCG implementation of goto_tb. */
534 #if defined(__x86_64__)
535 # define MAX_CODE_GEN_BUFFER_SIZE (2ul * 1024 * 1024 * 1024)
536 #elif defined(__sparc__)
537 # define MAX_CODE_GEN_BUFFER_SIZE (2ul * 1024 * 1024 * 1024)
538 #elif defined(__powerpc64__)
539 # define MAX_CODE_GEN_BUFFER_SIZE (2ul * 1024 * 1024 * 1024)
540 #elif defined(__powerpc__)
541 # define MAX_CODE_GEN_BUFFER_SIZE (32u * 1024 * 1024)
542 #elif defined(__aarch64__)
543 # define MAX_CODE_GEN_BUFFER_SIZE (128ul * 1024 * 1024)
544 #elif defined(__arm__)
545 # define MAX_CODE_GEN_BUFFER_SIZE (16u * 1024 * 1024)
546 #elif defined(__s390x__)
547 /* We have a +- 4GB range on the branches; leave some slop. */
548 # define MAX_CODE_GEN_BUFFER_SIZE (3ul * 1024 * 1024 * 1024)
549 #elif defined(__mips__)
550 /* We have a 256MB branch region, but leave room to make sure the
551 main executable is also within that region. */
552 # define MAX_CODE_GEN_BUFFER_SIZE (128ul * 1024 * 1024)
553 #else
554 # define MAX_CODE_GEN_BUFFER_SIZE ((size_t)-1)
555 #endif
556
557 #define DEFAULT_CODE_GEN_BUFFER_SIZE_1 (32u * 1024 * 1024)
558
559 #define DEFAULT_CODE_GEN_BUFFER_SIZE \
560 (DEFAULT_CODE_GEN_BUFFER_SIZE_1 < MAX_CODE_GEN_BUFFER_SIZE \
561 ? DEFAULT_CODE_GEN_BUFFER_SIZE_1 : MAX_CODE_GEN_BUFFER_SIZE)
562
563 static inline size_t size_code_gen_buffer(size_t tb_size)
564 {
565 /* Size the buffer. */
566 if (tb_size == 0) {
567 #ifdef USE_STATIC_CODE_GEN_BUFFER
568 tb_size = DEFAULT_CODE_GEN_BUFFER_SIZE;
569 #else
570 /* ??? Needs adjustments. */
571 /* ??? If we relax the requirement that CONFIG_USER_ONLY use the
572 static buffer, we could size this on RESERVED_VA, on the text
573 segment size of the executable, or continue to use the default. */
574 tb_size = (unsigned long)(ram_size / 4);
575 #endif
576 }
577 if (tb_size < MIN_CODE_GEN_BUFFER_SIZE) {
578 tb_size = MIN_CODE_GEN_BUFFER_SIZE;
579 }
580 if (tb_size > MAX_CODE_GEN_BUFFER_SIZE) {
581 tb_size = MAX_CODE_GEN_BUFFER_SIZE;
582 }
583 return tb_size;
584 }
585
586 #ifdef __mips__
587 /* In order to use J and JAL within the code_gen_buffer, we require
588 that the buffer not cross a 256MB boundary. */
589 static inline bool cross_256mb(void *addr, size_t size)
590 {
591 return ((uintptr_t)addr ^ ((uintptr_t)addr + size)) & ~0x0ffffffful;
592 }
593
594 /* We weren't able to allocate a buffer without crossing that boundary,
595 so make do with the larger portion of the buffer that doesn't cross.
596 Returns the new base of the buffer, and adjusts code_gen_buffer_size. */
597 static inline void *split_cross_256mb(void *buf1, size_t size1)
598 {
599 void *buf2 = (void *)(((uintptr_t)buf1 + size1) & ~0x0ffffffful);
600 size_t size2 = buf1 + size1 - buf2;
601
602 size1 = buf2 - buf1;
603 if (size1 < size2) {
604 size1 = size2;
605 buf1 = buf2;
606 }
607
608 tcg_ctx.code_gen_buffer_size = size1;
609 return buf1;
610 }
611 #endif
612
613 #ifdef USE_STATIC_CODE_GEN_BUFFER
614 static uint8_t static_code_gen_buffer[DEFAULT_CODE_GEN_BUFFER_SIZE]
615 __attribute__((aligned(CODE_GEN_ALIGN)));
616
617 # ifdef _WIN32
618 static inline void do_protect(void *addr, long size, int prot)
619 {
620 DWORD old_protect;
621 VirtualProtect(addr, size, prot, &old_protect);
622 }
623
624 static inline void map_exec(void *addr, long size)
625 {
626 do_protect(addr, size, PAGE_EXECUTE_READWRITE);
627 }
628
629 static inline void map_none(void *addr, long size)
630 {
631 do_protect(addr, size, PAGE_NOACCESS);
632 }
633 # else
634 static inline void do_protect(void *addr, long size, int prot)
635 {
636 uintptr_t start, end;
637
638 start = (uintptr_t)addr;
639 start &= qemu_real_host_page_mask;
640
641 end = (uintptr_t)addr + size;
642 end = ROUND_UP(end, qemu_real_host_page_size);
643
644 mprotect((void *)start, end - start, prot);
645 }
646
647 static inline void map_exec(void *addr, long size)
648 {
649 do_protect(addr, size, PROT_READ | PROT_WRITE | PROT_EXEC);
650 }
651
652 static inline void map_none(void *addr, long size)
653 {
654 do_protect(addr, size, PROT_NONE);
655 }
656 # endif /* WIN32 */
657
658 static inline void *alloc_code_gen_buffer(void)
659 {
660 void *buf = static_code_gen_buffer;
661 size_t full_size, size;
662
663 /* The size of the buffer, rounded down to end on a page boundary. */
664 full_size = (((uintptr_t)buf + sizeof(static_code_gen_buffer))
665 & qemu_real_host_page_mask) - (uintptr_t)buf;
666
667 /* Reserve a guard page. */
668 size = full_size - qemu_real_host_page_size;
669
670 /* Honor a command-line option limiting the size of the buffer. */
671 if (size > tcg_ctx.code_gen_buffer_size) {
672 size = (((uintptr_t)buf + tcg_ctx.code_gen_buffer_size)
673 & qemu_real_host_page_mask) - (uintptr_t)buf;
674 }
675 tcg_ctx.code_gen_buffer_size = size;
676
677 #ifdef __mips__
678 if (cross_256mb(buf, size)) {
679 buf = split_cross_256mb(buf, size);
680 size = tcg_ctx.code_gen_buffer_size;
681 }
682 #endif
683
684 map_exec(buf, size);
685 map_none(buf + size, qemu_real_host_page_size);
686 qemu_madvise(buf, size, QEMU_MADV_HUGEPAGE);
687
688 return buf;
689 }
690 #elif defined(_WIN32)
691 static inline void *alloc_code_gen_buffer(void)
692 {
693 size_t size = tcg_ctx.code_gen_buffer_size;
694 void *buf1, *buf2;
695
696 /* Perform the allocation in two steps, so that the guard page
697 is reserved but uncommitted. */
698 buf1 = VirtualAlloc(NULL, size + qemu_real_host_page_size,
699 MEM_RESERVE, PAGE_NOACCESS);
700 if (buf1 != NULL) {
701 buf2 = VirtualAlloc(buf1, size, MEM_COMMIT, PAGE_EXECUTE_READWRITE);
702 assert(buf1 == buf2);
703 }
704
705 return buf1;
706 }
707 #else
708 static inline void *alloc_code_gen_buffer(void)
709 {
710 int flags = MAP_PRIVATE | MAP_ANONYMOUS;
711 uintptr_t start = 0;
712 size_t size = tcg_ctx.code_gen_buffer_size;
713 void *buf;
714
715 /* Constrain the position of the buffer based on the host cpu.
716 Note that these addresses are chosen in concert with the
717 addresses assigned in the relevant linker script file. */
718 # if defined(__PIE__) || defined(__PIC__)
719 /* Don't bother setting a preferred location if we're building
720 a position-independent executable. We're more likely to get
721 an address near the main executable if we let the kernel
722 choose the address. */
723 # elif defined(__x86_64__) && defined(MAP_32BIT)
724 /* Force the memory down into low memory with the executable.
725 Leave the choice of exact location with the kernel. */
726 flags |= MAP_32BIT;
727 /* Cannot expect to map more than 800MB in low memory. */
728 if (size > 800u * 1024 * 1024) {
729 tcg_ctx.code_gen_buffer_size = size = 800u * 1024 * 1024;
730 }
731 # elif defined(__sparc__)
732 start = 0x40000000ul;
733 # elif defined(__s390x__)
734 start = 0x90000000ul;
735 # elif defined(__mips__)
736 # if _MIPS_SIM == _ABI64
737 start = 0x128000000ul;
738 # else
739 start = 0x08000000ul;
740 # endif
741 # endif
742
743 buf = mmap((void *)start, size + qemu_real_host_page_size,
744 PROT_NONE, flags, -1, 0);
745 if (buf == MAP_FAILED) {
746 return NULL;
747 }
748
749 #ifdef __mips__
750 if (cross_256mb(buf, size)) {
751 /* Try again, with the original still mapped, to avoid re-acquiring
752 that 256mb crossing. This time don't specify an address. */
753 size_t size2;
754 void *buf2 = mmap(NULL, size + qemu_real_host_page_size,
755 PROT_NONE, flags, -1, 0);
756 switch ((int)(buf2 != MAP_FAILED)) {
757 case 1:
758 if (!cross_256mb(buf2, size)) {
759 /* Success! Use the new buffer. */
760 munmap(buf, size + qemu_real_host_page_size);
761 break;
762 }
763 /* Failure. Work with what we had. */
764 munmap(buf2, size + qemu_real_host_page_size);
765 /* fallthru */
766 default:
767 /* Split the original buffer. Free the smaller half. */
768 buf2 = split_cross_256mb(buf, size);
769 size2 = tcg_ctx.code_gen_buffer_size;
770 if (buf == buf2) {
771 munmap(buf + size2 + qemu_real_host_page_size, size - size2);
772 } else {
773 munmap(buf, size - size2);
774 }
775 size = size2;
776 break;
777 }
778 buf = buf2;
779 }
780 #endif
781
782 /* Make the final buffer accessible. The guard page at the end
783 will remain inaccessible with PROT_NONE. */
784 mprotect(buf, size, PROT_WRITE | PROT_READ | PROT_EXEC);
785
786 /* Request large pages for the buffer. */
787 qemu_madvise(buf, size, QEMU_MADV_HUGEPAGE);
788
789 return buf;
790 }
791 #endif /* USE_STATIC_CODE_GEN_BUFFER, WIN32, POSIX */
792
793 static inline void code_gen_alloc(size_t tb_size)
794 {
795 tcg_ctx.code_gen_buffer_size = size_code_gen_buffer(tb_size);
796 tcg_ctx.code_gen_buffer = alloc_code_gen_buffer();
797 if (tcg_ctx.code_gen_buffer == NULL) {
798 fprintf(stderr, "Could not allocate dynamic translator buffer\n");
799 exit(1);
800 }
801
802 /* Estimate a good size for the number of TBs we can support. We
803 still haven't deducted the prologue from the buffer size here,
804 but that's minimal and won't affect the estimate much. */
805 tcg_ctx.code_gen_max_blocks
806 = tcg_ctx.code_gen_buffer_size / CODE_GEN_AVG_BLOCK_SIZE;
807 tcg_ctx.tb_ctx.tbs = g_new(TranslationBlock, tcg_ctx.code_gen_max_blocks);
808
809 qemu_mutex_init(&tcg_ctx.tb_ctx.tb_lock);
810 }
811
812 static void tb_htable_init(void)
813 {
814 unsigned int mode = QHT_MODE_AUTO_RESIZE;
815
816 qht_init(&tcg_ctx.tb_ctx.htable, CODE_GEN_HTABLE_SIZE, mode);
817 }
818
819 /* Must be called before using the QEMU cpus. 'tb_size' is the size
820 (in bytes) allocated to the translation buffer. Zero means default
821 size. */
822 void tcg_exec_init(unsigned long tb_size)
823 {
824 cpu_gen_init();
825 page_init();
826 tb_htable_init();
827 code_gen_alloc(tb_size);
828 #if defined(CONFIG_SOFTMMU)
829 /* There's no guest base to take into account, so go ahead and
830 initialize the prologue now. */
831 tcg_prologue_init(&tcg_ctx);
832 #endif
833 }
834
835 bool tcg_enabled(void)
836 {
837 return tcg_ctx.code_gen_buffer != NULL;
838 }
839
840 /*
841 * Allocate a new translation block. Flush the translation buffer if
842 * too many translation blocks or too much generated code.
843 *
844 * Called with tb_lock held.
845 */
846 static TranslationBlock *tb_alloc(target_ulong pc)
847 {
848 TranslationBlock *tb;
849
850 assert_tb_lock();
851
852 if (tcg_ctx.tb_ctx.nb_tbs >= tcg_ctx.code_gen_max_blocks) {
853 return NULL;
854 }
855 tb = &tcg_ctx.tb_ctx.tbs[tcg_ctx.tb_ctx.nb_tbs++];
856 tb->pc = pc;
857 tb->cflags = 0;
858 tb->invalid = false;
859 return tb;
860 }
861
862 /* Called with tb_lock held. */
863 void tb_free(TranslationBlock *tb)
864 {
865 assert_tb_lock();
866
867 /* In practice this is mostly used for single use temporary TB
868 Ignore the hard cases and just back up if this TB happens to
869 be the last one generated. */
870 if (tcg_ctx.tb_ctx.nb_tbs > 0 &&
871 tb == &tcg_ctx.tb_ctx.tbs[tcg_ctx.tb_ctx.nb_tbs - 1]) {
872 tcg_ctx.code_gen_ptr = tb->tc_ptr;
873 tcg_ctx.tb_ctx.nb_tbs--;
874 }
875 }
876
877 static inline void invalidate_page_bitmap(PageDesc *p)
878 {
879 #ifdef CONFIG_SOFTMMU
880 g_free(p->code_bitmap);
881 p->code_bitmap = NULL;
882 p->code_write_count = 0;
883 #endif
884 }
885
886 /* Set to NULL all the 'first_tb' fields in all PageDescs. */
887 static void page_flush_tb_1(int level, void **lp)
888 {
889 int i;
890
891 if (*lp == NULL) {
892 return;
893 }
894 if (level == 0) {
895 PageDesc *pd = *lp;
896
897 for (i = 0; i < V_L2_SIZE; ++i) {
898 pd[i].first_tb = NULL;
899 invalidate_page_bitmap(pd + i);
900 }
901 } else {
902 void **pp = *lp;
903
904 for (i = 0; i < V_L2_SIZE; ++i) {
905 page_flush_tb_1(level - 1, pp + i);
906 }
907 }
908 }
909
910 static void page_flush_tb(void)
911 {
912 int i, l1_sz = v_l1_size;
913
914 for (i = 0; i < l1_sz; i++) {
915 page_flush_tb_1(v_l2_levels, l1_map + i);
916 }
917 }
918
919 /* flush all the translation blocks */
920 static void do_tb_flush(CPUState *cpu, run_on_cpu_data tb_flush_count)
921 {
922 tb_lock();
923
924 /* If it is already been done on request of another CPU,
925 * just retry.
926 */
927 if (tcg_ctx.tb_ctx.tb_flush_count != tb_flush_count.host_int) {
928 goto done;
929 }
930
931 #if defined(DEBUG_TB_FLUSH)
932 printf("qemu: flush code_size=%ld nb_tbs=%d avg_tb_size=%ld\n",
933 (unsigned long)(tcg_ctx.code_gen_ptr - tcg_ctx.code_gen_buffer),
934 tcg_ctx.tb_ctx.nb_tbs, tcg_ctx.tb_ctx.nb_tbs > 0 ?
935 ((unsigned long)(tcg_ctx.code_gen_ptr - tcg_ctx.code_gen_buffer)) /
936 tcg_ctx.tb_ctx.nb_tbs : 0);
937 #endif
938 if ((unsigned long)(tcg_ctx.code_gen_ptr - tcg_ctx.code_gen_buffer)
939 > tcg_ctx.code_gen_buffer_size) {
940 cpu_abort(cpu, "Internal error: code buffer overflow\n");
941 }
942
943 CPU_FOREACH(cpu) {
944 int i;
945
946 for (i = 0; i < TB_JMP_CACHE_SIZE; ++i) {
947 atomic_set(&cpu->tb_jmp_cache[i], NULL);
948 }
949 }
950
951 tcg_ctx.tb_ctx.nb_tbs = 0;
952 qht_reset_size(&tcg_ctx.tb_ctx.htable, CODE_GEN_HTABLE_SIZE);
953 page_flush_tb();
954
955 tcg_ctx.code_gen_ptr = tcg_ctx.code_gen_buffer;
956 /* XXX: flush processor icache at this point if cache flush is
957 expensive */
958 atomic_mb_set(&tcg_ctx.tb_ctx.tb_flush_count,
959 tcg_ctx.tb_ctx.tb_flush_count + 1);
960
961 done:
962 tb_unlock();
963 }
964
965 void tb_flush(CPUState *cpu)
966 {
967 if (tcg_enabled()) {
968 unsigned tb_flush_count = atomic_mb_read(&tcg_ctx.tb_ctx.tb_flush_count);
969 async_safe_run_on_cpu(cpu, do_tb_flush,
970 RUN_ON_CPU_HOST_INT(tb_flush_count));
971 }
972 }
973
974 #ifdef DEBUG_TB_CHECK
975
976 static void
977 do_tb_invalidate_check(struct qht *ht, void *p, uint32_t hash, void *userp)
978 {
979 TranslationBlock *tb = p;
980 target_ulong addr = *(target_ulong *)userp;
981
982 if (!(addr + TARGET_PAGE_SIZE <= tb->pc || addr >= tb->pc + tb->size)) {
983 printf("ERROR invalidate: address=" TARGET_FMT_lx
984 " PC=%08lx size=%04x\n", addr, (long)tb->pc, tb->size);
985 }
986 }
987
988 /* verify that all the pages have correct rights for code
989 *
990 * Called with tb_lock held.
991 */
992 static void tb_invalidate_check(target_ulong address)
993 {
994 address &= TARGET_PAGE_MASK;
995 qht_iter(&tcg_ctx.tb_ctx.htable, do_tb_invalidate_check, &address);
996 }
997
998 static void
999 do_tb_page_check(struct qht *ht, void *p, uint32_t hash, void *userp)
1000 {
1001 TranslationBlock *tb = p;
1002 int flags1, flags2;
1003
1004 flags1 = page_get_flags(tb->pc);
1005 flags2 = page_get_flags(tb->pc + tb->size - 1);
1006 if ((flags1 & PAGE_WRITE) || (flags2 & PAGE_WRITE)) {
1007 printf("ERROR page flags: PC=%08lx size=%04x f1=%x f2=%x\n",
1008 (long)tb->pc, tb->size, flags1, flags2);
1009 }
1010 }
1011
1012 /* verify that all the pages have correct rights for code */
1013 static void tb_page_check(void)
1014 {
1015 qht_iter(&tcg_ctx.tb_ctx.htable, do_tb_page_check, NULL);
1016 }
1017
1018 #endif
1019
1020 static inline void tb_page_remove(TranslationBlock **ptb, TranslationBlock *tb)
1021 {
1022 TranslationBlock *tb1;
1023 unsigned int n1;
1024
1025 for (;;) {
1026 tb1 = *ptb;
1027 n1 = (uintptr_t)tb1 & 3;
1028 tb1 = (TranslationBlock *)((uintptr_t)tb1 & ~3);
1029 if (tb1 == tb) {
1030 *ptb = tb1->page_next[n1];
1031 break;
1032 }
1033 ptb = &tb1->page_next[n1];
1034 }
1035 }
1036
1037 /* remove the TB from a list of TBs jumping to the n-th jump target of the TB */
1038 static inline void tb_remove_from_jmp_list(TranslationBlock *tb, int n)
1039 {
1040 TranslationBlock *tb1;
1041 uintptr_t *ptb, ntb;
1042 unsigned int n1;
1043
1044 ptb = &tb->jmp_list_next[n];
1045 if (*ptb) {
1046 /* find tb(n) in circular list */
1047 for (;;) {
1048 ntb = *ptb;
1049 n1 = ntb & 3;
1050 tb1 = (TranslationBlock *)(ntb & ~3);
1051 if (n1 == n && tb1 == tb) {
1052 break;
1053 }
1054 if (n1 == 2) {
1055 ptb = &tb1->jmp_list_first;
1056 } else {
1057 ptb = &tb1->jmp_list_next[n1];
1058 }
1059 }
1060 /* now we can suppress tb(n) from the list */
1061 *ptb = tb->jmp_list_next[n];
1062
1063 tb->jmp_list_next[n] = (uintptr_t)NULL;
1064 }
1065 }
1066
1067 /* reset the jump entry 'n' of a TB so that it is not chained to
1068 another TB */
1069 static inline void tb_reset_jump(TranslationBlock *tb, int n)
1070 {
1071 uintptr_t addr = (uintptr_t)(tb->tc_ptr + tb->jmp_reset_offset[n]);
1072 tb_set_jmp_target(tb, n, addr);
1073 }
1074
1075 /* remove any jumps to the TB */
1076 static inline void tb_jmp_unlink(TranslationBlock *tb)
1077 {
1078 TranslationBlock *tb1;
1079 uintptr_t *ptb, ntb;
1080 unsigned int n1;
1081
1082 ptb = &tb->jmp_list_first;
1083 for (;;) {
1084 ntb = *ptb;
1085 n1 = ntb & 3;
1086 tb1 = (TranslationBlock *)(ntb & ~3);
1087 if (n1 == 2) {
1088 break;
1089 }
1090 tb_reset_jump(tb1, n1);
1091 *ptb = tb1->jmp_list_next[n1];
1092 tb1->jmp_list_next[n1] = (uintptr_t)NULL;
1093 }
1094 }
1095
1096 /* invalidate one TB
1097 *
1098 * Called with tb_lock held.
1099 */
1100 void tb_phys_invalidate(TranslationBlock *tb, tb_page_addr_t page_addr)
1101 {
1102 CPUState *cpu;
1103 PageDesc *p;
1104 uint32_t h;
1105 tb_page_addr_t phys_pc;
1106
1107 assert_tb_lock();
1108
1109 atomic_set(&tb->invalid, true);
1110
1111 /* remove the TB from the hash list */
1112 phys_pc = tb->page_addr[0] + (tb->pc & ~TARGET_PAGE_MASK);
1113 h = tb_hash_func(phys_pc, tb->pc, tb->flags);
1114 qht_remove(&tcg_ctx.tb_ctx.htable, tb, h);
1115
1116 /* remove the TB from the page list */
1117 if (tb->page_addr[0] != page_addr) {
1118 p = page_find(tb->page_addr[0] >> TARGET_PAGE_BITS);
1119 tb_page_remove(&p->first_tb, tb);
1120 invalidate_page_bitmap(p);
1121 }
1122 if (tb->page_addr[1] != -1 && tb->page_addr[1] != page_addr) {
1123 p = page_find(tb->page_addr[1] >> TARGET_PAGE_BITS);
1124 tb_page_remove(&p->first_tb, tb);
1125 invalidate_page_bitmap(p);
1126 }
1127
1128 /* remove the TB from the hash list */
1129 h = tb_jmp_cache_hash_func(tb->pc);
1130 CPU_FOREACH(cpu) {
1131 if (atomic_read(&cpu->tb_jmp_cache[h]) == tb) {
1132 atomic_set(&cpu->tb_jmp_cache[h], NULL);
1133 }
1134 }
1135
1136 /* suppress this TB from the two jump lists */
1137 tb_remove_from_jmp_list(tb, 0);
1138 tb_remove_from_jmp_list(tb, 1);
1139
1140 /* suppress any remaining jumps to this TB */
1141 tb_jmp_unlink(tb);
1142
1143 tcg_ctx.tb_ctx.tb_phys_invalidate_count++;
1144 }
1145
1146 #ifdef CONFIG_SOFTMMU
1147 static void build_page_bitmap(PageDesc *p)
1148 {
1149 int n, tb_start, tb_end;
1150 TranslationBlock *tb;
1151
1152 p->code_bitmap = bitmap_new(TARGET_PAGE_SIZE);
1153
1154 tb = p->first_tb;
1155 while (tb != NULL) {
1156 n = (uintptr_t)tb & 3;
1157 tb = (TranslationBlock *)((uintptr_t)tb & ~3);
1158 /* NOTE: this is subtle as a TB may span two physical pages */
1159 if (n == 0) {
1160 /* NOTE: tb_end may be after the end of the page, but
1161 it is not a problem */
1162 tb_start = tb->pc & ~TARGET_PAGE_MASK;
1163 tb_end = tb_start + tb->size;
1164 if (tb_end > TARGET_PAGE_SIZE) {
1165 tb_end = TARGET_PAGE_SIZE;
1166 }
1167 } else {
1168 tb_start = 0;
1169 tb_end = ((tb->pc + tb->size) & ~TARGET_PAGE_MASK);
1170 }
1171 bitmap_set(p->code_bitmap, tb_start, tb_end - tb_start);
1172 tb = tb->page_next[n];
1173 }
1174 }
1175 #endif
1176
1177 /* add the tb in the target page and protect it if necessary
1178 *
1179 * Called with mmap_lock held for user-mode emulation.
1180 */
1181 static inline void tb_alloc_page(TranslationBlock *tb,
1182 unsigned int n, tb_page_addr_t page_addr)
1183 {
1184 PageDesc *p;
1185 #ifndef CONFIG_USER_ONLY
1186 bool page_already_protected;
1187 #endif
1188
1189 assert_memory_lock();
1190
1191 tb->page_addr[n] = page_addr;
1192 p = page_find_alloc(page_addr >> TARGET_PAGE_BITS, 1);
1193 tb->page_next[n] = p->first_tb;
1194 #ifndef CONFIG_USER_ONLY
1195 page_already_protected = p->first_tb != NULL;
1196 #endif
1197 p->first_tb = (TranslationBlock *)((uintptr_t)tb | n);
1198 invalidate_page_bitmap(p);
1199
1200 #if defined(CONFIG_USER_ONLY)
1201 if (p->flags & PAGE_WRITE) {
1202 target_ulong addr;
1203 PageDesc *p2;
1204 int prot;
1205
1206 /* force the host page as non writable (writes will have a
1207 page fault + mprotect overhead) */
1208 page_addr &= qemu_host_page_mask;
1209 prot = 0;
1210 for (addr = page_addr; addr < page_addr + qemu_host_page_size;
1211 addr += TARGET_PAGE_SIZE) {
1212
1213 p2 = page_find(addr >> TARGET_PAGE_BITS);
1214 if (!p2) {
1215 continue;
1216 }
1217 prot |= p2->flags;
1218 p2->flags &= ~PAGE_WRITE;
1219 }
1220 mprotect(g2h(page_addr), qemu_host_page_size,
1221 (prot & PAGE_BITS) & ~PAGE_WRITE);
1222 #ifdef DEBUG_TB_INVALIDATE
1223 printf("protecting code page: 0x" TARGET_FMT_lx "\n",
1224 page_addr);
1225 #endif
1226 }
1227 #else
1228 /* if some code is already present, then the pages are already
1229 protected. So we handle the case where only the first TB is
1230 allocated in a physical page */
1231 if (!page_already_protected) {
1232 tlb_protect_code(page_addr);
1233 }
1234 #endif
1235 }
1236
1237 /* add a new TB and link it to the physical page tables. phys_page2 is
1238 * (-1) to indicate that only one page contains the TB.
1239 *
1240 * Called with mmap_lock held for user-mode emulation.
1241 */
1242 static void tb_link_page(TranslationBlock *tb, tb_page_addr_t phys_pc,
1243 tb_page_addr_t phys_page2)
1244 {
1245 uint32_t h;
1246
1247 assert_memory_lock();
1248
1249 /* add in the page list */
1250 tb_alloc_page(tb, 0, phys_pc & TARGET_PAGE_MASK);
1251 if (phys_page2 != -1) {
1252 tb_alloc_page(tb, 1, phys_page2);
1253 } else {
1254 tb->page_addr[1] = -1;
1255 }
1256
1257 /* add in the hash table */
1258 h = tb_hash_func(phys_pc, tb->pc, tb->flags);
1259 qht_insert(&tcg_ctx.tb_ctx.htable, tb, h);
1260
1261 #ifdef DEBUG_TB_CHECK
1262 tb_page_check();
1263 #endif
1264 }
1265
1266 /* Called with mmap_lock held for user mode emulation. */
1267 TranslationBlock *tb_gen_code(CPUState *cpu,
1268 target_ulong pc, target_ulong cs_base,
1269 uint32_t flags, int cflags)
1270 {
1271 CPUArchState *env = cpu->env_ptr;
1272 TranslationBlock *tb;
1273 tb_page_addr_t phys_pc, phys_page2;
1274 target_ulong virt_page2;
1275 tcg_insn_unit *gen_code_buf;
1276 int gen_code_size, search_size;
1277 #ifdef CONFIG_PROFILER
1278 int64_t ti;
1279 #endif
1280 assert_memory_lock();
1281
1282 phys_pc = get_page_addr_code(env, pc);
1283 if (use_icount && !(cflags & CF_IGNORE_ICOUNT)) {
1284 cflags |= CF_USE_ICOUNT;
1285 }
1286
1287 tb = tb_alloc(pc);
1288 if (unlikely(!tb)) {
1289 buffer_overflow:
1290 /* flush must be done */
1291 tb_flush(cpu);
1292 mmap_unlock();
1293 /* Make the execution loop process the flush as soon as possible. */
1294 cpu->exception_index = EXCP_INTERRUPT;
1295 cpu_loop_exit(cpu);
1296 }
1297
1298 gen_code_buf = tcg_ctx.code_gen_ptr;
1299 tb->tc_ptr = gen_code_buf;
1300 tb->cs_base = cs_base;
1301 tb->flags = flags;
1302 tb->cflags = cflags;
1303
1304 #ifdef CONFIG_PROFILER
1305 tcg_ctx.tb_count1++; /* includes aborted translations because of
1306 exceptions */
1307 ti = profile_getclock();
1308 #endif
1309
1310 tcg_func_start(&tcg_ctx);
1311
1312 tcg_ctx.cpu = ENV_GET_CPU(env);
1313 gen_intermediate_code(env, tb);
1314 tcg_ctx.cpu = NULL;
1315
1316 trace_translate_block(tb, tb->pc, tb->tc_ptr);
1317
1318 /* generate machine code */
1319 tb->jmp_reset_offset[0] = TB_JMP_RESET_OFFSET_INVALID;
1320 tb->jmp_reset_offset[1] = TB_JMP_RESET_OFFSET_INVALID;
1321 tcg_ctx.tb_jmp_reset_offset = tb->jmp_reset_offset;
1322 #ifdef USE_DIRECT_JUMP
1323 tcg_ctx.tb_jmp_insn_offset = tb->jmp_insn_offset;
1324 tcg_ctx.tb_jmp_target_addr = NULL;
1325 #else
1326 tcg_ctx.tb_jmp_insn_offset = NULL;
1327 tcg_ctx.tb_jmp_target_addr = tb->jmp_target_addr;
1328 #endif
1329
1330 #ifdef CONFIG_PROFILER
1331 tcg_ctx.tb_count++;
1332 tcg_ctx.interm_time += profile_getclock() - ti;
1333 tcg_ctx.code_time -= profile_getclock();
1334 #endif
1335
1336 /* ??? Overflow could be handled better here. In particular, we
1337 don't need to re-do gen_intermediate_code, nor should we re-do
1338 the tcg optimization currently hidden inside tcg_gen_code. All
1339 that should be required is to flush the TBs, allocate a new TB,
1340 re-initialize it per above, and re-do the actual code generation. */
1341 gen_code_size = tcg_gen_code(&tcg_ctx, tb);
1342 if (unlikely(gen_code_size < 0)) {
1343 goto buffer_overflow;
1344 }
1345 search_size = encode_search(tb, (void *)gen_code_buf + gen_code_size);
1346 if (unlikely(search_size < 0)) {
1347 goto buffer_overflow;
1348 }
1349
1350 #ifdef CONFIG_PROFILER
1351 tcg_ctx.code_time += profile_getclock();
1352 tcg_ctx.code_in_len += tb->size;
1353 tcg_ctx.code_out_len += gen_code_size;
1354 tcg_ctx.search_out_len += search_size;
1355 #endif
1356
1357 #ifdef DEBUG_DISAS
1358 if (qemu_loglevel_mask(CPU_LOG_TB_OUT_ASM) &&
1359 qemu_log_in_addr_range(tb->pc)) {
1360 qemu_log_lock();
1361 qemu_log("OUT: [size=%d]\n", gen_code_size);
1362 log_disas(tb->tc_ptr, gen_code_size);
1363 qemu_log("\n");
1364 qemu_log_flush();
1365 qemu_log_unlock();
1366 }
1367 #endif
1368
1369 tcg_ctx.code_gen_ptr = (void *)
1370 ROUND_UP((uintptr_t)gen_code_buf + gen_code_size + search_size,
1371 CODE_GEN_ALIGN);
1372
1373 /* init jump list */
1374 assert(((uintptr_t)tb & 3) == 0);
1375 tb->jmp_list_first = (uintptr_t)tb | 2;
1376 tb->jmp_list_next[0] = (uintptr_t)NULL;
1377 tb->jmp_list_next[1] = (uintptr_t)NULL;
1378
1379 /* init original jump addresses wich has been set during tcg_gen_code() */
1380 if (tb->jmp_reset_offset[0] != TB_JMP_RESET_OFFSET_INVALID) {
1381 tb_reset_jump(tb, 0);
1382 }
1383 if (tb->jmp_reset_offset[1] != TB_JMP_RESET_OFFSET_INVALID) {
1384 tb_reset_jump(tb, 1);
1385 }
1386
1387 /* check next page if needed */
1388 virt_page2 = (pc + tb->size - 1) & TARGET_PAGE_MASK;
1389 phys_page2 = -1;
1390 if ((pc & TARGET_PAGE_MASK) != virt_page2) {
1391 phys_page2 = get_page_addr_code(env, virt_page2);
1392 }
1393 /* As long as consistency of the TB stuff is provided by tb_lock in user
1394 * mode and is implicit in single-threaded softmmu emulation, no explicit
1395 * memory barrier is required before tb_link_page() makes the TB visible
1396 * through the physical hash table and physical page list.
1397 */
1398 tb_link_page(tb, phys_pc, phys_page2);
1399 return tb;
1400 }
1401
1402 /*
1403 * Invalidate all TBs which intersect with the target physical address range
1404 * [start;end[. NOTE: start and end may refer to *different* physical pages.
1405 * 'is_cpu_write_access' should be true if called from a real cpu write
1406 * access: the virtual CPU will exit the current TB if code is modified inside
1407 * this TB.
1408 *
1409 * Called with mmap_lock held for user-mode emulation, grabs tb_lock
1410 * Called with tb_lock held for system-mode emulation
1411 */
1412 static void tb_invalidate_phys_range_1(tb_page_addr_t start, tb_page_addr_t end)
1413 {
1414 while (start < end) {
1415 tb_invalidate_phys_page_range(start, end, 0);
1416 start &= TARGET_PAGE_MASK;
1417 start += TARGET_PAGE_SIZE;
1418 }
1419 }
1420
1421 #ifdef CONFIG_SOFTMMU
1422 void tb_invalidate_phys_range(tb_page_addr_t start, tb_page_addr_t end)
1423 {
1424 assert_tb_lock();
1425 tb_invalidate_phys_range_1(start, end);
1426 }
1427 #else
1428 void tb_invalidate_phys_range(tb_page_addr_t start, tb_page_addr_t end)
1429 {
1430 assert_memory_lock();
1431 tb_lock();
1432 tb_invalidate_phys_range_1(start, end);
1433 tb_unlock();
1434 }
1435 #endif
1436 /*
1437 * Invalidate all TBs which intersect with the target physical address range
1438 * [start;end[. NOTE: start and end must refer to the *same* physical page.
1439 * 'is_cpu_write_access' should be true if called from a real cpu write
1440 * access: the virtual CPU will exit the current TB if code is modified inside
1441 * this TB.
1442 *
1443 * Called with tb_lock/mmap_lock held for user-mode emulation
1444 * Called with tb_lock held for system-mode emulation
1445 */
1446 void tb_invalidate_phys_page_range(tb_page_addr_t start, tb_page_addr_t end,
1447 int is_cpu_write_access)
1448 {
1449 TranslationBlock *tb, *tb_next;
1450 #if defined(TARGET_HAS_PRECISE_SMC)
1451 CPUState *cpu = current_cpu;
1452 CPUArchState *env = NULL;
1453 #endif
1454 tb_page_addr_t tb_start, tb_end;
1455 PageDesc *p;
1456 int n;
1457 #ifdef TARGET_HAS_PRECISE_SMC
1458 int current_tb_not_found = is_cpu_write_access;
1459 TranslationBlock *current_tb = NULL;
1460 int current_tb_modified = 0;
1461 target_ulong current_pc = 0;
1462 target_ulong current_cs_base = 0;
1463 uint32_t current_flags = 0;
1464 #endif /* TARGET_HAS_PRECISE_SMC */
1465
1466 assert_memory_lock();
1467 assert_tb_lock();
1468
1469 p = page_find(start >> TARGET_PAGE_BITS);
1470 if (!p) {
1471 return;
1472 }
1473 #if defined(TARGET_HAS_PRECISE_SMC)
1474 if (cpu != NULL) {
1475 env = cpu->env_ptr;
1476 }
1477 #endif
1478
1479 /* we remove all the TBs in the range [start, end[ */
1480 /* XXX: see if in some cases it could be faster to invalidate all
1481 the code */
1482 tb = p->first_tb;
1483 while (tb != NULL) {
1484 n = (uintptr_t)tb & 3;
1485 tb = (TranslationBlock *)((uintptr_t)tb & ~3);
1486 tb_next = tb->page_next[n];
1487 /* NOTE: this is subtle as a TB may span two physical pages */
1488 if (n == 0) {
1489 /* NOTE: tb_end may be after the end of the page, but
1490 it is not a problem */
1491 tb_start = tb->page_addr[0] + (tb->pc & ~TARGET_PAGE_MASK);
1492 tb_end = tb_start + tb->size;
1493 } else {
1494 tb_start = tb->page_addr[1];
1495 tb_end = tb_start + ((tb->pc + tb->size) & ~TARGET_PAGE_MASK);
1496 }
1497 if (!(tb_end <= start || tb_start >= end)) {
1498 #ifdef TARGET_HAS_PRECISE_SMC
1499 if (current_tb_not_found) {
1500 current_tb_not_found = 0;
1501 current_tb = NULL;
1502 if (cpu->mem_io_pc) {
1503 /* now we have a real cpu fault */
1504 current_tb = tb_find_pc(cpu->mem_io_pc);
1505 }
1506 }
1507 if (current_tb == tb &&
1508 (current_tb->cflags & CF_COUNT_MASK) != 1) {
1509 /* If we are modifying the current TB, we must stop
1510 its execution. We could be more precise by checking
1511 that the modification is after the current PC, but it
1512 would require a specialized function to partially
1513 restore the CPU state */
1514
1515 current_tb_modified = 1;
1516 cpu_restore_state_from_tb(cpu, current_tb, cpu->mem_io_pc);
1517 cpu_get_tb_cpu_state(env, &current_pc, &current_cs_base,
1518 &current_flags);
1519 }
1520 #endif /* TARGET_HAS_PRECISE_SMC */
1521 tb_phys_invalidate(tb, -1);
1522 }
1523 tb = tb_next;
1524 }
1525 #if !defined(CONFIG_USER_ONLY)
1526 /* if no code remaining, no need to continue to use slow writes */
1527 if (!p->first_tb) {
1528 invalidate_page_bitmap(p);
1529 tlb_unprotect_code(start);
1530 }
1531 #endif
1532 #ifdef TARGET_HAS_PRECISE_SMC
1533 if (current_tb_modified) {
1534 /* we generate a block containing just the instruction
1535 modifying the memory. It will ensure that it cannot modify
1536 itself */
1537 tb_gen_code(cpu, current_pc, current_cs_base, current_flags, 1);
1538 cpu_loop_exit_noexc(cpu);
1539 }
1540 #endif
1541 }
1542
1543 #ifdef CONFIG_SOFTMMU
1544 /* len must be <= 8 and start must be a multiple of len.
1545 * Called via softmmu_template.h when code areas are written to with
1546 * tb_lock held.
1547 */
1548 void tb_invalidate_phys_page_fast(tb_page_addr_t start, int len)
1549 {
1550 PageDesc *p;
1551
1552 #if 0
1553 if (1) {
1554 qemu_log("modifying code at 0x%x size=%d EIP=%x PC=%08x\n",
1555 cpu_single_env->mem_io_vaddr, len,
1556 cpu_single_env->eip,
1557 cpu_single_env->eip +
1558 (intptr_t)cpu_single_env->segs[R_CS].base);
1559 }
1560 #endif
1561 assert_memory_lock();
1562
1563 p = page_find(start >> TARGET_PAGE_BITS);
1564 if (!p) {
1565 return;
1566 }
1567 if (!p->code_bitmap &&
1568 ++p->code_write_count >= SMC_BITMAP_USE_THRESHOLD) {
1569 /* build code bitmap. FIXME: writes should be protected by
1570 * tb_lock, reads by tb_lock or RCU.
1571 */
1572 build_page_bitmap(p);
1573 }
1574 if (p->code_bitmap) {
1575 unsigned int nr;
1576 unsigned long b;
1577
1578 nr = start & ~TARGET_PAGE_MASK;
1579 b = p->code_bitmap[BIT_WORD(nr)] >> (nr & (BITS_PER_LONG - 1));
1580 if (b & ((1 << len) - 1)) {
1581 goto do_invalidate;
1582 }
1583 } else {
1584 do_invalidate:
1585 tb_invalidate_phys_page_range(start, start + len, 1);
1586 }
1587 }
1588 #else
1589 /* Called with mmap_lock held. If pc is not 0 then it indicates the
1590 * host PC of the faulting store instruction that caused this invalidate.
1591 * Returns true if the caller needs to abort execution of the current
1592 * TB (because it was modified by this store and the guest CPU has
1593 * precise-SMC semantics).
1594 */
1595 static bool tb_invalidate_phys_page(tb_page_addr_t addr, uintptr_t pc)
1596 {
1597 TranslationBlock *tb;
1598 PageDesc *p;
1599 int n;
1600 #ifdef TARGET_HAS_PRECISE_SMC
1601 TranslationBlock *current_tb = NULL;
1602 CPUState *cpu = current_cpu;
1603 CPUArchState *env = NULL;
1604 int current_tb_modified = 0;
1605 target_ulong current_pc = 0;
1606 target_ulong current_cs_base = 0;
1607 uint32_t current_flags = 0;
1608 #endif
1609
1610 assert_memory_lock();
1611
1612 addr &= TARGET_PAGE_MASK;
1613 p = page_find(addr >> TARGET_PAGE_BITS);
1614 if (!p) {
1615 return false;
1616 }
1617
1618 tb_lock();
1619 tb = p->first_tb;
1620 #ifdef TARGET_HAS_PRECISE_SMC
1621 if (tb && pc != 0) {
1622 current_tb = tb_find_pc(pc);
1623 }
1624 if (cpu != NULL) {
1625 env = cpu->env_ptr;
1626 }
1627 #endif
1628 while (tb != NULL) {
1629 n = (uintptr_t)tb & 3;
1630 tb = (TranslationBlock *)((uintptr_t)tb & ~3);
1631 #ifdef TARGET_HAS_PRECISE_SMC
1632 if (current_tb == tb &&
1633 (current_tb->cflags & CF_COUNT_MASK) != 1) {
1634 /* If we are modifying the current TB, we must stop
1635 its execution. We could be more precise by checking
1636 that the modification is after the current PC, but it
1637 would require a specialized function to partially
1638 restore the CPU state */
1639
1640 current_tb_modified = 1;
1641 cpu_restore_state_from_tb(cpu, current_tb, pc);
1642 cpu_get_tb_cpu_state(env, &current_pc, &current_cs_base,
1643 &current_flags);
1644 }
1645 #endif /* TARGET_HAS_PRECISE_SMC */
1646 tb_phys_invalidate(tb, addr);
1647 tb = tb->page_next[n];
1648 }
1649 p->first_tb = NULL;
1650 #ifdef TARGET_HAS_PRECISE_SMC
1651 if (current_tb_modified) {
1652 /* we generate a block containing just the instruction
1653 modifying the memory. It will ensure that it cannot modify
1654 itself */
1655 tb_gen_code(cpu, current_pc, current_cs_base, current_flags, 1);
1656 /* tb_lock will be reset after cpu_loop_exit_noexc longjmps
1657 * back into the cpu_exec loop. */
1658 return true;
1659 }
1660 #endif
1661 tb_unlock();
1662
1663 return false;
1664 }
1665 #endif
1666
1667 /* find the TB 'tb' such that tb[0].tc_ptr <= tc_ptr <
1668 tb[1].tc_ptr. Return NULL if not found */
1669 static TranslationBlock *tb_find_pc(uintptr_t tc_ptr)
1670 {
1671 int m_min, m_max, m;
1672 uintptr_t v;
1673 TranslationBlock *tb;
1674
1675 if (tcg_ctx.tb_ctx.nb_tbs <= 0) {
1676 return NULL;
1677 }
1678 if (tc_ptr < (uintptr_t)tcg_ctx.code_gen_buffer ||
1679 tc_ptr >= (uintptr_t)tcg_ctx.code_gen_ptr) {
1680 return NULL;
1681 }
1682 /* binary search (cf Knuth) */
1683 m_min = 0;
1684 m_max = tcg_ctx.tb_ctx.nb_tbs - 1;
1685 while (m_min <= m_max) {
1686 m = (m_min + m_max) >> 1;
1687 tb = &tcg_ctx.tb_ctx.tbs[m];
1688 v = (uintptr_t)tb->tc_ptr;
1689 if (v == tc_ptr) {
1690 return tb;
1691 } else if (tc_ptr < v) {
1692 m_max = m - 1;
1693 } else {
1694 m_min = m + 1;
1695 }
1696 }
1697 return &tcg_ctx.tb_ctx.tbs[m_max];
1698 }
1699
1700 #if !defined(CONFIG_USER_ONLY)
1701 void tb_invalidate_phys_addr(AddressSpace *as, hwaddr addr)
1702 {
1703 ram_addr_t ram_addr;
1704 MemoryRegion *mr;
1705 hwaddr l = 1;
1706
1707 rcu_read_lock();
1708 mr = address_space_translate(as, addr, &addr, &l, false);
1709 if (!(memory_region_is_ram(mr)
1710 || memory_region_is_romd(mr))) {
1711 rcu_read_unlock();
1712 return;
1713 }
1714 ram_addr = memory_region_get_ram_addr(mr) + addr;
1715 tb_lock();
1716 tb_invalidate_phys_page_range(ram_addr, ram_addr + 1, 0);
1717 tb_unlock();
1718 rcu_read_unlock();
1719 }
1720 #endif /* !defined(CONFIG_USER_ONLY) */
1721
1722 /* Called with tb_lock held. */
1723 void tb_check_watchpoint(CPUState *cpu)
1724 {
1725 TranslationBlock *tb;
1726
1727 tb = tb_find_pc(cpu->mem_io_pc);
1728 if (tb) {
1729 /* We can use retranslation to find the PC. */
1730 cpu_restore_state_from_tb(cpu, tb, cpu->mem_io_pc);
1731 tb_phys_invalidate(tb, -1);
1732 } else {
1733 /* The exception probably happened in a helper. The CPU state should
1734 have been saved before calling it. Fetch the PC from there. */
1735 CPUArchState *env = cpu->env_ptr;
1736 target_ulong pc, cs_base;
1737 tb_page_addr_t addr;
1738 uint32_t flags;
1739
1740 cpu_get_tb_cpu_state(env, &pc, &cs_base, &flags);
1741 addr = get_page_addr_code(env, pc);
1742 tb_invalidate_phys_range(addr, addr + 1);
1743 }
1744 }
1745
1746 #ifndef CONFIG_USER_ONLY
1747 /* in deterministic execution mode, instructions doing device I/Os
1748 must be at the end of the TB */
1749 void cpu_io_recompile(CPUState *cpu, uintptr_t retaddr)
1750 {
1751 #if defined(TARGET_MIPS) || defined(TARGET_SH4)
1752 CPUArchState *env = cpu->env_ptr;
1753 #endif
1754 TranslationBlock *tb;
1755 uint32_t n, cflags;
1756 target_ulong pc, cs_base;
1757 uint32_t flags;
1758
1759 tb_lock();
1760 tb = tb_find_pc(retaddr);
1761 if (!tb) {
1762 cpu_abort(cpu, "cpu_io_recompile: could not find TB for pc=%p",
1763 (void *)retaddr);
1764 }
1765 n = cpu->icount_decr.u16.low + tb->icount;
1766 cpu_restore_state_from_tb(cpu, tb, retaddr);
1767 /* Calculate how many instructions had been executed before the fault
1768 occurred. */
1769 n = n - cpu->icount_decr.u16.low;
1770 /* Generate a new TB ending on the I/O insn. */
1771 n++;
1772 /* On MIPS and SH, delay slot instructions can only be restarted if
1773 they were already the first instruction in the TB. If this is not
1774 the first instruction in a TB then re-execute the preceding
1775 branch. */
1776 #if defined(TARGET_MIPS)
1777 if ((env->hflags & MIPS_HFLAG_BMASK) != 0 && n > 1) {
1778 env->active_tc.PC -= (env->hflags & MIPS_HFLAG_B16 ? 2 : 4);
1779 cpu->icount_decr.u16.low++;
1780 env->hflags &= ~MIPS_HFLAG_BMASK;
1781 }
1782 #elif defined(TARGET_SH4)
1783 if ((env->flags & ((DELAY_SLOT | DELAY_SLOT_CONDITIONAL))) != 0
1784 && n > 1) {
1785 env->pc -= 2;
1786 cpu->icount_decr.u16.low++;
1787 env->flags &= ~(DELAY_SLOT | DELAY_SLOT_CONDITIONAL);
1788 }
1789 #endif
1790 /* This should never happen. */
1791 if (n > CF_COUNT_MASK) {
1792 cpu_abort(cpu, "TB too big during recompile");
1793 }
1794
1795 cflags = n | CF_LAST_IO;
1796 pc = tb->pc;
1797 cs_base = tb->cs_base;
1798 flags = tb->flags;
1799 tb_phys_invalidate(tb, -1);
1800 if (tb->cflags & CF_NOCACHE) {
1801 if (tb->orig_tb) {
1802 /* Invalidate original TB if this TB was generated in
1803 * cpu_exec_nocache() */
1804 tb_phys_invalidate(tb->orig_tb, -1);
1805 }
1806 tb_free(tb);
1807 }
1808 /* FIXME: In theory this could raise an exception. In practice
1809 we have already translated the block once so it's probably ok. */
1810 tb_gen_code(cpu, pc, cs_base, flags, cflags);
1811
1812 /* TODO: If env->pc != tb->pc (i.e. the faulting instruction was not
1813 * the first in the TB) then we end up generating a whole new TB and
1814 * repeating the fault, which is horribly inefficient.
1815 * Better would be to execute just this insn uncached, or generate a
1816 * second new TB.
1817 *
1818 * cpu_loop_exit_noexc will longjmp back to cpu_exec where the
1819 * tb_lock gets reset.
1820 */
1821 cpu_loop_exit_noexc(cpu);
1822 }
1823
1824 void tb_flush_jmp_cache(CPUState *cpu, target_ulong addr)
1825 {
1826 unsigned int i;
1827
1828 /* Discard jump cache entries for any tb which might potentially
1829 overlap the flushed page. */
1830 i = tb_jmp_cache_hash_page(addr - TARGET_PAGE_SIZE);
1831 memset(&cpu->tb_jmp_cache[i], 0,
1832 TB_JMP_PAGE_SIZE * sizeof(TranslationBlock *));
1833
1834 i = tb_jmp_cache_hash_page(addr);
1835 memset(&cpu->tb_jmp_cache[i], 0,
1836 TB_JMP_PAGE_SIZE * sizeof(TranslationBlock *));
1837 }
1838
1839 static void print_qht_statistics(FILE *f, fprintf_function cpu_fprintf,
1840 struct qht_stats hst)
1841 {
1842 uint32_t hgram_opts;
1843 size_t hgram_bins;
1844 char *hgram;
1845
1846 if (!hst.head_buckets) {
1847 return;
1848 }
1849 cpu_fprintf(f, "TB hash buckets %zu/%zu (%0.2f%% head buckets used)\n",
1850 hst.used_head_buckets, hst.head_buckets,
1851 (double)hst.used_head_buckets / hst.head_buckets * 100);
1852
1853 hgram_opts = QDIST_PR_BORDER | QDIST_PR_LABELS;
1854 hgram_opts |= QDIST_PR_100X | QDIST_PR_PERCENT;
1855 if (qdist_xmax(&hst.occupancy) - qdist_xmin(&hst.occupancy) == 1) {
1856 hgram_opts |= QDIST_PR_NODECIMAL;
1857 }
1858 hgram = qdist_pr(&hst.occupancy, 10, hgram_opts);
1859 cpu_fprintf(f, "TB hash occupancy %0.2f%% avg chain occ. Histogram: %s\n",
1860 qdist_avg(&hst.occupancy) * 100, hgram);
1861 g_free(hgram);
1862
1863 hgram_opts = QDIST_PR_BORDER | QDIST_PR_LABELS;
1864 hgram_bins = qdist_xmax(&hst.chain) - qdist_xmin(&hst.chain);
1865 if (hgram_bins > 10) {
1866 hgram_bins = 10;
1867 } else {
1868 hgram_bins = 0;
1869 hgram_opts |= QDIST_PR_NODECIMAL | QDIST_PR_NOBINRANGE;
1870 }
1871 hgram = qdist_pr(&hst.chain, hgram_bins, hgram_opts);
1872 cpu_fprintf(f, "TB hash avg chain %0.3f buckets. Histogram: %s\n",
1873 qdist_avg(&hst.chain), hgram);
1874 g_free(hgram);
1875 }
1876
1877 void dump_exec_info(FILE *f, fprintf_function cpu_fprintf)
1878 {
1879 int i, target_code_size, max_target_code_size;
1880 int direct_jmp_count, direct_jmp2_count, cross_page;
1881 TranslationBlock *tb;
1882 struct qht_stats hst;
1883
1884 tb_lock();
1885
1886 target_code_size = 0;
1887 max_target_code_size = 0;
1888 cross_page = 0;
1889 direct_jmp_count = 0;
1890 direct_jmp2_count = 0;
1891 for (i = 0; i < tcg_ctx.tb_ctx.nb_tbs; i++) {
1892 tb = &tcg_ctx.tb_ctx.tbs[i];
1893 target_code_size += tb->size;
1894 if (tb->size > max_target_code_size) {
1895 max_target_code_size = tb->size;
1896 }
1897 if (tb->page_addr[1] != -1) {
1898 cross_page++;
1899 }
1900 if (tb->jmp_reset_offset[0] != TB_JMP_RESET_OFFSET_INVALID) {
1901 direct_jmp_count++;
1902 if (tb->jmp_reset_offset[1] != TB_JMP_RESET_OFFSET_INVALID) {
1903 direct_jmp2_count++;
1904 }
1905 }
1906 }
1907 /* XXX: avoid using doubles ? */
1908 cpu_fprintf(f, "Translation buffer state:\n");
1909 cpu_fprintf(f, "gen code size %td/%zd\n",
1910 tcg_ctx.code_gen_ptr - tcg_ctx.code_gen_buffer,
1911 tcg_ctx.code_gen_highwater - tcg_ctx.code_gen_buffer);
1912 cpu_fprintf(f, "TB count %d/%d\n",
1913 tcg_ctx.tb_ctx.nb_tbs, tcg_ctx.code_gen_max_blocks);
1914 cpu_fprintf(f, "TB avg target size %d max=%d bytes\n",
1915 tcg_ctx.tb_ctx.nb_tbs ? target_code_size /
1916 tcg_ctx.tb_ctx.nb_tbs : 0,
1917 max_target_code_size);
1918 cpu_fprintf(f, "TB avg host size %td bytes (expansion ratio: %0.1f)\n",
1919 tcg_ctx.tb_ctx.nb_tbs ? (tcg_ctx.code_gen_ptr -
1920 tcg_ctx.code_gen_buffer) /
1921 tcg_ctx.tb_ctx.nb_tbs : 0,
1922 target_code_size ? (double) (tcg_ctx.code_gen_ptr -
1923 tcg_ctx.code_gen_buffer) /
1924 target_code_size : 0);
1925 cpu_fprintf(f, "cross page TB count %d (%d%%)\n", cross_page,
1926 tcg_ctx.tb_ctx.nb_tbs ? (cross_page * 100) /
1927 tcg_ctx.tb_ctx.nb_tbs : 0);
1928 cpu_fprintf(f, "direct jump count %d (%d%%) (2 jumps=%d %d%%)\n",
1929 direct_jmp_count,
1930 tcg_ctx.tb_ctx.nb_tbs ? (direct_jmp_count * 100) /
1931 tcg_ctx.tb_ctx.nb_tbs : 0,
1932 direct_jmp2_count,
1933 tcg_ctx.tb_ctx.nb_tbs ? (direct_jmp2_count * 100) /
1934 tcg_ctx.tb_ctx.nb_tbs : 0);
1935
1936 qht_statistics_init(&tcg_ctx.tb_ctx.htable, &hst);
1937 print_qht_statistics(f, cpu_fprintf, hst);
1938 qht_statistics_destroy(&hst);
1939
1940 cpu_fprintf(f, "\nStatistics:\n");
1941 cpu_fprintf(f, "TB flush count %u\n",
1942 atomic_read(&tcg_ctx.tb_ctx.tb_flush_count));
1943 cpu_fprintf(f, "TB invalidate count %d\n",
1944 tcg_ctx.tb_ctx.tb_phys_invalidate_count);
1945 cpu_fprintf(f, "TLB flush count %d\n", tlb_flush_count);
1946 tcg_dump_info(f, cpu_fprintf);
1947
1948 tb_unlock();
1949 }
1950
1951 void dump_opcount_info(FILE *f, fprintf_function cpu_fprintf)
1952 {
1953 tcg_dump_op_count(f, cpu_fprintf);
1954 }
1955
1956 #else /* CONFIG_USER_ONLY */
1957
1958 void cpu_interrupt(CPUState *cpu, int mask)
1959 {
1960 cpu->interrupt_request |= mask;
1961 cpu->tcg_exit_req = 1;
1962 }
1963
1964 /*
1965 * Walks guest process memory "regions" one by one
1966 * and calls callback function 'fn' for each region.
1967 */
1968 struct walk_memory_regions_data {
1969 walk_memory_regions_fn fn;
1970 void *priv;
1971 target_ulong start;
1972 int prot;
1973 };
1974
1975 static int walk_memory_regions_end(struct walk_memory_regions_data *data,
1976 target_ulong end, int new_prot)
1977 {
1978 if (data->start != -1u) {
1979 int rc = data->fn(data->priv, data->start, end, data->prot);
1980 if (rc != 0) {
1981 return rc;
1982 }
1983 }
1984
1985 data->start = (new_prot ? end : -1u);
1986 data->prot = new_prot;
1987
1988 return 0;
1989 }
1990
1991 static int walk_memory_regions_1(struct walk_memory_regions_data *data,
1992 target_ulong base, int level, void **lp)
1993 {
1994 target_ulong pa;
1995 int i, rc;
1996
1997 if (*lp == NULL) {
1998 return walk_memory_regions_end(data, base, 0);
1999 }
2000
2001 if (level == 0) {
2002 PageDesc *pd = *lp;
2003
2004 for (i = 0; i < V_L2_SIZE; ++i) {
2005 int prot = pd[i].flags;
2006
2007 pa = base | (i << TARGET_PAGE_BITS);
2008 if (prot != data->prot) {
2009 rc = walk_memory_regions_end(data, pa, prot);
2010 if (rc != 0) {
2011 return rc;
2012 }
2013 }
2014 }
2015 } else {
2016 void **pp = *lp;
2017
2018 for (i = 0; i < V_L2_SIZE; ++i) {
2019 pa = base | ((target_ulong)i <<
2020 (TARGET_PAGE_BITS + V_L2_BITS * level));
2021 rc = walk_memory_regions_1(data, pa, level - 1, pp + i);
2022 if (rc != 0) {
2023 return rc;
2024 }
2025 }
2026 }
2027
2028 return 0;
2029 }
2030
2031 int walk_memory_regions(void *priv, walk_memory_regions_fn fn)
2032 {
2033 struct walk_memory_regions_data data;
2034 uintptr_t i, l1_sz = v_l1_size;
2035
2036 data.fn = fn;
2037 data.priv = priv;
2038 data.start = -1u;
2039 data.prot = 0;
2040
2041 for (i = 0; i < l1_sz; i++) {
2042 target_ulong base = i << (v_l1_shift + TARGET_PAGE_BITS);
2043 int rc = walk_memory_regions_1(&data, base, v_l2_levels, l1_map + i);
2044 if (rc != 0) {
2045 return rc;
2046 }
2047 }
2048
2049 return walk_memory_regions_end(&data, 0, 0);
2050 }
2051
2052 static int dump_region(void *priv, target_ulong start,
2053 target_ulong end, unsigned long prot)
2054 {
2055 FILE *f = (FILE *)priv;
2056
2057 (void) fprintf(f, TARGET_FMT_lx"-"TARGET_FMT_lx
2058 " "TARGET_FMT_lx" %c%c%c\n",
2059 start, end, end - start,
2060 ((prot & PAGE_READ) ? 'r' : '-'),
2061 ((prot & PAGE_WRITE) ? 'w' : '-'),
2062 ((prot & PAGE_EXEC) ? 'x' : '-'));
2063
2064 return 0;
2065 }
2066
2067 /* dump memory mappings */
2068 void page_dump(FILE *f)
2069 {
2070 const int length = sizeof(target_ulong) * 2;
2071 (void) fprintf(f, "%-*s %-*s %-*s %s\n",
2072 length, "start", length, "end", length, "size", "prot");
2073 walk_memory_regions(f, dump_region);
2074 }
2075
2076 int page_get_flags(target_ulong address)
2077 {
2078 PageDesc *p;
2079
2080 p = page_find(address >> TARGET_PAGE_BITS);
2081 if (!p) {
2082 return 0;
2083 }
2084 return p->flags;
2085 }
2086
2087 /* Modify the flags of a page and invalidate the code if necessary.
2088 The flag PAGE_WRITE_ORG is positioned automatically depending
2089 on PAGE_WRITE. The mmap_lock should already be held. */
2090 void page_set_flags(target_ulong start, target_ulong end, int flags)
2091 {
2092 target_ulong addr, len;
2093
2094 /* This function should never be called with addresses outside the
2095 guest address space. If this assert fires, it probably indicates
2096 a missing call to h2g_valid. */
2097 #if TARGET_ABI_BITS > L1_MAP_ADDR_SPACE_BITS
2098 assert(end < ((target_ulong)1 << L1_MAP_ADDR_SPACE_BITS));
2099 #endif
2100 assert(start < end);
2101 assert_memory_lock();
2102
2103 start = start & TARGET_PAGE_MASK;
2104 end = TARGET_PAGE_ALIGN(end);
2105
2106 if (flags & PAGE_WRITE) {
2107 flags |= PAGE_WRITE_ORG;
2108 }
2109
2110 for (addr = start, len = end - start;
2111 len != 0;
2112 len -= TARGET_PAGE_SIZE, addr += TARGET_PAGE_SIZE) {
2113 PageDesc *p = page_find_alloc(addr >> TARGET_PAGE_BITS, 1);
2114
2115 /* If the write protection bit is set, then we invalidate
2116 the code inside. */
2117 if (!(p->flags & PAGE_WRITE) &&
2118 (flags & PAGE_WRITE) &&
2119 p->first_tb) {
2120 tb_invalidate_phys_page(addr, 0);
2121 }
2122 p->flags = flags;
2123 }
2124 }
2125
2126 int page_check_range(target_ulong start, target_ulong len, int flags)
2127 {
2128 PageDesc *p;
2129 target_ulong end;
2130 target_ulong addr;
2131
2132 /* This function should never be called with addresses outside the
2133 guest address space. If this assert fires, it probably indicates
2134 a missing call to h2g_valid. */
2135 #if TARGET_ABI_BITS > L1_MAP_ADDR_SPACE_BITS
2136 assert(start < ((target_ulong)1 << L1_MAP_ADDR_SPACE_BITS));
2137 #endif
2138
2139 if (len == 0) {
2140 return 0;
2141 }
2142 if (start + len - 1 < start) {
2143 /* We've wrapped around. */
2144 return -1;
2145 }
2146
2147 /* must do before we loose bits in the next step */
2148 end = TARGET_PAGE_ALIGN(start + len);
2149 start = start & TARGET_PAGE_MASK;
2150
2151 for (addr = start, len = end - start;
2152 len != 0;
2153 len -= TARGET_PAGE_SIZE, addr += TARGET_PAGE_SIZE) {
2154 p = page_find(addr >> TARGET_PAGE_BITS);
2155 if (!p) {
2156 return -1;
2157 }
2158 if (!(p->flags & PAGE_VALID)) {
2159 return -1;
2160 }
2161
2162 if ((flags & PAGE_READ) && !(p->flags & PAGE_READ)) {
2163 return -1;
2164 }
2165 if (flags & PAGE_WRITE) {
2166 if (!(p->flags & PAGE_WRITE_ORG)) {
2167 return -1;
2168 }
2169 /* unprotect the page if it was put read-only because it
2170 contains translated code */
2171 if (!(p->flags & PAGE_WRITE)) {
2172 if (!page_unprotect(addr, 0)) {
2173 return -1;
2174 }
2175 }
2176 }
2177 }
2178 return 0;
2179 }
2180
2181 /* called from signal handler: invalidate the code and unprotect the
2182 * page. Return 0 if the fault was not handled, 1 if it was handled,
2183 * and 2 if it was handled but the caller must cause the TB to be
2184 * immediately exited. (We can only return 2 if the 'pc' argument is
2185 * non-zero.)
2186 */
2187 int page_unprotect(target_ulong address, uintptr_t pc)
2188 {
2189 unsigned int prot;
2190 bool current_tb_invalidated;
2191 PageDesc *p;
2192 target_ulong host_start, host_end, addr;
2193
2194 /* Technically this isn't safe inside a signal handler. However we
2195 know this only ever happens in a synchronous SEGV handler, so in
2196 practice it seems to be ok. */
2197 mmap_lock();
2198
2199 p = page_find(address >> TARGET_PAGE_BITS);
2200 if (!p) {
2201 mmap_unlock();
2202 return 0;
2203 }
2204
2205 /* if the page was really writable, then we change its
2206 protection back to writable */
2207 if ((p->flags & PAGE_WRITE_ORG) && !(p->flags & PAGE_WRITE)) {
2208 host_start = address & qemu_host_page_mask;
2209 host_end = host_start + qemu_host_page_size;
2210
2211 prot = 0;
2212 current_tb_invalidated = false;
2213 for (addr = host_start ; addr < host_end ; addr += TARGET_PAGE_SIZE) {
2214 p = page_find(addr >> TARGET_PAGE_BITS);
2215 p->flags |= PAGE_WRITE;
2216 prot |= p->flags;
2217
2218 /* and since the content will be modified, we must invalidate
2219 the corresponding translated code. */
2220 current_tb_invalidated |= tb_invalidate_phys_page(addr, pc);
2221 #ifdef DEBUG_TB_CHECK
2222 tb_invalidate_check(addr);
2223 #endif
2224 }
2225 mprotect((void *)g2h(host_start), qemu_host_page_size,
2226 prot & PAGE_BITS);
2227
2228 mmap_unlock();
2229 /* If current TB was invalidated return to main loop */
2230 return current_tb_invalidated ? 2 : 1;
2231 }
2232 mmap_unlock();
2233 return 0;
2234 }
2235 #endif /* CONFIG_USER_ONLY */