target-i386: introduce CCPrepare
target-i386/translate.c (qemu.git)
1 /*
2 * i386 translation
3 *
4 * Copyright (c) 2003 Fabrice Bellard
5 *
6 * This library is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Lesser General Public
8 * License as published by the Free Software Foundation; either
9 * version 2 of the License, or (at your option) any later version.
10 *
11 * This library is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Lesser General Public License for more details.
15 *
16 * You should have received a copy of the GNU Lesser General Public
17 * License along with this library; if not, see <http://www.gnu.org/licenses/>.
18 */
19 #include <stdarg.h>
20 #include <stdlib.h>
21 #include <stdio.h>
22 #include <string.h>
23 #include <inttypes.h>
24 #include <signal.h>
25
26 #include "qemu/host-utils.h"
27 #include "cpu.h"
28 #include "disas/disas.h"
29 #include "tcg-op.h"
30
31 #include "helper.h"
32 #define GEN_HELPER 1
33 #include "helper.h"
34
35 #define PREFIX_REPZ 0x01
36 #define PREFIX_REPNZ 0x02
37 #define PREFIX_LOCK 0x04
38 #define PREFIX_DATA 0x08
39 #define PREFIX_ADR 0x10
40
41 #ifdef TARGET_X86_64
42 #define CODE64(s) ((s)->code64)
43 #define REX_X(s) ((s)->rex_x)
44 #define REX_B(s) ((s)->rex_b)
45 #else
46 #define CODE64(s) 0
47 #define REX_X(s) 0
48 #define REX_B(s) 0
49 #endif
50
51 #ifdef TARGET_X86_64
52 # define ctztl ctz64
53 # define clztl clz64
54 #else
55 # define ctztl ctz32
56 # define clztl clz32
57 #endif
58
59 //#define MACRO_TEST 1
60
61 /* global register indexes */
62 static TCGv_ptr cpu_env;
63 static TCGv cpu_A0, cpu_cc_src, cpu_cc_dst;
64 static TCGv_i32 cpu_cc_op;
65 static TCGv cpu_regs[CPU_NB_REGS];
66 /* local temps */
67 static TCGv cpu_T[2], cpu_T3;
68 /* local register indexes (only used inside old micro ops) */
69 static TCGv cpu_tmp0, cpu_tmp4;
70 static TCGv_ptr cpu_ptr0, cpu_ptr1;
71 static TCGv_i32 cpu_tmp2_i32, cpu_tmp3_i32;
72 static TCGv_i64 cpu_tmp1_i64;
73 static TCGv cpu_tmp5;
74
75 static uint8_t gen_opc_cc_op[OPC_BUF_SIZE];
76
77 #include "exec/gen-icount.h"
78
79 #ifdef TARGET_X86_64
80 static int x86_64_hregs;
81 #endif
82
83 typedef struct DisasContext {
84 /* current insn context */
85 int override; /* -1 if no override */
86 int prefix;
87 int aflag, dflag;
88 target_ulong pc; /* pc = eip + cs_base */
89 int is_jmp; /* 1 means jump (stop translation), 2 means a
90 change of static CPU state (stop translation) */
91 /* current block context */
92 target_ulong cs_base; /* base of CS segment */
93 int pe; /* protected mode */
94 int code32; /* 32 bit code segment */
95 #ifdef TARGET_X86_64
96 int lma; /* long mode active */
97 int code64; /* 64 bit code segment */
98 int rex_x, rex_b;
99 #endif
100 int ss32; /* 32 bit stack segment */
101 CCOp cc_op; /* current CC operation */
102 bool cc_op_dirty;
103 int addseg; /* non-zero if any of DS, ES or SS has a non-zero base */
104 int f_st; /* currently unused */
105 int vm86; /* vm86 mode */
106 int cpl;
107 int iopl;
108 int tf; /* TF cpu flag */
109 int singlestep_enabled; /* "hardware" single step enabled */
110 int jmp_opt; /* use direct block chaining for direct jumps */
111 int mem_index; /* select memory access functions */
112 uint64_t flags; /* all execution flags */
113 struct TranslationBlock *tb;
114 int popl_esp_hack; /* for correct popl with esp base handling */
115 int rip_offset; /* only used in x86_64, but left for simplicity */
116 int cpuid_features;
117 int cpuid_ext_features;
118 int cpuid_ext2_features;
119 int cpuid_ext3_features;
120 int cpuid_7_0_ebx_features;
121 } DisasContext;
122
123 static void gen_eob(DisasContext *s);
124 static void gen_jmp(DisasContext *s, target_ulong eip);
125 static void gen_jmp_tb(DisasContext *s, target_ulong eip, int tb_num);
126
127 /* i386 arith/logic operations */
128 enum {
129 OP_ADDL,
130 OP_ORL,
131 OP_ADCL,
132 OP_SBBL,
133 OP_ANDL,
134 OP_SUBL,
135 OP_XORL,
136 OP_CMPL,
137 };
138
139 /* i386 shift ops */
140 enum {
141 OP_ROL,
142 OP_ROR,
143 OP_RCL,
144 OP_RCR,
145 OP_SHL,
146 OP_SHR,
147 OP_SHL1, /* undocumented */
148 OP_SAR = 7,
149 };
150
151 enum {
152 JCC_O,
153 JCC_B,
154 JCC_Z,
155 JCC_BE,
156 JCC_S,
157 JCC_P,
158 JCC_L,
159 JCC_LE,
160 };
161
162 /* operand size */
163 enum {
164 OT_BYTE = 0,
165 OT_WORD,
166 OT_LONG,
167 OT_QUAD,
168 };
169
170 enum {
171 /* I386 int registers */
172 OR_EAX, /* MUST be even numbered */
173 OR_ECX,
174 OR_EDX,
175 OR_EBX,
176 OR_ESP,
177 OR_EBP,
178 OR_ESI,
179 OR_EDI,
180
181 OR_TMP0 = 16, /* temporary operand register */
182 OR_TMP1,
183 OR_A0, /* temporary register used when doing address evaluation */
184 };
185
186 enum {
187 USES_CC_DST = 1,
188 USES_CC_SRC = 2,
189 };
190
191 /* Bit set if the global variable is live after setting CC_OP to X. */
192 static const uint8_t cc_op_live[CC_OP_NB] = {
193 [CC_OP_DYNAMIC] = USES_CC_DST | USES_CC_SRC,
194 [CC_OP_EFLAGS] = USES_CC_SRC,
195 [CC_OP_MULB ... CC_OP_MULQ] = USES_CC_DST | USES_CC_SRC,
196 [CC_OP_ADDB ... CC_OP_ADDQ] = USES_CC_DST | USES_CC_SRC,
197 [CC_OP_ADCB ... CC_OP_ADCQ] = USES_CC_DST | USES_CC_SRC,
198 [CC_OP_SUBB ... CC_OP_SUBQ] = USES_CC_DST | USES_CC_SRC,
199 [CC_OP_SBBB ... CC_OP_SBBQ] = USES_CC_DST | USES_CC_SRC,
200 [CC_OP_LOGICB ... CC_OP_LOGICQ] = USES_CC_DST,
201 [CC_OP_INCB ... CC_OP_INCQ] = USES_CC_DST | USES_CC_SRC,
202 [CC_OP_DECB ... CC_OP_DECQ] = USES_CC_DST | USES_CC_SRC,
203 [CC_OP_SHLB ... CC_OP_SHLQ] = USES_CC_DST | USES_CC_SRC,
204 [CC_OP_SARB ... CC_OP_SARQ] = USES_CC_DST | USES_CC_SRC,
205 };
206
207 static void set_cc_op(DisasContext *s, CCOp op)
208 {
209 int dead;
210
211 if (s->cc_op == op) {
212 return;
213 }
214
215 /* Discard CC computation that will no longer be used. */
216 dead = cc_op_live[s->cc_op] & ~cc_op_live[op];
217 if (dead & USES_CC_DST) {
218 tcg_gen_discard_tl(cpu_cc_dst);
219 }
220 if (dead & USES_CC_SRC) {
221 tcg_gen_discard_tl(cpu_cc_src);
222 }
223
224 s->cc_op = op;
225 /* The DYNAMIC setting is translator only, and should never be
226 stored. Thus we always consider it clean. */
227 s->cc_op_dirty = (op != CC_OP_DYNAMIC);
228 }
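/* Illustration (not part of the original file): suppose the previous insn
   set CC_OP_ADDL (live: CC_DST and CC_SRC) and the next one sets
   CC_OP_LOGICL (live: CC_DST only).  Then

       dead = (USES_CC_DST | USES_CC_SRC) & ~USES_CC_DST;   == USES_CC_SRC

   so set_cc_op() emits tcg_gen_discard_tl(cpu_cc_src), letting TCG's
   liveness pass delete whatever computed the old cc_src value. */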
229
230 static void gen_update_cc_op(DisasContext *s)
231 {
232 if (s->cc_op_dirty) {
233 tcg_gen_movi_i32(cpu_cc_op, s->cc_op);
234 s->cc_op_dirty = false;
235 }
236 }
237
238 static inline void gen_op_movl_T0_0(void)
239 {
240 tcg_gen_movi_tl(cpu_T[0], 0);
241 }
242
243 static inline void gen_op_movl_T0_im(int32_t val)
244 {
245 tcg_gen_movi_tl(cpu_T[0], val);
246 }
247
248 static inline void gen_op_movl_T0_imu(uint32_t val)
249 {
250 tcg_gen_movi_tl(cpu_T[0], val);
251 }
252
253 static inline void gen_op_movl_T1_im(int32_t val)
254 {
255 tcg_gen_movi_tl(cpu_T[1], val);
256 }
257
258 static inline void gen_op_movl_T1_imu(uint32_t val)
259 {
260 tcg_gen_movi_tl(cpu_T[1], val);
261 }
262
263 static inline void gen_op_movl_A0_im(uint32_t val)
264 {
265 tcg_gen_movi_tl(cpu_A0, val);
266 }
267
268 #ifdef TARGET_X86_64
269 static inline void gen_op_movq_A0_im(int64_t val)
270 {
271 tcg_gen_movi_tl(cpu_A0, val);
272 }
273 #endif
274
275 static inline void gen_movtl_T0_im(target_ulong val)
276 {
277 tcg_gen_movi_tl(cpu_T[0], val);
278 }
279
280 static inline void gen_movtl_T1_im(target_ulong val)
281 {
282 tcg_gen_movi_tl(cpu_T[1], val);
283 }
284
285 static inline void gen_op_andl_T0_ffff(void)
286 {
287 tcg_gen_andi_tl(cpu_T[0], cpu_T[0], 0xffff);
288 }
289
290 static inline void gen_op_andl_T0_im(uint32_t val)
291 {
292 tcg_gen_andi_tl(cpu_T[0], cpu_T[0], val);
293 }
294
295 static inline void gen_op_movl_T0_T1(void)
296 {
297 tcg_gen_mov_tl(cpu_T[0], cpu_T[1]);
298 }
299
300 static inline void gen_op_andl_A0_ffff(void)
301 {
302 tcg_gen_andi_tl(cpu_A0, cpu_A0, 0xffff);
303 }
304
305 #ifdef TARGET_X86_64
306
307 #define NB_OP_SIZES 4
308
309 #else /* !TARGET_X86_64 */
310
311 #define NB_OP_SIZES 3
312
313 #endif /* !TARGET_X86_64 */
314
315 #if defined(HOST_WORDS_BIGENDIAN)
316 #define REG_B_OFFSET (sizeof(target_ulong) - 1)
317 #define REG_H_OFFSET (sizeof(target_ulong) - 2)
318 #define REG_W_OFFSET (sizeof(target_ulong) - 2)
319 #define REG_L_OFFSET (sizeof(target_ulong) - 4)
320 #define REG_LH_OFFSET (sizeof(target_ulong) - 8)
321 #else
322 #define REG_B_OFFSET 0
323 #define REG_H_OFFSET 1
324 #define REG_W_OFFSET 0
325 #define REG_L_OFFSET 0
326 #define REG_LH_OFFSET 4
327 #endif
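/* Example (sketch): on a big-endian host with a 64-bit target_ulong, the
   low byte of a register (AL) lives at byte offset sizeof(target_ulong)-1
   = 7 and AH at offset 6, whereas on a little-endian host AL is at offset
   0 and AH at offset 1.  The offsets above make sub-register sized
   loads and stores hit the right bytes either way. */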
328
329 /* In instruction encodings for byte register accesses the
330 * register number usually indicates "low 8 bits of register N";
331 * however there are some special cases where N 4..7 indicates
332 * [AH, CH, DH, BH], i.e. "bits 15..8 of register N-4". Return
333 * true for this special case, false otherwise.
334 */
335 static inline bool byte_reg_is_xH(int reg)
336 {
337 if (reg < 4) {
338 return false;
339 }
340 #ifdef TARGET_X86_64
341 if (reg >= 8 || x86_64_hregs) {
342 return false;
343 }
344 #endif
345 return true;
346 }
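/* Example: without a REX prefix, byte-operand register number 5 names CH
   (bits 15..8 of ECX), so byte_reg_is_xH(5) is true; with any REX prefix
   (x86_64_hregs set) the same number names BPL (the low 8 bits of RBP)
   and the function returns false. */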
347
348 static inline void gen_op_mov_reg_v(int ot, int reg, TCGv t0)
349 {
350 switch(ot) {
351 case OT_BYTE:
352 if (!byte_reg_is_xH(reg)) {
353 tcg_gen_deposit_tl(cpu_regs[reg], cpu_regs[reg], t0, 0, 8);
354 } else {
355 tcg_gen_deposit_tl(cpu_regs[reg - 4], cpu_regs[reg - 4], t0, 8, 8);
356 }
357 break;
358 case OT_WORD:
359 tcg_gen_deposit_tl(cpu_regs[reg], cpu_regs[reg], t0, 0, 16);
360 break;
361 default: /* XXX this shouldn't be reached; abort? */
362 case OT_LONG:
363 /* For x86_64, this sets the higher half of register to zero.
364 For i386, this is equivalent to a mov. */
365 tcg_gen_ext32u_tl(cpu_regs[reg], t0);
366 break;
367 #ifdef TARGET_X86_64
368 case OT_QUAD:
369 tcg_gen_mov_tl(cpu_regs[reg], t0);
370 break;
371 #endif
372 }
373 }
374
375 static inline void gen_op_mov_reg_T0(int ot, int reg)
376 {
377 gen_op_mov_reg_v(ot, reg, cpu_T[0]);
378 }
379
380 static inline void gen_op_mov_reg_T1(int ot, int reg)
381 {
382 gen_op_mov_reg_v(ot, reg, cpu_T[1]);
383 }
384
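/* Note (added for clarity): the 'size' argument below follows the aflag
   convention used by callers (0 = 16-bit, 1 = 32-bit, 2 = 64-bit), so the
   OT_BYTE case actually handles 16-bit values.  The same off-by-one
   convention applies to gen_op_add_reg_im() and gen_op_add_reg_T0(). */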
385 static inline void gen_op_mov_reg_A0(int size, int reg)
386 {
387 switch(size) {
388 case OT_BYTE:
389 tcg_gen_deposit_tl(cpu_regs[reg], cpu_regs[reg], cpu_A0, 0, 16);
390 break;
391 default: /* XXX this shouldn't be reached; abort? */
392 case OT_WORD:
393 /* For x86_64, this sets the higher half of register to zero.
394 For i386, this is equivalent to a mov. */
395 tcg_gen_ext32u_tl(cpu_regs[reg], cpu_A0);
396 break;
397 #ifdef TARGET_X86_64
398 case OT_LONG:
399 tcg_gen_mov_tl(cpu_regs[reg], cpu_A0);
400 break;
401 #endif
402 }
403 }
404
405 static inline void gen_op_mov_v_reg(int ot, TCGv t0, int reg)
406 {
407 if (ot == OT_BYTE && byte_reg_is_xH(reg)) {
408 tcg_gen_shri_tl(t0, cpu_regs[reg - 4], 8);
409 tcg_gen_ext8u_tl(t0, t0);
410 } else {
411 tcg_gen_mov_tl(t0, cpu_regs[reg]);
412 }
413 }
414
415 static inline void gen_op_mov_TN_reg(int ot, int t_index, int reg)
416 {
417 gen_op_mov_v_reg(ot, cpu_T[t_index], reg);
418 }
419
420 static inline void gen_op_movl_A0_reg(int reg)
421 {
422 tcg_gen_mov_tl(cpu_A0, cpu_regs[reg]);
423 }
424
425 static inline void gen_op_addl_A0_im(int32_t val)
426 {
427 tcg_gen_addi_tl(cpu_A0, cpu_A0, val);
428 #ifdef TARGET_X86_64
429 tcg_gen_andi_tl(cpu_A0, cpu_A0, 0xffffffff);
430 #endif
431 }
432
433 #ifdef TARGET_X86_64
434 static inline void gen_op_addq_A0_im(int64_t val)
435 {
436 tcg_gen_addi_tl(cpu_A0, cpu_A0, val);
437 }
438 #endif
439
440 static void gen_add_A0_im(DisasContext *s, int val)
441 {
442 #ifdef TARGET_X86_64
443 if (CODE64(s))
444 gen_op_addq_A0_im(val);
445 else
446 #endif
447 gen_op_addl_A0_im(val);
448 }
449
450 static inline void gen_op_addl_T0_T1(void)
451 {
452 tcg_gen_add_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
453 }
454
455 static inline void gen_op_jmp_T0(void)
456 {
457 tcg_gen_st_tl(cpu_T[0], cpu_env, offsetof(CPUX86State, eip));
458 }
459
460 static inline void gen_op_add_reg_im(int size, int reg, int32_t val)
461 {
462 switch(size) {
463 case OT_BYTE:
464 tcg_gen_addi_tl(cpu_tmp0, cpu_regs[reg], val);
465 tcg_gen_deposit_tl(cpu_regs[reg], cpu_regs[reg], cpu_tmp0, 0, 16);
466 break;
467 case OT_WORD:
468 tcg_gen_addi_tl(cpu_tmp0, cpu_regs[reg], val);
469 /* For x86_64, this sets the higher half of register to zero.
470 For i386, this is equivalent to a nop. */
471 tcg_gen_ext32u_tl(cpu_tmp0, cpu_tmp0);
472 tcg_gen_mov_tl(cpu_regs[reg], cpu_tmp0);
473 break;
474 #ifdef TARGET_X86_64
475 case OT_LONG:
476 tcg_gen_addi_tl(cpu_regs[reg], cpu_regs[reg], val);
477 break;
478 #endif
479 }
480 }
481
482 static inline void gen_op_add_reg_T0(int size, int reg)
483 {
484 switch(size) {
485 case OT_BYTE:
486 tcg_gen_add_tl(cpu_tmp0, cpu_regs[reg], cpu_T[0]);
487 tcg_gen_deposit_tl(cpu_regs[reg], cpu_regs[reg], cpu_tmp0, 0, 16);
488 break;
489 case OT_WORD:
490 tcg_gen_add_tl(cpu_tmp0, cpu_regs[reg], cpu_T[0]);
491 /* For x86_64, this sets the higher half of register to zero.
492 For i386, this is equivalent to a nop. */
493 tcg_gen_ext32u_tl(cpu_tmp0, cpu_tmp0);
494 tcg_gen_mov_tl(cpu_regs[reg], cpu_tmp0);
495 break;
496 #ifdef TARGET_X86_64
497 case OT_LONG:
498 tcg_gen_add_tl(cpu_regs[reg], cpu_regs[reg], cpu_T[0]);
499 break;
500 #endif
501 }
502 }
503
504 static inline void gen_op_addl_A0_reg_sN(int shift, int reg)
505 {
506 tcg_gen_mov_tl(cpu_tmp0, cpu_regs[reg]);
507 if (shift != 0)
508 tcg_gen_shli_tl(cpu_tmp0, cpu_tmp0, shift);
509 tcg_gen_add_tl(cpu_A0, cpu_A0, cpu_tmp0);
510 /* For x86_64, this sets the higher half of register to zero.
511 For i386, this is equivalent to a nop. */
512 tcg_gen_ext32u_tl(cpu_A0, cpu_A0);
513 }
514
515 static inline void gen_op_movl_A0_seg(int reg)
516 {
517 tcg_gen_ld32u_tl(cpu_A0, cpu_env, offsetof(CPUX86State, segs[reg].base) + REG_L_OFFSET);
518 }
519
520 static inline void gen_op_addl_A0_seg(DisasContext *s, int reg)
521 {
522 tcg_gen_ld_tl(cpu_tmp0, cpu_env, offsetof(CPUX86State, segs[reg].base));
523 #ifdef TARGET_X86_64
524 if (CODE64(s)) {
525 tcg_gen_andi_tl(cpu_A0, cpu_A0, 0xffffffff);
526 tcg_gen_add_tl(cpu_A0, cpu_A0, cpu_tmp0);
527 } else {
528 tcg_gen_add_tl(cpu_A0, cpu_A0, cpu_tmp0);
529 tcg_gen_andi_tl(cpu_A0, cpu_A0, 0xffffffff);
530 }
531 #else
532 tcg_gen_add_tl(cpu_A0, cpu_A0, cpu_tmp0);
533 #endif
534 }
535
536 #ifdef TARGET_X86_64
537 static inline void gen_op_movq_A0_seg(int reg)
538 {
539 tcg_gen_ld_tl(cpu_A0, cpu_env, offsetof(CPUX86State, segs[reg].base));
540 }
541
542 static inline void gen_op_addq_A0_seg(int reg)
543 {
544 tcg_gen_ld_tl(cpu_tmp0, cpu_env, offsetof(CPUX86State, segs[reg].base));
545 tcg_gen_add_tl(cpu_A0, cpu_A0, cpu_tmp0);
546 }
547
548 static inline void gen_op_movq_A0_reg(int reg)
549 {
550 tcg_gen_mov_tl(cpu_A0, cpu_regs[reg]);
551 }
552
553 static inline void gen_op_addq_A0_reg_sN(int shift, int reg)
554 {
555 tcg_gen_mov_tl(cpu_tmp0, cpu_regs[reg]);
556 if (shift != 0)
557 tcg_gen_shli_tl(cpu_tmp0, cpu_tmp0, shift);
558 tcg_gen_add_tl(cpu_A0, cpu_A0, cpu_tmp0);
559 }
560 #endif
561
562 static inline void gen_op_lds_T0_A0(int idx)
563 {
564 int mem_index = (idx >> 2) - 1;
565 switch(idx & 3) {
566 case OT_BYTE:
567 tcg_gen_qemu_ld8s(cpu_T[0], cpu_A0, mem_index);
568 break;
569 case OT_WORD:
570 tcg_gen_qemu_ld16s(cpu_T[0], cpu_A0, mem_index);
571 break;
572 default:
573 case OT_LONG:
574 tcg_gen_qemu_ld32s(cpu_T[0], cpu_A0, mem_index);
575 break;
576 }
577 }
578
579 static inline void gen_op_ld_v(int idx, TCGv t0, TCGv a0)
580 {
581 int mem_index = (idx >> 2) - 1;
582 switch(idx & 3) {
583 case OT_BYTE:
584 tcg_gen_qemu_ld8u(t0, a0, mem_index);
585 break;
586 case OT_WORD:
587 tcg_gen_qemu_ld16u(t0, a0, mem_index);
588 break;
589 case OT_LONG:
590 tcg_gen_qemu_ld32u(t0, a0, mem_index);
591 break;
592 default:
593 case OT_QUAD:
594 /* Should never happen on 32-bit targets. */
595 #ifdef TARGET_X86_64
596 tcg_gen_qemu_ld64(t0, a0, mem_index);
597 #endif
598 break;
599 }
600 }
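/* Sketch of the idx encoding (as used throughout this file): callers pass
   idx = ot + s->mem_index, where the low two bits select the operand size
   (OT_BYTE..OT_QUAD) and the bits above, a multiple of 4 set up at
   translation-block start, select the MMU index for the softmmu access;
   hence mem_index = (idx >> 2) - 1 above. */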
601
602 /* XXX: always use ldu or lds */
603 static inline void gen_op_ld_T0_A0(int idx)
604 {
605 gen_op_ld_v(idx, cpu_T[0], cpu_A0);
606 }
607
608 static inline void gen_op_ldu_T0_A0(int idx)
609 {
610 gen_op_ld_v(idx, cpu_T[0], cpu_A0);
611 }
612
613 static inline void gen_op_ld_T1_A0(int idx)
614 {
615 gen_op_ld_v(idx, cpu_T[1], cpu_A0);
616 }
617
618 static inline void gen_op_st_v(int idx, TCGv t0, TCGv a0)
619 {
620 int mem_index = (idx >> 2) - 1;
621 switch(idx & 3) {
622 case OT_BYTE:
623 tcg_gen_qemu_st8(t0, a0, mem_index);
624 break;
625 case OT_WORD:
626 tcg_gen_qemu_st16(t0, a0, mem_index);
627 break;
628 case OT_LONG:
629 tcg_gen_qemu_st32(t0, a0, mem_index);
630 break;
631 default:
632 case OT_QUAD:
633 /* Should never happen on 32-bit targets. */
634 #ifdef TARGET_X86_64
635 tcg_gen_qemu_st64(t0, a0, mem_index);
636 #endif
637 break;
638 }
639 }
640
641 static inline void gen_op_st_T0_A0(int idx)
642 {
643 gen_op_st_v(idx, cpu_T[0], cpu_A0);
644 }
645
646 static inline void gen_op_st_T1_A0(int idx)
647 {
648 gen_op_st_v(idx, cpu_T[1], cpu_A0);
649 }
650
651 static inline void gen_jmp_im(target_ulong pc)
652 {
653 tcg_gen_movi_tl(cpu_tmp0, pc);
654 tcg_gen_st_tl(cpu_tmp0, cpu_env, offsetof(CPUX86State, eip));
655 }
656
657 static inline void gen_string_movl_A0_ESI(DisasContext *s)
658 {
659 int override;
660
661 override = s->override;
662 #ifdef TARGET_X86_64
663 if (s->aflag == 2) {
664 if (override >= 0) {
665 gen_op_movq_A0_seg(override);
666 gen_op_addq_A0_reg_sN(0, R_ESI);
667 } else {
668 gen_op_movq_A0_reg(R_ESI);
669 }
670 } else
671 #endif
672 if (s->aflag) {
673 /* 32 bit address */
674 if (s->addseg && override < 0)
675 override = R_DS;
676 if (override >= 0) {
677 gen_op_movl_A0_seg(override);
678 gen_op_addl_A0_reg_sN(0, R_ESI);
679 } else {
680 gen_op_movl_A0_reg(R_ESI);
681 }
682 } else {
683 /* 16 bit address, always override */
684 if (override < 0)
685 override = R_DS;
686 gen_op_movl_A0_reg(R_ESI);
687 gen_op_andl_A0_ffff();
688 gen_op_addl_A0_seg(s, override);
689 }
690 }
691
692 static inline void gen_string_movl_A0_EDI(DisasContext *s)
693 {
694 #ifdef TARGET_X86_64
695 if (s->aflag == 2) {
696 gen_op_movq_A0_reg(R_EDI);
697 } else
698 #endif
699 if (s->aflag) {
700 if (s->addseg) {
701 gen_op_movl_A0_seg(R_ES);
702 gen_op_addl_A0_reg_sN(0, R_EDI);
703 } else {
704 gen_op_movl_A0_reg(R_EDI);
705 }
706 } else {
707 gen_op_movl_A0_reg(R_EDI);
708 gen_op_andl_A0_ffff();
709 gen_op_addl_A0_seg(s, R_ES);
710 }
711 }
712
713 static inline void gen_op_movl_T0_Dshift(int ot)
714 {
715 tcg_gen_ld32s_tl(cpu_T[0], cpu_env, offsetof(CPUX86State, df));
716 tcg_gen_shli_tl(cpu_T[0], cpu_T[0], ot);
717 }
718
719 static TCGv gen_ext_tl(TCGv dst, TCGv src, int size, bool sign)
720 {
721 switch (size) {
722 case OT_BYTE:
723 if (sign) {
724 tcg_gen_ext8s_tl(dst, src);
725 } else {
726 tcg_gen_ext8u_tl(dst, src);
727 }
728 return dst;
729 case OT_WORD:
730 if (sign) {
731 tcg_gen_ext16s_tl(dst, src);
732 } else {
733 tcg_gen_ext16u_tl(dst, src);
734 }
735 return dst;
736 #ifdef TARGET_X86_64
737 case OT_LONG:
738 if (sign) {
739 tcg_gen_ext32s_tl(dst, src);
740 } else {
741 tcg_gen_ext32u_tl(dst, src);
742 }
743 return dst;
744 #endif
745 default:
746 return src;
747 }
748 }
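/* Example: gen_ext_tl(cpu_tmp0, cpu_cc_dst, OT_BYTE, true) sign-extends
   the low byte of cc_dst into cpu_tmp0 and returns cpu_tmp0.  For OT_LONG
   on a 32-bit target (and for OT_QUAD generally) no extension is needed,
   so the function returns 'src' unchanged -- callers must not assume the
   result aliases 'dst'. */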
749
750 static void gen_extu(int ot, TCGv reg)
751 {
752 gen_ext_tl(reg, reg, ot, false);
753 }
754
755 static void gen_exts(int ot, TCGv reg)
756 {
757 gen_ext_tl(reg, reg, ot, true);
758 }
759
760 static inline void gen_op_jnz_ecx(int size, int label1)
761 {
762 tcg_gen_mov_tl(cpu_tmp0, cpu_regs[R_ECX]);
763 gen_extu(size + 1, cpu_tmp0);
764 tcg_gen_brcondi_tl(TCG_COND_NE, cpu_tmp0, 0, label1);
765 }
766
767 static inline void gen_op_jz_ecx(int size, int label1)
768 {
769 tcg_gen_mov_tl(cpu_tmp0, cpu_regs[R_ECX]);
770 gen_extu(size + 1, cpu_tmp0);
771 tcg_gen_brcondi_tl(TCG_COND_EQ, cpu_tmp0, 0, label1);
772 }
773
774 static void gen_helper_in_func(int ot, TCGv v, TCGv_i32 n)
775 {
776 switch (ot) {
777 case OT_BYTE:
778 gen_helper_inb(v, n);
779 break;
780 case OT_WORD:
781 gen_helper_inw(v, n);
782 break;
783 case OT_LONG:
784 gen_helper_inl(v, n);
785 break;
786 }
787 }
788
789 static void gen_helper_out_func(int ot, TCGv_i32 v, TCGv_i32 n)
790 {
791 switch (ot) {
792 case OT_BYTE:
793 gen_helper_outb(v, n);
794 break;
795 case OT_WORD:
796 gen_helper_outw(v, n);
797 break;
798 case OT_LONG:
799 gen_helper_outl(v, n);
800 break;
801 }
802 }
803
804 static void gen_check_io(DisasContext *s, int ot, target_ulong cur_eip,
805 uint32_t svm_flags)
806 {
807 int state_saved;
808 target_ulong next_eip;
809
810 state_saved = 0;
811 if (s->pe && (s->cpl > s->iopl || s->vm86)) {
812 gen_update_cc_op(s);
813 gen_jmp_im(cur_eip);
814 state_saved = 1;
815 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
816 switch (ot) {
817 case OT_BYTE:
818 gen_helper_check_iob(cpu_env, cpu_tmp2_i32);
819 break;
820 case OT_WORD:
821 gen_helper_check_iow(cpu_env, cpu_tmp2_i32);
822 break;
823 case OT_LONG:
824 gen_helper_check_iol(cpu_env, cpu_tmp2_i32);
825 break;
826 }
827 }
828 if (s->flags & HF_SVMI_MASK) {
829 if (!state_saved) {
830 gen_update_cc_op(s);
831 gen_jmp_im(cur_eip);
832 }
833 svm_flags |= (1 << (4 + ot));
834 next_eip = s->pc - s->cs_base;
835 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
836 gen_helper_svm_check_io(cpu_env, cpu_tmp2_i32,
837 tcg_const_i32(svm_flags),
838 tcg_const_i32(next_eip - cur_eip));
839 }
840 }
841
842 static inline void gen_movs(DisasContext *s, int ot)
843 {
844 gen_string_movl_A0_ESI(s);
845 gen_op_ld_T0_A0(ot + s->mem_index);
846 gen_string_movl_A0_EDI(s);
847 gen_op_st_T0_A0(ot + s->mem_index);
848 gen_op_movl_T0_Dshift(ot);
849 gen_op_add_reg_T0(s->aflag, R_ESI);
850 gen_op_add_reg_T0(s->aflag, R_EDI);
851 }
852
853 static void gen_op_update1_cc(void)
854 {
855 tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
856 }
857
858 static void gen_op_update2_cc(void)
859 {
860 tcg_gen_mov_tl(cpu_cc_src, cpu_T[1]);
861 tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
862 }
863
864 static inline void gen_op_cmpl_T0_T1_cc(void)
865 {
866 tcg_gen_mov_tl(cpu_cc_src, cpu_T[1]);
867 tcg_gen_sub_tl(cpu_cc_dst, cpu_T[0], cpu_T[1]);
868 }
869
870 static inline void gen_op_testl_T0_T1_cc(void)
871 {
872 tcg_gen_and_tl(cpu_cc_dst, cpu_T[0], cpu_T[1]);
873 }
874
875 static void gen_op_update_neg_cc(void)
876 {
877 tcg_gen_neg_tl(cpu_cc_src, cpu_T[0]);
878 tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
879 }
880
881 /* compute all eflags to cc_src */
882 static void gen_compute_eflags(DisasContext *s)
883 {
884 if (s->cc_op == CC_OP_EFLAGS) {
885 return;
886 }
887 gen_update_cc_op(s);
888 gen_helper_cc_compute_all(cpu_tmp2_i32, cpu_env, cpu_cc_op);
889 set_cc_op(s, CC_OP_EFLAGS);
890 tcg_gen_extu_i32_tl(cpu_cc_src, cpu_tmp2_i32);
891 }
892
893 typedef struct CCPrepare {
894 TCGCond cond;
895 TCGv reg;
896 TCGv reg2;
897 target_ulong imm;
898 target_ulong mask;
899 bool use_reg2;
900 bool no_setcond;
901 } CCPrepare;
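/* CCPrepare (the point of this patch) describes a condition without
   emitting code for it: the condition holds iff 'cond' compares
   (reg & mask) against either imm or reg2 (when use_reg2 is set);
   no_setcond means reg already holds the 0/1 result.  An illustrative,
   non-compiled sketch of how the carry flag after CC_OP_EFLAGS is
   described: */
#if 0
    CCPrepare cf = {
        .cond = TCG_COND_NE,   /* "is non-zero" ... */
        .reg  = cpu_cc_src,    /* ... applied to cc_src ... */
        .mask = CC_C,          /* ... masked down to the carry bit */
    };
    /* a later consumer turns this into a setcond/brcond as needed */
#endif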
902
903 /* compute eflags.C to reg */
904 static CCPrepare gen_prepare_eflags_c(DisasContext *s, TCGv reg)
905 {
906 TCGv t0, t1;
907 int size, shift;
908
909 switch (s->cc_op) {
910 case CC_OP_SUBB ... CC_OP_SUBQ:
911 /* (DATA_TYPE)(CC_DST + CC_SRC) < (DATA_TYPE)CC_SRC */
912 size = s->cc_op - CC_OP_SUBB;
913 t1 = gen_ext_tl(cpu_tmp0, cpu_cc_src, size, false);
914 /* If no temporary was used, be careful not to alias t1 and t0. */
915 t0 = TCGV_EQUAL(t1, cpu_cc_src) ? cpu_tmp0 : reg;
916 tcg_gen_add_tl(t0, cpu_cc_dst, cpu_cc_src);
917 gen_extu(size, t0);
918 goto add_sub;
919
920 case CC_OP_ADDB ... CC_OP_ADDQ:
921 /* (DATA_TYPE)CC_DST < (DATA_TYPE)CC_SRC */
922 size = s->cc_op - CC_OP_ADDB;
923 t1 = gen_ext_tl(cpu_tmp0, cpu_cc_src, size, false);
924 t0 = gen_ext_tl(reg, cpu_cc_dst, size, false);
925 add_sub:
926 return (CCPrepare) { .cond = TCG_COND_LTU, .reg = t0,
927 .reg2 = t1, .mask = -1, .use_reg2 = true };
928
929 case CC_OP_SBBB ... CC_OP_SBBQ:
930 /* (DATA_TYPE)(CC_DST + CC_SRC + 1) <= (DATA_TYPE)CC_SRC */
931 size = s->cc_op - CC_OP_SBBB;
932 t1 = gen_ext_tl(cpu_tmp0, cpu_cc_src, size, false);
933 if (TCGV_EQUAL(t1, reg) && TCGV_EQUAL(reg, cpu_cc_src)) {
934 tcg_gen_mov_tl(cpu_tmp0, cpu_cc_src);
935 t1 = cpu_tmp0;
936 }
937
938 tcg_gen_add_tl(reg, cpu_cc_dst, cpu_cc_src);
939 tcg_gen_addi_tl(reg, reg, 1);
940 gen_extu(size, reg);
941 t0 = reg;
942 goto adc_sbb;
943
944 case CC_OP_ADCB ... CC_OP_ADCQ:
945 /* (DATA_TYPE)CC_DST <= (DATA_TYPE)CC_SRC */
946 size = s->cc_op - CC_OP_ADCB;
947 t1 = gen_ext_tl(cpu_tmp0, cpu_cc_src, size, false);
948 t0 = gen_ext_tl(reg, cpu_cc_dst, size, false);
949 adc_sbb:
950 return (CCPrepare) { .cond = TCG_COND_LEU, .reg = t0,
951 .reg2 = t1, .mask = -1, .use_reg2 = true };
952
953 case CC_OP_LOGICB ... CC_OP_LOGICQ:
954 return (CCPrepare) { .cond = TCG_COND_NEVER, .mask = -1 };
955
956 case CC_OP_INCB ... CC_OP_INCQ:
957 case CC_OP_DECB ... CC_OP_DECQ:
958 return (CCPrepare) { .cond = TCG_COND_NE, .reg = cpu_cc_src,
959 .mask = -1, .no_setcond = true };
960
961 case CC_OP_SHLB ... CC_OP_SHLQ:
962 /* (CC_SRC >> (DATA_BITS - 1)) & 1 */
963 size = s->cc_op - CC_OP_SHLB;
964 shift = (8 << size) - 1;
965 return (CCPrepare) { .cond = TCG_COND_NE, .reg = cpu_cc_src,
966 .mask = (target_ulong)1 << shift };
967
968 case CC_OP_MULB ... CC_OP_MULQ:
969 return (CCPrepare) { .cond = TCG_COND_NE,
970 .reg = cpu_cc_src, .mask = -1 };
971
972 case CC_OP_EFLAGS:
973 case CC_OP_SARB ... CC_OP_SARQ:
974 /* CC_SRC & 1 */
975 return (CCPrepare) { .cond = TCG_COND_NE,
976 .reg = cpu_cc_src, .mask = CC_C };
977
978 default:
979 /* Computing only C from CC_OP_DYNAMIC, rather than all flags, is
980 important for efficiently implementing e.g. INC at the start of a TB. */
981 gen_update_cc_op(s);
982 gen_helper_cc_compute_c(cpu_tmp2_i32, cpu_env, cpu_cc_op);
983 tcg_gen_extu_i32_tl(reg, cpu_tmp2_i32);
984 return (CCPrepare) { .cond = TCG_COND_NE, .reg = reg,
985 .mask = -1, .no_setcond = true };
986 }
987 }
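/* Worked example (sketch): after a 32-bit SUB, cc_dst = a - b and
   cc_src = b.  The SUB case above reconstructs a = cc_dst + cc_src,
   zero-extends both to 32 bits, and reports the carry/borrow as
   (uint32_t)a < (uint32_t)b -- exactly the TCG_COND_LTU CCPrepare it
   returns, with no flags-computation helper involved. */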
988
989 /* compute eflags.P to reg */
990 static CCPrepare gen_prepare_eflags_p(DisasContext *s, TCGv reg)
991 {
992 gen_compute_eflags(s);
993 return (CCPrepare) { .cond = TCG_COND_NE, .reg = cpu_cc_src,
994 .mask = CC_P };
995 }
996
997 /* compute eflags.S to reg */
998 static CCPrepare gen_prepare_eflags_s(DisasContext *s, TCGv reg)
999 {
1000 switch (s->cc_op) {
1001 case CC_OP_DYNAMIC:
1002 gen_compute_eflags(s);
1003 /* FALLTHRU */
1004 case CC_OP_EFLAGS:
1005 return (CCPrepare) { .cond = TCG_COND_NE, .reg = cpu_cc_src,
1006 .mask = CC_S };
1007 default:
1008 {
1009 int size = (s->cc_op - CC_OP_ADDB) & 3;
1010 TCGv t0 = gen_ext_tl(reg, cpu_cc_dst, size, true);
1011 return (CCPrepare) { .cond = TCG_COND_LT, .reg = t0, .mask = -1 };
1012 }
1013 }
1014 }
1015
1016 /* compute eflags.O to reg */
1017 static CCPrepare gen_prepare_eflags_o(DisasContext *s, TCGv reg)
1018 {
1019 gen_compute_eflags(s);
1020 return (CCPrepare) { .cond = TCG_COND_NE, .reg = cpu_cc_src,
1021 .mask = CC_O };
1022 }
1023
1024 /* compute eflags.Z to reg */
1025 static CCPrepare gen_prepare_eflags_z(DisasContext *s, TCGv reg)
1026 {
1027 switch (s->cc_op) {
1028 case CC_OP_DYNAMIC:
1029 gen_compute_eflags(s);
1030 /* FALLTHRU */
1031 case CC_OP_EFLAGS:
1032 return (CCPrepare) { .cond = TCG_COND_NE, .reg = cpu_cc_src,
1033 .mask = CC_Z };
1034 default:
1035 {
1036 int size = (s->cc_op - CC_OP_ADDB) & 3;
1037 TCGv t0 = gen_ext_tl(reg, cpu_cc_dst, size, false);
1038 return (CCPrepare) { .cond = TCG_COND_EQ, .reg = t0, .mask = -1 };
1039 }
1040 }
1041 }
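/* Note (added for clarity): '(s->cc_op - CC_OP_ADDB) & 3' in the S and Z
   cases relies on the CC_OP enum laying out each family as four
   consecutive entries in B, W, L, Q order, so the low two bits of the
   distance from CC_OP_ADDB recover the operand size. */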
1042
1043 #define gen_compute_eflags_c(s, reg, inv) \
1044 gen_do_setcc(reg, gen_prepare_eflags_c(s, reg), inv)
1045 #define gen_compute_eflags_p(s, reg) \
1046 gen_do_setcc(reg, gen_prepare_eflags_p(s, reg), false)
1047 #define gen_compute_eflags_s(s, reg, inv) \
1048 gen_do_setcc(reg, gen_prepare_eflags_s(s, reg), inv)
1049 #define gen_compute_eflags_o(s, reg) \
1050 gen_do_setcc(reg, gen_prepare_eflags_o(s, reg), false)
1051 #define gen_compute_eflags_z(s, reg, inv) \
1052 gen_do_setcc(reg, gen_prepare_eflags_z(s, reg), inv)
1053
1054 static void gen_do_setcc(TCGv reg, struct CCPrepare cc, bool inv)
1055 {
1056 if (inv) {
1057 cc.cond = tcg_invert_cond(cc.cond);
1058 }
1059
1060 if (cc.no_setcond) {
1061 if (cc.cond == TCG_COND_EQ) {
1062 tcg_gen_xori_tl(reg, cc.reg, 1);
1063 } else {
1064 tcg_gen_mov_tl(reg, cc.reg);
1065 }
1066 return;
1067 }
1068
1069 if (cc.cond == TCG_COND_NE && !cc.use_reg2 && cc.imm == 0 &&
1070 cc.mask != 0 && (cc.mask & (cc.mask - 1)) == 0) {
1071 tcg_gen_shri_tl(reg, cc.reg, ctztl(cc.mask));
1072 tcg_gen_andi_tl(reg, reg, 1);
1073 return;
1074 }
1075 if (cc.mask != -1) {
1076 tcg_gen_andi_tl(reg, cc.reg, cc.mask);
1077 }
1078 if (cc.use_reg2) {
1079 tcg_gen_setcond_tl(cc.cond, reg, cc.reg, cc.reg2);
1080 } else {
1081 tcg_gen_setcondi_tl(cc.cond, reg, cc.reg, cc.imm);
1082 }
1083 }
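/* Example (sketch): for the zero flag under CC_OP_EFLAGS the CCPrepare is
   { TCG_COND_NE, .reg = cpu_cc_src, .mask = CC_Z }.  CC_Z is 0x40, a
   single bit, so the fast path above emits just

       tcg_gen_shri_tl(reg, cpu_cc_src, 6);   ctztl(0x40) == 6
       tcg_gen_andi_tl(reg, reg, 1);

   instead of an and + setcond pair. */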
1084
1085 static void gen_setcc_slow(DisasContext *s, int jcc_op, TCGv reg, bool inv)
1086 {
1087 switch(jcc_op) {
1088 case JCC_O:
1089 gen_compute_eflags_o(s, reg);
1090 break;
1091 case JCC_B:
1092 gen_compute_eflags_c(s, reg, inv);
1093 inv = false;
1094 break;
1095 case JCC_Z:
1096 gen_compute_eflags_z(s, reg, inv);
1097 inv = false;
1098 break;
1099 case JCC_BE:
1100 gen_compute_eflags(s);
1101 tcg_gen_andi_tl(reg, cpu_cc_src, CC_Z | CC_C);
1102 tcg_gen_setcondi_tl(inv ? TCG_COND_EQ : TCG_COND_NE, reg, reg, 0);
1103 return;
1104 case JCC_S:
1105 gen_compute_eflags_s(s, reg, inv);
1106 inv = false;
1107 break;
1108 case JCC_P:
1109 gen_compute_eflags_p(s, reg);
1110 break;
1111 case JCC_L:
1112 gen_compute_eflags(s);
1113 tcg_gen_shri_tl(cpu_tmp0, cpu_cc_src, 11); /* CC_O */
1114 tcg_gen_shri_tl(reg, cpu_cc_src, 7); /* CC_S */
1115 tcg_gen_xor_tl(reg, reg, cpu_tmp0);
1116 tcg_gen_andi_tl(reg, reg, 1);
1117 break;
1118 default:
1119 case JCC_LE:
1120 gen_compute_eflags(s);
1121 tcg_gen_shri_tl(cpu_tmp0, cpu_cc_src, 4); /* CC_O -> CC_S */
1122 tcg_gen_xor_tl(reg, cpu_tmp0, cpu_cc_src);
1123 tcg_gen_andi_tl(reg, reg, CC_S | CC_Z);
1124 tcg_gen_setcondi_tl(inv ? TCG_COND_EQ : TCG_COND_NE, reg, reg, 0);
1125 break;
1126 }
1127 if (inv) {
1128 tcg_gen_xori_tl(reg, reg, 1);
1129 }
1130 }
1131
1132 /* perform a conditional store into register 'reg' according to jump opcode
1133 value 'b'. In the fast case, T0 is guaranteed not to be used. */
1134 static inline void gen_setcc1(DisasContext *s, int b, TCGv reg)
1135 {
1136 int inv, jcc_op, size, cond;
1137 TCGv t0;
1138
1139 inv = b & 1;
1140 jcc_op = (b >> 1) & 7;
1141
1142 switch (s->cc_op) {
1143 /* we optimize relational operators for the cmp/jcc case */
1144 case CC_OP_SUBB:
1145 case CC_OP_SUBW:
1146 case CC_OP_SUBL:
1147 case CC_OP_SUBQ:
1148 size = s->cc_op - CC_OP_SUBB;
1149 switch (jcc_op) {
1150 case JCC_BE:
1151 cond = inv ? TCG_COND_GTU : TCG_COND_LEU;
1152 tcg_gen_add_tl(cpu_tmp4, cpu_cc_dst, cpu_cc_src);
1153 gen_extu(size, cpu_tmp4);
1154 t0 = gen_ext_tl(cpu_tmp0, cpu_cc_src, size, false);
1155 tcg_gen_setcond_tl(cond, reg, cpu_tmp4, t0);
1156 break;
1157
1158 case JCC_L:
1159 cond = inv ? TCG_COND_GE : TCG_COND_LT;
1160 goto fast_jcc_l;
1161 case JCC_LE:
1162 cond = inv ? TCG_COND_GT : TCG_COND_LE;
1163 fast_jcc_l:
1164 tcg_gen_add_tl(cpu_tmp4, cpu_cc_dst, cpu_cc_src);
1165 gen_exts(size, cpu_tmp4);
1166 t0 = gen_ext_tl(cpu_tmp0, cpu_cc_src, size, true);
1167 tcg_gen_setcond_tl(cond, reg, cpu_tmp4, t0);
1168 break;
1169
1170 default:
1171 goto slow_jcc;
1172 }
1173 break;
1174
1175 default:
1176 slow_jcc:
1177 /* gen_setcc_slow actually generates good code for JC, JZ and JS */
1178 gen_setcc_slow(s, jcc_op, reg, inv);
1179 break;
1180 }
1181 }
1182
1183 /* generate a conditional jump to label 'l1' according to jump opcode
1184 value 'b'. In the fast case, T0 is guaranteed not to be used. */
1185 static inline void gen_jcc1(DisasContext *s, int b, int l1)
1186 {
1187 int inv, jcc_op, size, cond;
1188 TCGv t0;
1189
1190 inv = b & 1;
1191 jcc_op = (b >> 1) & 7;
1192
1193 switch (s->cc_op) {
1194 /* we optimize the cmp/jcc case */
1195 case CC_OP_SUBB:
1196 case CC_OP_SUBW:
1197 case CC_OP_SUBL:
1198 case CC_OP_SUBQ:
1199
1200 size = s->cc_op - CC_OP_SUBB;
1201 switch(jcc_op) {
1202 case JCC_Z:
1203 fast_jcc_z:
1204 t0 = gen_ext_tl(cpu_tmp0, cpu_cc_dst, size, false);
1205 tcg_gen_brcondi_tl(inv ? TCG_COND_NE : TCG_COND_EQ, t0, 0, l1);
1206 break;
1207 case JCC_S:
1208 fast_jcc_s:
1209 t0 = gen_ext_tl(cpu_tmp0, cpu_cc_dst, size, true);
1210 tcg_gen_brcondi_tl(inv ? TCG_COND_GE : TCG_COND_LT, t0, 0, l1);
1211 break;
1212
1213 case JCC_B:
1214 cond = inv ? TCG_COND_GEU : TCG_COND_LTU;
1215 goto fast_jcc_b;
1216 case JCC_BE:
1217 cond = inv ? TCG_COND_GTU : TCG_COND_LEU;
1218 fast_jcc_b:
1219 tcg_gen_add_tl(cpu_tmp4, cpu_cc_dst, cpu_cc_src);
1220 gen_extu(size, cpu_tmp4);
1221 t0 = gen_ext_tl(cpu_tmp0, cpu_cc_src, size, false);
1222 tcg_gen_brcond_tl(cond, cpu_tmp4, t0, l1);
1223 break;
1224
1225 case JCC_L:
1226 cond = inv ? TCG_COND_GE : TCG_COND_LT;
1227 goto fast_jcc_l;
1228 case JCC_LE:
1229 cond = inv ? TCG_COND_GT : TCG_COND_LE;
1230 fast_jcc_l:
1231 tcg_gen_add_tl(cpu_tmp4, cpu_cc_dst, cpu_cc_src);
1232 gen_exts(size, cpu_tmp4);
1233 t0 = gen_ext_tl(cpu_tmp0, cpu_cc_src, size, true);
1234 tcg_gen_brcond_tl(cond, cpu_tmp4, t0, l1);
1235 break;
1236
1237 default:
1238 goto slow_jcc;
1239 }
1240 break;
1241
1242 /* some jumps are easy to compute */
1243 case CC_OP_ADDB:
1244 case CC_OP_ADDW:
1245 case CC_OP_ADDL:
1246 case CC_OP_ADDQ:
1247
1248 case CC_OP_ADCB:
1249 case CC_OP_ADCW:
1250 case CC_OP_ADCL:
1251 case CC_OP_ADCQ:
1252
1253 case CC_OP_SBBB:
1254 case CC_OP_SBBW:
1255 case CC_OP_SBBL:
1256 case CC_OP_SBBQ:
1257
1258 case CC_OP_LOGICB:
1259 case CC_OP_LOGICW:
1260 case CC_OP_LOGICL:
1261 case CC_OP_LOGICQ:
1262
1263 case CC_OP_INCB:
1264 case CC_OP_INCW:
1265 case CC_OP_INCL:
1266 case CC_OP_INCQ:
1267
1268 case CC_OP_DECB:
1269 case CC_OP_DECW:
1270 case CC_OP_DECL:
1271 case CC_OP_DECQ:
1272
1273 case CC_OP_SHLB:
1274 case CC_OP_SHLW:
1275 case CC_OP_SHLL:
1276 case CC_OP_SHLQ:
1277
1278 case CC_OP_SARB:
1279 case CC_OP_SARW:
1280 case CC_OP_SARL:
1281 case CC_OP_SARQ:
1282 switch(jcc_op) {
1283 case JCC_Z:
1284 size = (s->cc_op - CC_OP_ADDB) & 3;
1285 goto fast_jcc_z;
1286 case JCC_S:
1287 size = (s->cc_op - CC_OP_ADDB) & 3;
1288 goto fast_jcc_s;
1289 default:
1290 goto slow_jcc;
1291 }
1292 break;
1293 default:
1294 slow_jcc:
1295 gen_setcc_slow(s, jcc_op, cpu_T[0], false);
1296 tcg_gen_brcondi_tl(inv ? TCG_COND_EQ : TCG_COND_NE,
1297 cpu_T[0], 0, l1);
1298 break;
1299 }
1300 }
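/* Example (sketch): for "cmp %ebx,%eax; jl label" the comparison leaves
   cc_op == CC_OP_SUBL with cc_dst = eax - ebx and cc_src = ebx.  The
   JCC_L fast path rebuilds eax in cpu_tmp4, sign-extends both sides and
   emits a single tcg_gen_brcond_tl(TCG_COND_LT, eax, ebx, l1); no EFLAGS
   value is ever materialized. */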
1301
1302 /* XXX: does not work with gdbstub "ice" single step - not a
1303 serious problem */
1304 static int gen_jz_ecx_string(DisasContext *s, target_ulong next_eip)
1305 {
1306 int l1, l2;
1307
1308 l1 = gen_new_label();
1309 l2 = gen_new_label();
1310 gen_op_jnz_ecx(s->aflag, l1);
1311 gen_set_label(l2);
1312 gen_jmp_tb(s, next_eip, 1);
1313 gen_set_label(l1);
1314 return l2;
1315 }
1316
1317 static inline void gen_stos(DisasContext *s, int ot)
1318 {
1319 gen_op_mov_TN_reg(OT_LONG, 0, R_EAX);
1320 gen_string_movl_A0_EDI(s);
1321 gen_op_st_T0_A0(ot + s->mem_index);
1322 gen_op_movl_T0_Dshift(ot);
1323 gen_op_add_reg_T0(s->aflag, R_EDI);
1324 }
1325
1326 static inline void gen_lods(DisasContext *s, int ot)
1327 {
1328 gen_string_movl_A0_ESI(s);
1329 gen_op_ld_T0_A0(ot + s->mem_index);
1330 gen_op_mov_reg_T0(ot, R_EAX);
1331 gen_op_movl_T0_Dshift(ot);
1332 gen_op_add_reg_T0(s->aflag, R_ESI);
1333 }
1334
1335 static inline void gen_scas(DisasContext *s, int ot)
1336 {
1337 gen_op_mov_TN_reg(OT_LONG, 0, R_EAX);
1338 gen_string_movl_A0_EDI(s);
1339 gen_op_ld_T1_A0(ot + s->mem_index);
1340 gen_op_cmpl_T0_T1_cc();
1341 gen_op_movl_T0_Dshift(ot);
1342 gen_op_add_reg_T0(s->aflag, R_EDI);
1343 set_cc_op(s, CC_OP_SUBB + ot);
1344 }
1345
1346 static inline void gen_cmps(DisasContext *s, int ot)
1347 {
1348 gen_string_movl_A0_ESI(s);
1349 gen_op_ld_T0_A0(ot + s->mem_index);
1350 gen_string_movl_A0_EDI(s);
1351 gen_op_ld_T1_A0(ot + s->mem_index);
1352 gen_op_cmpl_T0_T1_cc();
1353 gen_op_movl_T0_Dshift(ot);
1354 gen_op_add_reg_T0(s->aflag, R_ESI);
1355 gen_op_add_reg_T0(s->aflag, R_EDI);
1356 set_cc_op(s, CC_OP_SUBB + ot);
1357 }
1358
1359 static inline void gen_ins(DisasContext *s, int ot)
1360 {
1361 if (use_icount)
1362 gen_io_start();
1363 gen_string_movl_A0_EDI(s);
1364 /* Note: we must do this dummy write first to be restartable in
1365 case of a page fault. */
1366 gen_op_movl_T0_0();
1367 gen_op_st_T0_A0(ot + s->mem_index);
1368 gen_op_mov_TN_reg(OT_WORD, 1, R_EDX);
1369 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[1]);
1370 tcg_gen_andi_i32(cpu_tmp2_i32, cpu_tmp2_i32, 0xffff);
1371 gen_helper_in_func(ot, cpu_T[0], cpu_tmp2_i32);
1372 gen_op_st_T0_A0(ot + s->mem_index);
1373 gen_op_movl_T0_Dshift(ot);
1374 gen_op_add_reg_T0(s->aflag, R_EDI);
1375 if (use_icount)
1376 gen_io_end();
1377 }
1378
1379 static inline void gen_outs(DisasContext *s, int ot)
1380 {
1381 if (use_icount)
1382 gen_io_start();
1383 gen_string_movl_A0_ESI(s);
1384 gen_op_ld_T0_A0(ot + s->mem_index);
1385
1386 gen_op_mov_TN_reg(OT_WORD, 1, R_EDX);
1387 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[1]);
1388 tcg_gen_andi_i32(cpu_tmp2_i32, cpu_tmp2_i32, 0xffff);
1389 tcg_gen_trunc_tl_i32(cpu_tmp3_i32, cpu_T[0]);
1390 gen_helper_out_func(ot, cpu_tmp2_i32, cpu_tmp3_i32);
1391
1392 gen_op_movl_T0_Dshift(ot);
1393 gen_op_add_reg_T0(s->aflag, R_ESI);
1394 if (use_icount)
1395 gen_io_end();
1396 }
1397
1398 /* same method as Valgrind: we generate jumps to the current or next
1399 instruction */
1400 #define GEN_REPZ(op) \
1401 static inline void gen_repz_ ## op(DisasContext *s, int ot, \
1402 target_ulong cur_eip, target_ulong next_eip) \
1403 { \
1404 int l2;\
1405 gen_update_cc_op(s); \
1406 l2 = gen_jz_ecx_string(s, next_eip); \
1407 gen_ ## op(s, ot); \
1408 gen_op_add_reg_im(s->aflag, R_ECX, -1); \
1409 /* a loop would cause two single step exceptions if ECX == 1 \
1410 before the rep string insn */ \
1411 if (!s->jmp_opt) \
1412 gen_op_jz_ecx(s->aflag, l2); \
1413 gen_jmp(s, cur_eip); \
1414 }
1415
1416 #define GEN_REPZ2(op) \
1417 static inline void gen_repz_ ## op(DisasContext *s, int ot, \
1418 target_ulong cur_eip, \
1419 target_ulong next_eip, \
1420 int nz) \
1421 { \
1422 int l2;\
1423 gen_update_cc_op(s); \
1424 l2 = gen_jz_ecx_string(s, next_eip); \
1425 gen_ ## op(s, ot); \
1426 gen_op_add_reg_im(s->aflag, R_ECX, -1); \
1427 gen_update_cc_op(s); \
1428 gen_jcc1(s, (JCC_Z << 1) | (nz ^ 1), l2); \
1429 if (!s->jmp_opt) \
1430 gen_op_jz_ecx(s->aflag, l2); \
1431 gen_jmp(s, cur_eip); \
1432 set_cc_op(s, CC_OP_DYNAMIC); \
1433 }
1434
1435 GEN_REPZ(movs)
1436 GEN_REPZ(stos)
1437 GEN_REPZ(lods)
1438 GEN_REPZ(ins)
1439 GEN_REPZ(outs)
1440 GEN_REPZ2(scas)
1441 GEN_REPZ2(cmps)
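/* For reference (illustrative expansion, not generated code): GEN_REPZ(movs)
   above defines gen_repz_movs(), which loops by re-executing the insn:

       l2 = gen_jz_ecx_string(s, next_eip);      exit if ECX == 0
       gen_movs(s, ot);                          one string iteration
       gen_op_add_reg_im(s->aflag, R_ECX, -1);   ECX--
       ...
       gen_jmp(s, cur_eip);                      jump back to the insn

   GEN_REPZ2 additionally tests ZF via gen_jcc1() so REPZ/REPNZ CMPS and
   SCAS can stop early. */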
1442
1443 static void gen_helper_fp_arith_ST0_FT0(int op)
1444 {
1445 switch (op) {
1446 case 0:
1447 gen_helper_fadd_ST0_FT0(cpu_env);
1448 break;
1449 case 1:
1450 gen_helper_fmul_ST0_FT0(cpu_env);
1451 break;
1452 case 2:
1453 gen_helper_fcom_ST0_FT0(cpu_env);
1454 break;
1455 case 3:
1456 gen_helper_fcom_ST0_FT0(cpu_env);
1457 break;
1458 case 4:
1459 gen_helper_fsub_ST0_FT0(cpu_env);
1460 break;
1461 case 5:
1462 gen_helper_fsubr_ST0_FT0(cpu_env);
1463 break;
1464 case 6:
1465 gen_helper_fdiv_ST0_FT0(cpu_env);
1466 break;
1467 case 7:
1468 gen_helper_fdivr_ST0_FT0(cpu_env);
1469 break;
1470 }
1471 }
1472
1473 /* NOTE the exception in "r" op ordering */
1474 static void gen_helper_fp_arith_STN_ST0(int op, int opreg)
1475 {
1476 TCGv_i32 tmp = tcg_const_i32(opreg);
1477 switch (op) {
1478 case 0:
1479 gen_helper_fadd_STN_ST0(cpu_env, tmp);
1480 break;
1481 case 1:
1482 gen_helper_fmul_STN_ST0(cpu_env, tmp);
1483 break;
1484 case 4:
1485 gen_helper_fsubr_STN_ST0(cpu_env, tmp);
1486 break;
1487 case 5:
1488 gen_helper_fsub_STN_ST0(cpu_env, tmp);
1489 break;
1490 case 6:
1491 gen_helper_fdivr_STN_ST0(cpu_env, tmp);
1492 break;
1493 case 7:
1494 gen_helper_fdiv_STN_ST0(cpu_env, tmp);
1495 break;
1496 }
1497 }
1498
1499 /* if d == OR_TMP0, it means memory operand (address in A0) */
1500 static void gen_op(DisasContext *s1, int op, int ot, int d)
1501 {
1502 if (d != OR_TMP0) {
1503 gen_op_mov_TN_reg(ot, 0, d);
1504 } else {
1505 gen_op_ld_T0_A0(ot + s1->mem_index);
1506 }
1507 switch(op) {
1508 case OP_ADCL:
1509 gen_compute_eflags_c(s1, cpu_tmp4, false);
1510 tcg_gen_add_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
1511 tcg_gen_add_tl(cpu_T[0], cpu_T[0], cpu_tmp4);
1512 if (d != OR_TMP0)
1513 gen_op_mov_reg_T0(ot, d);
1514 else
1515 gen_op_st_T0_A0(ot + s1->mem_index);
1516 tcg_gen_mov_tl(cpu_cc_src, cpu_T[1]);
1517 tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
1518 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_tmp4);
1519 tcg_gen_shli_i32(cpu_tmp2_i32, cpu_tmp2_i32, 2);
1520 tcg_gen_addi_i32(cpu_cc_op, cpu_tmp2_i32, CC_OP_ADDB + ot);
1521 set_cc_op(s1, CC_OP_DYNAMIC);
1522 break;
1523 case OP_SBBL:
1524 gen_compute_eflags_c(s1, cpu_tmp4, false);
1525 tcg_gen_sub_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
1526 tcg_gen_sub_tl(cpu_T[0], cpu_T[0], cpu_tmp4);
1527 if (d != OR_TMP0)
1528 gen_op_mov_reg_T0(ot, d);
1529 else
1530 gen_op_st_T0_A0(ot + s1->mem_index);
1531 tcg_gen_mov_tl(cpu_cc_src, cpu_T[1]);
1532 tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
1533 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_tmp4);
1534 tcg_gen_shli_i32(cpu_tmp2_i32, cpu_tmp2_i32, 2);
1535 tcg_gen_addi_i32(cpu_cc_op, cpu_tmp2_i32, CC_OP_SUBB + ot);
1536 set_cc_op(s1, CC_OP_DYNAMIC);
1537 break;
1538 case OP_ADDL:
1539 gen_op_addl_T0_T1();
1540 if (d != OR_TMP0)
1541 gen_op_mov_reg_T0(ot, d);
1542 else
1543 gen_op_st_T0_A0(ot + s1->mem_index);
1544 gen_op_update2_cc();
1545 set_cc_op(s1, CC_OP_ADDB + ot);
1546 break;
1547 case OP_SUBL:
1548 tcg_gen_sub_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
1549 if (d != OR_TMP0)
1550 gen_op_mov_reg_T0(ot, d);
1551 else
1552 gen_op_st_T0_A0(ot + s1->mem_index);
1553 gen_op_update2_cc();
1554 set_cc_op(s1, CC_OP_SUBB + ot);
1555 break;
1556 default:
1557 case OP_ANDL:
1558 tcg_gen_and_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
1559 if (d != OR_TMP0)
1560 gen_op_mov_reg_T0(ot, d);
1561 else
1562 gen_op_st_T0_A0(ot + s1->mem_index);
1563 gen_op_update1_cc();
1564 set_cc_op(s1, CC_OP_LOGICB + ot);
1565 break;
1566 case OP_ORL:
1567 tcg_gen_or_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
1568 if (d != OR_TMP0)
1569 gen_op_mov_reg_T0(ot, d);
1570 else
1571 gen_op_st_T0_A0(ot + s1->mem_index);
1572 gen_op_update1_cc();
1573 set_cc_op(s1, CC_OP_LOGICB + ot);
1574 break;
1575 case OP_XORL:
1576 tcg_gen_xor_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
1577 if (d != OR_TMP0)
1578 gen_op_mov_reg_T0(ot, d);
1579 else
1580 gen_op_st_T0_A0(ot + s1->mem_index);
1581 gen_op_update1_cc();
1582 set_cc_op(s1, CC_OP_LOGICB + ot);
1583 break;
1584 case OP_CMPL:
1585 gen_op_cmpl_T0_T1_cc();
1586 set_cc_op(s1, CC_OP_SUBB + ot);
1587 break;
1588 }
1589 }
1590
1591 /* if d == OR_TMP0, it means memory operand (address in A0) */
1592 static void gen_inc(DisasContext *s1, int ot, int d, int c)
1593 {
1594 if (d != OR_TMP0)
1595 gen_op_mov_TN_reg(ot, 0, d);
1596 else
1597 gen_op_ld_T0_A0(ot + s1->mem_index);
1598 gen_compute_eflags_c(s1, cpu_cc_src, false);
1599 if (c > 0) {
1600 tcg_gen_addi_tl(cpu_T[0], cpu_T[0], 1);
1601 set_cc_op(s1, CC_OP_INCB + ot);
1602 } else {
1603 tcg_gen_addi_tl(cpu_T[0], cpu_T[0], -1);
1604 set_cc_op(s1, CC_OP_DECB + ot);
1605 }
1606 if (d != OR_TMP0)
1607 gen_op_mov_reg_T0(ot, d);
1608 else
1609 gen_op_st_T0_A0(ot + s1->mem_index);
1610 tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
1611 }
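/* Note (added for clarity): INC and DEC leave CF untouched, which is why
   the carry of the previous operation is materialized into cpu_cc_src
   before switching to CC_OP_INCx/CC_OP_DECx; those cc_ops read the saved
   carry back out of cc_src when flags are later needed. */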
1612
1613 static void gen_shift_rm_T1(DisasContext *s, int ot, int op1,
1614 int is_right, int is_arith)
1615 {
1616 target_ulong mask;
1617 int shift_label;
1618 TCGv t0, t1, t2;
1619
1620 if (ot == OT_QUAD) {
1621 mask = 0x3f;
1622 } else {
1623 mask = 0x1f;
1624 }
1625
1626 /* load */
1627 if (op1 == OR_TMP0) {
1628 gen_op_ld_T0_A0(ot + s->mem_index);
1629 } else {
1630 gen_op_mov_TN_reg(ot, 0, op1);
1631 }
1632
1633 t0 = tcg_temp_local_new();
1634 t1 = tcg_temp_local_new();
1635 t2 = tcg_temp_local_new();
1636
1637 tcg_gen_andi_tl(t2, cpu_T[1], mask);
1638
1639 if (is_right) {
1640 if (is_arith) {
1641 gen_exts(ot, cpu_T[0]);
1642 tcg_gen_mov_tl(t0, cpu_T[0]);
1643 tcg_gen_sar_tl(cpu_T[0], cpu_T[0], t2);
1644 } else {
1645 gen_extu(ot, cpu_T[0]);
1646 tcg_gen_mov_tl(t0, cpu_T[0]);
1647 tcg_gen_shr_tl(cpu_T[0], cpu_T[0], t2);
1648 }
1649 } else {
1650 tcg_gen_mov_tl(t0, cpu_T[0]);
1651 tcg_gen_shl_tl(cpu_T[0], cpu_T[0], t2);
1652 }
1653
1654 /* store */
1655 if (op1 == OR_TMP0) {
1656 gen_op_st_T0_A0(ot + s->mem_index);
1657 } else {
1658 gen_op_mov_reg_T0(ot, op1);
1659 }
1660
1661 /* update eflags */
1662 gen_update_cc_op(s);
1663
1664 tcg_gen_mov_tl(t1, cpu_T[0]);
1665
1666 shift_label = gen_new_label();
1667 tcg_gen_brcondi_tl(TCG_COND_EQ, t2, 0, shift_label);
1668
1669 tcg_gen_addi_tl(t2, t2, -1);
1670 tcg_gen_mov_tl(cpu_cc_dst, t1);
1671
1672 if (is_right) {
1673 if (is_arith) {
1674 tcg_gen_sar_tl(cpu_cc_src, t0, t2);
1675 } else {
1676 tcg_gen_shr_tl(cpu_cc_src, t0, t2);
1677 }
1678 } else {
1679 tcg_gen_shl_tl(cpu_cc_src, t0, t2);
1680 }
1681
1682 if (is_right) {
1683 tcg_gen_movi_i32(cpu_cc_op, CC_OP_SARB + ot);
1684 } else {
1685 tcg_gen_movi_i32(cpu_cc_op, CC_OP_SHLB + ot);
1686 }
1687
1688 gen_set_label(shift_label);
1689 set_cc_op(s, CC_OP_DYNAMIC); /* cannot predict flags after */
1690
1691 tcg_temp_free(t0);
1692 tcg_temp_free(t1);
1693 tcg_temp_free(t2);
1694 }
1695
1696 static void gen_shift_rm_im(DisasContext *s, int ot, int op1, int op2,
1697 int is_right, int is_arith)
1698 {
1699 int mask;
1700
1701 if (ot == OT_QUAD)
1702 mask = 0x3f;
1703 else
1704 mask = 0x1f;
1705
1706 /* load */
1707 if (op1 == OR_TMP0)
1708 gen_op_ld_T0_A0(ot + s->mem_index);
1709 else
1710 gen_op_mov_TN_reg(ot, 0, op1);
1711
1712 op2 &= mask;
1713 if (op2 != 0) {
1714 if (is_right) {
1715 if (is_arith) {
1716 gen_exts(ot, cpu_T[0]);
1717 tcg_gen_sari_tl(cpu_tmp4, cpu_T[0], op2 - 1);
1718 tcg_gen_sari_tl(cpu_T[0], cpu_T[0], op2);
1719 } else {
1720 gen_extu(ot, cpu_T[0]);
1721 tcg_gen_shri_tl(cpu_tmp4, cpu_T[0], op2 - 1);
1722 tcg_gen_shri_tl(cpu_T[0], cpu_T[0], op2);
1723 }
1724 } else {
1725 tcg_gen_shli_tl(cpu_tmp4, cpu_T[0], op2 - 1);
1726 tcg_gen_shli_tl(cpu_T[0], cpu_T[0], op2);
1727 }
1728 }
1729
1730 /* store */
1731 if (op1 == OR_TMP0)
1732 gen_op_st_T0_A0(ot + s->mem_index);
1733 else
1734 gen_op_mov_reg_T0(ot, op1);
1735
1736 /* update eflags if the shift count is non-zero */
1737 if (op2 != 0) {
1738 tcg_gen_mov_tl(cpu_cc_src, cpu_tmp4);
1739 tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
1740 set_cc_op(s, (is_right ? CC_OP_SARB : CC_OP_SHLB) + ot);
1741 }
1742 }
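/* Example (sketch): for "shr $3, %eax" the code above also computes the
   value shifted by op2-1 == 2 into cpu_tmp4; its low bit is the last bit
   shifted out, i.e. the resulting CF, which CC_OP_SARB+ot later extracts
   from cc_src. */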
1743
1744 static inline void tcg_gen_lshift(TCGv ret, TCGv arg1, target_long arg2)
1745 {
1746 if (arg2 >= 0)
1747 tcg_gen_shli_tl(ret, arg1, arg2);
1748 else
1749 tcg_gen_shri_tl(ret, arg1, -arg2);
1750 }
1751
1752 static void gen_rot_rm_T1(DisasContext *s, int ot, int op1,
1753 int is_right)
1754 {
1755 target_ulong mask;
1756 int label1, label2, data_bits;
1757 TCGv t0, t1, t2, a0;
1758
1759 /* XXX: inefficient, but we must use local temps */
1760 t0 = tcg_temp_local_new();
1761 t1 = tcg_temp_local_new();
1762 t2 = tcg_temp_local_new();
1763 a0 = tcg_temp_local_new();
1764
1765 if (ot == OT_QUAD)
1766 mask = 0x3f;
1767 else
1768 mask = 0x1f;
1769
1770 /* load */
1771 if (op1 == OR_TMP0) {
1772 tcg_gen_mov_tl(a0, cpu_A0);
1773 gen_op_ld_v(ot + s->mem_index, t0, a0);
1774 } else {
1775 gen_op_mov_v_reg(ot, t0, op1);
1776 }
1777
1778 tcg_gen_mov_tl(t1, cpu_T[1]);
1779
1780 tcg_gen_andi_tl(t1, t1, mask);
1781
1782 /* Must test zero case to avoid using undefined behaviour in TCG
1783 shifts. */
1784 label1 = gen_new_label();
1785 tcg_gen_brcondi_tl(TCG_COND_EQ, t1, 0, label1);
1786
1787 if (ot <= OT_WORD)
1788 tcg_gen_andi_tl(cpu_tmp0, t1, (1 << (3 + ot)) - 1);
1789 else
1790 tcg_gen_mov_tl(cpu_tmp0, t1);
1791
1792 gen_extu(ot, t0);
1793 tcg_gen_mov_tl(t2, t0);
1794
1795 data_bits = 8 << ot;
1796 /* XXX: rely on behaviour of shifts when operand 2 overflows (XXX:
1797 fix TCG definition) */
1798 if (is_right) {
1799 tcg_gen_shr_tl(cpu_tmp4, t0, cpu_tmp0);
1800 tcg_gen_subfi_tl(cpu_tmp0, data_bits, cpu_tmp0);
1801 tcg_gen_shl_tl(t0, t0, cpu_tmp0);
1802 } else {
1803 tcg_gen_shl_tl(cpu_tmp4, t0, cpu_tmp0);
1804 tcg_gen_subfi_tl(cpu_tmp0, data_bits, cpu_tmp0);
1805 tcg_gen_shr_tl(t0, t0, cpu_tmp0);
1806 }
1807 tcg_gen_or_tl(t0, t0, cpu_tmp4);
1808
1809 gen_set_label(label1);
1810 /* store */
1811 if (op1 == OR_TMP0) {
1812 gen_op_st_v(ot + s->mem_index, t0, a0);
1813 } else {
1814 gen_op_mov_reg_v(ot, op1, t0);
1815 }
1816
1817 /* update eflags. It is needed most of the time anyway, so do it unconditionally. */
1818 gen_compute_eflags(s);
1819 assert(s->cc_op == CC_OP_EFLAGS);
1820
1821 label2 = gen_new_label();
1822 tcg_gen_brcondi_tl(TCG_COND_EQ, t1, 0, label2);
1823
1824 tcg_gen_andi_tl(cpu_cc_src, cpu_cc_src, ~(CC_O | CC_C));
1825 tcg_gen_xor_tl(cpu_tmp0, t2, t0);
1826 tcg_gen_lshift(cpu_tmp0, cpu_tmp0, 11 - (data_bits - 1));
1827 tcg_gen_andi_tl(cpu_tmp0, cpu_tmp0, CC_O);
1828 tcg_gen_or_tl(cpu_cc_src, cpu_cc_src, cpu_tmp0);
1829 if (is_right) {
1830 tcg_gen_shri_tl(t0, t0, data_bits - 1);
1831 }
1832 tcg_gen_andi_tl(t0, t0, CC_C);
1833 tcg_gen_or_tl(cpu_cc_src, cpu_cc_src, t0);
1834
1835 gen_set_label(label2);
1836
1837 tcg_temp_free(t0);
1838 tcg_temp_free(t1);
1839 tcg_temp_free(t2);
1840 tcg_temp_free(a0);
1841 }
1842
1843 static void gen_rot_rm_im(DisasContext *s, int ot, int op1, int op2,
1844 int is_right)
1845 {
1846 int mask;
1847 int data_bits;
1848 TCGv t0, t1, a0;
1849
1850 /* XXX: inefficient, but we must use local temps */
1851 t0 = tcg_temp_local_new();
1852 t1 = tcg_temp_local_new();
1853 a0 = tcg_temp_local_new();
1854
1855 if (ot == OT_QUAD)
1856 mask = 0x3f;
1857 else
1858 mask = 0x1f;
1859
1860 /* load */
1861 if (op1 == OR_TMP0) {
1862 tcg_gen_mov_tl(a0, cpu_A0);
1863 gen_op_ld_v(ot + s->mem_index, t0, a0);
1864 } else {
1865 gen_op_mov_v_reg(ot, t0, op1);
1866 }
1867
1868 gen_extu(ot, t0);
1869 tcg_gen_mov_tl(t1, t0);
1870
1871 op2 &= mask;
1872 data_bits = 8 << ot;
1873 if (op2 != 0) {
1874 int shift = op2 & ((1 << (3 + ot)) - 1);
1875 if (is_right) {
1876 tcg_gen_shri_tl(cpu_tmp4, t0, shift);
1877 tcg_gen_shli_tl(t0, t0, data_bits - shift);
1878 }
1879 else {
1880 tcg_gen_shli_tl(cpu_tmp4, t0, shift);
1881 tcg_gen_shri_tl(t0, t0, data_bits - shift);
1882 }
1883 tcg_gen_or_tl(t0, t0, cpu_tmp4);
1884 }
1885
1886 /* store */
1887 if (op1 == OR_TMP0) {
1888 gen_op_st_v(ot + s->mem_index, t0, a0);
1889 } else {
1890 gen_op_mov_reg_v(ot, op1, t0);
1891 }
1892
1893 if (op2 != 0) {
1894 /* update eflags */
1895 gen_compute_eflags(s);
1896 assert(s->cc_op == CC_OP_EFLAGS);
1897
1898 tcg_gen_andi_tl(cpu_cc_src, cpu_cc_src, ~(CC_O | CC_C));
1899 tcg_gen_xor_tl(cpu_tmp0, t1, t0);
1900 tcg_gen_lshift(cpu_tmp0, cpu_tmp0, 11 - (data_bits - 1));
1901 tcg_gen_andi_tl(cpu_tmp0, cpu_tmp0, CC_O);
1902 tcg_gen_or_tl(cpu_cc_src, cpu_cc_src, cpu_tmp0);
1903 if (is_right) {
1904 tcg_gen_shri_tl(t0, t0, data_bits - 1);
1905 }
1906 tcg_gen_andi_tl(t0, t0, CC_C);
1907 tcg_gen_or_tl(cpu_cc_src, cpu_cc_src, t0);
1908 }
1909
1910 tcg_temp_free(t0);
1911 tcg_temp_free(t1);
1912 tcg_temp_free(a0);
1913 }
1914
1915 /* XXX: add faster immediate = 1 case */
1916 static void gen_rotc_rm_T1(DisasContext *s, int ot, int op1,
1917 int is_right)
1918 {
1919 gen_compute_eflags(s);
1920 assert(s->cc_op == CC_OP_EFLAGS);
1921
1922 /* load */
1923 if (op1 == OR_TMP0)
1924 gen_op_ld_T0_A0(ot + s->mem_index);
1925 else
1926 gen_op_mov_TN_reg(ot, 0, op1);
1927
1928 if (is_right) {
1929 switch (ot) {
1930 case OT_BYTE:
1931 gen_helper_rcrb(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]);
1932 break;
1933 case OT_WORD:
1934 gen_helper_rcrw(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]);
1935 break;
1936 case OT_LONG:
1937 gen_helper_rcrl(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]);
1938 break;
1939 #ifdef TARGET_X86_64
1940 case OT_QUAD:
1941 gen_helper_rcrq(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]);
1942 break;
1943 #endif
1944 }
1945 } else {
1946 switch (ot) {
1947 case OT_BYTE:
1948 gen_helper_rclb(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]);
1949 break;
1950 case OT_WORD:
1951 gen_helper_rclw(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]);
1952 break;
1953 case OT_LONG:
1954 gen_helper_rcll(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]);
1955 break;
1956 #ifdef TARGET_X86_64
1957 case OT_QUAD:
1958 gen_helper_rclq(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]);
1959 break;
1960 #endif
1961 }
1962 }
1963 /* store */
1964 if (op1 == OR_TMP0)
1965 gen_op_st_T0_A0(ot + s->mem_index);
1966 else
1967 gen_op_mov_reg_T0(ot, op1);
1968 }
1969
1970 /* XXX: add faster immediate case */
1971 static void gen_shiftd_rm_T1_T3(DisasContext *s, int ot, int op1,
1972 int is_right)
1973 {
1974 int label1, label2, data_bits;
1975 target_ulong mask;
1976 TCGv t0, t1, t2, a0;
1977
1978 t0 = tcg_temp_local_new();
1979 t1 = tcg_temp_local_new();
1980 t2 = tcg_temp_local_new();
1981 a0 = tcg_temp_local_new();
1982
1983 if (ot == OT_QUAD)
1984 mask = 0x3f;
1985 else
1986 mask = 0x1f;
1987
1988 /* load */
1989 if (op1 == OR_TMP0) {
1990 tcg_gen_mov_tl(a0, cpu_A0);
1991 gen_op_ld_v(ot + s->mem_index, t0, a0);
1992 } else {
1993 gen_op_mov_v_reg(ot, t0, op1);
1994 }
1995
1996 tcg_gen_andi_tl(cpu_T3, cpu_T3, mask);
1997
1998 tcg_gen_mov_tl(t1, cpu_T[1]);
1999 tcg_gen_mov_tl(t2, cpu_T3);
2000
2001 /* Must test zero case to avoid using undefined behaviour in TCG
2002 shifts. */
2003 label1 = gen_new_label();
2004 tcg_gen_brcondi_tl(TCG_COND_EQ, t2, 0, label1);
2005
2006 tcg_gen_addi_tl(cpu_tmp5, t2, -1);
2007 if (ot == OT_WORD) {
2008 /* Note: we implement the Intel behaviour for shift count > 16 */
2009 if (is_right) {
2010 tcg_gen_andi_tl(t0, t0, 0xffff);
2011 tcg_gen_shli_tl(cpu_tmp0, t1, 16);
2012 tcg_gen_or_tl(t0, t0, cpu_tmp0);
2013 tcg_gen_ext32u_tl(t0, t0);
2014
2015 tcg_gen_shr_tl(cpu_tmp4, t0, cpu_tmp5);
2016
2017 /* only needed if count > 16, but a test would complicate the code */
2018 tcg_gen_subfi_tl(cpu_tmp5, 32, t2);
2019 tcg_gen_shl_tl(cpu_tmp0, t0, cpu_tmp5);
2020
2021 tcg_gen_shr_tl(t0, t0, t2);
2022
2023 tcg_gen_or_tl(t0, t0, cpu_tmp0);
2024 } else {
2025 /* XXX: not optimal */
2026 tcg_gen_andi_tl(t0, t0, 0xffff);
2027 tcg_gen_shli_tl(t1, t1, 16);
2028 tcg_gen_or_tl(t1, t1, t0);
2029 tcg_gen_ext32u_tl(t1, t1);
2030
2031 tcg_gen_shl_tl(cpu_tmp4, t0, cpu_tmp5);
2032 tcg_gen_subfi_tl(cpu_tmp0, 32, cpu_tmp5);
2033 tcg_gen_shr_tl(cpu_tmp5, t1, cpu_tmp0);
2034 tcg_gen_or_tl(cpu_tmp4, cpu_tmp4, cpu_tmp5);
2035
2036 tcg_gen_shl_tl(t0, t0, t2);
2037 tcg_gen_subfi_tl(cpu_tmp5, 32, t2);
2038 tcg_gen_shr_tl(t1, t1, cpu_tmp5);
2039 tcg_gen_or_tl(t0, t0, t1);
2040 }
2041 } else {
2042 data_bits = 8 << ot;
2043 if (is_right) {
2044 if (ot == OT_LONG)
2045 tcg_gen_ext32u_tl(t0, t0);
2046
2047 tcg_gen_shr_tl(cpu_tmp4, t0, cpu_tmp5);
2048
2049 tcg_gen_shr_tl(t0, t0, t2);
2050 tcg_gen_subfi_tl(cpu_tmp5, data_bits, t2);
2051 tcg_gen_shl_tl(t1, t1, cpu_tmp5);
2052 tcg_gen_or_tl(t0, t0, t1);
2053
2054 } else {
2055 if (ot == OT_LONG)
2056 tcg_gen_ext32u_tl(t1, t1);
2057
2058 tcg_gen_shl_tl(cpu_tmp4, t0, cpu_tmp5);
2059
2060 tcg_gen_shl_tl(t0, t0, t2);
2061 tcg_gen_subfi_tl(cpu_tmp5, data_bits, t2);
2062 tcg_gen_shr_tl(t1, t1, cpu_tmp5);
2063 tcg_gen_or_tl(t0, t0, t1);
2064 }
2065 }
2066 tcg_gen_mov_tl(t1, cpu_tmp4);
2067
2068 gen_set_label(label1);
2069 /* store */
2070 if (op1 == OR_TMP0) {
2071 gen_op_st_v(ot + s->mem_index, t0, a0);
2072 } else {
2073 gen_op_mov_reg_v(ot, op1, t0);
2074 }
2075
2076 /* update eflags */
2077 gen_update_cc_op(s);
2078
2079 label2 = gen_new_label();
2080 tcg_gen_brcondi_tl(TCG_COND_EQ, t2, 0, label2);
2081
2082 tcg_gen_mov_tl(cpu_cc_src, t1);
2083 tcg_gen_mov_tl(cpu_cc_dst, t0);
2084 if (is_right) {
2085 tcg_gen_movi_i32(cpu_cc_op, CC_OP_SARB + ot);
2086 } else {
2087 tcg_gen_movi_i32(cpu_cc_op, CC_OP_SHLB + ot);
2088 }
2089 gen_set_label(label2);
2090 set_cc_op(s, CC_OP_DYNAMIC); /* cannot predict flags after */
2091
2092 tcg_temp_free(t0);
2093 tcg_temp_free(t1);
2094 tcg_temp_free(t2);
2095 tcg_temp_free(a0);
2096 }
2097
2098 static void gen_shift(DisasContext *s1, int op, int ot, int d, int s)
2099 {
2100 if (s != OR_TMP1)
2101 gen_op_mov_TN_reg(ot, 1, s);
2102 switch(op) {
2103 case OP_ROL:
2104 gen_rot_rm_T1(s1, ot, d, 0);
2105 break;
2106 case OP_ROR:
2107 gen_rot_rm_T1(s1, ot, d, 1);
2108 break;
2109 case OP_SHL:
2110 case OP_SHL1:
2111 gen_shift_rm_T1(s1, ot, d, 0, 0);
2112 break;
2113 case OP_SHR:
2114 gen_shift_rm_T1(s1, ot, d, 1, 0);
2115 break;
2116 case OP_SAR:
2117 gen_shift_rm_T1(s1, ot, d, 1, 1);
2118 break;
2119 case OP_RCL:
2120 gen_rotc_rm_T1(s1, ot, d, 0);
2121 break;
2122 case OP_RCR:
2123 gen_rotc_rm_T1(s1, ot, d, 1);
2124 break;
2125 }
2126 }
2127
2128 static void gen_shifti(DisasContext *s1, int op, int ot, int d, int c)
2129 {
2130 switch(op) {
2131 case OP_ROL:
2132 gen_rot_rm_im(s1, ot, d, c, 0);
2133 break;
2134 case OP_ROR:
2135 gen_rot_rm_im(s1, ot, d, c, 1);
2136 break;
2137 case OP_SHL:
2138 case OP_SHL1:
2139 gen_shift_rm_im(s1, ot, d, c, 0, 0);
2140 break;
2141 case OP_SHR:
2142 gen_shift_rm_im(s1, ot, d, c, 1, 0);
2143 break;
2144 case OP_SAR:
2145 gen_shift_rm_im(s1, ot, d, c, 1, 1);
2146 break;
2147 default:
2148 /* currently not optimized */
2149 gen_op_movl_T1_im(c);
2150 gen_shift(s1, op, ot, d, OR_TMP1);
2151 break;
2152 }
2153 }
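
/* Illustrative note: for the shift/rotate groups (opcodes 0xc0-0xc1,
   0xd0-0xd3), the 'op' passed to gen_shift()/gen_shifti() is the reg
   field of the ModRM byte, i.e. roughly

       op = (modrm >> 3) & 7;        selecting OP_ROL ... OP_SAR

   with the count coming from an imm8, from CL, or the constant 1.
   This is a sketch of the callers' contract, not a copy of the
   decoder. */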
2154
2155 static void gen_lea_modrm(CPUX86State *env, DisasContext *s, int modrm,
2156 int *reg_ptr, int *offset_ptr)
2157 {
2158 target_long disp;
2159 int havesib;
2160 int base;
2161 int index;
2162 int scale;
2163 int opreg;
2164 int mod, rm, code, override, must_add_seg;
2165
2166 override = s->override;
2167 must_add_seg = s->addseg;
2168 if (override >= 0)
2169 must_add_seg = 1;
2170 mod = (modrm >> 6) & 3;
2171 rm = modrm & 7;
2172
2173 if (s->aflag) {
2174
2175 havesib = 0;
2176 base = rm;
2177 index = 0;
2178 scale = 0;
2179
2180 if (base == 4) {
2181 havesib = 1;
2182 code = cpu_ldub_code(env, s->pc++);
2183 scale = (code >> 6) & 3;
2184 index = ((code >> 3) & 7) | REX_X(s);
2185 base = (code & 7);
2186 }
2187 base |= REX_B(s);
2188
2189 switch (mod) {
2190 case 0:
2191 if ((base & 7) == 5) {
2192 base = -1;
2193 disp = (int32_t)cpu_ldl_code(env, s->pc);
2194 s->pc += 4;
2195 if (CODE64(s) && !havesib) {
2196 disp += s->pc + s->rip_offset;
2197 }
2198 } else {
2199 disp = 0;
2200 }
2201 break;
2202 case 1:
2203 disp = (int8_t)cpu_ldub_code(env, s->pc++);
2204 break;
2205 default:
2206 case 2:
2207 disp = (int32_t)cpu_ldl_code(env, s->pc);
2208 s->pc += 4;
2209 break;
2210 }
2211
2212 if (base >= 0) {
2213 /* for correct popl handling with esp */
2214 if (base == 4 && s->popl_esp_hack)
2215 disp += s->popl_esp_hack;
2216 #ifdef TARGET_X86_64
2217 if (s->aflag == 2) {
2218 gen_op_movq_A0_reg(base);
2219 if (disp != 0) {
2220 gen_op_addq_A0_im(disp);
2221 }
2222 } else
2223 #endif
2224 {
2225 gen_op_movl_A0_reg(base);
2226 if (disp != 0)
2227 gen_op_addl_A0_im(disp);
2228 }
2229 } else {
2230 #ifdef TARGET_X86_64
2231 if (s->aflag == 2) {
2232 gen_op_movq_A0_im(disp);
2233 } else
2234 #endif
2235 {
2236 gen_op_movl_A0_im(disp);
2237 }
2238 }
2239 /* index == 4 means no index */
2240 if (havesib && (index != 4)) {
2241 #ifdef TARGET_X86_64
2242 if (s->aflag == 2) {
2243 gen_op_addq_A0_reg_sN(scale, index);
2244 } else
2245 #endif
2246 {
2247 gen_op_addl_A0_reg_sN(scale, index);
2248 }
2249 }
2250 if (must_add_seg) {
2251 if (override < 0) {
2252 if (base == R_EBP || base == R_ESP)
2253 override = R_SS;
2254 else
2255 override = R_DS;
2256 }
2257 #ifdef TARGET_X86_64
2258 if (s->aflag == 2) {
2259 gen_op_addq_A0_seg(override);
2260 } else
2261 #endif
2262 {
2263 gen_op_addl_A0_seg(s, override);
2264 }
2265 }
2266 } else {
2267 switch (mod) {
2268 case 0:
2269 if (rm == 6) {
2270 disp = cpu_lduw_code(env, s->pc);
2271 s->pc += 2;
2272 gen_op_movl_A0_im(disp);
2273 rm = 0; /* avoid SS override */
2274 goto no_rm;
2275 } else {
2276 disp = 0;
2277 }
2278 break;
2279 case 1:
2280 disp = (int8_t)cpu_ldub_code(env, s->pc++);
2281 break;
2282 default:
2283 case 2:
2284 disp = cpu_lduw_code(env, s->pc);
2285 s->pc += 2;
2286 break;
2287 }
2288 switch(rm) {
2289 case 0:
2290 gen_op_movl_A0_reg(R_EBX);
2291 gen_op_addl_A0_reg_sN(0, R_ESI);
2292 break;
2293 case 1:
2294 gen_op_movl_A0_reg(R_EBX);
2295 gen_op_addl_A0_reg_sN(0, R_EDI);
2296 break;
2297 case 2:
2298 gen_op_movl_A0_reg(R_EBP);
2299 gen_op_addl_A0_reg_sN(0, R_ESI);
2300 break;
2301 case 3:
2302 gen_op_movl_A0_reg(R_EBP);
2303 gen_op_addl_A0_reg_sN(0, R_EDI);
2304 break;
2305 case 4:
2306 gen_op_movl_A0_reg(R_ESI);
2307 break;
2308 case 5:
2309 gen_op_movl_A0_reg(R_EDI);
2310 break;
2311 case 6:
2312 gen_op_movl_A0_reg(R_EBP);
2313 break;
2314 default:
2315 case 7:
2316 gen_op_movl_A0_reg(R_EBX);
2317 break;
2318 }
2319 if (disp != 0)
2320 gen_op_addl_A0_im(disp);
2321 gen_op_andl_A0_ffff();
2322 no_rm:
2323 if (must_add_seg) {
2324 if (override < 0) {
2325 if (rm == 2 || rm == 3 || rm == 6)
2326 override = R_SS;
2327 else
2328 override = R_DS;
2329 }
2330 gen_op_addl_A0_seg(s, override);
2331 }
2332 }
2333
2334 opreg = OR_A0;
2335 disp = 0;
2336 *reg_ptr = opreg;
2337 *offset_ptr = disp;
2338 }
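
/* Reference for the decoding above (x86 encoding, not QEMU-specific):

       modrm:  mod = bits 7..6,  reg = bits 5..3,  rm = bits 2..0
       sib:    scale = bits 7..6,  index = bits 5..3,  base = bits 2..0

   The 32/64-bit effective address is base + (index << scale) + disp,
   with the special cases handled above: rm == 4 selects a SIB byte,
   and mod == 0 with base == 5 selects disp32 alone (RIP-relative when
   CODE64(s) and no SIB byte is present). */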
2339
2340 static void gen_nop_modrm(CPUX86State *env, DisasContext *s, int modrm)
2341 {
2342 int mod, rm, base, code;
2343
2344 mod = (modrm >> 6) & 3;
2345 if (mod == 3)
2346 return;
2347 rm = modrm & 7;
2348
2349 if (s->aflag) {
2350
2351 base = rm;
2352
2353 if (base == 4) {
2354 code = cpu_ldub_code(env, s->pc++);
2355 base = (code & 7);
2356 }
2357
2358 switch (mod) {
2359 case 0:
2360 if (base == 5) {
2361 s->pc += 4;
2362 }
2363 break;
2364 case 1:
2365 s->pc++;
2366 break;
2367 default:
2368 case 2:
2369 s->pc += 4;
2370 break;
2371 }
2372 } else {
2373 switch (mod) {
2374 case 0:
2375 if (rm == 6) {
2376 s->pc += 2;
2377 }
2378 break;
2379 case 1:
2380 s->pc++;
2381 break;
2382 default:
2383 case 2:
2384 s->pc += 2;
2385 break;
2386 }
2387 }
2388 }
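
/* Note: gen_nop_modrm() generates no code at all; it only advances
   s->pc past the ModRM/SIB/displacement bytes so that multi-byte NOP
   and prefetch forms are skipped correctly. */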
2389
2390 /* used for LEA and MOV AX, mem */
2391 static void gen_add_A0_ds_seg(DisasContext *s)
2392 {
2393 int override, must_add_seg;
2394 must_add_seg = s->addseg;
2395 override = R_DS;
2396 if (s->override >= 0) {
2397 override = s->override;
2398 must_add_seg = 1;
2399 }
2400 if (must_add_seg) {
2401 #ifdef TARGET_X86_64
2402 if (CODE64(s)) {
2403 gen_op_addq_A0_seg(override);
2404 } else
2405 #endif
2406 {
2407 gen_op_addl_A0_seg(s, override);
2408 }
2409 }
2410 }
2411
2412 /* generate modrm memory load or store of 'reg'. TMP0 is used if reg ==
2413 OR_TMP0 */
2414 static void gen_ldst_modrm(CPUX86State *env, DisasContext *s, int modrm,
2415 int ot, int reg, int is_store)
2416 {
2417 int mod, rm, opreg, disp;
2418
2419 mod = (modrm >> 6) & 3;
2420 rm = (modrm & 7) | REX_B(s);
2421 if (mod == 3) {
2422 if (is_store) {
2423 if (reg != OR_TMP0)
2424 gen_op_mov_TN_reg(ot, 0, reg);
2425 gen_op_mov_reg_T0(ot, rm);
2426 } else {
2427 gen_op_mov_TN_reg(ot, 0, rm);
2428 if (reg != OR_TMP0)
2429 gen_op_mov_reg_T0(ot, reg);
2430 }
2431 } else {
2432 gen_lea_modrm(env, s, modrm, &opreg, &disp);
2433 if (is_store) {
2434 if (reg != OR_TMP0)
2435 gen_op_mov_TN_reg(ot, 0, reg);
2436 gen_op_st_T0_A0(ot + s->mem_index);
2437 } else {
2438 gen_op_ld_T0_A0(ot + s->mem_index);
2439 if (reg != OR_TMP0)
2440 gen_op_mov_reg_T0(ot, reg);
2441 }
2442 }
2443 }
2444
2445 static inline uint32_t insn_get(CPUX86State *env, DisasContext *s, int ot)
2446 {
2447 uint32_t ret;
2448
2449 switch(ot) {
2450 case OT_BYTE:
2451 ret = cpu_ldub_code(env, s->pc);
2452 s->pc++;
2453 break;
2454 case OT_WORD:
2455 ret = cpu_lduw_code(env, s->pc);
2456 s->pc += 2;
2457 break;
2458 default:
2459 case OT_LONG:
2460 ret = cpu_ldl_code(env, s->pc);
2461 s->pc += 4;
2462 break;
2463 }
2464 return ret;
2465 }
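
/* Typical use, e.g. to fetch the immediate of an "Ev, Iz" form
   (sketch only; the ot selection depends on the opcode):

       val = insn_get(env, s, ot);

   s->pc is advanced past the immediate as a side effect. */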
2466
2467 static inline int insn_const_size(unsigned int ot)
2468 {
2469 if (ot <= OT_LONG)
2470 return 1 << ot;
2471 else
2472 return 4;
2473 }
2474
2475 static inline void gen_goto_tb(DisasContext *s, int tb_num, target_ulong eip)
2476 {
2477 TranslationBlock *tb;
2478 target_ulong pc;
2479
2480 pc = s->cs_base + eip;
2481 tb = s->tb;
2482 /* NOTE: we handle the case where the TB spans two pages here */
2483 if ((pc & TARGET_PAGE_MASK) == (tb->pc & TARGET_PAGE_MASK) ||
2484 (pc & TARGET_PAGE_MASK) == ((s->pc - 1) & TARGET_PAGE_MASK)) {
2485 /* jump to same page: we can use a direct jump */
2486 tcg_gen_goto_tb(tb_num);
2487 gen_jmp_im(eip);
2488 tcg_gen_exit_tb((tcg_target_long)tb + tb_num);
2489 } else {
2490 /* jump to another page: currently not optimized */
2491 gen_jmp_im(eip);
2492 gen_eob(s);
2493 }
2494 }
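
/* Sketch of the chaining contract assumed above: tcg_gen_exit_tb(x)
   returns x to the execution loop; a non-zero (tb + tb_num) value
   tells the loop which direct-jump slot of which TB may be patched to
   chain straight to the next translated block, while 0 means "no
   chaining". */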
2495
2496 static inline void gen_jcc(DisasContext *s, int b,
2497 target_ulong val, target_ulong next_eip)
2498 {
2499 int l1, l2;
2500
2501 if (s->jmp_opt) {
2502 gen_update_cc_op(s);
2503 l1 = gen_new_label();
2504 gen_jcc1(s, b, l1);
2505 set_cc_op(s, CC_OP_DYNAMIC);
2506
2507 gen_goto_tb(s, 0, next_eip);
2508
2509 gen_set_label(l1);
2510 gen_goto_tb(s, 1, val);
2511 s->is_jmp = DISAS_TB_JUMP;
2512 } else {
2513 l1 = gen_new_label();
2514 l2 = gen_new_label();
2515 gen_jcc1(s, b, l1);
2516
2517 gen_jmp_im(next_eip);
2518 tcg_gen_br(l2);
2519
2520 gen_set_label(l1);
2521 gen_jmp_im(val);
2522 gen_set_label(l2);
2523 gen_eob(s);
2524 }
2525 }
2526
2527 static void gen_setcc(DisasContext *s, int b)
2528 {
2529 gen_setcc1(s, b, cpu_T[0]);
2530 }
2531
2532 static inline void gen_op_movl_T0_seg(int seg_reg)
2533 {
2534 tcg_gen_ld32u_tl(cpu_T[0], cpu_env,
2535 offsetof(CPUX86State,segs[seg_reg].selector));
2536 }
2537
2538 static inline void gen_op_movl_seg_T0_vm(int seg_reg)
2539 {
2540 tcg_gen_andi_tl(cpu_T[0], cpu_T[0], 0xffff);
2541 tcg_gen_st32_tl(cpu_T[0], cpu_env,
2542 offsetof(CPUX86State,segs[seg_reg].selector));
2543 tcg_gen_shli_tl(cpu_T[0], cpu_T[0], 4);
2544 tcg_gen_st_tl(cpu_T[0], cpu_env,
2545 offsetof(CPUX86State,segs[seg_reg].base));
2546 }
2547
2548 /* move T0 to seg_reg and check whether the CPU state may change. Never
2549 call this function with seg_reg == R_CS */
2550 static void gen_movl_seg_T0(DisasContext *s, int seg_reg, target_ulong cur_eip)
2551 {
2552 if (s->pe && !s->vm86) {
2553 /* XXX: optimize by finding processor state dynamically */
2554 gen_update_cc_op(s);
2555 gen_jmp_im(cur_eip);
2556 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
2557 gen_helper_load_seg(cpu_env, tcg_const_i32(seg_reg), cpu_tmp2_i32);
2558 /* abort translation because the addseg value may change or
2559 because ss32 may change. For R_SS, translation must always
2560 stop, as special handling must be done to disable hardware
2561 interrupts for the next instruction */
2562 if (seg_reg == R_SS || (s->code32 && seg_reg < R_FS))
2563 s->is_jmp = DISAS_TB_JUMP;
2564 } else {
2565 gen_op_movl_seg_T0_vm(seg_reg);
2566 if (seg_reg == R_SS)
2567 s->is_jmp = DISAS_TB_JUMP;
2568 }
2569 }
2570
2571 static inline int svm_is_rep(int prefixes)
2572 {
2573 return ((prefixes & (PREFIX_REPZ | PREFIX_REPNZ)) ? 8 : 0);
2574 }
2575
2576 static inline void
2577 gen_svm_check_intercept_param(DisasContext *s, target_ulong pc_start,
2578 uint32_t type, uint64_t param)
2579 {
2580 /* no SVM activated; fast case */
2581 if (likely(!(s->flags & HF_SVMI_MASK)))
2582 return;
2583 gen_update_cc_op(s);
2584 gen_jmp_im(pc_start - s->cs_base);
2585 gen_helper_svm_check_intercept_param(cpu_env, tcg_const_i32(type),
2586 tcg_const_i64(param));
2587 }
2588
2589 static inline void
2590 gen_svm_check_intercept(DisasContext *s, target_ulong pc_start, uint64_t type)
2591 {
2592 gen_svm_check_intercept_param(s, pc_start, type, 0);
2593 }
2594
2595 static inline void gen_stack_update(DisasContext *s, int addend)
2596 {
2597 #ifdef TARGET_X86_64
2598 if (CODE64(s)) {
2599 gen_op_add_reg_im(2, R_ESP, addend);
2600 } else
2601 #endif
2602 if (s->ss32) {
2603 gen_op_add_reg_im(1, R_ESP, addend);
2604 } else {
2605 gen_op_add_reg_im(0, R_ESP, addend);
2606 }
2607 }
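
/* The first argument of gen_op_add_reg_im() is assumed here to select
   the operand size (0 = 16 bit, 1 = 32 bit, 2 = 64 bit), so e.g. the
   ss32 == 0 case above updates only the low 16 bits of ESP:

       gen_op_add_reg_im(0, R_ESP, 2);       equivalent to "add $2, %sp"
*/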
2608
2609 /* generate a push. It depends on ss32, addseg and dflag */
2610 static void gen_push_T0(DisasContext *s)
2611 {
2612 #ifdef TARGET_X86_64
2613 if (CODE64(s)) {
2614 gen_op_movq_A0_reg(R_ESP);
2615 if (s->dflag) {
2616 gen_op_addq_A0_im(-8);
2617 gen_op_st_T0_A0(OT_QUAD + s->mem_index);
2618 } else {
2619 gen_op_addq_A0_im(-2);
2620 gen_op_st_T0_A0(OT_WORD + s->mem_index);
2621 }
2622 gen_op_mov_reg_A0(2, R_ESP);
2623 } else
2624 #endif
2625 {
2626 gen_op_movl_A0_reg(R_ESP);
2627 if (!s->dflag)
2628 gen_op_addl_A0_im(-2);
2629 else
2630 gen_op_addl_A0_im(-4);
2631 if (s->ss32) {
2632 if (s->addseg) {
2633 tcg_gen_mov_tl(cpu_T[1], cpu_A0);
2634 gen_op_addl_A0_seg(s, R_SS);
2635 }
2636 } else {
2637 gen_op_andl_A0_ffff();
2638 tcg_gen_mov_tl(cpu_T[1], cpu_A0);
2639 gen_op_addl_A0_seg(s, R_SS);
2640 }
2641 gen_op_st_T0_A0(s->dflag + 1 + s->mem_index);
2642 if (s->ss32 && !s->addseg)
2643 gen_op_mov_reg_A0(1, R_ESP);
2644 else
2645 gen_op_mov_reg_T1(s->ss32 + 1, R_ESP);
2646 }
2647 }
2648
2649 /* generate a push. It depends on ss32, addseg and dflag */
2650 /* slower version for T1, only used for call Ev */
2651 static void gen_push_T1(DisasContext *s)
2652 {
2653 #ifdef TARGET_X86_64
2654 if (CODE64(s)) {
2655 gen_op_movq_A0_reg(R_ESP);
2656 if (s->dflag) {
2657 gen_op_addq_A0_im(-8);
2658 gen_op_st_T1_A0(OT_QUAD + s->mem_index);
2659 } else {
2660 gen_op_addq_A0_im(-2);
2661 gen_op_st_T1_A0(OT_WORD + s->mem_index); /* push T1, not T0 */
2662 }
2663 gen_op_mov_reg_A0(2, R_ESP);
2664 } else
2665 #endif
2666 {
2667 gen_op_movl_A0_reg(R_ESP);
2668 if (!s->dflag)
2669 gen_op_addl_A0_im(-2);
2670 else
2671 gen_op_addl_A0_im(-4);
2672 if (s->ss32) {
2673 if (s->addseg) {
2674 gen_op_addl_A0_seg(s, R_SS);
2675 }
2676 } else {
2677 gen_op_andl_A0_ffff();
2678 gen_op_addl_A0_seg(s, R_SS);
2679 }
2680 gen_op_st_T1_A0(s->dflag + 1 + s->mem_index);
2681
2682 if (s->ss32 && !s->addseg)
2683 gen_op_mov_reg_A0(1, R_ESP);
2684 else
2685 gen_stack_update(s, (-2) << s->dflag);
2686 }
2687 }
2688
2689 /* a two-step pop is necessary for precise exceptions */
2690 static void gen_pop_T0(DisasContext *s)
2691 {
2692 #ifdef TARGET_X86_64
2693 if (CODE64(s)) {
2694 gen_op_movq_A0_reg(R_ESP);
2695 gen_op_ld_T0_A0((s->dflag ? OT_QUAD : OT_WORD) + s->mem_index);
2696 } else
2697 #endif
2698 {
2699 gen_op_movl_A0_reg(R_ESP);
2700 if (s->ss32) {
2701 if (s->addseg)
2702 gen_op_addl_A0_seg(s, R_SS);
2703 } else {
2704 gen_op_andl_A0_ffff();
2705 gen_op_addl_A0_seg(s, R_SS);
2706 }
2707 gen_op_ld_T0_A0(s->dflag + 1 + s->mem_index);
2708 }
2709 }
2710
2711 static void gen_pop_update(DisasContext *s)
2712 {
2713 #ifdef TARGET_X86_64
2714 if (CODE64(s) && s->dflag) {
2715 gen_stack_update(s, 8);
2716 } else
2717 #endif
2718 {
2719 gen_stack_update(s, 2 << s->dflag);
2720 }
2721 }
2722
2723 static void gen_stack_A0(DisasContext *s)
2724 {
2725 gen_op_movl_A0_reg(R_ESP);
2726 if (!s->ss32)
2727 gen_op_andl_A0_ffff();
2728 tcg_gen_mov_tl(cpu_T[1], cpu_A0);
2729 if (s->addseg)
2730 gen_op_addl_A0_seg(s, R_SS);
2731 }
2732
2733 /* NOTE: wrap-around in 16-bit mode is not fully handled */
2734 static void gen_pusha(DisasContext *s)
2735 {
2736 int i;
2737 gen_op_movl_A0_reg(R_ESP);
2738 gen_op_addl_A0_im(-16 << s->dflag);
2739 if (!s->ss32)
2740 gen_op_andl_A0_ffff();
2741 tcg_gen_mov_tl(cpu_T[1], cpu_A0);
2742 if (s->addseg)
2743 gen_op_addl_A0_seg(s, R_SS);
2744 for (i = 0; i < 8; i++) {
2745 gen_op_mov_TN_reg(OT_LONG, 0, 7 - i);
2746 gen_op_st_T0_A0(OT_WORD + s->dflag + s->mem_index);
2747 gen_op_addl_A0_im(2 << s->dflag);
2748 }
2749 gen_op_mov_reg_T1(OT_WORD + s->ss32, R_ESP);
2750 }
2751
2752 /* NOTE: wrap-around in 16-bit mode is not fully handled */
2753 static void gen_popa(DisasContext *s)
2754 {
2755 int i;
2756 gen_op_movl_A0_reg(R_ESP);
2757 if (!s->ss32)
2758 gen_op_andl_A0_ffff();
2759 tcg_gen_mov_tl(cpu_T[1], cpu_A0);
2760 tcg_gen_addi_tl(cpu_T[1], cpu_T[1], 16 << s->dflag);
2761 if (s->addseg)
2762 gen_op_addl_A0_seg(s, R_SS);
2763 for (i = 0; i < 8; i++) {
2764 /* ESP is not reloaded */
2765 if (i != 3) {
2766 gen_op_ld_T0_A0(OT_WORD + s->dflag + s->mem_index);
2767 gen_op_mov_reg_T0(OT_WORD + s->dflag, 7 - i);
2768 }
2769 gen_op_addl_A0_im(2 << s->dflag);
2770 }
2771 gen_op_mov_reg_T1(OT_WORD + s->ss32, R_ESP);
2772 }
2773
2774 static void gen_enter(DisasContext *s, int esp_addend, int level)
2775 {
2776 int ot, opsize;
2777
2778 level &= 0x1f;
2779 #ifdef TARGET_X86_64
2780 if (CODE64(s)) {
2781 ot = s->dflag ? OT_QUAD : OT_WORD;
2782 opsize = 1 << ot;
2783
2784 gen_op_movl_A0_reg(R_ESP);
2785 gen_op_addq_A0_im(-opsize);
2786 tcg_gen_mov_tl(cpu_T[1], cpu_A0);
2787
2788 /* push bp */
2789 gen_op_mov_TN_reg(OT_LONG, 0, R_EBP);
2790 gen_op_st_T0_A0(ot + s->mem_index);
2791 if (level) {
2792 /* XXX: must save state */
2793 gen_helper_enter64_level(cpu_env, tcg_const_i32(level),
2794 tcg_const_i32((ot == OT_QUAD)),
2795 cpu_T[1]);
2796 }
2797 gen_op_mov_reg_T1(ot, R_EBP);
2798 tcg_gen_addi_tl(cpu_T[1], cpu_T[1], -esp_addend + (-opsize * level));
2799 gen_op_mov_reg_T1(OT_QUAD, R_ESP);
2800 } else
2801 #endif
2802 {
2803 ot = s->dflag + OT_WORD;
2804 opsize = 2 << s->dflag;
2805
2806 gen_op_movl_A0_reg(R_ESP);
2807 gen_op_addl_A0_im(-opsize);
2808 if (!s->ss32)
2809 gen_op_andl_A0_ffff();
2810 tcg_gen_mov_tl(cpu_T[1], cpu_A0);
2811 if (s->addseg)
2812 gen_op_addl_A0_seg(s, R_SS);
2813 /* push bp */
2814 gen_op_mov_TN_reg(OT_LONG, 0, R_EBP);
2815 gen_op_st_T0_A0(ot + s->mem_index);
2816 if (level) {
2817 /* XXX: must save state */
2818 gen_helper_enter_level(cpu_env, tcg_const_i32(level),
2819 tcg_const_i32(s->dflag),
2820 cpu_T[1]);
2821 }
2822 gen_op_mov_reg_T1(ot, R_EBP);
2823 tcg_gen_addi_tl(cpu_T[1], cpu_T[1], -esp_addend + (-opsize * level));
2824 gen_op_mov_reg_T1(OT_WORD + s->ss32, R_ESP);
2825 }
2826 }
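
/* Rough semantics implemented above and in gen_helper_enter_level()
   (pseudocode; level has already been masked to 0..31):

       push(EBP); frame = ESP;
       for (i = 1; i < level; i++) { EBP -= opsize; push(mem[EBP]); }
       if (level) push(frame);
       EBP = frame;
       ESP = frame - esp_addend - opsize * level;
*/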
2827
2828 static void gen_exception(DisasContext *s, int trapno, target_ulong cur_eip)
2829 {
2830 gen_update_cc_op(s);
2831 gen_jmp_im(cur_eip);
2832 gen_helper_raise_exception(cpu_env, tcg_const_i32(trapno));
2833 s->is_jmp = DISAS_TB_JUMP;
2834 }
2835
2836 /* an interrupt is different from an exception because of the
2837 privilege checks */
2838 static void gen_interrupt(DisasContext *s, int intno,
2839 target_ulong cur_eip, target_ulong next_eip)
2840 {
2841 gen_update_cc_op(s);
2842 gen_jmp_im(cur_eip);
2843 gen_helper_raise_interrupt(cpu_env, tcg_const_i32(intno),
2844 tcg_const_i32(next_eip - cur_eip));
2845 s->is_jmp = DISAS_TB_JUMP;
2846 }
2847
2848 static void gen_debug(DisasContext *s, target_ulong cur_eip)
2849 {
2850 gen_update_cc_op(s);
2851 gen_jmp_im(cur_eip);
2852 gen_helper_debug(cpu_env);
2853 s->is_jmp = DISAS_TB_JUMP;
2854 }
2855
2856 /* generate a generic end of block. A trace exception is also
2857 generated if needed */
2858 static void gen_eob(DisasContext *s)
2859 {
2860 gen_update_cc_op(s);
2861 if (s->tb->flags & HF_INHIBIT_IRQ_MASK) {
2862 gen_helper_reset_inhibit_irq(cpu_env);
2863 }
2864 if (s->tb->flags & HF_RF_MASK) {
2865 gen_helper_reset_rf(cpu_env);
2866 }
2867 if (s->singlestep_enabled) {
2868 gen_helper_debug(cpu_env);
2869 } else if (s->tf) {
2870 gen_helper_single_step(cpu_env);
2871 } else {
2872 tcg_gen_exit_tb(0);
2873 }
2874 s->is_jmp = DISAS_TB_JUMP;
2875 }
2876
2877 /* generate a jump to eip. No segment change must happen beforehand,
2878 as a direct jump to the next block may occur */
2879 static void gen_jmp_tb(DisasContext *s, target_ulong eip, int tb_num)
2880 {
2881 if (s->jmp_opt) {
2882 gen_update_cc_op(s);
2883 gen_goto_tb(s, tb_num, eip);
2884 s->is_jmp = DISAS_TB_JUMP;
2885 } else {
2886 gen_jmp_im(eip);
2887 gen_eob(s);
2888 }
2889 }
2890
2891 static void gen_jmp(DisasContext *s, target_ulong eip)
2892 {
2893 gen_jmp_tb(s, eip, 0);
2894 }
2895
2896 static inline void gen_ldq_env_A0(int idx, int offset)
2897 {
2898 int mem_index = (idx >> 2) - 1;
2899 tcg_gen_qemu_ld64(cpu_tmp1_i64, cpu_A0, mem_index);
2900 tcg_gen_st_i64(cpu_tmp1_i64, cpu_env, offset);
2901 }
2902
2903 static inline void gen_stq_env_A0(int idx, int offset)
2904 {
2905 int mem_index = (idx >> 2) - 1;
2906 tcg_gen_ld_i64(cpu_tmp1_i64, cpu_env, offset);
2907 tcg_gen_qemu_st64(cpu_tmp1_i64, cpu_A0, mem_index);
2908 }
2909
2910 static inline void gen_ldo_env_A0(int idx, int offset)
2911 {
2912 int mem_index = (idx >> 2) - 1;
2913 tcg_gen_qemu_ld64(cpu_tmp1_i64, cpu_A0, mem_index);
2914 tcg_gen_st_i64(cpu_tmp1_i64, cpu_env, offset + offsetof(XMMReg, XMM_Q(0)));
2915 tcg_gen_addi_tl(cpu_tmp0, cpu_A0, 8);
2916 tcg_gen_qemu_ld64(cpu_tmp1_i64, cpu_tmp0, mem_index);
2917 tcg_gen_st_i64(cpu_tmp1_i64, cpu_env, offset + offsetof(XMMReg, XMM_Q(1)));
2918 }
2919
2920 static inline void gen_sto_env_A0(int idx, int offset)
2921 {
2922 int mem_index = (idx >> 2) - 1;
2923 tcg_gen_ld_i64(cpu_tmp1_i64, cpu_env, offset + offsetof(XMMReg, XMM_Q(0)));
2924 tcg_gen_qemu_st64(cpu_tmp1_i64, cpu_A0, mem_index);
2925 tcg_gen_addi_tl(cpu_tmp0, cpu_A0, 8);
2926 tcg_gen_ld_i64(cpu_tmp1_i64, cpu_env, offset + offsetof(XMMReg, XMM_Q(1)));
2927 tcg_gen_qemu_st64(cpu_tmp1_i64, cpu_tmp0, mem_index);
2928 }
2929
2930 static inline void gen_op_movo(int d_offset, int s_offset)
2931 {
2932 tcg_gen_ld_i64(cpu_tmp1_i64, cpu_env, s_offset);
2933 tcg_gen_st_i64(cpu_tmp1_i64, cpu_env, d_offset);
2934 tcg_gen_ld_i64(cpu_tmp1_i64, cpu_env, s_offset + 8);
2935 tcg_gen_st_i64(cpu_tmp1_i64, cpu_env, d_offset + 8);
2936 }
2937
2938 static inline void gen_op_movq(int d_offset, int s_offset)
2939 {
2940 tcg_gen_ld_i64(cpu_tmp1_i64, cpu_env, s_offset);
2941 tcg_gen_st_i64(cpu_tmp1_i64, cpu_env, d_offset);
2942 }
2943
2944 static inline void gen_op_movl(int d_offset, int s_offset)
2945 {
2946 tcg_gen_ld_i32(cpu_tmp2_i32, cpu_env, s_offset);
2947 tcg_gen_st_i32(cpu_tmp2_i32, cpu_env, d_offset);
2948 }
2949
2950 static inline void gen_op_movq_env_0(int d_offset)
2951 {
2952 tcg_gen_movi_i64(cpu_tmp1_i64, 0);
2953 tcg_gen_st_i64(cpu_tmp1_i64, cpu_env, d_offset);
2954 }
2955
2956 typedef void (*SSEFunc_i_ep)(TCGv_i32 val, TCGv_ptr env, TCGv_ptr reg);
2957 typedef void (*SSEFunc_l_ep)(TCGv_i64 val, TCGv_ptr env, TCGv_ptr reg);
2958 typedef void (*SSEFunc_0_epi)(TCGv_ptr env, TCGv_ptr reg, TCGv_i32 val);
2959 typedef void (*SSEFunc_0_epl)(TCGv_ptr env, TCGv_ptr reg, TCGv_i64 val);
2960 typedef void (*SSEFunc_0_epp)(TCGv_ptr env, TCGv_ptr reg_a, TCGv_ptr reg_b);
2961 typedef void (*SSEFunc_0_eppi)(TCGv_ptr env, TCGv_ptr reg_a, TCGv_ptr reg_b,
2962 TCGv_i32 val);
2963 typedef void (*SSEFunc_0_ppi)(TCGv_ptr reg_a, TCGv_ptr reg_b, TCGv_i32 val);
2964 typedef void (*SSEFunc_0_eppt)(TCGv_ptr env, TCGv_ptr reg_a, TCGv_ptr reg_b,
2965 TCGv val);
2966
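/* Naming scheme for the typedefs above: the letters after SSEFunc_
   encode the signature; 0 = void return, i/l = i32/i64 return, and
   the arguments are e = env pointer, p = host pointer to an MMX/XMM
   register, i = TCGv_i32, l = TCGv_i64, t = target-sized TCGv. */
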
2967 #define SSE_SPECIAL ((void *)1)
2968 #define SSE_DUMMY ((void *)2)
2969
2970 #define MMX_OP2(x) { gen_helper_ ## x ## _mmx, gen_helper_ ## x ## _xmm }
2971 #define SSE_FOP(x) { gen_helper_ ## x ## ps, gen_helper_ ## x ## pd, \
2972 gen_helper_ ## x ## ss, gen_helper_ ## x ## sd, }
2973
2974 static const SSEFunc_0_epp sse_op_table1[256][4] = {
2975 /* 3DNow! extensions */
2976 [0x0e] = { SSE_DUMMY }, /* femms */
2977 [0x0f] = { SSE_DUMMY }, /* pf... */
2978 /* pure SSE operations */
2979 [0x10] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* movups, movupd, movss, movsd */
2980 [0x11] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* movups, movupd, movss, movsd */
2981 [0x12] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* movlps, movlpd, movsldup, movddup */
2982 [0x13] = { SSE_SPECIAL, SSE_SPECIAL }, /* movlps, movlpd */
2983 [0x14] = { gen_helper_punpckldq_xmm, gen_helper_punpcklqdq_xmm },
2984 [0x15] = { gen_helper_punpckhdq_xmm, gen_helper_punpckhqdq_xmm },
2985 [0x16] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* movhps, movhpd, movshdup */
2986 [0x17] = { SSE_SPECIAL, SSE_SPECIAL }, /* movhps, movhpd */
2987
2988 [0x28] = { SSE_SPECIAL, SSE_SPECIAL }, /* movaps, movapd */
2989 [0x29] = { SSE_SPECIAL, SSE_SPECIAL }, /* movaps, movapd */
2990 [0x2a] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* cvtpi2ps, cvtpi2pd, cvtsi2ss, cvtsi2sd */
2991 [0x2b] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* movntps, movntpd, movntss, movntsd */
2992 [0x2c] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* cvttps2pi, cvttpd2pi, cvttsd2si, cvttss2si */
2993 [0x2d] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* cvtps2pi, cvtpd2pi, cvtsd2si, cvtss2si */
2994 [0x2e] = { gen_helper_ucomiss, gen_helper_ucomisd },
2995 [0x2f] = { gen_helper_comiss, gen_helper_comisd },
2996 [0x50] = { SSE_SPECIAL, SSE_SPECIAL }, /* movmskps, movmskpd */
2997 [0x51] = SSE_FOP(sqrt),
2998 [0x52] = { gen_helper_rsqrtps, NULL, gen_helper_rsqrtss, NULL },
2999 [0x53] = { gen_helper_rcpps, NULL, gen_helper_rcpss, NULL },
3000 [0x54] = { gen_helper_pand_xmm, gen_helper_pand_xmm }, /* andps, andpd */
3001 [0x55] = { gen_helper_pandn_xmm, gen_helper_pandn_xmm }, /* andnps, andnpd */
3002 [0x56] = { gen_helper_por_xmm, gen_helper_por_xmm }, /* orps, orpd */
3003 [0x57] = { gen_helper_pxor_xmm, gen_helper_pxor_xmm }, /* xorps, xorpd */
3004 [0x58] = SSE_FOP(add),
3005 [0x59] = SSE_FOP(mul),
3006 [0x5a] = { gen_helper_cvtps2pd, gen_helper_cvtpd2ps,
3007 gen_helper_cvtss2sd, gen_helper_cvtsd2ss },
3008 [0x5b] = { gen_helper_cvtdq2ps, gen_helper_cvtps2dq, gen_helper_cvttps2dq },
3009 [0x5c] = SSE_FOP(sub),
3010 [0x5d] = SSE_FOP(min),
3011 [0x5e] = SSE_FOP(div),
3012 [0x5f] = SSE_FOP(max),
3013
3014 [0xc2] = SSE_FOP(cmpeq), /* cmp{ps,pd,ss,sd}; predicate via sse_op_table4 */
3015 [0xc6] = { (SSEFunc_0_epp)gen_helper_shufps,
3016 (SSEFunc_0_epp)gen_helper_shufpd }, /* XXX: casts */
3017
3018 [0x38] = { SSE_SPECIAL, SSE_SPECIAL, NULL, SSE_SPECIAL }, /* SSSE3/SSE4 */
3019 [0x3a] = { SSE_SPECIAL, SSE_SPECIAL }, /* SSSE3/SSE4 */
3020
3021 /* MMX ops and their SSE extensions */
3022 [0x60] = MMX_OP2(punpcklbw),
3023 [0x61] = MMX_OP2(punpcklwd),
3024 [0x62] = MMX_OP2(punpckldq),
3025 [0x63] = MMX_OP2(packsswb),
3026 [0x64] = MMX_OP2(pcmpgtb),
3027 [0x65] = MMX_OP2(pcmpgtw),
3028 [0x66] = MMX_OP2(pcmpgtl),
3029 [0x67] = MMX_OP2(packuswb),
3030 [0x68] = MMX_OP2(punpckhbw),
3031 [0x69] = MMX_OP2(punpckhwd),
3032 [0x6a] = MMX_OP2(punpckhdq),
3033 [0x6b] = MMX_OP2(packssdw),
3034 [0x6c] = { NULL, gen_helper_punpcklqdq_xmm },
3035 [0x6d] = { NULL, gen_helper_punpckhqdq_xmm },
3036 [0x6e] = { SSE_SPECIAL, SSE_SPECIAL }, /* movd mm, ea */
3037 [0x6f] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* movq, movdqa, movdqu */
3038 [0x70] = { (SSEFunc_0_epp)gen_helper_pshufw_mmx,
3039 (SSEFunc_0_epp)gen_helper_pshufd_xmm,
3040 (SSEFunc_0_epp)gen_helper_pshufhw_xmm,
3041 (SSEFunc_0_epp)gen_helper_pshuflw_xmm }, /* XXX: casts */
3042 [0x71] = { SSE_SPECIAL, SSE_SPECIAL }, /* shiftw */
3043 [0x72] = { SSE_SPECIAL, SSE_SPECIAL }, /* shiftd */
3044 [0x73] = { SSE_SPECIAL, SSE_SPECIAL }, /* shiftq */
3045 [0x74] = MMX_OP2(pcmpeqb),
3046 [0x75] = MMX_OP2(pcmpeqw),
3047 [0x76] = MMX_OP2(pcmpeql),
3048 [0x77] = { SSE_DUMMY }, /* emms */
3049 [0x78] = { NULL, SSE_SPECIAL, NULL, SSE_SPECIAL }, /* extrq_i, insertq_i */
3050 [0x79] = { NULL, gen_helper_extrq_r, NULL, gen_helper_insertq_r },
3051 [0x7c] = { NULL, gen_helper_haddpd, NULL, gen_helper_haddps },
3052 [0x7d] = { NULL, gen_helper_hsubpd, NULL, gen_helper_hsubps },
3053 [0x7e] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* movd, movd, movq */
3054 [0x7f] = { SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* movq, movdqa, movdqu */
3055 [0xc4] = { SSE_SPECIAL, SSE_SPECIAL }, /* pinsrw */
3056 [0xc5] = { SSE_SPECIAL, SSE_SPECIAL }, /* pextrw */
3057 [0xd0] = { NULL, gen_helper_addsubpd, NULL, gen_helper_addsubps },
3058 [0xd1] = MMX_OP2(psrlw),
3059 [0xd2] = MMX_OP2(psrld),
3060 [0xd3] = MMX_OP2(psrlq),
3061 [0xd4] = MMX_OP2(paddq),
3062 [0xd5] = MMX_OP2(pmullw),
3063 [0xd6] = { NULL, SSE_SPECIAL, SSE_SPECIAL, SSE_SPECIAL }, /* movq, movq2dq, movdq2q */
3064 [0xd7] = { SSE_SPECIAL, SSE_SPECIAL }, /* pmovmskb */
3065 [0xd8] = MMX_OP2(psubusb),
3066 [0xd9] = MMX_OP2(psubusw),
3067 [0xda] = MMX_OP2(pminub),
3068 [0xdb] = MMX_OP2(pand),
3069 [0xdc] = MMX_OP2(paddusb),
3070 [0xdd] = MMX_OP2(paddusw),
3071 [0xde] = MMX_OP2(pmaxub),
3072 [0xdf] = MMX_OP2(pandn),
3073 [0xe0] = MMX_OP2(pavgb),
3074 [0xe1] = MMX_OP2(psraw),
3075 [0xe2] = MMX_OP2(psrad),
3076 [0xe3] = MMX_OP2(pavgw),
3077 [0xe4] = MMX_OP2(pmulhuw),
3078 [0xe5] = MMX_OP2(pmulhw),
3079 [0xe6] = { NULL, gen_helper_cvttpd2dq, gen_helper_cvtdq2pd, gen_helper_cvtpd2dq },
3080 [0xe7] = { SSE_SPECIAL, SSE_SPECIAL }, /* movntq, movntdq */
3081 [0xe8] = MMX_OP2(psubsb),
3082 [0xe9] = MMX_OP2(psubsw),
3083 [0xea] = MMX_OP2(pminsw),
3084 [0xeb] = MMX_OP2(por),
3085 [0xec] = MMX_OP2(paddsb),
3086 [0xed] = MMX_OP2(paddsw),
3087 [0xee] = MMX_OP2(pmaxsw),
3088 [0xef] = MMX_OP2(pxor),
3089 [0xf0] = { NULL, NULL, NULL, SSE_SPECIAL }, /* lddqu */
3090 [0xf1] = MMX_OP2(psllw),
3091 [0xf2] = MMX_OP2(pslld),
3092 [0xf3] = MMX_OP2(psllq),
3093 [0xf4] = MMX_OP2(pmuludq),
3094 [0xf5] = MMX_OP2(pmaddwd),
3095 [0xf6] = MMX_OP2(psadbw),
3096 [0xf7] = { (SSEFunc_0_epp)gen_helper_maskmov_mmx,
3097 (SSEFunc_0_epp)gen_helper_maskmov_xmm }, /* XXX: casts */
3098 [0xf8] = MMX_OP2(psubb),
3099 [0xf9] = MMX_OP2(psubw),
3100 [0xfa] = MMX_OP2(psubl),
3101 [0xfb] = MMX_OP2(psubq),
3102 [0xfc] = MMX_OP2(paddb),
3103 [0xfd] = MMX_OP2(paddw),
3104 [0xfe] = MMX_OP2(paddl),
3105 };
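
/* The second index (b1) of sse_op_table1 and the tables below selects
   the mandatory prefix, matching the computation in gen_sse():

       0 = no prefix   (MMX / ps forms)
       1 = 0x66        (pd / SSE2 integer forms)
       2 = 0xf3        (ss forms)
       3 = 0xf2        (sd forms)
*/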
3106
3107 static const SSEFunc_0_epp sse_op_table2[3 * 8][2] = {
3108 [0 + 2] = MMX_OP2(psrlw),
3109 [0 + 4] = MMX_OP2(psraw),
3110 [0 + 6] = MMX_OP2(psllw),
3111 [8 + 2] = MMX_OP2(psrld),
3112 [8 + 4] = MMX_OP2(psrad),
3113 [8 + 6] = MMX_OP2(pslld),
3114 [16 + 2] = MMX_OP2(psrlq),
3115 [16 + 3] = { NULL, gen_helper_psrldq_xmm },
3116 [16 + 6] = MMX_OP2(psllq),
3117 [16 + 7] = { NULL, gen_helper_pslldq_xmm },
3118 };
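
/* Indexed as sse_op_table2[((b - 1) & 3) * 8 + reg][b1]: the opcode
   selects the group (0x71 = words, 0x72 = dwords, 0x73 = qwords) and
   the ModRM reg field the slot (2 = srl, 4 = sra, 6 = sll; 3 and 7
   are the 0x66-only psrldq/pslldq byte shifts). */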
3119
3120 static const SSEFunc_0_epi sse_op_table3ai[] = {
3121 gen_helper_cvtsi2ss,
3122 gen_helper_cvtsi2sd
3123 };
3124
3125 #ifdef TARGET_X86_64
3126 static const SSEFunc_0_epl sse_op_table3aq[] = {
3127 gen_helper_cvtsq2ss,
3128 gen_helper_cvtsq2sd
3129 };
3130 #endif
3131
3132 static const SSEFunc_i_ep sse_op_table3bi[] = {
3133 gen_helper_cvttss2si,
3134 gen_helper_cvtss2si,
3135 gen_helper_cvttsd2si,
3136 gen_helper_cvtsd2si
3137 };
3138
3139 #ifdef TARGET_X86_64
3140 static const SSEFunc_l_ep sse_op_table3bq[] = {
3141 gen_helper_cvttss2sq,
3142 gen_helper_cvtss2sq,
3143 gen_helper_cvttsd2sq,
3144 gen_helper_cvtsd2sq
3145 };
3146 #endif
3147
3148 static const SSEFunc_0_epp sse_op_table4[8][4] = {
3149 SSE_FOP(cmpeq),
3150 SSE_FOP(cmplt),
3151 SSE_FOP(cmple),
3152 SSE_FOP(cmpunord),
3153 SSE_FOP(cmpneq),
3154 SSE_FOP(cmpnlt),
3155 SSE_FOP(cmpnle),
3156 SSE_FOP(cmpord),
3157 };
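
/* sse_op_table4 is indexed by the imm8 predicate of cmp{ps,pd,ss,sd}
   (0f c2): 0 = eq, 1 = lt, 2 = le, 3 = unord, 4 = neq, 5 = nlt,
   6 = nle, 7 = ord. */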
3158
3159 static const SSEFunc_0_epp sse_op_table5[256] = {
3160 [0x0c] = gen_helper_pi2fw,
3161 [0x0d] = gen_helper_pi2fd,
3162 [0x1c] = gen_helper_pf2iw,
3163 [0x1d] = gen_helper_pf2id,
3164 [0x8a] = gen_helper_pfnacc,
3165 [0x8e] = gen_helper_pfpnacc,
3166 [0x90] = gen_helper_pfcmpge,
3167 [0x94] = gen_helper_pfmin,
3168 [0x96] = gen_helper_pfrcp,
3169 [0x97] = gen_helper_pfrsqrt,
3170 [0x9a] = gen_helper_pfsub,
3171 [0x9e] = gen_helper_pfadd,
3172 [0xa0] = gen_helper_pfcmpgt,
3173 [0xa4] = gen_helper_pfmax,
3174 [0xa6] = gen_helper_movq, /* pfrcpit1; no need to actually increase precision */
3175 [0xa7] = gen_helper_movq, /* pfrsqit1 */
3176 [0xaa] = gen_helper_pfsubr,
3177 [0xae] = gen_helper_pfacc,
3178 [0xb0] = gen_helper_pfcmpeq,
3179 [0xb4] = gen_helper_pfmul,
3180 [0xb6] = gen_helper_movq, /* pfrcpit2 */
3181 [0xb7] = gen_helper_pmulhrw_mmx,
3182 [0xbb] = gen_helper_pswapd,
3183 [0xbf] = gen_helper_pavgb_mmx /* pavgusb */
3184 };
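
/* 3DNow! (0f 0f) carries its real opcode as a trailing imm8; the
   sse_op_table5 index is that suffix byte. */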
3185
3186 struct SSEOpHelper_epp {
3187 SSEFunc_0_epp op[2];
3188 uint32_t ext_mask;
3189 };
3190
3191 struct SSEOpHelper_eppi {
3192 SSEFunc_0_eppi op[2];
3193 uint32_t ext_mask;
3194 };
3195
3196 #define SSSE3_OP(x) { MMX_OP2(x), CPUID_EXT_SSSE3 }
3197 #define SSE41_OP(x) { { NULL, gen_helper_ ## x ## _xmm }, CPUID_EXT_SSE41 }
3198 #define SSE42_OP(x) { { NULL, gen_helper_ ## x ## _xmm }, CPUID_EXT_SSE42 }
3199 #define SSE41_SPECIAL { { NULL, SSE_SPECIAL }, CPUID_EXT_SSE41 }
3200
3201 static const struct SSEOpHelper_epp sse_op_table6[256] = {
3202 [0x00] = SSSE3_OP(pshufb),
3203 [0x01] = SSSE3_OP(phaddw),
3204 [0x02] = SSSE3_OP(phaddd),
3205 [0x03] = SSSE3_OP(phaddsw),
3206 [0x04] = SSSE3_OP(pmaddubsw),
3207 [0x05] = SSSE3_OP(phsubw),
3208 [0x06] = SSSE3_OP(phsubd),
3209 [0x07] = SSSE3_OP(phsubsw),
3210 [0x08] = SSSE3_OP(psignb),
3211 [0x09] = SSSE3_OP(psignw),
3212 [0x0a] = SSSE3_OP(psignd),
3213 [0x0b] = SSSE3_OP(pmulhrsw),
3214 [0x10] = SSE41_OP(pblendvb),
3215 [0x14] = SSE41_OP(blendvps),
3216 [0x15] = SSE41_OP(blendvpd),
3217 [0x17] = SSE41_OP(ptest),
3218 [0x1c] = SSSE3_OP(pabsb),
3219 [0x1d] = SSSE3_OP(pabsw),
3220 [0x1e] = SSSE3_OP(pabsd),
3221 [0x20] = SSE41_OP(pmovsxbw),
3222 [0x21] = SSE41_OP(pmovsxbd),
3223 [0x22] = SSE41_OP(pmovsxbq),
3224 [0x23] = SSE41_OP(pmovsxwd),
3225 [0x24] = SSE41_OP(pmovsxwq),
3226 [0x25] = SSE41_OP(pmovsxdq),
3227 [0x28] = SSE41_OP(pmuldq),
3228 [0x29] = SSE41_OP(pcmpeqq),
3229 [0x2a] = SSE41_SPECIAL, /* movntdqa */
3230 [0x2b] = SSE41_OP(packusdw),
3231 [0x30] = SSE41_OP(pmovzxbw),
3232 [0x31] = SSE41_OP(pmovzxbd),
3233 [0x32] = SSE41_OP(pmovzxbq),
3234 [0x33] = SSE41_OP(pmovzxwd),
3235 [0x34] = SSE41_OP(pmovzxwq),
3236 [0x35] = SSE41_OP(pmovzxdq),
3237 [0x37] = SSE42_OP(pcmpgtq),
3238 [0x38] = SSE41_OP(pminsb),
3239 [0x39] = SSE41_OP(pminsd),
3240 [0x3a] = SSE41_OP(pminuw),
3241 [0x3b] = SSE41_OP(pminud),
3242 [0x3c] = SSE41_OP(pmaxsb),
3243 [0x3d] = SSE41_OP(pmaxsd),
3244 [0x3e] = SSE41_OP(pmaxuw),
3245 [0x3f] = SSE41_OP(pmaxud),
3246 [0x40] = SSE41_OP(pmulld),
3247 [0x41] = SSE41_OP(phminposuw),
3248 };
3249
3250 static const struct SSEOpHelper_eppi sse_op_table7[256] = {
3251 [0x08] = SSE41_OP(roundps),
3252 [0x09] = SSE41_OP(roundpd),
3253 [0x0a] = SSE41_OP(roundss),
3254 [0x0b] = SSE41_OP(roundsd),
3255 [0x0c] = SSE41_OP(blendps),
3256 [0x0d] = SSE41_OP(blendpd),
3257 [0x0e] = SSE41_OP(pblendw),
3258 [0x0f] = SSSE3_OP(palignr),
3259 [0x14] = SSE41_SPECIAL, /* pextrb */
3260 [0x15] = SSE41_SPECIAL, /* pextrw */
3261 [0x16] = SSE41_SPECIAL, /* pextrd/pextrq */
3262 [0x17] = SSE41_SPECIAL, /* extractps */
3263 [0x20] = SSE41_SPECIAL, /* pinsrb */
3264 [0x21] = SSE41_SPECIAL, /* insertps */
3265 [0x22] = SSE41_SPECIAL, /* pinsrd/pinsrq */
3266 [0x40] = SSE41_OP(dpps),
3267 [0x41] = SSE41_OP(dppd),
3268 [0x42] = SSE41_OP(mpsadbw),
3269 [0x60] = SSE42_OP(pcmpestrm),
3270 [0x61] = SSE42_OP(pcmpestri),
3271 [0x62] = SSE42_OP(pcmpistrm),
3272 [0x63] = SSE42_OP(pcmpistri),
3273 };
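
/* sse_op_table6/7 are indexed by the third opcode byte of the 0f 38
   and 0f 3a maps; table7 entries additionally consume an imm8, hence
   the extra TCGv_i32 argument in SSEFunc_0_eppi. */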
3274
3275 static void gen_sse(CPUX86State *env, DisasContext *s, int b,
3276 target_ulong pc_start, int rex_r)
3277 {
3278 int b1, op1_offset, op2_offset, is_xmm, val, ot;
3279 int modrm, mod, rm, reg, reg_addr, offset_addr;
3280 SSEFunc_0_epp sse_fn_epp;
3281 SSEFunc_0_eppi sse_fn_eppi;
3282 SSEFunc_0_ppi sse_fn_ppi;
3283 SSEFunc_0_eppt sse_fn_eppt;
3284
3285 b &= 0xff;
3286 if (s->prefix & PREFIX_DATA)
3287 b1 = 1;
3288 else if (s->prefix & PREFIX_REPZ)
3289 b1 = 2;
3290 else if (s->prefix & PREFIX_REPNZ)
3291 b1 = 3;
3292 else
3293 b1 = 0;
3294 sse_fn_epp = sse_op_table1[b][b1];
3295 if (!sse_fn_epp) {
3296 goto illegal_op;
3297 }
3298 if ((b <= 0x5f && b >= 0x10) || b == 0xc6 || b == 0xc2) {
3299 is_xmm = 1;
3300 } else {
3301 if (b1 == 0) {
3302 /* MMX case */
3303 is_xmm = 0;
3304 } else {
3305 is_xmm = 1;
3306 }
3307 }
3308 /* simple MMX/SSE operation */
3309 if (s->flags & HF_TS_MASK) {
3310 gen_exception(s, EXCP07_PREX, pc_start - s->cs_base);
3311 return;
3312 }
3313 if (s->flags & HF_EM_MASK) {
3314 illegal_op:
3315 gen_exception(s, EXCP06_ILLOP, pc_start - s->cs_base);
3316 return;
3317 }
3318 if (is_xmm && !(s->flags & HF_OSFXSR_MASK))
3319 if ((b != 0x38 && b != 0x3a) || (s->prefix & PREFIX_DATA))
3320 goto illegal_op;
3321 if (b == 0x0e) {
3322 if (!(s->cpuid_ext2_features & CPUID_EXT2_3DNOW))
3323 goto illegal_op;
3324 /* femms */
3325 gen_helper_emms(cpu_env);
3326 return;
3327 }
3328 if (b == 0x77) {
3329 /* emms */
3330 gen_helper_emms(cpu_env);
3331 return;
3332 }
3333 /* prepare MMX state (XXX: optimize by storing fpstt and fptags in
3334 the static cpu state) */
3335 if (!is_xmm) {
3336 gen_helper_enter_mmx(cpu_env);
3337 }
3338
3339 modrm = cpu_ldub_code(env, s->pc++);
3340 reg = ((modrm >> 3) & 7);
3341 if (is_xmm)
3342 reg |= rex_r;
3343 mod = (modrm >> 6) & 3;
3344 if (sse_fn_epp == SSE_SPECIAL) {
3345 b |= (b1 << 8);
3346 switch(b) {
3347 case 0x0e7: /* movntq */
3348 if (mod == 3)
3349 goto illegal_op;
3350 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3351 gen_stq_env_A0(s->mem_index, offsetof(CPUX86State,fpregs[reg].mmx));
3352 break;
3353 case 0x1e7: /* movntdq */
3354 case 0x02b: /* movntps */
3355 case 0x12b: /* movntpd */
3356 if (mod == 3)
3357 goto illegal_op;
3358 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3359 gen_sto_env_A0(s->mem_index, offsetof(CPUX86State,xmm_regs[reg]));
3360 break;
3361 case 0x3f0: /* lddqu */
3362 if (mod == 3)
3363 goto illegal_op;
3364 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3365 gen_ldo_env_A0(s->mem_index, offsetof(CPUX86State,xmm_regs[reg]));
3366 break;
3367 case 0x22b: /* movntss */
3368 case 0x32b: /* movntsd */
3369 if (mod == 3)
3370 goto illegal_op;
3371 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3372 if (b1 & 1) {
3373 gen_stq_env_A0(s->mem_index, offsetof(CPUX86State,
3374 xmm_regs[reg]));
3375 } else {
3376 tcg_gen_ld32u_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,
3377 xmm_regs[reg].XMM_L(0)));
3378 gen_op_st_T0_A0(OT_LONG + s->mem_index);
3379 }
3380 break;
3381 case 0x6e: /* movd mm, ea */
3382 #ifdef TARGET_X86_64
3383 if (s->dflag == 2) {
3384 gen_ldst_modrm(env, s, modrm, OT_QUAD, OR_TMP0, 0);
3385 tcg_gen_st_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,fpregs[reg].mmx));
3386 } else
3387 #endif
3388 {
3389 gen_ldst_modrm(env, s, modrm, OT_LONG, OR_TMP0, 0);
3390 tcg_gen_addi_ptr(cpu_ptr0, cpu_env,
3391 offsetof(CPUX86State,fpregs[reg].mmx));
3392 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
3393 gen_helper_movl_mm_T0_mmx(cpu_ptr0, cpu_tmp2_i32);
3394 }
3395 break;
3396 case 0x16e: /* movd xmm, ea */
3397 #ifdef TARGET_X86_64
3398 if (s->dflag == 2) {
3399 gen_ldst_modrm(env, s, modrm, OT_QUAD, OR_TMP0, 0);
3400 tcg_gen_addi_ptr(cpu_ptr0, cpu_env,
3401 offsetof(CPUX86State,xmm_regs[reg]));
3402 gen_helper_movq_mm_T0_xmm(cpu_ptr0, cpu_T[0]);
3403 } else
3404 #endif
3405 {
3406 gen_ldst_modrm(env, s, modrm, OT_LONG, OR_TMP0, 0);
3407 tcg_gen_addi_ptr(cpu_ptr0, cpu_env,
3408 offsetof(CPUX86State,xmm_regs[reg]));
3409 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
3410 gen_helper_movl_mm_T0_xmm(cpu_ptr0, cpu_tmp2_i32);
3411 }
3412 break;
3413 case 0x6f: /* movq mm, ea */
3414 if (mod != 3) {
3415 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3416 gen_ldq_env_A0(s->mem_index, offsetof(CPUX86State,fpregs[reg].mmx));
3417 } else {
3418 rm = (modrm & 7);
3419 tcg_gen_ld_i64(cpu_tmp1_i64, cpu_env,
3420 offsetof(CPUX86State,fpregs[rm].mmx));
3421 tcg_gen_st_i64(cpu_tmp1_i64, cpu_env,
3422 offsetof(CPUX86State,fpregs[reg].mmx));
3423 }
3424 break;
3425 case 0x010: /* movups */
3426 case 0x110: /* movupd */
3427 case 0x028: /* movaps */
3428 case 0x128: /* movapd */
3429 case 0x16f: /* movdqa xmm, ea */
3430 case 0x26f: /* movdqu xmm, ea */
3431 if (mod != 3) {
3432 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3433 gen_ldo_env_A0(s->mem_index, offsetof(CPUX86State,xmm_regs[reg]));
3434 } else {
3435 rm = (modrm & 7) | REX_B(s);
3436 gen_op_movo(offsetof(CPUX86State,xmm_regs[reg]),
3437 offsetof(CPUX86State,xmm_regs[rm]));
3438 }
3439 break;
3440 case 0x210: /* movss xmm, ea */
3441 if (mod != 3) {
3442 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3443 gen_op_ld_T0_A0(OT_LONG + s->mem_index);
3444 tcg_gen_st32_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,xmm_regs[reg].XMM_L(0)));
3445 gen_op_movl_T0_0();
3446 tcg_gen_st32_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,xmm_regs[reg].XMM_L(1)));
3447 tcg_gen_st32_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,xmm_regs[reg].XMM_L(2)));
3448 tcg_gen_st32_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,xmm_regs[reg].XMM_L(3)));
3449 } else {
3450 rm = (modrm & 7) | REX_B(s);
3451 gen_op_movl(offsetof(CPUX86State,xmm_regs[reg].XMM_L(0)),
3452 offsetof(CPUX86State,xmm_regs[rm].XMM_L(0)));
3453 }
3454 break;
3455 case 0x310: /* movsd xmm, ea */
3456 if (mod != 3) {
3457 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3458 gen_ldq_env_A0(s->mem_index, offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0)));
3459 gen_op_movl_T0_0();
3460 tcg_gen_st32_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,xmm_regs[reg].XMM_L(2)));
3461 tcg_gen_st32_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,xmm_regs[reg].XMM_L(3)));
3462 } else {
3463 rm = (modrm & 7) | REX_B(s);
3464 gen_op_movq(offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0)),
3465 offsetof(CPUX86State,xmm_regs[rm].XMM_Q(0)));
3466 }
3467 break;
3468 case 0x012: /* movlps */
3469 case 0x112: /* movlpd */
3470 if (mod != 3) {
3471 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3472 gen_ldq_env_A0(s->mem_index, offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0)));
3473 } else {
3474 /* movhlps */
3475 rm = (modrm & 7) | REX_B(s);
3476 gen_op_movq(offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0)),
3477 offsetof(CPUX86State,xmm_regs[rm].XMM_Q(1)));
3478 }
3479 break;
3480 case 0x212: /* movsldup */
3481 if (mod != 3) {
3482 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3483 gen_ldo_env_A0(s->mem_index, offsetof(CPUX86State,xmm_regs[reg]));
3484 } else {
3485 rm = (modrm & 7) | REX_B(s);
3486 gen_op_movl(offsetof(CPUX86State,xmm_regs[reg].XMM_L(0)),
3487 offsetof(CPUX86State,xmm_regs[rm].XMM_L(0)));
3488 gen_op_movl(offsetof(CPUX86State,xmm_regs[reg].XMM_L(2)),
3489 offsetof(CPUX86State,xmm_regs[rm].XMM_L(2)));
3490 }
3491 gen_op_movl(offsetof(CPUX86State,xmm_regs[reg].XMM_L(1)),
3492 offsetof(CPUX86State,xmm_regs[reg].XMM_L(0)));
3493 gen_op_movl(offsetof(CPUX86State,xmm_regs[reg].XMM_L(3)),
3494 offsetof(CPUX86State,xmm_regs[reg].XMM_L(2)));
3495 break;
3496 case 0x312: /* movddup */
3497 if (mod != 3) {
3498 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3499 gen_ldq_env_A0(s->mem_index, offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0)));
3500 } else {
3501 rm = (modrm & 7) | REX_B(s);
3502 gen_op_movq(offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0)),
3503 offsetof(CPUX86State,xmm_regs[rm].XMM_Q(0)));
3504 }
3505 gen_op_movq(offsetof(CPUX86State,xmm_regs[reg].XMM_Q(1)),
3506 offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0)));
3507 break;
3508 case 0x016: /* movhps */
3509 case 0x116: /* movhpd */
3510 if (mod != 3) {
3511 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3512 gen_ldq_env_A0(s->mem_index, offsetof(CPUX86State,xmm_regs[reg].XMM_Q(1)));
3513 } else {
3514 /* movlhps */
3515 rm = (modrm & 7) | REX_B(s);
3516 gen_op_movq(offsetof(CPUX86State,xmm_regs[reg].XMM_Q(1)),
3517 offsetof(CPUX86State,xmm_regs[rm].XMM_Q(0)));
3518 }
3519 break;
3520 case 0x216: /* movshdup */
3521 if (mod != 3) {
3522 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3523 gen_ldo_env_A0(s->mem_index, offsetof(CPUX86State,xmm_regs[reg]));
3524 } else {
3525 rm = (modrm & 7) | REX_B(s);
3526 gen_op_movl(offsetof(CPUX86State,xmm_regs[reg].XMM_L(1)),
3527 offsetof(CPUX86State,xmm_regs[rm].XMM_L(1)));
3528 gen_op_movl(offsetof(CPUX86State,xmm_regs[reg].XMM_L(3)),
3529 offsetof(CPUX86State,xmm_regs[rm].XMM_L(3)));
3530 }
3531 gen_op_movl(offsetof(CPUX86State,xmm_regs[reg].XMM_L(0)),
3532 offsetof(CPUX86State,xmm_regs[reg].XMM_L(1)));
3533 gen_op_movl(offsetof(CPUX86State,xmm_regs[reg].XMM_L(2)),
3534 offsetof(CPUX86State,xmm_regs[reg].XMM_L(3)));
3535 break;
3536 case 0x178: /* extrq_i (SSE4a) */
3537 case 0x378: /* insertq_i (SSE4a) */
3538 {
3539 int bit_index, field_length;
3540
3541 if (b1 == 1 && reg != 0)
3542 goto illegal_op;
3543 field_length = cpu_ldub_code(env, s->pc++) & 0x3F;
3544 bit_index = cpu_ldub_code(env, s->pc++) & 0x3F;
3545 tcg_gen_addi_ptr(cpu_ptr0, cpu_env,
3546 offsetof(CPUX86State,xmm_regs[reg]));
3547 if (b1 == 1)
3548 gen_helper_extrq_i(cpu_env, cpu_ptr0,
3549 tcg_const_i32(bit_index),
3550 tcg_const_i32(field_length));
3551 else
3552 gen_helper_insertq_i(cpu_env, cpu_ptr0,
3553 tcg_const_i32(bit_index),
3554 tcg_const_i32(field_length));
3555 }
3556 break;
3557 case 0x7e: /* movd ea, mm */
3558 #ifdef TARGET_X86_64
3559 if (s->dflag == 2) {
3560 tcg_gen_ld_i64(cpu_T[0], cpu_env,
3561 offsetof(CPUX86State,fpregs[reg].mmx));
3562 gen_ldst_modrm(env, s, modrm, OT_QUAD, OR_TMP0, 1);
3563 } else
3564 #endif
3565 {
3566 tcg_gen_ld32u_tl(cpu_T[0], cpu_env,
3567 offsetof(CPUX86State,fpregs[reg].mmx.MMX_L(0)));
3568 gen_ldst_modrm(env, s, modrm, OT_LONG, OR_TMP0, 1);
3569 }
3570 break;
3571 case 0x17e: /* movd ea, xmm */
3572 #ifdef TARGET_X86_64
3573 if (s->dflag == 2) {
3574 tcg_gen_ld_i64(cpu_T[0], cpu_env,
3575 offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0)));
3576 gen_ldst_modrm(env, s, modrm, OT_QUAD, OR_TMP0, 1);
3577 } else
3578 #endif
3579 {
3580 tcg_gen_ld32u_tl(cpu_T[0], cpu_env,
3581 offsetof(CPUX86State,xmm_regs[reg].XMM_L(0)));
3582 gen_ldst_modrm(env, s, modrm, OT_LONG, OR_TMP0, 1);
3583 }
3584 break;
3585 case 0x27e: /* movq xmm, ea */
3586 if (mod != 3) {
3587 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3588 gen_ldq_env_A0(s->mem_index, offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0)));
3589 } else {
3590 rm = (modrm & 7) | REX_B(s);
3591 gen_op_movq(offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0)),
3592 offsetof(CPUX86State,xmm_regs[rm].XMM_Q(0)));
3593 }
3594 gen_op_movq_env_0(offsetof(CPUX86State,xmm_regs[reg].XMM_Q(1)));
3595 break;
3596 case 0x7f: /* movq ea, mm */
3597 if (mod != 3) {
3598 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3599 gen_stq_env_A0(s->mem_index, offsetof(CPUX86State,fpregs[reg].mmx));
3600 } else {
3601 rm = (modrm & 7);
3602 gen_op_movq(offsetof(CPUX86State,fpregs[rm].mmx),
3603 offsetof(CPUX86State,fpregs[reg].mmx));
3604 }
3605 break;
3606 case 0x011: /* movups */
3607 case 0x111: /* movupd */
3608 case 0x029: /* movaps */
3609 case 0x129: /* movapd */
3610 case 0x17f: /* movdqa ea, xmm */
3611 case 0x27f: /* movdqu ea, xmm */
3612 if (mod != 3) {
3613 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3614 gen_sto_env_A0(s->mem_index, offsetof(CPUX86State,xmm_regs[reg]));
3615 } else {
3616 rm = (modrm & 7) | REX_B(s);
3617 gen_op_movo(offsetof(CPUX86State,xmm_regs[rm]),
3618 offsetof(CPUX86State,xmm_regs[reg]));
3619 }
3620 break;
3621 case 0x211: /* movss ea, xmm */
3622 if (mod != 3) {
3623 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3624 tcg_gen_ld32u_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,xmm_regs[reg].XMM_L(0)));
3625 gen_op_st_T0_A0(OT_LONG + s->mem_index);
3626 } else {
3627 rm = (modrm & 7) | REX_B(s);
3628 gen_op_movl(offsetof(CPUX86State,xmm_regs[rm].XMM_L(0)),
3629 offsetof(CPUX86State,xmm_regs[reg].XMM_L(0)));
3630 }
3631 break;
3632 case 0x311: /* movsd ea, xmm */
3633 if (mod != 3) {
3634 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3635 gen_stq_env_A0(s->mem_index, offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0)));
3636 } else {
3637 rm = (modrm & 7) | REX_B(s);
3638 gen_op_movq(offsetof(CPUX86State,xmm_regs[rm].XMM_Q(0)),
3639 offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0)));
3640 }
3641 break;
3642 case 0x013: /* movlps */
3643 case 0x113: /* movlpd */
3644 if (mod != 3) {
3645 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3646 gen_stq_env_A0(s->mem_index, offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0)));
3647 } else {
3648 goto illegal_op;
3649 }
3650 break;
3651 case 0x017: /* movhps */
3652 case 0x117: /* movhpd */
3653 if (mod != 3) {
3654 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3655 gen_stq_env_A0(s->mem_index, offsetof(CPUX86State,xmm_regs[reg].XMM_Q(1)));
3656 } else {
3657 goto illegal_op;
3658 }
3659 break;
3660 case 0x71: /* shift mm, im */
3661 case 0x72:
3662 case 0x73:
3663 case 0x171: /* shift xmm, im */
3664 case 0x172:
3665 case 0x173:
3666 if (b1 >= 2) {
3667 goto illegal_op;
3668 }
3669 val = cpu_ldub_code(env, s->pc++);
3670 if (is_xmm) {
3671 gen_op_movl_T0_im(val);
3672 tcg_gen_st32_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,xmm_t0.XMM_L(0)));
3673 gen_op_movl_T0_0();
3674 tcg_gen_st32_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,xmm_t0.XMM_L(1)));
3675 op1_offset = offsetof(CPUX86State,xmm_t0);
3676 } else {
3677 gen_op_movl_T0_im(val);
3678 tcg_gen_st32_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,mmx_t0.MMX_L(0)));
3679 gen_op_movl_T0_0();
3680 tcg_gen_st32_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,mmx_t0.MMX_L(1)));
3681 op1_offset = offsetof(CPUX86State,mmx_t0);
3682 }
3683 sse_fn_epp = sse_op_table2[((b - 1) & 3) * 8 +
3684 (((modrm >> 3)) & 7)][b1];
3685 if (!sse_fn_epp) {
3686 goto illegal_op;
3687 }
3688 if (is_xmm) {
3689 rm = (modrm & 7) | REX_B(s);
3690 op2_offset = offsetof(CPUX86State,xmm_regs[rm]);
3691 } else {
3692 rm = (modrm & 7);
3693 op2_offset = offsetof(CPUX86State,fpregs[rm].mmx);
3694 }
3695 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, op2_offset);
3696 tcg_gen_addi_ptr(cpu_ptr1, cpu_env, op1_offset);
3697 sse_fn_epp(cpu_env, cpu_ptr0, cpu_ptr1);
3698 break;
3699 case 0x050: /* movmskps */
3700 rm = (modrm & 7) | REX_B(s);
3701 tcg_gen_addi_ptr(cpu_ptr0, cpu_env,
3702 offsetof(CPUX86State,xmm_regs[rm]));
3703 gen_helper_movmskps(cpu_tmp2_i32, cpu_env, cpu_ptr0);
3704 tcg_gen_extu_i32_tl(cpu_T[0], cpu_tmp2_i32);
3705 gen_op_mov_reg_T0(OT_LONG, reg);
3706 break;
3707 case 0x150: /* movmskpd */
3708 rm = (modrm & 7) | REX_B(s);
3709 tcg_gen_addi_ptr(cpu_ptr0, cpu_env,
3710 offsetof(CPUX86State,xmm_regs[rm]));
3711 gen_helper_movmskpd(cpu_tmp2_i32, cpu_env, cpu_ptr0);
3712 tcg_gen_extu_i32_tl(cpu_T[0], cpu_tmp2_i32);
3713 gen_op_mov_reg_T0(OT_LONG, reg);
3714 break;
3715 case 0x02a: /* cvtpi2ps */
3716 case 0x12a: /* cvtpi2pd */
3717 gen_helper_enter_mmx(cpu_env);
3718 if (mod != 3) {
3719 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3720 op2_offset = offsetof(CPUX86State,mmx_t0);
3721 gen_ldq_env_A0(s->mem_index, op2_offset);
3722 } else {
3723 rm = (modrm & 7);
3724 op2_offset = offsetof(CPUX86State,fpregs[rm].mmx);
3725 }
3726 op1_offset = offsetof(CPUX86State,xmm_regs[reg]);
3727 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, op1_offset);
3728 tcg_gen_addi_ptr(cpu_ptr1, cpu_env, op2_offset);
3729 switch(b >> 8) {
3730 case 0x0:
3731 gen_helper_cvtpi2ps(cpu_env, cpu_ptr0, cpu_ptr1);
3732 break;
3733 default:
3734 case 0x1:
3735 gen_helper_cvtpi2pd(cpu_env, cpu_ptr0, cpu_ptr1);
3736 break;
3737 }
3738 break;
3739 case 0x22a: /* cvtsi2ss */
3740 case 0x32a: /* cvtsi2sd */
3741 ot = (s->dflag == 2) ? OT_QUAD : OT_LONG;
3742 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 0);
3743 op1_offset = offsetof(CPUX86State,xmm_regs[reg]);
3744 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, op1_offset);
3745 if (ot == OT_LONG) {
3746 SSEFunc_0_epi sse_fn_epi = sse_op_table3ai[(b >> 8) & 1];
3747 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
3748 sse_fn_epi(cpu_env, cpu_ptr0, cpu_tmp2_i32);
3749 } else {
3750 #ifdef TARGET_X86_64
3751 SSEFunc_0_epl sse_fn_epl = sse_op_table3aq[(b >> 8) & 1];
3752 sse_fn_epl(cpu_env, cpu_ptr0, cpu_T[0]);
3753 #else
3754 goto illegal_op;
3755 #endif
3756 }
3757 break;
3758 case 0x02c: /* cvttps2pi */
3759 case 0x12c: /* cvttpd2pi */
3760 case 0x02d: /* cvtps2pi */
3761 case 0x12d: /* cvtpd2pi */
3762 gen_helper_enter_mmx(cpu_env);
3763 if (mod != 3) {
3764 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3765 op2_offset = offsetof(CPUX86State,xmm_t0);
3766 gen_ldo_env_A0(s->mem_index, op2_offset);
3767 } else {
3768 rm = (modrm & 7) | REX_B(s);
3769 op2_offset = offsetof(CPUX86State,xmm_regs[rm]);
3770 }
3771 op1_offset = offsetof(CPUX86State,fpregs[reg & 7].mmx);
3772 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, op1_offset);
3773 tcg_gen_addi_ptr(cpu_ptr1, cpu_env, op2_offset);
3774 switch(b) {
3775 case 0x02c:
3776 gen_helper_cvttps2pi(cpu_env, cpu_ptr0, cpu_ptr1);
3777 break;
3778 case 0x12c:
3779 gen_helper_cvttpd2pi(cpu_env, cpu_ptr0, cpu_ptr1);
3780 break;
3781 case 0x02d:
3782 gen_helper_cvtps2pi(cpu_env, cpu_ptr0, cpu_ptr1);
3783 break;
3784 case 0x12d:
3785 gen_helper_cvtpd2pi(cpu_env, cpu_ptr0, cpu_ptr1);
3786 break;
3787 }
3788 break;
3789 case 0x22c: /* cvttss2si */
3790 case 0x32c: /* cvttsd2si */
3791 case 0x22d: /* cvtss2si */
3792 case 0x32d: /* cvtsd2si */
3793 ot = (s->dflag == 2) ? OT_QUAD : OT_LONG;
3794 if (mod != 3) {
3795 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3796 if ((b >> 8) & 1) {
3797 gen_ldq_env_A0(s->mem_index, offsetof(CPUX86State,xmm_t0.XMM_Q(0)));
3798 } else {
3799 gen_op_ld_T0_A0(OT_LONG + s->mem_index);
3800 tcg_gen_st32_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,xmm_t0.XMM_L(0)));
3801 }
3802 op2_offset = offsetof(CPUX86State,xmm_t0);
3803 } else {
3804 rm = (modrm & 7) | REX_B(s);
3805 op2_offset = offsetof(CPUX86State,xmm_regs[rm]);
3806 }
3807 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, op2_offset);
3808 if (ot == OT_LONG) {
3809 SSEFunc_i_ep sse_fn_i_ep =
3810 sse_op_table3bi[((b >> 7) & 2) | (b & 1)];
3811 sse_fn_i_ep(cpu_tmp2_i32, cpu_env, cpu_ptr0);
3812 tcg_gen_extu_i32_tl(cpu_T[0], cpu_tmp2_i32);
3813 } else {
3814 #ifdef TARGET_X86_64
3815 SSEFunc_l_ep sse_fn_l_ep =
3816 sse_op_table3bq[((b >> 7) & 2) | (b & 1)];
3817 sse_fn_l_ep(cpu_T[0], cpu_env, cpu_ptr0);
3818 #else
3819 goto illegal_op;
3820 #endif
3821 }
3822 gen_op_mov_reg_T0(ot, reg);
3823 break;
3824 case 0xc4: /* pinsrw */
3825 case 0x1c4:
3826 s->rip_offset = 1;
3827 gen_ldst_modrm(env, s, modrm, OT_WORD, OR_TMP0, 0);
3828 val = cpu_ldub_code(env, s->pc++);
3829 if (b1) {
3830 val &= 7;
3831 tcg_gen_st16_tl(cpu_T[0], cpu_env,
3832 offsetof(CPUX86State,xmm_regs[reg].XMM_W(val)));
3833 } else {
3834 val &= 3;
3835 tcg_gen_st16_tl(cpu_T[0], cpu_env,
3836 offsetof(CPUX86State,fpregs[reg].mmx.MMX_W(val)));
3837 }
3838 break;
3839 case 0xc5: /* pextrw */
3840 case 0x1c5:
3841 if (mod != 3)
3842 goto illegal_op;
3843 ot = (s->dflag == 2) ? OT_QUAD : OT_LONG;
3844 val = cpu_ldub_code(env, s->pc++);
3845 if (b1) {
3846 val &= 7;
3847 rm = (modrm & 7) | REX_B(s);
3848 tcg_gen_ld16u_tl(cpu_T[0], cpu_env,
3849 offsetof(CPUX86State,xmm_regs[rm].XMM_W(val)));
3850 } else {
3851 val &= 3;
3852 rm = (modrm & 7);
3853 tcg_gen_ld16u_tl(cpu_T[0], cpu_env,
3854 offsetof(CPUX86State,fpregs[rm].mmx.MMX_W(val)));
3855 }
3856 reg = ((modrm >> 3) & 7) | rex_r;
3857 gen_op_mov_reg_T0(ot, reg);
3858 break;
3859 case 0x1d6: /* movq ea, xmm */
3860 if (mod != 3) {
3861 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3862 gen_stq_env_A0(s->mem_index, offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0)));
3863 } else {
3864 rm = (modrm & 7) | REX_B(s);
3865 gen_op_movq(offsetof(CPUX86State,xmm_regs[rm].XMM_Q(0)),
3866 offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0)));
3867 gen_op_movq_env_0(offsetof(CPUX86State,xmm_regs[rm].XMM_Q(1)));
3868 }
3869 break;
3870 case 0x2d6: /* movq2dq */
3871 gen_helper_enter_mmx(cpu_env);
3872 rm = (modrm & 7);
3873 gen_op_movq(offsetof(CPUX86State,xmm_regs[reg].XMM_Q(0)),
3874 offsetof(CPUX86State,fpregs[rm].mmx));
3875 gen_op_movq_env_0(offsetof(CPUX86State,xmm_regs[reg].XMM_Q(1)));
3876 break;
3877 case 0x3d6: /* movdq2q */
3878 gen_helper_enter_mmx(cpu_env);
3879 rm = (modrm & 7) | REX_B(s);
3880 gen_op_movq(offsetof(CPUX86State,fpregs[reg & 7].mmx),
3881 offsetof(CPUX86State,xmm_regs[rm].XMM_Q(0)));
3882 break;
3883 case 0xd7: /* pmovmskb */
3884 case 0x1d7:
3885 if (mod != 3)
3886 goto illegal_op;
3887 if (b1) {
3888 rm = (modrm & 7) | REX_B(s);
3889 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, offsetof(CPUX86State,xmm_regs[rm]));
3890 gen_helper_pmovmskb_xmm(cpu_tmp2_i32, cpu_env, cpu_ptr0);
3891 } else {
3892 rm = (modrm & 7);
3893 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, offsetof(CPUX86State,fpregs[rm].mmx));
3894 gen_helper_pmovmskb_mmx(cpu_tmp2_i32, cpu_env, cpu_ptr0);
3895 }
3896 tcg_gen_extu_i32_tl(cpu_T[0], cpu_tmp2_i32);
3897 reg = ((modrm >> 3) & 7) | rex_r;
3898 gen_op_mov_reg_T0(OT_LONG, reg);
3899 break;
3900 case 0x138:
3901 if (s->prefix & PREFIX_REPNZ)
3902 goto crc32;
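        /* fall through */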
3903 case 0x038:
3904 b = modrm;
3905 modrm = cpu_ldub_code(env, s->pc++);
3906 rm = modrm & 7;
3907 reg = ((modrm >> 3) & 7) | rex_r;
3908 mod = (modrm >> 6) & 3;
3909 if (b1 >= 2) {
3910 goto illegal_op;
3911 }
3912
3913 sse_fn_epp = sse_op_table6[b].op[b1];
3914 if (!sse_fn_epp) {
3915 goto illegal_op;
3916 }
3917 if (!(s->cpuid_ext_features & sse_op_table6[b].ext_mask))
3918 goto illegal_op;
3919
3920 if (b1) {
3921 op1_offset = offsetof(CPUX86State,xmm_regs[reg]);
3922 if (mod == 3) {
3923 op2_offset = offsetof(CPUX86State,xmm_regs[rm | REX_B(s)]);
3924 } else {
3925 op2_offset = offsetof(CPUX86State,xmm_t0);
3926 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3927 switch (b) {
3928 case 0x20: case 0x30: /* pmovsxbw, pmovzxbw */
3929 case 0x23: case 0x33: /* pmovsxwd, pmovzxwd */
3930 case 0x25: case 0x35: /* pmovsxdq, pmovzxdq */
3931 gen_ldq_env_A0(s->mem_index, op2_offset +
3932 offsetof(XMMReg, XMM_Q(0)));
3933 break;
3934 case 0x21: case 0x31: /* pmovsxbd, pmovzxbd */
3935 case 0x24: case 0x34: /* pmovsxwq, pmovzxwq */
3936 tcg_gen_qemu_ld32u(cpu_tmp0, cpu_A0,
3937 (s->mem_index >> 2) - 1);
3938 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_tmp0);
3939 tcg_gen_st_i32(cpu_tmp2_i32, cpu_env, op2_offset +
3940 offsetof(XMMReg, XMM_L(0)));
3941 break;
3942 case 0x22: case 0x32: /* pmovsxbq, pmovzxbq */
3943 tcg_gen_qemu_ld16u(cpu_tmp0, cpu_A0,
3944 (s->mem_index >> 2) - 1);
3945 tcg_gen_st16_tl(cpu_tmp0, cpu_env, op2_offset +
3946 offsetof(XMMReg, XMM_W(0)));
3947 break;
3948 case 0x2a: /* movntdqa */
3949 gen_ldo_env_A0(s->mem_index, op1_offset);
3950 return;
3951 default:
3952 gen_ldo_env_A0(s->mem_index, op2_offset);
3953 }
3954 }
3955 } else {
3956 op1_offset = offsetof(CPUX86State,fpregs[reg].mmx);
3957 if (mod == 3) {
3958 op2_offset = offsetof(CPUX86State,fpregs[rm].mmx);
3959 } else {
3960 op2_offset = offsetof(CPUX86State,mmx_t0);
3961 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
3962 gen_ldq_env_A0(s->mem_index, op2_offset);
3963 }
3964 }
3965 if (sse_fn_epp == SSE_SPECIAL) {
3966 goto illegal_op;
3967 }
3968
3969 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, op1_offset);
3970 tcg_gen_addi_ptr(cpu_ptr1, cpu_env, op2_offset);
3971 sse_fn_epp(cpu_env, cpu_ptr0, cpu_ptr1);
3972
3973 if (b == 0x17) {
3974 set_cc_op(s, CC_OP_EFLAGS);
3975 }
3976 break;
3977 case 0x338: /* crc32 */
3978 crc32:
3979 b = modrm;
3980 modrm = cpu_ldub_code(env, s->pc++);
3981 reg = ((modrm >> 3) & 7) | rex_r;
3982
3983 if (b != 0xf0 && b != 0xf1)
3984 goto illegal_op;
3985 if (!(s->cpuid_ext_features & CPUID_EXT_SSE42))
3986 goto illegal_op;
3987
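/* operand size: 0xf0 is the byte form; for 0xf1 a 0x66 prefix
   selects 16 bits, REX.W selects 64 bits, 32 bits otherwise */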
3988 if (b == 0xf0) {
3989 ot = OT_BYTE;
3990 } else if (b == 0xf1 && s->dflag != 2) {
3991 if (s->prefix & PREFIX_DATA)
3992 ot = OT_WORD;
3993 else
3994 ot = OT_LONG;
3995 } else {
3996 ot = OT_QUAD;
}
3997
3998 gen_op_mov_TN_reg(OT_LONG, 0, reg);
3999 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
4000 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 0);
4001 gen_helper_crc32(cpu_T[0], cpu_tmp2_i32,
4002 cpu_T[0], tcg_const_i32(8 << ot));
4003
4004 ot = (s->dflag == 2) ? OT_QUAD : OT_LONG;
4005 gen_op_mov_reg_T0(ot, reg);
4006 break;
4007 case 0x03a:
4008 case 0x13a:
4009 b = modrm;
4010 modrm = cpu_ldub_code(env, s->pc++);
4011 rm = modrm & 7;
4012 reg = ((modrm >> 3) & 7) | rex_r;
4013 mod = (modrm >> 6) & 3;
4014 if (b1 >= 2) {
4015 goto illegal_op;
4016 }
4017
4018 sse_fn_eppi = sse_op_table7[b].op[b1];
4019 if (!sse_fn_eppi) {
4020 goto illegal_op;
4021 }
4022 if (!(s->cpuid_ext_features & sse_op_table7[b].ext_mask))
4023 goto illegal_op;
4024
4025 if (sse_fn_eppi == SSE_SPECIAL) {
4026 ot = (s->dflag == 2) ? OT_QUAD : OT_LONG;
4027 rm = (modrm & 7) | REX_B(s);
4028 if (mod != 3)
4029 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
4030 reg = ((modrm >> 3) & 7) | rex_r;
4031 val = cpu_ldub_code(env, s->pc++);
4032 switch (b) {
4033 case 0x14: /* pextrb */
4034 tcg_gen_ld8u_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,
4035 xmm_regs[reg].XMM_B(val & 15)));
4036 if (mod == 3)
4037 gen_op_mov_reg_T0(ot, rm);
4038 else
4039 tcg_gen_qemu_st8(cpu_T[0], cpu_A0,
4040 (s->mem_index >> 2) - 1);
4041 break;
4042 case 0x15: /* pextrw */
4043 tcg_gen_ld16u_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,
4044 xmm_regs[reg].XMM_W(val & 7)));
4045 if (mod == 3)
4046 gen_op_mov_reg_T0(ot, rm);
4047 else
4048 tcg_gen_qemu_st16(cpu_T[0], cpu_A0,
4049 (s->mem_index >> 2) - 1);
4050 break;
4051 case 0x16:
4052 if (ot == OT_LONG) { /* pextrd */
4053 tcg_gen_ld_i32(cpu_tmp2_i32, cpu_env,
4054 offsetof(CPUX86State,
4055 xmm_regs[reg].XMM_L(val & 3)));
4056 tcg_gen_extu_i32_tl(cpu_T[0], cpu_tmp2_i32);
4057 if (mod == 3)
4058 gen_op_mov_reg_v(ot, rm, cpu_T[0]);
4059 else
4060 tcg_gen_qemu_st32(cpu_T[0], cpu_A0,
4061 (s->mem_index >> 2) - 1);
4062 } else { /* pextrq */
4063 #ifdef TARGET_X86_64
4064 tcg_gen_ld_i64(cpu_tmp1_i64, cpu_env,
4065 offsetof(CPUX86State,
4066 xmm_regs[reg].XMM_Q(val & 1)));
4067 if (mod == 3)
4068 gen_op_mov_reg_v(ot, rm, cpu_tmp1_i64);
4069 else
4070 tcg_gen_qemu_st64(cpu_tmp1_i64, cpu_A0,
4071 (s->mem_index >> 2) - 1);
4072 #else
4073 goto illegal_op;
4074 #endif
4075 }
4076 break;
4077 case 0x17: /* extractps */
4078 tcg_gen_ld32u_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,
4079 xmm_regs[reg].XMM_L(val & 3)));
4080 if (mod == 3)
4081 gen_op_mov_reg_T0(ot, rm);
4082 else
4083 tcg_gen_qemu_st32(cpu_T[0], cpu_A0,
4084 (s->mem_index >> 2) - 1);
4085 break;
4086 case 0x20: /* pinsrb */
4087 if (mod == 3)
4088 gen_op_mov_TN_reg(OT_LONG, 0, rm);
4089 else
4090 tcg_gen_qemu_ld8u(cpu_tmp0, cpu_A0,
4091 (s->mem_index >> 2) - 1);
4092 tcg_gen_st8_tl(cpu_tmp0, cpu_env, offsetof(CPUX86State,
4093 xmm_regs[reg].XMM_B(val & 15)));
4094 break;
4095 case 0x21: /* insertps */
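/* insertps imm8: bits 7:6 select the source dword (register
   form), bits 5:4 the destination dword, bits 3:0 zero dwords */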
4096 if (mod == 3) {
4097 tcg_gen_ld_i32(cpu_tmp2_i32, cpu_env,
4098 offsetof(CPUX86State,xmm_regs[rm]
4099 .XMM_L((val >> 6) & 3)));
4100 } else {
4101 tcg_gen_qemu_ld32u(cpu_tmp0, cpu_A0,
4102 (s->mem_index >> 2) - 1);
4103 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_tmp0);
4104 }
4105 tcg_gen_st_i32(cpu_tmp2_i32, cpu_env,
4106 offsetof(CPUX86State,xmm_regs[reg]
4107 .XMM_L((val >> 4) & 3)));
4108 if ((val >> 0) & 1)
4109 tcg_gen_st_i32(tcg_const_i32(0 /*float32_zero*/),
4110 cpu_env, offsetof(CPUX86State,
4111 xmm_regs[reg].XMM_L(0)));
4112 if ((val >> 1) & 1)
4113 tcg_gen_st_i32(tcg_const_i32(0 /*float32_zero*/),
4114 cpu_env, offsetof(CPUX86State,
4115 xmm_regs[reg].XMM_L(1)));
4116 if ((val >> 2) & 1)
4117 tcg_gen_st_i32(tcg_const_i32(0 /*float32_zero*/),
4118 cpu_env, offsetof(CPUX86State,
4119 xmm_regs[reg].XMM_L(2)));
4120 if ((val >> 3) & 1)
4121 tcg_gen_st_i32(tcg_const_i32(0 /*float32_zero*/),
4122 cpu_env, offsetof(CPUX86State,
4123 xmm_regs[reg].XMM_L(3)));
4124 break;
4125 case 0x22:
4126 if (ot == OT_LONG) { /* pinsrd */
4127 if (mod == 3)
4128 gen_op_mov_v_reg(ot, cpu_tmp0, rm);
4129 else
4130 tcg_gen_qemu_ld32u(cpu_tmp0, cpu_A0,
4131 (s->mem_index >> 2) - 1);
4132 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_tmp0);
4133 tcg_gen_st_i32(cpu_tmp2_i32, cpu_env,
4134 offsetof(CPUX86State,
4135 xmm_regs[reg].XMM_L(val & 3)));
4136 } else { /* pinsrq */
4137 #ifdef TARGET_X86_64
4138 if (mod == 3)
4139 gen_op_mov_v_reg(ot, cpu_tmp1_i64, rm);
4140 else
4141 tcg_gen_qemu_ld64(cpu_tmp1_i64, cpu_A0,
4142 (s->mem_index >> 2) - 1);
4143 tcg_gen_st_i64(cpu_tmp1_i64, cpu_env,
4144 offsetof(CPUX86State,
4145 xmm_regs[reg].XMM_Q(val & 1)));
4146 #else
4147 goto illegal_op;
4148 #endif
4149 }
4150 break;
4151 }
4152 return;
4153 }
4154
4155 if (b1) {
4156 op1_offset = offsetof(CPUX86State,xmm_regs[reg]);
4157 if (mod == 3) {
4158 op2_offset = offsetof(CPUX86State,xmm_regs[rm | REX_B(s)]);
4159 } else {
4160 op2_offset = offsetof(CPUX86State,xmm_t0);
4161 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
4162 gen_ldo_env_A0(s->mem_index, op2_offset);
4163 }
4164 } else {
4165 op1_offset = offsetof(CPUX86State,fpregs[reg].mmx);
4166 if (mod == 3) {
4167 op2_offset = offsetof(CPUX86State,fpregs[rm].mmx);
4168 } else {
4169 op2_offset = offsetof(CPUX86State,mmx_t0);
4170 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
4171 gen_ldq_env_A0(s->mem_index, op2_offset);
4172 }
4173 }
4174 val = cpu_ldub_code(env, s->pc++);
4175
4176 if ((b & 0xfc) == 0x60) { /* pcmpXstrX */
4177 set_cc_op(s, CC_OP_EFLAGS);
4178
4179 if (s->dflag == 2)
4180 /* The helper must use entire 64-bit gp registers */
4181 val |= 1 << 8;
4182 }
4183
4184 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, op1_offset);
4185 tcg_gen_addi_ptr(cpu_ptr1, cpu_env, op2_offset);
4186 sse_fn_eppi(cpu_env, cpu_ptr0, cpu_ptr1, tcg_const_i32(val));
4187 break;
4188 default:
4189 goto illegal_op;
4190 }
4191 } else {
4192 /* generic MMX or SSE operation */
4193 switch(b) {
4194 case 0x70: /* pshufw/pshufd insn */
4195 case 0xc6: /* shufps/shufpd insn */
4196 case 0xc2: /* compare insns */
4197 s->rip_offset = 1;
4198 break;
4199 default:
4200 break;
4201 }
4202 if (is_xmm) {
4203 op1_offset = offsetof(CPUX86State,xmm_regs[reg]);
4204 if (mod != 3) {
4205 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
4206 op2_offset = offsetof(CPUX86State,xmm_t0);
4207 if (b1 >= 2 && ((b >= 0x50 && b <= 0x5f && b != 0x5b) ||
4208 b == 0xc2)) {
4209 /* specific case for SSE single instructions */
4210 if (b1 == 2) {
4211 /* 32 bit access */
4212 gen_op_ld_T0_A0(OT_LONG + s->mem_index);
4213 tcg_gen_st32_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,xmm_t0.XMM_L(0)));
4214 } else {
4215 /* 64 bit access */
4216 gen_ldq_env_A0(s->mem_index, offsetof(CPUX86State,xmm_t0.XMM_D(0)));
4217 }
4218 } else {
4219 gen_ldo_env_A0(s->mem_index, op2_offset);
4220 }
4221 } else {
4222 rm = (modrm & 7) | REX_B(s);
4223 op2_offset = offsetof(CPUX86State,xmm_regs[rm]);
4224 }
4225 } else {
4226 op1_offset = offsetof(CPUX86State,fpregs[reg].mmx);
4227 if (mod != 3) {
4228 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
4229 op2_offset = offsetof(CPUX86State,mmx_t0);
4230 gen_ldq_env_A0(s->mem_index, op2_offset);
4231 } else {
4232 rm = (modrm & 7);
4233 op2_offset = offsetof(CPUX86State,fpregs[rm].mmx);
4234 }
4235 }
4236 switch(b) {
4237 case 0x0f: /* 3DNow! data insns */
4238 if (!(s->cpuid_ext2_features & CPUID_EXT2_3DNOW))
4239 goto illegal_op;
4240 val = cpu_ldub_code(env, s->pc++);
4241 sse_fn_epp = sse_op_table5[val];
4242 if (!sse_fn_epp) {
4243 goto illegal_op;
4244 }
4245 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, op1_offset);
4246 tcg_gen_addi_ptr(cpu_ptr1, cpu_env, op2_offset);
4247 sse_fn_epp(cpu_env, cpu_ptr0, cpu_ptr1);
4248 break;
4249 case 0x70: /* pshufw/pshufd insn */
4250 case 0xc6: /* shufps/shufpd insn */
4251 val = cpu_ldub_code(env, s->pc++);
4252 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, op1_offset);
4253 tcg_gen_addi_ptr(cpu_ptr1, cpu_env, op2_offset);
4254 /* XXX: introduce a new table? */
4255 sse_fn_ppi = (SSEFunc_0_ppi)sse_fn_epp;
4256 sse_fn_ppi(cpu_ptr0, cpu_ptr1, tcg_const_i32(val));
4257 break;
4258 case 0xc2:
4259 /* compare insns */
4260 val = cpu_ldub_code(env, s->pc++);
4261 if (val >= 8)
4262 goto illegal_op;
4263 sse_fn_epp = sse_op_table4[val][b1];
4264
4265 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, op1_offset);
4266 tcg_gen_addi_ptr(cpu_ptr1, cpu_env, op2_offset);
4267 sse_fn_epp(cpu_env, cpu_ptr0, cpu_ptr1);
4268 break;
4269 case 0xf7:
4270 /* maskmov: we must prepare A0 */
4271 if (mod != 3)
4272 goto illegal_op;
4273 #ifdef TARGET_X86_64
4274 if (s->aflag == 2) {
4275 gen_op_movq_A0_reg(R_EDI);
4276 } else
4277 #endif
4278 {
4279 gen_op_movl_A0_reg(R_EDI);
4280 if (s->aflag == 0)
4281 gen_op_andl_A0_ffff();
4282 }
4283 gen_add_A0_ds_seg(s);
4284
4285 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, op1_offset);
4286 tcg_gen_addi_ptr(cpu_ptr1, cpu_env, op2_offset);
4287 /* XXX: introduce a new table? */
4288 sse_fn_eppt = (SSEFunc_0_eppt)sse_fn_epp;
4289 sse_fn_eppt(cpu_env, cpu_ptr0, cpu_ptr1, cpu_A0);
4290 break;
4291 default:
4292 tcg_gen_addi_ptr(cpu_ptr0, cpu_env, op1_offset);
4293 tcg_gen_addi_ptr(cpu_ptr1, cpu_env, op2_offset);
4294 sse_fn_epp(cpu_env, cpu_ptr0, cpu_ptr1);
4295 break;
4296 }
4297 if (b == 0x2e || b == 0x2f) {
4298 set_cc_op(s, CC_OP_EFLAGS);
4299 }
4300 }
4301 }
4302
4303 /* convert one instruction. s->is_jmp is set if the translation must
4304 be stopped. Return the next pc value */
4305 static target_ulong disas_insn(CPUX86State *env, DisasContext *s,
4306 target_ulong pc_start)
4307 {
4308 int b, prefixes, aflag, dflag;
4309 int shift, ot;
4310 int modrm, reg, rm, mod, reg_addr, op, opreg, offset_addr, val;
4311 target_ulong next_eip, tval;
4312 int rex_w, rex_r;
4313
4314 if (unlikely(qemu_loglevel_mask(CPU_LOG_TB_OP | CPU_LOG_TB_OP_OPT))) {
4315 tcg_gen_debug_insn_start(pc_start);
4316 }
4317 s->pc = pc_start;
4318 prefixes = 0;
4319 aflag = s->code32;
4320 dflag = s->code32;
4321 s->override = -1;
4322 rex_w = -1;
4323 rex_r = 0;
4324 #ifdef TARGET_X86_64
4325 s->rex_x = 0;
4326 s->rex_b = 0;
4327 x86_64_hregs = 0;
4328 #endif
4329 s->rip_offset = 0; /* for relative ip address */
4330 next_byte:
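/* consume prefix bytes one at a time until a real opcode is seen */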
4331 b = cpu_ldub_code(env, s->pc);
4332 s->pc++;
4333 /* check prefixes */
4334 #ifdef TARGET_X86_64
4335 if (CODE64(s)) {
4336 switch (b) {
4337 case 0xf3:
4338 prefixes |= PREFIX_REPZ;
4339 goto next_byte;
4340 case 0xf2:
4341 prefixes |= PREFIX_REPNZ;
4342 goto next_byte;
4343 case 0xf0:
4344 prefixes |= PREFIX_LOCK;
4345 goto next_byte;
4346 case 0x2e:
4347 s->override = R_CS;
4348 goto next_byte;
4349 case 0x36:
4350 s->override = R_SS;
4351 goto next_byte;
4352 case 0x3e:
4353 s->override = R_DS;
4354 goto next_byte;
4355 case 0x26:
4356 s->override = R_ES;
4357 goto next_byte;
4358 case 0x64:
4359 s->override = R_FS;
4360 goto next_byte;
4361 case 0x65:
4362 s->override = R_GS;
4363 goto next_byte;
4364 case 0x66:
4365 prefixes |= PREFIX_DATA;
4366 goto next_byte;
4367 case 0x67:
4368 prefixes |= PREFIX_ADR;
4369 goto next_byte;
4370 case 0x40 ... 0x4f:
4371 /* REX prefix */
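/* REX is 0100WRXB; the R, X and B bits are shifted so that
   OR-ing them into a 3-bit reg/index/base field selects
   registers 8-15 */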
4372 rex_w = (b >> 3) & 1;
4373 rex_r = (b & 0x4) << 1;
4374 s->rex_x = (b & 0x2) << 2;
4375 REX_B(s) = (b & 0x1) << 3;
4376 x86_64_hregs = 1; /* select uniform byte register addressing */
4377 goto next_byte;
4378 }
4379 if (rex_w == 1) {
4380 /* 0x66 is ignored if rex.w is set */
4381 dflag = 2;
4382 } else {
4383 if (prefixes & PREFIX_DATA)
4384 dflag ^= 1;
4385 }
4386 if (!(prefixes & PREFIX_ADR))
4387 aflag = 2;
4388 } else
4389 #endif
4390 {
4391 switch (b) {
4392 case 0xf3:
4393 prefixes |= PREFIX_REPZ;
4394 goto next_byte;
4395 case 0xf2:
4396 prefixes |= PREFIX_REPNZ;
4397 goto next_byte;
4398 case 0xf0:
4399 prefixes |= PREFIX_LOCK;
4400 goto next_byte;
4401 case 0x2e:
4402 s->override = R_CS;
4403 goto next_byte;
4404 case 0x36:
4405 s->override = R_SS;
4406 goto next_byte;
4407 case 0x3e:
4408 s->override = R_DS;
4409 goto next_byte;
4410 case 0x26:
4411 s->override = R_ES;
4412 goto next_byte;
4413 case 0x64:
4414 s->override = R_FS;
4415 goto next_byte;
4416 case 0x65:
4417 s->override = R_GS;
4418 goto next_byte;
4419 case 0x66:
4420 prefixes |= PREFIX_DATA;
4421 goto next_byte;
4422 case 0x67:
4423 prefixes |= PREFIX_ADR;
4424 goto next_byte;
4425 }
4426 if (prefixes & PREFIX_DATA)
4427 dflag ^= 1;
4428 if (prefixes & PREFIX_ADR)
4429 aflag ^= 1;
4430 }
4431
4432 s->prefix = prefixes;
4433 s->aflag = aflag;
4434 s->dflag = dflag;
4435
4436 /* lock generation */
4437 if (prefixes & PREFIX_LOCK)
4438 gen_helper_lock();
4439
4440 /* now check op code */
4441 reswitch:
4442 switch(b) {
4443 case 0x0f:
4444 /**************************/
4445 /* extended op code */
4446 b = cpu_ldub_code(env, s->pc++) | 0x100;
4447 goto reswitch;
4448
4449 /**************************/
4450 /* arith & logic */
4451 case 0x00 ... 0x05:
4452 case 0x08 ... 0x0d:
4453 case 0x10 ... 0x15:
4454 case 0x18 ... 0x1d:
4455 case 0x20 ... 0x25:
4456 case 0x28 ... 0x2d:
4457 case 0x30 ... 0x35:
4458 case 0x38 ... 0x3d:
4459 {
4460 int op, f, val;
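/* opcodes 0x00-0x3d encode the ALU operation in bits 5:3 and
   the operand form (Ev,Gv / Gv,Ev / A,Iv) in bits 2:1;
   bit 0 selects byte vs full operand size */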
4461 op = (b >> 3) & 7;
4462 f = (b >> 1) & 3;
4463
4464 if ((b & 1) == 0)
4465 ot = OT_BYTE;
4466 else
4467 ot = dflag + OT_WORD;
4468
4469 switch(f) {
4470 case 0: /* OP Ev, Gv */
4471 modrm = cpu_ldub_code(env, s->pc++);
4472 reg = ((modrm >> 3) & 7) | rex_r;
4473 mod = (modrm >> 6) & 3;
4474 rm = (modrm & 7) | REX_B(s);
4475 if (mod != 3) {
4476 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
4477 opreg = OR_TMP0;
4478 } else if (op == OP_XORL && rm == reg) {
4479 xor_zero:
4480 /* xor reg, reg optimisation */
4481 gen_op_movl_T0_0();
4482 set_cc_op(s, CC_OP_LOGICB + ot);
4483 gen_op_mov_reg_T0(ot, reg);
4484 gen_op_update1_cc();
4485 break;
4486 } else {
4487 opreg = rm;
4488 }
4489 gen_op_mov_TN_reg(ot, 1, reg);
4490 gen_op(s, op, ot, opreg);
4491 break;
4492 case 1: /* OP Gv, Ev */
4493 modrm = cpu_ldub_code(env, s->pc++);
4494 mod = (modrm >> 6) & 3;
4495 reg = ((modrm >> 3) & 7) | rex_r;
4496 rm = (modrm & 7) | REX_B(s);
4497 if (mod != 3) {
4498 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
4499 gen_op_ld_T1_A0(ot + s->mem_index);
4500 } else if (op == OP_XORL && rm == reg) {
4501 goto xor_zero;
4502 } else {
4503 gen_op_mov_TN_reg(ot, 1, rm);
4504 }
4505 gen_op(s, op, ot, reg);
4506 break;
4507 case 2: /* OP A, Iv */
4508 val = insn_get(env, s, ot);
4509 gen_op_movl_T1_im(val);
4510 gen_op(s, op, ot, OR_EAX);
4511 break;
4512 }
4513 }
4514 break;
4515
4516 case 0x82:
4517 if (CODE64(s))
4518 goto illegal_op;
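/* fall through */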
4519 case 0x80: /* GRP1 */
4520 case 0x81:
4521 case 0x83:
4522 {
4523 int val;
4524
4525 if ((b & 1) == 0)
4526 ot = OT_BYTE;
4527 else
4528 ot = dflag + OT_WORD;
4529
4530 modrm = cpu_ldub_code(env, s->pc++);
4531 mod = (modrm >> 6) & 3;
4532 rm = (modrm & 7) | REX_B(s);
4533 op = (modrm >> 3) & 7;
4534
4535 if (mod != 3) {
4536 if (b == 0x83)
4537 s->rip_offset = 1;
4538 else
4539 s->rip_offset = insn_const_size(ot);
4540 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
4541 opreg = OR_TMP0;
4542 } else {
4543 opreg = rm;
4544 }
4545
4546 switch(b) {
4547 default:
4548 case 0x80:
4549 case 0x81:
4550 case 0x82:
4551 val = insn_get(env, s, ot);
4552 break;
4553 case 0x83:
4554 val = (int8_t)insn_get(env, s, OT_BYTE);
4555 break;
4556 }
4557 gen_op_movl_T1_im(val);
4558 gen_op(s, op, ot, opreg);
4559 }
4560 break;
4561
4562 /**************************/
4563 /* inc, dec, and other misc arith */
4564 case 0x40 ... 0x47: /* inc Gv */
4565 ot = dflag ? OT_LONG : OT_WORD;
4566 gen_inc(s, ot, OR_EAX + (b & 7), 1);
4567 break;
4568 case 0x48 ... 0x4f: /* dec Gv */
4569 ot = dflag ? OT_LONG : OT_WORD;
4570 gen_inc(s, ot, OR_EAX + (b & 7), -1);
4571 break;
4572 case 0xf6: /* GRP3 */
4573 case 0xf7:
4574 if ((b & 1) == 0)
4575 ot = OT_BYTE;
4576 else
4577 ot = dflag + OT_WORD;
4578
4579 modrm = cpu_ldub_code(env, s->pc++);
4580 mod = (modrm >> 6) & 3;
4581 rm = (modrm & 7) | REX_B(s);
4582 op = (modrm >> 3) & 7;
4583 if (mod != 3) {
4584 if (op == 0)
4585 s->rip_offset = insn_const_size(ot);
4586 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
4587 gen_op_ld_T0_A0(ot + s->mem_index);
4588 } else {
4589 gen_op_mov_TN_reg(ot, 0, rm);
4590 }
4591
4592 switch(op) {
4593 case 0: /* test */
4594 val = insn_get(env, s, ot);
4595 gen_op_movl_T1_im(val);
4596 gen_op_testl_T0_T1_cc();
4597 set_cc_op(s, CC_OP_LOGICB + ot);
4598 break;
4599 case 2: /* not */
4600 tcg_gen_not_tl(cpu_T[0], cpu_T[0]);
4601 if (mod != 3) {
4602 gen_op_st_T0_A0(ot + s->mem_index);
4603 } else {
4604 gen_op_mov_reg_T0(ot, rm);
4605 }
4606 break;
4607 case 3: /* neg */
4608 tcg_gen_neg_tl(cpu_T[0], cpu_T[0]);
4609 if (mod != 3) {
4610 gen_op_st_T0_A0(ot + s->mem_index);
4611 } else {
4612 gen_op_mov_reg_T0(ot, rm);
4613 }
4614 gen_op_update_neg_cc();
4615 set_cc_op(s, CC_OP_SUBB + ot);
4616 break;
4617 case 4: /* mul */
4618 switch(ot) {
4619 case OT_BYTE:
4620 gen_op_mov_TN_reg(OT_BYTE, 1, R_EAX);
4621 tcg_gen_ext8u_tl(cpu_T[0], cpu_T[0]);
4622 tcg_gen_ext8u_tl(cpu_T[1], cpu_T[1]);
4623 /* XXX: use 32 bit mul which could be faster */
4624 tcg_gen_mul_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
4625 gen_op_mov_reg_T0(OT_WORD, R_EAX);
4626 tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
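/* cc_src = high byte of the product; the MUL cc ops set CF
   and OF iff cc_src is non-zero */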
4627 tcg_gen_andi_tl(cpu_cc_src, cpu_T[0], 0xff00);
4628 set_cc_op(s, CC_OP_MULB);
4629 break;
4630 case OT_WORD:
4631 gen_op_mov_TN_reg(OT_WORD, 1, R_EAX);
4632 tcg_gen_ext16u_tl(cpu_T[0], cpu_T[0]);
4633 tcg_gen_ext16u_tl(cpu_T[1], cpu_T[1]);
4634 /* XXX: use 32 bit mul which could be faster */
4635 tcg_gen_mul_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
4636 gen_op_mov_reg_T0(OT_WORD, R_EAX);
4637 tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
4638 tcg_gen_shri_tl(cpu_T[0], cpu_T[0], 16);
4639 gen_op_mov_reg_T0(OT_WORD, R_EDX);
4640 tcg_gen_mov_tl(cpu_cc_src, cpu_T[0]);
4641 set_cc_op(s, CC_OP_MULW);
4642 break;
4643 default:
4644 case OT_LONG:
4645 #ifdef TARGET_X86_64
4646 gen_op_mov_TN_reg(OT_LONG, 1, R_EAX);
4647 tcg_gen_ext32u_tl(cpu_T[0], cpu_T[0]);
4648 tcg_gen_ext32u_tl(cpu_T[1], cpu_T[1]);
4649 tcg_gen_mul_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
4650 gen_op_mov_reg_T0(OT_LONG, R_EAX);
4651 tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
4652 tcg_gen_shri_tl(cpu_T[0], cpu_T[0], 32);
4653 gen_op_mov_reg_T0(OT_LONG, R_EDX);
4654 tcg_gen_mov_tl(cpu_cc_src, cpu_T[0]);
4655 #else
4656 {
4657 TCGv_i64 t0, t1;
4658 t0 = tcg_temp_new_i64();
4659 t1 = tcg_temp_new_i64();
4660 gen_op_mov_TN_reg(OT_LONG, 1, R_EAX);
4661 tcg_gen_extu_i32_i64(t0, cpu_T[0]);
4662 tcg_gen_extu_i32_i64(t1, cpu_T[1]);
4663 tcg_gen_mul_i64(t0, t0, t1);
4664 tcg_gen_trunc_i64_i32(cpu_T[0], t0);
4665 gen_op_mov_reg_T0(OT_LONG, R_EAX);
4666 tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
4667 tcg_gen_shri_i64(t0, t0, 32);
4668 tcg_gen_trunc_i64_i32(cpu_T[0], t0);
4669 gen_op_mov_reg_T0(OT_LONG, R_EDX);
4670 tcg_gen_mov_tl(cpu_cc_src, cpu_T[0]);
4671 }
4672 #endif
4673 set_cc_op(s, CC_OP_MULL);
4674 break;
4675 #ifdef TARGET_X86_64
4676 case OT_QUAD:
4677 gen_helper_mulq_EAX_T0(cpu_env, cpu_T[0]);
4678 set_cc_op(s, CC_OP_MULQ);
4679 break;
4680 #endif
4681 }
4682 break;
4683 case 5: /* imul */
4684 switch(ot) {
4685 case OT_BYTE:
4686 gen_op_mov_TN_reg(OT_BYTE, 1, R_EAX);
4687 tcg_gen_ext8s_tl(cpu_T[0], cpu_T[0]);
4688 tcg_gen_ext8s_tl(cpu_T[1], cpu_T[1]);
4689 /* XXX: use 32 bit mul which could be faster */
4690 tcg_gen_mul_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
4691 gen_op_mov_reg_T0(OT_WORD, R_EAX);
4692 tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
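/* cc_src = result - sext(result): non-zero iff the signed
   product overflowed the destination width, which is what
   sets CF and OF for imul */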
4693 tcg_gen_ext8s_tl(cpu_tmp0, cpu_T[0]);
4694 tcg_gen_sub_tl(cpu_cc_src, cpu_T[0], cpu_tmp0);
4695 set_cc_op(s, CC_OP_MULB);
4696 break;
4697 case OT_WORD:
4698 gen_op_mov_TN_reg(OT_WORD, 1, R_EAX);
4699 tcg_gen_ext16s_tl(cpu_T[0], cpu_T[0]);
4700 tcg_gen_ext16s_tl(cpu_T[1], cpu_T[1]);
4701 /* XXX: use 32 bit mul which could be faster */
4702 tcg_gen_mul_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
4703 gen_op_mov_reg_T0(OT_WORD, R_EAX);
4704 tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
4705 tcg_gen_ext16s_tl(cpu_tmp0, cpu_T[0]);
4706 tcg_gen_sub_tl(cpu_cc_src, cpu_T[0], cpu_tmp0);
4707 tcg_gen_shri_tl(cpu_T[0], cpu_T[0], 16);
4708 gen_op_mov_reg_T0(OT_WORD, R_EDX);
4709 set_cc_op(s, CC_OP_MULW);
4710 break;
4711 default:
4712 case OT_LONG:
4713 #ifdef TARGET_X86_64
4714 gen_op_mov_TN_reg(OT_LONG, 1, R_EAX);
4715 tcg_gen_ext32s_tl(cpu_T[0], cpu_T[0]);
4716 tcg_gen_ext32s_tl(cpu_T[1], cpu_T[1]);
4717 tcg_gen_mul_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
4718 gen_op_mov_reg_T0(OT_LONG, R_EAX);
4719 tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
4720 tcg_gen_ext32s_tl(cpu_tmp0, cpu_T[0]);
4721 tcg_gen_sub_tl(cpu_cc_src, cpu_T[0], cpu_tmp0);
4722 tcg_gen_shri_tl(cpu_T[0], cpu_T[0], 32);
4723 gen_op_mov_reg_T0(OT_LONG, R_EDX);
4724 #else
4725 {
4726 TCGv_i64 t0, t1;
4727 t0 = tcg_temp_new_i64();
4728 t1 = tcg_temp_new_i64();
4729 gen_op_mov_TN_reg(OT_LONG, 1, R_EAX);
4730 tcg_gen_ext_i32_i64(t0, cpu_T[0]);
4731 tcg_gen_ext_i32_i64(t1, cpu_T[1]);
4732 tcg_gen_mul_i64(t0, t0, t1);
4733 tcg_gen_trunc_i64_i32(cpu_T[0], t0);
4734 gen_op_mov_reg_T0(OT_LONG, R_EAX);
4735 tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
4736 tcg_gen_sari_tl(cpu_tmp0, cpu_T[0], 31);
4737 tcg_gen_shri_i64(t0, t0, 32);
4738 tcg_gen_trunc_i64_i32(cpu_T[0], t0);
4739 gen_op_mov_reg_T0(OT_LONG, R_EDX);
4740 tcg_gen_sub_tl(cpu_cc_src, cpu_T[0], cpu_tmp0);
4741 }
4742 #endif
4743 set_cc_op(s, CC_OP_MULL);
4744 break;
4745 #ifdef TARGET_X86_64
4746 case OT_QUAD:
4747 gen_helper_imulq_EAX_T0(cpu_env, cpu_T[0]);
4748 set_cc_op(s, CC_OP_MULQ);
4749 break;
4750 #endif
4751 }
4752 break;
4753 case 6: /* div */
4754 switch(ot) {
4755 case OT_BYTE:
4756 gen_jmp_im(pc_start - s->cs_base);
4757 gen_helper_divb_AL(cpu_env, cpu_T[0]);
4758 break;
4759 case OT_WORD:
4760 gen_jmp_im(pc_start - s->cs_base);
4761 gen_helper_divw_AX(cpu_env, cpu_T[0]);
4762 break;
4763 default:
4764 case OT_LONG:
4765 gen_jmp_im(pc_start - s->cs_base);
4766 gen_helper_divl_EAX(cpu_env, cpu_T[0]);
4767 break;
4768 #ifdef TARGET_X86_64
4769 case OT_QUAD:
4770 gen_jmp_im(pc_start - s->cs_base);
4771 gen_helper_divq_EAX(cpu_env, cpu_T[0]);
4772 break;
4773 #endif
4774 }
4775 break;
4776 case 7: /* idiv */
4777 switch(ot) {
4778 case OT_BYTE:
4779 gen_jmp_im(pc_start - s->cs_base);
4780 gen_helper_idivb_AL(cpu_env, cpu_T[0]);
4781 break;
4782 case OT_WORD:
4783 gen_jmp_im(pc_start - s->cs_base);
4784 gen_helper_idivw_AX(cpu_env, cpu_T[0]);
4785 break;
4786 default:
4787 case OT_LONG:
4788 gen_jmp_im(pc_start - s->cs_base);
4789 gen_helper_idivl_EAX(cpu_env, cpu_T[0]);
4790 break;
4791 #ifdef TARGET_X86_64
4792 case OT_QUAD:
4793 gen_jmp_im(pc_start - s->cs_base);
4794 gen_helper_idivq_EAX(cpu_env, cpu_T[0]);
4795 break;
4796 #endif
4797 }
4798 break;
4799 default:
4800 goto illegal_op;
4801 }
4802 break;
4803
4804 case 0xfe: /* GRP4 */
4805 case 0xff: /* GRP5 */
4806 if ((b & 1) == 0)
4807 ot = OT_BYTE;
4808 else
4809 ot = dflag + OT_WORD;
4810
4811 modrm = cpu_ldub_code(env, s->pc++);
4812 mod = (modrm >> 6) & 3;
4813 rm = (modrm & 7) | REX_B(s);
4814 op = (modrm >> 3) & 7;
4815 if (op >= 2 && b == 0xfe) {
4816 goto illegal_op;
4817 }
4818 if (CODE64(s)) {
4819 if (op == 2 || op == 4) {
4820 /* operand size for jumps is 64 bit */
4821 ot = OT_QUAD;
4822 } else if (op == 3 || op == 5) {
4823 ot = dflag ? OT_LONG + (rex_w == 1) : OT_WORD;
4824 } else if (op == 6) {
4825 /* default push size is 64 bit */
4826 ot = dflag ? OT_QUAD : OT_WORD;
4827 }
4828 }
4829 if (mod != 3) {
4830 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
4831 if (op >= 2 && op != 3 && op != 5)
4832 gen_op_ld_T0_A0(ot + s->mem_index);
4833 } else {
4834 gen_op_mov_TN_reg(ot, 0, rm);
4835 }
4836
4837 switch(op) {
4838 case 0: /* inc Ev */
4839 if (mod != 3)
4840 opreg = OR_TMP0;
4841 else
4842 opreg = rm;
4843 gen_inc(s, ot, opreg, 1);
4844 break;
4845 case 1: /* dec Ev */
4846 if (mod != 3)
4847 opreg = OR_TMP0;
4848 else
4849 opreg = rm;
4850 gen_inc(s, ot, opreg, -1);
4851 break;
4852 case 2: /* call Ev */
4853 /* XXX: optimize if memory (no 'and' is necessary) */
4854 if (s->dflag == 0)
4855 gen_op_andl_T0_ffff();
4856 next_eip = s->pc - s->cs_base;
4857 gen_movtl_T1_im(next_eip);
4858 gen_push_T1(s);
4859 gen_op_jmp_T0();
4860 gen_eob(s);
4861 break;
4862 case 3: /* lcall Ev */
4863 gen_op_ld_T1_A0(ot + s->mem_index);
4864 gen_add_A0_im(s, 1 << (ot - OT_WORD + 1));
4865 gen_op_ldu_T0_A0(OT_WORD + s->mem_index);
4866 do_lcall:
4867 if (s->pe && !s->vm86) {
4868 gen_update_cc_op(s);
4869 gen_jmp_im(pc_start - s->cs_base);
4870 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
4871 gen_helper_lcall_protected(cpu_env, cpu_tmp2_i32, cpu_T[1],
4872 tcg_const_i32(dflag),
4873 tcg_const_i32(s->pc - pc_start));
4874 } else {
4875 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
4876 gen_helper_lcall_real(cpu_env, cpu_tmp2_i32, cpu_T[1],
4877 tcg_const_i32(dflag),
4878 tcg_const_i32(s->pc - s->cs_base));
4879 }
4880 gen_eob(s);
4881 break;
4882 case 4: /* jmp Ev */
4883 if (s->dflag == 0)
4884 gen_op_andl_T0_ffff();
4885 gen_op_jmp_T0();
4886 gen_eob(s);
4887 break;
4888 case 5: /* ljmp Ev */
4889 gen_op_ld_T1_A0(ot + s->mem_index);
4890 gen_add_A0_im(s, 1 << (ot - OT_WORD + 1));
4891 gen_op_ldu_T0_A0(OT_WORD + s->mem_index);
4892 do_ljmp:
4893 if (s->pe && !s->vm86) {
4894 gen_update_cc_op(s);
4895 gen_jmp_im(pc_start - s->cs_base);
4896 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
4897 gen_helper_ljmp_protected(cpu_env, cpu_tmp2_i32, cpu_T[1],
4898 tcg_const_i32(s->pc - pc_start));
4899 } else {
4900 gen_op_movl_seg_T0_vm(R_CS);
4901 gen_op_movl_T0_T1();
4902 gen_op_jmp_T0();
4903 }
4904 gen_eob(s);
4905 break;
4906 case 6: /* push Ev */
4907 gen_push_T0(s);
4908 break;
4909 default:
4910 goto illegal_op;
4911 }
4912 break;
4913
4914 case 0x84: /* test Ev, Gv */
4915 case 0x85:
4916 if ((b & 1) == 0)
4917 ot = OT_BYTE;
4918 else
4919 ot = dflag + OT_WORD;
4920
4921 modrm = cpu_ldub_code(env, s->pc++);
4922 reg = ((modrm >> 3) & 7) | rex_r;
4923
4924 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 0);
4925 gen_op_mov_TN_reg(ot, 1, reg);
4926 gen_op_testl_T0_T1_cc();
4927 set_cc_op(s, CC_OP_LOGICB + ot);
4928 break;
4929
4930 case 0xa8: /* test eAX, Iv */
4931 case 0xa9:
4932 if ((b & 1) == 0)
4933 ot = OT_BYTE;
4934 else
4935 ot = dflag + OT_WORD;
4936 val = insn_get(env, s, ot);
4937
4938 gen_op_mov_TN_reg(ot, 0, OR_EAX);
4939 gen_op_movl_T1_im(val);
4940 gen_op_testl_T0_T1_cc();
4941 set_cc_op(s, CC_OP_LOGICB + ot);
4942 break;
4943
4944 case 0x98: /* CWDE/CBW */
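/* CBW/CWDE/CDQE: sign-extend the accumulator in place,
   AL->AX, AX->EAX or EAX->RAX depending on operand size */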
4945 #ifdef TARGET_X86_64
4946 if (dflag == 2) {
4947 gen_op_mov_TN_reg(OT_LONG, 0, R_EAX);
4948 tcg_gen_ext32s_tl(cpu_T[0], cpu_T[0]);
4949 gen_op_mov_reg_T0(OT_QUAD, R_EAX);
4950 } else
4951 #endif
4952 if (dflag == 1) {
4953 gen_op_mov_TN_reg(OT_WORD, 0, R_EAX);
4954 tcg_gen_ext16s_tl(cpu_T[0], cpu_T[0]);
4955 gen_op_mov_reg_T0(OT_LONG, R_EAX);
4956 } else {
4957 gen_op_mov_TN_reg(OT_BYTE, 0, R_EAX);
4958 tcg_gen_ext8s_tl(cpu_T[0], cpu_T[0]);
4959 gen_op_mov_reg_T0(OT_WORD, R_EAX);
4960 }
4961 break;
4962 case 0x99: /* CDQ/CWD */
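/* CWD/CDQ/CQO: replicate the accumulator's sign bit into
   DX/EDX/RDX with an arithmetic right shift */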
4963 #ifdef TARGET_X86_64
4964 if (dflag == 2) {
4965 gen_op_mov_TN_reg(OT_QUAD, 0, R_EAX);
4966 tcg_gen_sari_tl(cpu_T[0], cpu_T[0], 63);
4967 gen_op_mov_reg_T0(OT_QUAD, R_EDX);
4968 } else
4969 #endif
4970 if (dflag == 1) {
4971 gen_op_mov_TN_reg(OT_LONG, 0, R_EAX);
4972 tcg_gen_ext32s_tl(cpu_T[0], cpu_T[0]);
4973 tcg_gen_sari_tl(cpu_T[0], cpu_T[0], 31);
4974 gen_op_mov_reg_T0(OT_LONG, R_EDX);
4975 } else {
4976 gen_op_mov_TN_reg(OT_WORD, 0, R_EAX);
4977 tcg_gen_ext16s_tl(cpu_T[0], cpu_T[0]);
4978 tcg_gen_sari_tl(cpu_T[0], cpu_T[0], 15);
4979 gen_op_mov_reg_T0(OT_WORD, R_EDX);
4980 }
4981 break;
4982 case 0x1af: /* imul Gv, Ev */
4983 case 0x69: /* imul Gv, Ev, I */
4984 case 0x6b:
4985 ot = dflag + OT_WORD;
4986 modrm = cpu_ldub_code(env, s->pc++);
4987 reg = ((modrm >> 3) & 7) | rex_r;
4988 if (b == 0x69)
4989 s->rip_offset = insn_const_size(ot);
4990 else if (b == 0x6b)
4991 s->rip_offset = 1;
4992 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 0);
4993 if (b == 0x69) {
4994 val = insn_get(env, s, ot);
4995 gen_op_movl_T1_im(val);
4996 } else if (b == 0x6b) {
4997 val = (int8_t)insn_get(env, s, OT_BYTE);
4998 gen_op_movl_T1_im(val);
4999 } else {
5000 gen_op_mov_TN_reg(ot, 1, reg);
5001 }
5002
5003 #ifdef TARGET_X86_64
5004 if (ot == OT_QUAD) {
5005 gen_helper_imulq_T0_T1(cpu_T[0], cpu_env, cpu_T[0], cpu_T[1]);
5006 } else
5007 #endif
5008 if (ot == OT_LONG) {
5009 #ifdef TARGET_X86_64
5010 tcg_gen_ext32s_tl(cpu_T[0], cpu_T[0]);
5011 tcg_gen_ext32s_tl(cpu_T[1], cpu_T[1]);
5012 tcg_gen_mul_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
5013 tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
5014 tcg_gen_ext32s_tl(cpu_tmp0, cpu_T[0]);
5015 tcg_gen_sub_tl(cpu_cc_src, cpu_T[0], cpu_tmp0);
5016 #else
5017 {
5018 TCGv_i64 t0, t1;
5019 t0 = tcg_temp_new_i64();
5020 t1 = tcg_temp_new_i64();
5021 tcg_gen_ext_i32_i64(t0, cpu_T[0]);
5022 tcg_gen_ext_i32_i64(t1, cpu_T[1]);
5023 tcg_gen_mul_i64(t0, t0, t1);
5024 tcg_gen_trunc_i64_i32(cpu_T[0], t0);
5025 tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
5026 tcg_gen_sari_tl(cpu_tmp0, cpu_T[0], 31);
5027 tcg_gen_shri_i64(t0, t0, 32);
5028 tcg_gen_trunc_i64_i32(cpu_T[1], t0);
5029 tcg_gen_sub_tl(cpu_cc_src, cpu_T[1], cpu_tmp0);
5030 }
5031 #endif
5032 } else {
5033 tcg_gen_ext16s_tl(cpu_T[0], cpu_T[0]);
5034 tcg_gen_ext16s_tl(cpu_T[1], cpu_T[1]);
5035 /* XXX: use 32 bit mul which could be faster */
5036 tcg_gen_mul_tl(cpu_T[0], cpu_T[0], cpu_T[1]);
5037 tcg_gen_mov_tl(cpu_cc_dst, cpu_T[0]);
5038 tcg_gen_ext16s_tl(cpu_tmp0, cpu_T[0]);
5039 tcg_gen_sub_tl(cpu_cc_src, cpu_T[0], cpu_tmp0);
5040 }
5041 gen_op_mov_reg_T0(ot, reg);
5042 set_cc_op(s, CC_OP_MULB + ot);
5043 break;
5044 case 0x1c0:
5045 case 0x1c1: /* xadd Ev, Gv */
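/* exchange and add: the destination gets the sum, the source
   register gets the old destination value */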
5046 if ((b & 1) == 0)
5047 ot = OT_BYTE;
5048 else
5049 ot = dflag + OT_WORD;
5050 modrm = cpu_ldub_code(env, s->pc++);
5051 reg = ((modrm >> 3) & 7) | rex_r;
5052 mod = (modrm >> 6) & 3;
5053 if (mod == 3) {
5054 rm = (modrm & 7) | REX_B(s);
5055 gen_op_mov_TN_reg(ot, 0, reg);
5056 gen_op_mov_TN_reg(ot, 1, rm);
5057 gen_op_addl_T0_T1();
5058 gen_op_mov_reg_T1(ot, reg);
5059 gen_op_mov_reg_T0(ot, rm);
5060 } else {
5061 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
5062 gen_op_mov_TN_reg(ot, 0, reg);
5063 gen_op_ld_T1_A0(ot + s->mem_index);
5064 gen_op_addl_T0_T1();
5065 gen_op_st_T0_A0(ot + s->mem_index);
5066 gen_op_mov_reg_T1(ot, reg);
5067 }
5068 gen_op_update2_cc();
5069 set_cc_op(s, CC_OP_ADDB + ot);
5070 break;
5071 case 0x1b0:
5072 case 0x1b1: /* cmpxchg Ev, Gv */
5073 {
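/* compare the accumulator with the destination; if equal store
   the source into the destination, else load the destination
   into the accumulator; ZF comes from the subtraction below */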
5074 int label1, label2;
5075 TCGv t0, t1, t2, a0;
5076
5077 if ((b & 1) == 0)
5078 ot = OT_BYTE;
5079 else
5080 ot = dflag + OT_WORD;
5081 modrm = cpu_ldub_code(env, s->pc++);
5082 reg = ((modrm >> 3) & 7) | rex_r;
5083 mod = (modrm >> 6) & 3;
5084 t0 = tcg_temp_local_new();
5085 t1 = tcg_temp_local_new();
5086 t2 = tcg_temp_local_new();
5087 a0 = tcg_temp_local_new();
5088 gen_op_mov_v_reg(ot, t1, reg);
5089 if (mod == 3) {
5090 rm = (modrm & 7) | REX_B(s);
5091 gen_op_mov_v_reg(ot, t0, rm);
5092 } else {
5093 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
5094 tcg_gen_mov_tl(a0, cpu_A0);
5095 gen_op_ld_v(ot + s->mem_index, t0, a0);
5096 rm = 0; /* avoid warning */
5097 }
5098 label1 = gen_new_label();
5099 tcg_gen_sub_tl(t2, cpu_regs[R_EAX], t0);
5100 gen_extu(ot, t2);
5101 tcg_gen_brcondi_tl(TCG_COND_EQ, t2, 0, label1);
5102 label2 = gen_new_label();
5103 if (mod == 3) {
5104 gen_op_mov_reg_v(ot, R_EAX, t0);
5105 tcg_gen_br(label2);
5106 gen_set_label(label1);
5107 gen_op_mov_reg_v(ot, rm, t1);
5108 } else {
5109 /* perform no-op store cycle like physical cpu; must be
5110 before changing accumulator to ensure idempotency if
5111 the store faults and the instruction is restarted */
5112 gen_op_st_v(ot + s->mem_index, t0, a0);
5113 gen_op_mov_reg_v(ot, R_EAX, t0);
5114 tcg_gen_br(label2);
5115 gen_set_label(label1);
5116 gen_op_st_v(ot + s->mem_index, t1, a0);
5117 }
5118 gen_set_label(label2);
5119 tcg_gen_mov_tl(cpu_cc_src, t0);
5120 tcg_gen_mov_tl(cpu_cc_dst, t2);
5121 set_cc_op(s, CC_OP_SUBB + ot);
5122 tcg_temp_free(t0);
5123 tcg_temp_free(t1);
5124 tcg_temp_free(t2);
5125 tcg_temp_free(a0);
5126 }
5127 break;
5128 case 0x1c7: /* cmpxchg8b */
5129 modrm = cpu_ldub_code(env, s->pc++);
5130 mod = (modrm >> 6) & 3;
5131 if ((mod == 3) || ((modrm & 0x38) != 0x8))
5132 goto illegal_op;
5133 #ifdef TARGET_X86_64
5134 if (dflag == 2) {
5135 if (!(s->cpuid_ext_features & CPUID_EXT_CX16))
5136 goto illegal_op;
5137 gen_jmp_im(pc_start - s->cs_base);
5138 gen_update_cc_op(s);
5139 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
5140 gen_helper_cmpxchg16b(cpu_env, cpu_A0);
5141 } else
5142 #endif
5143 {
5144 if (!(s->cpuid_features & CPUID_CX8))
5145 goto illegal_op;
5146 gen_jmp_im(pc_start - s->cs_base);
5147 gen_update_cc_op(s);
5148 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
5149 gen_helper_cmpxchg8b(cpu_env, cpu_A0);
5150 }
5151 set_cc_op(s, CC_OP_EFLAGS);
5152 break;
5153
5154 /**************************/
5155 /* push/pop */
5156 case 0x50 ... 0x57: /* push */
5157 gen_op_mov_TN_reg(OT_LONG, 0, (b & 7) | REX_B(s));
5158 gen_push_T0(s);
5159 break;
5160 case 0x58 ... 0x5f: /* pop */
5161 if (CODE64(s)) {
5162 ot = dflag ? OT_QUAD : OT_WORD;
5163 } else {
5164 ot = dflag + OT_WORD;
5165 }
5166 gen_pop_T0(s);
5167 /* NOTE: order is important for pop %sp */
5168 gen_pop_update(s);
5169 gen_op_mov_reg_T0(ot, (b & 7) | REX_B(s));
5170 break;
5171 case 0x60: /* pusha */
5172 if (CODE64(s))
5173 goto illegal_op;
5174 gen_pusha(s);
5175 break;
5176 case 0x61: /* popa */
5177 if (CODE64(s))
5178 goto illegal_op;
5179 gen_popa(s);
5180 break;
5181 case 0x68: /* push Iv */
5182 case 0x6a:
5183 if (CODE64(s)) {
5184 ot = dflag ? OT_QUAD : OT_WORD;
5185 } else {
5186 ot = dflag + OT_WORD;
5187 }
5188 if (b == 0x68)
5189 val = insn_get(env, s, ot);
5190 else
5191 val = (int8_t)insn_get(env, s, OT_BYTE);
5192 gen_op_movl_T0_im(val);
5193 gen_push_T0(s);
5194 break;
5195 case 0x8f: /* pop Ev */
5196 if (CODE64(s)) {
5197 ot = dflag ? OT_QUAD : OT_WORD;
5198 } else {
5199 ot = dflag + OT_WORD;
5200 }
5201 modrm = cpu_ldub_code(env, s->pc++);
5202 mod = (modrm >> 6) & 3;
5203 gen_pop_T0(s);
5204 if (mod == 3) {
5205 /* NOTE: order is important for pop %sp */
5206 gen_pop_update(s);
5207 rm = (modrm & 7) | REX_B(s);
5208 gen_op_mov_reg_T0(ot, rm);
5209 } else {
5210 /* NOTE: order is important too for MMU exceptions */
5211 s->popl_esp_hack = 1 << ot;
5212 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 1);
5213 s->popl_esp_hack = 0;
5214 gen_pop_update(s);
5215 }
5216 break;
5217 case 0xc8: /* enter */
5218 {
5219 int level;
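/* enter: 16-bit immediate frame size, 8-bit nesting level */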
5220 val = cpu_lduw_code(env, s->pc);
5221 s->pc += 2;
5222 level = cpu_ldub_code(env, s->pc++);
5223 gen_enter(s, val, level);
5224 }
5225 break;
5226 case 0xc9: /* leave */
5227 /* XXX: exception not precise (ESP is updated before potential exception) */
5228 if (CODE64(s)) {
5229 gen_op_mov_TN_reg(OT_QUAD, 0, R_EBP);
5230 gen_op_mov_reg_T0(OT_QUAD, R_ESP);
5231 } else if (s->ss32) {
5232 gen_op_mov_TN_reg(OT_LONG, 0, R_EBP);
5233 gen_op_mov_reg_T0(OT_LONG, R_ESP);
5234 } else {
5235 gen_op_mov_TN_reg(OT_WORD, 0, R_EBP);
5236 gen_op_mov_reg_T0(OT_WORD, R_ESP);
5237 }
5238 gen_pop_T0(s);
5239 if (CODE64(s)) {
5240 ot = dflag ? OT_QUAD : OT_WORD;
5241 } else {
5242 ot = dflag + OT_WORD;
5243 }
5244 gen_op_mov_reg_T0(ot, R_EBP);
5245 gen_pop_update(s);
5246 break;
5247 case 0x06: /* push es */
5248 case 0x0e: /* push cs */
5249 case 0x16: /* push ss */
5250 case 0x1e: /* push ds */
5251 if (CODE64(s))
5252 goto illegal_op;
5253 gen_op_movl_T0_seg(b >> 3);
5254 gen_push_T0(s);
5255 break;
5256 case 0x1a0: /* push fs */
5257 case 0x1a8: /* push gs */
5258 gen_op_movl_T0_seg((b >> 3) & 7);
5259 gen_push_T0(s);
5260 break;
5261 case 0x07: /* pop es */
5262 case 0x17: /* pop ss */
5263 case 0x1f: /* pop ds */
5264 if (CODE64(s))
5265 goto illegal_op;
5266 reg = b >> 3;
5267 gen_pop_T0(s);
5268 gen_movl_seg_T0(s, reg, pc_start - s->cs_base);
5269 gen_pop_update(s);
5270 if (reg == R_SS) {
5271 /* if reg == SS, inhibit interrupts/trace. */
5272 /* If several instructions disable interrupts, only the
5273 _first_ does it */
5274 if (!(s->tb->flags & HF_INHIBIT_IRQ_MASK))
5275 gen_helper_set_inhibit_irq(cpu_env);
5276 s->tf = 0;
5277 }
5278 if (s->is_jmp) {
5279 gen_jmp_im(s->pc - s->cs_base);
5280 gen_eob(s);
5281 }
5282 break;
5283 case 0x1a1: /* pop fs */
5284 case 0x1a9: /* pop gs */
5285 gen_pop_T0(s);
5286 gen_movl_seg_T0(s, (b >> 3) & 7, pc_start - s->cs_base);
5287 gen_pop_update(s);
5288 if (s->is_jmp) {
5289 gen_jmp_im(s->pc - s->cs_base);
5290 gen_eob(s);
5291 }
5292 break;
5293
5294 /**************************/
5295 /* mov */
5296 case 0x88:
5297 case 0x89: /* mov Ev, Gv */
5298 if ((b & 1) == 0)
5299 ot = OT_BYTE;
5300 else
5301 ot = dflag + OT_WORD;
5302 modrm = cpu_ldub_code(env, s->pc++);
5303 reg = ((modrm >> 3) & 7) | rex_r;
5304
5305 /* generate a generic store */
5306 gen_ldst_modrm(env, s, modrm, ot, reg, 1);
5307 break;
5308 case 0xc6:
5309 case 0xc7: /* mov Ev, Iv */
5310 if ((b & 1) == 0)
5311 ot = OT_BYTE;
5312 else
5313 ot = dflag + OT_WORD;
5314 modrm = cpu_ldub_code(env, s->pc++);
5315 mod = (modrm >> 6) & 3;
5316 if (mod != 3) {
5317 s->rip_offset = insn_const_size(ot);
5318 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
5319 }
5320 val = insn_get(env, s, ot);
5321 gen_op_movl_T0_im(val);
5322 if (mod != 3)
5323 gen_op_st_T0_A0(ot + s->mem_index);
5324 else
5325 gen_op_mov_reg_T0(ot, (modrm & 7) | REX_B(s));
5326 break;
5327 case 0x8a:
5328 case 0x8b: /* mov Gv, Ev */
5329 if ((b & 1) == 0)
5330 ot = OT_BYTE;
5331 else
5332 ot = OT_WORD + dflag;
5333 modrm = cpu_ldub_code(env, s->pc++);
5334 reg = ((modrm >> 3) & 7) | rex_r;
5335
5336 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 0);
5337 gen_op_mov_reg_T0(ot, reg);
5338 break;
5339 case 0x8e: /* mov seg, Gv */
5340 modrm = cpu_ldub_code(env, s->pc++);
5341 reg = (modrm >> 3) & 7;
5342 if (reg >= 6 || reg == R_CS)
5343 goto illegal_op;
5344 gen_ldst_modrm(env, s, modrm, OT_WORD, OR_TMP0, 0);
5345 gen_movl_seg_T0(s, reg, pc_start - s->cs_base);
5346 if (reg == R_SS) {
5347 /* if reg == SS, inhibit interrupts/trace */
5348 /* If several instructions disable interrupts, only the
5349 _first_ does it */
5350 if (!(s->tb->flags & HF_INHIBIT_IRQ_MASK))
5351 gen_helper_set_inhibit_irq(cpu_env);
5352 s->tf = 0;
5353 }
5354 if (s->is_jmp) {
5355 gen_jmp_im(s->pc - s->cs_base);
5356 gen_eob(s);
5357 }
5358 break;
5359 case 0x8c: /* mov Gv, seg */
5360 modrm = cpu_ldub_code(env, s->pc++);
5361 reg = (modrm >> 3) & 7;
5362 mod = (modrm >> 6) & 3;
5363 if (reg >= 6)
5364 goto illegal_op;
5365 gen_op_movl_T0_seg(reg);
5366 if (mod == 3)
5367 ot = OT_WORD + dflag;
5368 else
5369 ot = OT_WORD;
5370 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 1);
5371 break;
5372
5373 case 0x1b6: /* movzbS Gv, Eb */
5374 case 0x1b7: /* movzwS Gv, Ew */
5375 case 0x1be: /* movsbS Gv, Eb */
5376 case 0x1bf: /* movswS Gv, Ew */
5377 {
5378 int d_ot;
5379 /* d_ot is the size of destination */
5380 d_ot = dflag + OT_WORD;
5381 /* ot is the size of source */
5382 ot = (b & 1) + OT_BYTE;
5383 modrm = cpu_ldub_code(env, s->pc++);
5384 reg = ((modrm >> 3) & 7) | rex_r;
5385 mod = (modrm >> 6) & 3;
5386 rm = (modrm & 7) | REX_B(s);
5387
5388 if (mod == 3) {
5389 gen_op_mov_TN_reg(ot, 0, rm);
5390 switch(ot | (b & 8)) {
5391 case OT_BYTE:
5392 tcg_gen_ext8u_tl(cpu_T[0], cpu_T[0]);
5393 break;
5394 case OT_BYTE | 8:
5395 tcg_gen_ext8s_tl(cpu_T[0], cpu_T[0]);
5396 break;
5397 case OT_WORD:
5398 tcg_gen_ext16u_tl(cpu_T[0], cpu_T[0]);
5399 break;
5400 default:
5401 case OT_WORD | 8:
5402 tcg_gen_ext16s_tl(cpu_T[0], cpu_T[0]);
5403 break;
5404 }
5405 gen_op_mov_reg_T0(d_ot, reg);
5406 } else {
5407 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
5408 if (b & 8) {
5409 gen_op_lds_T0_A0(ot + s->mem_index);
5410 } else {
5411 gen_op_ldu_T0_A0(ot + s->mem_index);
5412 }
5413 gen_op_mov_reg_T0(d_ot, reg);
5414 }
5415 }
5416 break;
5417
5418 case 0x8d: /* lea */
5419 ot = dflag + OT_WORD;
5420 modrm = cpu_ldub_code(env, s->pc++);
5421 mod = (modrm >> 6) & 3;
5422 if (mod == 3)
5423 goto illegal_op;
5424 reg = ((modrm >> 3) & 7) | rex_r;
5425 /* we must ensure that no segment is added */
5426 s->override = -1;
5427 val = s->addseg;
5428 s->addseg = 0;
5429 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
5430 s->addseg = val;
5431 gen_op_mov_reg_A0(ot - OT_WORD, reg);
5432 break;
5433
5434 case 0xa0: /* mov EAX, Ov */
5435 case 0xa1:
5436 case 0xa2: /* mov Ov, EAX */
5437 case 0xa3:
5438 {
5439 target_ulong offset_addr;
5440
5441 if ((b & 1) == 0)
5442 ot = OT_BYTE;
5443 else
5444 ot = dflag + OT_WORD;
5445 #ifdef TARGET_X86_64
5446 if (s->aflag == 2) {
5447 offset_addr = cpu_ldq_code(env, s->pc);
5448 s->pc += 8;
5449 gen_op_movq_A0_im(offset_addr);
5450 } else
5451 #endif
5452 {
5453 if (s->aflag) {
5454 offset_addr = insn_get(env, s, OT_LONG);
5455 } else {
5456 offset_addr = insn_get(env, s, OT_WORD);
5457 }
5458 gen_op_movl_A0_im(offset_addr);
5459 }
5460 gen_add_A0_ds_seg(s);
5461 if ((b & 2) == 0) {
5462 gen_op_ld_T0_A0(ot + s->mem_index);
5463 gen_op_mov_reg_T0(ot, R_EAX);
5464 } else {
5465 gen_op_mov_TN_reg(ot, 0, R_EAX);
5466 gen_op_st_T0_A0(ot + s->mem_index);
5467 }
5468 }
5469 break;
5470 case 0xd7: /* xlat */
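/* xlat: AL = byte at seg:[rBX + unsigned AL], DS by default */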
5471 #ifdef TARGET_X86_64
5472 if (s->aflag == 2) {
5473 gen_op_movq_A0_reg(R_EBX);
5474 gen_op_mov_TN_reg(OT_QUAD, 0, R_EAX);
5475 tcg_gen_andi_tl(cpu_T[0], cpu_T[0], 0xff);
5476 tcg_gen_add_tl(cpu_A0, cpu_A0, cpu_T[0]);
5477 } else
5478 #endif
5479 {
5480 gen_op_movl_A0_reg(R_EBX);
5481 gen_op_mov_TN_reg(OT_LONG, 0, R_EAX);
5482 tcg_gen_andi_tl(cpu_T[0], cpu_T[0], 0xff);
5483 tcg_gen_add_tl(cpu_A0, cpu_A0, cpu_T[0]);
5484 if (s->aflag == 0)
5485 gen_op_andl_A0_ffff();
5486 else
5487 tcg_gen_andi_tl(cpu_A0, cpu_A0, 0xffffffff);
5488 }
5489 gen_add_A0_ds_seg(s);
5490 gen_op_ldu_T0_A0(OT_BYTE + s->mem_index);
5491 gen_op_mov_reg_T0(OT_BYTE, R_EAX);
5492 break;
5493 case 0xb0 ... 0xb7: /* mov R, Ib */
5494 val = insn_get(env, s, OT_BYTE);
5495 gen_op_movl_T0_im(val);
5496 gen_op_mov_reg_T0(OT_BYTE, (b & 7) | REX_B(s));
5497 break;
5498 case 0xb8 ... 0xbf: /* mov R, Iv */
5499 #ifdef TARGET_X86_64
5500 if (dflag == 2) {
5501 uint64_t tmp;
5502 /* 64 bit case */
5503 tmp = cpu_ldq_code(env, s->pc);
5504 s->pc += 8;
5505 reg = (b & 7) | REX_B(s);
5506 gen_movtl_T0_im(tmp);
5507 gen_op_mov_reg_T0(OT_QUAD, reg);
5508 } else
5509 #endif
5510 {
5511 ot = dflag ? OT_LONG : OT_WORD;
5512 val = insn_get(env, s, ot);
5513 reg = (b & 7) | REX_B(s);
5514 gen_op_movl_T0_im(val);
5515 gen_op_mov_reg_T0(ot, reg);
5516 }
5517 break;
5518
5519 case 0x91 ... 0x97: /* xchg R, EAX */
5520 do_xchg_reg_eax:
5521 ot = dflag + OT_WORD;
5522 reg = (b & 7) | REX_B(s);
5523 rm = R_EAX;
5524 goto do_xchg_reg;
5525 case 0x86:
5526 case 0x87: /* xchg Ev, Gv */
5527 if ((b & 1) == 0)
5528 ot = OT_BYTE;
5529 else
5530 ot = dflag + OT_WORD;
5531 modrm = cpu_ldub_code(env, s->pc++);
5532 reg = ((modrm >> 3) & 7) | rex_r;
5533 mod = (modrm >> 6) & 3;
5534 if (mod == 3) {
5535 rm = (modrm & 7) | REX_B(s);
5536 do_xchg_reg:
5537 gen_op_mov_TN_reg(ot, 0, reg);
5538 gen_op_mov_TN_reg(ot, 1, rm);
5539 gen_op_mov_reg_T0(ot, rm);
5540 gen_op_mov_reg_T1(ot, reg);
5541 } else {
5542 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
5543 gen_op_mov_TN_reg(ot, 0, reg);
5544 /* for xchg, lock is implicit */
5545 if (!(prefixes & PREFIX_LOCK))
5546 gen_helper_lock();
5547 gen_op_ld_T1_A0(ot + s->mem_index);
5548 gen_op_st_T0_A0(ot + s->mem_index);
5549 if (!(prefixes & PREFIX_LOCK))
5550 gen_helper_unlock();
5551 gen_op_mov_reg_T1(ot, reg);
5552 }
5553 break;
5554 case 0xc4: /* les Gv */
5555 if (CODE64(s))
5556 goto illegal_op;
5557 op = R_ES;
5558 goto do_lxx;
5559 case 0xc5: /* lds Gv */
5560 if (CODE64(s))
5561 goto illegal_op;
5562 op = R_DS;
5563 goto do_lxx;
5564 case 0x1b2: /* lss Gv */
5565 op = R_SS;
5566 goto do_lxx;
5567 case 0x1b4: /* lfs Gv */
5568 op = R_FS;
5569 goto do_lxx;
5570 case 0x1b5: /* lgs Gv */
5571 op = R_GS;
5572 do_lxx:
5573 ot = dflag ? OT_LONG : OT_WORD;
5574 modrm = cpu_ldub_code(env, s->pc++);
5575 reg = ((modrm >> 3) & 7) | rex_r;
5576 mod = (modrm >> 6) & 3;
5577 if (mod == 3)
5578 goto illegal_op;
5579 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
5580 gen_op_ld_T1_A0(ot + s->mem_index);
5581 gen_add_A0_im(s, 1 << (ot - OT_WORD + 1));
5582 /* load the segment first to handle exceptions properly */
5583 gen_op_ldu_T0_A0(OT_WORD + s->mem_index);
5584 gen_movl_seg_T0(s, op, pc_start - s->cs_base);
5585 /* then put the data */
5586 gen_op_mov_reg_T1(ot, reg);
5587 if (s->is_jmp) {
5588 gen_jmp_im(s->pc - s->cs_base);
5589 gen_eob(s);
5590 }
5591 break;
5592
5593 /************************/
5594 /* shifts */
5595 case 0xc0:
5596 case 0xc1:
5597 /* shift Ev,Ib */
5598 shift = 2;
5599 grp2:
5600 {
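/* shift selects the count operand: 0 = CL, 1 = the constant 1,
   2 = an immediate byte */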
5601 if ((b & 1) == 0)
5602 ot = OT_BYTE;
5603 else
5604 ot = dflag + OT_WORD;
5605
5606 modrm = cpu_ldub_code(env, s->pc++);
5607 mod = (modrm >> 6) & 3;
5608 op = (modrm >> 3) & 7;
5609
5610 if (mod != 3) {
5611 if (shift == 2) {
5612 s->rip_offset = 1;
5613 }
5614 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
5615 opreg = OR_TMP0;
5616 } else {
5617 opreg = (modrm & 7) | REX_B(s);
5618 }
5619
5620 /* simpler op */
5621 if (shift == 0) {
5622 gen_shift(s, op, ot, opreg, OR_ECX);
5623 } else {
5624 if (shift == 2) {
5625 shift = cpu_ldub_code(env, s->pc++);
5626 }
5627 gen_shifti(s, op, ot, opreg, shift);
5628 }
5629 }
5630 break;
5631 case 0xd0:
5632 case 0xd1:
5633 /* shift Ev,1 */
5634 shift = 1;
5635 goto grp2;
5636 case 0xd2:
5637 case 0xd3:
5638 /* shift Ev,cl */
5639 shift = 0;
5640 goto grp2;
5641
5642 case 0x1a4: /* shld imm */
5643 op = 0;
5644 shift = 1;
5645 goto do_shiftd;
5646 case 0x1a5: /* shld cl */
5647 op = 0;
5648 shift = 0;
5649 goto do_shiftd;
5650 case 0x1ac: /* shrd imm */
5651 op = 1;
5652 shift = 1;
5653 goto do_shiftd;
5654 case 0x1ad: /* shrd cl */
5655 op = 1;
5656 shift = 0;
5657 do_shiftd:
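/* double-width shift: op is the direction (0 = shld, 1 = shrd),
   shift chooses an immediate count vs CL; the count is placed
   in T3 for the generator below */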
5658 ot = dflag + OT_WORD;
5659 modrm = cpu_ldub_code(env, s->pc++);
5660 mod = (modrm >> 6) & 3;
5661 rm = (modrm & 7) | REX_B(s);
5662 reg = ((modrm >> 3) & 7) | rex_r;
5663 if (mod != 3) {
5664 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
5665 opreg = OR_TMP0;
5666 } else {
5667 opreg = rm;
5668 }
5669 gen_op_mov_TN_reg(ot, 1, reg);
5670
5671 if (shift) {
5672 val = cpu_ldub_code(env, s->pc++);
5673 tcg_gen_movi_tl(cpu_T3, val);
5674 } else {
5675 tcg_gen_mov_tl(cpu_T3, cpu_regs[R_ECX]);
5676 }
5677 gen_shiftd_rm_T1_T3(s, ot, opreg, op);
5678 break;
5679
5680 /************************/
5681 /* floats */
5682 case 0xd8 ... 0xdf:
5683 if (s->flags & (HF_EM_MASK | HF_TS_MASK)) {
5684 /* if CR0.EM or CR0.TS are set, generate an FPU exception */
5685 /* XXX: what to do if illegal op ? */
5686 gen_exception(s, EXCP07_PREX, pc_start - s->cs_base);
5687 break;
5688 }
5689 modrm = cpu_ldub_code(env, s->pc++);
5690 mod = (modrm >> 6) & 3;
5691 rm = modrm & 7;
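/* fold the low 3 bits of the d8-df opcode byte and the ModRM
   reg field into a single 6-bit FPU operation index */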
5692 op = ((b & 7) << 3) | ((modrm >> 3) & 7);
5693 if (mod != 3) {
5694 /* memory op */
5695 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
5696 switch(op) {
5697 case 0x00 ... 0x07: /* fxxxs */
5698 case 0x10 ... 0x17: /* fixxxl */
5699 case 0x20 ... 0x27: /* fxxxl */
5700 case 0x30 ... 0x37: /* fixxx */
5701 {
5702 int op1;
5703 op1 = op & 7;
5704
5705 switch(op >> 4) {
5706 case 0:
5707 gen_op_ld_T0_A0(OT_LONG + s->mem_index);
5708 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
5709 gen_helper_flds_FT0(cpu_env, cpu_tmp2_i32);
5710 break;
5711 case 1:
5712 gen_op_ld_T0_A0(OT_LONG + s->mem_index);
5713 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
5714 gen_helper_fildl_FT0(cpu_env, cpu_tmp2_i32);
5715 break;
5716 case 2:
5717 tcg_gen_qemu_ld64(cpu_tmp1_i64, cpu_A0,
5718 (s->mem_index >> 2) - 1);
5719 gen_helper_fldl_FT0(cpu_env, cpu_tmp1_i64);
5720 break;
5721 case 3:
5722 default:
5723 gen_op_lds_T0_A0(OT_WORD + s->mem_index);
5724 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
5725 gen_helper_fildl_FT0(cpu_env, cpu_tmp2_i32);
5726 break;
5727 }
5728
5729 gen_helper_fp_arith_ST0_FT0(op1);
5730 if (op1 == 3) {
5731 /* fcomp needs pop */
5732 gen_helper_fpop(cpu_env);
5733 }
5734 }
5735 break;
5736 case 0x08: /* flds */
5737 case 0x0a: /* fsts */
5738 case 0x0b: /* fstps */
5739 case 0x18 ... 0x1b: /* fildl, fisttpl, fistl, fistpl */
5740 case 0x28 ... 0x2b: /* fldl, fisttpll, fstl, fstpl */
5741 case 0x38 ... 0x3b: /* filds, fisttps, fists, fistps */
5742 switch(op & 7) {
5743 case 0:
5744 switch(op >> 4) {
5745 case 0:
5746 gen_op_ld_T0_A0(OT_LONG + s->mem_index);
5747 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
5748 gen_helper_flds_ST0(cpu_env, cpu_tmp2_i32);
5749 break;
5750 case 1:
5751 gen_op_ld_T0_A0(OT_LONG + s->mem_index);
5752 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
5753 gen_helper_fildl_ST0(cpu_env, cpu_tmp2_i32);
5754 break;
5755 case 2:
5756 tcg_gen_qemu_ld64(cpu_tmp1_i64, cpu_A0,
5757 (s->mem_index >> 2) - 1);
5758 gen_helper_fldl_ST0(cpu_env, cpu_tmp1_i64);
5759 break;
5760 case 3:
5761 default:
5762 gen_op_lds_T0_A0(OT_WORD + s->mem_index);
5763 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
5764 gen_helper_fildl_ST0(cpu_env, cpu_tmp2_i32);
5765 break;
5766 }
5767 break;
5768 case 1:
5769 /* XXX: the corresponding CPUID bit must be tested ! */
5770 switch(op >> 4) {
5771 case 1:
5772 gen_helper_fisttl_ST0(cpu_tmp2_i32, cpu_env);
5773 tcg_gen_extu_i32_tl(cpu_T[0], cpu_tmp2_i32);
5774 gen_op_st_T0_A0(OT_LONG + s->mem_index);
5775 break;
5776 case 2:
5777 gen_helper_fisttll_ST0(cpu_tmp1_i64, cpu_env);
5778 tcg_gen_qemu_st64(cpu_tmp1_i64, cpu_A0,
5779 (s->mem_index >> 2) - 1);
5780 break;
5781 case 3:
5782 default:
5783 gen_helper_fistt_ST0(cpu_tmp2_i32, cpu_env);
5784 tcg_gen_extu_i32_tl(cpu_T[0], cpu_tmp2_i32);
5785 gen_op_st_T0_A0(OT_WORD + s->mem_index);
5786 break;
5787 }
5788 gen_helper_fpop(cpu_env);
5789 break;
5790 default:
5791 switch(op >> 4) {
5792 case 0:
5793 gen_helper_fsts_ST0(cpu_tmp2_i32, cpu_env);
5794 tcg_gen_extu_i32_tl(cpu_T[0], cpu_tmp2_i32);
5795 gen_op_st_T0_A0(OT_LONG + s->mem_index);
5796 break;
5797 case 1:
5798 gen_helper_fistl_ST0(cpu_tmp2_i32, cpu_env);
5799 tcg_gen_extu_i32_tl(cpu_T[0], cpu_tmp2_i32);
5800 gen_op_st_T0_A0(OT_LONG + s->mem_index);
5801 break;
5802 case 2:
5803 gen_helper_fstl_ST0(cpu_tmp1_i64, cpu_env);
5804 tcg_gen_qemu_st64(cpu_tmp1_i64, cpu_A0,
5805 (s->mem_index >> 2) - 1);
5806 break;
5807 case 3:
5808 default:
5809 gen_helper_fist_ST0(cpu_tmp2_i32, cpu_env);
5810 tcg_gen_extu_i32_tl(cpu_T[0], cpu_tmp2_i32);
5811 gen_op_st_T0_A0(OT_WORD + s->mem_index);
5812 break;
5813 }
5814 if ((op & 7) == 3)
5815 gen_helper_fpop(cpu_env);
5816 break;
5817 }
5818 break;
5819 case 0x0c: /* fldenv mem */
5820 gen_update_cc_op(s);
5821 gen_jmp_im(pc_start - s->cs_base);
5822 gen_helper_fldenv(cpu_env, cpu_A0, tcg_const_i32(s->dflag));
5823 break;
5824 case 0x0d: /* fldcw mem */
5825 gen_op_ld_T0_A0(OT_WORD + s->mem_index);
5826 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
5827 gen_helper_fldcw(cpu_env, cpu_tmp2_i32);
5828 break;
5829 case 0x0e: /* fnstenv mem */
5830 gen_update_cc_op(s);
5831 gen_jmp_im(pc_start - s->cs_base);
5832 gen_helper_fstenv(cpu_env, cpu_A0, tcg_const_i32(s->dflag));
5833 break;
5834 case 0x0f: /* fnstcw mem */
5835 gen_helper_fnstcw(cpu_tmp2_i32, cpu_env);
5836 tcg_gen_extu_i32_tl(cpu_T[0], cpu_tmp2_i32);
5837 gen_op_st_T0_A0(OT_WORD + s->mem_index);
5838 break;
5839 case 0x1d: /* fldt mem */
5840 gen_update_cc_op(s);
5841 gen_jmp_im(pc_start - s->cs_base);
5842 gen_helper_fldt_ST0(cpu_env, cpu_A0);
5843 break;
5844 case 0x1f: /* fstpt mem */
5845 gen_update_cc_op(s);
5846 gen_jmp_im(pc_start - s->cs_base);
5847 gen_helper_fstt_ST0(cpu_env, cpu_A0);
5848 gen_helper_fpop(cpu_env);
5849 break;
5850 case 0x2c: /* frstor mem */
5851 gen_update_cc_op(s);
5852 gen_jmp_im(pc_start - s->cs_base);
5853 gen_helper_frstor(cpu_env, cpu_A0, tcg_const_i32(s->dflag));
5854 break;
5855 case 0x2e: /* fnsave mem */
5856 gen_update_cc_op(s);
5857 gen_jmp_im(pc_start - s->cs_base);
5858 gen_helper_fsave(cpu_env, cpu_A0, tcg_const_i32(s->dflag));
5859 break;
5860 case 0x2f: /* fnstsw mem */
5861 gen_helper_fnstsw(cpu_tmp2_i32, cpu_env);
5862 tcg_gen_extu_i32_tl(cpu_T[0], cpu_tmp2_i32);
5863 gen_op_st_T0_A0(OT_WORD + s->mem_index);
5864 break;
5865 case 0x3c: /* fbld */
5866 gen_update_cc_op(s);
5867 gen_jmp_im(pc_start - s->cs_base);
5868 gen_helper_fbld_ST0(cpu_env, cpu_A0);
5869 break;
5870 case 0x3e: /* fbstp */
5871 gen_update_cc_op(s);
5872 gen_jmp_im(pc_start - s->cs_base);
5873 gen_helper_fbst_ST0(cpu_env, cpu_A0);
5874 gen_helper_fpop(cpu_env);
5875 break;
5876 case 0x3d: /* fildll */
5877 tcg_gen_qemu_ld64(cpu_tmp1_i64, cpu_A0,
5878 (s->mem_index >> 2) - 1);
5879 gen_helper_fildll_ST0(cpu_env, cpu_tmp1_i64);
5880 break;
5881 case 0x3f: /* fistpll */
5882 gen_helper_fistll_ST0(cpu_tmp1_i64, cpu_env);
5883 tcg_gen_qemu_st64(cpu_tmp1_i64, cpu_A0,
5884 (s->mem_index >> 2) - 1);
5885 gen_helper_fpop(cpu_env);
5886 break;
5887 default:
5888 goto illegal_op;
5889 }
5890 } else {
5891 /* register float ops */
5892 opreg = rm;
5893
5894 switch(op) {
5895 case 0x08: /* fld sti */
5896 gen_helper_fpush(cpu_env);
5897 gen_helper_fmov_ST0_STN(cpu_env,
5898 tcg_const_i32((opreg + 1) & 7));
5899 break;
5900 case 0x09: /* fxchg sti */
5901 case 0x29: /* fxchg4 sti, undocumented op */
5902 case 0x39: /* fxchg7 sti, undocumented op */
5903 gen_helper_fxchg_ST0_STN(cpu_env, tcg_const_i32(opreg));
5904 break;
5905 case 0x0a: /* grp d9/2 */
5906 switch(rm) {
5907 case 0: /* fnop */
5908 /* check exceptions (FreeBSD FPU probe) */
5909 gen_update_cc_op(s);
5910 gen_jmp_im(pc_start - s->cs_base);
5911 gen_helper_fwait(cpu_env);
5912 break;
5913 default:
5914 goto illegal_op;
5915 }
5916 break;
5917 case 0x0c: /* grp d9/4 */
5918 switch(rm) {
5919 case 0: /* fchs */
5920 gen_helper_fchs_ST0(cpu_env);
5921 break;
5922 case 1: /* fabs */
5923 gen_helper_fabs_ST0(cpu_env);
5924 break;
5925 case 4: /* ftst */
5926 gen_helper_fldz_FT0(cpu_env);
5927 gen_helper_fcom_ST0_FT0(cpu_env);
5928 break;
5929 case 5: /* fxam */
5930 gen_helper_fxam_ST0(cpu_env);
5931 break;
5932 default:
5933 goto illegal_op;
5934 }
5935 break;
5936 case 0x0d: /* grp d9/5 */
5937 {
5938 switch(rm) {
5939 case 0:
5940 gen_helper_fpush(cpu_env);
5941 gen_helper_fld1_ST0(cpu_env);
5942 break;
5943 case 1:
5944 gen_helper_fpush(cpu_env);
5945 gen_helper_fldl2t_ST0(cpu_env);
5946 break;
5947 case 2:
5948 gen_helper_fpush(cpu_env);
5949 gen_helper_fldl2e_ST0(cpu_env);
5950 break;
5951 case 3:
5952 gen_helper_fpush(cpu_env);
5953 gen_helper_fldpi_ST0(cpu_env);
5954 break;
5955 case 4:
5956 gen_helper_fpush(cpu_env);
5957 gen_helper_fldlg2_ST0(cpu_env);
5958 break;
5959 case 5:
5960 gen_helper_fpush(cpu_env);
5961 gen_helper_fldln2_ST0(cpu_env);
5962 break;
5963 case 6:
5964 gen_helper_fpush(cpu_env);
5965 gen_helper_fldz_ST0(cpu_env);
5966 break;
5967 default:
5968 goto illegal_op;
5969 }
5970 }
5971 break;
5972 case 0x0e: /* grp d9/6 */
5973 switch(rm) {
5974 case 0: /* f2xm1 */
5975 gen_helper_f2xm1(cpu_env);
5976 break;
5977 case 1: /* fyl2x */
5978 gen_helper_fyl2x(cpu_env);
5979 break;
5980 case 2: /* fptan */
5981 gen_helper_fptan(cpu_env);
5982 break;
5983 case 3: /* fpatan */
5984 gen_helper_fpatan(cpu_env);
5985 break;
5986 case 4: /* fxtract */
5987 gen_helper_fxtract(cpu_env);
5988 break;
5989 case 5: /* fprem1 */
5990 gen_helper_fprem1(cpu_env);
5991 break;
5992 case 6: /* fdecstp */
5993 gen_helper_fdecstp(cpu_env);
5994 break;
5995 default:
5996 case 7: /* fincstp */
5997 gen_helper_fincstp(cpu_env);
5998 break;
5999 }
6000 break;
6001 case 0x0f: /* grp d9/7 */
6002 switch(rm) {
6003 case 0: /* fprem */
6004 gen_helper_fprem(cpu_env);
6005 break;
6006 case 1: /* fyl2xp1 */
6007 gen_helper_fyl2xp1(cpu_env);
6008 break;
6009 case 2: /* fsqrt */
6010 gen_helper_fsqrt(cpu_env);
6011 break;
6012 case 3: /* fsincos */
6013 gen_helper_fsincos(cpu_env);
6014 break;
6015 case 4: /* frndint */
6016 gen_helper_frndint(cpu_env);
6017 break;
6018 case 5: /* fscale */
6019 gen_helper_fscale(cpu_env);
6020 break;
6021 case 6: /* fsin */
6022 gen_helper_fsin(cpu_env);
6023 break;
6024 default:
6025 case 7: /* fcos */
6026 gen_helper_fcos(cpu_env);
6027 break;
6028 }
6029 break;
6030 case 0x00: case 0x01: case 0x04 ... 0x07: /* fxxx st, sti */
6031 case 0x20: case 0x21: case 0x24 ... 0x27: /* fxxx sti, st */
6032 case 0x30: case 0x31: case 0x34 ... 0x37: /* fxxxp sti, st */
6033 {
6034 int op1;
6035
6036 op1 = op & 7;
6037 if (op >= 0x20) {
6038 gen_helper_fp_arith_STN_ST0(op1, opreg);
6039 if (op >= 0x30)
6040 gen_helper_fpop(cpu_env);
6041 } else {
6042 gen_helper_fmov_FT0_STN(cpu_env, tcg_const_i32(opreg));
6043 gen_helper_fp_arith_ST0_FT0(op1);
6044 }
6045 }
6046 break;
6047 case 0x02: /* fcom */
6048 case 0x22: /* fcom2, undocumented op */
6049 gen_helper_fmov_FT0_STN(cpu_env, tcg_const_i32(opreg));
6050 gen_helper_fcom_ST0_FT0(cpu_env);
6051 break;
6052 case 0x03: /* fcomp */
6053 case 0x23: /* fcomp3, undocumented op */
6054 case 0x32: /* fcomp5, undocumented op */
6055 gen_helper_fmov_FT0_STN(cpu_env, tcg_const_i32(opreg));
6056 gen_helper_fcom_ST0_FT0(cpu_env);
6057 gen_helper_fpop(cpu_env);
6058 break;
6059 case 0x15: /* da/5 */
6060 switch(rm) {
6061 case 1: /* fucompp */
6062 gen_helper_fmov_FT0_STN(cpu_env, tcg_const_i32(1));
6063 gen_helper_fucom_ST0_FT0(cpu_env);
6064 gen_helper_fpop(cpu_env);
6065 gen_helper_fpop(cpu_env);
6066 break;
6067 default:
6068 goto illegal_op;
6069 }
6070 break;
6071 case 0x1c:
6072 switch(rm) {
6073 case 0: /* feni (287 only, just do nop here) */
6074 break;
6075 case 1: /* fdisi (287 only, just do nop here) */
6076 break;
6077 case 2: /* fclex */
6078 gen_helper_fclex(cpu_env);
6079 break;
6080 case 3: /* fninit */
6081 gen_helper_fninit(cpu_env);
6082 break;
6083 case 4: /* fsetpm (287 only, just do nop here) */
6084 break;
6085 default:
6086 goto illegal_op;
6087 }
6088 break;
6089 case 0x1d: /* fucomi */
6090 gen_update_cc_op(s);
6091 gen_helper_fmov_FT0_STN(cpu_env, tcg_const_i32(opreg));
6092 gen_helper_fucomi_ST0_FT0(cpu_env);
6093 set_cc_op(s, CC_OP_EFLAGS);
6094 break;
6095 case 0x1e: /* fcomi */
6096 gen_update_cc_op(s);
6097 gen_helper_fmov_FT0_STN(cpu_env, tcg_const_i32(opreg));
6098 gen_helper_fcomi_ST0_FT0(cpu_env);
6099 set_cc_op(s, CC_OP_EFLAGS);
6100 break;
6101 case 0x28: /* ffree sti */
6102 gen_helper_ffree_STN(cpu_env, tcg_const_i32(opreg));
6103 break;
6104 case 0x2a: /* fst sti */
6105 gen_helper_fmov_STN_ST0(cpu_env, tcg_const_i32(opreg));
6106 break;
6107 case 0x2b: /* fstp sti */
6108 case 0x0b: /* fstp1 sti, undocumented op */
6109 case 0x3a: /* fstp8 sti, undocumented op */
6110 case 0x3b: /* fstp9 sti, undocumented op */
6111 gen_helper_fmov_STN_ST0(cpu_env, tcg_const_i32(opreg));
6112 gen_helper_fpop(cpu_env);
6113 break;
6114 case 0x2c: /* fucom st(i) */
6115 gen_helper_fmov_FT0_STN(cpu_env, tcg_const_i32(opreg));
6116 gen_helper_fucom_ST0_FT0(cpu_env);
6117 break;
6118 case 0x2d: /* fucomp st(i) */
6119 gen_helper_fmov_FT0_STN(cpu_env, tcg_const_i32(opreg));
6120 gen_helper_fucom_ST0_FT0(cpu_env);
6121 gen_helper_fpop(cpu_env);
6122 break;
6123 case 0x33: /* de/3 */
6124 switch(rm) {
6125 case 1: /* fcompp */
6126 gen_helper_fmov_FT0_STN(cpu_env, tcg_const_i32(1));
6127 gen_helper_fcom_ST0_FT0(cpu_env);
6128 gen_helper_fpop(cpu_env);
6129 gen_helper_fpop(cpu_env);
6130 break;
6131 default:
6132 goto illegal_op;
6133 }
6134 break;
6135 case 0x38: /* ffreep sti, undocumented op */
6136 gen_helper_ffree_STN(cpu_env, tcg_const_i32(opreg));
6137 gen_helper_fpop(cpu_env);
6138 break;
6139 case 0x3c: /* df/4 */
6140 switch(rm) {
6141 case 0:
6142 gen_helper_fnstsw(cpu_tmp2_i32, cpu_env);
6143 tcg_gen_extu_i32_tl(cpu_T[0], cpu_tmp2_i32);
6144 gen_op_mov_reg_T0(OT_WORD, R_EAX);
6145 break;
6146 default:
6147 goto illegal_op;
6148 }
6149 break;
6150 case 0x3d: /* fucomip */
6151 gen_update_cc_op(s);
6152 gen_helper_fmov_FT0_STN(cpu_env, tcg_const_i32(opreg));
6153 gen_helper_fucomi_ST0_FT0(cpu_env);
6154 gen_helper_fpop(cpu_env);
6155 set_cc_op(s, CC_OP_EFLAGS);
6156 break;
6157 case 0x3e: /* fcomip */
6158 gen_update_cc_op(s);
6159 gen_helper_fmov_FT0_STN(cpu_env, tcg_const_i32(opreg));
6160 gen_helper_fcomi_ST0_FT0(cpu_env);
6161 gen_helper_fpop(cpu_env);
6162 set_cc_op(s, CC_OP_EFLAGS);
6163 break;
6164 case 0x10 ... 0x13: /* fcmovxx */
6165 case 0x18 ... 0x1b:
6166 {
6167 int op1, l1;
6168 static const uint8_t fcmov_cc[8] = {
6169 (JCC_B << 1),
6170 (JCC_Z << 1),
6171 (JCC_BE << 1),
6172 (JCC_P << 1),
6173 };
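/* Note (added): each fcmov_cc entry is a jcc condition already
   shifted left by one; the low bit of op1 negates the test.
   gen_jcc1() branches to l1 when its condition holds, skipping the
   fmov, so opcodes 0x10-0x13 (fcmovb/e/be/u) use the negated
   condition and 0x18-0x1b (the fcmovn* forms) use it as is. */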
6174 op1 = fcmov_cc[op & 3] | (((op >> 3) & 1) ^ 1);
6175 l1 = gen_new_label();
6176 gen_jcc1(s, op1, l1);
6177 gen_helper_fmov_ST0_STN(cpu_env, tcg_const_i32(opreg));
6178 gen_set_label(l1);
6179 }
6180 break;
6181 default:
6182 goto illegal_op;
6183 }
6184 }
6185 break;
6186 /************************/
6187 /* string ops */
6188
6189 case 0xa4: /* movsS */
6190 case 0xa5:
6191 if ((b & 1) == 0)
6192 ot = OT_BYTE;
6193 else
6194 ot = dflag + OT_WORD;
6195
6196 if (prefixes & (PREFIX_REPZ | PREFIX_REPNZ)) {
6197 gen_repz_movs(s, ot, pc_start - s->cs_base, s->pc - s->cs_base);
6198 } else {
6199 gen_movs(s, ot);
6200 }
6201 break;
6202
6203 case 0xaa: /* stosS */
6204 case 0xab:
6205 if ((b & 1) == 0)
6206 ot = OT_BYTE;
6207 else
6208 ot = dflag + OT_WORD;
6209
6210 if (prefixes & (PREFIX_REPZ | PREFIX_REPNZ)) {
6211 gen_repz_stos(s, ot, pc_start - s->cs_base, s->pc - s->cs_base);
6212 } else {
6213 gen_stos(s, ot);
6214 }
6215 break;
6216 case 0xac: /* lodsS */
6217 case 0xad:
6218 if ((b & 1) == 0)
6219 ot = OT_BYTE;
6220 else
6221 ot = dflag + OT_WORD;
6222 if (prefixes & (PREFIX_REPZ | PREFIX_REPNZ)) {
6223 gen_repz_lods(s, ot, pc_start - s->cs_base, s->pc - s->cs_base);
6224 } else {
6225 gen_lods(s, ot);
6226 }
6227 break;
6228 case 0xae: /* scasS */
6229 case 0xaf:
6230 if ((b & 1) == 0)
6231 ot = OT_BYTE;
6232 else
6233 ot = dflag + OT_WORD;
6234 if (prefixes & PREFIX_REPNZ) {
6235 gen_repz_scas(s, ot, pc_start - s->cs_base, s->pc - s->cs_base, 1);
6236 } else if (prefixes & PREFIX_REPZ) {
6237 gen_repz_scas(s, ot, pc_start - s->cs_base, s->pc - s->cs_base, 0);
6238 } else {
6239 gen_scas(s, ot);
6240 }
6241 break;
6242
6243 case 0xa6: /* cmpsS */
6244 case 0xa7:
6245 if ((b & 1) == 0)
6246 ot = OT_BYTE;
6247 else
6248 ot = dflag + OT_WORD;
6249 if (prefixes & PREFIX_REPNZ) {
6250 gen_repz_cmps(s, ot, pc_start - s->cs_base, s->pc - s->cs_base, 1);
6251 } else if (prefixes & PREFIX_REPZ) {
6252 gen_repz_cmps(s, ot, pc_start - s->cs_base, s->pc - s->cs_base, 0);
6253 } else {
6254 gen_cmps(s, ot);
6255 }
6256 break;
6257 case 0x6c: /* insS */
6258 case 0x6d:
6259 if ((b & 1) == 0)
6260 ot = OT_BYTE;
6261 else
6262 ot = dflag ? OT_LONG : OT_WORD;
6263 gen_op_mov_TN_reg(OT_WORD, 0, R_EDX);
6264 gen_op_andl_T0_ffff();
6265 gen_check_io(s, ot, pc_start - s->cs_base,
6266 SVM_IOIO_TYPE_MASK | svm_is_rep(prefixes) | 4);
6267 if (prefixes & (PREFIX_REPZ | PREFIX_REPNZ)) {
6268 gen_repz_ins(s, ot, pc_start - s->cs_base, s->pc - s->cs_base);
6269 } else {
6270 gen_ins(s, ot);
6271 if (use_icount) {
6272 gen_jmp(s, s->pc - s->cs_base);
6273 }
6274 }
6275 break;
6276 case 0x6e: /* outsS */
6277 case 0x6f:
6278 if ((b & 1) == 0)
6279 ot = OT_BYTE;
6280 else
6281 ot = dflag ? OT_LONG : OT_WORD;
6282 gen_op_mov_TN_reg(OT_WORD, 0, R_EDX);
6283 gen_op_andl_T0_ffff();
6284 gen_check_io(s, ot, pc_start - s->cs_base,
6285 svm_is_rep(prefixes) | 4);
6286 if (prefixes & (PREFIX_REPZ | PREFIX_REPNZ)) {
6287 gen_repz_outs(s, ot, pc_start - s->cs_base, s->pc - s->cs_base);
6288 } else {
6289 gen_outs(s, ot);
6290 if (use_icount) {
6291 gen_jmp(s, s->pc - s->cs_base);
6292 }
6293 }
6294 break;
6295
6296 /************************/
6297 /* port I/O */
6298
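/* Note (added): when icount is enabled, each I/O access below is
   bracketed with gen_io_start()/gen_io_end() and the TB is
   terminated with a jump to the next insn, so that the instruction
   count seen by the I/O callbacks stays exact. */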
6299 case 0xe4:
6300 case 0xe5:
6301 if ((b & 1) == 0)
6302 ot = OT_BYTE;
6303 else
6304 ot = dflag ? OT_LONG : OT_WORD;
6305 val = cpu_ldub_code(env, s->pc++);
6306 gen_op_movl_T0_im(val);
6307 gen_check_io(s, ot, pc_start - s->cs_base,
6308 SVM_IOIO_TYPE_MASK | svm_is_rep(prefixes));
6309 if (use_icount)
6310 gen_io_start();
6311 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
6312 gen_helper_in_func(ot, cpu_T[1], cpu_tmp2_i32);
6313 gen_op_mov_reg_T1(ot, R_EAX);
6314 if (use_icount) {
6315 gen_io_end();
6316 gen_jmp(s, s->pc - s->cs_base);
6317 }
6318 break;
6319 case 0xe6:
6320 case 0xe7:
6321 if ((b & 1) == 0)
6322 ot = OT_BYTE;
6323 else
6324 ot = dflag ? OT_LONG : OT_WORD;
6325 val = cpu_ldub_code(env, s->pc++);
6326 gen_op_movl_T0_im(val);
6327 gen_check_io(s, ot, pc_start - s->cs_base,
6328 svm_is_rep(prefixes));
6329 gen_op_mov_TN_reg(ot, 1, R_EAX);
6330
6331 if (use_icount)
6332 gen_io_start();
6333 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
6334 tcg_gen_trunc_tl_i32(cpu_tmp3_i32, cpu_T[1]);
6335 gen_helper_out_func(ot, cpu_tmp2_i32, cpu_tmp3_i32);
6336 if (use_icount) {
6337 gen_io_end();
6338 gen_jmp(s, s->pc - s->cs_base);
6339 }
6340 break;
6341 case 0xec:
6342 case 0xed:
6343 if ((b & 1) == 0)
6344 ot = OT_BYTE;
6345 else
6346 ot = dflag ? OT_LONG : OT_WORD;
6347 gen_op_mov_TN_reg(OT_WORD, 0, R_EDX);
6348 gen_op_andl_T0_ffff();
6349 gen_check_io(s, ot, pc_start - s->cs_base,
6350 SVM_IOIO_TYPE_MASK | svm_is_rep(prefixes));
6351 if (use_icount)
6352 gen_io_start();
6353 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
6354 gen_helper_in_func(ot, cpu_T[1], cpu_tmp2_i32);
6355 gen_op_mov_reg_T1(ot, R_EAX);
6356 if (use_icount) {
6357 gen_io_end();
6358 gen_jmp(s, s->pc - s->cs_base);
6359 }
6360 break;
6361 case 0xee:
6362 case 0xef:
6363 if ((b & 1) == 0)
6364 ot = OT_BYTE;
6365 else
6366 ot = dflag ? OT_LONG : OT_WORD;
6367 gen_op_mov_TN_reg(OT_WORD, 0, R_EDX);
6368 gen_op_andl_T0_ffff();
6369 gen_check_io(s, ot, pc_start - s->cs_base,
6370 svm_is_rep(prefixes));
6371 gen_op_mov_TN_reg(ot, 1, R_EAX);
6372
6373 if (use_icount)
6374 gen_io_start();
6375 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
6376 tcg_gen_trunc_tl_i32(cpu_tmp3_i32, cpu_T[1]);
6377 gen_helper_out_func(ot, cpu_tmp2_i32, cpu_tmp3_i32);
6378 if (use_icount) {
6379 gen_io_end();
6380 gen_jmp(s, s->pc - s->cs_base);
6381 }
6382 break;
6383
6384 /************************/
6385 /* control */
6386 case 0xc2: /* ret im */
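/* Note (added): in 64-bit mode the near RET operand size defaults
   to 64 bits (there is no 32-bit form), hence dflag is forced to 2
   below unless a 16-bit override is in effect */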
6387 val = cpu_ldsw_code(env, s->pc);
6388 s->pc += 2;
6389 gen_pop_T0(s);
6390 if (CODE64(s) && s->dflag)
6391 s->dflag = 2;
6392 gen_stack_update(s, val + (2 << s->dflag));
6393 if (s->dflag == 0)
6394 gen_op_andl_T0_ffff();
6395 gen_op_jmp_T0();
6396 gen_eob(s);
6397 break;
6398 case 0xc3: /* ret */
6399 gen_pop_T0(s);
6400 gen_pop_update(s);
6401 if (s->dflag == 0)
6402 gen_op_andl_T0_ffff();
6403 gen_op_jmp_T0();
6404 gen_eob(s);
6405 break;
6406 case 0xca: /* lret im */
6407 val = cpu_ldsw_code(env, s->pc);
6408 s->pc += 2;
6409 do_lret:
6410 if (s->pe && !s->vm86) {
6411 gen_update_cc_op(s);
6412 gen_jmp_im(pc_start - s->cs_base);
6413 gen_helper_lret_protected(cpu_env, tcg_const_i32(s->dflag),
6414 tcg_const_i32(val));
6415 } else {
6416 gen_stack_A0(s);
6417 /* pop offset */
6418 gen_op_ld_T0_A0(1 + s->dflag + s->mem_index);
6419 if (s->dflag == 0)
6420 gen_op_andl_T0_ffff();
6421 /* NOTE: keeping EIP updated is not a problem in case of
6422 exception */
6423 gen_op_jmp_T0();
6424 /* pop selector */
6425 gen_op_addl_A0_im(2 << s->dflag);
6426 gen_op_ld_T0_A0(1 + s->dflag + s->mem_index);
6427 gen_op_movl_seg_T0_vm(R_CS);
6428 /* add stack offset */
6429 gen_stack_update(s, val + (4 << s->dflag));
6430 }
6431 gen_eob(s);
6432 break;
6433 case 0xcb: /* lret */
6434 val = 0;
6435 goto do_lret;
6436 case 0xcf: /* iret */
6437 gen_svm_check_intercept(s, pc_start, SVM_EXIT_IRET);
6438 if (!s->pe) {
6439 /* real mode */
6440 gen_helper_iret_real(cpu_env, tcg_const_i32(s->dflag));
6441 set_cc_op(s, CC_OP_EFLAGS);
6442 } else if (s->vm86) {
6443 if (s->iopl != 3) {
6444 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
6445 } else {
6446 gen_helper_iret_real(cpu_env, tcg_const_i32(s->dflag));
6447 set_cc_op(s, CC_OP_EFLAGS);
6448 }
6449 } else {
6450 gen_update_cc_op(s);
6451 gen_jmp_im(pc_start - s->cs_base);
6452 gen_helper_iret_protected(cpu_env, tcg_const_i32(s->dflag),
6453 tcg_const_i32(s->pc - s->cs_base));
6454 set_cc_op(s, CC_OP_EFLAGS);
6455 }
6456 gen_eob(s);
6457 break;
6458 case 0xe8: /* call im */
6459 {
6460 if (dflag)
6461 tval = (int32_t)insn_get(env, s, OT_LONG);
6462 else
6463 tval = (int16_t)insn_get(env, s, OT_WORD);
6464 next_eip = s->pc - s->cs_base;
6465 tval += next_eip;
6466 if (s->dflag == 0)
6467 tval &= 0xffff;
6468 else if(!CODE64(s))
6469 tval &= 0xffffffff;
6470 gen_movtl_T0_im(next_eip);
6471 gen_push_T0(s);
6472 gen_jmp(s, tval);
6473 }
6474 break;
6475 case 0x9a: /* lcall im */
6476 {
6477 unsigned int selector, offset;
6478
6479 if (CODE64(s))
6480 goto illegal_op;
6481 ot = dflag ? OT_LONG : OT_WORD;
6482 offset = insn_get(env, s, ot);
6483 selector = insn_get(env, s, OT_WORD);
6484
6485 gen_op_movl_T0_im(selector);
6486 gen_op_movl_T1_imu(offset);
6487 }
6488 goto do_lcall;
6489 case 0xe9: /* jmp im */
6490 if (dflag)
6491 tval = (int32_t)insn_get(env, s, OT_LONG);
6492 else
6493 tval = (int16_t)insn_get(env, s, OT_WORD);
6494 tval += s->pc - s->cs_base;
6495 if (s->dflag == 0)
6496 tval &= 0xffff;
6497 else if(!CODE64(s))
6498 tval &= 0xffffffff;
6499 gen_jmp(s, tval);
6500 break;
6501 case 0xea: /* ljmp im */
6502 {
6503 unsigned int selector, offset;
6504
6505 if (CODE64(s))
6506 goto illegal_op;
6507 ot = dflag ? OT_LONG : OT_WORD;
6508 offset = insn_get(env, s, ot);
6509 selector = insn_get(env, s, OT_WORD);
6510
6511 gen_op_movl_T0_im(selector);
6512 gen_op_movl_T1_imu(offset);
6513 }
6514 goto do_ljmp;
6515 case 0xeb: /* jmp Jb */
6516 tval = (int8_t)insn_get(env, s, OT_BYTE);
6517 tval += s->pc - s->cs_base;
6518 if (s->dflag == 0)
6519 tval &= 0xffff;
6520 gen_jmp(s, tval);
6521 break;
6522 case 0x70 ... 0x7f: /* jcc Jb */
6523 tval = (int8_t)insn_get(env, s, OT_BYTE);
6524 goto do_jcc;
6525 case 0x180 ... 0x18f: /* jcc Jv */
6526 if (dflag) {
6527 tval = (int32_t)insn_get(env, s, OT_LONG);
6528 } else {
6529 tval = (int16_t)insn_get(env, s, OT_WORD);
6530 }
6531 do_jcc:
6532 next_eip = s->pc - s->cs_base;
6533 tval += next_eip;
6534 if (s->dflag == 0)
6535 tval &= 0xffff;
6536 gen_jcc(s, b, tval, next_eip);
6537 break;
6538
6539 case 0x190 ... 0x19f: /* setcc Gv */
6540 modrm = cpu_ldub_code(env, s->pc++);
6541 gen_setcc(s, b);
6542 gen_ldst_modrm(env, s, modrm, OT_BYTE, OR_TMP0, 1);
6543 break;
6544 case 0x140 ... 0x14f: /* cmov Gv, Ev */
6545 {
6546 int l1;
6547 TCGv t0;
6548
6549 ot = dflag + OT_WORD;
6550 modrm = cpu_ldub_code(env, s->pc++);
6551 reg = ((modrm >> 3) & 7) | rex_r;
6552 mod = (modrm >> 6) & 3;
6553 t0 = tcg_temp_local_new();
6554 if (mod != 3) {
6555 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
6556 gen_op_ld_v(ot + s->mem_index, t0, cpu_A0);
6557 } else {
6558 rm = (modrm & 7) | REX_B(s);
6559 gen_op_mov_v_reg(ot, t0, rm);
6560 }
6561 #ifdef TARGET_X86_64
6562 if (ot == OT_LONG) {
6563 /* XXX: specific Intel behaviour ? */
6564 l1 = gen_new_label();
6565 gen_jcc1(s, b ^ 1, l1);
6566 tcg_gen_mov_tl(cpu_regs[reg], t0);
6567 gen_set_label(l1);
6568 tcg_gen_ext32u_tl(cpu_regs[reg], cpu_regs[reg]);
6569 } else
6570 #endif
6571 {
6572 l1 = gen_new_label();
6573 gen_jcc1(s, b ^ 1, l1);
6574 gen_op_mov_reg_v(ot, reg, t0);
6575 gen_set_label(l1);
6576 }
6577 tcg_temp_free(t0);
6578 }
6579 break;
6580
6581 /************************/
6582 /* flags */
6583 case 0x9c: /* pushf */
6584 gen_svm_check_intercept(s, pc_start, SVM_EXIT_PUSHF);
6585 if (s->vm86 && s->iopl != 3) {
6586 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
6587 } else {
6588 gen_update_cc_op(s);
6589 gen_helper_read_eflags(cpu_T[0], cpu_env);
6590 gen_push_T0(s);
6591 }
6592 break;
6593 case 0x9d: /* popf */
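/* Note (added): POPF may update only a subset of EFLAGS, depending
   on privilege: at CPL 0 both IF and IOPL are writable; at
   CPL <= IOPL only IF is; otherwise neither is.  The 16-bit forms
   additionally restrict the mask to the low word. */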
6594 gen_svm_check_intercept(s, pc_start, SVM_EXIT_POPF);
6595 if (s->vm86 && s->iopl != 3) {
6596 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
6597 } else {
6598 gen_pop_T0(s);
6599 if (s->cpl == 0) {
6600 if (s->dflag) {
6601 gen_helper_write_eflags(cpu_env, cpu_T[0],
6602 tcg_const_i32((TF_MASK | AC_MASK |
6603 ID_MASK | NT_MASK |
6604 IF_MASK |
6605 IOPL_MASK)));
6606 } else {
6607 gen_helper_write_eflags(cpu_env, cpu_T[0],
6608 tcg_const_i32((TF_MASK | AC_MASK |
6609 ID_MASK | NT_MASK |
6610 IF_MASK | IOPL_MASK)
6611 & 0xffff));
6612 }
6613 } else {
6614 if (s->cpl <= s->iopl) {
6615 if (s->dflag) {
6616 gen_helper_write_eflags(cpu_env, cpu_T[0],
6617 tcg_const_i32((TF_MASK |
6618 AC_MASK |
6619 ID_MASK |
6620 NT_MASK |
6621 IF_MASK)));
6622 } else {
6623 gen_helper_write_eflags(cpu_env, cpu_T[0],
6624 tcg_const_i32((TF_MASK |
6625 AC_MASK |
6626 ID_MASK |
6627 NT_MASK |
6628 IF_MASK)
6629 & 0xffff));
6630 }
6631 } else {
6632 if (s->dflag) {
6633 gen_helper_write_eflags(cpu_env, cpu_T[0],
6634 tcg_const_i32((TF_MASK | AC_MASK |
6635 ID_MASK | NT_MASK)));
6636 } else {
6637 gen_helper_write_eflags(cpu_env, cpu_T[0],
6638 tcg_const_i32((TF_MASK | AC_MASK |
6639 ID_MASK | NT_MASK)
6640 & 0xffff));
6641 }
6642 }
6643 }
6644 gen_pop_update(s);
6645 set_cc_op(s, CC_OP_EFLAGS);
6646 /* abort translation because TF/AC flag may change */
6647 gen_jmp_im(s->pc - s->cs_base);
6648 gen_eob(s);
6649 }
6650 break;
6651 case 0x9e: /* sahf */
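/* Note (added): SAHF loads S/Z/A/P/C from AH while O is kept from
   the computed flags; in 64-bit mode it requires the LAHF_LM
   CPUID bit */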
6652 if (CODE64(s) && !(s->cpuid_ext3_features & CPUID_EXT3_LAHF_LM))
6653 goto illegal_op;
6654 gen_op_mov_TN_reg(OT_BYTE, 0, R_AH);
6655 gen_compute_eflags(s);
6656 tcg_gen_andi_tl(cpu_cc_src, cpu_cc_src, CC_O);
6657 tcg_gen_andi_tl(cpu_T[0], cpu_T[0], CC_S | CC_Z | CC_A | CC_P | CC_C);
6658 tcg_gen_or_tl(cpu_cc_src, cpu_cc_src, cpu_T[0]);
6659 break;
6660 case 0x9f: /* lahf */
6661 if (CODE64(s) && !(s->cpuid_ext3_features & CPUID_EXT3_LAHF_LM))
6662 goto illegal_op;
6663 gen_compute_eflags(s);
6664 /* Note: gen_compute_eflags() only gives the condition codes */
6665 tcg_gen_ori_tl(cpu_T[0], cpu_cc_src, 0x02);
6666 gen_op_mov_reg_T0(OT_BYTE, R_AH);
6667 break;
6668 case 0xf5: /* cmc */
6669 gen_compute_eflags(s);
6670 tcg_gen_xori_tl(cpu_cc_src, cpu_cc_src, CC_C);
6671 break;
6672 case 0xf8: /* clc */
6673 gen_compute_eflags(s);
6674 tcg_gen_andi_tl(cpu_cc_src, cpu_cc_src, ~CC_C);
6675 break;
6676 case 0xf9: /* stc */
6677 gen_compute_eflags(s);
6678 tcg_gen_ori_tl(cpu_cc_src, cpu_cc_src, CC_C);
6679 break;
6680 case 0xfc: /* cld */
6681 tcg_gen_movi_i32(cpu_tmp2_i32, 1);
6682 tcg_gen_st_i32(cpu_tmp2_i32, cpu_env, offsetof(CPUX86State, df));
6683 break;
6684 case 0xfd: /* std */
6685 tcg_gen_movi_i32(cpu_tmp2_i32, -1);
6686 tcg_gen_st_i32(cpu_tmp2_i32, cpu_env, offsetof(CPUX86State, df));
6687 break;
6688
6689 /************************/
6690 /* bit operations */
6691 case 0x1ba: /* bt/bts/btr/btc Gv, im */
6692 ot = dflag + OT_WORD;
6693 modrm = cpu_ldub_code(env, s->pc++);
6694 op = (modrm >> 3) & 7;
6695 mod = (modrm >> 6) & 3;
6696 rm = (modrm & 7) | REX_B(s);
6697 if (mod != 3) {
6698 s->rip_offset = 1;
6699 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
6700 gen_op_ld_T0_A0(ot + s->mem_index);
6701 } else {
6702 gen_op_mov_TN_reg(ot, 0, rm);
6703 }
6704 /* load shift */
6705 val = cpu_ldub_code(env, s->pc++);
6706 gen_op_movl_T1_im(val);
6707 if (op < 4)
6708 goto illegal_op;
6709 op -= 4;
6710 goto bt_op;
6711 case 0x1a3: /* bt Gv, Ev */
6712 op = 0;
6713 goto do_btx;
6714 case 0x1ab: /* bts */
6715 op = 1;
6716 goto do_btx;
6717 case 0x1b3: /* btr */
6718 op = 2;
6719 goto do_btx;
6720 case 0x1bb: /* btc */
6721 op = 3;
6722 do_btx:
6723 ot = dflag + OT_WORD;
6724 modrm = cpu_ldub_code(env, s->pc++);
6725 reg = ((modrm >> 3) & 7) | rex_r;
6726 mod = (modrm >> 6) & 3;
6727 rm = (modrm & 7) | REX_B(s);
6728 gen_op_mov_TN_reg(OT_LONG, 1, reg);
6729 if (mod != 3) {
6730 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
6731                 /* specific case: the bit index may fall outside the
                        addressed operand, so add the corresponding
                        displacement to A0 */
6732 gen_exts(ot, cpu_T[1]);
6733 tcg_gen_sari_tl(cpu_tmp0, cpu_T[1], 3 + ot);
6734 tcg_gen_shli_tl(cpu_tmp0, cpu_tmp0, ot);
6735 tcg_gen_add_tl(cpu_A0, cpu_A0, cpu_tmp0);
6736 gen_op_ld_T0_A0(ot + s->mem_index);
6737 } else {
6738 gen_op_mov_TN_reg(ot, 0, rm);
6739 }
6740 bt_op:
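/* Note (added): T1 is first reduced modulo the operand width; the
   selected bit is then shifted down to bit 0 of cpu_cc_src, which
   CC_OP_SARB + ot reports as CF.  BTS/BTR/BTC additionally OR,
   AND-NOT or XOR a single-bit mask into the operand. */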
6741 tcg_gen_andi_tl(cpu_T[1], cpu_T[1], (1 << (3 + ot)) - 1);
6742 switch(op) {
6743 case 0:
6744 tcg_gen_shr_tl(cpu_cc_src, cpu_T[0], cpu_T[1]);
6745 tcg_gen_movi_tl(cpu_cc_dst, 0);
6746 break;
6747 case 1:
6748 tcg_gen_shr_tl(cpu_tmp4, cpu_T[0], cpu_T[1]);
6749 tcg_gen_movi_tl(cpu_tmp0, 1);
6750 tcg_gen_shl_tl(cpu_tmp0, cpu_tmp0, cpu_T[1]);
6751 tcg_gen_or_tl(cpu_T[0], cpu_T[0], cpu_tmp0);
6752 break;
6753 case 2:
6754 tcg_gen_shr_tl(cpu_tmp4, cpu_T[0], cpu_T[1]);
6755 tcg_gen_movi_tl(cpu_tmp0, 1);
6756 tcg_gen_shl_tl(cpu_tmp0, cpu_tmp0, cpu_T[1]);
6757 tcg_gen_not_tl(cpu_tmp0, cpu_tmp0);
6758 tcg_gen_and_tl(cpu_T[0], cpu_T[0], cpu_tmp0);
6759 break;
6760 default:
6761 case 3:
6762 tcg_gen_shr_tl(cpu_tmp4, cpu_T[0], cpu_T[1]);
6763 tcg_gen_movi_tl(cpu_tmp0, 1);
6764 tcg_gen_shl_tl(cpu_tmp0, cpu_tmp0, cpu_T[1]);
6765 tcg_gen_xor_tl(cpu_T[0], cpu_T[0], cpu_tmp0);
6766 break;
6767 }
6768 set_cc_op(s, CC_OP_SARB + ot);
6769 if (op != 0) {
6770 if (mod != 3)
6771 gen_op_st_T0_A0(ot + s->mem_index);
6772 else
6773 gen_op_mov_reg_T0(ot, rm);
6774 tcg_gen_mov_tl(cpu_cc_src, cpu_tmp4);
6775 tcg_gen_movi_tl(cpu_cc_dst, 0);
6776 }
6777 break;
6778 case 0x1bc: /* bsf */
6779 case 0x1bd: /* bsr */
6780 {
6781 int label1;
6782 TCGv t0;
6783
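/* Note (added): a REPZ-prefixed BSR with the ABM extension executes
   as LZCNT and always writes its destination; plain BSF/BSR leave
   the destination unchanged when the source is zero and report that
   case through ZF (cc_dst stays 0) */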
6784 ot = dflag + OT_WORD;
6785 modrm = cpu_ldub_code(env, s->pc++);
6786 reg = ((modrm >> 3) & 7) | rex_r;
6787             gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 0);
6788 gen_extu(ot, cpu_T[0]);
6789 t0 = tcg_temp_local_new();
6790 tcg_gen_mov_tl(t0, cpu_T[0]);
6791 if ((b & 1) && (prefixes & PREFIX_REPZ) &&
6792 (s->cpuid_ext3_features & CPUID_EXT3_ABM)) {
6793 switch(ot) {
6794 case OT_WORD: gen_helper_lzcnt(cpu_T[0], t0,
6795 tcg_const_i32(16)); break;
6796 case OT_LONG: gen_helper_lzcnt(cpu_T[0], t0,
6797 tcg_const_i32(32)); break;
6798 case OT_QUAD: gen_helper_lzcnt(cpu_T[0], t0,
6799 tcg_const_i32(64)); break;
6800 }
6801 gen_op_mov_reg_T0(ot, reg);
6802 } else {
6803 label1 = gen_new_label();
6804 tcg_gen_movi_tl(cpu_cc_dst, 0);
6805 tcg_gen_brcondi_tl(TCG_COND_EQ, t0, 0, label1);
6806 if (b & 1) {
6807 gen_helper_bsr(cpu_T[0], t0);
6808 } else {
6809 gen_helper_bsf(cpu_T[0], t0);
6810 }
6811 gen_op_mov_reg_T0(ot, reg);
6812 tcg_gen_movi_tl(cpu_cc_dst, 1);
6813 gen_set_label(label1);
6814 set_cc_op(s, CC_OP_LOGICB + ot);
6815 }
6816 tcg_temp_free(t0);
6817 }
6818 break;
6819 /************************/
6820 /* bcd */
6821 case 0x27: /* daa */
6822 if (CODE64(s))
6823 goto illegal_op;
6824 gen_update_cc_op(s);
6825 gen_helper_daa(cpu_env);
6826 set_cc_op(s, CC_OP_EFLAGS);
6827 break;
6828 case 0x2f: /* das */
6829 if (CODE64(s))
6830 goto illegal_op;
6831 gen_update_cc_op(s);
6832 gen_helper_das(cpu_env);
6833 set_cc_op(s, CC_OP_EFLAGS);
6834 break;
6835 case 0x37: /* aaa */
6836 if (CODE64(s))
6837 goto illegal_op;
6838 gen_update_cc_op(s);
6839 gen_helper_aaa(cpu_env);
6840 set_cc_op(s, CC_OP_EFLAGS);
6841 break;
6842 case 0x3f: /* aas */
6843 if (CODE64(s))
6844 goto illegal_op;
6845 gen_update_cc_op(s);
6846 gen_helper_aas(cpu_env);
6847 set_cc_op(s, CC_OP_EFLAGS);
6848 break;
6849 case 0xd4: /* aam */
6850 if (CODE64(s))
6851 goto illegal_op;
6852 val = cpu_ldub_code(env, s->pc++);
6853 if (val == 0) {
6854 gen_exception(s, EXCP00_DIVZ, pc_start - s->cs_base);
6855 } else {
6856 gen_helper_aam(cpu_env, tcg_const_i32(val));
6857 set_cc_op(s, CC_OP_LOGICB);
6858 }
6859 break;
6860 case 0xd5: /* aad */
6861 if (CODE64(s))
6862 goto illegal_op;
6863 val = cpu_ldub_code(env, s->pc++);
6864 gen_helper_aad(cpu_env, tcg_const_i32(val));
6865 set_cc_op(s, CC_OP_LOGICB);
6866 break;
6867 /************************/
6868 /* misc */
6869 case 0x90: /* nop */
6870         /* XXX: implement the correct LOCK prefix test for all insns */
6871 if (prefixes & PREFIX_LOCK) {
6872 goto illegal_op;
6873 }
6874 /* If REX_B is set, then this is xchg eax, r8d, not a nop. */
6875 if (REX_B(s)) {
6876 goto do_xchg_reg_eax;
6877 }
6878 if (prefixes & PREFIX_REPZ) {
6879 gen_svm_check_intercept(s, pc_start, SVM_EXIT_PAUSE);
6880 }
6881 break;
6882 case 0x9b: /* fwait */
6883 if ((s->flags & (HF_MP_MASK | HF_TS_MASK)) ==
6884 (HF_MP_MASK | HF_TS_MASK)) {
6885 gen_exception(s, EXCP07_PREX, pc_start - s->cs_base);
6886 } else {
6887 gen_update_cc_op(s);
6888 gen_jmp_im(pc_start - s->cs_base);
6889 gen_helper_fwait(cpu_env);
6890 }
6891 break;
6892 case 0xcc: /* int3 */
6893 gen_interrupt(s, EXCP03_INT3, pc_start - s->cs_base, s->pc - s->cs_base);
6894 break;
6895 case 0xcd: /* int N */
6896 val = cpu_ldub_code(env, s->pc++);
6897 if (s->vm86 && s->iopl != 3) {
6898 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
6899 } else {
6900 gen_interrupt(s, val, pc_start - s->cs_base, s->pc - s->cs_base);
6901 }
6902 break;
6903 case 0xce: /* into */
6904 if (CODE64(s))
6905 goto illegal_op;
6906 gen_update_cc_op(s);
6907 gen_jmp_im(pc_start - s->cs_base);
6908 gen_helper_into(cpu_env, tcg_const_i32(s->pc - pc_start));
6909 break;
6910 #ifdef WANT_ICEBP
6911 case 0xf1: /* icebp (undocumented, exits to external debugger) */
6912 gen_svm_check_intercept(s, pc_start, SVM_EXIT_ICEBP);
6913 #if 1
6914 gen_debug(s, pc_start - s->cs_base);
6915 #else
6916 /* start debug */
6917 tb_flush(env);
6918 qemu_set_log(CPU_LOG_INT | CPU_LOG_TB_IN_ASM);
6919 #endif
6920 break;
6921 #endif
6922 case 0xfa: /* cli */
6923 if (!s->vm86) {
6924 if (s->cpl <= s->iopl) {
6925 gen_helper_cli(cpu_env);
6926 } else {
6927 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
6928 }
6929 } else {
6930 if (s->iopl == 3) {
6931 gen_helper_cli(cpu_env);
6932 } else {
6933 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
6934 }
6935 }
6936 break;
6937 case 0xfb: /* sti */
6938 if (!s->vm86) {
6939 if (s->cpl <= s->iopl) {
6940 gen_sti:
6941 gen_helper_sti(cpu_env);
6942                 /* interrupts are enabled only after the insn following STI */
6943                 /* if several consecutive insns inhibit interrupts, only the
6944                    _first_ one sets the inhibit flag */
6945 if (!(s->tb->flags & HF_INHIBIT_IRQ_MASK))
6946 gen_helper_set_inhibit_irq(cpu_env);
6947 /* give a chance to handle pending irqs */
6948 gen_jmp_im(s->pc - s->cs_base);
6949 gen_eob(s);
6950 } else {
6951 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
6952 }
6953 } else {
6954 if (s->iopl == 3) {
6955 goto gen_sti;
6956 } else {
6957 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
6958 }
6959 }
6960 break;
6961 case 0x62: /* bound */
6962 if (CODE64(s))
6963 goto illegal_op;
6964 ot = dflag ? OT_LONG : OT_WORD;
6965 modrm = cpu_ldub_code(env, s->pc++);
6966 reg = (modrm >> 3) & 7;
6967 mod = (modrm >> 6) & 3;
6968 if (mod == 3)
6969 goto illegal_op;
6970 gen_op_mov_TN_reg(ot, 0, reg);
6971 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
6972 gen_jmp_im(pc_start - s->cs_base);
6973 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
6974 if (ot == OT_WORD) {
6975 gen_helper_boundw(cpu_env, cpu_A0, cpu_tmp2_i32);
6976 } else {
6977 gen_helper_boundl(cpu_env, cpu_A0, cpu_tmp2_i32);
6978 }
6979 break;
6980 case 0x1c8 ... 0x1cf: /* bswap reg */
6981 reg = (b & 7) | REX_B(s);
6982 #ifdef TARGET_X86_64
6983 if (dflag == 2) {
6984 gen_op_mov_TN_reg(OT_QUAD, 0, reg);
6985 tcg_gen_bswap64_i64(cpu_T[0], cpu_T[0]);
6986 gen_op_mov_reg_T0(OT_QUAD, reg);
6987 } else
6988 #endif
6989 {
6990 gen_op_mov_TN_reg(OT_LONG, 0, reg);
6991 tcg_gen_ext32u_tl(cpu_T[0], cpu_T[0]);
6992 tcg_gen_bswap32_tl(cpu_T[0], cpu_T[0]);
6993 gen_op_mov_reg_T0(OT_LONG, reg);
6994 }
6995 break;
6996 case 0xd6: /* salc */
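/* Note (added): undocumented SALC sets AL = CF ? 0xff : 0.
   gen_compute_eflags_c() leaves CF as 0 or 1 in T0, so negating it
   yields 0 or -1, whose low byte is the desired result. */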
6997 if (CODE64(s))
6998 goto illegal_op;
6999 gen_compute_eflags_c(s, cpu_T[0], false);
7000 tcg_gen_neg_tl(cpu_T[0], cpu_T[0]);
7001 gen_op_mov_reg_T0(OT_BYTE, R_EAX);
7002 break;
7003 case 0xe0: /* loopnz */
7004 case 0xe1: /* loopz */
7005 case 0xe2: /* loop */
7006 case 0xe3: /* jecxz */
7007 {
7008 int l1, l2, l3;
7009
7010 tval = (int8_t)insn_get(env, s, OT_BYTE);
7011 next_eip = s->pc - s->cs_base;
7012 tval += next_eip;
7013 if (s->dflag == 0)
7014 tval &= 0xffff;
7015
7016 l1 = gen_new_label();
7017 l2 = gen_new_label();
7018 l3 = gen_new_label();
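/* Note (added): l1 is the branch-taken target, l2 the common exit;
   l3 is the not-taken path used by loopnz/loopz when ECX reaches
   zero after the decrement */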
7019 b &= 3;
7020 switch(b) {
7021 case 0: /* loopnz */
7022 case 1: /* loopz */
7023 gen_op_add_reg_im(s->aflag, R_ECX, -1);
7024 gen_op_jz_ecx(s->aflag, l3);
7025 gen_jcc1(s, (JCC_Z << 1) | (b ^ 1), l1);
7026 break;
7027 case 2: /* loop */
7028 gen_op_add_reg_im(s->aflag, R_ECX, -1);
7029 gen_op_jnz_ecx(s->aflag, l1);
7030 break;
7031 default:
7032 case 3: /* jcxz */
7033 gen_op_jz_ecx(s->aflag, l1);
7034 break;
7035 }
7036
7037 gen_set_label(l3);
7038 gen_jmp_im(next_eip);
7039 tcg_gen_br(l2);
7040
7041 gen_set_label(l1);
7042 gen_jmp_im(tval);
7043 gen_set_label(l2);
7044 gen_eob(s);
7045 }
7046 break;
7047 case 0x130: /* wrmsr */
7048 case 0x132: /* rdmsr */
7049 if (s->cpl != 0) {
7050 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7051 } else {
7052 gen_update_cc_op(s);
7053 gen_jmp_im(pc_start - s->cs_base);
7054 if (b & 2) {
7055 gen_helper_rdmsr(cpu_env);
7056 } else {
7057 gen_helper_wrmsr(cpu_env);
7058 }
7059 }
7060 break;
7061 case 0x131: /* rdtsc */
7062 gen_update_cc_op(s);
7063 gen_jmp_im(pc_start - s->cs_base);
7064 if (use_icount)
7065 gen_io_start();
7066 gen_helper_rdtsc(cpu_env);
7067 if (use_icount) {
7068 gen_io_end();
7069 gen_jmp(s, s->pc - s->cs_base);
7070 }
7071 break;
7072 case 0x133: /* rdpmc */
7073 gen_update_cc_op(s);
7074 gen_jmp_im(pc_start - s->cs_base);
7075 gen_helper_rdpmc(cpu_env);
7076 break;
7077 case 0x134: /* sysenter */
7078         /* On Intel CPUs, SYSENTER is valid in 64-bit mode */
7079 if (CODE64(s) && env->cpuid_vendor1 != CPUID_VENDOR_INTEL_1)
7080 goto illegal_op;
7081 if (!s->pe) {
7082 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7083 } else {
7084 gen_update_cc_op(s);
7085 gen_jmp_im(pc_start - s->cs_base);
7086 gen_helper_sysenter(cpu_env);
7087 gen_eob(s);
7088 }
7089 break;
7090 case 0x135: /* sysexit */
7091         /* On Intel CPUs, SYSEXIT is valid in 64-bit mode */
7092 if (CODE64(s) && env->cpuid_vendor1 != CPUID_VENDOR_INTEL_1)
7093 goto illegal_op;
7094 if (!s->pe) {
7095 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7096 } else {
7097 gen_update_cc_op(s);
7098 gen_jmp_im(pc_start - s->cs_base);
7099 gen_helper_sysexit(cpu_env, tcg_const_i32(dflag));
7100 gen_eob(s);
7101 }
7102 break;
7103 #ifdef TARGET_X86_64
7104 case 0x105: /* syscall */
7105         /* XXX: is it usable in real mode? */
7106 gen_update_cc_op(s);
7107 gen_jmp_im(pc_start - s->cs_base);
7108 gen_helper_syscall(cpu_env, tcg_const_i32(s->pc - pc_start));
7109 gen_eob(s);
7110 break;
7111 case 0x107: /* sysret */
7112 if (!s->pe) {
7113 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7114 } else {
7115 gen_update_cc_op(s);
7116 gen_jmp_im(pc_start - s->cs_base);
7117 gen_helper_sysret(cpu_env, tcg_const_i32(s->dflag));
7118 /* condition codes are modified only in long mode */
7119 if (s->lma) {
7120 set_cc_op(s, CC_OP_EFLAGS);
7121 }
7122 gen_eob(s);
7123 }
7124 break;
7125 #endif
7126 case 0x1a2: /* cpuid */
7127 gen_update_cc_op(s);
7128 gen_jmp_im(pc_start - s->cs_base);
7129 gen_helper_cpuid(cpu_env);
7130 break;
7131 case 0xf4: /* hlt */
7132 if (s->cpl != 0) {
7133 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7134 } else {
7135 gen_update_cc_op(s);
7136 gen_jmp_im(pc_start - s->cs_base);
7137 gen_helper_hlt(cpu_env, tcg_const_i32(s->pc - pc_start));
7138 s->is_jmp = DISAS_TB_JUMP;
7139 }
7140 break;
7141 case 0x100:
7142 modrm = cpu_ldub_code(env, s->pc++);
7143 mod = (modrm >> 6) & 3;
7144 op = (modrm >> 3) & 7;
7145 switch(op) {
7146 case 0: /* sldt */
7147 if (!s->pe || s->vm86)
7148 goto illegal_op;
7149 gen_svm_check_intercept(s, pc_start, SVM_EXIT_LDTR_READ);
7150 tcg_gen_ld32u_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,ldt.selector));
7151 ot = OT_WORD;
7152 if (mod == 3)
7153 ot += s->dflag;
7154 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 1);
7155 break;
7156 case 2: /* lldt */
7157 if (!s->pe || s->vm86)
7158 goto illegal_op;
7159 if (s->cpl != 0) {
7160 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7161 } else {
7162 gen_svm_check_intercept(s, pc_start, SVM_EXIT_LDTR_WRITE);
7163 gen_ldst_modrm(env, s, modrm, OT_WORD, OR_TMP0, 0);
7164 gen_jmp_im(pc_start - s->cs_base);
7165 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
7166 gen_helper_lldt(cpu_env, cpu_tmp2_i32);
7167 }
7168 break;
7169 case 1: /* str */
7170 if (!s->pe || s->vm86)
7171 goto illegal_op;
7172 gen_svm_check_intercept(s, pc_start, SVM_EXIT_TR_READ);
7173 tcg_gen_ld32u_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,tr.selector));
7174 ot = OT_WORD;
7175 if (mod == 3)
7176 ot += s->dflag;
7177 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 1);
7178 break;
7179 case 3: /* ltr */
7180 if (!s->pe || s->vm86)
7181 goto illegal_op;
7182 if (s->cpl != 0) {
7183 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7184 } else {
7185 gen_svm_check_intercept(s, pc_start, SVM_EXIT_TR_WRITE);
7186 gen_ldst_modrm(env, s, modrm, OT_WORD, OR_TMP0, 0);
7187 gen_jmp_im(pc_start - s->cs_base);
7188 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
7189 gen_helper_ltr(cpu_env, cpu_tmp2_i32);
7190 }
7191 break;
7192 case 4: /* verr */
7193 case 5: /* verw */
7194 if (!s->pe || s->vm86)
7195 goto illegal_op;
7196 gen_ldst_modrm(env, s, modrm, OT_WORD, OR_TMP0, 0);
7197 gen_update_cc_op(s);
7198 if (op == 4) {
7199 gen_helper_verr(cpu_env, cpu_T[0]);
7200 } else {
7201 gen_helper_verw(cpu_env, cpu_T[0]);
7202 }
7203 set_cc_op(s, CC_OP_EFLAGS);
7204 break;
7205 default:
7206 goto illegal_op;
7207 }
7208 break;
7209 case 0x101:
7210 modrm = cpu_ldub_code(env, s->pc++);
7211 mod = (modrm >> 6) & 3;
7212 op = (modrm >> 3) & 7;
7213 rm = modrm & 7;
7214 switch(op) {
7215 case 0: /* sgdt */
7216 if (mod == 3)
7217 goto illegal_op;
7218 gen_svm_check_intercept(s, pc_start, SVM_EXIT_GDTR_READ);
7219 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
7220 tcg_gen_ld32u_tl(cpu_T[0], cpu_env, offsetof(CPUX86State, gdt.limit));
7221 gen_op_st_T0_A0(OT_WORD + s->mem_index);
7222 gen_add_A0_im(s, 2);
7223 tcg_gen_ld_tl(cpu_T[0], cpu_env, offsetof(CPUX86State, gdt.base));
7224 if (!s->dflag)
7225 gen_op_andl_T0_im(0xffffff);
7226 gen_op_st_T0_A0(CODE64(s) + OT_LONG + s->mem_index);
7227 break;
7228 case 1:
7229 if (mod == 3) {
7230 switch (rm) {
7231 case 0: /* monitor */
7232 if (!(s->cpuid_ext_features & CPUID_EXT_MONITOR) ||
7233 s->cpl != 0)
7234 goto illegal_op;
7235 gen_update_cc_op(s);
7236 gen_jmp_im(pc_start - s->cs_base);
7237 #ifdef TARGET_X86_64
7238 if (s->aflag == 2) {
7239 gen_op_movq_A0_reg(R_EAX);
7240 } else
7241 #endif
7242 {
7243 gen_op_movl_A0_reg(R_EAX);
7244 if (s->aflag == 0)
7245 gen_op_andl_A0_ffff();
7246 }
7247 gen_add_A0_ds_seg(s);
7248 gen_helper_monitor(cpu_env, cpu_A0);
7249 break;
7250 case 1: /* mwait */
7251 if (!(s->cpuid_ext_features & CPUID_EXT_MONITOR) ||
7252 s->cpl != 0)
7253 goto illegal_op;
7254 gen_update_cc_op(s);
7255 gen_jmp_im(pc_start - s->cs_base);
7256 gen_helper_mwait(cpu_env, tcg_const_i32(s->pc - pc_start));
7257 gen_eob(s);
7258 break;
7259 case 2: /* clac */
7260 if (!(s->cpuid_7_0_ebx_features & CPUID_7_0_EBX_SMAP) ||
7261 s->cpl != 0) {
7262 goto illegal_op;
7263 }
7264 gen_helper_clac(cpu_env);
7265 gen_jmp_im(s->pc - s->cs_base);
7266 gen_eob(s);
7267 break;
7268 case 3: /* stac */
7269 if (!(s->cpuid_7_0_ebx_features & CPUID_7_0_EBX_SMAP) ||
7270 s->cpl != 0) {
7271 goto illegal_op;
7272 }
7273 gen_helper_stac(cpu_env);
7274 gen_jmp_im(s->pc - s->cs_base);
7275 gen_eob(s);
7276 break;
7277 default:
7278 goto illegal_op;
7279 }
7280 } else { /* sidt */
7281 gen_svm_check_intercept(s, pc_start, SVM_EXIT_IDTR_READ);
7282 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
7283 tcg_gen_ld32u_tl(cpu_T[0], cpu_env, offsetof(CPUX86State, idt.limit));
7284 gen_op_st_T0_A0(OT_WORD + s->mem_index);
7285 gen_add_A0_im(s, 2);
7286 tcg_gen_ld_tl(cpu_T[0], cpu_env, offsetof(CPUX86State, idt.base));
7287 if (!s->dflag)
7288 gen_op_andl_T0_im(0xffffff);
7289 gen_op_st_T0_A0(CODE64(s) + OT_LONG + s->mem_index);
7290 }
7291 break;
7292 case 2: /* lgdt */
7293 case 3: /* lidt */
7294 if (mod == 3) {
7295 gen_update_cc_op(s);
7296 gen_jmp_im(pc_start - s->cs_base);
7297 switch(rm) {
7298 case 0: /* VMRUN */
7299 if (!(s->flags & HF_SVME_MASK) || !s->pe)
7300 goto illegal_op;
7301 if (s->cpl != 0) {
7302 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7303 break;
7304 } else {
7305 gen_helper_vmrun(cpu_env, tcg_const_i32(s->aflag),
7306 tcg_const_i32(s->pc - pc_start));
7307 tcg_gen_exit_tb(0);
7308 s->is_jmp = DISAS_TB_JUMP;
7309 }
7310 break;
7311 case 1: /* VMMCALL */
7312 if (!(s->flags & HF_SVME_MASK))
7313 goto illegal_op;
7314 gen_helper_vmmcall(cpu_env);
7315 break;
7316 case 2: /* VMLOAD */
7317 if (!(s->flags & HF_SVME_MASK) || !s->pe)
7318 goto illegal_op;
7319 if (s->cpl != 0) {
7320 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7321 break;
7322 } else {
7323 gen_helper_vmload(cpu_env, tcg_const_i32(s->aflag));
7324 }
7325 break;
7326 case 3: /* VMSAVE */
7327 if (!(s->flags & HF_SVME_MASK) || !s->pe)
7328 goto illegal_op;
7329 if (s->cpl != 0) {
7330 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7331 break;
7332 } else {
7333 gen_helper_vmsave(cpu_env, tcg_const_i32(s->aflag));
7334 }
7335 break;
7336 case 4: /* STGI */
7337 if ((!(s->flags & HF_SVME_MASK) &&
7338 !(s->cpuid_ext3_features & CPUID_EXT3_SKINIT)) ||
7339 !s->pe)
7340 goto illegal_op;
7341 if (s->cpl != 0) {
7342 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7343 break;
7344 } else {
7345 gen_helper_stgi(cpu_env);
7346 }
7347 break;
7348 case 5: /* CLGI */
7349 if (!(s->flags & HF_SVME_MASK) || !s->pe)
7350 goto illegal_op;
7351 if (s->cpl != 0) {
7352 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7353 break;
7354 } else {
7355 gen_helper_clgi(cpu_env);
7356 }
7357 break;
7358 case 6: /* SKINIT */
7359 if ((!(s->flags & HF_SVME_MASK) &&
7360 !(s->cpuid_ext3_features & CPUID_EXT3_SKINIT)) ||
7361 !s->pe)
7362 goto illegal_op;
7363 gen_helper_skinit(cpu_env);
7364 break;
7365 case 7: /* INVLPGA */
7366 if (!(s->flags & HF_SVME_MASK) || !s->pe)
7367 goto illegal_op;
7368 if (s->cpl != 0) {
7369 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7370 break;
7371 } else {
7372 gen_helper_invlpga(cpu_env, tcg_const_i32(s->aflag));
7373 }
7374 break;
7375 default:
7376 goto illegal_op;
7377 }
7378 } else if (s->cpl != 0) {
7379 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7380 } else {
7381 gen_svm_check_intercept(s, pc_start,
7382 op==2 ? SVM_EXIT_GDTR_WRITE : SVM_EXIT_IDTR_WRITE);
7383 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
7384 gen_op_ld_T1_A0(OT_WORD + s->mem_index);
7385 gen_add_A0_im(s, 2);
7386 gen_op_ld_T0_A0(CODE64(s) + OT_LONG + s->mem_index);
7387 if (!s->dflag)
7388 gen_op_andl_T0_im(0xffffff);
7389 if (op == 2) {
7390 tcg_gen_st_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,gdt.base));
7391 tcg_gen_st32_tl(cpu_T[1], cpu_env, offsetof(CPUX86State,gdt.limit));
7392 } else {
7393 tcg_gen_st_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,idt.base));
7394 tcg_gen_st32_tl(cpu_T[1], cpu_env, offsetof(CPUX86State,idt.limit));
7395 }
7396 }
7397 break;
7398 case 4: /* smsw */
7399 gen_svm_check_intercept(s, pc_start, SVM_EXIT_READ_CR0);
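/* Note (added): read the low 32 bits of CR0; on a big-endian host
   with a 64-bit target they live in the high half of the
   target_ulong, hence the + 4 offset */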
7400 #if defined TARGET_X86_64 && defined HOST_WORDS_BIGENDIAN
7401 tcg_gen_ld32u_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,cr[0]) + 4);
7402 #else
7403 tcg_gen_ld32u_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,cr[0]));
7404 #endif
7405 gen_ldst_modrm(env, s, modrm, OT_WORD, OR_TMP0, 1);
7406 break;
7407 case 6: /* lmsw */
7408 if (s->cpl != 0) {
7409 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7410 } else {
7411 gen_svm_check_intercept(s, pc_start, SVM_EXIT_WRITE_CR0);
7412 gen_ldst_modrm(env, s, modrm, OT_WORD, OR_TMP0, 0);
7413 gen_helper_lmsw(cpu_env, cpu_T[0]);
7414 gen_jmp_im(s->pc - s->cs_base);
7415 gen_eob(s);
7416 }
7417 break;
7418 case 7:
7419 if (mod != 3) { /* invlpg */
7420 if (s->cpl != 0) {
7421 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7422 } else {
7423 gen_update_cc_op(s);
7424 gen_jmp_im(pc_start - s->cs_base);
7425 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
7426 gen_helper_invlpg(cpu_env, cpu_A0);
7427 gen_jmp_im(s->pc - s->cs_base);
7428 gen_eob(s);
7429 }
7430 } else {
7431 switch (rm) {
7432 case 0: /* swapgs */
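/* Note (added): SWAPGS exchanges the GS segment base with the
   kernelgsbase MSR; it only exists in 64-bit mode and requires
   CPL 0 */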
7433 #ifdef TARGET_X86_64
7434 if (CODE64(s)) {
7435 if (s->cpl != 0) {
7436 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7437 } else {
7438 tcg_gen_ld_tl(cpu_T[0], cpu_env,
7439 offsetof(CPUX86State,segs[R_GS].base));
7440 tcg_gen_ld_tl(cpu_T[1], cpu_env,
7441 offsetof(CPUX86State,kernelgsbase));
7442 tcg_gen_st_tl(cpu_T[1], cpu_env,
7443 offsetof(CPUX86State,segs[R_GS].base));
7444 tcg_gen_st_tl(cpu_T[0], cpu_env,
7445 offsetof(CPUX86State,kernelgsbase));
7446 }
7447 } else
7448 #endif
7449 {
7450 goto illegal_op;
7451 }
7452 break;
7453 case 1: /* rdtscp */
7454 if (!(s->cpuid_ext2_features & CPUID_EXT2_RDTSCP))
7455 goto illegal_op;
7456 gen_update_cc_op(s);
7457 gen_jmp_im(pc_start - s->cs_base);
7458 if (use_icount)
7459 gen_io_start();
7460 gen_helper_rdtscp(cpu_env);
7461 if (use_icount) {
7462 gen_io_end();
7463 gen_jmp(s, s->pc - s->cs_base);
7464 }
7465 break;
7466 default:
7467 goto illegal_op;
7468 }
7469 }
7470 break;
7471 default:
7472 goto illegal_op;
7473 }
7474 break;
7475 case 0x108: /* invd */
7476 case 0x109: /* wbinvd */
7477 if (s->cpl != 0) {
7478 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7479 } else {
7480 gen_svm_check_intercept(s, pc_start, (b & 2) ? SVM_EXIT_INVD : SVM_EXIT_WBINVD);
7481 /* nothing to do */
7482 }
7483 break;
7484 case 0x63: /* arpl or movslS (x86_64) */
7485 #ifdef TARGET_X86_64
7486 if (CODE64(s)) {
7487 int d_ot;
7488 /* d_ot is the size of destination */
7489 d_ot = dflag + OT_WORD;
7490
7491 modrm = cpu_ldub_code(env, s->pc++);
7492 reg = ((modrm >> 3) & 7) | rex_r;
7493 mod = (modrm >> 6) & 3;
7494 rm = (modrm & 7) | REX_B(s);
7495
7496 if (mod == 3) {
7497 gen_op_mov_TN_reg(OT_LONG, 0, rm);
7498 /* sign extend */
7499 if (d_ot == OT_QUAD)
7500 tcg_gen_ext32s_tl(cpu_T[0], cpu_T[0]);
7501 gen_op_mov_reg_T0(d_ot, reg);
7502 } else {
7503 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
7504 if (d_ot == OT_QUAD) {
7505 gen_op_lds_T0_A0(OT_LONG + s->mem_index);
7506 } else {
7507 gen_op_ld_T0_A0(OT_LONG + s->mem_index);
7508 }
7509 gen_op_mov_reg_T0(d_ot, reg);
7510 }
7511 } else
7512 #endif
7513 {
7514 int label1;
7515 TCGv t0, t1, t2, a0;
7516
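/* Note (added): ARPL — if the RPL field (low two bits) of the
   destination selector is below that of the source, raise it to the
   source RPL and set ZF, otherwise clear ZF.  t2 accumulates the
   new ZF value (0 or CC_Z) that is merged into cc_src at the end. */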
7517 if (!s->pe || s->vm86)
7518 goto illegal_op;
7519 t0 = tcg_temp_local_new();
7520 t1 = tcg_temp_local_new();
7521 t2 = tcg_temp_local_new();
7522 ot = OT_WORD;
7523 modrm = cpu_ldub_code(env, s->pc++);
7524 reg = (modrm >> 3) & 7;
7525 mod = (modrm >> 6) & 3;
7526 rm = modrm & 7;
7527 if (mod != 3) {
7528 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
7529 gen_op_ld_v(ot + s->mem_index, t0, cpu_A0);
7530 a0 = tcg_temp_local_new();
7531 tcg_gen_mov_tl(a0, cpu_A0);
7532 } else {
7533 gen_op_mov_v_reg(ot, t0, rm);
7534 TCGV_UNUSED(a0);
7535 }
7536 gen_op_mov_v_reg(ot, t1, reg);
7537 tcg_gen_andi_tl(cpu_tmp0, t0, 3);
7538 tcg_gen_andi_tl(t1, t1, 3);
7539 tcg_gen_movi_tl(t2, 0);
7540 label1 = gen_new_label();
7541 tcg_gen_brcond_tl(TCG_COND_GE, cpu_tmp0, t1, label1);
7542 tcg_gen_andi_tl(t0, t0, ~3);
7543 tcg_gen_or_tl(t0, t0, t1);
7544 tcg_gen_movi_tl(t2, CC_Z);
7545 gen_set_label(label1);
7546 if (mod != 3) {
7547 gen_op_st_v(ot + s->mem_index, t0, a0);
7548 tcg_temp_free(a0);
7549 } else {
7550 gen_op_mov_reg_v(ot, rm, t0);
7551 }
7552 gen_compute_eflags(s);
7553 tcg_gen_andi_tl(cpu_cc_src, cpu_cc_src, ~CC_Z);
7554 tcg_gen_or_tl(cpu_cc_src, cpu_cc_src, t2);
7555 tcg_temp_free(t0);
7556 tcg_temp_free(t1);
7557 tcg_temp_free(t2);
7558 }
7559 break;
7560 case 0x102: /* lar */
7561 case 0x103: /* lsl */
7562 {
7563 int label1;
7564 TCGv t0;
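/* Note (added): the lar/lsl helpers set ZF in cc_src when the
   selector is valid; the result is written back only in that case */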
7565 if (!s->pe || s->vm86)
7566 goto illegal_op;
7567 ot = dflag ? OT_LONG : OT_WORD;
7568 modrm = cpu_ldub_code(env, s->pc++);
7569 reg = ((modrm >> 3) & 7) | rex_r;
7570 gen_ldst_modrm(env, s, modrm, OT_WORD, OR_TMP0, 0);
7571 t0 = tcg_temp_local_new();
7572 gen_update_cc_op(s);
7573 if (b == 0x102) {
7574 gen_helper_lar(t0, cpu_env, cpu_T[0]);
7575 } else {
7576 gen_helper_lsl(t0, cpu_env, cpu_T[0]);
7577 }
7578 tcg_gen_andi_tl(cpu_tmp0, cpu_cc_src, CC_Z);
7579 label1 = gen_new_label();
7580 tcg_gen_brcondi_tl(TCG_COND_EQ, cpu_tmp0, 0, label1);
7581 gen_op_mov_reg_v(ot, reg, t0);
7582 gen_set_label(label1);
7583 set_cc_op(s, CC_OP_EFLAGS);
7584 tcg_temp_free(t0);
7585 }
7586 break;
7587 case 0x118:
7588 modrm = cpu_ldub_code(env, s->pc++);
7589 mod = (modrm >> 6) & 3;
7590 op = (modrm >> 3) & 7;
7591 switch(op) {
7592 case 0: /* prefetchnta */
7593             case 1: /* prefetcht0 */
7594             case 2: /* prefetcht1 */
7595             case 3: /* prefetcht2 */
7596 if (mod == 3)
7597 goto illegal_op;
7598 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
7599 /* nothing more to do */
7600 break;
7601 default: /* nop (multi byte) */
7602 gen_nop_modrm(env, s, modrm);
7603 break;
7604 }
7605 break;
7606 case 0x119 ... 0x11f: /* nop (multi byte) */
7607 modrm = cpu_ldub_code(env, s->pc++);
7608 gen_nop_modrm(env, s, modrm);
7609 break;
7610 case 0x120: /* mov reg, crN */
7611 case 0x122: /* mov crN, reg */
7612 if (s->cpl != 0) {
7613 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7614 } else {
7615 modrm = cpu_ldub_code(env, s->pc++);
7616 /* Ignore the mod bits (assume (modrm&0xc0)==0xc0).
7617 * AMD documentation (24594.pdf) and testing of
7618              * Intel 386 and 486 processors all show that the mod bits
7619 * are assumed to be 1's, regardless of actual values.
7620 */
7621 rm = (modrm & 7) | REX_B(s);
7622 reg = ((modrm >> 3) & 7) | rex_r;
7623 if (CODE64(s))
7624 ot = OT_QUAD;
7625 else
7626 ot = OT_LONG;
7627 if ((prefixes & PREFIX_LOCK) && (reg == 0) &&
7628 (s->cpuid_ext3_features & CPUID_EXT3_CR8LEG)) {
7629 reg = 8;
7630 }
7631 switch(reg) {
7632 case 0:
7633 case 2:
7634 case 3:
7635 case 4:
7636 case 8:
7637 gen_update_cc_op(s);
7638 gen_jmp_im(pc_start - s->cs_base);
7639 if (b & 2) {
7640 gen_op_mov_TN_reg(ot, 0, rm);
7641 gen_helper_write_crN(cpu_env, tcg_const_i32(reg),
7642 cpu_T[0]);
7643 gen_jmp_im(s->pc - s->cs_base);
7644 gen_eob(s);
7645 } else {
7646 gen_helper_read_crN(cpu_T[0], cpu_env, tcg_const_i32(reg));
7647 gen_op_mov_reg_T0(ot, rm);
7648 }
7649 break;
7650 default:
7651 goto illegal_op;
7652 }
7653 }
7654 break;
7655 case 0x121: /* mov reg, drN */
7656 case 0x123: /* mov drN, reg */
7657 if (s->cpl != 0) {
7658 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7659 } else {
7660 modrm = cpu_ldub_code(env, s->pc++);
7661 /* Ignore the mod bits (assume (modrm&0xc0)==0xc0).
7662 * AMD documentation (24594.pdf) and testing of
7663              * Intel 386 and 486 processors all show that the mod bits
7664 * are assumed to be 1's, regardless of actual values.
7665 */
7666 rm = (modrm & 7) | REX_B(s);
7667 reg = ((modrm >> 3) & 7) | rex_r;
7668 if (CODE64(s))
7669 ot = OT_QUAD;
7670 else
7671 ot = OT_LONG;
7672 /* XXX: do it dynamically with CR4.DE bit */
7673 if (reg == 4 || reg == 5 || reg >= 8)
7674 goto illegal_op;
7675 if (b & 2) {
7676 gen_svm_check_intercept(s, pc_start, SVM_EXIT_WRITE_DR0 + reg);
7677 gen_op_mov_TN_reg(ot, 0, rm);
7678 gen_helper_movl_drN_T0(cpu_env, tcg_const_i32(reg), cpu_T[0]);
7679 gen_jmp_im(s->pc - s->cs_base);
7680 gen_eob(s);
7681 } else {
7682 gen_svm_check_intercept(s, pc_start, SVM_EXIT_READ_DR0 + reg);
7683 tcg_gen_ld_tl(cpu_T[0], cpu_env, offsetof(CPUX86State,dr[reg]));
7684 gen_op_mov_reg_T0(ot, rm);
7685 }
7686 }
7687 break;
7688 case 0x106: /* clts */
7689 if (s->cpl != 0) {
7690 gen_exception(s, EXCP0D_GPF, pc_start - s->cs_base);
7691 } else {
7692 gen_svm_check_intercept(s, pc_start, SVM_EXIT_WRITE_CR0);
7693 gen_helper_clts(cpu_env);
7694 /* abort block because static cpu state changed */
7695 gen_jmp_im(s->pc - s->cs_base);
7696 gen_eob(s);
7697 }
7698 break;
7699 /* MMX/3DNow!/SSE/SSE2/SSE3/SSSE3/SSE4 support */
7700 case 0x1c3: /* MOVNTI reg, mem */
7701 if (!(s->cpuid_features & CPUID_SSE2))
7702 goto illegal_op;
7703 ot = s->dflag == 2 ? OT_QUAD : OT_LONG;
7704 modrm = cpu_ldub_code(env, s->pc++);
7705 mod = (modrm >> 6) & 3;
7706 if (mod == 3)
7707 goto illegal_op;
7708 reg = ((modrm >> 3) & 7) | rex_r;
7709 /* generate a generic store */
7710 gen_ldst_modrm(env, s, modrm, ot, reg, 1);
7711 break;
7712 case 0x1ae:
7713 modrm = cpu_ldub_code(env, s->pc++);
7714 mod = (modrm >> 6) & 3;
7715 op = (modrm >> 3) & 7;
7716 switch(op) {
7717 case 0: /* fxsave */
7718 if (mod == 3 || !(s->cpuid_features & CPUID_FXSR) ||
7719 (s->prefix & PREFIX_LOCK))
7720 goto illegal_op;
7721 if ((s->flags & HF_EM_MASK) || (s->flags & HF_TS_MASK)) {
7722 gen_exception(s, EXCP07_PREX, pc_start - s->cs_base);
7723 break;
7724 }
7725 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
7726 gen_update_cc_op(s);
7727 gen_jmp_im(pc_start - s->cs_base);
7728 gen_helper_fxsave(cpu_env, cpu_A0, tcg_const_i32((s->dflag == 2)));
7729 break;
7730 case 1: /* fxrstor */
7731 if (mod == 3 || !(s->cpuid_features & CPUID_FXSR) ||
7732 (s->prefix & PREFIX_LOCK))
7733 goto illegal_op;
7734 if ((s->flags & HF_EM_MASK) || (s->flags & HF_TS_MASK)) {
7735 gen_exception(s, EXCP07_PREX, pc_start - s->cs_base);
7736 break;
7737 }
7738 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
7739 gen_update_cc_op(s);
7740 gen_jmp_im(pc_start - s->cs_base);
7741 gen_helper_fxrstor(cpu_env, cpu_A0,
7742 tcg_const_i32((s->dflag == 2)));
7743 break;
7744 case 2: /* ldmxcsr */
7745 case 3: /* stmxcsr */
7746 if (s->flags & HF_TS_MASK) {
7747 gen_exception(s, EXCP07_PREX, pc_start - s->cs_base);
7748 break;
7749 }
7750 if ((s->flags & HF_EM_MASK) || !(s->flags & HF_OSFXSR_MASK) ||
7751 mod == 3)
7752 goto illegal_op;
7753 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
7754 if (op == 2) {
7755 gen_op_ld_T0_A0(OT_LONG + s->mem_index);
7756 tcg_gen_trunc_tl_i32(cpu_tmp2_i32, cpu_T[0]);
7757 gen_helper_ldmxcsr(cpu_env, cpu_tmp2_i32);
7758 } else {
7759 tcg_gen_ld32u_tl(cpu_T[0], cpu_env, offsetof(CPUX86State, mxcsr));
7760 gen_op_st_T0_A0(OT_LONG + s->mem_index);
7761 }
7762 break;
7763 case 5: /* lfence */
7764 case 6: /* mfence */
7765 if ((modrm & 0xc7) != 0xc0 || !(s->cpuid_features & CPUID_SSE2))
7766 goto illegal_op;
7767 break;
7768 case 7: /* sfence / clflush */
7769 if ((modrm & 0xc7) == 0xc0) {
7770 /* sfence */
7771 /* XXX: also check for cpuid_ext2_features & CPUID_EXT2_EMMX */
7772 if (!(s->cpuid_features & CPUID_SSE))
7773 goto illegal_op;
7774 } else {
7775 /* clflush */
7776 if (!(s->cpuid_features & CPUID_CLFLUSH))
7777 goto illegal_op;
7778 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
7779 }
7780 break;
7781 default:
7782 goto illegal_op;
7783 }
7784 break;
7785 case 0x10d: /* 3DNow! prefetch(w) */
7786 modrm = cpu_ldub_code(env, s->pc++);
7787 mod = (modrm >> 6) & 3;
7788 if (mod == 3)
7789 goto illegal_op;
7790 gen_lea_modrm(env, s, modrm, &reg_addr, &offset_addr);
7791 /* ignore for now */
7792 break;
7793 case 0x1aa: /* rsm */
7794 gen_svm_check_intercept(s, pc_start, SVM_EXIT_RSM);
7795 if (!(s->flags & HF_SMM_MASK))
7796 goto illegal_op;
7797 gen_update_cc_op(s);
7798 gen_jmp_im(s->pc - s->cs_base);
7799 gen_helper_rsm(cpu_env);
7800 gen_eob(s);
7801 break;
7802 case 0x1b8: /* SSE4.2 popcnt */
7803 if ((prefixes & (PREFIX_REPZ | PREFIX_LOCK | PREFIX_REPNZ)) !=
7804 PREFIX_REPZ)
7805 goto illegal_op;
7806 if (!(s->cpuid_ext_features & CPUID_EXT_POPCNT))
7807 goto illegal_op;
7808
7809 modrm = cpu_ldub_code(env, s->pc++);
7810 reg = ((modrm >> 3) & 7) | rex_r;
7811
7812 if (s->prefix & PREFIX_DATA)
7813 ot = OT_WORD;
7814 else if (s->dflag != 2)
7815 ot = OT_LONG;
7816 else
7817 ot = OT_QUAD;
7818
7819 gen_ldst_modrm(env, s, modrm, ot, OR_TMP0, 0);
7820 gen_helper_popcnt(cpu_T[0], cpu_env, cpu_T[0], tcg_const_i32(ot));
7821 gen_op_mov_reg_T0(ot, reg);
7822
7823 set_cc_op(s, CC_OP_EFLAGS);
7824 break;
7825 case 0x10e ... 0x10f:
7826 /* 3DNow! instructions, ignore prefixes */
7827 s->prefix &= ~(PREFIX_REPZ | PREFIX_REPNZ | PREFIX_DATA);
7828 case 0x110 ... 0x117:
7829 case 0x128 ... 0x12f:
7830 case 0x138 ... 0x13a:
7831 case 0x150 ... 0x179:
7832 case 0x17c ... 0x17f:
7833 case 0x1c2:
7834 case 0x1c4 ... 0x1c6:
7835 case 0x1d0 ... 0x1fe:
7836 gen_sse(env, s, b, pc_start, rex_r);
7837 break;
7838 default:
7839 goto illegal_op;
7840 }
7841 /* lock generation */
7842 if (s->prefix & PREFIX_LOCK)
7843 gen_helper_unlock();
7844 return s->pc;
7845 illegal_op:
7846 if (s->prefix & PREFIX_LOCK)
7847 gen_helper_unlock();
7848 /* XXX: ensure that no lock was generated */
7849 gen_exception(s, EXCP06_ILLOP, pc_start - s->cs_base);
7850 return s->pc;
7851 }
7852
7853 void optimize_flags_init(void)
7854 {
7855 cpu_env = tcg_global_reg_new_ptr(TCG_AREG0, "env");
7856 cpu_cc_op = tcg_global_mem_new_i32(TCG_AREG0,
7857 offsetof(CPUX86State, cc_op), "cc_op");
7858 cpu_cc_src = tcg_global_mem_new(TCG_AREG0, offsetof(CPUX86State, cc_src),
7859 "cc_src");
7860 cpu_cc_dst = tcg_global_mem_new(TCG_AREG0, offsetof(CPUX86State, cc_dst),
7861 "cc_dst");
7862
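/* Note (added): map the guest general-purpose registers onto fixed
   TCG globals backed by their slots in CPUX86State, so that
   generated code can reference them directly */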
7863 #ifdef TARGET_X86_64
7864 cpu_regs[R_EAX] = tcg_global_mem_new_i64(TCG_AREG0,
7865 offsetof(CPUX86State, regs[R_EAX]), "rax");
7866 cpu_regs[R_ECX] = tcg_global_mem_new_i64(TCG_AREG0,
7867 offsetof(CPUX86State, regs[R_ECX]), "rcx");
7868 cpu_regs[R_EDX] = tcg_global_mem_new_i64(TCG_AREG0,
7869 offsetof(CPUX86State, regs[R_EDX]), "rdx");
7870 cpu_regs[R_EBX] = tcg_global_mem_new_i64(TCG_AREG0,
7871 offsetof(CPUX86State, regs[R_EBX]), "rbx");
7872 cpu_regs[R_ESP] = tcg_global_mem_new_i64(TCG_AREG0,
7873 offsetof(CPUX86State, regs[R_ESP]), "rsp");
7874 cpu_regs[R_EBP] = tcg_global_mem_new_i64(TCG_AREG0,
7875 offsetof(CPUX86State, regs[R_EBP]), "rbp");
7876 cpu_regs[R_ESI] = tcg_global_mem_new_i64(TCG_AREG0,
7877 offsetof(CPUX86State, regs[R_ESI]), "rsi");
7878 cpu_regs[R_EDI] = tcg_global_mem_new_i64(TCG_AREG0,
7879 offsetof(CPUX86State, regs[R_EDI]), "rdi");
7880 cpu_regs[8] = tcg_global_mem_new_i64(TCG_AREG0,
7881 offsetof(CPUX86State, regs[8]), "r8");
7882 cpu_regs[9] = tcg_global_mem_new_i64(TCG_AREG0,
7883 offsetof(CPUX86State, regs[9]), "r9");
7884 cpu_regs[10] = tcg_global_mem_new_i64(TCG_AREG0,
7885 offsetof(CPUX86State, regs[10]), "r10");
7886 cpu_regs[11] = tcg_global_mem_new_i64(TCG_AREG0,
7887 offsetof(CPUX86State, regs[11]), "r11");
7888 cpu_regs[12] = tcg_global_mem_new_i64(TCG_AREG0,
7889 offsetof(CPUX86State, regs[12]), "r12");
7890 cpu_regs[13] = tcg_global_mem_new_i64(TCG_AREG0,
7891 offsetof(CPUX86State, regs[13]), "r13");
7892 cpu_regs[14] = tcg_global_mem_new_i64(TCG_AREG0,
7893 offsetof(CPUX86State, regs[14]), "r14");
7894 cpu_regs[15] = tcg_global_mem_new_i64(TCG_AREG0,
7895 offsetof(CPUX86State, regs[15]), "r15");
7896 #else
7897 cpu_regs[R_EAX] = tcg_global_mem_new_i32(TCG_AREG0,
7898 offsetof(CPUX86State, regs[R_EAX]), "eax");
7899 cpu_regs[R_ECX] = tcg_global_mem_new_i32(TCG_AREG0,
7900 offsetof(CPUX86State, regs[R_ECX]), "ecx");
7901 cpu_regs[R_EDX] = tcg_global_mem_new_i32(TCG_AREG0,
7902 offsetof(CPUX86State, regs[R_EDX]), "edx");
7903 cpu_regs[R_EBX] = tcg_global_mem_new_i32(TCG_AREG0,
7904 offsetof(CPUX86State, regs[R_EBX]), "ebx");
7905 cpu_regs[R_ESP] = tcg_global_mem_new_i32(TCG_AREG0,
7906 offsetof(CPUX86State, regs[R_ESP]), "esp");
7907 cpu_regs[R_EBP] = tcg_global_mem_new_i32(TCG_AREG0,
7908 offsetof(CPUX86State, regs[R_EBP]), "ebp");
7909 cpu_regs[R_ESI] = tcg_global_mem_new_i32(TCG_AREG0,
7910 offsetof(CPUX86State, regs[R_ESI]), "esi");
7911 cpu_regs[R_EDI] = tcg_global_mem_new_i32(TCG_AREG0,
7912 offsetof(CPUX86State, regs[R_EDI]), "edi");
7913 #endif
7914
7915 /* register helpers */
7916 #define GEN_HELPER 2
7917 #include "helper.h"
7918 }
7919
7920 /* generate intermediate code in gen_opc_buf and gen_opparam_buf for
7921 basic block 'tb'. If search_pc is TRUE, also generate PC
7922 information for each intermediate instruction. */
7923 static inline void gen_intermediate_code_internal(CPUX86State *env,
7924 TranslationBlock *tb,
7925 int search_pc)
7926 {
7927 DisasContext dc1, *dc = &dc1;
7928 target_ulong pc_ptr;
7929 uint16_t *gen_opc_end;
7930 CPUBreakpoint *bp;
7931 int j, lj;
7932 uint64_t flags;
7933 target_ulong pc_start;
7934 target_ulong cs_base;
7935 int num_insns;
7936 int max_insns;
7937
7938 /* generate intermediate code */
7939 pc_start = tb->pc;
7940 cs_base = tb->cs_base;
7941 flags = tb->flags;
7942
7943 dc->pe = (flags >> HF_PE_SHIFT) & 1;
7944 dc->code32 = (flags >> HF_CS32_SHIFT) & 1;
7945 dc->ss32 = (flags >> HF_SS32_SHIFT) & 1;
7946 dc->addseg = (flags >> HF_ADDSEG_SHIFT) & 1;
7947 dc->f_st = 0;
7948 dc->vm86 = (flags >> VM_SHIFT) & 1;
7949 dc->cpl = (flags >> HF_CPL_SHIFT) & 3;
7950 dc->iopl = (flags >> IOPL_SHIFT) & 3;
7951 dc->tf = (flags >> TF_SHIFT) & 1;
7952 dc->singlestep_enabled = env->singlestep_enabled;
7953 dc->cc_op = CC_OP_DYNAMIC;
7954 dc->cc_op_dirty = false;
7955 dc->cs_base = cs_base;
7956 dc->tb = tb;
7957 dc->popl_esp_hack = 0;
7958 /* select memory access functions */
7959 dc->mem_index = 0;
7960 if (flags & HF_SOFTMMU_MASK) {
7961 dc->mem_index = (cpu_mmu_index(env) + 1) << 2;
7962 }
7963 dc->cpuid_features = env->cpuid_features;
7964 dc->cpuid_ext_features = env->cpuid_ext_features;
7965 dc->cpuid_ext2_features = env->cpuid_ext2_features;
7966 dc->cpuid_ext3_features = env->cpuid_ext3_features;
7967 dc->cpuid_7_0_ebx_features = env->cpuid_7_0_ebx_features;
7968 #ifdef TARGET_X86_64
7969 dc->lma = (flags >> HF_LMA_SHIFT) & 1;
7970 dc->code64 = (flags >> HF_CS64_SHIFT) & 1;
7971 #endif
7972 dc->flags = flags;
7973 dc->jmp_opt = !(dc->tf || env->singlestep_enabled ||
7974 (flags & HF_INHIBIT_IRQ_MASK)
7975 #ifndef CONFIG_SOFTMMU
7976 || (flags & HF_SOFTMMU_MASK)
7977 #endif
7978 );
7979 #if 0
7980 /* check addseg logic */
7981 if (!dc->addseg && (dc->vm86 || !dc->pe || !dc->code32))
7982 printf("ERROR addseg\n");
7983 #endif
7984
    cpu_T[0] = tcg_temp_new();
    cpu_T[1] = tcg_temp_new();
    cpu_A0 = tcg_temp_new();
    cpu_T3 = tcg_temp_new();

    cpu_tmp0 = tcg_temp_new();
    cpu_tmp1_i64 = tcg_temp_new_i64();
    cpu_tmp2_i32 = tcg_temp_new_i32();
    cpu_tmp3_i32 = tcg_temp_new_i32();
    cpu_tmp4 = tcg_temp_new();
    cpu_tmp5 = tcg_temp_new();
    cpu_ptr0 = tcg_temp_new_ptr();
    cpu_ptr1 = tcg_temp_new_ptr();

    gen_opc_end = tcg_ctx.gen_opc_buf + OPC_MAX_SIZE;

    dc->is_jmp = DISAS_NEXT;
    pc_ptr = pc_start;
    lj = -1;
    num_insns = 0;
    max_insns = tb->cflags & CF_COUNT_MASK;
    if (max_insns == 0)
        max_insns = CF_COUNT_MASK;

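    /* With icount, tb->cflags carries the remaining instruction budget
       for this TB; otherwise CF_COUNT_MASK simply acts as "no limit"
       and translation stops on one of the conditions checked below. */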
    gen_icount_start();
    for(;;) {
        if (unlikely(!QTAILQ_EMPTY(&env->breakpoints))) {
            QTAILQ_FOREACH(bp, &env->breakpoints, entry) {
                if (bp->pc == pc_ptr &&
                    !((bp->flags & BP_CPU) && (tb->flags & HF_RF_MASK))) {
                    gen_debug(dc, pc_ptr - dc->cs_base);
                    break;
                }
            }
        }
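        /* gen_debug() emits a helper call that raises EXCP_DEBUG at run
           time, so a breakpoint traps before this instruction executes;
           the RF test skips architectural (BP_CPU) breakpoints when the
           resume flag is set, as the ISA requires. */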
        if (search_pc) {
            j = tcg_ctx.gen_opc_ptr - tcg_ctx.gen_opc_buf;
            if (lj < j) {
                lj++;
                while (lj < j)
                    tcg_ctx.gen_opc_instr_start[lj++] = 0;
            }
            tcg_ctx.gen_opc_pc[lj] = pc_ptr;
            gen_opc_cc_op[lj] = dc->cc_op;
            tcg_ctx.gen_opc_instr_start[lj] = 1;
            tcg_ctx.gen_opc_icount[lj] = num_insns;
        }
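        /* These side tables, indexed by micro-op position, are what
           restore_state_to_opc() below uses to map a host PC in
           generated code back to a guest eip and cc_op after a fault. */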
        if (num_insns + 1 == max_insns && (tb->cflags & CF_LAST_IO))
            gen_io_start();

        pc_ptr = disas_insn(env, dc, pc_ptr);
        num_insns++;
        /* stop translation if indicated */
        if (dc->is_jmp)
            break;
        /* in single-step mode, generate only one instruction and then
           raise an exception */
        /* if IRQs were inhibited with HF_INHIBIT_IRQ_MASK, clear the
           flag and abort the translation to give the IRQs a chance
           to happen */
        if (dc->tf || dc->singlestep_enabled ||
            (flags & HF_INHIBIT_IRQ_MASK)) {
            gen_jmp_im(pc_ptr - dc->cs_base);
            gen_eob(dc);
            break;
        }
        /* if the translation grows too long, stop generation too */
        if (tcg_ctx.gen_opc_ptr >= gen_opc_end ||
            (pc_ptr - pc_start) >= (TARGET_PAGE_SIZE - 32) ||
            num_insns >= max_insns) {
            gen_jmp_im(pc_ptr - dc->cs_base);
            gen_eob(dc);
            break;
        }
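        /* The TARGET_PAGE_SIZE - 32 bound keeps a TB within roughly one
           page of guest code, so per-page invalidation of translations
           (e.g. on self-modifying code) stays effective; the margin
           leaves room for one final, possibly long, x86 instruction. */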
        if (singlestep) {
            gen_jmp_im(pc_ptr - dc->cs_base);
            gen_eob(dc);
            break;
        }
    }
    if (tb->cflags & CF_LAST_IO)
        gen_io_end();
    gen_icount_end(tb, num_insns);
    *tcg_ctx.gen_opc_ptr = INDEX_op_end;
    /* make sure we fill in the last values */
    if (search_pc) {
        j = tcg_ctx.gen_opc_ptr - tcg_ctx.gen_opc_buf;
        lj++;
        while (lj <= j)
            tcg_ctx.gen_opc_instr_start[lj++] = 0;
    }

#ifdef DEBUG_DISAS
    if (qemu_loglevel_mask(CPU_LOG_TB_IN_ASM)) {
        int disas_flags;
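        /* Disassembler mode for the log: 2 = x86-64, 1 = 16-bit code,
           0 = 32-bit code. */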
        qemu_log("----------------\n");
        qemu_log("IN: %s\n", lookup_symbol(pc_start));
#ifdef TARGET_X86_64
        if (dc->code64)
            disas_flags = 2;
        else
#endif
            disas_flags = !dc->code32;
        log_target_disas(env, pc_start, pc_ptr - pc_start, disas_flags);
        qemu_log("\n");
    }
#endif

    if (!search_pc) {
        tb->size = pc_ptr - pc_start;
        tb->icount = num_insns;
    }
}

void gen_intermediate_code(CPUX86State *env, TranslationBlock *tb)
{
    gen_intermediate_code_internal(env, tb, 0);
}

void gen_intermediate_code_pc(CPUX86State *env, TranslationBlock *tb)
{
    gen_intermediate_code_internal(env, tb, 1);
}

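/* Called after a fault in generated code: pc_pos indexes the gen_opc_*
   side tables at the guest instruction that was executing.  Restore eip,
   and cc_op too unless it was recorded as CC_OP_DYNAMIC (in which case
   env->cc_op already holds the live value). */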
void restore_state_to_opc(CPUX86State *env, TranslationBlock *tb, int pc_pos)
{
    int cc_op;
#ifdef DEBUG_DISAS
    if (qemu_loglevel_mask(CPU_LOG_TB_OP)) {
        int i;
        qemu_log("RESTORE:\n");
        for (i = 0; i <= pc_pos; i++) {
            if (tcg_ctx.gen_opc_instr_start[i]) {
                qemu_log("0x%04x: " TARGET_FMT_lx "\n", i,
                         tcg_ctx.gen_opc_pc[i]);
            }
        }
        qemu_log("pc_pos=0x%x eip=" TARGET_FMT_lx " cs_base=%x\n",
                 pc_pos, tcg_ctx.gen_opc_pc[pc_pos] - tb->cs_base,
                 (uint32_t)tb->cs_base);
    }
#endif
    env->eip = tcg_ctx.gen_opc_pc[pc_pos] - tb->cs_base;
    cc_op = gen_opc_cc_op[pc_pos];
    if (cc_op != CC_OP_DYNAMIC)
        env->cc_op = cc_op;
}