1 /******************************************************************************
4 * Generic x86 (32-bit and 64-bit) instruction decoder and emulator.
6 * Copyright (c) 2005 Keir Fraser
8 * Linux coding style, mod r/m decoder, segment base fixes, real-mode
9 * privileged instructions:
11 * Copyright (C) 2006 Qumranet
12 * Copyright 2010 Red Hat, Inc. and/or its affiliates.
14 * Avi Kivity <avi@qumranet.com>
15 * Yaniv Kamay <yaniv@qumranet.com>
17 * This work is licensed under the terms of the GNU GPL, version 2. See
18 * the COPYING file in the top-level directory.
20 * From: xen-unstable 10676:af9809f51f81a3c43f276f00c81a52ef558afda4
23 #include <linux/kvm_host.h>
24 #include "kvm_cache_regs.h"
25 #include <linux/module.h>
26 #include <asm/kvm_emulate.h>
35 #define OpImplicit 1ull /* No generic decode */
36 #define OpReg 2ull /* Register */
37 #define OpMem 3ull /* Memory */
38 #define OpAcc 4ull /* Accumulator: AL/AX/EAX/RAX */
39 #define OpDI 5ull /* ES:DI/EDI/RDI */
40 #define OpMem64 6ull /* Memory, 64-bit */
41 #define OpImmUByte 7ull /* Zero-extended 8-bit immediate */
42 #define OpDX 8ull /* DX register */
43 #define OpCL 9ull /* CL register (for shifts) */
44 #define OpImmByte 10ull /* 8-bit sign extended immediate */
45 #define OpOne 11ull /* Implied 1 */
46 #define OpImm 12ull /* Sign extended immediate */
47 #define OpMem16 13ull /* Memory operand (16-bit). */
48 #define OpMem32 14ull /* Memory operand (32-bit). */
49 #define OpImmU 15ull /* Immediate operand, zero extended */
50 #define OpSI 16ull /* SI/ESI/RSI */
51 #define OpImmFAddr 17ull /* Immediate far address */
52 #define OpMemFAddr 18ull /* Far address in memory */
53 #define OpImmU16 19ull /* Immediate operand, 16 bits, zero extended */
54 #define OpES 20ull /* ES */
55 #define OpCS 21ull /* CS */
56 #define OpSS 22ull /* SS */
57 #define OpDS 23ull /* DS */
58 #define OpFS 24ull /* FS */
59 #define OpGS 25ull /* GS */
60 #define OpMem8 26ull /* 8-bit zero extended memory operand */
62 #define OpBits 5 /* Width of operand field */
63 #define OpMask ((1ull << OpBits) - 1)
66 * Opcode effective-address decode tables.
67 * Note that we only emulate instructions that have at least one memory
68 * operand (excluding implicit stack references). We assume that stack
69 * references and instruction fetches will never occur in special memory
70 * areas that require emulation. So, for example, 'mov <imm>,<reg>' need
74 /* Operand sizes: 8-bit operands or specified/overridden size. */
75 #define ByteOp (1<<0) /* 8-bit operands. */
76 /* Destination operand type. */
78 #define ImplicitOps (OpImplicit << DstShift)
79 #define DstReg (OpReg << DstShift)
80 #define DstMem (OpMem << DstShift)
81 #define DstAcc (OpAcc << DstShift)
82 #define DstDI (OpDI << DstShift)
83 #define DstMem64 (OpMem64 << DstShift)
84 #define DstImmUByte (OpImmUByte << DstShift)
85 #define DstDX (OpDX << DstShift)
86 #define DstMask (OpMask << DstShift)
87 /* Source operand type. */
89 #define SrcNone (OpNone << SrcShift)
90 #define SrcReg (OpReg << SrcShift)
91 #define SrcMem (OpMem << SrcShift)
92 #define SrcMem16 (OpMem16 << SrcShift)
93 #define SrcMem32 (OpMem32 << SrcShift)
94 #define SrcImm (OpImm << SrcShift)
95 #define SrcImmByte (OpImmByte << SrcShift)
96 #define SrcOne (OpOne << SrcShift)
97 #define SrcImmUByte (OpImmUByte << SrcShift)
98 #define SrcImmU (OpImmU << SrcShift)
99 #define SrcSI (OpSI << SrcShift)
100 #define SrcImmFAddr (OpImmFAddr << SrcShift)
101 #define SrcMemFAddr (OpMemFAddr << SrcShift)
102 #define SrcAcc (OpAcc << SrcShift)
103 #define SrcImmU16 (OpImmU16 << SrcShift)
104 #define SrcDX (OpDX << SrcShift)
105 #define SrcMem8 (OpMem8 << SrcShift)
106 #define SrcMask (OpMask << SrcShift)
107 #define BitOp (1<<11)
108 #define MemAbs (1<<12) /* Memory operand is absolute displacement */
109 #define String (1<<13) /* String instruction (rep capable) */
110 #define Stack (1<<14) /* Stack instruction (push/pop) */
111 #define GroupMask (7<<15) /* Opcode uses one of the group mechanisms */
112 #define Group (1<<15) /* Bits 3:5 of modrm byte extend opcode */
113 #define GroupDual (2<<15) /* Alternate decoding of mod == 3 */
114 #define Prefix (3<<15) /* Instruction varies with 66/f2/f3 prefix */
115 #define RMExt (4<<15) /* Opcode extension in ModRM r/m if mod == 3 */
116 #define Sse (1<<18) /* SSE Vector instruction */
117 /* Generic ModRM decode. */
118 #define ModRM (1<<19)
119 /* Destination is only written; never read. */
122 #define Prot (1<<21) /* instruction generates #UD if not in prot-mode */
123 #define VendorSpecific (1<<22) /* Vendor specific instruction */
124 #define NoAccess (1<<23) /* Don't access memory (lea/invlpg/verr etc) */
125 #define Op3264 (1<<24) /* Operand is 64b in long mode, 32b otherwise */
126 #define Undefined (1<<25) /* No Such Instruction */
127 #define Lock (1<<26) /* lock prefix is allowed for the instruction */
128 #define Priv (1<<27) /* instruction generates #GP if current CPL != 0 */
130 #define PageTable (1 << 29) /* instruction used to write page table */
131 /* Source 2 operand type */
132 #define Src2Shift (30)
133 #define Src2None (OpNone << Src2Shift)
134 #define Src2CL (OpCL << Src2Shift)
135 #define Src2ImmByte (OpImmByte << Src2Shift)
136 #define Src2One (OpOne << Src2Shift)
137 #define Src2Imm (OpImm << Src2Shift)
138 #define Src2ES (OpES << Src2Shift)
139 #define Src2CS (OpCS << Src2Shift)
140 #define Src2SS (OpSS << Src2Shift)
141 #define Src2DS (OpDS << Src2Shift)
142 #define Src2FS (OpFS << Src2Shift)
143 #define Src2GS (OpGS << Src2Shift)
144 #define Src2Mask (OpMask << Src2Shift)
145 #define Mmx ((u64)1 << 40) /* MMX Vector instruction */
146 #define Aligned ((u64)1 << 41) /* Explicitly aligned (e.g. MOVDQA) */
147 #define Unaligned ((u64)1 << 42) /* Explicitly unaligned (e.g. MOVDQU) */
148 #define Avx ((u64)1 << 43) /* Advanced Vector Extensions */
150 #define X2(x...) x, x
151 #define X3(x...) X2(x), x
152 #define X4(x...) X2(x), X2(x)
153 #define X5(x...) X4(x), x
154 #define X6(x...) X4(x), X2(x)
155 #define X7(x...) X4(x), X3(x)
156 #define X8(x...) X4(x), X4(x)
157 #define X16(x...) X8(x), X8(x)
163 int (*execute
)(struct x86_emulate_ctxt
*ctxt
);
164 struct opcode
*group
;
165 struct group_dual
*gdual
;
166 struct gprefix
*gprefix
;
168 int (*check_perm
)(struct x86_emulate_ctxt
*ctxt
);
172 struct opcode mod012
[8];
173 struct opcode mod3
[8];
177 struct opcode pfx_no
;
178 struct opcode pfx_66
;
179 struct opcode pfx_f2
;
180 struct opcode pfx_f3
;
183 /* EFLAGS bit definitions. */
184 #define EFLG_ID (1<<21)
185 #define EFLG_VIP (1<<20)
186 #define EFLG_VIF (1<<19)
187 #define EFLG_AC (1<<18)
188 #define EFLG_VM (1<<17)
189 #define EFLG_RF (1<<16)
190 #define EFLG_IOPL (3<<12)
191 #define EFLG_NT (1<<14)
192 #define EFLG_OF (1<<11)
193 #define EFLG_DF (1<<10)
194 #define EFLG_IF (1<<9)
195 #define EFLG_TF (1<<8)
196 #define EFLG_SF (1<<7)
197 #define EFLG_ZF (1<<6)
198 #define EFLG_AF (1<<4)
199 #define EFLG_PF (1<<2)
200 #define EFLG_CF (1<<0)
202 #define EFLG_RESERVED_ZEROS_MASK 0xffc0802a
203 #define EFLG_RESERVED_ONE_MASK 2
206 * Instruction emulation:
207 * Most instructions are emulated directly via a fragment of inline assembly
208 * code. This allows us to save/restore EFLAGS and thus very easily pick up
209 * any modified flags.
212 #if defined(CONFIG_X86_64)
213 #define _LO32 "k" /* force 32-bit operand */
214 #define _STK "%%rsp" /* stack pointer */
215 #elif defined(__i386__)
216 #define _LO32 "" /* force 32-bit operand */
217 #define _STK "%%esp" /* stack pointer */
221 * These EFLAGS bits are restored from saved value during emulation, and
222 * any changes are written back to the saved value after emulation.
224 #define EFLAGS_MASK (EFLG_OF|EFLG_SF|EFLG_ZF|EFLG_AF|EFLG_PF|EFLG_CF)
226 /* Before executing instruction: restore necessary bits in EFLAGS. */
227 #define _PRE_EFLAGS(_sav, _msk, _tmp) \
228 /* EFLAGS = (_sav & _msk) | (EFLAGS & ~_msk); _sav &= ~_msk; */ \
229 "movl %"_sav",%"_LO32 _tmp"; " \
232 "movl %"_msk",%"_LO32 _tmp"; " \
233 "andl %"_LO32 _tmp",("_STK"); " \
235 "notl %"_LO32 _tmp"; " \
236 "andl %"_LO32 _tmp",("_STK"); " \
237 "andl %"_LO32 _tmp","__stringify(BITS_PER_LONG/4)"("_STK"); " \
239 "orl %"_LO32 _tmp",("_STK"); " \
243 /* After executing instruction: write-back necessary bits in EFLAGS. */
244 #define _POST_EFLAGS(_sav, _msk, _tmp) \
245 /* _sav |= EFLAGS & _msk; */ \
248 "andl %"_msk",%"_LO32 _tmp"; " \
249 "orl %"_LO32 _tmp",%"_sav"; "
257 #define ____emulate_2op(ctxt, _op, _x, _y, _suffix, _dsttype) \
259 __asm__ __volatile__ ( \
260 _PRE_EFLAGS("0", "4", "2") \
261 _op _suffix " %"_x"3,%1; " \
262 _POST_EFLAGS("0", "4", "2") \
263 : "=m" ((ctxt)->eflags), \
264 "+q" (*(_dsttype*)&(ctxt)->dst.val), \
266 : _y ((ctxt)->src.val), "i" (EFLAGS_MASK)); \
270 /* Raw emulation: instruction has two explicit operands. */
271 #define __emulate_2op_nobyte(ctxt,_op,_wx,_wy,_lx,_ly,_qx,_qy) \
273 unsigned long _tmp; \
275 switch ((ctxt)->dst.bytes) { \
277 ____emulate_2op(ctxt,_op,_wx,_wy,"w",u16); \
280 ____emulate_2op(ctxt,_op,_lx,_ly,"l",u32); \
283 ON64(____emulate_2op(ctxt,_op,_qx,_qy,"q",u64)); \
288 #define __emulate_2op(ctxt,_op,_bx,_by,_wx,_wy,_lx,_ly,_qx,_qy) \
290 unsigned long _tmp; \
291 switch ((ctxt)->dst.bytes) { \
293 ____emulate_2op(ctxt,_op,_bx,_by,"b",u8); \
296 __emulate_2op_nobyte(ctxt, _op, \
297 _wx, _wy, _lx, _ly, _qx, _qy); \
302 /* Source operand is byte-sized and may be restricted to just %cl. */
303 #define emulate_2op_SrcB(ctxt, _op) \
304 __emulate_2op(ctxt, _op, "b", "c", "b", "c", "b", "c", "b", "c")
306 /* Source operand is byte, word, long or quad sized. */
307 #define emulate_2op_SrcV(ctxt, _op) \
308 __emulate_2op(ctxt, _op, "b", "q", "w", "r", _LO32, "r", "", "r")
310 /* Source operand is word, long or quad sized. */
311 #define emulate_2op_SrcV_nobyte(ctxt, _op) \
312 __emulate_2op_nobyte(ctxt, _op, "w", "r", _LO32, "r", "", "r")
314 /* Instruction has three operands and one operand is stored in ECX register */
315 #define __emulate_2op_cl(ctxt, _op, _suffix, _type) \
317 unsigned long _tmp; \
318 _type _clv = (ctxt)->src2.val; \
319 _type _srcv = (ctxt)->src.val; \
320 _type _dstv = (ctxt)->dst.val; \
322 __asm__ __volatile__ ( \
323 _PRE_EFLAGS("0", "5", "2") \
324 _op _suffix " %4,%1 \n" \
325 _POST_EFLAGS("0", "5", "2") \
326 : "=m" ((ctxt)->eflags), "+r" (_dstv), "=&r" (_tmp) \
327 : "c" (_clv) , "r" (_srcv), "i" (EFLAGS_MASK) \
330 (ctxt)->src2.val = (unsigned long) _clv; \
331 (ctxt)->src2.val = (unsigned long) _srcv; \
332 (ctxt)->dst.val = (unsigned long) _dstv; \
335 #define emulate_2op_cl(ctxt, _op) \
337 switch ((ctxt)->dst.bytes) { \
339 __emulate_2op_cl(ctxt, _op, "w", u16); \
342 __emulate_2op_cl(ctxt, _op, "l", u32); \
345 ON64(__emulate_2op_cl(ctxt, _op, "q", ulong)); \
350 #define __emulate_1op(ctxt, _op, _suffix) \
352 unsigned long _tmp; \
354 __asm__ __volatile__ ( \
355 _PRE_EFLAGS("0", "3", "2") \
356 _op _suffix " %1; " \
357 _POST_EFLAGS("0", "3", "2") \
358 : "=m" ((ctxt)->eflags), "+m" ((ctxt)->dst.val), \
360 : "i" (EFLAGS_MASK)); \
363 /* Instruction has only one explicit operand (no source operand). */
364 #define emulate_1op(ctxt, _op) \
366 switch ((ctxt)->dst.bytes) { \
367 case 1: __emulate_1op(ctxt, _op, "b"); break; \
368 case 2: __emulate_1op(ctxt, _op, "w"); break; \
369 case 4: __emulate_1op(ctxt, _op, "l"); break; \
370 case 8: ON64(__emulate_1op(ctxt, _op, "q")); break; \
374 #define __emulate_1op_rax_rdx(ctxt, _op, _suffix, _ex) \
376 unsigned long _tmp; \
377 ulong *rax = &(ctxt)->regs[VCPU_REGS_RAX]; \
378 ulong *rdx = &(ctxt)->regs[VCPU_REGS_RDX]; \
380 __asm__ __volatile__ ( \
381 _PRE_EFLAGS("0", "5", "1") \
383 _op _suffix " %6; " \
385 _POST_EFLAGS("0", "5", "1") \
386 ".pushsection .fixup,\"ax\" \n\t" \
387 "3: movb $1, %4 \n\t" \
390 _ASM_EXTABLE(1b, 3b) \
391 : "=m" ((ctxt)->eflags), "=&r" (_tmp), \
392 "+a" (*rax), "+d" (*rdx), "+qm"(_ex) \
393 : "i" (EFLAGS_MASK), "m" ((ctxt)->src.val), \
394 "a" (*rax), "d" (*rdx)); \
397 /* instruction has only one source operand, destination is implicit (e.g. mul, div, imul, idiv) */
398 #define emulate_1op_rax_rdx(ctxt, _op, _ex) \
400 switch((ctxt)->src.bytes) { \
402 __emulate_1op_rax_rdx(ctxt, _op, "b", _ex); \
405 __emulate_1op_rax_rdx(ctxt, _op, "w", _ex); \
408 __emulate_1op_rax_rdx(ctxt, _op, "l", _ex); \
411 __emulate_1op_rax_rdx(ctxt, _op, "q", _ex)); \
416 static int emulator_check_intercept(struct x86_emulate_ctxt
*ctxt
,
417 enum x86_intercept intercept
,
418 enum x86_intercept_stage stage
)
420 struct x86_instruction_info info
= {
421 .intercept
= intercept
,
422 .rep_prefix
= ctxt
->rep_prefix
,
423 .modrm_mod
= ctxt
->modrm_mod
,
424 .modrm_reg
= ctxt
->modrm_reg
,
425 .modrm_rm
= ctxt
->modrm_rm
,
426 .src_val
= ctxt
->src
.val64
,
427 .src_bytes
= ctxt
->src
.bytes
,
428 .dst_bytes
= ctxt
->dst
.bytes
,
429 .ad_bytes
= ctxt
->ad_bytes
,
430 .next_rip
= ctxt
->eip
,
433 return ctxt
->ops
->intercept(ctxt
, &info
, stage
);
436 static void assign_masked(ulong
*dest
, ulong src
, ulong mask
)
438 *dest
= (*dest
& ~mask
) | (src
& mask
);
441 static inline unsigned long ad_mask(struct x86_emulate_ctxt
*ctxt
)
443 return (1UL << (ctxt
->ad_bytes
<< 3)) - 1;
446 static ulong
stack_mask(struct x86_emulate_ctxt
*ctxt
)
449 struct desc_struct ss
;
451 if (ctxt
->mode
== X86EMUL_MODE_PROT64
)
453 ctxt
->ops
->get_segment(ctxt
, &sel
, &ss
, NULL
, VCPU_SREG_SS
);
454 return ~0U >> ((ss
.d
^ 1) * 16); /* d=0: 0xffff; d=1: 0xffffffff */
457 /* Access/update address held in a register, based on addressing mode. */
458 static inline unsigned long
459 address_mask(struct x86_emulate_ctxt
*ctxt
, unsigned long reg
)
461 if (ctxt
->ad_bytes
== sizeof(unsigned long))
464 return reg
& ad_mask(ctxt
);
467 static inline unsigned long
468 register_address(struct x86_emulate_ctxt
*ctxt
, unsigned long reg
)
470 return address_mask(ctxt
, reg
);
474 register_address_increment(struct x86_emulate_ctxt
*ctxt
, unsigned long *reg
, int inc
)
476 if (ctxt
->ad_bytes
== sizeof(unsigned long))
479 *reg
= (*reg
& ~ad_mask(ctxt
)) | ((*reg
+ inc
) & ad_mask(ctxt
));
482 static inline void jmp_rel(struct x86_emulate_ctxt
*ctxt
, int rel
)
484 register_address_increment(ctxt
, &ctxt
->_eip
, rel
);
487 static u32
desc_limit_scaled(struct desc_struct
*desc
)
489 u32 limit
= get_desc_limit(desc
);
491 return desc
->g
? (limit
<< 12) | 0xfff : limit
;
494 static void set_seg_override(struct x86_emulate_ctxt
*ctxt
, int seg
)
496 ctxt
->has_seg_override
= true;
497 ctxt
->seg_override
= seg
;
500 static unsigned long seg_base(struct x86_emulate_ctxt
*ctxt
, int seg
)
502 if (ctxt
->mode
== X86EMUL_MODE_PROT64
&& seg
< VCPU_SREG_FS
)
505 return ctxt
->ops
->get_cached_segment_base(ctxt
, seg
);
508 static unsigned seg_override(struct x86_emulate_ctxt
*ctxt
)
510 if (!ctxt
->has_seg_override
)
513 return ctxt
->seg_override
;
516 static int emulate_exception(struct x86_emulate_ctxt
*ctxt
, int vec
,
517 u32 error
, bool valid
)
519 ctxt
->exception
.vector
= vec
;
520 ctxt
->exception
.error_code
= error
;
521 ctxt
->exception
.error_code_valid
= valid
;
522 return X86EMUL_PROPAGATE_FAULT
;
525 static int emulate_db(struct x86_emulate_ctxt
*ctxt
)
527 return emulate_exception(ctxt
, DB_VECTOR
, 0, false);
530 static int emulate_gp(struct x86_emulate_ctxt
*ctxt
, int err
)
532 return emulate_exception(ctxt
, GP_VECTOR
, err
, true);
535 static int emulate_ss(struct x86_emulate_ctxt
*ctxt
, int err
)
537 return emulate_exception(ctxt
, SS_VECTOR
, err
, true);
540 static int emulate_ud(struct x86_emulate_ctxt
*ctxt
)
542 return emulate_exception(ctxt
, UD_VECTOR
, 0, false);
545 static int emulate_ts(struct x86_emulate_ctxt
*ctxt
, int err
)
547 return emulate_exception(ctxt
, TS_VECTOR
, err
, true);
550 static int emulate_de(struct x86_emulate_ctxt
*ctxt
)
552 return emulate_exception(ctxt
, DE_VECTOR
, 0, false);
555 static int emulate_nm(struct x86_emulate_ctxt
*ctxt
)
557 return emulate_exception(ctxt
, NM_VECTOR
, 0, false);
560 static u16
get_segment_selector(struct x86_emulate_ctxt
*ctxt
, unsigned seg
)
563 struct desc_struct desc
;
565 ctxt
->ops
->get_segment(ctxt
, &selector
, &desc
, NULL
, seg
);
569 static void set_segment_selector(struct x86_emulate_ctxt
*ctxt
, u16 selector
,
574 struct desc_struct desc
;
576 ctxt
->ops
->get_segment(ctxt
, &dummy
, &desc
, &base3
, seg
);
577 ctxt
->ops
->set_segment(ctxt
, selector
, &desc
, base3
, seg
);
581 * x86 defines three classes of vector instructions: explicitly
582 * aligned, explicitly unaligned, and the rest, which change behaviour
583 * depending on whether they're AVX encoded or not.
585 * Also included is CMPXCHG16B which is not a vector instruction, yet it is
586 * subject to the same check.
588 static bool insn_aligned(struct x86_emulate_ctxt
*ctxt
, unsigned size
)
590 if (likely(size
< 16))
593 if (ctxt
->d
& Aligned
)
595 else if (ctxt
->d
& Unaligned
)
597 else if (ctxt
->d
& Avx
)
603 static int __linearize(struct x86_emulate_ctxt
*ctxt
,
604 struct segmented_address addr
,
605 unsigned size
, bool write
, bool fetch
,
608 struct desc_struct desc
;
615 la
= seg_base(ctxt
, addr
.seg
) + addr
.ea
;
616 switch (ctxt
->mode
) {
617 case X86EMUL_MODE_REAL
:
619 case X86EMUL_MODE_PROT64
:
620 if (((signed long)la
<< 16) >> 16 != la
)
621 return emulate_gp(ctxt
, 0);
624 usable
= ctxt
->ops
->get_segment(ctxt
, &sel
, &desc
, NULL
,
628 /* code segment or read-only data segment */
629 if (((desc
.type
& 8) || !(desc
.type
& 2)) && write
)
631 /* unreadable code segment */
632 if (!fetch
&& (desc
.type
& 8) && !(desc
.type
& 2))
634 lim
= desc_limit_scaled(&desc
);
635 if ((desc
.type
& 8) || !(desc
.type
& 4)) {
636 /* expand-up segment */
637 if (addr
.ea
> lim
|| (u32
)(addr
.ea
+ size
- 1) > lim
)
640 /* exapand-down segment */
641 if (addr
.ea
<= lim
|| (u32
)(addr
.ea
+ size
- 1) <= lim
)
643 lim
= desc
.d
? 0xffffffff : 0xffff;
644 if (addr
.ea
> lim
|| (u32
)(addr
.ea
+ size
- 1) > lim
)
647 cpl
= ctxt
->ops
->cpl(ctxt
);
650 if (!(desc
.type
& 8)) {
654 } else if ((desc
.type
& 8) && !(desc
.type
& 4)) {
655 /* nonconforming code segment */
658 } else if ((desc
.type
& 8) && (desc
.type
& 4)) {
659 /* conforming code segment */
665 if (fetch
? ctxt
->mode
!= X86EMUL_MODE_PROT64
: ctxt
->ad_bytes
!= 8)
667 if (insn_aligned(ctxt
, size
) && ((la
& (size
- 1)) != 0))
668 return emulate_gp(ctxt
, 0);
670 return X86EMUL_CONTINUE
;
672 if (addr
.seg
== VCPU_SREG_SS
)
673 return emulate_ss(ctxt
, addr
.seg
);
675 return emulate_gp(ctxt
, addr
.seg
);
678 static int linearize(struct x86_emulate_ctxt
*ctxt
,
679 struct segmented_address addr
,
680 unsigned size
, bool write
,
683 return __linearize(ctxt
, addr
, size
, write
, false, linear
);
687 static int segmented_read_std(struct x86_emulate_ctxt
*ctxt
,
688 struct segmented_address addr
,
695 rc
= linearize(ctxt
, addr
, size
, false, &linear
);
696 if (rc
!= X86EMUL_CONTINUE
)
698 return ctxt
->ops
->read_std(ctxt
, linear
, data
, size
, &ctxt
->exception
);
702 * Fetch the next byte of the instruction being emulated which is pointed to
703 * by ctxt->_eip, then increment ctxt->_eip.
705 * Also prefetch the remaining bytes of the instruction without crossing page
706 * boundary if they are not in fetch_cache yet.
708 static int do_insn_fetch_byte(struct x86_emulate_ctxt
*ctxt
, u8
*dest
)
710 struct fetch_cache
*fc
= &ctxt
->fetch
;
714 if (ctxt
->_eip
== fc
->end
) {
715 unsigned long linear
;
716 struct segmented_address addr
= { .seg
= VCPU_SREG_CS
,
718 cur_size
= fc
->end
- fc
->start
;
719 size
= min(15UL - cur_size
,
720 PAGE_SIZE
- offset_in_page(ctxt
->_eip
));
721 rc
= __linearize(ctxt
, addr
, size
, false, true, &linear
);
722 if (unlikely(rc
!= X86EMUL_CONTINUE
))
724 rc
= ctxt
->ops
->fetch(ctxt
, linear
, fc
->data
+ cur_size
,
725 size
, &ctxt
->exception
);
726 if (unlikely(rc
!= X86EMUL_CONTINUE
))
730 *dest
= fc
->data
[ctxt
->_eip
- fc
->start
];
732 return X86EMUL_CONTINUE
;
735 static int do_insn_fetch(struct x86_emulate_ctxt
*ctxt
,
736 void *dest
, unsigned size
)
740 /* x86 instructions are limited to 15 bytes. */
741 if (unlikely(ctxt
->_eip
+ size
- ctxt
->eip
> 15))
742 return X86EMUL_UNHANDLEABLE
;
744 rc
= do_insn_fetch_byte(ctxt
, dest
++);
745 if (rc
!= X86EMUL_CONTINUE
)
748 return X86EMUL_CONTINUE
;
751 /* Fetch next part of the instruction being emulated. */
752 #define insn_fetch(_type, _ctxt) \
753 ({ unsigned long _x; \
754 rc = do_insn_fetch(_ctxt, &_x, sizeof(_type)); \
755 if (rc != X86EMUL_CONTINUE) \
760 #define insn_fetch_arr(_arr, _size, _ctxt) \
761 ({ rc = do_insn_fetch(_ctxt, _arr, (_size)); \
762 if (rc != X86EMUL_CONTINUE) \
767 * Given the 'reg' portion of a ModRM byte, and a register block, return a
768 * pointer into the block that addresses the relevant register.
769 * @highbyte_regs specifies whether to decode AH,CH,DH,BH.
771 static void *decode_register(u8 modrm_reg
, unsigned long *regs
,
776 p
= ®s
[modrm_reg
];
777 if (highbyte_regs
&& modrm_reg
>= 4 && modrm_reg
< 8)
778 p
= (unsigned char *)®s
[modrm_reg
& 3] + 1;
782 static int read_descriptor(struct x86_emulate_ctxt
*ctxt
,
783 struct segmented_address addr
,
784 u16
*size
, unsigned long *address
, int op_bytes
)
791 rc
= segmented_read_std(ctxt
, addr
, size
, 2);
792 if (rc
!= X86EMUL_CONTINUE
)
795 rc
= segmented_read_std(ctxt
, addr
, address
, op_bytes
);
799 static int test_cc(unsigned int condition
, unsigned int flags
)
803 switch ((condition
& 15) >> 1) {
805 rc
|= (flags
& EFLG_OF
);
807 case 1: /* b/c/nae */
808 rc
|= (flags
& EFLG_CF
);
811 rc
|= (flags
& EFLG_ZF
);
814 rc
|= (flags
& (EFLG_CF
|EFLG_ZF
));
817 rc
|= (flags
& EFLG_SF
);
820 rc
|= (flags
& EFLG_PF
);
823 rc
|= (flags
& EFLG_ZF
);
826 rc
|= (!(flags
& EFLG_SF
) != !(flags
& EFLG_OF
));
830 /* Odd condition identifiers (lsb == 1) have inverted sense. */
831 return (!!rc
^ (condition
& 1));
834 static void fetch_register_operand(struct operand
*op
)
838 op
->val
= *(u8
*)op
->addr
.reg
;
841 op
->val
= *(u16
*)op
->addr
.reg
;
844 op
->val
= *(u32
*)op
->addr
.reg
;
847 op
->val
= *(u64
*)op
->addr
.reg
;
852 static void read_sse_reg(struct x86_emulate_ctxt
*ctxt
, sse128_t
*data
, int reg
)
854 ctxt
->ops
->get_fpu(ctxt
);
856 case 0: asm("movdqu %%xmm0, %0" : "=m"(*data
)); break;
857 case 1: asm("movdqu %%xmm1, %0" : "=m"(*data
)); break;
858 case 2: asm("movdqu %%xmm2, %0" : "=m"(*data
)); break;
859 case 3: asm("movdqu %%xmm3, %0" : "=m"(*data
)); break;
860 case 4: asm("movdqu %%xmm4, %0" : "=m"(*data
)); break;
861 case 5: asm("movdqu %%xmm5, %0" : "=m"(*data
)); break;
862 case 6: asm("movdqu %%xmm6, %0" : "=m"(*data
)); break;
863 case 7: asm("movdqu %%xmm7, %0" : "=m"(*data
)); break;
865 case 8: asm("movdqu %%xmm8, %0" : "=m"(*data
)); break;
866 case 9: asm("movdqu %%xmm9, %0" : "=m"(*data
)); break;
867 case 10: asm("movdqu %%xmm10, %0" : "=m"(*data
)); break;
868 case 11: asm("movdqu %%xmm11, %0" : "=m"(*data
)); break;
869 case 12: asm("movdqu %%xmm12, %0" : "=m"(*data
)); break;
870 case 13: asm("movdqu %%xmm13, %0" : "=m"(*data
)); break;
871 case 14: asm("movdqu %%xmm14, %0" : "=m"(*data
)); break;
872 case 15: asm("movdqu %%xmm15, %0" : "=m"(*data
)); break;
876 ctxt
->ops
->put_fpu(ctxt
);
879 static void write_sse_reg(struct x86_emulate_ctxt
*ctxt
, sse128_t
*data
,
882 ctxt
->ops
->get_fpu(ctxt
);
884 case 0: asm("movdqu %0, %%xmm0" : : "m"(*data
)); break;
885 case 1: asm("movdqu %0, %%xmm1" : : "m"(*data
)); break;
886 case 2: asm("movdqu %0, %%xmm2" : : "m"(*data
)); break;
887 case 3: asm("movdqu %0, %%xmm3" : : "m"(*data
)); break;
888 case 4: asm("movdqu %0, %%xmm4" : : "m"(*data
)); break;
889 case 5: asm("movdqu %0, %%xmm5" : : "m"(*data
)); break;
890 case 6: asm("movdqu %0, %%xmm6" : : "m"(*data
)); break;
891 case 7: asm("movdqu %0, %%xmm7" : : "m"(*data
)); break;
893 case 8: asm("movdqu %0, %%xmm8" : : "m"(*data
)); break;
894 case 9: asm("movdqu %0, %%xmm9" : : "m"(*data
)); break;
895 case 10: asm("movdqu %0, %%xmm10" : : "m"(*data
)); break;
896 case 11: asm("movdqu %0, %%xmm11" : : "m"(*data
)); break;
897 case 12: asm("movdqu %0, %%xmm12" : : "m"(*data
)); break;
898 case 13: asm("movdqu %0, %%xmm13" : : "m"(*data
)); break;
899 case 14: asm("movdqu %0, %%xmm14" : : "m"(*data
)); break;
900 case 15: asm("movdqu %0, %%xmm15" : : "m"(*data
)); break;
904 ctxt
->ops
->put_fpu(ctxt
);
907 static void read_mmx_reg(struct x86_emulate_ctxt
*ctxt
, u64
*data
, int reg
)
909 ctxt
->ops
->get_fpu(ctxt
);
911 case 0: asm("movq %%mm0, %0" : "=m"(*data
)); break;
912 case 1: asm("movq %%mm1, %0" : "=m"(*data
)); break;
913 case 2: asm("movq %%mm2, %0" : "=m"(*data
)); break;
914 case 3: asm("movq %%mm3, %0" : "=m"(*data
)); break;
915 case 4: asm("movq %%mm4, %0" : "=m"(*data
)); break;
916 case 5: asm("movq %%mm5, %0" : "=m"(*data
)); break;
917 case 6: asm("movq %%mm6, %0" : "=m"(*data
)); break;
918 case 7: asm("movq %%mm7, %0" : "=m"(*data
)); break;
921 ctxt
->ops
->put_fpu(ctxt
);
924 static void write_mmx_reg(struct x86_emulate_ctxt
*ctxt
, u64
*data
, int reg
)
926 ctxt
->ops
->get_fpu(ctxt
);
928 case 0: asm("movq %0, %%mm0" : : "m"(*data
)); break;
929 case 1: asm("movq %0, %%mm1" : : "m"(*data
)); break;
930 case 2: asm("movq %0, %%mm2" : : "m"(*data
)); break;
931 case 3: asm("movq %0, %%mm3" : : "m"(*data
)); break;
932 case 4: asm("movq %0, %%mm4" : : "m"(*data
)); break;
933 case 5: asm("movq %0, %%mm5" : : "m"(*data
)); break;
934 case 6: asm("movq %0, %%mm6" : : "m"(*data
)); break;
935 case 7: asm("movq %0, %%mm7" : : "m"(*data
)); break;
938 ctxt
->ops
->put_fpu(ctxt
);
941 static void decode_register_operand(struct x86_emulate_ctxt
*ctxt
,
944 unsigned reg
= ctxt
->modrm_reg
;
945 int highbyte_regs
= ctxt
->rex_prefix
== 0;
947 if (!(ctxt
->d
& ModRM
))
948 reg
= (ctxt
->b
& 7) | ((ctxt
->rex_prefix
& 1) << 3);
954 read_sse_reg(ctxt
, &op
->vec_val
, reg
);
966 if (ctxt
->d
& ByteOp
) {
967 op
->addr
.reg
= decode_register(reg
, ctxt
->regs
, highbyte_regs
);
970 op
->addr
.reg
= decode_register(reg
, ctxt
->regs
, 0);
971 op
->bytes
= ctxt
->op_bytes
;
973 fetch_register_operand(op
);
974 op
->orig_val
= op
->val
;
977 static void adjust_modrm_seg(struct x86_emulate_ctxt
*ctxt
, int base_reg
)
979 if (base_reg
== VCPU_REGS_RSP
|| base_reg
== VCPU_REGS_RBP
)
980 ctxt
->modrm_seg
= VCPU_SREG_SS
;
983 static int decode_modrm(struct x86_emulate_ctxt
*ctxt
,
987 int index_reg
= 0, base_reg
= 0, scale
;
988 int rc
= X86EMUL_CONTINUE
;
991 if (ctxt
->rex_prefix
) {
992 ctxt
->modrm_reg
= (ctxt
->rex_prefix
& 4) << 1; /* REX.R */
993 index_reg
= (ctxt
->rex_prefix
& 2) << 2; /* REX.X */
994 ctxt
->modrm_rm
= base_reg
= (ctxt
->rex_prefix
& 1) << 3; /* REG.B */
997 ctxt
->modrm_mod
|= (ctxt
->modrm
& 0xc0) >> 6;
998 ctxt
->modrm_reg
|= (ctxt
->modrm
& 0x38) >> 3;
999 ctxt
->modrm_rm
|= (ctxt
->modrm
& 0x07);
1000 ctxt
->modrm_seg
= VCPU_SREG_DS
;
1002 if (ctxt
->modrm_mod
== 3) {
1004 op
->bytes
= (ctxt
->d
& ByteOp
) ? 1 : ctxt
->op_bytes
;
1005 op
->addr
.reg
= decode_register(ctxt
->modrm_rm
,
1006 ctxt
->regs
, ctxt
->d
& ByteOp
);
1007 if (ctxt
->d
& Sse
) {
1010 op
->addr
.xmm
= ctxt
->modrm_rm
;
1011 read_sse_reg(ctxt
, &op
->vec_val
, ctxt
->modrm_rm
);
1014 if (ctxt
->d
& Mmx
) {
1017 op
->addr
.xmm
= ctxt
->modrm_rm
& 7;
1020 fetch_register_operand(op
);
1026 if (ctxt
->ad_bytes
== 2) {
1027 unsigned bx
= ctxt
->regs
[VCPU_REGS_RBX
];
1028 unsigned bp
= ctxt
->regs
[VCPU_REGS_RBP
];
1029 unsigned si
= ctxt
->regs
[VCPU_REGS_RSI
];
1030 unsigned di
= ctxt
->regs
[VCPU_REGS_RDI
];
1032 /* 16-bit ModR/M decode. */
1033 switch (ctxt
->modrm_mod
) {
1035 if (ctxt
->modrm_rm
== 6)
1036 modrm_ea
+= insn_fetch(u16
, ctxt
);
1039 modrm_ea
+= insn_fetch(s8
, ctxt
);
1042 modrm_ea
+= insn_fetch(u16
, ctxt
);
1045 switch (ctxt
->modrm_rm
) {
1047 modrm_ea
+= bx
+ si
;
1050 modrm_ea
+= bx
+ di
;
1053 modrm_ea
+= bp
+ si
;
1056 modrm_ea
+= bp
+ di
;
1065 if (ctxt
->modrm_mod
!= 0)
1072 if (ctxt
->modrm_rm
== 2 || ctxt
->modrm_rm
== 3 ||
1073 (ctxt
->modrm_rm
== 6 && ctxt
->modrm_mod
!= 0))
1074 ctxt
->modrm_seg
= VCPU_SREG_SS
;
1075 modrm_ea
= (u16
)modrm_ea
;
1077 /* 32/64-bit ModR/M decode. */
1078 if ((ctxt
->modrm_rm
& 7) == 4) {
1079 sib
= insn_fetch(u8
, ctxt
);
1080 index_reg
|= (sib
>> 3) & 7;
1081 base_reg
|= sib
& 7;
1084 if ((base_reg
& 7) == 5 && ctxt
->modrm_mod
== 0)
1085 modrm_ea
+= insn_fetch(s32
, ctxt
);
1087 modrm_ea
+= ctxt
->regs
[base_reg
];
1088 adjust_modrm_seg(ctxt
, base_reg
);
1091 modrm_ea
+= ctxt
->regs
[index_reg
] << scale
;
1092 } else if ((ctxt
->modrm_rm
& 7) == 5 && ctxt
->modrm_mod
== 0) {
1093 if (ctxt
->mode
== X86EMUL_MODE_PROT64
)
1094 ctxt
->rip_relative
= 1;
1096 base_reg
= ctxt
->modrm_rm
;
1097 modrm_ea
+= ctxt
->regs
[base_reg
];
1098 adjust_modrm_seg(ctxt
, base_reg
);
1100 switch (ctxt
->modrm_mod
) {
1102 if (ctxt
->modrm_rm
== 5)
1103 modrm_ea
+= insn_fetch(s32
, ctxt
);
1106 modrm_ea
+= insn_fetch(s8
, ctxt
);
1109 modrm_ea
+= insn_fetch(s32
, ctxt
);
1113 op
->addr
.mem
.ea
= modrm_ea
;
1118 static int decode_abs(struct x86_emulate_ctxt
*ctxt
,
1121 int rc
= X86EMUL_CONTINUE
;
1124 switch (ctxt
->ad_bytes
) {
1126 op
->addr
.mem
.ea
= insn_fetch(u16
, ctxt
);
1129 op
->addr
.mem
.ea
= insn_fetch(u32
, ctxt
);
1132 op
->addr
.mem
.ea
= insn_fetch(u64
, ctxt
);
1139 static void fetch_bit_operand(struct x86_emulate_ctxt
*ctxt
)
1143 if (ctxt
->dst
.type
== OP_MEM
&& ctxt
->src
.type
== OP_REG
) {
1144 mask
= ~(ctxt
->dst
.bytes
* 8 - 1);
1146 if (ctxt
->src
.bytes
== 2)
1147 sv
= (s16
)ctxt
->src
.val
& (s16
)mask
;
1148 else if (ctxt
->src
.bytes
== 4)
1149 sv
= (s32
)ctxt
->src
.val
& (s32
)mask
;
1151 ctxt
->dst
.addr
.mem
.ea
+= (sv
>> 3);
1154 /* only subword offset */
1155 ctxt
->src
.val
&= (ctxt
->dst
.bytes
<< 3) - 1;
1158 static int read_emulated(struct x86_emulate_ctxt
*ctxt
,
1159 unsigned long addr
, void *dest
, unsigned size
)
1162 struct read_cache
*mc
= &ctxt
->mem_read
;
1165 int n
= min(size
, 8u);
1167 if (mc
->pos
< mc
->end
)
1170 rc
= ctxt
->ops
->read_emulated(ctxt
, addr
, mc
->data
+ mc
->end
, n
,
1172 if (rc
!= X86EMUL_CONTINUE
)
1177 memcpy(dest
, mc
->data
+ mc
->pos
, n
);
1182 return X86EMUL_CONTINUE
;
1185 static int segmented_read(struct x86_emulate_ctxt
*ctxt
,
1186 struct segmented_address addr
,
1193 rc
= linearize(ctxt
, addr
, size
, false, &linear
);
1194 if (rc
!= X86EMUL_CONTINUE
)
1196 return read_emulated(ctxt
, linear
, data
, size
);
1199 static int segmented_write(struct x86_emulate_ctxt
*ctxt
,
1200 struct segmented_address addr
,
1207 rc
= linearize(ctxt
, addr
, size
, true, &linear
);
1208 if (rc
!= X86EMUL_CONTINUE
)
1210 return ctxt
->ops
->write_emulated(ctxt
, linear
, data
, size
,
1214 static int segmented_cmpxchg(struct x86_emulate_ctxt
*ctxt
,
1215 struct segmented_address addr
,
1216 const void *orig_data
, const void *data
,
1222 rc
= linearize(ctxt
, addr
, size
, true, &linear
);
1223 if (rc
!= X86EMUL_CONTINUE
)
1225 return ctxt
->ops
->cmpxchg_emulated(ctxt
, linear
, orig_data
, data
,
1226 size
, &ctxt
->exception
);
1229 static int pio_in_emulated(struct x86_emulate_ctxt
*ctxt
,
1230 unsigned int size
, unsigned short port
,
1233 struct read_cache
*rc
= &ctxt
->io_read
;
1235 if (rc
->pos
== rc
->end
) { /* refill pio read ahead */
1236 unsigned int in_page
, n
;
1237 unsigned int count
= ctxt
->rep_prefix
?
1238 address_mask(ctxt
, ctxt
->regs
[VCPU_REGS_RCX
]) : 1;
1239 in_page
= (ctxt
->eflags
& EFLG_DF
) ?
1240 offset_in_page(ctxt
->regs
[VCPU_REGS_RDI
]) :
1241 PAGE_SIZE
- offset_in_page(ctxt
->regs
[VCPU_REGS_RDI
]);
1242 n
= min(min(in_page
, (unsigned int)sizeof(rc
->data
)) / size
,
1246 rc
->pos
= rc
->end
= 0;
1247 if (!ctxt
->ops
->pio_in_emulated(ctxt
, size
, port
, rc
->data
, n
))
1252 memcpy(dest
, rc
->data
+ rc
->pos
, size
);
1257 static int read_interrupt_descriptor(struct x86_emulate_ctxt
*ctxt
,
1258 u16 index
, struct desc_struct
*desc
)
1263 ctxt
->ops
->get_idt(ctxt
, &dt
);
1265 if (dt
.size
< index
* 8 + 7)
1266 return emulate_gp(ctxt
, index
<< 3 | 0x2);
1268 addr
= dt
.address
+ index
* 8;
1269 return ctxt
->ops
->read_std(ctxt
, addr
, desc
, sizeof *desc
,
1273 static void get_descriptor_table_ptr(struct x86_emulate_ctxt
*ctxt
,
1274 u16 selector
, struct desc_ptr
*dt
)
1276 struct x86_emulate_ops
*ops
= ctxt
->ops
;
1278 if (selector
& 1 << 2) {
1279 struct desc_struct desc
;
1282 memset (dt
, 0, sizeof *dt
);
1283 if (!ops
->get_segment(ctxt
, &sel
, &desc
, NULL
, VCPU_SREG_LDTR
))
1286 dt
->size
= desc_limit_scaled(&desc
); /* what if limit > 65535? */
1287 dt
->address
= get_desc_base(&desc
);
1289 ops
->get_gdt(ctxt
, dt
);
1292 /* allowed just for 8 bytes segments */
1293 static int read_segment_descriptor(struct x86_emulate_ctxt
*ctxt
,
1294 u16 selector
, struct desc_struct
*desc
)
1297 u16 index
= selector
>> 3;
1300 get_descriptor_table_ptr(ctxt
, selector
, &dt
);
1302 if (dt
.size
< index
* 8 + 7)
1303 return emulate_gp(ctxt
, selector
& 0xfffc);
1305 addr
= dt
.address
+ index
* 8;
1306 return ctxt
->ops
->read_std(ctxt
, addr
, desc
, sizeof *desc
,
1310 /* allowed just for 8 bytes segments */
1311 static int write_segment_descriptor(struct x86_emulate_ctxt
*ctxt
,
1312 u16 selector
, struct desc_struct
*desc
)
1315 u16 index
= selector
>> 3;
1318 get_descriptor_table_ptr(ctxt
, selector
, &dt
);
1320 if (dt
.size
< index
* 8 + 7)
1321 return emulate_gp(ctxt
, selector
& 0xfffc);
1323 addr
= dt
.address
+ index
* 8;
1324 return ctxt
->ops
->write_std(ctxt
, addr
, desc
, sizeof *desc
,
1328 /* Does not support long mode */
1329 static int load_segment_descriptor(struct x86_emulate_ctxt
*ctxt
,
1330 u16 selector
, int seg
)
1332 struct desc_struct seg_desc
;
1334 unsigned err_vec
= GP_VECTOR
;
1336 bool null_selector
= !(selector
& ~0x3); /* 0000-0003 are null */
1339 memset(&seg_desc
, 0, sizeof seg_desc
);
1341 if ((seg
<= VCPU_SREG_GS
&& ctxt
->mode
== X86EMUL_MODE_VM86
)
1342 || ctxt
->mode
== X86EMUL_MODE_REAL
) {
1343 /* set real mode segment descriptor */
1344 set_desc_base(&seg_desc
, selector
<< 4);
1345 set_desc_limit(&seg_desc
, 0xffff);
1349 if (ctxt
->mode
== X86EMUL_MODE_VM86
)
1355 cpl
= ctxt
->ops
->cpl(ctxt
);
1357 /* NULL selector is not valid for TR, CS and SS (except for long mode) */
1358 if ((seg
== VCPU_SREG_CS
1359 || (seg
== VCPU_SREG_SS
1360 && (ctxt
->mode
!= X86EMUL_MODE_PROT64
|| rpl
!= cpl
))
1361 || seg
== VCPU_SREG_TR
)
1365 /* TR should be in GDT only */
1366 if (seg
== VCPU_SREG_TR
&& (selector
& (1 << 2)))
1369 if (null_selector
) /* for NULL selector skip all following checks */
1372 ret
= read_segment_descriptor(ctxt
, selector
, &seg_desc
);
1373 if (ret
!= X86EMUL_CONTINUE
)
1376 err_code
= selector
& 0xfffc;
1377 err_vec
= GP_VECTOR
;
1379 /* can't load system descriptor into segment selecor */
1380 if (seg
<= VCPU_SREG_GS
&& !seg_desc
.s
)
1384 err_vec
= (seg
== VCPU_SREG_SS
) ? SS_VECTOR
: NP_VECTOR
;
1393 * segment is not a writable data segment or segment
1394 * selector's RPL != CPL or segment selector's RPL != CPL
1396 if (rpl
!= cpl
|| (seg_desc
.type
& 0xa) != 0x2 || dpl
!= cpl
)
1400 if (!(seg_desc
.type
& 8))
1403 if (seg_desc
.type
& 4) {
1409 if (rpl
> cpl
|| dpl
!= cpl
)
1412 /* CS(RPL) <- CPL */
1413 selector
= (selector
& 0xfffc) | cpl
;
1416 if (seg_desc
.s
|| (seg_desc
.type
!= 1 && seg_desc
.type
!= 9))
1419 case VCPU_SREG_LDTR
:
1420 if (seg_desc
.s
|| seg_desc
.type
!= 2)
1423 default: /* DS, ES, FS, or GS */
1425 * segment is not a data or readable code segment or
1426 * ((segment is a data or nonconforming code segment)
1427 * and (both RPL and CPL > DPL))
1429 if ((seg_desc
.type
& 0xa) == 0x8 ||
1430 (((seg_desc
.type
& 0xc) != 0xc) &&
1431 (rpl
> dpl
&& cpl
> dpl
)))
1437 /* mark segment as accessed */
1439 ret
= write_segment_descriptor(ctxt
, selector
, &seg_desc
);
1440 if (ret
!= X86EMUL_CONTINUE
)
1444 ctxt
->ops
->set_segment(ctxt
, selector
, &seg_desc
, 0, seg
);
1445 return X86EMUL_CONTINUE
;
1447 emulate_exception(ctxt
, err_vec
, err_code
, true);
1448 return X86EMUL_PROPAGATE_FAULT
;
1451 static void write_register_operand(struct operand
*op
)
1453 /* The 4-byte case *is* correct: in 64-bit mode we zero-extend. */
1454 switch (op
->bytes
) {
1456 *(u8
*)op
->addr
.reg
= (u8
)op
->val
;
1459 *(u16
*)op
->addr
.reg
= (u16
)op
->val
;
1462 *op
->addr
.reg
= (u32
)op
->val
;
1463 break; /* 64b: zero-extend */
1465 *op
->addr
.reg
= op
->val
;
1470 static int writeback(struct x86_emulate_ctxt
*ctxt
)
1474 switch (ctxt
->dst
.type
) {
1476 write_register_operand(&ctxt
->dst
);
1479 if (ctxt
->lock_prefix
)
1480 rc
= segmented_cmpxchg(ctxt
,
1482 &ctxt
->dst
.orig_val
,
1486 rc
= segmented_write(ctxt
,
1490 if (rc
!= X86EMUL_CONTINUE
)
1494 write_sse_reg(ctxt
, &ctxt
->dst
.vec_val
, ctxt
->dst
.addr
.xmm
);
1497 write_mmx_reg(ctxt
, &ctxt
->dst
.mm_val
, ctxt
->dst
.addr
.mm
);
1505 return X86EMUL_CONTINUE
;
1508 static int em_push(struct x86_emulate_ctxt
*ctxt
)
1510 struct segmented_address addr
;
1512 register_address_increment(ctxt
, &ctxt
->regs
[VCPU_REGS_RSP
], -ctxt
->op_bytes
);
1513 addr
.ea
= register_address(ctxt
, ctxt
->regs
[VCPU_REGS_RSP
]);
1514 addr
.seg
= VCPU_SREG_SS
;
1516 /* Disable writeback. */
1517 ctxt
->dst
.type
= OP_NONE
;
1518 return segmented_write(ctxt
, addr
, &ctxt
->src
.val
, ctxt
->op_bytes
);
1521 static int emulate_pop(struct x86_emulate_ctxt
*ctxt
,
1522 void *dest
, int len
)
1525 struct segmented_address addr
;
1527 addr
.ea
= register_address(ctxt
, ctxt
->regs
[VCPU_REGS_RSP
]);
1528 addr
.seg
= VCPU_SREG_SS
;
1529 rc
= segmented_read(ctxt
, addr
, dest
, len
);
1530 if (rc
!= X86EMUL_CONTINUE
)
1533 register_address_increment(ctxt
, &ctxt
->regs
[VCPU_REGS_RSP
], len
);
1537 static int em_pop(struct x86_emulate_ctxt
*ctxt
)
1539 return emulate_pop(ctxt
, &ctxt
->dst
.val
, ctxt
->op_bytes
);
1542 static int emulate_popf(struct x86_emulate_ctxt
*ctxt
,
1543 void *dest
, int len
)
1546 unsigned long val
, change_mask
;
1547 int iopl
= (ctxt
->eflags
& X86_EFLAGS_IOPL
) >> IOPL_SHIFT
;
1548 int cpl
= ctxt
->ops
->cpl(ctxt
);
1550 rc
= emulate_pop(ctxt
, &val
, len
);
1551 if (rc
!= X86EMUL_CONTINUE
)
1554 change_mask
= EFLG_CF
| EFLG_PF
| EFLG_AF
| EFLG_ZF
| EFLG_SF
| EFLG_OF
1555 | EFLG_TF
| EFLG_DF
| EFLG_NT
| EFLG_RF
| EFLG_AC
| EFLG_ID
;
1557 switch(ctxt
->mode
) {
1558 case X86EMUL_MODE_PROT64
:
1559 case X86EMUL_MODE_PROT32
:
1560 case X86EMUL_MODE_PROT16
:
1562 change_mask
|= EFLG_IOPL
;
1564 change_mask
|= EFLG_IF
;
1566 case X86EMUL_MODE_VM86
:
1568 return emulate_gp(ctxt
, 0);
1569 change_mask
|= EFLG_IF
;
1571 default: /* real mode */
1572 change_mask
|= (EFLG_IOPL
| EFLG_IF
);
1576 *(unsigned long *)dest
=
1577 (ctxt
->eflags
& ~change_mask
) | (val
& change_mask
);
1582 static int em_popf(struct x86_emulate_ctxt
*ctxt
)
1584 ctxt
->dst
.type
= OP_REG
;
1585 ctxt
->dst
.addr
.reg
= &ctxt
->eflags
;
1586 ctxt
->dst
.bytes
= ctxt
->op_bytes
;
1587 return emulate_popf(ctxt
, &ctxt
->dst
.val
, ctxt
->op_bytes
);
1590 static int em_leave(struct x86_emulate_ctxt
*ctxt
)
1592 assign_masked(&ctxt
->regs
[VCPU_REGS_RSP
], ctxt
->regs
[VCPU_REGS_RBP
],
1594 return emulate_pop(ctxt
, &ctxt
->regs
[VCPU_REGS_RBP
], ctxt
->op_bytes
);
1597 static int em_push_sreg(struct x86_emulate_ctxt
*ctxt
)
1599 int seg
= ctxt
->src2
.val
;
1601 ctxt
->src
.val
= get_segment_selector(ctxt
, seg
);
1603 return em_push(ctxt
);
1606 static int em_pop_sreg(struct x86_emulate_ctxt
*ctxt
)
1608 int seg
= ctxt
->src2
.val
;
1609 unsigned long selector
;
1612 rc
= emulate_pop(ctxt
, &selector
, ctxt
->op_bytes
);
1613 if (rc
!= X86EMUL_CONTINUE
)
1616 rc
= load_segment_descriptor(ctxt
, (u16
)selector
, seg
);
1620 static int em_pusha(struct x86_emulate_ctxt
*ctxt
)
1622 unsigned long old_esp
= ctxt
->regs
[VCPU_REGS_RSP
];
1623 int rc
= X86EMUL_CONTINUE
;
1624 int reg
= VCPU_REGS_RAX
;
1626 while (reg
<= VCPU_REGS_RDI
) {
1627 (reg
== VCPU_REGS_RSP
) ?
1628 (ctxt
->src
.val
= old_esp
) : (ctxt
->src
.val
= ctxt
->regs
[reg
]);
1631 if (rc
!= X86EMUL_CONTINUE
)
1640 static int em_pushf(struct x86_emulate_ctxt
*ctxt
)
1642 ctxt
->src
.val
= (unsigned long)ctxt
->eflags
;
1643 return em_push(ctxt
);
1646 static int em_popa(struct x86_emulate_ctxt
*ctxt
)
1648 int rc
= X86EMUL_CONTINUE
;
1649 int reg
= VCPU_REGS_RDI
;
1651 while (reg
>= VCPU_REGS_RAX
) {
1652 if (reg
== VCPU_REGS_RSP
) {
1653 register_address_increment(ctxt
, &ctxt
->regs
[VCPU_REGS_RSP
],
1658 rc
= emulate_pop(ctxt
, &ctxt
->regs
[reg
], ctxt
->op_bytes
);
1659 if (rc
!= X86EMUL_CONTINUE
)
1666 int emulate_int_real(struct x86_emulate_ctxt
*ctxt
, int irq
)
1668 struct x86_emulate_ops
*ops
= ctxt
->ops
;
1675 /* TODO: Add limit checks */
1676 ctxt
->src
.val
= ctxt
->eflags
;
1678 if (rc
!= X86EMUL_CONTINUE
)
1681 ctxt
->eflags
&= ~(EFLG_IF
| EFLG_TF
| EFLG_AC
);
1683 ctxt
->src
.val
= get_segment_selector(ctxt
, VCPU_SREG_CS
);
1685 if (rc
!= X86EMUL_CONTINUE
)
1688 ctxt
->src
.val
= ctxt
->_eip
;
1690 if (rc
!= X86EMUL_CONTINUE
)
1693 ops
->get_idt(ctxt
, &dt
);
1695 eip_addr
= dt
.address
+ (irq
<< 2);
1696 cs_addr
= dt
.address
+ (irq
<< 2) + 2;
1698 rc
= ops
->read_std(ctxt
, cs_addr
, &cs
, 2, &ctxt
->exception
);
1699 if (rc
!= X86EMUL_CONTINUE
)
1702 rc
= ops
->read_std(ctxt
, eip_addr
, &eip
, 2, &ctxt
->exception
);
1703 if (rc
!= X86EMUL_CONTINUE
)
1706 rc
= load_segment_descriptor(ctxt
, cs
, VCPU_SREG_CS
);
1707 if (rc
!= X86EMUL_CONTINUE
)
1715 static int emulate_int(struct x86_emulate_ctxt
*ctxt
, int irq
)
1717 switch(ctxt
->mode
) {
1718 case X86EMUL_MODE_REAL
:
1719 return emulate_int_real(ctxt
, irq
);
1720 case X86EMUL_MODE_VM86
:
1721 case X86EMUL_MODE_PROT16
:
1722 case X86EMUL_MODE_PROT32
:
1723 case X86EMUL_MODE_PROT64
:
1725 /* Protected mode interrupts unimplemented yet */
1726 return X86EMUL_UNHANDLEABLE
;
1730 static int emulate_iret_real(struct x86_emulate_ctxt
*ctxt
)
1732 int rc
= X86EMUL_CONTINUE
;
1733 unsigned long temp_eip
= 0;
1734 unsigned long temp_eflags
= 0;
1735 unsigned long cs
= 0;
1736 unsigned long mask
= EFLG_CF
| EFLG_PF
| EFLG_AF
| EFLG_ZF
| EFLG_SF
| EFLG_TF
|
1737 EFLG_IF
| EFLG_DF
| EFLG_OF
| EFLG_IOPL
| EFLG_NT
| EFLG_RF
|
1738 EFLG_AC
| EFLG_ID
| (1 << 1); /* Last one is the reserved bit */
1739 unsigned long vm86_mask
= EFLG_VM
| EFLG_VIF
| EFLG_VIP
;
1741 /* TODO: Add stack limit check */
1743 rc
= emulate_pop(ctxt
, &temp_eip
, ctxt
->op_bytes
);
1745 if (rc
!= X86EMUL_CONTINUE
)
1748 if (temp_eip
& ~0xffff)
1749 return emulate_gp(ctxt
, 0);
1751 rc
= emulate_pop(ctxt
, &cs
, ctxt
->op_bytes
);
1753 if (rc
!= X86EMUL_CONTINUE
)
1756 rc
= emulate_pop(ctxt
, &temp_eflags
, ctxt
->op_bytes
);
1758 if (rc
!= X86EMUL_CONTINUE
)
1761 rc
= load_segment_descriptor(ctxt
, (u16
)cs
, VCPU_SREG_CS
);
1763 if (rc
!= X86EMUL_CONTINUE
)
1766 ctxt
->_eip
= temp_eip
;
1769 if (ctxt
->op_bytes
== 4)
1770 ctxt
->eflags
= ((temp_eflags
& mask
) | (ctxt
->eflags
& vm86_mask
));
1771 else if (ctxt
->op_bytes
== 2) {
1772 ctxt
->eflags
&= ~0xffff;
1773 ctxt
->eflags
|= temp_eflags
;
1776 ctxt
->eflags
&= ~EFLG_RESERVED_ZEROS_MASK
; /* Clear reserved zeros */
1777 ctxt
->eflags
|= EFLG_RESERVED_ONE_MASK
;
1782 static int em_iret(struct x86_emulate_ctxt
*ctxt
)
1784 switch(ctxt
->mode
) {
1785 case X86EMUL_MODE_REAL
:
1786 return emulate_iret_real(ctxt
);
1787 case X86EMUL_MODE_VM86
:
1788 case X86EMUL_MODE_PROT16
:
1789 case X86EMUL_MODE_PROT32
:
1790 case X86EMUL_MODE_PROT64
:
1792 /* iret from protected mode unimplemented yet */
1793 return X86EMUL_UNHANDLEABLE
;
1797 static int em_jmp_far(struct x86_emulate_ctxt
*ctxt
)
1802 memcpy(&sel
, ctxt
->src
.valptr
+ ctxt
->op_bytes
, 2);
1804 rc
= load_segment_descriptor(ctxt
, sel
, VCPU_SREG_CS
);
1805 if (rc
!= X86EMUL_CONTINUE
)
1809 memcpy(&ctxt
->_eip
, ctxt
->src
.valptr
, ctxt
->op_bytes
);
1810 return X86EMUL_CONTINUE
;
1813 static int em_grp2(struct x86_emulate_ctxt
*ctxt
)
1815 switch (ctxt
->modrm_reg
) {
1817 emulate_2op_SrcB(ctxt
, "rol");
1820 emulate_2op_SrcB(ctxt
, "ror");
1823 emulate_2op_SrcB(ctxt
, "rcl");
1826 emulate_2op_SrcB(ctxt
, "rcr");
1828 case 4: /* sal/shl */
1829 case 6: /* sal/shl */
1830 emulate_2op_SrcB(ctxt
, "sal");
1833 emulate_2op_SrcB(ctxt
, "shr");
1836 emulate_2op_SrcB(ctxt
, "sar");
1839 return X86EMUL_CONTINUE
;
1842 static int em_not(struct x86_emulate_ctxt
*ctxt
)
1844 ctxt
->dst
.val
= ~ctxt
->dst
.val
;
1845 return X86EMUL_CONTINUE
;
1848 static int em_neg(struct x86_emulate_ctxt
*ctxt
)
1850 emulate_1op(ctxt
, "neg");
1851 return X86EMUL_CONTINUE
;
1854 static int em_mul_ex(struct x86_emulate_ctxt
*ctxt
)
1858 emulate_1op_rax_rdx(ctxt
, "mul", ex
);
1859 return X86EMUL_CONTINUE
;
1862 static int em_imul_ex(struct x86_emulate_ctxt
*ctxt
)
1866 emulate_1op_rax_rdx(ctxt
, "imul", ex
);
1867 return X86EMUL_CONTINUE
;
1870 static int em_div_ex(struct x86_emulate_ctxt
*ctxt
)
1874 emulate_1op_rax_rdx(ctxt
, "div", de
);
1876 return emulate_de(ctxt
);
1877 return X86EMUL_CONTINUE
;
1880 static int em_idiv_ex(struct x86_emulate_ctxt
*ctxt
)
1884 emulate_1op_rax_rdx(ctxt
, "idiv", de
);
1886 return emulate_de(ctxt
);
1887 return X86EMUL_CONTINUE
;
1890 static int em_grp45(struct x86_emulate_ctxt
*ctxt
)
1892 int rc
= X86EMUL_CONTINUE
;
1894 switch (ctxt
->modrm_reg
) {
1896 emulate_1op(ctxt
, "inc");
1899 emulate_1op(ctxt
, "dec");
1901 case 2: /* call near abs */ {
1903 old_eip
= ctxt
->_eip
;
1904 ctxt
->_eip
= ctxt
->src
.val
;
1905 ctxt
->src
.val
= old_eip
;
1909 case 4: /* jmp abs */
1910 ctxt
->_eip
= ctxt
->src
.val
;
1912 case 5: /* jmp far */
1913 rc
= em_jmp_far(ctxt
);
1922 static int em_cmpxchg8b(struct x86_emulate_ctxt
*ctxt
)
1924 u64 old
= ctxt
->dst
.orig_val64
;
1926 if (((u32
) (old
>> 0) != (u32
) ctxt
->regs
[VCPU_REGS_RAX
]) ||
1927 ((u32
) (old
>> 32) != (u32
) ctxt
->regs
[VCPU_REGS_RDX
])) {
1928 ctxt
->regs
[VCPU_REGS_RAX
] = (u32
) (old
>> 0);
1929 ctxt
->regs
[VCPU_REGS_RDX
] = (u32
) (old
>> 32);
1930 ctxt
->eflags
&= ~EFLG_ZF
;
1932 ctxt
->dst
.val64
= ((u64
)ctxt
->regs
[VCPU_REGS_RCX
] << 32) |
1933 (u32
) ctxt
->regs
[VCPU_REGS_RBX
];
1935 ctxt
->eflags
|= EFLG_ZF
;
1937 return X86EMUL_CONTINUE
;
1940 static int em_ret(struct x86_emulate_ctxt
*ctxt
)
1942 ctxt
->dst
.type
= OP_REG
;
1943 ctxt
->dst
.addr
.reg
= &ctxt
->_eip
;
1944 ctxt
->dst
.bytes
= ctxt
->op_bytes
;
1945 return em_pop(ctxt
);
1948 static int em_ret_far(struct x86_emulate_ctxt
*ctxt
)
1953 rc
= emulate_pop(ctxt
, &ctxt
->_eip
, ctxt
->op_bytes
);
1954 if (rc
!= X86EMUL_CONTINUE
)
1956 if (ctxt
->op_bytes
== 4)
1957 ctxt
->_eip
= (u32
)ctxt
->_eip
;
1958 rc
= emulate_pop(ctxt
, &cs
, ctxt
->op_bytes
);
1959 if (rc
!= X86EMUL_CONTINUE
)
1961 rc
= load_segment_descriptor(ctxt
, (u16
)cs
, VCPU_SREG_CS
);
1965 static int em_cmpxchg(struct x86_emulate_ctxt
*ctxt
)
1967 /* Save real source value, then compare EAX against destination. */
1968 ctxt
->src
.orig_val
= ctxt
->src
.val
;
1969 ctxt
->src
.val
= ctxt
->regs
[VCPU_REGS_RAX
];
1970 emulate_2op_SrcV(ctxt
, "cmp");
1972 if (ctxt
->eflags
& EFLG_ZF
) {
1973 /* Success: write back to memory. */
1974 ctxt
->dst
.val
= ctxt
->src
.orig_val
;
1976 /* Failure: write the value we saw to EAX. */
1977 ctxt
->dst
.type
= OP_REG
;
1978 ctxt
->dst
.addr
.reg
= (unsigned long *)&ctxt
->regs
[VCPU_REGS_RAX
];
1980 return X86EMUL_CONTINUE
;
1983 static int em_lseg(struct x86_emulate_ctxt
*ctxt
)
1985 int seg
= ctxt
->src2
.val
;
1989 memcpy(&sel
, ctxt
->src
.valptr
+ ctxt
->op_bytes
, 2);
1991 rc
= load_segment_descriptor(ctxt
, sel
, seg
);
1992 if (rc
!= X86EMUL_CONTINUE
)
1995 ctxt
->dst
.val
= ctxt
->src
.val
;
2000 setup_syscalls_segments(struct x86_emulate_ctxt
*ctxt
,
2001 struct desc_struct
*cs
, struct desc_struct
*ss
)
2005 memset(cs
, 0, sizeof(struct desc_struct
));
2006 ctxt
->ops
->get_segment(ctxt
, &selector
, cs
, NULL
, VCPU_SREG_CS
);
2007 memset(ss
, 0, sizeof(struct desc_struct
));
2009 cs
->l
= 0; /* will be adjusted later */
2010 set_desc_base(cs
, 0); /* flat segment */
2011 cs
->g
= 1; /* 4kb granularity */
2012 set_desc_limit(cs
, 0xfffff); /* 4GB limit */
2013 cs
->type
= 0x0b; /* Read, Execute, Accessed */
2015 cs
->dpl
= 0; /* will be adjusted later */
2019 set_desc_base(ss
, 0); /* flat segment */
2020 set_desc_limit(ss
, 0xfffff); /* 4GB limit */
2021 ss
->g
= 1; /* 4kb granularity */
2023 ss
->type
= 0x03; /* Read/Write, Accessed */
2024 ss
->d
= 1; /* 32bit stack segment */
2029 static bool vendor_intel(struct x86_emulate_ctxt
*ctxt
)
2031 u32 eax
, ebx
, ecx
, edx
;
2034 ctxt
->ops
->get_cpuid(ctxt
, &eax
, &ebx
, &ecx
, &edx
);
2035 return ebx
== X86EMUL_CPUID_VENDOR_GenuineIntel_ebx
2036 && ecx
== X86EMUL_CPUID_VENDOR_GenuineIntel_ecx
2037 && edx
== X86EMUL_CPUID_VENDOR_GenuineIntel_edx
;
2040 static bool em_syscall_is_enabled(struct x86_emulate_ctxt
*ctxt
)
2042 struct x86_emulate_ops
*ops
= ctxt
->ops
;
2043 u32 eax
, ebx
, ecx
, edx
;
2046 * syscall should always be enabled in longmode - so only become
2047 * vendor specific (cpuid) if other modes are active...
2049 if (ctxt
->mode
== X86EMUL_MODE_PROT64
)
2054 ops
->get_cpuid(ctxt
, &eax
, &ebx
, &ecx
, &edx
);
2056 * Intel ("GenuineIntel")
2057 * remark: Intel CPUs only support "syscall" in 64bit
2058 * longmode. Also an 64bit guest with a
2059 * 32bit compat-app running will #UD !! While this
2060 * behaviour can be fixed (by emulating) into AMD
2061 * response - CPUs of AMD can't behave like Intel.
2063 if (ebx
== X86EMUL_CPUID_VENDOR_GenuineIntel_ebx
&&
2064 ecx
== X86EMUL_CPUID_VENDOR_GenuineIntel_ecx
&&
2065 edx
== X86EMUL_CPUID_VENDOR_GenuineIntel_edx
)
2068 /* AMD ("AuthenticAMD") */
2069 if (ebx
== X86EMUL_CPUID_VENDOR_AuthenticAMD_ebx
&&
2070 ecx
== X86EMUL_CPUID_VENDOR_AuthenticAMD_ecx
&&
2071 edx
== X86EMUL_CPUID_VENDOR_AuthenticAMD_edx
)
2074 /* AMD ("AMDisbetter!") */
2075 if (ebx
== X86EMUL_CPUID_VENDOR_AMDisbetterI_ebx
&&
2076 ecx
== X86EMUL_CPUID_VENDOR_AMDisbetterI_ecx
&&
2077 edx
== X86EMUL_CPUID_VENDOR_AMDisbetterI_edx
)
2080 /* default: (not Intel, not AMD), apply Intel's stricter rules... */
2084 static int em_syscall(struct x86_emulate_ctxt
*ctxt
)
2086 struct x86_emulate_ops
*ops
= ctxt
->ops
;
2087 struct desc_struct cs
, ss
;
2092 /* syscall is not available in real mode */
2093 if (ctxt
->mode
== X86EMUL_MODE_REAL
||
2094 ctxt
->mode
== X86EMUL_MODE_VM86
)
2095 return emulate_ud(ctxt
);
2097 if (!(em_syscall_is_enabled(ctxt
)))
2098 return emulate_ud(ctxt
);
2100 ops
->get_msr(ctxt
, MSR_EFER
, &efer
);
2101 setup_syscalls_segments(ctxt
, &cs
, &ss
);
2103 if (!(efer
& EFER_SCE
))
2104 return emulate_ud(ctxt
);
2106 ops
->get_msr(ctxt
, MSR_STAR
, &msr_data
);
2108 cs_sel
= (u16
)(msr_data
& 0xfffc);
2109 ss_sel
= (u16
)(msr_data
+ 8);
2111 if (efer
& EFER_LMA
) {
2115 ops
->set_segment(ctxt
, cs_sel
, &cs
, 0, VCPU_SREG_CS
);
2116 ops
->set_segment(ctxt
, ss_sel
, &ss
, 0, VCPU_SREG_SS
);
2118 ctxt
->regs
[VCPU_REGS_RCX
] = ctxt
->_eip
;
2119 if (efer
& EFER_LMA
) {
2120 #ifdef CONFIG_X86_64
2121 ctxt
->regs
[VCPU_REGS_R11
] = ctxt
->eflags
& ~EFLG_RF
;
2124 ctxt
->mode
== X86EMUL_MODE_PROT64
?
2125 MSR_LSTAR
: MSR_CSTAR
, &msr_data
);
2126 ctxt
->_eip
= msr_data
;
2128 ops
->get_msr(ctxt
, MSR_SYSCALL_MASK
, &msr_data
);
2129 ctxt
->eflags
&= ~(msr_data
| EFLG_RF
);
2133 ops
->get_msr(ctxt
, MSR_STAR
, &msr_data
);
2134 ctxt
->_eip
= (u32
)msr_data
;
2136 ctxt
->eflags
&= ~(EFLG_VM
| EFLG_IF
| EFLG_RF
);
2139 return X86EMUL_CONTINUE
;
2142 static int em_sysenter(struct x86_emulate_ctxt
*ctxt
)
2144 struct x86_emulate_ops
*ops
= ctxt
->ops
;
2145 struct desc_struct cs
, ss
;
2150 ops
->get_msr(ctxt
, MSR_EFER
, &efer
);
2151 /* inject #GP if in real mode */
2152 if (ctxt
->mode
== X86EMUL_MODE_REAL
)
2153 return emulate_gp(ctxt
, 0);
2156 * Not recognized on AMD in compat mode (but is recognized in legacy
2159 if ((ctxt
->mode
== X86EMUL_MODE_PROT32
) && (efer
& EFER_LMA
)
2160 && !vendor_intel(ctxt
))
2161 return emulate_ud(ctxt
);
2163 /* XXX sysenter/sysexit have not been tested in 64bit mode.
2164 * Therefore, we inject an #UD.
2166 if (ctxt
->mode
== X86EMUL_MODE_PROT64
)
2167 return emulate_ud(ctxt
);
2169 setup_syscalls_segments(ctxt
, &cs
, &ss
);
2171 ops
->get_msr(ctxt
, MSR_IA32_SYSENTER_CS
, &msr_data
);
2172 switch (ctxt
->mode
) {
2173 case X86EMUL_MODE_PROT32
:
2174 if ((msr_data
& 0xfffc) == 0x0)
2175 return emulate_gp(ctxt
, 0);
2177 case X86EMUL_MODE_PROT64
:
2178 if (msr_data
== 0x0)
2179 return emulate_gp(ctxt
, 0);
2183 ctxt
->eflags
&= ~(EFLG_VM
| EFLG_IF
| EFLG_RF
);
2184 cs_sel
= (u16
)msr_data
;
2185 cs_sel
&= ~SELECTOR_RPL_MASK
;
2186 ss_sel
= cs_sel
+ 8;
2187 ss_sel
&= ~SELECTOR_RPL_MASK
;
2188 if (ctxt
->mode
== X86EMUL_MODE_PROT64
|| (efer
& EFER_LMA
)) {
2193 ops
->set_segment(ctxt
, cs_sel
, &cs
, 0, VCPU_SREG_CS
);
2194 ops
->set_segment(ctxt
, ss_sel
, &ss
, 0, VCPU_SREG_SS
);
2196 ops
->get_msr(ctxt
, MSR_IA32_SYSENTER_EIP
, &msr_data
);
2197 ctxt
->_eip
= msr_data
;
2199 ops
->get_msr(ctxt
, MSR_IA32_SYSENTER_ESP
, &msr_data
);
2200 ctxt
->regs
[VCPU_REGS_RSP
] = msr_data
;
2202 return X86EMUL_CONTINUE
;
2205 static int em_sysexit(struct x86_emulate_ctxt
*ctxt
)
2207 struct x86_emulate_ops
*ops
= ctxt
->ops
;
2208 struct desc_struct cs
, ss
;
2211 u16 cs_sel
= 0, ss_sel
= 0;
2213 /* inject #GP if in real mode or Virtual 8086 mode */
2214 if (ctxt
->mode
== X86EMUL_MODE_REAL
||
2215 ctxt
->mode
== X86EMUL_MODE_VM86
)
2216 return emulate_gp(ctxt
, 0);
2218 setup_syscalls_segments(ctxt
, &cs
, &ss
);
2220 if ((ctxt
->rex_prefix
& 0x8) != 0x0)
2221 usermode
= X86EMUL_MODE_PROT64
;
2223 usermode
= X86EMUL_MODE_PROT32
;
2227 ops
->get_msr(ctxt
, MSR_IA32_SYSENTER_CS
, &msr_data
);
2229 case X86EMUL_MODE_PROT32
:
2230 cs_sel
= (u16
)(msr_data
+ 16);
2231 if ((msr_data
& 0xfffc) == 0x0)
2232 return emulate_gp(ctxt
, 0);
2233 ss_sel
= (u16
)(msr_data
+ 24);
2235 case X86EMUL_MODE_PROT64
:
2236 cs_sel
= (u16
)(msr_data
+ 32);
2237 if (msr_data
== 0x0)
2238 return emulate_gp(ctxt
, 0);
2239 ss_sel
= cs_sel
+ 8;
2244 cs_sel
|= SELECTOR_RPL_MASK
;
2245 ss_sel
|= SELECTOR_RPL_MASK
;
2247 ops
->set_segment(ctxt
, cs_sel
, &cs
, 0, VCPU_SREG_CS
);
2248 ops
->set_segment(ctxt
, ss_sel
, &ss
, 0, VCPU_SREG_SS
);
2250 ctxt
->_eip
= ctxt
->regs
[VCPU_REGS_RDX
];
2251 ctxt
->regs
[VCPU_REGS_RSP
] = ctxt
->regs
[VCPU_REGS_RCX
];
2253 return X86EMUL_CONTINUE
;
2256 static bool emulator_bad_iopl(struct x86_emulate_ctxt
*ctxt
)
2259 if (ctxt
->mode
== X86EMUL_MODE_REAL
)
2261 if (ctxt
->mode
== X86EMUL_MODE_VM86
)
2263 iopl
= (ctxt
->eflags
& X86_EFLAGS_IOPL
) >> IOPL_SHIFT
;
2264 return ctxt
->ops
->cpl(ctxt
) > iopl
;
2267 static bool emulator_io_port_access_allowed(struct x86_emulate_ctxt
*ctxt
,
2270 struct x86_emulate_ops
*ops
= ctxt
->ops
;
2271 struct desc_struct tr_seg
;
2274 u16 tr
, io_bitmap_ptr
, perm
, bit_idx
= port
& 0x7;
2275 unsigned mask
= (1 << len
) - 1;
2278 ops
->get_segment(ctxt
, &tr
, &tr_seg
, &base3
, VCPU_SREG_TR
);
2281 if (desc_limit_scaled(&tr_seg
) < 103)
2283 base
= get_desc_base(&tr_seg
);
2284 #ifdef CONFIG_X86_64
2285 base
|= ((u64
)base3
) << 32;
2287 r
= ops
->read_std(ctxt
, base
+ 102, &io_bitmap_ptr
, 2, NULL
);
2288 if (r
!= X86EMUL_CONTINUE
)
2290 if (io_bitmap_ptr
+ port
/8 > desc_limit_scaled(&tr_seg
))
2292 r
= ops
->read_std(ctxt
, base
+ io_bitmap_ptr
+ port
/8, &perm
, 2, NULL
);
2293 if (r
!= X86EMUL_CONTINUE
)
2295 if ((perm
>> bit_idx
) & mask
)
2300 static bool emulator_io_permited(struct x86_emulate_ctxt
*ctxt
,
2306 if (emulator_bad_iopl(ctxt
))
2307 if (!emulator_io_port_access_allowed(ctxt
, port
, len
))
2310 ctxt
->perm_ok
= true;
2315 static void save_state_to_tss16(struct x86_emulate_ctxt
*ctxt
,
2316 struct tss_segment_16
*tss
)
2318 tss
->ip
= ctxt
->_eip
;
2319 tss
->flag
= ctxt
->eflags
;
2320 tss
->ax
= ctxt
->regs
[VCPU_REGS_RAX
];
2321 tss
->cx
= ctxt
->regs
[VCPU_REGS_RCX
];
2322 tss
->dx
= ctxt
->regs
[VCPU_REGS_RDX
];
2323 tss
->bx
= ctxt
->regs
[VCPU_REGS_RBX
];
2324 tss
->sp
= ctxt
->regs
[VCPU_REGS_RSP
];
2325 tss
->bp
= ctxt
->regs
[VCPU_REGS_RBP
];
2326 tss
->si
= ctxt
->regs
[VCPU_REGS_RSI
];
2327 tss
->di
= ctxt
->regs
[VCPU_REGS_RDI
];
2329 tss
->es
= get_segment_selector(ctxt
, VCPU_SREG_ES
);
2330 tss
->cs
= get_segment_selector(ctxt
, VCPU_SREG_CS
);
2331 tss
->ss
= get_segment_selector(ctxt
, VCPU_SREG_SS
);
2332 tss
->ds
= get_segment_selector(ctxt
, VCPU_SREG_DS
);
2333 tss
->ldt
= get_segment_selector(ctxt
, VCPU_SREG_LDTR
);
static int load_state_from_tss16(struct x86_emulate_ctxt *ctxt,
				 struct tss_segment_16 *tss)
{
	int ret;

	ctxt->_eip = tss->ip;
	ctxt->eflags = tss->flag | 2;
	ctxt->regs[VCPU_REGS_RAX] = tss->ax;
	ctxt->regs[VCPU_REGS_RCX] = tss->cx;
	ctxt->regs[VCPU_REGS_RDX] = tss->dx;
	ctxt->regs[VCPU_REGS_RBX] = tss->bx;
	ctxt->regs[VCPU_REGS_RSP] = tss->sp;
	ctxt->regs[VCPU_REGS_RBP] = tss->bp;
	ctxt->regs[VCPU_REGS_RSI] = tss->si;
	ctxt->regs[VCPU_REGS_RDI] = tss->di;

	/*
	 * SDM says that segment selectors are loaded before segment
	 * descriptors.
	 */
	set_segment_selector(ctxt, tss->ldt, VCPU_SREG_LDTR);
	set_segment_selector(ctxt, tss->es, VCPU_SREG_ES);
	set_segment_selector(ctxt, tss->cs, VCPU_SREG_CS);
	set_segment_selector(ctxt, tss->ss, VCPU_SREG_SS);
	set_segment_selector(ctxt, tss->ds, VCPU_SREG_DS);

	/*
	 * Now load segment descriptors. If a fault happens at this stage
	 * it is handled in the context of the new task.
	 */
	ret = load_segment_descriptor(ctxt, tss->ldt, VCPU_SREG_LDTR);
	if (ret != X86EMUL_CONTINUE)
		return ret;
	ret = load_segment_descriptor(ctxt, tss->es, VCPU_SREG_ES);
	if (ret != X86EMUL_CONTINUE)
		return ret;
	ret = load_segment_descriptor(ctxt, tss->cs, VCPU_SREG_CS);
	if (ret != X86EMUL_CONTINUE)
		return ret;
	ret = load_segment_descriptor(ctxt, tss->ss, VCPU_SREG_SS);
	if (ret != X86EMUL_CONTINUE)
		return ret;
	ret = load_segment_descriptor(ctxt, tss->ds, VCPU_SREG_DS);
	if (ret != X86EMUL_CONTINUE)
		return ret;

	return X86EMUL_CONTINUE;
}
static int task_switch_16(struct x86_emulate_ctxt *ctxt,
			  u16 tss_selector, u16 old_tss_sel,
			  ulong old_tss_base, struct desc_struct *new_desc)
{
	struct x86_emulate_ops *ops = ctxt->ops;
	struct tss_segment_16 tss_seg;
	int ret;
	u32 new_tss_base = get_desc_base(new_desc);

	ret = ops->read_std(ctxt, old_tss_base, &tss_seg, sizeof tss_seg,
			    &ctxt->exception);
	if (ret != X86EMUL_CONTINUE)
		/* FIXME: need to provide precise fault address */
		return ret;

	save_state_to_tss16(ctxt, &tss_seg);

	ret = ops->write_std(ctxt, old_tss_base, &tss_seg, sizeof tss_seg,
			     &ctxt->exception);
	if (ret != X86EMUL_CONTINUE)
		/* FIXME: need to provide precise fault address */
		return ret;

	ret = ops->read_std(ctxt, new_tss_base, &tss_seg, sizeof tss_seg,
			    &ctxt->exception);
	if (ret != X86EMUL_CONTINUE)
		/* FIXME: need to provide precise fault address */
		return ret;

	if (old_tss_sel != 0xffff) {
		tss_seg.prev_task_link = old_tss_sel;

		ret = ops->write_std(ctxt, new_tss_base,
				     &tss_seg.prev_task_link,
				     sizeof tss_seg.prev_task_link,
				     &ctxt->exception);
		if (ret != X86EMUL_CONTINUE)
			/* FIXME: need to provide precise fault address */
			return ret;
	}

	return load_state_from_tss16(ctxt, &tss_seg);
}
static void save_state_to_tss32(struct x86_emulate_ctxt *ctxt,
				struct tss_segment_32 *tss)
{
	tss->cr3 = ctxt->ops->get_cr(ctxt, 3);
	tss->eip = ctxt->_eip;
	tss->eflags = ctxt->eflags;
	tss->eax = ctxt->regs[VCPU_REGS_RAX];
	tss->ecx = ctxt->regs[VCPU_REGS_RCX];
	tss->edx = ctxt->regs[VCPU_REGS_RDX];
	tss->ebx = ctxt->regs[VCPU_REGS_RBX];
	tss->esp = ctxt->regs[VCPU_REGS_RSP];
	tss->ebp = ctxt->regs[VCPU_REGS_RBP];
	tss->esi = ctxt->regs[VCPU_REGS_RSI];
	tss->edi = ctxt->regs[VCPU_REGS_RDI];

	tss->es = get_segment_selector(ctxt, VCPU_SREG_ES);
	tss->cs = get_segment_selector(ctxt, VCPU_SREG_CS);
	tss->ss = get_segment_selector(ctxt, VCPU_SREG_SS);
	tss->ds = get_segment_selector(ctxt, VCPU_SREG_DS);
	tss->fs = get_segment_selector(ctxt, VCPU_SREG_FS);
	tss->gs = get_segment_selector(ctxt, VCPU_SREG_GS);
	tss->ldt_selector = get_segment_selector(ctxt, VCPU_SREG_LDTR);
}
static int load_state_from_tss32(struct x86_emulate_ctxt *ctxt,
				 struct tss_segment_32 *tss)
{
	int ret;

	if (ctxt->ops->set_cr(ctxt, 3, tss->cr3))
		return emulate_gp(ctxt, 0);
	ctxt->_eip = tss->eip;
	ctxt->eflags = tss->eflags | 2;

	/* General purpose registers */
	ctxt->regs[VCPU_REGS_RAX] = tss->eax;
	ctxt->regs[VCPU_REGS_RCX] = tss->ecx;
	ctxt->regs[VCPU_REGS_RDX] = tss->edx;
	ctxt->regs[VCPU_REGS_RBX] = tss->ebx;
	ctxt->regs[VCPU_REGS_RSP] = tss->esp;
	ctxt->regs[VCPU_REGS_RBP] = tss->ebp;
	ctxt->regs[VCPU_REGS_RSI] = tss->esi;
	ctxt->regs[VCPU_REGS_RDI] = tss->edi;

	/*
	 * SDM says that segment selectors are loaded before segment
	 * descriptors.
	 */
	set_segment_selector(ctxt, tss->ldt_selector, VCPU_SREG_LDTR);
	set_segment_selector(ctxt, tss->es, VCPU_SREG_ES);
	set_segment_selector(ctxt, tss->cs, VCPU_SREG_CS);
	set_segment_selector(ctxt, tss->ss, VCPU_SREG_SS);
	set_segment_selector(ctxt, tss->ds, VCPU_SREG_DS);
	set_segment_selector(ctxt, tss->fs, VCPU_SREG_FS);
	set_segment_selector(ctxt, tss->gs, VCPU_SREG_GS);

	/*
	 * If we're switching between Protected Mode and VM86, we need to make
	 * sure to update the mode before loading the segment descriptors so
	 * that the selectors are interpreted correctly.
	 *
	 * Need to get rflags to the vcpu struct immediately because it
	 * influences the CPL which is checked at least when loading the segment
	 * descriptors and when pushing an error code to the new kernel stack.
	 *
	 * TODO Introduce a separate ctxt->ops->set_cpl callback
	 */
	if (ctxt->eflags & X86_EFLAGS_VM)
		ctxt->mode = X86EMUL_MODE_VM86;
	else
		ctxt->mode = X86EMUL_MODE_PROT32;

	ctxt->ops->set_rflags(ctxt, ctxt->eflags);

	/*
	 * Now load segment descriptors. If a fault happens at this stage
	 * it is handled in the context of the new task.
	 */
	ret = load_segment_descriptor(ctxt, tss->ldt_selector, VCPU_SREG_LDTR);
	if (ret != X86EMUL_CONTINUE)
		return ret;
	ret = load_segment_descriptor(ctxt, tss->es, VCPU_SREG_ES);
	if (ret != X86EMUL_CONTINUE)
		return ret;
	ret = load_segment_descriptor(ctxt, tss->cs, VCPU_SREG_CS);
	if (ret != X86EMUL_CONTINUE)
		return ret;
	ret = load_segment_descriptor(ctxt, tss->ss, VCPU_SREG_SS);
	if (ret != X86EMUL_CONTINUE)
		return ret;
	ret = load_segment_descriptor(ctxt, tss->ds, VCPU_SREG_DS);
	if (ret != X86EMUL_CONTINUE)
		return ret;
	ret = load_segment_descriptor(ctxt, tss->fs, VCPU_SREG_FS);
	if (ret != X86EMUL_CONTINUE)
		return ret;
	ret = load_segment_descriptor(ctxt, tss->gs, VCPU_SREG_GS);
	if (ret != X86EMUL_CONTINUE)
		return ret;

	return X86EMUL_CONTINUE;
}
static int task_switch_32(struct x86_emulate_ctxt *ctxt,
			  u16 tss_selector, u16 old_tss_sel,
			  ulong old_tss_base, struct desc_struct *new_desc)
{
	struct x86_emulate_ops *ops = ctxt->ops;
	struct tss_segment_32 tss_seg;
	int ret;
	u32 new_tss_base = get_desc_base(new_desc);

	ret = ops->read_std(ctxt, old_tss_base, &tss_seg, sizeof tss_seg,
			    &ctxt->exception);
	if (ret != X86EMUL_CONTINUE)
		/* FIXME: need to provide precise fault address */
		return ret;

	save_state_to_tss32(ctxt, &tss_seg);

	ret = ops->write_std(ctxt, old_tss_base, &tss_seg, sizeof tss_seg,
			     &ctxt->exception);
	if (ret != X86EMUL_CONTINUE)
		/* FIXME: need to provide precise fault address */
		return ret;

	ret = ops->read_std(ctxt, new_tss_base, &tss_seg, sizeof tss_seg,
			    &ctxt->exception);
	if (ret != X86EMUL_CONTINUE)
		/* FIXME: need to provide precise fault address */
		return ret;

	if (old_tss_sel != 0xffff) {
		tss_seg.prev_task_link = old_tss_sel;

		ret = ops->write_std(ctxt, new_tss_base,
				     &tss_seg.prev_task_link,
				     sizeof tss_seg.prev_task_link,
				     &ctxt->exception);
		if (ret != X86EMUL_CONTINUE)
			/* FIXME: need to provide precise fault address */
			return ret;
	}

	return load_state_from_tss32(ctxt, &tss_seg);
}
static int emulator_do_task_switch(struct x86_emulate_ctxt *ctxt,
				   u16 tss_selector, int idt_index, int reason,
				   bool has_error_code, u32 error_code)
{
	struct x86_emulate_ops *ops = ctxt->ops;
	struct desc_struct curr_tss_desc, next_tss_desc;
	int ret;
	u16 old_tss_sel = get_segment_selector(ctxt, VCPU_SREG_TR);
	ulong old_tss_base =
		ops->get_cached_segment_base(ctxt, VCPU_SREG_TR);
	u32 desc_limit;

	/* FIXME: old_tss_base == ~0 ? */

	ret = read_segment_descriptor(ctxt, tss_selector, &next_tss_desc);
	if (ret != X86EMUL_CONTINUE)
		return ret;
	ret = read_segment_descriptor(ctxt, old_tss_sel, &curr_tss_desc);
	if (ret != X86EMUL_CONTINUE)
		return ret;

	/* FIXME: check that next_tss_desc is tss */

	/*
	 * Check privileges. The three cases are task switch caused by...
	 *
	 * 1. jmp/call/int to task gate: Check against DPL of the task gate
	 * 2. Exception/IRQ/iret: No check is performed
	 * 3. jmp/call to TSS: Check against DPL of the TSS
	 */
	if (reason == TASK_SWITCH_GATE) {
		if (idt_index != -1) {
			/* Software interrupts */
			struct desc_struct task_gate_desc;
			int dpl;

			ret = read_interrupt_descriptor(ctxt, idt_index,
							&task_gate_desc);
			if (ret != X86EMUL_CONTINUE)
				return ret;

			dpl = task_gate_desc.dpl;
			if ((tss_selector & 3) > dpl || ops->cpl(ctxt) > dpl)
				return emulate_gp(ctxt, (idt_index << 3) | 0x2);
		}
	} else if (reason != TASK_SWITCH_IRET) {
		int dpl = next_tss_desc.dpl;
		if ((tss_selector & 3) > dpl || ops->cpl(ctxt) > dpl)
			return emulate_gp(ctxt, tss_selector);
	}

	desc_limit = desc_limit_scaled(&next_tss_desc);
	if (!next_tss_desc.p ||
	    ((desc_limit < 0x67 && (next_tss_desc.type & 8)) ||
	     desc_limit < 0x2b)) {
		emulate_ts(ctxt, tss_selector & 0xfffc);
		return X86EMUL_PROPAGATE_FAULT;
	}

	if (reason == TASK_SWITCH_IRET || reason == TASK_SWITCH_JMP) {
		curr_tss_desc.type &= ~(1 << 1); /* clear busy flag */
		write_segment_descriptor(ctxt, old_tss_sel, &curr_tss_desc);
	}

	if (reason == TASK_SWITCH_IRET)
		ctxt->eflags = ctxt->eflags & ~X86_EFLAGS_NT;

	/* set back link to prev task only if NT bit is set in eflags
	   note that old_tss_sel is not used after this point */
	if (reason != TASK_SWITCH_CALL && reason != TASK_SWITCH_GATE)
		old_tss_sel = 0xffff;

	if (next_tss_desc.type & 8)
		ret = task_switch_32(ctxt, tss_selector, old_tss_sel,
				     old_tss_base, &next_tss_desc);
	else
		ret = task_switch_16(ctxt, tss_selector, old_tss_sel,
				     old_tss_base, &next_tss_desc);
	if (ret != X86EMUL_CONTINUE)
		return ret;

	if (reason == TASK_SWITCH_CALL || reason == TASK_SWITCH_GATE)
		ctxt->eflags = ctxt->eflags | X86_EFLAGS_NT;

	if (reason != TASK_SWITCH_IRET) {
		next_tss_desc.type |= (1 << 1); /* set busy flag */
		write_segment_descriptor(ctxt, tss_selector, &next_tss_desc);
	}

	ops->set_cr(ctxt, 0, ops->get_cr(ctxt, 0) | X86_CR0_TS);
	ops->set_segment(ctxt, tss_selector, &next_tss_desc, 0, VCPU_SREG_TR);

	if (has_error_code) {
		ctxt->op_bytes = ctxt->ad_bytes = (next_tss_desc.type & 8) ? 4 : 2;
		ctxt->lock_prefix = 0;
		ctxt->src.val = (unsigned long) error_code;
		ret = em_push(ctxt);
	}

	return ret;
}
int emulator_task_switch(struct x86_emulate_ctxt *ctxt,
			 u16 tss_selector, int idt_index, int reason,
			 bool has_error_code, u32 error_code)
{
	int rc;

	ctxt->_eip = ctxt->eip;
	ctxt->dst.type = OP_NONE;

	rc = emulator_do_task_switch(ctxt, tss_selector, idt_index, reason,
				     has_error_code, error_code);

	if (rc == X86EMUL_CONTINUE)
		ctxt->eip = ctxt->_eip;

	return (rc == X86EMUL_UNHANDLEABLE) ? EMULATION_FAILED : EMULATION_OK;
}
static void string_addr_inc(struct x86_emulate_ctxt *ctxt, unsigned seg,
			    int reg, struct operand *op)
{
	int df = (ctxt->eflags & EFLG_DF) ? -1 : 1;

	register_address_increment(ctxt, &ctxt->regs[reg], df * op->bytes);
	op->addr.mem.ea = register_address(ctxt, ctxt->regs[reg]);
	op->addr.mem.seg = seg;
}
static int em_das(struct x86_emulate_ctxt *ctxt)
{
	u8 al, old_al;
	bool af, cf, old_cf;

	cf = ctxt->eflags & X86_EFLAGS_CF;
	al = ctxt->dst.val;

	old_al = al;
	old_cf = cf;
	cf = false;
	af = ctxt->eflags & X86_EFLAGS_AF;
	if ((al & 0x0f) > 9 || af) {
		al -= 6;
		cf = old_cf | (al >= 250);
		af = true;
	} else {
		af = false;
	}
	if (old_al > 0x99 || old_cf) {
		al -= 0x60;
		cf = true;
	}

	ctxt->dst.val = al;
	/* Set PF, ZF, SF */
	ctxt->src.type = OP_IMM;
	ctxt->src.val = 0;
	ctxt->src.bytes = 1;
	emulate_2op_SrcV(ctxt, "or");
	ctxt->eflags &= ~(X86_EFLAGS_AF | X86_EFLAGS_CF);
	if (cf)
		ctxt->eflags |= X86_EFLAGS_CF;
	if (af)
		ctxt->eflags |= X86_EFLAGS_AF;
	return X86EMUL_CONTINUE;
}
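/*
 * Worked example: AL = 0x4b with AF and CF clear. The low nibble 0xb is
 * greater than 9, so 6 is subtracted (AL = 0x45) and AF is set; the old
 * AL (0x4b) is not above 0x99 and the old CF was clear, so the high
 * nibble is left alone and CF stays clear. The "or" with zero at the end
 * only recomputes PF, ZF and SF for the final AL value.
 */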
static int em_call(struct x86_emulate_ctxt *ctxt)
{
	long rel = ctxt->src.val;

	ctxt->src.val = (unsigned long)ctxt->_eip;
	jmp_rel(ctxt, rel);
	return em_push(ctxt);
}
static int em_call_far(struct x86_emulate_ctxt *ctxt)
{
	u16 sel, old_cs;
	ulong old_eip;
	int rc;

	old_cs = get_segment_selector(ctxt, VCPU_SREG_CS);
	old_eip = ctxt->_eip;

	memcpy(&sel, ctxt->src.valptr + ctxt->op_bytes, 2);
	if (load_segment_descriptor(ctxt, sel, VCPU_SREG_CS))
		return X86EMUL_CONTINUE;

	ctxt->_eip = 0;
	memcpy(&ctxt->_eip, ctxt->src.valptr, ctxt->op_bytes);

	ctxt->src.val = old_cs;
	rc = em_push(ctxt);
	if (rc != X86EMUL_CONTINUE)
		return rc;

	ctxt->src.val = old_eip;
	return em_push(ctxt);
}
static int em_ret_near_imm(struct x86_emulate_ctxt *ctxt)
{
	int rc;

	ctxt->dst.type = OP_REG;
	ctxt->dst.addr.reg = &ctxt->_eip;
	ctxt->dst.bytes = ctxt->op_bytes;
	rc = emulate_pop(ctxt, &ctxt->dst.val, ctxt->op_bytes);
	if (rc != X86EMUL_CONTINUE)
		return rc;
	register_address_increment(ctxt, &ctxt->regs[VCPU_REGS_RSP], ctxt->src.val);
	return X86EMUL_CONTINUE;
}
static int em_add(struct x86_emulate_ctxt *ctxt)
{
	emulate_2op_SrcV(ctxt, "add");
	return X86EMUL_CONTINUE;
}

static int em_or(struct x86_emulate_ctxt *ctxt)
{
	emulate_2op_SrcV(ctxt, "or");
	return X86EMUL_CONTINUE;
}

static int em_adc(struct x86_emulate_ctxt *ctxt)
{
	emulate_2op_SrcV(ctxt, "adc");
	return X86EMUL_CONTINUE;
}

static int em_sbb(struct x86_emulate_ctxt *ctxt)
{
	emulate_2op_SrcV(ctxt, "sbb");
	return X86EMUL_CONTINUE;
}

static int em_and(struct x86_emulate_ctxt *ctxt)
{
	emulate_2op_SrcV(ctxt, "and");
	return X86EMUL_CONTINUE;
}

static int em_sub(struct x86_emulate_ctxt *ctxt)
{
	emulate_2op_SrcV(ctxt, "sub");
	return X86EMUL_CONTINUE;
}

static int em_xor(struct x86_emulate_ctxt *ctxt)
{
	emulate_2op_SrcV(ctxt, "xor");
	return X86EMUL_CONTINUE;
}

static int em_cmp(struct x86_emulate_ctxt *ctxt)
{
	emulate_2op_SrcV(ctxt, "cmp");
	/* Disable writeback. */
	ctxt->dst.type = OP_NONE;
	return X86EMUL_CONTINUE;
}

static int em_test(struct x86_emulate_ctxt *ctxt)
{
	emulate_2op_SrcV(ctxt, "test");
	/* Disable writeback. */
	ctxt->dst.type = OP_NONE;
	return X86EMUL_CONTINUE;
}
static int em_xchg(struct x86_emulate_ctxt *ctxt)
{
	/* Write back the register source. */
	ctxt->src.val = ctxt->dst.val;
	write_register_operand(&ctxt->src);

	/* Write back the memory destination with implicit LOCK prefix. */
	ctxt->dst.val = ctxt->src.orig_val;
	ctxt->lock_prefix = 1;
	return X86EMUL_CONTINUE;
}
static int em_imul(struct x86_emulate_ctxt *ctxt)
{
	emulate_2op_SrcV_nobyte(ctxt, "imul");
	return X86EMUL_CONTINUE;
}

static int em_imul_3op(struct x86_emulate_ctxt *ctxt)
{
	ctxt->dst.val = ctxt->src2.val;
	return em_imul(ctxt);
}
static int em_cwd(struct x86_emulate_ctxt *ctxt)
{
	ctxt->dst.type = OP_REG;
	ctxt->dst.bytes = ctxt->src.bytes;
	ctxt->dst.addr.reg = &ctxt->regs[VCPU_REGS_RDX];
	ctxt->dst.val = ~((ctxt->src.val >> (ctxt->src.bytes * 8 - 1)) - 1);

	return X86EMUL_CONTINUE;
}
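/*
 * The expression above is a branchless sign extension: for an N-byte
 * source, (val >> (N*8 - 1)) isolates the sign bit, so the result is
 * ~(1 - 1) = ~0 (all ones in rDX) for a negative value and
 * ~(0 - 1) = 0 for a non-negative one, exactly what cwd/cdq/cqo store.
 */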
static int em_rdtsc(struct x86_emulate_ctxt *ctxt)
{
	u64 tsc = 0;

	ctxt->ops->get_msr(ctxt, MSR_IA32_TSC, &tsc);
	ctxt->regs[VCPU_REGS_RAX] = (u32)tsc;
	ctxt->regs[VCPU_REGS_RDX] = tsc >> 32;
	return X86EMUL_CONTINUE;
}
static int em_rdpmc(struct x86_emulate_ctxt *ctxt)
{
	u64 pmc;

	if (ctxt->ops->read_pmc(ctxt, ctxt->regs[VCPU_REGS_RCX], &pmc))
		return emulate_gp(ctxt, 0);
	ctxt->regs[VCPU_REGS_RAX] = (u32)pmc;
	ctxt->regs[VCPU_REGS_RDX] = pmc >> 32;
	return X86EMUL_CONTINUE;
}
static int em_mov(struct x86_emulate_ctxt *ctxt)
{
	memcpy(ctxt->dst.valptr, ctxt->src.valptr, ctxt->op_bytes);
	return X86EMUL_CONTINUE;
}
static int em_cr_write(struct x86_emulate_ctxt *ctxt)
{
	if (ctxt->ops->set_cr(ctxt, ctxt->modrm_reg, ctxt->src.val))
		return emulate_gp(ctxt, 0);

	/* Disable writeback. */
	ctxt->dst.type = OP_NONE;
	return X86EMUL_CONTINUE;
}
static int em_dr_write(struct x86_emulate_ctxt *ctxt)
{
	unsigned long val;

	if (ctxt->mode == X86EMUL_MODE_PROT64)
		val = ctxt->src.val & ~0ULL;
	else
		val = ctxt->src.val & ~0U;

	/* #UD condition is already handled. */
	if (ctxt->ops->set_dr(ctxt, ctxt->modrm_reg, val) < 0)
		return emulate_gp(ctxt, 0);

	/* Disable writeback. */
	ctxt->dst.type = OP_NONE;
	return X86EMUL_CONTINUE;
}
static int em_wrmsr(struct x86_emulate_ctxt *ctxt)
{
	u64 msr_data;

	msr_data = (u32)ctxt->regs[VCPU_REGS_RAX]
		| ((u64)ctxt->regs[VCPU_REGS_RDX] << 32);
	if (ctxt->ops->set_msr(ctxt, ctxt->regs[VCPU_REGS_RCX], msr_data))
		return emulate_gp(ctxt, 0);

	return X86EMUL_CONTINUE;
}
static int em_rdmsr(struct x86_emulate_ctxt *ctxt)
{
	u64 msr_data;

	if (ctxt->ops->get_msr(ctxt, ctxt->regs[VCPU_REGS_RCX], &msr_data))
		return emulate_gp(ctxt, 0);

	ctxt->regs[VCPU_REGS_RAX] = (u32)msr_data;
	ctxt->regs[VCPU_REGS_RDX] = msr_data >> 32;
	return X86EMUL_CONTINUE;
}
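/*
 * rdmsr/wrmsr move a 64-bit MSR value through the EDX:EAX pair: e.g. an
 * MSR value of 0x0000001200ab34cd reads back as EAX = 0x00ab34cd and
 * EDX = 0x00000012, and wrmsr above reassembles the same value from the
 * two registers.
 */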
static int em_mov_rm_sreg(struct x86_emulate_ctxt *ctxt)
{
	if (ctxt->modrm_reg > VCPU_SREG_GS)
		return emulate_ud(ctxt);

	ctxt->dst.val = get_segment_selector(ctxt, ctxt->modrm_reg);
	return X86EMUL_CONTINUE;
}
static int em_mov_sreg_rm(struct x86_emulate_ctxt *ctxt)
{
	u16 sel = ctxt->src.val;

	if (ctxt->modrm_reg == VCPU_SREG_CS || ctxt->modrm_reg > VCPU_SREG_GS)
		return emulate_ud(ctxt);

	if (ctxt->modrm_reg == VCPU_SREG_SS)
		ctxt->interruptibility = KVM_X86_SHADOW_INT_MOV_SS;

	/* Disable writeback. */
	ctxt->dst.type = OP_NONE;
	return load_segment_descriptor(ctxt, sel, ctxt->modrm_reg);
}
static int em_invlpg(struct x86_emulate_ctxt *ctxt)
{
	int rc;
	ulong linear;

	rc = linearize(ctxt, ctxt->src.addr.mem, 1, false, &linear);
	if (rc == X86EMUL_CONTINUE)
		ctxt->ops->invlpg(ctxt, linear);
	/* Disable writeback. */
	ctxt->dst.type = OP_NONE;
	return X86EMUL_CONTINUE;
}
static int em_clts(struct x86_emulate_ctxt *ctxt)
{
	ulong cr0;

	cr0 = ctxt->ops->get_cr(ctxt, 0);
	cr0 &= ~X86_CR0_TS;
	ctxt->ops->set_cr(ctxt, 0, cr0);
	return X86EMUL_CONTINUE;
}
static int em_vmcall(struct x86_emulate_ctxt *ctxt)
{
	int rc;

	if (ctxt->modrm_mod != 3 || ctxt->modrm_rm != 1)
		return X86EMUL_UNHANDLEABLE;

	rc = ctxt->ops->fix_hypercall(ctxt);
	if (rc != X86EMUL_CONTINUE)
		return rc;

	/* Let the processor re-execute the fixed hypercall */
	ctxt->_eip = ctxt->eip;
	/* Disable writeback. */
	ctxt->dst.type = OP_NONE;
	return X86EMUL_CONTINUE;
}
static int emulate_store_desc_ptr(struct x86_emulate_ctxt *ctxt,
				  void (*get)(struct x86_emulate_ctxt *ctxt,
					      struct desc_ptr *ptr))
{
	struct desc_ptr desc_ptr;

	if (ctxt->mode == X86EMUL_MODE_PROT64)
		ctxt->op_bytes = 8;
	get(ctxt, &desc_ptr);
	if (ctxt->op_bytes == 2) {
		ctxt->op_bytes = 4;
		desc_ptr.address &= 0x00ffffff;
	}
	/* Disable writeback. */
	ctxt->dst.type = OP_NONE;
	return segmented_write(ctxt, ctxt->dst.addr.mem,
			       &desc_ptr, 2 + ctxt->op_bytes);
}
static int em_sgdt(struct x86_emulate_ctxt *ctxt)
{
	return emulate_store_desc_ptr(ctxt, ctxt->ops->get_gdt);
}

static int em_sidt(struct x86_emulate_ctxt *ctxt)
{
	return emulate_store_desc_ptr(ctxt, ctxt->ops->get_idt);
}
static int em_lgdt(struct x86_emulate_ctxt *ctxt)
{
	struct desc_ptr desc_ptr;
	int rc;

	if (ctxt->mode == X86EMUL_MODE_PROT64)
		ctxt->op_bytes = 8;
	rc = read_descriptor(ctxt, ctxt->src.addr.mem,
			     &desc_ptr.size, &desc_ptr.address,
			     ctxt->op_bytes);
	if (rc != X86EMUL_CONTINUE)
		return rc;
	ctxt->ops->set_gdt(ctxt, &desc_ptr);
	/* Disable writeback. */
	ctxt->dst.type = OP_NONE;
	return X86EMUL_CONTINUE;
}
static int em_vmmcall(struct x86_emulate_ctxt *ctxt)
{
	int rc;

	rc = ctxt->ops->fix_hypercall(ctxt);

	/* Disable writeback. */
	ctxt->dst.type = OP_NONE;
	return rc;
}
static int em_lidt(struct x86_emulate_ctxt *ctxt)
{
	struct desc_ptr desc_ptr;
	int rc;

	if (ctxt->mode == X86EMUL_MODE_PROT64)
		ctxt->op_bytes = 8;
	rc = read_descriptor(ctxt, ctxt->src.addr.mem,
			     &desc_ptr.size, &desc_ptr.address,
			     ctxt->op_bytes);
	if (rc != X86EMUL_CONTINUE)
		return rc;
	ctxt->ops->set_idt(ctxt, &desc_ptr);
	/* Disable writeback. */
	ctxt->dst.type = OP_NONE;
	return X86EMUL_CONTINUE;
}
static int em_smsw(struct x86_emulate_ctxt *ctxt)
{
	ctxt->dst.bytes = 2;
	ctxt->dst.val = ctxt->ops->get_cr(ctxt, 0);
	return X86EMUL_CONTINUE;
}
static int em_lmsw(struct x86_emulate_ctxt *ctxt)
{
	ctxt->ops->set_cr(ctxt, 0, (ctxt->ops->get_cr(ctxt, 0) & ~0x0eul)
			  | (ctxt->src.val & 0x0f));
	ctxt->dst.type = OP_NONE;
	return X86EMUL_CONTINUE;
}
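/*
 * Note the mask pair above: ~0x0e keeps CR0.PE (bit 0) while clearing
 * MP/EM/TS (bits 1-3), and src & 0x0f supplies the new low nibble. The
 * net effect matches lmsw semantics: it can set PE but can never clear
 * it, since bit 0 of the old CR0 is OR-ed back in.
 */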
static int em_loop(struct x86_emulate_ctxt *ctxt)
{
	register_address_increment(ctxt, &ctxt->regs[VCPU_REGS_RCX], -1);
	if ((address_mask(ctxt, ctxt->regs[VCPU_REGS_RCX]) != 0) &&
	    (ctxt->b == 0xe2 || test_cc(ctxt->b ^ 0x5, ctxt->eflags)))
		jmp_rel(ctxt, ctxt->src.val);

	return X86EMUL_CONTINUE;
}
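/*
 * The b ^ 0x5 trick above maps the loop opcodes onto the jcc condition
 * table: 0xe0 (loopne) ^ 0x5 = 0xe5, whose low nibble selects the
 * "ZF clear" test, and 0xe1 (loope) ^ 0x5 = 0xe4, which selects
 * "ZF set"; plain loop (0xe2) skips the flag test entirely.
 */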
static int em_jcxz(struct x86_emulate_ctxt *ctxt)
{
	if (address_mask(ctxt, ctxt->regs[VCPU_REGS_RCX]) == 0)
		jmp_rel(ctxt, ctxt->src.val);

	return X86EMUL_CONTINUE;
}
static int em_in(struct x86_emulate_ctxt *ctxt)
{
	if (!pio_in_emulated(ctxt, ctxt->dst.bytes, ctxt->src.val,
			     &ctxt->dst.val))
		return X86EMUL_IO_NEEDED;

	return X86EMUL_CONTINUE;
}
static int em_out(struct x86_emulate_ctxt *ctxt)
{
	ctxt->ops->pio_out_emulated(ctxt, ctxt->src.bytes, ctxt->dst.val,
				    ctxt->src.val, 1);
	/* Disable writeback. */
	ctxt->dst.type = OP_NONE;
	return X86EMUL_CONTINUE;
}
static int em_cli(struct x86_emulate_ctxt *ctxt)
{
	if (emulator_bad_iopl(ctxt))
		return emulate_gp(ctxt, 0);

	ctxt->eflags &= ~X86_EFLAGS_IF;
	return X86EMUL_CONTINUE;
}
static int em_sti(struct x86_emulate_ctxt *ctxt)
{
	if (emulator_bad_iopl(ctxt))
		return emulate_gp(ctxt, 0);

	ctxt->interruptibility = KVM_X86_SHADOW_INT_STI;
	ctxt->eflags |= X86_EFLAGS_IF;
	return X86EMUL_CONTINUE;
}
static int em_bt(struct x86_emulate_ctxt *ctxt)
{
	/* Disable writeback. */
	ctxt->dst.type = OP_NONE;
	/* only subword offset */
	ctxt->src.val &= (ctxt->dst.bytes << 3) - 1;

	emulate_2op_SrcV_nobyte(ctxt, "bt");
	return X86EMUL_CONTINUE;
}
static int em_bts(struct x86_emulate_ctxt *ctxt)
{
	emulate_2op_SrcV_nobyte(ctxt, "bts");
	return X86EMUL_CONTINUE;
}

static int em_btr(struct x86_emulate_ctxt *ctxt)
{
	emulate_2op_SrcV_nobyte(ctxt, "btr");
	return X86EMUL_CONTINUE;
}

static int em_btc(struct x86_emulate_ctxt *ctxt)
{
	emulate_2op_SrcV_nobyte(ctxt, "btc");
	return X86EMUL_CONTINUE;
}

static int em_bsf(struct x86_emulate_ctxt *ctxt)
{
	emulate_2op_SrcV_nobyte(ctxt, "bsf");
	return X86EMUL_CONTINUE;
}

static int em_bsr(struct x86_emulate_ctxt *ctxt)
{
	emulate_2op_SrcV_nobyte(ctxt, "bsr");
	return X86EMUL_CONTINUE;
}
static int em_cpuid(struct x86_emulate_ctxt *ctxt)
{
	u32 eax, ebx, ecx, edx;

	eax = ctxt->regs[VCPU_REGS_RAX];
	ecx = ctxt->regs[VCPU_REGS_RCX];
	ctxt->ops->get_cpuid(ctxt, &eax, &ebx, &ecx, &edx);
	ctxt->regs[VCPU_REGS_RAX] = eax;
	ctxt->regs[VCPU_REGS_RBX] = ebx;
	ctxt->regs[VCPU_REGS_RCX] = ecx;
	ctxt->regs[VCPU_REGS_RDX] = edx;
	return X86EMUL_CONTINUE;
}
static int em_lahf(struct x86_emulate_ctxt *ctxt)
{
	ctxt->regs[VCPU_REGS_RAX] &= ~0xff00UL;
	ctxt->regs[VCPU_REGS_RAX] |= (ctxt->eflags & 0xff) << 8;
	return X86EMUL_CONTINUE;
}
static bool valid_cr(int nr)
{
	switch (nr) {
	case 0:
	case 2 ... 4:
	case 8:
		return true;
	default:
		return false;
	}
}

static int check_cr_read(struct x86_emulate_ctxt *ctxt)
{
	if (!valid_cr(ctxt->modrm_reg))
		return emulate_ud(ctxt);

	return X86EMUL_CONTINUE;
}
static int check_cr_write(struct x86_emulate_ctxt *ctxt)
{
	u64 new_val = ctxt->src.val64;
	int cr = ctxt->modrm_reg;
	u64 efer = 0;

	static u64 cr_reserved_bits[] = {
		0xffffffff00000000ULL,
		0, 0, 0, /* CR3 checked later */
		CR4_RESERVED_BITS,
		0, 0, 0,
		CR8_RESERVED_BITS,
	};

	if (!valid_cr(cr))
		return emulate_ud(ctxt);

	if (new_val & cr_reserved_bits[cr])
		return emulate_gp(ctxt, 0);

	switch (cr) {
	case 0: {
		u64 cr4;
		if (((new_val & X86_CR0_PG) && !(new_val & X86_CR0_PE)) ||
		    ((new_val & X86_CR0_NW) && !(new_val & X86_CR0_CD)))
			return emulate_gp(ctxt, 0);

		cr4 = ctxt->ops->get_cr(ctxt, 4);
		ctxt->ops->get_msr(ctxt, MSR_EFER, &efer);

		if ((new_val & X86_CR0_PG) && (efer & EFER_LME) &&
		    !(cr4 & X86_CR4_PAE))
			return emulate_gp(ctxt, 0);

		break;
		}
	case 3: {
		u64 rsvd = 0;

		ctxt->ops->get_msr(ctxt, MSR_EFER, &efer);
		if (efer & EFER_LMA)
			rsvd = CR3_L_MODE_RESERVED_BITS;
		else if (ctxt->ops->get_cr(ctxt, 4) & X86_CR4_PAE)
			rsvd = CR3_PAE_RESERVED_BITS;
		else if (ctxt->ops->get_cr(ctxt, 0) & X86_CR0_PG)
			rsvd = CR3_NONPAE_RESERVED_BITS;

		if (new_val & rsvd)
			return emulate_gp(ctxt, 0);

		break;
		}
	case 4: {
		ctxt->ops->get_msr(ctxt, MSR_EFER, &efer);

		if ((efer & EFER_LMA) && !(new_val & X86_CR4_PAE))
			return emulate_gp(ctxt, 0);

		break;
		}
	}

	return X86EMUL_CONTINUE;
}
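/*
 * Example of the CR0 consistency check above: a guest "mov cr0, eax"
 * with PG = 1 but PE = 0, or with NW = 1 but CD = 0, raises #GP(0)
 * before the write ever reaches the control register, mirroring what
 * hardware does for these illegal combinations.
 */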
static int check_dr7_gd(struct x86_emulate_ctxt *ctxt)
{
	ulong dr7;

	ctxt->ops->get_dr(ctxt, 7, &dr7);

	/* Check if DR7.Global_Enable is set */
	return dr7 & (1 << 13);
}
static int check_dr_read(struct x86_emulate_ctxt *ctxt)
{
	int dr = ctxt->modrm_reg;
	u64 cr4;

	if (dr > 7)
		return emulate_ud(ctxt);

	cr4 = ctxt->ops->get_cr(ctxt, 4);
	if ((cr4 & X86_CR4_DE) && (dr == 4 || dr == 5))
		return emulate_ud(ctxt);

	if (check_dr7_gd(ctxt))
		return emulate_db(ctxt);

	return X86EMUL_CONTINUE;
}
static int check_dr_write(struct x86_emulate_ctxt *ctxt)
{
	u64 new_val = ctxt->src.val64;
	int dr = ctxt->modrm_reg;

	if ((dr == 6 || dr == 7) && (new_val & 0xffffffff00000000ULL))
		return emulate_gp(ctxt, 0);

	return check_dr_read(ctxt);
}
static int check_svme(struct x86_emulate_ctxt *ctxt)
{
	u64 efer;

	ctxt->ops->get_msr(ctxt, MSR_EFER, &efer);

	if (!(efer & EFER_SVME))
		return emulate_ud(ctxt);

	return X86EMUL_CONTINUE;
}
static int check_svme_pa(struct x86_emulate_ctxt *ctxt)
{
	u64 rax = ctxt->regs[VCPU_REGS_RAX];

	/* Valid physical address? */
	if (rax & 0xffff000000000000ULL)
		return emulate_gp(ctxt, 0);

	return check_svme(ctxt);
}
static int check_rdtsc(struct x86_emulate_ctxt *ctxt)
{
	u64 cr4 = ctxt->ops->get_cr(ctxt, 4);

	if (cr4 & X86_CR4_TSD && ctxt->ops->cpl(ctxt))
		return emulate_ud(ctxt);

	return X86EMUL_CONTINUE;
}
static int check_rdpmc(struct x86_emulate_ctxt *ctxt)
{
	u64 cr4 = ctxt->ops->get_cr(ctxt, 4);
	u64 rcx = ctxt->regs[VCPU_REGS_RCX];

	if ((!(cr4 & X86_CR4_PCE) && ctxt->ops->cpl(ctxt)) ||
	    (rcx > 3))
		return emulate_gp(ctxt, 0);

	return X86EMUL_CONTINUE;
}
static int check_perm_in(struct x86_emulate_ctxt *ctxt)
{
	ctxt->dst.bytes = min(ctxt->dst.bytes, 4u);
	if (!emulator_io_permited(ctxt, ctxt->src.val, ctxt->dst.bytes))
		return emulate_gp(ctxt, 0);

	return X86EMUL_CONTINUE;
}
static int check_perm_out(struct x86_emulate_ctxt *ctxt)
{
	ctxt->src.bytes = min(ctxt->src.bytes, 4u);
	if (!emulator_io_permited(ctxt, ctxt->dst.val, ctxt->src.bytes))
		return emulate_gp(ctxt, 0);

	return X86EMUL_CONTINUE;
}
#define D(_y) { .flags = (_y) }
#define DI(_y, _i) { .flags = (_y), .intercept = x86_intercept_##_i }
#define DIP(_y, _i, _p) { .flags = (_y), .intercept = x86_intercept_##_i, \
		      .check_perm = (_p) }
#define N    D(0)
#define EXT(_f, _e) { .flags = ((_f) | RMExt), .u.group = (_e) }
#define G(_f, _g) { .flags = ((_f) | Group | ModRM), .u.group = (_g) }
#define GD(_f, _g) { .flags = ((_f) | GroupDual | ModRM), .u.gdual = (_g) }
#define I(_f, _e) { .flags = (_f), .u.execute = (_e) }
#define II(_f, _e, _i) \
	{ .flags = (_f), .u.execute = (_e), .intercept = x86_intercept_##_i }
#define IIP(_f, _e, _i, _p) \
	{ .flags = (_f), .u.execute = (_e), .intercept = x86_intercept_##_i, \
	  .check_perm = (_p) }
#define GP(_f, _g) { .flags = ((_f) | Prefix), .u.gprefix = (_g) }

#define D2bv(_f)      D((_f) | ByteOp), D(_f)
#define D2bvIP(_f, _i, _p) DIP((_f) | ByteOp, _i, _p), DIP(_f, _i, _p)
#define I2bv(_f, _e)  I((_f) | ByteOp, _e), I(_f, _e)
#define I2bvIP(_f, _e, _i, _p) \
	IIP((_f) | ByteOp, _e, _i, _p), IIP(_f, _e, _i, _p)

#define I6ALU(_f, _e) I2bv((_f) | DstMem | SrcReg | ModRM, _e),		\
		I2bv(((_f) | DstReg | SrcMem | ModRM) & ~Lock, _e),	\
		I2bv(((_f) & ~Lock) | DstAcc | SrcImm, _e)
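/*
 * Example expansion: I2bv(DstMem | SrcReg | ModRM, em_test) emits two
 * adjacent table entries, I(ByteOp | DstMem | SrcReg | ModRM, em_test)
 * for the 8-bit form and I(DstMem | SrcReg | ModRM, em_test) for the
 * 16/32/64-bit form, which is why byte/word opcode pairs such as
 * 0x84/0x85 are covered by a single I2bv() line in the tables below.
 */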
static struct opcode group7_rm1[] = {
	DI(SrcNone | Priv, monitor),
	DI(SrcNone | Priv, mwait),
	N, N, N, N, N, N,
};
static struct opcode group7_rm3[] = {
	DIP(SrcNone | Prot | Priv, vmrun, check_svme_pa),
	II(SrcNone | Prot | VendorSpecific, em_vmmcall, vmmcall),
	DIP(SrcNone | Prot | Priv, vmload, check_svme_pa),
	DIP(SrcNone | Prot | Priv, vmsave, check_svme_pa),
	DIP(SrcNone | Prot | Priv, stgi, check_svme),
	DIP(SrcNone | Prot | Priv, clgi, check_svme),
	DIP(SrcNone | Prot | Priv, skinit, check_svme),
	DIP(SrcNone | Prot | Priv, invlpga, check_svme),
};
static struct opcode group7_rm7[] = {
	N,
	DIP(SrcNone, rdtscp, check_rdtsc),
	N, N, N, N, N, N,
};
static struct opcode group1[] = {
	I(Lock, em_add),
	I(Lock | PageTable, em_or),
	I(Lock, em_adc),
	I(Lock, em_sbb),
	I(Lock | PageTable, em_and),
	I(Lock, em_sub),
	I(Lock, em_xor),
	I(0, em_cmp),
};
static struct opcode group1A[] = {
	I(DstMem | SrcNone | Mov | Stack, em_pop), N, N, N, N, N, N, N,
};
static struct opcode group3[] = {
	I(DstMem | SrcImm, em_test),
	I(DstMem | SrcImm, em_test),
	I(DstMem | SrcNone | Lock, em_not),
	I(DstMem | SrcNone | Lock, em_neg),
	I(SrcMem, em_mul_ex),
	I(SrcMem, em_imul_ex),
	I(SrcMem, em_div_ex),
	I(SrcMem, em_idiv_ex),
};
static struct opcode group4[] = {
	I(ByteOp | DstMem | SrcNone | Lock, em_grp45),
	I(ByteOp | DstMem | SrcNone | Lock, em_grp45),
	N, N, N, N, N, N,
};
static struct opcode group5[] = {
	I(DstMem | SrcNone | Lock, em_grp45),
	I(DstMem | SrcNone | Lock, em_grp45),
	I(SrcMem | Stack, em_grp45),
	I(SrcMemFAddr | ImplicitOps | Stack, em_call_far),
	I(SrcMem | Stack, em_grp45),
	I(SrcMemFAddr | ImplicitOps, em_grp45),
	I(SrcMem | Stack, em_grp45), N,
};
static struct opcode group6[] = {
	DI(Prot, sldt),
	DI(Prot, str),
	DI(Prot | Priv, lldt),
	DI(Prot | Priv, ltr),
	N, N, N, N,
};
static struct group_dual group7 = { {
	II(Mov | DstMem | Priv, em_sgdt, sgdt),
	II(Mov | DstMem | Priv, em_sidt, sidt),
	II(SrcMem | Priv, em_lgdt, lgdt),
	II(SrcMem | Priv, em_lidt, lidt),
	II(SrcNone | DstMem | Mov, em_smsw, smsw), N,
	II(SrcMem16 | Mov | Priv, em_lmsw, lmsw),
	II(SrcMem | ByteOp | Priv | NoAccess, em_invlpg, invlpg),
}, {
	I(SrcNone | Priv | VendorSpecific, em_vmcall),
	EXT(0, group7_rm1),
	N, EXT(0, group7_rm3),
	II(SrcNone | DstMem | Mov, em_smsw, smsw), N,
	II(SrcMem16 | Mov | Priv, em_lmsw, lmsw),
	EXT(0, group7_rm7),
} };
static struct opcode group8[] = {
	N, N, N, N,
	I(DstMem | SrcImmByte, em_bt),
	I(DstMem | SrcImmByte | Lock | PageTable, em_bts),
	I(DstMem | SrcImmByte | Lock, em_btr),
	I(DstMem | SrcImmByte | Lock | PageTable, em_btc),
};
static struct group_dual group9 = { {
	N, I(DstMem64 | Lock | PageTable, em_cmpxchg8b), N, N, N, N, N, N,
}, {
	N, N, N, N, N, N, N, N,
} };
static struct opcode group11[] = {
	I(DstMem | SrcImm | Mov | PageTable, em_mov),
	X7(D(Undefined)),
};
static struct gprefix pfx_0f_6f_0f_7f = {
	I(Mmx, em_mov), I(Sse | Aligned, em_mov), N, I(Sse | Unaligned, em_mov),
};
static struct gprefix pfx_vmovntpx = {
	I(0, em_mov), N, N, N,
};
static struct opcode opcode_table[256] = {
	/* 0x00 - 0x07 */
	I6ALU(Lock, em_add),
	I(ImplicitOps | Stack | No64 | Src2ES, em_push_sreg),
	I(ImplicitOps | Stack | No64 | Src2ES, em_pop_sreg),
	/* 0x08 - 0x0F */
	I6ALU(Lock | PageTable, em_or),
	I(ImplicitOps | Stack | No64 | Src2CS, em_push_sreg),
	N,
	/* 0x10 - 0x17 */
	I6ALU(Lock, em_adc),
	I(ImplicitOps | Stack | No64 | Src2SS, em_push_sreg),
	I(ImplicitOps | Stack | No64 | Src2SS, em_pop_sreg),
	/* 0x18 - 0x1F */
	I6ALU(Lock, em_sbb),
	I(ImplicitOps | Stack | No64 | Src2DS, em_push_sreg),
	I(ImplicitOps | Stack | No64 | Src2DS, em_pop_sreg),
	/* 0x20 - 0x27 */
	I6ALU(Lock | PageTable, em_and), N, N,
	/* 0x28 - 0x2F */
	I6ALU(Lock, em_sub), N, I(ByteOp | DstAcc | No64, em_das),
	/* 0x30 - 0x37 */
	I6ALU(Lock, em_xor), N, N,
	/* 0x38 - 0x3F */
	I6ALU(0, em_cmp), N, N,
	/* 0x40 - 0x4F */
	X16(D(DstReg)),
	/* 0x50 - 0x57 */
	X8(I(SrcReg | Stack, em_push)),
	/* 0x58 - 0x5F */
	X8(I(DstReg | Stack, em_pop)),
	/* 0x60 - 0x67 */
	I(ImplicitOps | Stack | No64, em_pusha),
	I(ImplicitOps | Stack | No64, em_popa),
	N, D(DstReg | SrcMem32 | ModRM | Mov) /* movsxd (x86/64) */ ,
	N, N, N, N,
	/* 0x68 - 0x6F */
	I(SrcImm | Mov | Stack, em_push),
	I(DstReg | SrcMem | ModRM | Src2Imm, em_imul_3op),
	I(SrcImmByte | Mov | Stack, em_push),
	I(DstReg | SrcMem | ModRM | Src2ImmByte, em_imul_3op),
	I2bvIP(DstDI | SrcDX | Mov | String, em_in, ins, check_perm_in), /* insb, insw/insd */
	I2bvIP(SrcSI | DstDX | String, em_out, outs, check_perm_out), /* outsb, outsw/outsd */
	/* 0x70 - 0x7F */
	X16(D(SrcImmByte)),
	/* 0x80 - 0x87 */
	G(ByteOp | DstMem | SrcImm, group1),
	G(DstMem | SrcImm, group1),
	G(ByteOp | DstMem | SrcImm | No64, group1),
	G(DstMem | SrcImmByte, group1),
	I2bv(DstMem | SrcReg | ModRM, em_test),
	I2bv(DstMem | SrcReg | ModRM | Lock | PageTable, em_xchg),
	/* 0x88 - 0x8F */
	I2bv(DstMem | SrcReg | ModRM | Mov | PageTable, em_mov),
	I2bv(DstReg | SrcMem | ModRM | Mov, em_mov),
	I(DstMem | SrcNone | ModRM | Mov | PageTable, em_mov_rm_sreg),
	D(ModRM | SrcMem | NoAccess | DstReg),
	I(ImplicitOps | SrcMem16 | ModRM, em_mov_sreg_rm),
	G(0, group1A),
	/* 0x90 - 0x97 */
	DI(SrcAcc | DstReg, pause), X7(D(SrcAcc | DstReg)),
	/* 0x98 - 0x9F */
	D(DstAcc | SrcNone), I(ImplicitOps | SrcAcc, em_cwd),
	I(SrcImmFAddr | No64, em_call_far), N,
	II(ImplicitOps | Stack, em_pushf, pushf),
	II(ImplicitOps | Stack, em_popf, popf), N, I(ImplicitOps, em_lahf),
	/* 0xA0 - 0xA7 */
	I2bv(DstAcc | SrcMem | Mov | MemAbs, em_mov),
	I2bv(DstMem | SrcAcc | Mov | MemAbs | PageTable, em_mov),
	I2bv(SrcSI | DstDI | Mov | String, em_mov),
	I2bv(SrcSI | DstDI | String, em_cmp),
	/* 0xA8 - 0xAF */
	I2bv(DstAcc | SrcImm, em_test),
	I2bv(SrcAcc | DstDI | Mov | String, em_mov),
	I2bv(SrcSI | DstAcc | Mov | String, em_mov),
	I2bv(SrcAcc | DstDI | String, em_cmp),
	/* 0xB0 - 0xB7 */
	X8(I(ByteOp | DstReg | SrcImm | Mov, em_mov)),
	/* 0xB8 - 0xBF */
	X8(I(DstReg | SrcImm | Mov, em_mov)),
	/* 0xC0 - 0xC7 */
	D2bv(DstMem | SrcImmByte | ModRM),
	I(ImplicitOps | Stack | SrcImmU16, em_ret_near_imm),
	I(ImplicitOps | Stack, em_ret),
	I(DstReg | SrcMemFAddr | ModRM | No64 | Src2ES, em_lseg),
	I(DstReg | SrcMemFAddr | ModRM | No64 | Src2DS, em_lseg),
	G(ByteOp, group11), G(0, group11),
	/* 0xC8 - 0xCF */
	N, I(Stack, em_leave), N, I(ImplicitOps | Stack, em_ret_far),
	D(ImplicitOps), DI(SrcImmByte, intn),
	D(ImplicitOps | No64), II(ImplicitOps, em_iret, iret),
	/* 0xD0 - 0xD7 */
	D2bv(DstMem | SrcOne | ModRM), D2bv(DstMem | ModRM),
	N, N, N, N,
	/* 0xD8 - 0xDF */
	N, N, N, N, N, N, N, N,
	/* 0xE0 - 0xE7 */
	X3(I(SrcImmByte, em_loop)),
	I(SrcImmByte, em_jcxz),
	I2bvIP(SrcImmUByte | DstAcc, em_in, in, check_perm_in),
	I2bvIP(SrcAcc | DstImmUByte, em_out, out, check_perm_out),
	/* 0xE8 - 0xEF */
	I(SrcImm | Stack, em_call), D(SrcImm | ImplicitOps),
	I(SrcImmFAddr | No64, em_jmp_far), D(SrcImmByte | ImplicitOps),
	I2bvIP(SrcDX | DstAcc, em_in, in, check_perm_in),
	I2bvIP(SrcAcc | DstDX, em_out, out, check_perm_out),
	/* 0xF0 - 0xF7 */
	N, DI(ImplicitOps, icebp), N, N,
	DI(ImplicitOps | Priv, hlt), D(ImplicitOps),
	G(ByteOp, group3), G(0, group3),
	/* 0xF8 - 0xFF */
	D(ImplicitOps), D(ImplicitOps),
	I(ImplicitOps, em_cli), I(ImplicitOps, em_sti),
	D(ImplicitOps), D(ImplicitOps), G(0, group4), G(0, group5),
};
static struct opcode twobyte_table[256] = {
	/* 0x00 - 0x0F */
	G(0, group6), GD(0, &group7), N, N,
	N, I(ImplicitOps | VendorSpecific, em_syscall),
	II(ImplicitOps | Priv, em_clts, clts), N,
	DI(ImplicitOps | Priv, invd), DI(ImplicitOps | Priv, wbinvd), N, N,
	N, D(ImplicitOps | ModRM), N, N,
	/* 0x10 - 0x1F */
	N, N, N, N, N, N, N, N, D(ImplicitOps | ModRM), N, N, N, N, N, N, N,
	/* 0x20 - 0x2F */
	DIP(ModRM | DstMem | Priv | Op3264, cr_read, check_cr_read),
	DIP(ModRM | DstMem | Priv | Op3264, dr_read, check_dr_read),
	IIP(ModRM | SrcMem | Priv | Op3264, em_cr_write, cr_write, check_cr_write),
	IIP(ModRM | SrcMem | Priv | Op3264, em_dr_write, dr_write, check_dr_write),
	N, N, N, N,
	N, N, N, GP(ModRM | DstMem | SrcReg | Sse | Mov | Aligned, &pfx_vmovntpx),
	N, N, N, N,
	/* 0x30 - 0x3F */
	II(ImplicitOps | Priv, em_wrmsr, wrmsr),
	IIP(ImplicitOps, em_rdtsc, rdtsc, check_rdtsc),
	II(ImplicitOps | Priv, em_rdmsr, rdmsr),
	IIP(ImplicitOps, em_rdpmc, rdpmc, check_rdpmc),
	I(ImplicitOps | VendorSpecific, em_sysenter),
	I(ImplicitOps | Priv | VendorSpecific, em_sysexit),
	N, N,
	N, N, N, N, N, N, N, N,
	/* 0x40 - 0x4F */
	X16(D(DstReg | SrcMem | ModRM | Mov)),
	/* 0x50 - 0x5F */
	N, N, N, N, N, N, N, N, N, N, N, N, N, N, N, N,
	/* 0x60 - 0x6F */
	N, N, N, N,
	N, N, N, N,
	N, N, N, N,
	N, N, N, GP(SrcMem | DstReg | ModRM | Mov, &pfx_0f_6f_0f_7f),
	/* 0x70 - 0x7F */
	N, N, N, N,
	N, N, N, N,
	N, N, N, N,
	N, N, N, GP(SrcReg | DstMem | ModRM | Mov, &pfx_0f_6f_0f_7f),
	/* 0x80 - 0x8F */
	X16(D(SrcImm)),
	/* 0x90 - 0x9F */
	X16(D(ByteOp | DstMem | SrcNone | ModRM | Mov)),
	/* 0xA0 - 0xA7 */
	I(Stack | Src2FS, em_push_sreg), I(Stack | Src2FS, em_pop_sreg),
	II(ImplicitOps, em_cpuid, cpuid), I(DstMem | SrcReg | ModRM | BitOp, em_bt),
	D(DstMem | SrcReg | Src2ImmByte | ModRM),
	D(DstMem | SrcReg | Src2CL | ModRM), N, N,
	/* 0xA8 - 0xAF */
	I(Stack | Src2GS, em_push_sreg), I(Stack | Src2GS, em_pop_sreg),
	DI(ImplicitOps, rsm),
	I(DstMem | SrcReg | ModRM | BitOp | Lock | PageTable, em_bts),
	D(DstMem | SrcReg | Src2ImmByte | ModRM),
	D(DstMem | SrcReg | Src2CL | ModRM),
	D(ModRM), I(DstReg | SrcMem | ModRM, em_imul),
	/* 0xB0 - 0xB7 */
	I2bv(DstMem | SrcReg | ModRM | Lock | PageTable, em_cmpxchg),
	I(DstReg | SrcMemFAddr | ModRM | Src2SS, em_lseg),
	I(DstMem | SrcReg | ModRM | BitOp | Lock, em_btr),
	I(DstReg | SrcMemFAddr | ModRM | Src2FS, em_lseg),
	I(DstReg | SrcMemFAddr | ModRM | Src2GS, em_lseg),
	D(DstReg | SrcMem8 | ModRM | Mov), D(DstReg | SrcMem16 | ModRM | Mov),
	/* 0xB8 - 0xBF */
	N, N,
	G(BitOp, group8),
	I(DstMem | SrcReg | ModRM | BitOp | Lock | PageTable, em_btc),
	I(DstReg | SrcMem | ModRM, em_bsf), I(DstReg | SrcMem | ModRM, em_bsr),
	D(DstReg | SrcMem8 | ModRM | Mov), D(DstReg | SrcMem16 | ModRM | Mov),
	/* 0xC0 - 0xC7 */
	D2bv(DstMem | SrcReg | ModRM | Lock),
	N, D(DstMem | SrcReg | ModRM | Mov),
	N, N, N, GD(0, &group9),
	/* 0xC8 - 0xCF */
	N, N, N, N, N, N, N, N,
	/* 0xD0 - 0xDF */
	N, N, N, N, N, N, N, N, N, N, N, N, N, N, N, N,
	/* 0xE0 - 0xEF */
	N, N, N, N, N, N, N, N, N, N, N, N, N, N, N, N,
	/* 0xF0 - 0xFF */
	N, N, N, N, N, N, N, N, N, N, N, N, N, N, N, N
};

#undef D
#undef N
#undef G
#undef GD
#undef I
#undef GP
#undef EXT

#undef D2bv
#undef D2bvIP
#undef I2bv
#undef I2bvIP
#undef I6ALU
static unsigned imm_size(struct x86_emulate_ctxt *ctxt)
{
	unsigned size;

	size = (ctxt->d & ByteOp) ? 1 : ctxt->op_bytes;
	if (size == 8)
		size = 4;
	return size;
}
static int decode_imm(struct x86_emulate_ctxt *ctxt, struct operand *op,
		      unsigned size, bool sign_extension)
{
	int rc = X86EMUL_CONTINUE;

	op->type = OP_IMM;
	op->bytes = size;
	op->addr.mem.ea = ctxt->_eip;
	/* NB. Immediates are sign-extended as necessary. */
	switch (op->bytes) {
	case 1:
		op->val = insn_fetch(s8, ctxt);
		break;
	case 2:
		op->val = insn_fetch(s16, ctxt);
		break;
	case 4:
		op->val = insn_fetch(s32, ctxt);
		break;
	}
	if (!sign_extension) {
		switch (op->bytes) {
		case 1:
			op->val &= 0xff;
			break;
		case 2:
			op->val &= 0xffff;
			break;
		case 4:
			op->val &= 0xffffffff;
			break;
		}
	}
done:
	return rc;
}
static int decode_operand(struct x86_emulate_ctxt *ctxt, struct operand *op,
			  unsigned d)
{
	int rc = X86EMUL_CONTINUE;

	switch (d) {
	case OpReg:
		decode_register_operand(ctxt, op);
		break;
	case OpImmUByte:
		rc = decode_imm(ctxt, op, 1, false);
		break;
	case OpMem:
		ctxt->memop.bytes = (ctxt->d & ByteOp) ? 1 : ctxt->op_bytes;
	mem_common:
		*op = ctxt->memop;
		ctxt->memopp = op;
		if ((ctxt->d & BitOp) && op == &ctxt->dst)
			fetch_bit_operand(ctxt);
		op->orig_val = op->val;
		break;
	case OpMem64:
		ctxt->memop.bytes = 8;
		goto mem_common;
	case OpAcc:
		op->type = OP_REG;
		op->bytes = (ctxt->d & ByteOp) ? 1 : ctxt->op_bytes;
		op->addr.reg = &ctxt->regs[VCPU_REGS_RAX];
		fetch_register_operand(op);
		op->orig_val = op->val;
		break;
	case OpDI:
		op->type = OP_MEM;
		op->bytes = (ctxt->d & ByteOp) ? 1 : ctxt->op_bytes;
		op->addr.mem.ea =
			register_address(ctxt, ctxt->regs[VCPU_REGS_RDI]);
		op->addr.mem.seg = VCPU_SREG_ES;
		op->val = 0;
		break;
	case OpDX:
		op->type = OP_REG;
		op->bytes = 2;
		op->addr.reg = &ctxt->regs[VCPU_REGS_RDX];
		fetch_register_operand(op);
		break;
	case OpCL:
		op->bytes = 1;
		op->val = ctxt->regs[VCPU_REGS_RCX] & 0xff;
		break;
	case OpImmByte:
		rc = decode_imm(ctxt, op, 1, true);
		break;
	case OpOne:
		op->bytes = 1;
		op->val = 1;
		break;
	case OpImm:
		rc = decode_imm(ctxt, op, imm_size(ctxt), true);
		break;
	case OpMem8:
		ctxt->memop.bytes = 1;
		goto mem_common;
	case OpMem16:
		ctxt->memop.bytes = 2;
		goto mem_common;
	case OpMem32:
		ctxt->memop.bytes = 4;
		goto mem_common;
	case OpImmU16:
		rc = decode_imm(ctxt, op, 2, false);
		break;
	case OpImmU:
		rc = decode_imm(ctxt, op, imm_size(ctxt), false);
		break;
	case OpSI:
		op->type = OP_MEM;
		op->bytes = (ctxt->d & ByteOp) ? 1 : ctxt->op_bytes;
		op->addr.mem.ea =
			register_address(ctxt, ctxt->regs[VCPU_REGS_RSI]);
		op->addr.mem.seg = seg_override(ctxt);
		op->val = 0;
		break;
	case OpImmFAddr:
		op->type = OP_IMM;
		op->addr.mem.ea = ctxt->_eip;
		op->bytes = ctxt->op_bytes + 2;
		insn_fetch_arr(op->valptr, op->bytes, ctxt);
		break;
	case OpMemFAddr:
		ctxt->memop.bytes = ctxt->op_bytes + 2;
		goto mem_common;
	case OpES:
		op->val = VCPU_SREG_ES;
		break;
	case OpCS:
		op->val = VCPU_SREG_CS;
		break;
	case OpSS:
		op->val = VCPU_SREG_SS;
		break;
	case OpDS:
		op->val = VCPU_SREG_DS;
		break;
	case OpFS:
		op->val = VCPU_SREG_FS;
		break;
	case OpGS:
		op->val = VCPU_SREG_GS;
		break;
	case OpImplicit:
		/* Special instructions do their own operand decoding. */
	default:
		op->type = OP_NONE; /* Disable writeback. */
		break;
	}

done:
	return rc;
}
int x86_decode_insn(struct x86_emulate_ctxt *ctxt, void *insn, int insn_len)
{
	int rc = X86EMUL_CONTINUE;
	int mode = ctxt->mode;
	int def_op_bytes, def_ad_bytes, goffset, simd_prefix;
	bool op_prefix = false;
	struct opcode opcode;

	ctxt->memop.type = OP_NONE;
	ctxt->memopp = NULL;
	ctxt->_eip = ctxt->eip;
	ctxt->fetch.start = ctxt->_eip;
	ctxt->fetch.end = ctxt->fetch.start + insn_len;
	if (insn_len > 0)
		memcpy(ctxt->fetch.data, insn, insn_len);

	switch (mode) {
	case X86EMUL_MODE_REAL:
	case X86EMUL_MODE_VM86:
	case X86EMUL_MODE_PROT16:
		def_op_bytes = def_ad_bytes = 2;
		break;
	case X86EMUL_MODE_PROT32:
		def_op_bytes = def_ad_bytes = 4;
		break;
#ifdef CONFIG_X86_64
	case X86EMUL_MODE_PROT64:
		def_op_bytes = 4;
		def_ad_bytes = 8;
		break;
#endif
	default:
		return EMULATION_FAILED;
	}

	ctxt->op_bytes = def_op_bytes;
	ctxt->ad_bytes = def_ad_bytes;

	/* Legacy prefixes. */
	for (;;) {
		switch (ctxt->b = insn_fetch(u8, ctxt)) {
		case 0x66:	/* operand-size override */
			op_prefix = true;
			/* switch between 2/4 bytes */
			ctxt->op_bytes = def_op_bytes ^ 6;
			break;
		case 0x67:	/* address-size override */
			if (mode == X86EMUL_MODE_PROT64)
				/* switch between 4/8 bytes */
				ctxt->ad_bytes = def_ad_bytes ^ 12;
			else
				/* switch between 2/4 bytes */
				ctxt->ad_bytes = def_ad_bytes ^ 6;
			break;
		case 0x26:	/* ES override */
		case 0x2e:	/* CS override */
		case 0x36:	/* SS override */
		case 0x3e:	/* DS override */
			set_seg_override(ctxt, (ctxt->b >> 3) & 3);
			break;
		case 0x64:	/* FS override */
		case 0x65:	/* GS override */
			set_seg_override(ctxt, ctxt->b & 7);
			break;
		case 0x40 ... 0x4f: /* REX */
			if (mode != X86EMUL_MODE_PROT64)
				goto done_prefixes;
			ctxt->rex_prefix = ctxt->b;
			continue;
		case 0xf0:	/* LOCK */
			ctxt->lock_prefix = 1;
			break;
		case 0xf2:	/* REPNE/REPNZ */
		case 0xf3:	/* REP/REPE/REPZ */
			ctxt->rep_prefix = ctxt->b;
			break;
		default:
			goto done_prefixes;
		}

		/* Any legacy prefix after a REX prefix nullifies its effect. */
		ctxt->rex_prefix = 0;
	}

done_prefixes:

	/* REX prefix. */
	if (ctxt->rex_prefix & 8)
		ctxt->op_bytes = 8;	/* REX.W */

	/* Opcode byte(s). */
	opcode = opcode_table[ctxt->b];
	/* Two-byte opcode? */
	if (ctxt->b == 0x0f) {
		ctxt->twobyte = 1;
		ctxt->b = insn_fetch(u8, ctxt);
		opcode = twobyte_table[ctxt->b];
	}
	ctxt->d = opcode.flags;

	if (ctxt->d & ModRM)
		ctxt->modrm = insn_fetch(u8, ctxt);

	while (ctxt->d & GroupMask) {
		switch (ctxt->d & GroupMask) {
		case Group:
			goffset = (ctxt->modrm >> 3) & 7;
			opcode = opcode.u.group[goffset];
			break;
		case GroupDual:
			goffset = (ctxt->modrm >> 3) & 7;
			if ((ctxt->modrm >> 6) == 3)
				opcode = opcode.u.gdual->mod3[goffset];
			else
				opcode = opcode.u.gdual->mod012[goffset];
			break;
		case RMExt:
			goffset = ctxt->modrm & 7;
			opcode = opcode.u.group[goffset];
			break;
		case Prefix:
			if (ctxt->rep_prefix && op_prefix)
				return EMULATION_FAILED;
			simd_prefix = op_prefix ? 0x66 : ctxt->rep_prefix;
			switch (simd_prefix) {
			case 0x00: opcode = opcode.u.gprefix->pfx_no; break;
			case 0x66: opcode = opcode.u.gprefix->pfx_66; break;
			case 0xf2: opcode = opcode.u.gprefix->pfx_f2; break;
			case 0xf3: opcode = opcode.u.gprefix->pfx_f3; break;
			}
			break;
		default:
			return EMULATION_FAILED;
		}

		ctxt->d &= ~(u64)GroupMask;
		ctxt->d |= opcode.flags;
	}

	ctxt->execute = opcode.u.execute;
	ctxt->check_perm = opcode.check_perm;
	ctxt->intercept = opcode.intercept;

	/* Unrecognised? */
	if (ctxt->d == 0 || (ctxt->d & Undefined))
		return EMULATION_FAILED;

	if (!(ctxt->d & VendorSpecific) && ctxt->only_vendor_specific_insn)
		return EMULATION_FAILED;

	if (mode == X86EMUL_MODE_PROT64 && (ctxt->d & Stack))
		ctxt->op_bytes = 8;

	if (ctxt->d & Op3264) {
		if (mode == X86EMUL_MODE_PROT64)
			ctxt->op_bytes = 8;
		else
			ctxt->op_bytes = 4;
	}

	if (ctxt->d & Sse)
		ctxt->op_bytes = 16;
	else if (ctxt->d & Mmx)
		ctxt->op_bytes = 8;

	/* ModRM and SIB bytes. */
	if (ctxt->d & ModRM) {
		rc = decode_modrm(ctxt, &ctxt->memop);
		if (!ctxt->has_seg_override)
			set_seg_override(ctxt, ctxt->modrm_seg);
	} else if (ctxt->d & MemAbs)
		rc = decode_abs(ctxt, &ctxt->memop);
	if (rc != X86EMUL_CONTINUE)
		goto done;

	if (!ctxt->has_seg_override)
		set_seg_override(ctxt, VCPU_SREG_DS);

	ctxt->memop.addr.mem.seg = seg_override(ctxt);

	if (ctxt->memop.type == OP_MEM && ctxt->ad_bytes != 8)
		ctxt->memop.addr.mem.ea = (u32)ctxt->memop.addr.mem.ea;

	/*
	 * Decode and fetch the source operand: register, memory
	 * or immediate.
	 */
	rc = decode_operand(ctxt, &ctxt->src, (ctxt->d >> SrcShift) & OpMask);
	if (rc != X86EMUL_CONTINUE)
		goto done;

	/*
	 * Decode and fetch the second source operand: register, memory
	 * or immediate.
	 */
	rc = decode_operand(ctxt, &ctxt->src2, (ctxt->d >> Src2Shift) & OpMask);
	if (rc != X86EMUL_CONTINUE)
		goto done;

	/* Decode and fetch the destination operand: register or memory. */
	rc = decode_operand(ctxt, &ctxt->dst, (ctxt->d >> DstShift) & OpMask);

done:
	if (ctxt->memopp && ctxt->memopp->type == OP_MEM && ctxt->rip_relative)
		ctxt->memopp->addr.mem.ea += ctxt->_eip;

	return (rc != X86EMUL_CONTINUE) ? EMULATION_FAILED : EMULATION_OK;
}
bool x86_page_table_writing_insn(struct x86_emulate_ctxt *ctxt)
{
	return ctxt->d & PageTable;
}
static bool string_insn_completed(struct x86_emulate_ctxt *ctxt)
{
	/* The second termination condition only applies for REPE
	 * and REPNE. Test if the repeat string operation prefix is
	 * REPE/REPZ or REPNE/REPNZ and if it's the case it tests the
	 * corresponding termination condition according to:
	 *	- if REPE/REPZ and ZF = 0 then done
	 *	- if REPNE/REPNZ and ZF = 1 then done
	 */
	if (((ctxt->b == 0xa6) || (ctxt->b == 0xa7) ||
	     (ctxt->b == 0xae) || (ctxt->b == 0xaf))
	    && (((ctxt->rep_prefix == REPE_PREFIX) &&
		 ((ctxt->eflags & EFLG_ZF) == 0))
		|| ((ctxt->rep_prefix == REPNE_PREFIX) &&
		    ((ctxt->eflags & EFLG_ZF) == EFLG_ZF))))
		return true;

	return false;
}
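/*
 * Example: "repe cmpsb" (0xf3 0xa6) stops either when rCX reaches zero
 * (checked before each iteration in x86_emulate_insn()) or when the
 * comparison clears ZF, which is the REPE_PREFIX case above. A plain
 * "rep movsb" never matches the opcode list here, so only the rCX test
 * applies to it.
 */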
static int flush_pending_x87_faults(struct x86_emulate_ctxt *ctxt)
{
	bool fault = false;

	ctxt->ops->get_fpu(ctxt);
	asm volatile("1: fwait \n\t"
		     "2: \n\t"
		     ".pushsection .fixup,\"ax\" \n\t"
		     "3: \n\t"
		     "movb $1, %[fault] \n\t"
		     "jmp 2b \n\t"
		     ".popsection \n\t"
		     _ASM_EXTABLE(1b, 3b)
		     : [fault]"+qm"(fault));
	ctxt->ops->put_fpu(ctxt);

	if (unlikely(fault))
		return emulate_exception(ctxt, MF_VECTOR, 0, false);

	return X86EMUL_CONTINUE;
}
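/*
 * The fwait above forces any pending x87 exception to surface while the
 * fixup section turns the resulting trap into fault = true instead of
 * killing the host; the emulator then reflects it to the guest as #MF
 * before touching MMX state.
 */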
static void fetch_possible_mmx_operand(struct x86_emulate_ctxt *ctxt,
				       struct operand *op)
{
	if (op->type == OP_MM)
		read_mmx_reg(ctxt, &op->mm_val, op->addr.mm);
}
int x86_emulate_insn(struct x86_emulate_ctxt *ctxt)
{
	struct x86_emulate_ops *ops = ctxt->ops;
	int rc = X86EMUL_CONTINUE;
	int saved_dst_type = ctxt->dst.type;

	ctxt->mem_read.pos = 0;

	if (ctxt->mode == X86EMUL_MODE_PROT64 && (ctxt->d & No64)) {
		rc = emulate_ud(ctxt);
		goto done;
	}

	/* LOCK prefix is allowed only with some instructions */
	if (ctxt->lock_prefix && (!(ctxt->d & Lock) || ctxt->dst.type != OP_MEM)) {
		rc = emulate_ud(ctxt);
		goto done;
	}

	if ((ctxt->d & SrcMask) == SrcMemFAddr && ctxt->src.type != OP_MEM) {
		rc = emulate_ud(ctxt);
		goto done;
	}

	if (((ctxt->d & (Sse|Mmx)) && ((ops->get_cr(ctxt, 0) & X86_CR0_EM)))
	    || ((ctxt->d & Sse) && !(ops->get_cr(ctxt, 4) & X86_CR4_OSFXSR))) {
		rc = emulate_ud(ctxt);
		goto done;
	}

	if ((ctxt->d & (Sse|Mmx)) && (ops->get_cr(ctxt, 0) & X86_CR0_TS)) {
		rc = emulate_nm(ctxt);
		goto done;
	}

	if (ctxt->d & Mmx) {
		rc = flush_pending_x87_faults(ctxt);
		if (rc != X86EMUL_CONTINUE)
			goto done;
		/*
		 * Now that we know the fpu is exception safe, we can fetch
		 * operands from it.
		 */
		fetch_possible_mmx_operand(ctxt, &ctxt->src);
		fetch_possible_mmx_operand(ctxt, &ctxt->src2);
		if (!(ctxt->d & Mov))
			fetch_possible_mmx_operand(ctxt, &ctxt->dst);
	}

	if (unlikely(ctxt->guest_mode) && ctxt->intercept) {
		rc = emulator_check_intercept(ctxt, ctxt->intercept,
					      X86_ICPT_PRE_EXCEPT);
		if (rc != X86EMUL_CONTINUE)
			goto done;
	}

	/* Privileged instruction can be executed only in CPL=0 */
	if ((ctxt->d & Priv) && ops->cpl(ctxt)) {
		rc = emulate_gp(ctxt, 0);
		goto done;
	}

	/* Instruction can only be executed in protected mode */
	if ((ctxt->d & Prot) && !(ctxt->mode & X86EMUL_MODE_PROT)) {
		rc = emulate_ud(ctxt);
		goto done;
	}

	/* Do instruction specific permission checks */
	if (ctxt->check_perm) {
		rc = ctxt->check_perm(ctxt);
		if (rc != X86EMUL_CONTINUE)
			goto done;
	}

	if (unlikely(ctxt->guest_mode) && ctxt->intercept) {
		rc = emulator_check_intercept(ctxt, ctxt->intercept,
					      X86_ICPT_POST_EXCEPT);
		if (rc != X86EMUL_CONTINUE)
			goto done;
	}

	if (ctxt->rep_prefix && (ctxt->d & String)) {
		/* All REP prefixes have the same first termination condition */
		if (address_mask(ctxt, ctxt->regs[VCPU_REGS_RCX]) == 0) {
			ctxt->eip = ctxt->_eip;
			goto done;
		}
	}

	if ((ctxt->src.type == OP_MEM) && !(ctxt->d & NoAccess)) {
		rc = segmented_read(ctxt, ctxt->src.addr.mem,
				    ctxt->src.valptr, ctxt->src.bytes);
		if (rc != X86EMUL_CONTINUE)
			goto done;
		ctxt->src.orig_val64 = ctxt->src.val64;
	}

	if (ctxt->src2.type == OP_MEM) {
		rc = segmented_read(ctxt, ctxt->src2.addr.mem,
				    &ctxt->src2.val, ctxt->src2.bytes);
		if (rc != X86EMUL_CONTINUE)
			goto done;
	}

	if ((ctxt->d & DstMask) == ImplicitOps)
		goto special_insn;

	if ((ctxt->dst.type == OP_MEM) && !(ctxt->d & Mov)) {
		/* optimisation - avoid slow emulated read if Mov */
		rc = segmented_read(ctxt, ctxt->dst.addr.mem,
				    &ctxt->dst.val, ctxt->dst.bytes);
		if (rc != X86EMUL_CONTINUE)
			goto done;
	}
	ctxt->dst.orig_val = ctxt->dst.val;

special_insn:

	if (unlikely(ctxt->guest_mode) && ctxt->intercept) {
		rc = emulator_check_intercept(ctxt, ctxt->intercept,
					      X86_ICPT_POST_MEMACCESS);
		if (rc != X86EMUL_CONTINUE)
			goto done;
	}

	if (ctxt->execute) {
		rc = ctxt->execute(ctxt);
		if (rc != X86EMUL_CONTINUE)
			goto done;
		goto writeback;
	}

	if (ctxt->twobyte)
		goto twobyte_insn;

	switch (ctxt->b) {
	case 0x40 ... 0x47: /* inc r16/r32 */
		emulate_1op(ctxt, "inc");
		break;
	case 0x48 ... 0x4f: /* dec r16/r32 */
		emulate_1op(ctxt, "dec");
		break;
	case 0x63:		/* movsxd */
		if (ctxt->mode != X86EMUL_MODE_PROT64)
			goto cannot_emulate;
		ctxt->dst.val = (s32) ctxt->src.val;
		break;
	case 0x70 ... 0x7f: /* jcc (short) */
		if (test_cc(ctxt->b, ctxt->eflags))
			jmp_rel(ctxt, ctxt->src.val);
		break;
	case 0x8d: /* lea r16/r32, m */
		ctxt->dst.val = ctxt->src.addr.mem.ea;
		break;
	case 0x90 ... 0x97: /* nop / xchg reg, rax */
		if (ctxt->dst.addr.reg == &ctxt->regs[VCPU_REGS_RAX])
			break;
		rc = em_xchg(ctxt);
		break;
	case 0x98: /* cbw/cwde/cdqe */
		switch (ctxt->op_bytes) {
		case 2: ctxt->dst.val = (s8)ctxt->dst.val; break;
		case 4: ctxt->dst.val = (s16)ctxt->dst.val; break;
		case 8: ctxt->dst.val = (s32)ctxt->dst.val; break;
		}
		break;
	case 0xcc:		/* int3 */
		rc = emulate_int(ctxt, 3);
		break;
	case 0xcd:		/* int n */
		rc = emulate_int(ctxt, ctxt->src.val);
		break;
	case 0xce:		/* into */
		if (ctxt->eflags & EFLG_OF)
			rc = emulate_int(ctxt, 4);
		break;
	case 0xd0 ... 0xd1:	/* Grp2 */
		rc = em_grp2(ctxt);
		break;
	case 0xd2 ... 0xd3:	/* Grp2 */
		ctxt->src.val = ctxt->regs[VCPU_REGS_RCX];
		rc = em_grp2(ctxt);
		break;
	case 0xe9: /* jmp rel */
	case 0xeb: /* jmp rel short */
		jmp_rel(ctxt, ctxt->src.val);
		ctxt->dst.type = OP_NONE; /* Disable writeback. */
		break;
	case 0xf4:              /* hlt */
		ctxt->ops->halt(ctxt);
		break;
	case 0xf5:	/* cmc */
		/* complement carry flag from eflags reg */
		ctxt->eflags ^= EFLG_CF;
		break;
	case 0xf8: /* clc */
		ctxt->eflags &= ~EFLG_CF;
		break;
	case 0xf9: /* stc */
		ctxt->eflags |= EFLG_CF;
		break;
	case 0xfc: /* cld */
		ctxt->eflags &= ~EFLG_DF;
		break;
	case 0xfd: /* std */
		ctxt->eflags |= EFLG_DF;
		break;
	default:
		goto cannot_emulate;
	}

	if (rc != X86EMUL_CONTINUE)
		goto done;

writeback:
	rc = writeback(ctxt);
	if (rc != X86EMUL_CONTINUE)
		goto done;

	/*
	 * restore dst type in case the decoding will be reused
	 * (happens for string instructions)
	 */
	ctxt->dst.type = saved_dst_type;

	if ((ctxt->d & SrcMask) == SrcSI)
		string_addr_inc(ctxt, seg_override(ctxt),
				VCPU_REGS_RSI, &ctxt->src);

	if ((ctxt->d & DstMask) == DstDI)
		string_addr_inc(ctxt, VCPU_SREG_ES, VCPU_REGS_RDI,
				&ctxt->dst);

	if (ctxt->rep_prefix && (ctxt->d & String)) {
		struct read_cache *r = &ctxt->io_read;
		register_address_increment(ctxt, &ctxt->regs[VCPU_REGS_RCX], -1);

		if (!string_insn_completed(ctxt)) {
			/*
			 * Re-enter guest when pio read ahead buffer is empty
			 * or, if it is not used, after each 1024 iteration.
			 */
			if ((r->end != 0 || ctxt->regs[VCPU_REGS_RCX] & 0x3ff) &&
			    (r->end == 0 || r->end != r->pos)) {
				/*
				 * Reset read cache. Usually happens before
				 * decode, but since instruction is restarted
				 * we have to do it here.
				 */
				ctxt->mem_read.end = 0;
				return EMULATION_RESTART;
			}
			goto done; /* skip rip writeback */
		}
	}

	ctxt->eip = ctxt->_eip;

done:
	if (rc == X86EMUL_PROPAGATE_FAULT)
		ctxt->have_exception = true;
	if (rc == X86EMUL_INTERCEPTED)
		return EMULATION_INTERCEPTED;

	return (rc == X86EMUL_UNHANDLEABLE) ? EMULATION_FAILED : EMULATION_OK;

twobyte_insn:
	switch (ctxt->b) {
	case 0x09:		/* wbinvd */
		(ctxt->ops->wbinvd)(ctxt);
		break;
	case 0x08:		/* invd */
	case 0x0d:		/* GrpP (prefetch) */
	case 0x18:		/* Grp16 (prefetch/nop) */
		break;
	case 0x20: /* mov cr, reg */
		ctxt->dst.val = ops->get_cr(ctxt, ctxt->modrm_reg);
		break;
	case 0x21: /* mov from dr to reg */
		ops->get_dr(ctxt, ctxt->modrm_reg, &ctxt->dst.val);
		break;
	case 0x40 ... 0x4f:	/* cmov */
		ctxt->dst.val = ctxt->dst.orig_val = ctxt->src.val;
		if (!test_cc(ctxt->b, ctxt->eflags))
			ctxt->dst.type = OP_NONE; /* no writeback */
		break;
	case 0x80 ... 0x8f: /* jnz rel, etc*/
		if (test_cc(ctxt->b, ctxt->eflags))
			jmp_rel(ctxt, ctxt->src.val);
		break;
	case 0x90 ... 0x9f:     /* setcc r/m8 */
		ctxt->dst.val = test_cc(ctxt->b, ctxt->eflags);
		break;
	case 0xa4: /* shld imm8, r, r/m */
	case 0xa5: /* shld cl, r, r/m */
		emulate_2op_cl(ctxt, "shld");
		break;
	case 0xac: /* shrd imm8, r, r/m */
	case 0xad: /* shrd cl, r, r/m */
		emulate_2op_cl(ctxt, "shrd");
		break;
	case 0xae:              /* clflush */
		break;
	case 0xb6 ... 0xb7:	/* movzx */
		ctxt->dst.bytes = ctxt->op_bytes;
		ctxt->dst.val = (ctxt->d & ByteOp) ? (u8) ctxt->src.val
						   : (u16) ctxt->src.val;
		break;
	case 0xbe ... 0xbf:	/* movsx */
		ctxt->dst.bytes = ctxt->op_bytes;
		ctxt->dst.val = (ctxt->d & ByteOp) ? (s8) ctxt->src.val :
						     (s16) ctxt->src.val;
		break;
	case 0xc0 ... 0xc1:	/* xadd */
		emulate_2op_SrcV(ctxt, "add");
		/* Write back the register source. */
		ctxt->src.val = ctxt->dst.orig_val;
		write_register_operand(&ctxt->src);
		break;
	case 0xc3:		/* movnti */
		ctxt->dst.bytes = ctxt->op_bytes;
		ctxt->dst.val = (ctxt->op_bytes == 4) ? (u32) ctxt->src.val :
							(u64) ctxt->src.val;
		break;
	default:
		goto cannot_emulate;
	}

	if (rc != X86EMUL_CONTINUE)
		goto done;

	goto writeback;

cannot_emulate:
	return EMULATION_FAILED;
}