iothread: replace fair_mutex with a condition variable

[qemu.git] / target-i386 / op_helper.c
diff --git a/target-i386/op_helper.c b/target-i386/op_helper.c

index 33d44b0037db80cdee78b097555dbeb9c0947981..315e18b9a4c3f1e2e6962f433e754810574b9867 100644 (file)
--- a/target-i386/op_helper.c
+++ b/target-i386/op_helper.c
@@ -16,10 +16,11 @@
   * You should have received a copy of the GNU Lesser General Public
   * License along with this library; if not, see <http://www.gnu.org/licenses/>.
   */
-#define CPU_NO_GLOBAL_REGS
+
+#include <math.h>
  #include "exec.h"
-#include "exec-all.h"
  #include "host-utils.h"
+#include "ioport.h"
  
  //#define DEBUG_PCALL
  
@@ -93,16 +94,9 @@ static const uint8_t rclb_table[32] = {
      6, 7, 8, 0, 1, 2, 3, 4,
  };
  
-static const CPU86_LDouble f15rk[7] =
-{
-    0.00000000000000000000L,
-    1.00000000000000000000L,
-    3.14159265358979323851L,  /*pi*/
-    0.30102999566398119523L,  /*lg2*/
-    0.69314718055994530943L,  /*ln2*/
-    1.44269504088896340739L,  /*l2e*/
-    3.32192809488736234781L,  /*l2t*/
-};
+#define floatx80_lg2 make_floatx80( 0x3ffd, 0x9a209a84fbcff799LL )
+#define floatx80_l2e make_floatx80( 0x3fff, 0xb8aa3b295c17f0bcLL )
+#define floatx80_l2t make_floatx80( 0x4000, 0xd49a784bcd1b8afeLL )
  
  /* broken thread support */
  
@@ -348,6 +342,10 @@ static void switch_tss(int tss_selector,
          new_segs[R_GS] = 0;
          new_trap = 0;
      }
+    /* XXX: avoid a compiler warning, see
+     http://support.amd.com/us/Processor_TechDocs/24593.pdf
+     chapters 12.2.5 and 13.2.4 on how to implement TSS Trap bit */
+    (void)new_trap;
  
      /* NOTE: we must avoid memory exceptions during the task switch,
         so we make dummy accesses before */
@@ -1001,7 +999,7 @@ void helper_syscall(int next_eip_addend)
  {
      env->exception_index = EXCP_SYSCALL;
      env->exception_next_eip = env->eip + next_eip_addend;
-    cpu_loop_exit();
+    cpu_loop_exit(env);
  }
  #else
  void helper_syscall(int next_eip_addend)
@@ -1151,9 +1149,10 @@ static void do_interrupt_real(int intno, int is_int, int error_code,
      env->eflags &= ~(IF_MASK | TF_MASK | AC_MASK | RF_MASK);
  }
  
+#if defined(CONFIG_USER_ONLY)
  /* fake user mode interrupt */
-void do_interrupt_user(int intno, int is_int, int error_code,
-                       target_ulong next_eip)
+static void do_interrupt_user(int intno, int is_int, int error_code,
+                              target_ulong next_eip)
  {
      SegmentCache *dt;
      target_ulong ptr;
@@ -1182,7 +1181,8 @@ void do_interrupt_user(int intno, int is_int, int error_code,
          EIP = next_eip;
  }
  
-#if !defined(CONFIG_USER_ONLY)
+#else
+
  static void handle_even_inj(int intno, int is_int, int error_code,
                 int is_hw, int rm)
  {
@@ -1208,8 +1208,8 @@ static void handle_even_inj(int intno, int is_int, int error_code,
   * the int instruction. next_eip is the EIP value AFTER the interrupt
   * instruction. It is only relevant if is_int is TRUE.
   */
-void do_interrupt(int intno, int is_int, int error_code,
-                  target_ulong next_eip, int is_hw)
+static void do_interrupt_all(int intno, int is_int, int error_code,
+                             target_ulong next_eip, int is_hw)
  {
      if (qemu_loglevel_mask(CPU_LOG_INT)) {
          if ((env->cr[0] & CR0_PE_MASK)) {
@@ -1230,7 +1230,7 @@ void do_interrupt(int intno, int is_int, int error_code,
  #if 0
              {
                  int i;
-                uint8_t *ptr;
+                target_ulong ptr;
                  qemu_log("       code=");
                  ptr = env->segs[R_CS].base + env->eip;
                  for(i = 0; i < 16; i++) {
@@ -1271,6 +1271,46 @@ void do_interrupt(int intno, int is_int, int error_code,
  #endif
  }
  
+void do_interrupt(CPUState *env1)
+{
+    CPUState *saved_env;
+
+    saved_env = env;
+    env = env1;
+#if defined(CONFIG_USER_ONLY)
+    /* if user mode only, we simulate a fake exception
+       which will be handled outside the cpu execution
+       loop */
+    do_interrupt_user(env->exception_index,
+                      env->exception_is_int,
+                      env->error_code,
+                      env->exception_next_eip);
+    /* successfully delivered */
+    env->old_exception = -1;
+#else
+    /* simulate a real cpu exception. On i386, it can
+       trigger new exceptions, but we do not handle
+       double or triple faults yet. */
+    do_interrupt_all(env->exception_index,
+                     env->exception_is_int,
+                     env->error_code,
+                     env->exception_next_eip, 0);
+    /* successfully delivered */
+    env->old_exception = -1;
+#endif
+    env = saved_env;
+}
+
+void do_interrupt_x86_hardirq(CPUState *env1, int intno, int is_hw)
+{
+    CPUState *saved_env;
+
+    saved_env = env;
+    env = env1;
+    do_interrupt_all(intno, 0, 0, 0, is_hw);
+    env = saved_env;
+}
+
  /* This should come from sysemu.h - if we could include it here... */
  void qemu_system_reset_request(void);
  
@@ -1336,7 +1376,7 @@ static void QEMU_NORETURN raise_interrupt(int intno, int is_int, int error_code,
      env->error_code = error_code;
      env->exception_is_int = is_int;
      env->exception_next_eip = env->eip + next_eip_addend;
-    cpu_loop_exit();
+    cpu_loop_exit(env);
  }
  
  /* shortcuts to generate exceptions */
@@ -1351,11 +1391,16 @@ void raise_exception(int exception_index)
      raise_interrupt(exception_index, 0, 0, 0);
  }
  
+void raise_exception_env(int exception_index, CPUState *nenv)
+{
+    env = nenv;
+    raise_exception(exception_index);
+}
  /* SMM support */
  
  #if defined(CONFIG_USER_ONLY)
  
-void do_smm_enter(void)
+void do_smm_enter(CPUState *env1)
  {
  }
  
@@ -1371,11 +1416,15 @@ void helper_rsm(void)
  #define SMM_REVISION_ID 0x00020000
  #endif
  
-void do_smm_enter(void)
+void do_smm_enter(CPUState *env1)
  {
      target_ulong sm_state;
      SegmentCache *dt;
      int i, offset;
+    CPUState *saved_env;
+
+    saved_env = env;
+    env = env1;
  
      qemu_log_mask(CPU_LOG_INT, "SMM: enter\n");
      log_cpu_state_mask(CPU_LOG_INT, env, X86_DUMP_CCOP);
@@ -1502,6 +1551,7 @@ void do_smm_enter(void)
      cpu_x86_update_cr4(env, 0);
      env->dr[7] = 0x00000400;
      CC_OP = CC_OP_EFLAGS;
+    env = saved_env;
  }
  
  void helper_rsm(void)
@@ -2882,7 +2932,7 @@ target_ulong helper_read_crN(int reg)
          break;
      case 8:
          if (!(env->hflags2 & HF2_VINTR_MASK)) {
-            val = cpu_get_apic_tpr(env);
+            val = cpu_get_apic_tpr(env->apic_state);
          } else {
              val = env->v_tpr;
          }
@@ -2906,7 +2956,7 @@ void helper_write_crN(int reg, target_ulong t0)
          break;
      case 8:
          if (!(env->hflags2 & HF2_VINTR_MASK)) {
-            cpu_set_apic_tpr(env, t0);
+            cpu_set_apic_tpr(env->apic_state, t0);
          }
          env->v_tpr = t0 & 0x0f;
          break;
@@ -2969,6 +3019,12 @@ void helper_rdtsc(void)
      EDX = (uint32_t)(val >> 32);
  }
  
+void helper_rdtscp(void)
+{
+    helper_rdtsc();
+    ECX = (uint32_t)(env->tsc_aux);
+}
+
  void helper_rdpmc(void)
  {
      if ((env->cr[4] & CR4_PCE_MASK) && ((env->hflags & HF_CPL_MASK) != 0)) {
@@ -3008,7 +3064,7 @@ void helper_wrmsr(void)
          env->sysenter_eip = val;
          break;
      case MSR_IA32_APICBASE:
-        cpu_set_apic_base(env, val);
+        cpu_set_apic_base(env->apic_state, val);
          break;
      case MSR_EFER:
          {
@@ -3107,6 +3163,9 @@ void helper_wrmsr(void)
              && (val == 0 || val == ~(uint64_t)0))
              env->mcg_ctl = val;
          break;
+    case MSR_TSC_AUX:
+        env->tsc_aux = val;
+        break;
      default:
          if ((uint32_t)ECX >= MSR_MC0_CTL
              && (uint32_t)ECX < MSR_MC0_CTL + (4 * env->mcg_cap & 0xff)) {
@@ -3138,7 +3197,7 @@ void helper_rdmsr(void)
          val = env->sysenter_eip;
          break;
      case MSR_IA32_APICBASE:
-        val = cpu_get_apic_base(env);
+        val = cpu_get_apic_base(env->apic_state);
          break;
      case MSR_EFER:
          val = env->efer;
@@ -3177,6 +3236,9 @@ void helper_rdmsr(void)
      case MSR_KERNELGSBASE:
          val = env->kernelgsbase;
          break;
+    case MSR_TSC_AUX:
+        val = env->tsc_aux;
+        break;
  #endif
      case MSR_MTRRphysBase(0):
      case MSR_MTRRphysBase(1):
@@ -3409,6 +3471,28 @@ void helper_verw(target_ulong selector1)
  
  /* x87 FPU helpers */
  
+static inline double floatx80_to_double(floatx80 a)
+{
+    union {
+        float64 f64;
+        double d;
+    } u;
+
+    u.f64 = floatx80_to_float64(a, &env->fp_status);
+    return u.d;
+}
+
+static inline floatx80 double_to_floatx80(double a)
+{
+    union {
+        float64 f64;
+        double d;
+    } u;
+
+    u.d = a;
+    return float64_to_floatx80(u.f64, &env->fp_status);
+}
+
  static void fpu_set_exception(int mask)
  {
      env->fpus |= mask;
@@ -3416,11 +3500,12 @@ static void fpu_set_exception(int mask)
          env->fpus |= FPUS_SE | FPUS_B;
  }
  
-static inline CPU86_LDouble helper_fdiv(CPU86_LDouble a, CPU86_LDouble b)
+static inline floatx80 helper_fdiv(floatx80 a, floatx80 b)
  {
-    if (b == 0.0)
+    if (floatx80_is_zero(b)) {
          fpu_set_exception(FPUS_ZE);
-    return a / b;
+    }
+    return floatx80_div(a, b, &env->fp_status);
  }
  
  static void fpu_raise_exception(void)
@@ -3442,7 +3527,7 @@ void helper_flds_FT0(uint32_t val)
          uint32_t i;
      } u;
      u.i = val;
-    FT0 = float32_to_floatx(u.f, &env->fp_status);
+    FT0 = float32_to_floatx80(u.f, &env->fp_status);
  }
  
  void helper_fldl_FT0(uint64_t val)
@@ -3452,12 +3537,12 @@ void helper_fldl_FT0(uint64_t val)
          uint64_t i;
      } u;
      u.i = val;
-    FT0 = float64_to_floatx(u.f, &env->fp_status);
+    FT0 = float64_to_floatx80(u.f, &env->fp_status);
  }
  
  void helper_fildl_FT0(int32_t val)
  {
-    FT0 = int32_to_floatx(val, &env->fp_status);
+    FT0 = int32_to_floatx80(val, &env->fp_status);
  }
  
  void helper_flds_ST0(uint32_t val)
@@ -3469,7 +3554,7 @@ void helper_flds_ST0(uint32_t val)
      } u;
      new_fpstt = (env->fpstt - 1) & 7;
      u.i = val;
-    env->fpregs[new_fpstt].d = float32_to_floatx(u.f, &env->fp_status);
+    env->fpregs[new_fpstt].d = float32_to_floatx80(u.f, &env->fp_status);
      env->fpstt = new_fpstt;
      env->fptags[new_fpstt] = 0; /* validate stack entry */
  }
@@ -3483,7 +3568,7 @@ void helper_fldl_ST0(uint64_t val)
      } u;
      new_fpstt = (env->fpstt - 1) & 7;
      u.i = val;
-    env->fpregs[new_fpstt].d = float64_to_floatx(u.f, &env->fp_status);
+    env->fpregs[new_fpstt].d = float64_to_floatx80(u.f, &env->fp_status);
      env->fpstt = new_fpstt;
      env->fptags[new_fpstt] = 0; /* validate stack entry */
  }
@@ -3492,7 +3577,7 @@ void helper_fildl_ST0(int32_t val)
  {
      int new_fpstt;
      new_fpstt = (env->fpstt - 1) & 7;
-    env->fpregs[new_fpstt].d = int32_to_floatx(val, &env->fp_status);
+    env->fpregs[new_fpstt].d = int32_to_floatx80(val, &env->fp_status);
      env->fpstt = new_fpstt;
      env->fptags[new_fpstt] = 0; /* validate stack entry */
  }
@@ -3501,7 +3586,7 @@ void helper_fildll_ST0(int64_t val)
  {
      int new_fpstt;
      new_fpstt = (env->fpstt - 1) & 7;
-    env->fpregs[new_fpstt].d = int64_to_floatx(val, &env->fp_status);
+    env->fpregs[new_fpstt].d = int64_to_floatx80(val, &env->fp_status);
      env->fpstt = new_fpstt;
      env->fptags[new_fpstt] = 0; /* validate stack entry */
  }
@@ -3512,7 +3597,7 @@ uint32_t helper_fsts_ST0(void)
          float32 f;
          uint32_t i;
      } u;
-    u.f = floatx_to_float32(ST0, &env->fp_status);
+    u.f = floatx80_to_float32(ST0, &env->fp_status);
      return u.i;
  }
  
@@ -3522,14 +3607,14 @@ uint64_t helper_fstl_ST0(void)
          float64 f;
          uint64_t i;
      } u;
-    u.f = floatx_to_float64(ST0, &env->fp_status);
+    u.f = floatx80_to_float64(ST0, &env->fp_status);
      return u.i;
  }
  
  int32_t helper_fist_ST0(void)
  {
      int32_t val;
-    val = floatx_to_int32(ST0, &env->fp_status);
+    val = floatx80_to_int32(ST0, &env->fp_status);
      if (val != (int16_t)val)
          val = -32768;
      return val;
@@ -3538,21 +3623,21 @@ int32_t helper_fist_ST0(void)
  int32_t helper_fistl_ST0(void)
  {
      int32_t val;
-    val = floatx_to_int32(ST0, &env->fp_status);
+    val = floatx80_to_int32(ST0, &env->fp_status);
      return val;
  }
  
  int64_t helper_fistll_ST0(void)
  {
      int64_t val;
-    val = floatx_to_int64(ST0, &env->fp_status);
+    val = floatx80_to_int64(ST0, &env->fp_status);
      return val;
  }
  
  int32_t helper_fistt_ST0(void)
  {
      int32_t val;
-    val = floatx_to_int32_round_to_zero(ST0, &env->fp_status);
+    val = floatx80_to_int32_round_to_zero(ST0, &env->fp_status);
      if (val != (int16_t)val)
          val = -32768;
      return val;
@@ -3561,14 +3646,14 @@ int32_t helper_fistt_ST0(void)
  int32_t helper_fisttl_ST0(void)
  {
      int32_t val;
-    val = floatx_to_int32_round_to_zero(ST0, &env->fp_status);
+    val = floatx80_to_int32_round_to_zero(ST0, &env->fp_status);
      return val;
  }
  
  int64_t helper_fisttll_ST0(void)
  {
      int64_t val;
-    val = floatx_to_int64_round_to_zero(ST0, &env->fp_status);
+    val = floatx80_to_int64_round_to_zero(ST0, &env->fp_status);
      return val;
  }
  
@@ -3637,7 +3722,7 @@ void helper_fmov_STN_ST0(int st_index)
  
  void helper_fxchg_ST0_STN(int st_index)
  {
-    CPU86_LDouble tmp;
+    floatx80 tmp;
      tmp = ST(st_index);
      ST(st_index) = ST0;
      ST0 = tmp;
@@ -3651,7 +3736,7 @@ void helper_fcom_ST0_FT0(void)
  {
      int ret;
  
-    ret = floatx_compare(ST0, FT0, &env->fp_status);
+    ret = floatx80_compare(ST0, FT0, &env->fp_status);
      env->fpus = (env->fpus & ~0x4500) | fcom_ccval[ret + 1];
  }
  
@@ -3659,7 +3744,7 @@ void helper_fucom_ST0_FT0(void)
  {
      int ret;
  
-    ret = floatx_compare_quiet(ST0, FT0, &env->fp_status);
+    ret = floatx80_compare_quiet(ST0, FT0, &env->fp_status);
      env->fpus = (env->fpus & ~0x4500) | fcom_ccval[ret+ 1];
  }
  
@@ -3670,7 +3755,7 @@ void helper_fcomi_ST0_FT0(void)
      int eflags;
      int ret;
  
-    ret = floatx_compare(ST0, FT0, &env->fp_status);
+    ret = floatx80_compare(ST0, FT0, &env->fp_status);
      eflags = helper_cc_compute_all(CC_OP);
      eflags = (eflags & ~(CC_Z | CC_P | CC_C)) | fcomi_ccval[ret + 1];
      CC_SRC = eflags;
@@ -3681,7 +3766,7 @@ void helper_fucomi_ST0_FT0(void)
      int eflags;
      int ret;
  
-    ret = floatx_compare_quiet(ST0, FT0, &env->fp_status);
+    ret = floatx80_compare_quiet(ST0, FT0, &env->fp_status);
      eflags = helper_cc_compute_all(CC_OP);
      eflags = (eflags & ~(CC_Z | CC_P | CC_C)) | fcomi_ccval[ret + 1];
      CC_SRC = eflags;
@@ -3689,22 +3774,22 @@ void helper_fucomi_ST0_FT0(void)
  
  void helper_fadd_ST0_FT0(void)
  {
-    ST0 += FT0;
+    ST0 = floatx80_add(ST0, FT0, &env->fp_status);
  }
  
  void helper_fmul_ST0_FT0(void)
  {
-    ST0 *= FT0;
+    ST0 = floatx80_mul(ST0, FT0, &env->fp_status);
  }
  
  void helper_fsub_ST0_FT0(void)
  {
-    ST0 -= FT0;
+    ST0 = floatx80_sub(ST0, FT0, &env->fp_status);
  }
  
  void helper_fsubr_ST0_FT0(void)
  {
-    ST0 = FT0 - ST0;
+    ST0 = floatx80_sub(FT0, ST0, &env->fp_status);
  }
  
  void helper_fdiv_ST0_FT0(void)
@@ -3721,36 +3806,34 @@ void helper_fdivr_ST0_FT0(void)
  
  void helper_fadd_STN_ST0(int st_index)
  {
-    ST(st_index) += ST0;
+    ST(st_index) = floatx80_add(ST(st_index), ST0, &env->fp_status);
  }
  
  void helper_fmul_STN_ST0(int st_index)
  {
-    ST(st_index) *= ST0;
+    ST(st_index) = floatx80_mul(ST(st_index), ST0, &env->fp_status);
  }
  
  void helper_fsub_STN_ST0(int st_index)
  {
-    ST(st_index) -= ST0;
+    ST(st_index) = floatx80_sub(ST(st_index), ST0, &env->fp_status);
  }
  
  void helper_fsubr_STN_ST0(int st_index)
  {
-    CPU86_LDouble *p;
-    p = &ST(st_index);
-    *p = ST0 - *p;
+    ST(st_index) = floatx80_sub(ST0, ST(st_index), &env->fp_status);
  }
  
  void helper_fdiv_STN_ST0(int st_index)
  {
-    CPU86_LDouble *p;
+    floatx80 *p;
      p = &ST(st_index);
      *p = helper_fdiv(*p, ST0);
  }
  
  void helper_fdivr_STN_ST0(int st_index)
  {
-    CPU86_LDouble *p;
+    floatx80 *p;
      p = &ST(st_index);
      *p = helper_fdiv(ST0, *p);
  }
@@ -3758,52 +3841,52 @@ void helper_fdivr_STN_ST0(int st_index)
  /* misc FPU operations */
  void helper_fchs_ST0(void)
  {
-    ST0 = floatx_chs(ST0);
+    ST0 = floatx80_chs(ST0);
  }
  
  void helper_fabs_ST0(void)
  {
-    ST0 = floatx_abs(ST0);
+    ST0 = floatx80_abs(ST0);
  }
  
  void helper_fld1_ST0(void)
  {
-    ST0 = f15rk[1];
+    ST0 = floatx80_one;
  }
  
  void helper_fldl2t_ST0(void)
  {
-    ST0 = f15rk[6];
+    ST0 = floatx80_l2t;
  }
  
  void helper_fldl2e_ST0(void)
  {
-    ST0 = f15rk[5];
+    ST0 = floatx80_l2e;
  }
  
  void helper_fldpi_ST0(void)
  {
-    ST0 = f15rk[2];
+    ST0 = floatx80_pi;
  }
  
  void helper_fldlg2_ST0(void)
  {
-    ST0 = f15rk[3];
+    ST0 = floatx80_lg2;
  }
  
  void helper_fldln2_ST0(void)
  {
-    ST0 = f15rk[4];
+    ST0 = floatx80_ln2;
  }
  
  void helper_fldz_ST0(void)
  {
-    ST0 = f15rk[0];
+    ST0 = floatx80_zero;
  }
  
  void helper_fldz_FT0(void)
  {
-    FT0 = f15rk[0];
+    FT0 = floatx80_zero;
  }
  
  uint32_t helper_fnstsw(void)
@@ -3837,7 +3920,6 @@ static void update_fp_status(void)
          break;
      }
      set_float_rounding_mode(rnd_type, &env->fp_status);
-#ifdef FLOATX80
      switch((env->fpuc >> 8) & 3) {
      case 0:
          rnd_type = 32;
@@ -3851,7 +3933,6 @@ static void update_fp_status(void)
          break;
      }
      set_floatx80_rounding_precision(rnd_type, &env->fp_status);
-#endif
  }
  
  void helper_fldcw(uint32_t val)
@@ -3890,7 +3971,7 @@ void helper_fninit(void)
  
  void helper_fbld_ST0(target_ulong ptr)
  {
-    CPU86_LDouble tmp;
+    floatx80 tmp;
      uint64_t val;
      unsigned int v;
      int i;
@@ -3900,9 +3981,10 @@ void helper_fbld_ST0(target_ulong ptr)
          v = ldub(ptr + i);
          val = (val * 100) + ((v >> 4) * 10) + (v & 0xf);
      }
-    tmp = val;
-    if (ldub(ptr + 9) & 0x80)
-        tmp = -tmp;
+    tmp = int64_to_floatx80(val, &env->fp_status);
+    if (ldub(ptr + 9) & 0x80) {
+        floatx80_chs(tmp);
+    }
      fpush();
      ST0 = tmp;
  }
@@ -3913,7 +3995,7 @@ void helper_fbst_ST0(target_ulong ptr)
      target_ulong mem_ref, mem_end;
      int64_t val;
  
-    val = floatx_to_int64(ST0, &env->fp_status);
+    val = floatx80_to_int64(ST0, &env->fp_status);
      mem_ref = ptr;
      mem_end = mem_ref + 9;
      if (val < 0) {
@@ -3937,17 +4019,19 @@ void helper_fbst_ST0(target_ulong ptr)
  
  void helper_f2xm1(void)
  {
-    ST0 = pow(2.0,ST0) - 1.0;
+    double val = floatx80_to_double(ST0);
+    val = pow(2.0, val) - 1.0;
+    ST0 = double_to_floatx80(val);
  }
  
  void helper_fyl2x(void)
  {
-    CPU86_LDouble fptemp;
+    double fptemp = floatx80_to_double(ST0);
  
-    fptemp = ST0;
      if (fptemp>0.0){
-        fptemp = log(fptemp)/log(2.0);  /* log2(ST) */
-        ST1 *= fptemp;
+        fptemp = log(fptemp)/log(2.0);    /* log2(ST) */
+        fptemp *= floatx80_to_double(ST1);
+        ST1 = double_to_floatx80(fptemp);
          fpop();
      } else {
          env->fpus &= (~0x4700);
@@ -3957,15 +4041,15 @@ void helper_fyl2x(void)
  
  void helper_fptan(void)
  {
-    CPU86_LDouble fptemp;
+    double fptemp = floatx80_to_double(ST0);
  
-    fptemp = ST0;
      if((fptemp > MAXTAN)||(fptemp < -MAXTAN)) {
          env->fpus |= 0x400;
      } else {
-        ST0 = tan(fptemp);
+        fptemp = tan(fptemp);
+        ST0 = double_to_floatx80(fptemp);
          fpush();
-        ST0 = 1.0;
+        ST0 = floatx80_one;
          env->fpus &= (~0x400);  /* C2 <-- 0 */
          /* the above code is for  |arg| < 2**52 only */
      }
@@ -3973,45 +4057,57 @@ void helper_fptan(void)
  
  void helper_fpatan(void)
  {
-    CPU86_LDouble fptemp, fpsrcop;
+    double fptemp, fpsrcop;
  
-    fpsrcop = ST1;
-    fptemp = ST0;
-    ST1 = atan2(fpsrcop,fptemp);
+    fpsrcop = floatx80_to_double(ST1);
+    fptemp = floatx80_to_double(ST0);
+    ST1 = double_to_floatx80(atan2(fpsrcop, fptemp));
      fpop();
  }
  
  void helper_fxtract(void)
  {
-    CPU86_LDoubleU temp;
-    unsigned int expdif;
+    CPU_LDoubleU temp;
  
      temp.d = ST0;
-    expdif = EXPD(temp) - EXPBIAS;
-    /*DP exponent bias*/
-    ST0 = expdif;
-    fpush();
-    BIASEXPONENT(temp);
-    ST0 = temp.d;
+
+    if (floatx80_is_zero(ST0)) {
+        /* Easy way to generate -inf and raising division by 0 exception */
+        ST0 = floatx80_div(floatx80_chs(floatx80_one), floatx80_zero, &env->fp_status);
+        fpush();
+        ST0 = temp.d;
+    } else {
+        int expdif;
+
+        expdif = EXPD(temp) - EXPBIAS;
+        /*DP exponent bias*/
+        ST0 = int32_to_floatx80(expdif, &env->fp_status);
+        fpush();
+        BIASEXPONENT(temp);
+        ST0 = temp.d;
+    }
  }
  
  void helper_fprem1(void)
  {
-    CPU86_LDouble dblq, fpsrcop, fptemp;
-    CPU86_LDoubleU fpsrcop1, fptemp1;
+    double st0, st1, dblq, fpsrcop, fptemp;
+    CPU_LDoubleU fpsrcop1, fptemp1;
      int expdif;
      signed long long int q;
  
-    if (isinf(ST0) || isnan(ST0) || isnan(ST1) || (ST1 == 0.0)) {
-        ST0 = 0.0 / 0.0; /* NaN */
+    st0 = floatx80_to_double(ST0);
+    st1 = floatx80_to_double(ST1);
+
+    if (isinf(st0) || isnan(st0) || isnan(st1) || (st1 == 0.0)) {
+        ST0 = double_to_floatx80(0.0 / 0.0); /* NaN */
          env->fpus &= (~0x4700); /* (C3,C2,C1,C0) <-- 0000 */
          return;
      }
  
-    fpsrcop = ST0;
-    fptemp = ST1;
-    fpsrcop1.d = fpsrcop;
-    fptemp1.d = fptemp;
+    fpsrcop = st0;
+    fptemp = st1;
+    fpsrcop1.d = ST0;
+    fptemp1.d = ST1;
      expdif = EXPD(fpsrcop1) - EXPD(fptemp1);
  
      if (expdif < 0) {
@@ -4025,7 +4121,7 @@ void helper_fprem1(void)
          dblq = fpsrcop / fptemp;
          /* round dblq towards nearest integer */
          dblq = rint(dblq);
-        ST0 = fpsrcop - fptemp * dblq;
+        st0 = fpsrcop - fptemp * dblq;
  
          /* convert dblq to q by truncating towards zero */
          if (dblq < 0.0)
@@ -4041,31 +4137,35 @@ void helper_fprem1(void)
      } else {
          env->fpus |= 0x400;  /* C2 <-- 1 */
          fptemp = pow(2.0, expdif - 50);
-        fpsrcop = (ST0 / ST1) / fptemp;
+        fpsrcop = (st0 / st1) / fptemp;
          /* fpsrcop = integer obtained by chopping */
          fpsrcop = (fpsrcop < 0.0) ?
                    -(floor(fabs(fpsrcop))) : floor(fpsrcop);
-        ST0 -= (ST1 * fpsrcop * fptemp);
+        st0 -= (st1 * fpsrcop * fptemp);
      }
+    ST0 = double_to_floatx80(st0);
  }
  
  void helper_fprem(void)
  {
-    CPU86_LDouble dblq, fpsrcop, fptemp;
-    CPU86_LDoubleU fpsrcop1, fptemp1;
+    double st0, st1, dblq, fpsrcop, fptemp;
+    CPU_LDoubleU fpsrcop1, fptemp1;
      int expdif;
      signed long long int q;
  
-    if (isinf(ST0) || isnan(ST0) || isnan(ST1) || (ST1 == 0.0)) {
-       ST0 = 0.0 / 0.0; /* NaN */
+    st0 = floatx80_to_double(ST0);
+    st1 = floatx80_to_double(ST1);
+
+    if (isinf(st0) || isnan(st0) || isnan(st1) || (st1 == 0.0)) {
+       ST0 = double_to_floatx80(0.0 / 0.0); /* NaN */
         env->fpus &= (~0x4700); /* (C3,C2,C1,C0) <-- 0000 */
         return;
      }
  
-    fpsrcop = (CPU86_LDouble)ST0;
-    fptemp = (CPU86_LDouble)ST1;
-    fpsrcop1.d = fpsrcop;
-    fptemp1.d = fptemp;
+    fpsrcop = st0;
+    fptemp = st1;
+    fpsrcop1.d = ST0;
+    fptemp1.d = ST1;
      expdif = EXPD(fpsrcop1) - EXPD(fptemp1);
  
      if (expdif < 0) {
@@ -4079,7 +4179,7 @@ void helper_fprem(void)
          dblq = fpsrcop/*ST0*/ / fptemp/*ST1*/;
          /* round dblq towards zero */
          dblq = (dblq < 0.0) ? ceil(dblq) : floor(dblq);
-        ST0 = fpsrcop/*ST0*/ - fptemp * dblq;
+        st0 = fpsrcop/*ST0*/ - fptemp * dblq;
  
          /* convert dblq to q by truncating towards zero */
          if (dblq < 0.0)
@@ -4096,22 +4196,23 @@ void helper_fprem(void)
          int N = 32 + (expdif % 32); /* as per AMD docs */
          env->fpus |= 0x400;  /* C2 <-- 1 */
          fptemp = pow(2.0, (double)(expdif - N));
-        fpsrcop = (ST0 / ST1) / fptemp;
+        fpsrcop = (st0 / st1) / fptemp;
          /* fpsrcop = integer obtained by chopping */
          fpsrcop = (fpsrcop < 0.0) ?
                    -(floor(fabs(fpsrcop))) : floor(fpsrcop);
-        ST0 -= (ST1 * fpsrcop * fptemp);
+        st0 -= (st1 * fpsrcop * fptemp);
      }
+    ST0 = double_to_floatx80(st0);
  }
  
  void helper_fyl2xp1(void)
  {
-    CPU86_LDouble fptemp;
+    double fptemp = floatx80_to_double(ST0);
  
-    fptemp = ST0;
      if ((fptemp+1.0)>0.0) {
          fptemp = log(fptemp+1.0) / log(2.0); /* log2(ST+1.0) */
-        ST1 *= fptemp;
+        fptemp *= floatx80_to_double(ST1);
+        ST1 = double_to_floatx80(fptemp);
          fpop();
      } else {
          env->fpus &= (~0x4700);
@@ -4121,27 +4222,23 @@ void helper_fyl2xp1(void)
  
  void helper_fsqrt(void)
  {
-    CPU86_LDouble fptemp;
-
-    fptemp = ST0;
-    if (fptemp<0.0) {
+    if (floatx80_is_neg(ST0)) {
          env->fpus &= (~0x4700);  /* (C3,C2,C1,C0) <-- 0000 */
          env->fpus |= 0x400;
      }
-    ST0 = sqrt(fptemp);
+    ST0 = floatx80_sqrt(ST0, &env->fp_status);
  }
  
  void helper_fsincos(void)
  {
-    CPU86_LDouble fptemp;
+    double fptemp = floatx80_to_double(ST0);
  
-    fptemp = ST0;
      if ((fptemp > MAXTAN)||(fptemp < -MAXTAN)) {
          env->fpus |= 0x400;
      } else {
-        ST0 = sin(fptemp);
+        ST0 = double_to_floatx80(sin(fptemp));
          fpush();
-        ST0 = cos(fptemp);
+        ST0 = double_to_floatx80(cos(fptemp));
          env->fpus &= (~0x400);  /* C2 <-- 0 */
          /* the above code is for  |arg| < 2**63 only */
      }
@@ -4149,23 +4246,27 @@ void helper_fsincos(void)
  
  void helper_frndint(void)
  {
-    ST0 = floatx_round_to_int(ST0, &env->fp_status);
+    ST0 = floatx80_round_to_int(ST0, &env->fp_status);
  }
  
  void helper_fscale(void)
  {
-    ST0 = ldexp (ST0, (int)(ST1));
+    if (floatx80_is_any_nan(ST1)) {
+        ST0 = ST1;
+    } else {
+        int n = floatx80_to_int32_round_to_zero(ST1, &env->fp_status);
+        ST0 = floatx80_scalbn(ST0, n, &env->fp_status);
+    }
  }
  
  void helper_fsin(void)
  {
-    CPU86_LDouble fptemp;
+    double fptemp = floatx80_to_double(ST0);
  
-    fptemp = ST0;
      if ((fptemp > MAXTAN)||(fptemp < -MAXTAN)) {
          env->fpus |= 0x400;
      } else {
-        ST0 = sin(fptemp);
+        ST0 = double_to_floatx80(sin(fptemp));
          env->fpus &= (~0x400);  /* C2 <-- 0 */
          /* the above code is for  |arg| < 2**53 only */
      }
@@ -4173,13 +4274,12 @@ void helper_fsin(void)
  
  void helper_fcos(void)
  {
-    CPU86_LDouble fptemp;
+    double fptemp = floatx80_to_double(ST0);
  
-    fptemp = ST0;
      if((fptemp > MAXTAN)||(fptemp < -MAXTAN)) {
          env->fpus |= 0x400;
      } else {
-        ST0 = cos(fptemp);
+        ST0 = double_to_floatx80(cos(fptemp));
          env->fpus &= (~0x400);  /* C2 <-- 0 */
          /* the above code is for  |arg5 < 2**63 only */
      }
@@ -4187,7 +4287,7 @@ void helper_fcos(void)
  
  void helper_fxam_ST0(void)
  {
-    CPU86_LDoubleU temp;
+    CPU_LDoubleU temp;
      int expdif;
  
      temp.d = ST0;
@@ -4199,11 +4299,7 @@ void helper_fxam_ST0(void)
      /* XXX: test fptags too */
      expdif = EXPD(temp);
      if (expdif == MAXEXPD) {
-#ifdef USE_X86LDOUBLE
          if (MANTD(temp) == 0x8000000000000000ULL)
-#else
-        if (MANTD(temp) == 0)
-#endif
              env->fpus |=  0x500 /*Infinity*/;
          else
              env->fpus |=  0x100 /*NaN*/;
@@ -4221,7 +4317,7 @@ void helper_fstenv(target_ulong ptr, int data32)
  {
      int fpus, fptag, exp, i;
      uint64_t mant;
-    CPU86_LDoubleU tmp;
+    CPU_LDoubleU tmp;
  
      fpus = (env->fpus & ~0x3800) | (env->fpstt & 0x7) << 11;
      fptag = 0;
@@ -4237,9 +4333,7 @@ void helper_fstenv(target_ulong ptr, int data32)
                  /* zero */
                 fptag |= 1;
             } else if (exp == 0 || exp == MAXEXPD
-#ifdef USE_X86LDOUBLE
                         || (mant & (1LL << 63)) == 0
-#endif
                         ) {
                  /* NaNs, infinity, denormal */
                  fptag |= 2;
@@ -4291,7 +4385,7 @@ void helper_fldenv(target_ulong ptr, int data32)
  
  void helper_fsave(target_ulong ptr, int data32)
  {
-    CPU86_LDouble tmp;
+    floatx80 tmp;
      int i;
  
      helper_fstenv(ptr, data32);
@@ -4319,7 +4413,7 @@ void helper_fsave(target_ulong ptr, int data32)
  
  void helper_frstor(target_ulong ptr, int data32)
  {
-    CPU86_LDouble tmp;
+    floatx80 tmp;
      int i;
  
      helper_fldenv(ptr, data32);
@@ -4335,9 +4429,14 @@ void helper_frstor(target_ulong ptr, int data32)
  void helper_fxsave(target_ulong ptr, int data64)
  {
      int fpus, fptag, i, nb_xmm_regs;
-    CPU86_LDouble tmp;
+    floatx80 tmp;
      target_ulong addr;
  
+    /* The operand must be 16 byte aligned */
+    if (ptr & 0xf) {
+        raise_exception(EXCP0D_GPF);
+    }
+
      fpus = (env->fpus & ~0x3800) | (env->fpstt & 0x7) << 11;
      fptag = 0;
      for(i = 0; i < 8; i++) {
@@ -4391,9 +4490,14 @@ void helper_fxsave(target_ulong ptr, int data64)
  void helper_fxrstor(target_ulong ptr, int data64)
  {
      int i, fpus, fptag, nb_xmm_regs;
-    CPU86_LDouble tmp;
+    floatx80 tmp;
      target_ulong addr;
  
+    /* The operand must be 16 byte aligned */
+    if (ptr & 0xf) {
+        raise_exception(EXCP0D_GPF);
+    }
+
      env->fpuc = lduw(ptr);
      fpus = lduw(ptr + 2);
      fptag = lduw(ptr + 4);
@@ -4433,61 +4537,23 @@ void helper_fxrstor(target_ulong ptr, int data64)
      }
  }
  
-#ifndef USE_X86LDOUBLE
-
-void cpu_get_fp80(uint64_t *pmant, uint16_t *pexp, CPU86_LDouble f)
-{
-    CPU86_LDoubleU temp;
-    int e;
-
-    temp.d = f;
-    /* mantissa */
-    *pmant = (MANTD(temp) << 11) | (1LL << 63);
-    /* exponent + sign */
-    e = EXPD(temp) - EXPBIAS + 16383;
-    e |= SIGND(temp) >> 16;
-    *pexp = e;
-}
-
-CPU86_LDouble cpu_set_fp80(uint64_t mant, uint16_t upper)
-{
-    CPU86_LDoubleU temp;
-    int e;
-    uint64_t ll;
-
-    /* XXX: handle overflow ? */
-    e = (upper & 0x7fff) - 16383 + EXPBIAS; /* exponent */
-    e |= (upper >> 4) & 0x800; /* sign */
-    ll = (mant >> 11) & ((1LL << 52) - 1);
-#ifdef __arm__
-    temp.l.upper = (e << 20) | (ll >> 32);
-    temp.l.lower = ll;
-#else
-    temp.ll = ll | ((uint64_t)e << 52);
-#endif
-    return temp.d;
-}
-
-#else
-
-void cpu_get_fp80(uint64_t *pmant, uint16_t *pexp, CPU86_LDouble f)
+void cpu_get_fp80(uint64_t *pmant, uint16_t *pexp, floatx80 f)
  {
-    CPU86_LDoubleU temp;
+    CPU_LDoubleU temp;
  
      temp.d = f;
      *pmant = temp.l.lower;
      *pexp = temp.l.upper;
  }
  
-CPU86_LDouble cpu_set_fp80(uint64_t mant, uint16_t upper)
+floatx80 cpu_set_fp80(uint64_t mant, uint16_t upper)
  {
-    CPU86_LDoubleU temp;
+    CPU_LDoubleU temp;
  
      temp.l.upper = upper;
      temp.l.lower = mant;
      return temp.d;
  }
-#endif
  
  #ifdef TARGET_X86_64
  
@@ -4638,7 +4704,7 @@ static void do_hlt(void)
      env->hflags &= ~HF_INHIBIT_IRQ_MASK; /* needed if sti is just before */
      env->halted = 1;
      env->exception_index = EXCP_HLT;
-    cpu_loop_exit();
+    cpu_loop_exit(env);
  }
  
  void helper_hlt(int next_eip_addend)
@@ -4676,7 +4742,7 @@ void helper_mwait(int next_eip_addend)
  void helper_debug(void)
  {
      env->exception_index = EXCP_DEBUG;
-    cpu_loop_exit();
+    cpu_loop_exit(env);
  }
  
  void helper_reset_rf(void)
@@ -4751,16 +4817,6 @@ void helper_boundl(target_ulong a0, int v)
      }
  }
  
-static float approx_rsqrt(float a)
-{
-    return 1.0 / sqrt(a);
-}
-
-static float approx_rcp(float a)
-{
-    return 1.0 / a;
-}
-
  #if !defined(CONFIG_USER_ONLY)
  
  #define MMUSUFFIX _mmu
@@ -4805,7 +4861,7 @@ void tlb_fill(target_ulong addr, int is_write, int mmu_idx, void *retaddr)
              if (tb) {
                  /* the PC is inside the translated code. It means that we have
                     a virtual CPU fault */
-                cpu_restore_state(tb, env, pc, NULL);
+                cpu_restore_state(tb, env, pc);
              }
          }
          raise_exception_err(env->exception_index, env->error_code);
@@ -4849,6 +4905,10 @@ void helper_svm_check_intercept_param(uint32_t type, uint64_t param)
  {
  }
  
+void svm_check_intercept(CPUState *env1, uint32_t type)
+{
+}
+
  void helper_svm_check_io(uint32_t port, uint32_t param, 
                           uint32_t next_eip_addend)
  {
@@ -5030,7 +5090,7 @@ void helper_vmrun(int aflag, int next_eip_addend)
                  env->exception_next_eip = -1;
                  qemu_log_mask(CPU_LOG_TB_IN_ASM, "INTR");
                  /* XXX: is it always correct ? */
-                do_interrupt(vector, 0, 0, 0, 1);
+                do_interrupt_all(vector, 0, 0, 0, 1);
                  break;
          case SVM_EVTINJ_TYPE_NMI:
                  env->exception_index = EXCP02_NMI;
@@ -5038,7 +5098,7 @@ void helper_vmrun(int aflag, int next_eip_addend)
                  env->exception_is_int = 0;
                  env->exception_next_eip = EIP;
                  qemu_log_mask(CPU_LOG_TB_IN_ASM, "NMI");
-                cpu_loop_exit();
+                cpu_loop_exit(env);
                  break;
          case SVM_EVTINJ_TYPE_EXEPT:
                  env->exception_index = vector;
@@ -5046,7 +5106,7 @@ void helper_vmrun(int aflag, int next_eip_addend)
                  env->exception_is_int = 0;
                  env->exception_next_eip = -1;
                  qemu_log_mask(CPU_LOG_TB_IN_ASM, "EXEPT");
-                cpu_loop_exit();
+                cpu_loop_exit(env);
                  break;
          case SVM_EVTINJ_TYPE_SOFT:
                  env->exception_index = vector;
@@ -5054,7 +5114,7 @@ void helper_vmrun(int aflag, int next_eip_addend)
                  env->exception_is_int = 1;
                  env->exception_next_eip = EIP;
                  qemu_log_mask(CPU_LOG_TB_IN_ASM, "SOFT");
-                cpu_loop_exit();
+                cpu_loop_exit(env);
                  break;
          }
          qemu_log_mask(CPU_LOG_TB_IN_ASM, " %#x %#x\n", env->exception_index, env->error_code);
@@ -5209,7 +5269,7 @@ void helper_svm_check_intercept_param(uint32_t type, uint64_t param)
              switch((uint32_t)ECX) {
              case 0 ... 0x1fff:
                  t0 = (ECX * 2) % 8;
-                t1 = ECX / 8;
+                t1 = (ECX * 2) / 8;
                  break;
              case 0xc0000000 ... 0xc0001fff:
                  t0 = (8192 + ECX - 0xc0000000) * 2;
@@ -5239,6 +5299,16 @@ void helper_svm_check_intercept_param(uint32_t type, uint64_t param)
      }
  }
  
+void svm_check_intercept(CPUState *env1, uint32_t type)
+{
+    CPUState *saved_env;
+
+    saved_env = env;
+    env = env1;
+    helper_svm_check_intercept_param(type, 0);
+    env = saved_env;
+}
+
  void helper_svm_check_io(uint32_t port, uint32_t param, 
                           uint32_t next_eip_addend)
  {
@@ -5360,6 +5430,7 @@ void helper_vmexit(uint32_t exit_code, uint64_t exit_info_1)
               ldl_phys(env->vm_vmcb + offsetof(struct vmcb, control.event_inj)));
      stl_phys(env->vm_vmcb + offsetof(struct vmcb, control.exit_int_info_err),
               ldl_phys(env->vm_vmcb + offsetof(struct vmcb, control.event_inj_err)));
+    stl_phys(env->vm_vmcb + offsetof(struct vmcb, control.event_inj), 0);
  
      env->hflags2 &= ~HF2_GIF_MASK;
      /* FIXME: Resets the current ASID register to zero (host ASID). */
@@ -5389,7 +5460,7 @@ void helper_vmexit(uint32_t exit_code, uint64_t exit_info_1)
      env->error_code = 0;
      env->old_exception = -1;
  
-    cpu_loop_exit();
+    cpu_loop_exit(env);
  }
  
  #endif
@@ -5457,11 +5528,14 @@ target_ulong helper_bsf(target_ulong t0)
      return count;
  }
  
-target_ulong helper_bsr(target_ulong t0)
+target_ulong helper_lzcnt(target_ulong t0, int wordsize)
  {
      int count;
      target_ulong res, mask;
-    
+
+    if (wordsize > 0 && t0 == 0) {
+        return wordsize;
+    }
      res = t0;
      count = TARGET_LONG_BITS - 1;
      mask = (target_ulong)1 << (TARGET_LONG_BITS - 1);
@@ -5469,9 +5543,16 @@ target_ulong helper_bsr(target_ulong t0)
          count--;
          res <<= 1;
      }
+    if (wordsize > 0) {
+        return wordsize - 1 - count;
+    }
      return count;
  }
  
+target_ulong helper_bsr(target_ulong t0)
+{
+       return helper_lzcnt(t0, 0);
+}
  
  static int compute_all_eflags(void)
  {
@@ -5554,6 +5635,18 @@ uint32_t helper_cc_compute_all(int op)
      }
  }
  
+uint32_t cpu_cc_compute_all(CPUState *env1, int op)
+{
+    CPUState *saved_env;
+    uint32_t ret;
+
+    saved_env = env;
+    env = env1;
+    ret = helper_cc_compute_all(op);
+    env = saved_env;
+    return ret;
+}
+
  uint32_t helper_cc_compute_c(int op)
  {
      switch (op) {