target-ppc: add vabsdu[b,h,w] instructions

[mirror_qemu.git] / target-ppc / int_helper.c
diff --git a/target-ppc/int_helper.c b/target-ppc/int_helper.c

index e83a25d05a133371ed4a598c4ea9c0f1238b694c..ef487d0b9c122c02d273595cd998f92c6663985f 100644 (file)
--- a/target-ppc/int_helper.c
+++ b/target-ppc/int_helper.c
@@ -16,41 +16,16 @@
   * You should have received a copy of the GNU Lesser General Public
   * License along with this library; if not, see <http://www.gnu.org/licenses/>.
   */
+#include "qemu/osdep.h"
  #include "cpu.h"
+#include "exec/exec-all.h"
  #include "qemu/host-utils.h"
  #include "exec/helper-proto.h"
-#include "qemu/aes.h"
+#include "crypto/aes.h"
  
  #include "helper_regs.h"
  /*****************************************************************************/
  /* Fixed point operations helpers */
-#if defined(TARGET_PPC64)
-
-uint64_t helper_mulldo(CPUPPCState *env, uint64_t arg1, uint64_t arg2)
-{
-    int64_t th;
-    uint64_t tl;
-
-    muls64(&tl, (uint64_t *)&th, arg1, arg2);
-
-    /* th should either contain all 1 bits or all 0 bits and should
-     * match the sign bit of tl; otherwise we have overflowed. */
-
-    if ((int64_t)tl < 0) {
-        if (likely(th == -1LL)) {
-            env->ov = 0;
-        } else {
-            env->so = env->ov = 1;
-        }
-    } else if (likely(th == 0LL)) {
-        env->ov = 0;
-    } else {
-        env->so = env->ov = 1;
-    }
-
-    return (int64_t)tl;
-}
-#endif
  
  target_ulong helper_divweu(CPUPPCState *env, target_ulong ra, target_ulong rb,
                             uint32_t oe)
@@ -170,11 +145,43 @@ target_ulong helper_cntlzw(target_ulong t)
      return clz32(t);
  }
  
+target_ulong helper_cnttzw(target_ulong t)
+{
+    return ctz32(t);
+}
+
  #if defined(TARGET_PPC64)
+/* if x = 0xab, returns 0xababababababababa */
+#define pattern(x) (((x) & 0xff) * (~(target_ulong)0 / 0xff))
+
+/* substract 1 from each byte, and with inverse, check if MSB is set at each
+ * byte.
+ * i.e. ((0x00 - 0x01) & ~(0x00)) & 0x80
+ *      (0xFF & 0xFF) & 0x80 = 0x80 (zero found)
+ */
+#define haszero(v) (((v) - pattern(0x01)) & ~(v) & pattern(0x80))
+
+/* When you XOR the pattern and there is a match, that byte will be zero */
+#define hasvalue(x, n)  (haszero((x) ^ pattern(n)))
+
+uint32_t helper_cmpeqb(target_ulong ra, target_ulong rb)
+{
+    return hasvalue(rb, ra) ? 1 << CRF_GT : 0;
+}
+
+#undef pattern
+#undef haszero
+#undef hasvalue
+
  target_ulong helper_cntlzd(target_ulong t)
  {
      return clz64(t);
  }
+
+target_ulong helper_cnttzd(target_ulong t)
+{
+    return ctz64(t);
+}
  #endif
  
  #if defined(TARGET_PPC64)
@@ -248,7 +255,7 @@ target_ulong helper_srad(CPUPPCState *env, target_ulong value,
          if (likely((uint64_t)shift != 0)) {
              shift &= 0x3f;
              ret = (int64_t)value >> shift;
-            if (likely(ret >= 0 || (value & ((1 << shift) - 1)) == 0)) {
+            if (likely(ret >= 0 || (value & ((1ULL << shift) - 1)) == 0)) {
                  env->ca = 0;
              } else {
                  env->ca = 1;
@@ -622,6 +629,30 @@ VAVG(w, s32, int64_t, u32, uint64_t)
  #undef VAVG_DO
  #undef VAVG
  
+#define VABSDU_DO(name, element)                                        \
+void helper_v##name(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)           \
+{                                                                       \
+    int i;                                                              \
+                                                                        \
+    for (i = 0; i < ARRAY_SIZE(r->element); i++) {                      \
+        r->element[i] = (a->element[i] > b->element[i]) ?               \
+            (a->element[i] - b->element[i]) :                           \
+            (b->element[i] - a->element[i]);                            \
+    }                                                                   \
+}
+
+/* VABSDU - Vector absolute difference unsigned
+ *   name    - instruction mnemonic suffix (b: byte, h: halfword, w: word)
+ *   element - element type to access from vector
+ */
+#define VABSDU(type, element)                   \
+    VABSDU_DO(absdu##type, element)
+VABSDU(b, u8)
+VABSDU(h, u16)
+VABSDU(w, u32)
+#undef VABSDU_DO
+#undef VABSDU
+
  #define VCF(suffix, cvt, element)                                       \
      void helper_vcf##suffix(CPUPPCState *env, ppc_avr_t *r,             \
                              ppc_avr_t *b, uint32_t uim)                 \
@@ -735,7 +766,7 @@ static inline void vcmpbfp_internal(CPUPPCState *env, ppc_avr_t *r,
          int le_rel = float32_compare_quiet(a->f[i], b->f[i], &env->vec_status);
          if (le_rel == float_relation_unordered) {
              r->u32[i] = 0xc0000000;
-            /* ALL_IN does not need to be updated here.  */
+            all_in = 1;
          } else {
              float32 bneg = float32_chs(b->f[i]);
              int ge_rel = float32_compare_quiet(a->f[i], bneg, &env->vec_status);
@@ -1579,13 +1610,6 @@ void helper_vlogefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b)
      }
  }
  
-#if defined(HOST_WORDS_BIGENDIAN)
-#define LEFT 0
-#define RIGHT 1
-#else
-#define LEFT 1
-#define RIGHT 0
-#endif
  /* The specification says that the results are undefined if all of the
   * shift counts are not identical.  We check to make sure that they are
   * to conform to what real hardware appears to do.  */
@@ -1615,11 +1639,9 @@ void helper_vlogefp(CPUPPCState *env, ppc_avr_t *r, ppc_avr_t *b)
              }                                                           \
          }                                                               \
      }
-VSHIFT(l, LEFT)
-VSHIFT(r, RIGHT)
+VSHIFT(l, 1)
+VSHIFT(r, 0)
  #undef VSHIFT
-#undef LEFT
-#undef RIGHT
  
  #define VSL(suffix, element, mask)                                      \
      void helper_vsl##suffix(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)   \
@@ -2313,25 +2335,25 @@ uint32_t helper_bcdadd(ppc_avr_t *r,  ppc_avr_t *a, ppc_avr_t *b, uint32_t ps)
          if (sgna == sgnb) {
              result.u8[BCD_DIG_BYTE(0)] = bcd_preferred_sgn(sgna, ps);
              zero = bcd_add_mag(&result, a, b, &invalid, &overflow);
-            cr = (sgna > 0) ? 4 : 8;
+            cr = (sgna > 0) ? 1 << CRF_GT : 1 << CRF_LT;
          } else if (bcd_cmp_mag(a, b) > 0) {
              result.u8[BCD_DIG_BYTE(0)] = bcd_preferred_sgn(sgna, ps);
              zero = bcd_sub_mag(&result, a, b, &invalid, &overflow);
-            cr = (sgna > 0) ? 4 : 8;
+            cr = (sgna > 0) ? 1 << CRF_GT : 1 << CRF_LT;
          } else {
              result.u8[BCD_DIG_BYTE(0)] = bcd_preferred_sgn(sgnb, ps);
              zero = bcd_sub_mag(&result, b, a, &invalid, &overflow);
-            cr = (sgnb > 0) ? 4 : 8;
+            cr = (sgnb > 0) ? 1 << CRF_GT : 1 << CRF_LT;
          }
      }
  
      if (unlikely(invalid)) {
          result.u64[HI_IDX] = result.u64[LO_IDX] = -1;
-        cr = 1;
+        cr = 1 << CRF_SO;
      } else if (overflow) {
-        cr |= 1;
+        cr |= 1 << CRF_SO;
      } else if (zero) {
-        cr = 2;
+        cr = 1 << CRF_EQ;
      }
  
      *r = result;
@@ -2363,24 +2385,28 @@ void helper_vsbox(ppc_avr_t *r, ppc_avr_t *a)
  
  void helper_vcipher(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
  {
+    ppc_avr_t result;
      int i;
  
      VECTOR_FOR_INORDER_I(i, u32) {
-        r->AVRW(i) = b->AVRW(i) ^
+        result.AVRW(i) = b->AVRW(i) ^
              (AES_Te0[a->AVRB(AES_shifts[4*i + 0])] ^
               AES_Te1[a->AVRB(AES_shifts[4*i + 1])] ^
               AES_Te2[a->AVRB(AES_shifts[4*i + 2])] ^
               AES_Te3[a->AVRB(AES_shifts[4*i + 3])]);
      }
+    *r = result;
  }
  
  void helper_vcipherlast(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
  {
+    ppc_avr_t result;
      int i;
  
      VECTOR_FOR_INORDER_I(i, u8) {
-        r->AVRB(i) = b->AVRB(i) ^ (AES_Te4[a->AVRB(AES_shifts[i])] & 0xFF);
+        result.AVRB(i) = b->AVRB(i) ^ (AES_sbox[a->AVRB(AES_shifts[i])]);
      }
+    *r = result;
  }
  
  void helper_vncipher(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
@@ -2405,11 +2431,13 @@ void helper_vncipher(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
  
  void helper_vncipherlast(ppc_avr_t *r, ppc_avr_t *a, ppc_avr_t *b)
  {
+    ppc_avr_t result;
      int i;
  
      VECTOR_FOR_INORDER_I(i, u8) {
-        r->AVRB(i) = b->AVRB(i) ^ (AES_Td4[a->AVRB(AES_ishifts[i])] & 0xFF);
+        result.AVRB(i) = b->AVRB(i) ^ (AES_isbox[a->AVRB(AES_ishifts[i])]);
      }
+    *r = result;
  }
  
  #define ROTRu32(v, n) (((v) >> (n)) | ((v) << (32-n)))
@@ -2496,16 +2524,19 @@ void helper_vshasigmad(ppc_avr_t *r,  ppc_avr_t *a, uint32_t st_six)
  
  void helper_vpermxor(ppc_avr_t *r,  ppc_avr_t *a, ppc_avr_t *b, ppc_avr_t *c)
  {
+    ppc_avr_t result;
      int i;
+
      VECTOR_FOR_INORDER_I(i, u8) {
          int indexA = c->u8[i] >> 4;
          int indexB = c->u8[i] & 0xF;
  #if defined(HOST_WORDS_BIGENDIAN)
-        r->u8[i] = a->u8[indexA] ^ b->u8[indexB];
+        result.u8[i] = a->u8[indexA] ^ b->u8[indexB];
  #else
-        r->u8[i] = a->u8[15-indexA] ^ b->u8[15-indexB];
+        result.u8[i] = a->u8[15-indexA] ^ b->u8[15-indexB];
  #endif
      }
+    *r = result;
  }
  
  #undef VECTOR_FOR_INORDER_I
@@ -2583,6 +2614,7 @@ target_ulong helper_dlmzb(CPUPPCState *env, target_ulong high,
          }
          i++;
      }
+    i = 8;
      if (update_Rc) {
          env->crf[0] = 0x2;
      }