QIOChannelSocket: Implement io_writev zero copy flag & io_flush for CONFIG_LINUX

[mirror_qemu.git] / tcg / README
diff --git a/tcg/README b/tcg/README

index c30e5418a6856442933e775ec5593774e838649b..bc15cc3b32fd39037edafce4cc1cd90a82411824 100644 (file)
--- a/tcg/README
+++ b/tcg/README
@@ -101,7 +101,7 @@ This can be overridden using the following function modifiers:
    canonical locations before calling the helper.
  - TCG_CALL_NO_WRITE_GLOBALS means that the helper does not modify any globals.
    They will only be saved to their canonical location before calling helpers,
-  but they won't be reloaded afterwise.
+  but they won't be reloaded afterwards.
  - TCG_CALL_NO_SIDE_EFFECTS means that the call to the function is removed if
    the return value is not used.
  
@@ -254,6 +254,12 @@ t0 = t1 ? clz(t1) : t2
  
  t0 = t1 ? ctz(t1) : t2
  
+* ctpop_i32/i64 t0, t1
+
+t0 = number of bits set in t1
+With "ctpop" short for "count population", matching
+the function name used in include/qemu/host-utils.h.
+
  ********* Shifts/Rotates
  
  * shl_i32/i64 t0, t1, t2
@@ -295,19 +301,25 @@ ext32u_i64 t0, t1
  
  8, 16 or 32 bit sign/zero extension (both operands must have the same type)
  
-* bswap16_i32/i64 t0, t1
+* bswap16_i32/i64 t0, t1, flags
  
-16 bit byte swap on a 32/64 bit value. It assumes that the two/six high order
-bytes are set to zero.
+16 bit byte swap on the low bits of a 32/64 bit input.
+If flags & TCG_BSWAP_IZ, then t1 is known to be zero-extended from bit 15.
+If flags & TCG_BSWAP_OZ, then t0 will be zero-extended from bit 15.
+If flags & TCG_BSWAP_OS, then t0 will be sign-extended from bit 15.
+If neither TCG_BSWAP_OZ nor TCG_BSWAP_OS are set, then the bits of
+t0 above bit 15 may contain any value.
  
-* bswap32_i32/i64 t0, t1
+* bswap32_i64 t0, t1, flags
  
-32 bit byte swap on a 32/64 bit value. With a 64 bit value, it assumes that
-the four high order bytes are set to zero.
+32 bit byte swap on a 64-bit value.  The flags are the same as for bswap16,
+except they apply from bit 31 instead of bit 15.
  
-* bswap64_i64 t0, t1
+* bswap32_i32 t0, t1, flags
+* bswap64_i64 t0, t1, flags
  
-64 bit byte swap
+32/64 bit byte swap.  The flags are ignored, but still present
+for consistency with the other bswap opcodes.
  
  * discard_i32/i64 t0
  
@@ -461,7 +473,7 @@ when MTTCG is enabled.
  The guest translators should generate this opcode for all guest instructions
  which have ordering side effects.
  
-Please see docs/devel/atomics.txt for more information on memory barriers.
+Please see docs/devel/atomics.rst for more information on memory barriers.
  
  ********* 64-bit guest on 32-bit host support
  
@@ -502,6 +514,7 @@ goto_ptr opcode, emitting this op is equivalent to emitting exit_tb(0).
  
  * qemu_ld_i32/i64 t0, t1, flags, memidx
  * qemu_st_i32/i64 t0, t1, flags, memidx
+* qemu_st8_i32 t0, t1, flags, memidx
  
  Load data at the guest address t1 into t0, or store data in t0 at guest
  address t1.  The _i32/_i64 size applies to the size of the input/output
@@ -512,12 +525,16 @@ Both t0 and t1 may be split into little-endian ordered pairs of registers
  if dealing with 64-bit quantities on a 32-bit host.
  
  The memidx selects the qemu tlb index to use (e.g. user or kernel access).
-The flags are the TCGMemOp bits, selecting the sign, width, and endianness
+The flags are the MemOp bits, selecting the sign, width, and endianness
  of the memory access.
  
  For a 32-bit host, qemu_ld/st_i64 is guaranteed to only be used with a
  64-bit memory access specified in flags.
  
+For i386, qemu_st8_i32 is exactly like qemu_st_i32, except the size of
+the memory operation is known to be 8-bit.  This allows the backend to
+provide a different set of register constraints.
+
  ********* Host vector operations
  
  All of the vector ops have two parameters, TCGOP_VECL & TCGOP_VECE.
@@ -561,6 +578,10 @@ E.g. VECL=1 -> 64 << 1 -> v128, and VECE=2 -> 1 << 2 -> i32.
  
    Similarly, v0 = -v1.
  
+* abs_vec   v0, v1
+
+  Similarly, v0 = v1 < 0 ? -v1 : v1, in elements across the vector.
+
  * smin_vec:
  * umin_vec:
  
@@ -601,10 +622,11 @@ E.g. VECL=1 -> 64 << 1 -> v128, and VECE=2 -> 1 << 2 -> i32.
  
  * shri_vec   v0, v1, i2
  * sari_vec   v0, v1, i2
+* rotli_vec  v0, v1, i2
  * shrs_vec   v0, v1, s2
  * sars_vec   v0, v1, s2
  
-  Similarly for logical and arithmetic right shift.
+  Similarly for logical and arithmetic right shift, and left rotate.
  
  * shlv_vec   v0, v1, v2
  
@@ -616,13 +638,26 @@ E.g. VECL=1 -> 64 << 1 -> v128, and VECE=2 -> 1 << 2 -> i32.
  
  * shrv_vec   v0, v1, v2
  * sarv_vec   v0, v1, v2
+* rotlv_vec  v0, v1, v2
+* rotrv_vec  v0, v1, v2
  
-  Similarly for logical and arithmetic right shift.
+  Similarly for logical and arithmetic right shift, and rotates.
  
  * cmp_vec  v0, v1, v2, cond
  
    Compare vectors by element, storing -1 for true and 0 for false.
  
+* bitsel_vec v0, v1, v2, v3
+
+  Bitwise select, v0 = (v2 & v1) | (v3 & ~v1), across the entire vector.
+
+* cmpsel_vec v0, c1, c2, v3, v4, cond
+
+  Select elements based on comparison results:
+  for (i = 0; i < n; ++i) {
+    v0[i] = (c1[i] cond c2[i]) ? v3[i] : v4[i].
+  }
+
  *********
  
  Note 1: Some shortcuts are defined when the last operand is known to be
@@ -634,7 +669,7 @@ function tcg_gen_xxx(args).
  
  4) Backend
  
-tcg-target.h contains the target specific definitions. tcg-target.inc.c
+tcg-target.h contains the target specific definitions. tcg-target.c.inc
  contains the target specific code; it is #included by tcg/tcg.c, rather
  than being a standalone C file.