/*
 * Copyright(c) 2019-2023 Qualcomm Innovation Center, Inc. All Rights Reserved.
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, see <http://www.gnu.org/licenses/>.
 */

#include "qemu/osdep.h"
#include "cpu.h"
#include "internal.h"
#include "tcg/tcg-op.h"
#include "tcg/tcg-op-gvec.h"
#include "insn.h"
#include "opcodes.h"
#include "translate.h"
#define QEMU_GENERATE /* Used internally by macros.h */
#include "macros.h"
#include "mmvec/macros.h"
#undef QEMU_GENERATE
#include "gen_tcg.h"
#include "gen_tcg_hvx.h"
#include "genptr.h"

TCGv gen_read_reg(TCGv result, int num)
{
    tcg_gen_mov_tl(result, hex_gpr[num]);
    return result;
}

TCGv gen_read_preg(TCGv pred, uint8_t num)
{
    tcg_gen_mov_tl(pred, hex_pred[num]);
    return pred;
}

#define IMMUTABLE (~0)

static const target_ulong reg_immut_masks[TOTAL_PER_THREAD_REGS] = {
    [HEX_REG_USR] = 0xc13000c0,
    [HEX_REG_PC] = IMMUTABLE,
    [HEX_REG_GP] = 0x3f,
    [HEX_REG_UPCYCLELO] = IMMUTABLE,
    [HEX_REG_UPCYCLEHI] = IMMUTABLE,
    [HEX_REG_UTIMERLO] = IMMUTABLE,
    [HEX_REG_UTIMERHI] = IMMUTABLE,
};

static inline void gen_masked_reg_write(TCGv new_val, TCGv cur_val,
                                        target_ulong reg_mask)
{
    if (reg_mask) {
        TCGv tmp = tcg_temp_new();

        /* new_val = (new_val & ~reg_mask) | (cur_val & reg_mask) */
        tcg_gen_andi_tl(new_val, new_val, ~reg_mask);
        tcg_gen_andi_tl(tmp, cur_val, reg_mask);
        tcg_gen_or_tl(new_val, new_val, tmp);
    }
}
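
/*
 * Worked example (illustrative values): HEX_REG_GP has reg_mask 0x3f, so
 * for a write of 0xdeadbeef while GP currently holds 0x00000025:
 *     new_val = (0xdeadbeef & ~0x3f) | (0x00000025 & 0x3f)
 *             = 0xdeadbec0 | 0x25
 *             = 0xdeadbee5
 * i.e. the bits marked immutable keep their current value and only the
 * writable bits take the new value.
 */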

static TCGv get_result_gpr(DisasContext *ctx, int rnum)
{
    return hex_new_value[rnum];
}

static TCGv_i64 get_result_gpr_pair(DisasContext *ctx, int rnum)
{
    TCGv_i64 result = tcg_temp_new_i64();
    tcg_gen_concat_i32_i64(result, hex_new_value[rnum],
                                   hex_new_value[rnum + 1]);
    return result;
}

void gen_log_reg_write(int rnum, TCGv val)
{
    const target_ulong reg_mask = reg_immut_masks[rnum];

    gen_masked_reg_write(val, hex_gpr[rnum], reg_mask);
    tcg_gen_mov_tl(hex_new_value[rnum], val);
    if (HEX_DEBUG) {
        /* Do this so HELPER(debug_commit_end) will know */
        tcg_gen_movi_tl(hex_reg_written[rnum], 1);
    }
}

static void gen_log_reg_write_pair(int rnum, TCGv_i64 val)
{
    const target_ulong reg_mask_low = reg_immut_masks[rnum];
    const target_ulong reg_mask_high = reg_immut_masks[rnum + 1];
    TCGv val32 = tcg_temp_new();

    /* Low word */
    tcg_gen_extrl_i64_i32(val32, val);
    gen_masked_reg_write(val32, hex_gpr[rnum], reg_mask_low);
    tcg_gen_mov_tl(hex_new_value[rnum], val32);
    if (HEX_DEBUG) {
        /* Do this so HELPER(debug_commit_end) will know */
        tcg_gen_movi_tl(hex_reg_written[rnum], 1);
    }

    /* High word */
    tcg_gen_extrh_i64_i32(val32, val);
    gen_masked_reg_write(val32, hex_gpr[rnum + 1], reg_mask_high);
    tcg_gen_mov_tl(hex_new_value[rnum + 1], val32);
    if (HEX_DEBUG) {
        /* Do this so HELPER(debug_commit_end) will know */
        tcg_gen_movi_tl(hex_reg_written[rnum + 1], 1);
    }
}

void gen_log_pred_write(DisasContext *ctx, int pnum, TCGv val)
{
    TCGv base_val = tcg_temp_new();

    tcg_gen_andi_tl(base_val, val, 0xff);

    /*
     * Section 6.1.3 of the Hexagon V67 Programmer's Reference Manual
     *
     * Multiple writes to the same preg are and'ed together
     * If this is the first predicate write in the packet, do a
     * straight assignment.  Otherwise, do an and.
     */
    if (!test_bit(pnum, ctx->pregs_written)) {
        tcg_gen_mov_tl(hex_new_pred_value[pnum], base_val);
    } else {
        tcg_gen_and_tl(hex_new_pred_value[pnum],
                       hex_new_pred_value[pnum], base_val);
    }
    tcg_gen_ori_tl(hex_pred_written, hex_pred_written, 1 << pnum);
    set_bit(pnum, ctx->pregs_written);
}
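
/*
 * Illustrative example (assumed assembly syntax): in a packet such as
 *     { p0 = cmp.eq(r0, #0); p0 = cmp.gt(r1, #10) }
 * both compares target p0, so the committed value of p0 is the bitwise
 * AND of the two results -- p0 ends up true only if both conditions hold.
 */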

static inline void gen_read_p3_0(TCGv control_reg)
{
    tcg_gen_movi_tl(control_reg, 0);
    for (int i = 0; i < NUM_PREGS; i++) {
        tcg_gen_deposit_tl(control_reg, control_reg, hex_pred[i], i * 8, 8);
    }
}

/*
 * Certain control registers require special handling on read
 *     HEX_REG_P3_0_ALIASED  aliased to the predicate registers
 *                           -> concat the 4 predicate registers together
 *     HEX_REG_PC            actual value stored in DisasContext
 *                           -> assign from ctx->base.pc_next
 *     HEX_REG_QEMU_*_CNT    changes in current TB in DisasContext
 *                           -> add current TB changes to existing reg value
 */
static inline void gen_read_ctrl_reg(DisasContext *ctx, const int reg_num,
                                     TCGv dest)
{
    if (reg_num == HEX_REG_P3_0_ALIASED) {
        gen_read_p3_0(dest);
    } else if (reg_num == HEX_REG_PC) {
        tcg_gen_movi_tl(dest, ctx->base.pc_next);
    } else if (reg_num == HEX_REG_QEMU_PKT_CNT) {
        tcg_gen_addi_tl(dest, hex_gpr[HEX_REG_QEMU_PKT_CNT],
                        ctx->num_packets);
    } else if (reg_num == HEX_REG_QEMU_INSN_CNT) {
        tcg_gen_addi_tl(dest, hex_gpr[HEX_REG_QEMU_INSN_CNT],
                        ctx->num_insns);
    } else if (reg_num == HEX_REG_QEMU_HVX_CNT) {
        tcg_gen_addi_tl(dest, hex_gpr[HEX_REG_QEMU_HVX_CNT],
                        ctx->num_hvx_insns);
    } else {
        tcg_gen_mov_tl(dest, hex_gpr[reg_num]);
    }
}

static inline void gen_read_ctrl_reg_pair(DisasContext *ctx, const int reg_num,
                                          TCGv_i64 dest)
{
    if (reg_num == HEX_REG_P3_0_ALIASED) {
        TCGv p3_0 = tcg_temp_new();
        gen_read_p3_0(p3_0);
        tcg_gen_concat_i32_i64(dest, p3_0, hex_gpr[reg_num + 1]);
    } else if (reg_num == HEX_REG_PC - 1) {
        TCGv pc = tcg_constant_tl(ctx->base.pc_next);
        tcg_gen_concat_i32_i64(dest, hex_gpr[reg_num], pc);
    } else if (reg_num == HEX_REG_QEMU_PKT_CNT) {
        TCGv pkt_cnt = tcg_temp_new();
        TCGv insn_cnt = tcg_temp_new();
        tcg_gen_addi_tl(pkt_cnt, hex_gpr[HEX_REG_QEMU_PKT_CNT],
                        ctx->num_packets);
        tcg_gen_addi_tl(insn_cnt, hex_gpr[HEX_REG_QEMU_INSN_CNT],
                        ctx->num_insns);
        tcg_gen_concat_i32_i64(dest, pkt_cnt, insn_cnt);
    } else if (reg_num == HEX_REG_QEMU_HVX_CNT) {
        TCGv hvx_cnt = tcg_temp_new();
        tcg_gen_addi_tl(hvx_cnt, hex_gpr[HEX_REG_QEMU_HVX_CNT],
                        ctx->num_hvx_insns);
        tcg_gen_concat_i32_i64(dest, hvx_cnt, hex_gpr[reg_num + 1]);
    } else {
        tcg_gen_concat_i32_i64(dest,
                               hex_gpr[reg_num],
                               hex_gpr[reg_num + 1]);
    }
}

static void gen_write_p3_0(DisasContext *ctx, TCGv control_reg)
{
    TCGv hex_p8 = tcg_temp_new();
    for (int i = 0; i < NUM_PREGS; i++) {
        tcg_gen_extract_tl(hex_p8, control_reg, i * 8, 8);
        gen_log_pred_write(ctx, i, hex_p8);
    }
}

/*
 * Certain control registers require special handling on write
 *     HEX_REG_P3_0_ALIASED  aliased to the predicate registers
 *                           -> break the value across 4 predicate registers
 *     HEX_REG_QEMU_*_CNT    changes in current TB in DisasContext
 *                           -> clear the changes
 */
static inline void gen_write_ctrl_reg(DisasContext *ctx, int reg_num,
                                      TCGv val)
{
    if (reg_num == HEX_REG_P3_0_ALIASED) {
        gen_write_p3_0(ctx, val);
    } else {
        gen_log_reg_write(reg_num, val);
        if (reg_num == HEX_REG_QEMU_PKT_CNT) {
            ctx->num_packets = 0;
        }
        if (reg_num == HEX_REG_QEMU_INSN_CNT) {
            ctx->num_insns = 0;
        }
        if (reg_num == HEX_REG_QEMU_HVX_CNT) {
            ctx->num_hvx_insns = 0;
        }
    }
}

static inline void gen_write_ctrl_reg_pair(DisasContext *ctx, int reg_num,
                                           TCGv_i64 val)
{
    if (reg_num == HEX_REG_P3_0_ALIASED) {
        TCGv result = get_result_gpr(ctx, reg_num + 1);
        TCGv val32 = tcg_temp_new();
        tcg_gen_extrl_i64_i32(val32, val);
        gen_write_p3_0(ctx, val32);
        tcg_gen_extrh_i64_i32(val32, val);
        tcg_gen_mov_tl(result, val32);
    } else {
        gen_log_reg_write_pair(reg_num, val);
        if (reg_num == HEX_REG_QEMU_PKT_CNT) {
            ctx->num_packets = 0;
            ctx->num_insns = 0;
        }
        if (reg_num == HEX_REG_QEMU_HVX_CNT) {
            ctx->num_hvx_insns = 0;
        }
    }
}

TCGv gen_get_byte(TCGv result, int N, TCGv src, bool sign)
{
    if (sign) {
        tcg_gen_sextract_tl(result, src, N * 8, 8);
    } else {
        tcg_gen_extract_tl(result, src, N * 8, 8);
    }
    return result;
}

TCGv gen_get_byte_i64(TCGv result, int N, TCGv_i64 src, bool sign)
{
    TCGv_i64 res64 = tcg_temp_new_i64();
    if (sign) {
        tcg_gen_sextract_i64(res64, src, N * 8, 8);
    } else {
        tcg_gen_extract_i64(res64, src, N * 8, 8);
    }
    tcg_gen_extrl_i64_i32(result, res64);

    return result;
}

TCGv gen_get_half(TCGv result, int N, TCGv src, bool sign)
{
    if (sign) {
        tcg_gen_sextract_tl(result, src, N * 16, 16);
    } else {
        tcg_gen_extract_tl(result, src, N * 16, 16);
    }
    return result;
}

void gen_set_half(int N, TCGv result, TCGv src)
{
    tcg_gen_deposit_tl(result, result, src, N * 16, 16);
}

void gen_set_half_i64(int N, TCGv_i64 result, TCGv src)
{
    TCGv_i64 src64 = tcg_temp_new_i64();
    tcg_gen_extu_i32_i64(src64, src);
    tcg_gen_deposit_i64(result, result, src64, N * 16, 16);
}

void gen_set_byte_i64(int N, TCGv_i64 result, TCGv src)
{
    TCGv_i64 src64 = tcg_temp_new_i64();
    tcg_gen_extu_i32_i64(src64, src);
    tcg_gen_deposit_i64(result, result, src64, N * 8, 8);
}

static inline void gen_load_locked4u(TCGv dest, TCGv vaddr, int mem_index)
{
    tcg_gen_qemu_ld32u(dest, vaddr, mem_index);
    tcg_gen_mov_tl(hex_llsc_addr, vaddr);
    tcg_gen_mov_tl(hex_llsc_val, dest);
}

static inline void gen_load_locked8u(TCGv_i64 dest, TCGv vaddr, int mem_index)
{
    tcg_gen_qemu_ld64(dest, vaddr, mem_index);
    tcg_gen_mov_tl(hex_llsc_addr, vaddr);
    tcg_gen_mov_i64(hex_llsc_val_i64, dest);
}

static inline void gen_store_conditional4(DisasContext *ctx,
                                          TCGv pred, TCGv vaddr, TCGv src)
{
    TCGLabel *fail = gen_new_label();
    TCGLabel *done = gen_new_label();
    TCGv one, zero, tmp;

    tcg_gen_brcond_tl(TCG_COND_NE, vaddr, hex_llsc_addr, fail);

    one = tcg_constant_tl(0xff);
    zero = tcg_constant_tl(0);
    tmp = tcg_temp_new();
    tcg_gen_atomic_cmpxchg_tl(tmp, hex_llsc_addr, hex_llsc_val, src,
                              ctx->mem_idx, MO_32);
    tcg_gen_movcond_tl(TCG_COND_EQ, pred, tmp, hex_llsc_val,
                       one, zero);
    tcg_gen_br(done);

    gen_set_label(fail);
    tcg_gen_movi_tl(pred, 0);

    gen_set_label(done);
    tcg_gen_movi_tl(hex_llsc_addr, ~0);
}
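
/*
 * Usage sketch (assembly syntax assumed from the Hexagon manual): the
 * load-locked/store-conditional pair implements sequences like
 *     r0 = memw_locked(r1)          // gen_load_locked4u
 *     ...
 *     memw_locked(r1, p0) = r2      // gen_store_conditional4
 * The store succeeds (p0 set to 0xff) only if the reservation address
 * still matches and the word in memory still holds the loaded value.
 */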

static inline void gen_store_conditional8(DisasContext *ctx,
                                          TCGv pred, TCGv vaddr, TCGv_i64 src)
{
    TCGLabel *fail = gen_new_label();
    TCGLabel *done = gen_new_label();
    TCGv_i64 one, zero, tmp;

    tcg_gen_brcond_tl(TCG_COND_NE, vaddr, hex_llsc_addr, fail);

    one = tcg_constant_i64(0xff);
    zero = tcg_constant_i64(0);
    tmp = tcg_temp_new_i64();
    tcg_gen_atomic_cmpxchg_i64(tmp, hex_llsc_addr, hex_llsc_val_i64, src,
                               ctx->mem_idx, MO_64);
    tcg_gen_movcond_i64(TCG_COND_EQ, tmp, tmp, hex_llsc_val_i64,
                        one, zero);
    tcg_gen_extrl_i64_i32(pred, tmp);
    tcg_gen_br(done);

    gen_set_label(fail);
    tcg_gen_movi_tl(pred, 0);

    gen_set_label(done);
    tcg_gen_movi_tl(hex_llsc_addr, ~0);
}

void gen_store32(TCGv vaddr, TCGv src, int width, uint32_t slot)
{
    tcg_gen_mov_tl(hex_store_addr[slot], vaddr);
    tcg_gen_movi_tl(hex_store_width[slot], width);
    tcg_gen_mov_tl(hex_store_val32[slot], src);
}

void gen_store1(TCGv_env cpu_env, TCGv vaddr, TCGv src, uint32_t slot)
{
    gen_store32(vaddr, src, 1, slot);
}

void gen_store1i(TCGv_env cpu_env, TCGv vaddr, int32_t src, uint32_t slot)
{
    TCGv tmp = tcg_constant_tl(src);
    gen_store1(cpu_env, vaddr, tmp, slot);
}

void gen_store2(TCGv_env cpu_env, TCGv vaddr, TCGv src, uint32_t slot)
{
    gen_store32(vaddr, src, 2, slot);
}

void gen_store2i(TCGv_env cpu_env, TCGv vaddr, int32_t src, uint32_t slot)
{
    TCGv tmp = tcg_constant_tl(src);
    gen_store2(cpu_env, vaddr, tmp, slot);
}

void gen_store4(TCGv_env cpu_env, TCGv vaddr, TCGv src, uint32_t slot)
{
    gen_store32(vaddr, src, 4, slot);
}

void gen_store4i(TCGv_env cpu_env, TCGv vaddr, int32_t src, uint32_t slot)
{
    TCGv tmp = tcg_constant_tl(src);
    gen_store4(cpu_env, vaddr, tmp, slot);
}

void gen_store8(TCGv_env cpu_env, TCGv vaddr, TCGv_i64 src, uint32_t slot)
{
    tcg_gen_mov_tl(hex_store_addr[slot], vaddr);
    tcg_gen_movi_tl(hex_store_width[slot], 8);
    tcg_gen_mov_i64(hex_store_val64[slot], src);
}

void gen_store8i(TCGv_env cpu_env, TCGv vaddr, int64_t src, uint32_t slot)
{
    TCGv_i64 tmp = tcg_constant_i64(src);
    gen_store8(cpu_env, vaddr, tmp, slot);
}

TCGv gen_8bitsof(TCGv result, TCGv value)
{
    TCGv zero = tcg_constant_tl(0);
    TCGv ones = tcg_constant_tl(0xff);
    tcg_gen_movcond_tl(TCG_COND_NE, result, value, zero, ones, zero);

    return result;
}
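
/*
 * For example, gen_8bitsof maps value 5 -> 0xff and value 0 -> 0x00,
 * matching the Hexagon convention that a predicate register holds eight
 * copies of the truth bit rather than a single 0/1.
 */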

static void gen_write_new_pc_addr(DisasContext *ctx, TCGv addr,
                                  TCGCond cond, TCGv pred)
{
    TCGLabel *pred_false = NULL;
    if (cond != TCG_COND_ALWAYS) {
        pred_false = gen_new_label();
        tcg_gen_brcondi_tl(cond, pred, 0, pred_false);
    }

    if (ctx->pkt->pkt_has_multi_cof) {
        /* If there are multiple branches in a packet, ignore the second one */
        tcg_gen_movcond_tl(TCG_COND_NE, hex_gpr[HEX_REG_PC],
                           hex_branch_taken, tcg_constant_tl(0),
                           hex_gpr[HEX_REG_PC], addr);
        tcg_gen_movi_tl(hex_branch_taken, 1);
    } else {
        tcg_gen_mov_tl(hex_gpr[HEX_REG_PC], addr);
    }

    if (cond != TCG_COND_ALWAYS) {
        gen_set_label(pred_false);
    }
}

static void gen_write_new_pc_pcrel(DisasContext *ctx, int pc_off,
                                   TCGCond cond, TCGv pred)
{
    target_ulong dest = ctx->pkt->pc + pc_off;
    if (ctx->pkt->pkt_has_multi_cof) {
        gen_write_new_pc_addr(ctx, tcg_constant_tl(dest), cond, pred);
    } else {
        /* Defer this jump to the end of the TB */
        ctx->branch_cond = TCG_COND_ALWAYS;
        if (pred != NULL) {
            ctx->branch_cond = cond;
            tcg_gen_mov_tl(hex_branch_taken, pred);
        }
        ctx->branch_dest = dest;
    }
}

void gen_set_usr_field(int field, TCGv val)
{
    tcg_gen_deposit_tl(hex_new_value[HEX_REG_USR], hex_new_value[HEX_REG_USR],
                       val,
                       reg_field_info[field].offset,
                       reg_field_info[field].width);
}

void gen_set_usr_fieldi(int field, int x)
{
    if (reg_field_info[field].width == 1) {
        target_ulong bit = 1 << reg_field_info[field].offset;
        if ((x & 1) == 1) {
            tcg_gen_ori_tl(hex_new_value[HEX_REG_USR],
                           hex_new_value[HEX_REG_USR],
                           bit);
        } else {
            tcg_gen_andi_tl(hex_new_value[HEX_REG_USR],
                            hex_new_value[HEX_REG_USR],
                            ~bit);
        }
    } else {
        TCGv val = tcg_constant_tl(x);
        gen_set_usr_field(field, val);
    }
}

static void gen_compare(TCGCond cond, TCGv res, TCGv arg1, TCGv arg2)
{
    TCGv one = tcg_constant_tl(0xff);
    TCGv zero = tcg_constant_tl(0);

    tcg_gen_movcond_tl(cond, res, arg1, arg2, one, zero);
}

static void gen_cond_jumpr(DisasContext *ctx, TCGv dst_pc,
                           TCGCond cond, TCGv pred)
{
    gen_write_new_pc_addr(ctx, dst_pc, cond, pred);
}

static void gen_cond_jumpr31(DisasContext *ctx, TCGCond cond, TCGv pred)
{
    TCGv LSB = tcg_temp_new();
    tcg_gen_andi_tl(LSB, pred, 1);
    gen_cond_jumpr(ctx, hex_gpr[HEX_REG_LR], cond, LSB);
}

static void gen_cond_jump(DisasContext *ctx, TCGCond cond, TCGv pred,
                          int pc_off)
{
    gen_write_new_pc_pcrel(ctx, pc_off, cond, pred);
}

static void gen_cmpnd_cmp_jmp(DisasContext *ctx,
                              int pnum, TCGCond cond1, TCGv arg1, TCGv arg2,
                              TCGCond cond2, int pc_off)
{
    if (ctx->insn->part1) {
        TCGv pred = tcg_temp_new();
        gen_compare(cond1, pred, arg1, arg2);
        gen_log_pred_write(ctx, pnum, pred);
    } else {
        TCGv pred = tcg_temp_new();
        tcg_gen_mov_tl(pred, hex_new_pred_value[pnum]);
        gen_cond_jump(ctx, cond2, pred, pc_off);
    }
}

static void gen_cmpnd_cmp_jmp_t(DisasContext *ctx,
                                int pnum, TCGCond cond, TCGv arg1, TCGv arg2,
                                int pc_off)
{
    gen_cmpnd_cmp_jmp(ctx, pnum, cond, arg1, arg2, TCG_COND_EQ, pc_off);
}

static void gen_cmpnd_cmp_jmp_f(DisasContext *ctx,
                                int pnum, TCGCond cond, TCGv arg1, TCGv arg2,
                                int pc_off)
{
    gen_cmpnd_cmp_jmp(ctx, pnum, cond, arg1, arg2, TCG_COND_NE, pc_off);
}

static void gen_cmpnd_cmpi_jmp_t(DisasContext *ctx,
                                 int pnum, TCGCond cond, TCGv arg1, int arg2,
                                 int pc_off)
{
    TCGv tmp = tcg_constant_tl(arg2);
    gen_cmpnd_cmp_jmp(ctx, pnum, cond, arg1, tmp, TCG_COND_EQ, pc_off);
}

static void gen_cmpnd_cmpi_jmp_f(DisasContext *ctx,
                                 int pnum, TCGCond cond, TCGv arg1, int arg2,
                                 int pc_off)
{
    TCGv tmp = tcg_constant_tl(arg2);
    gen_cmpnd_cmp_jmp(ctx, pnum, cond, arg1, tmp, TCG_COND_NE, pc_off);
}

static void gen_cmpnd_cmp_n1_jmp_t(DisasContext *ctx, int pnum, TCGCond cond,
                                   TCGv arg, int pc_off)
{
    gen_cmpnd_cmpi_jmp_t(ctx, pnum, cond, arg, -1, pc_off);
}

static void gen_cmpnd_cmp_n1_jmp_f(DisasContext *ctx, int pnum, TCGCond cond,
                                   TCGv arg, int pc_off)
{
    gen_cmpnd_cmpi_jmp_f(ctx, pnum, cond, arg, -1, pc_off);
}

static void gen_cmpnd_tstbit0_jmp(DisasContext *ctx,
                                  int pnum, TCGv arg, TCGCond cond, int pc_off)
{
    if (ctx->insn->part1) {
        TCGv pred = tcg_temp_new();
        tcg_gen_andi_tl(pred, arg, 1);
        gen_8bitsof(pred, pred);
        gen_log_pred_write(ctx, pnum, pred);
    } else {
        TCGv pred = tcg_temp_new();
        tcg_gen_mov_tl(pred, hex_new_pred_value[pnum]);
        gen_cond_jump(ctx, cond, pred, pc_off);
    }
}

static void gen_testbit0_jumpnv(DisasContext *ctx,
                                TCGv arg, TCGCond cond, int pc_off)
{
    TCGv pred = tcg_temp_new();
    tcg_gen_andi_tl(pred, arg, 1);
    gen_cond_jump(ctx, cond, pred, pc_off);
}

static void gen_jump(DisasContext *ctx, int pc_off)
{
    gen_write_new_pc_pcrel(ctx, pc_off, TCG_COND_ALWAYS, NULL);
}

static void gen_jumpr(DisasContext *ctx, TCGv new_pc)
{
    gen_write_new_pc_addr(ctx, new_pc, TCG_COND_ALWAYS, NULL);
}

static void gen_call(DisasContext *ctx, int pc_off)
{
    TCGv lr = get_result_gpr(ctx, HEX_REG_LR);
    tcg_gen_movi_tl(lr, ctx->next_PC);
    gen_write_new_pc_pcrel(ctx, pc_off, TCG_COND_ALWAYS, NULL);
}

static void gen_callr(DisasContext *ctx, TCGv new_pc)
{
    TCGv lr = get_result_gpr(ctx, HEX_REG_LR);
    tcg_gen_movi_tl(lr, ctx->next_PC);
    gen_write_new_pc_addr(ctx, new_pc, TCG_COND_ALWAYS, NULL);
}

static void gen_cond_call(DisasContext *ctx, TCGv pred,
                          TCGCond cond, int pc_off)
{
    TCGv lr = get_result_gpr(ctx, HEX_REG_LR);
    TCGv lsb = tcg_temp_new();
    TCGLabel *skip = gen_new_label();
    tcg_gen_andi_tl(lsb, pred, 1);
    gen_write_new_pc_pcrel(ctx, pc_off, cond, lsb);
    tcg_gen_brcondi_tl(cond, lsb, 0, skip);
    tcg_gen_movi_tl(lr, ctx->next_PC);
    gen_set_label(skip);
}

static void gen_cond_callr(DisasContext *ctx,
                           TCGCond cond, TCGv pred, TCGv new_pc)
{
    TCGv lsb = tcg_temp_new();
    TCGLabel *skip = gen_new_label();
    tcg_gen_andi_tl(lsb, pred, 1);
    tcg_gen_brcondi_tl(cond, lsb, 0, skip);
    gen_callr(ctx, new_pc);
    gen_set_label(skip);
}

/* frame ^= (int64_t)FRAMEKEY << 32 */
static void gen_frame_unscramble(TCGv_i64 frame)
{
    TCGv_i64 framekey = tcg_temp_new_i64();
    tcg_gen_extu_i32_i64(framekey, hex_gpr[HEX_REG_FRAMEKEY]);
    tcg_gen_shli_i64(framekey, framekey, 32);
    tcg_gen_xor_i64(frame, frame, framekey);
}
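
/*
 * Worked example (illustrative values): with FRAMEKEY = 0x12345678 and a
 * scrambled frame of 0x9a78f00ddeadbeef, unscrambling XORs the key into
 * the upper word only:
 *     0x9a78f00ddeadbeef ^ (0x12345678 << 32) = 0x884ca675deadbeef
 * so the low word (the saved FP) is untouched and the high word recovers
 * the real return address.
 */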

static void gen_load_frame(DisasContext *ctx, TCGv_i64 frame, TCGv EA)
{
    Insn *insn = ctx->insn;  /* Needed for CHECK_NOSHUF */
    CHECK_NOSHUF(EA, 8);
    tcg_gen_qemu_ld64(frame, EA, ctx->mem_idx);
}

static void gen_return(DisasContext *ctx, TCGv_i64 dst, TCGv src)
{
    /*
     * frame = *src
     * dst = frame_unscramble(frame)
     * SP = src + 8
     * PC = dst.w[1]
     */
    TCGv_i64 frame = tcg_temp_new_i64();
    TCGv r31 = tcg_temp_new();
    TCGv r29 = get_result_gpr(ctx, HEX_REG_SP);

    gen_load_frame(ctx, frame, src);
    gen_frame_unscramble(frame);
    tcg_gen_mov_i64(dst, frame);
    tcg_gen_addi_tl(r29, src, 8);
    tcg_gen_extrh_i64_i32(r31, dst);
    gen_jumpr(ctx, r31);
}

/* if (pred) dst = dealloc_return(src):raw */
static void gen_cond_return(DisasContext *ctx, TCGv_i64 dst, TCGv src,
                            TCGv pred, TCGCond cond)
{
    TCGv LSB = tcg_temp_new();
    TCGLabel *skip = gen_new_label();
    tcg_gen_andi_tl(LSB, pred, 1);

    tcg_gen_brcondi_tl(cond, LSB, 0, skip);
    gen_return(ctx, dst, src);
    gen_set_label(skip);
}

/* sub-instruction version (no RddV, so handle it manually) */
static void gen_cond_return_subinsn(DisasContext *ctx, TCGCond cond, TCGv pred)
{
    TCGv_i64 RddV = get_result_gpr_pair(ctx, HEX_REG_FP);
    gen_cond_return(ctx, RddV, hex_gpr[HEX_REG_FP], pred, cond);
    gen_log_reg_write_pair(HEX_REG_FP, RddV);
}

static void gen_endloop0(DisasContext *ctx)
{
    TCGv lpcfg = tcg_temp_new();

    GET_USR_FIELD(USR_LPCFG, lpcfg);

    /*
     * if (lpcfg == 1) {
     *     hex_new_pred_value[3] = 0xff;
     *     hex_pred_written |= 1 << 3;
     * }
     */
    TCGLabel *label1 = gen_new_label();
    tcg_gen_brcondi_tl(TCG_COND_NE, lpcfg, 1, label1);
    {
        tcg_gen_movi_tl(hex_new_pred_value[3], 0xff);
        tcg_gen_ori_tl(hex_pred_written, hex_pred_written, 1 << 3);
    }
    gen_set_label(label1);

    /*
     * if (lpcfg) {
     *     SET_USR_FIELD(USR_LPCFG, lpcfg - 1);
     * }
     */
    TCGLabel *label2 = gen_new_label();
    tcg_gen_brcondi_tl(TCG_COND_EQ, lpcfg, 0, label2);
    {
        tcg_gen_subi_tl(lpcfg, lpcfg, 1);
        SET_USR_FIELD(USR_LPCFG, lpcfg);
    }
    gen_set_label(label2);

    /*
     * If we're in a tight loop, we'll do this at the end of the TB to take
     * advantage of direct block chaining.
     */
    if (!ctx->is_tight_loop) {
        /*
         * if (hex_gpr[HEX_REG_LC0] > 1) {
         *     PC = hex_gpr[HEX_REG_SA0];
         *     hex_new_value[HEX_REG_LC0] = hex_gpr[HEX_REG_LC0] - 1;
         * }
         */
        TCGLabel *label3 = gen_new_label();
        tcg_gen_brcondi_tl(TCG_COND_LEU, hex_gpr[HEX_REG_LC0], 1, label3);
        {
            TCGv lc0 = get_result_gpr(ctx, HEX_REG_LC0);
            gen_jumpr(ctx, hex_gpr[HEX_REG_SA0]);
            tcg_gen_subi_tl(lc0, hex_gpr[HEX_REG_LC0], 1);
        }
        gen_set_label(label3);
    }
}
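
/*
 * Hardware-loop context (illustrative, assumed assembly syntax): endloop0
 * is the implicit back edge of a loop set up with something like
 *     loop0(start, #3)
 *     start:
 *         ...
 *         { ... } :endloop0
 * Each pass, LC0 counts down; while LC0 > 1 the code above redirects PC
 * to SA0 (the loop start address), and on the final pass execution falls
 * through.  The USR.LPCFG handling implements the delayed write of p3
 * requested by the software-pipelined loop setup forms (assumption:
 * sp1loop0/sp2loop0-style setup).
 */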

static void gen_endloop1(DisasContext *ctx)
{
    /*
     * if (hex_gpr[HEX_REG_LC1] > 1) {
     *     PC = hex_gpr[HEX_REG_SA1];
     *     hex_new_value[HEX_REG_LC1] = hex_gpr[HEX_REG_LC1] - 1;
     * }
     */
    TCGLabel *label = gen_new_label();
    tcg_gen_brcondi_tl(TCG_COND_LEU, hex_gpr[HEX_REG_LC1], 1, label);
    {
        TCGv lc1 = get_result_gpr(ctx, HEX_REG_LC1);
        gen_jumpr(ctx, hex_gpr[HEX_REG_SA1]);
        tcg_gen_subi_tl(lc1, hex_gpr[HEX_REG_LC1], 1);
    }
    gen_set_label(label);
}

static void gen_endloop01(DisasContext *ctx)
{
    TCGv lpcfg = tcg_temp_new();
    TCGLabel *label1 = gen_new_label();
    TCGLabel *label2 = gen_new_label();
    TCGLabel *label3 = gen_new_label();
    TCGLabel *done = gen_new_label();

    GET_USR_FIELD(USR_LPCFG, lpcfg);

    /*
     * if (lpcfg == 1) {
     *     hex_new_pred_value[3] = 0xff;
     *     hex_pred_written |= 1 << 3;
     * }
     */
    tcg_gen_brcondi_tl(TCG_COND_NE, lpcfg, 1, label1);
    {
        tcg_gen_movi_tl(hex_new_pred_value[3], 0xff);
        tcg_gen_ori_tl(hex_pred_written, hex_pred_written, 1 << 3);
    }
    gen_set_label(label1);

    /*
     * if (lpcfg) {
     *     SET_USR_FIELD(USR_LPCFG, lpcfg - 1);
     * }
     */
    tcg_gen_brcondi_tl(TCG_COND_EQ, lpcfg, 0, label2);
    {
        tcg_gen_subi_tl(lpcfg, lpcfg, 1);
        SET_USR_FIELD(USR_LPCFG, lpcfg);
    }
    gen_set_label(label2);

    /*
     * if (hex_gpr[HEX_REG_LC0] > 1) {
     *     PC = hex_gpr[HEX_REG_SA0];
     *     hex_new_value[HEX_REG_LC0] = hex_gpr[HEX_REG_LC0] - 1;
     * } else {
     *     if (hex_gpr[HEX_REG_LC1] > 1) {
     *         hex_next_pc = hex_gpr[HEX_REG_SA1];
     *         hex_new_value[HEX_REG_LC1] = hex_gpr[HEX_REG_LC1] - 1;
     *     }
     * }
     */
    tcg_gen_brcondi_tl(TCG_COND_LEU, hex_gpr[HEX_REG_LC0], 1, label3);
    {
        TCGv lc0 = get_result_gpr(ctx, HEX_REG_LC0);
        gen_jumpr(ctx, hex_gpr[HEX_REG_SA0]);
        tcg_gen_subi_tl(lc0, hex_gpr[HEX_REG_LC0], 1);
        tcg_gen_br(done);
    }
    gen_set_label(label3);
    tcg_gen_brcondi_tl(TCG_COND_LEU, hex_gpr[HEX_REG_LC1], 1, done);
    {
        TCGv lc1 = get_result_gpr(ctx, HEX_REG_LC1);
        gen_jumpr(ctx, hex_gpr[HEX_REG_SA1]);
        tcg_gen_subi_tl(lc1, hex_gpr[HEX_REG_LC1], 1);
    }
    gen_set_label(done);
}

static void gen_cmp_jumpnv(DisasContext *ctx,
                           TCGCond cond, TCGv val, TCGv src, int pc_off)
{
    TCGv pred = tcg_temp_new();
    tcg_gen_setcond_tl(cond, pred, val, src);
    gen_cond_jump(ctx, TCG_COND_EQ, pred, pc_off);
}

static void gen_cmpi_jumpnv(DisasContext *ctx,
                            TCGCond cond, TCGv val, int src, int pc_off)
{
    TCGv pred = tcg_temp_new();
    tcg_gen_setcondi_tl(cond, pred, val, src);
    gen_cond_jump(ctx, TCG_COND_EQ, pred, pc_off);
}

/* Shift left with saturation */
static void gen_shl_sat(TCGv dst, TCGv src, TCGv shift_amt)
{
    TCGv sh32 = tcg_temp_new();
    TCGv dst_sar = tcg_temp_new();
    TCGv ovf = tcg_temp_new();
    TCGv satval = tcg_temp_new();
    TCGv min = tcg_constant_tl(0x80000000);
    TCGv max = tcg_constant_tl(0x7fffffff);

    /*
     * Possible values for shift_amt are 0 .. 64
     * We need special handling for values above 31
     *
     * sh32 = shift_amt & 31;
     * dst = sh32 == shift_amt ? src : 0;
     * dst <<= sh32;
     * dst_sar = dst >> sh32;
     * satval = src < 0 ? min : max;
     * if (dst_sar != src) {
     *     usr.OVF |= 1;
     *     dst = satval;
     * }
     */

    tcg_gen_andi_tl(sh32, shift_amt, 31);
    tcg_gen_movcond_tl(TCG_COND_EQ, dst, sh32, shift_amt,
                       src, tcg_constant_tl(0));
    tcg_gen_shl_tl(dst, dst, sh32);
    tcg_gen_sar_tl(dst_sar, dst, sh32);
    tcg_gen_movcond_tl(TCG_COND_LT, satval, src, tcg_constant_tl(0), min, max);

    tcg_gen_setcond_tl(TCG_COND_NE, ovf, dst_sar, src);
    tcg_gen_shli_tl(ovf, ovf, reg_field_info[USR_OVF].offset);
    tcg_gen_or_tl(hex_new_value[HEX_REG_USR], hex_new_value[HEX_REG_USR], ovf);

    tcg_gen_movcond_tl(TCG_COND_EQ, dst, dst_sar, src, dst, satval);
}
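
/*
 * Worked example: src = 0x40000000, shift_amt = 2.  The shift produces
 * 0x00000000, and shifting that back right gives 0, which differs from
 * src, so the result saturates to 0x7fffffff (src is positive) and
 * USR.OVF is set.  With src = 0x00001234 and shift_amt = 4 the
 * round-trip matches, so the plain shifted value 0x00012340 is kept.
 */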

static void gen_sar(TCGv dst, TCGv src, TCGv shift_amt)
{
    /*
     * Shift arithmetic right
     * Robust when shift_amt is >31 bits
     */
    TCGv tmp = tcg_temp_new();
    tcg_gen_umin_tl(tmp, shift_amt, tcg_constant_tl(31));
    tcg_gen_sar_tl(dst, src, tmp);
}

/* Bidirectional shift right with saturation */
static void gen_asr_r_r_sat(TCGv RdV, TCGv RsV, TCGv RtV)
{
    TCGv shift_amt = tcg_temp_new();
    TCGLabel *positive = gen_new_label();
    TCGLabel *done = gen_new_label();

    tcg_gen_sextract_i32(shift_amt, RtV, 0, 7);
    tcg_gen_brcondi_tl(TCG_COND_GE, shift_amt, 0, positive);

    /* Negative shift amount => shift left */
    tcg_gen_neg_tl(shift_amt, shift_amt);
    gen_shl_sat(RdV, RsV, shift_amt);
    tcg_gen_br(done);

    gen_set_label(positive);
    /* Positive shift amount => shift right */
    gen_sar(RdV, RsV, shift_amt);

    gen_set_label(done);
}

/* Bidirectional shift left with saturation */
static void gen_asl_r_r_sat(TCGv RdV, TCGv RsV, TCGv RtV)
{
    TCGv shift_amt = tcg_temp_new();
    TCGLabel *positive = gen_new_label();
    TCGLabel *done = gen_new_label();

    tcg_gen_sextract_i32(shift_amt, RtV, 0, 7);
    tcg_gen_brcondi_tl(TCG_COND_GE, shift_amt, 0, positive);

    /* Negative shift amount => shift right */
    tcg_gen_neg_tl(shift_amt, shift_amt);
    gen_sar(RdV, RsV, shift_amt);
    tcg_gen_br(done);

    gen_set_label(positive);
    /* Positive shift amount => shift left */
    gen_shl_sat(RdV, RsV, shift_amt);

    gen_set_label(done);
}

static intptr_t vreg_src_off(DisasContext *ctx, int num)
{
    intptr_t offset = offsetof(CPUHexagonState, VRegs[num]);

    if (test_bit(num, ctx->vregs_select)) {
        offset = ctx_future_vreg_off(ctx, num, 1, false);
    }
    if (test_bit(num, ctx->vregs_updated_tmp)) {
        offset = ctx_tmp_vreg_off(ctx, num, 1, false);
    }
    return offset;
}

static void gen_log_vreg_write(DisasContext *ctx, intptr_t srcoff, int num,
                               VRegWriteType type)
{
    intptr_t dstoff;

    if (type != EXT_TMP) {
        dstoff = ctx_future_vreg_off(ctx, num, 1, true);
        tcg_gen_gvec_mov(MO_64, dstoff, srcoff,
                         sizeof(MMVector), sizeof(MMVector));
    } else {
        dstoff = ctx_tmp_vreg_off(ctx, num, 1, false);
        tcg_gen_gvec_mov(MO_64, dstoff, srcoff,
                         sizeof(MMVector), sizeof(MMVector));
    }
}

static void gen_log_vreg_write_pair(DisasContext *ctx, intptr_t srcoff, int num,
                                    VRegWriteType type)
{
    gen_log_vreg_write(ctx, srcoff, num ^ 0, type);
    srcoff += sizeof(MMVector);
    gen_log_vreg_write(ctx, srcoff, num ^ 1, type);
}

static intptr_t get_result_qreg(DisasContext *ctx, int qnum)
{
    return offsetof(CPUHexagonState, future_QRegs[qnum]);
}

static void gen_vreg_load(DisasContext *ctx, intptr_t dstoff, TCGv src,
                          bool aligned)
{
    TCGv_i64 tmp = tcg_temp_new_i64();
    if (aligned) {
        tcg_gen_andi_tl(src, src, ~((int32_t)sizeof(MMVector) - 1));
    }
    for (int i = 0; i < sizeof(MMVector) / 8; i++) {
        tcg_gen_qemu_ld64(tmp, src, ctx->mem_idx);
        tcg_gen_addi_tl(src, src, 8);
        tcg_gen_st_i64(tmp, cpu_env, dstoff + i * 8);
    }
}

static void gen_vreg_store(DisasContext *ctx, TCGv EA, intptr_t srcoff,
                           int slot, bool aligned)
{
    intptr_t dstoff = offsetof(CPUHexagonState, vstore[slot].data);
    intptr_t maskoff = offsetof(CPUHexagonState, vstore[slot].mask);

    if (is_gather_store_insn(ctx)) {
        TCGv sl = tcg_constant_tl(slot);
        gen_helper_gather_store(cpu_env, EA, sl);
        return;
    }

    tcg_gen_movi_tl(hex_vstore_pending[slot], 1);
    if (aligned) {
        tcg_gen_andi_tl(hex_vstore_addr[slot], EA,
                        ~((int32_t)sizeof(MMVector) - 1));
    } else {
        tcg_gen_mov_tl(hex_vstore_addr[slot], EA);
    }
    tcg_gen_movi_tl(hex_vstore_size[slot], sizeof(MMVector));

    /* Copy the data to the vstore buffer */
    tcg_gen_gvec_mov(MO_64, dstoff, srcoff, sizeof(MMVector), sizeof(MMVector));
    /* Set the mask to all 1's */
    tcg_gen_gvec_dup_imm(MO_64, maskoff, sizeof(MMQReg), sizeof(MMQReg), ~0LL);
}

static void gen_vreg_masked_store(DisasContext *ctx, TCGv EA, intptr_t srcoff,
                                  intptr_t bitsoff, int slot, bool invert)
{
    intptr_t dstoff = offsetof(CPUHexagonState, vstore[slot].data);
    intptr_t maskoff = offsetof(CPUHexagonState, vstore[slot].mask);

    tcg_gen_movi_tl(hex_vstore_pending[slot], 1);
    tcg_gen_andi_tl(hex_vstore_addr[slot], EA,
                    ~((int32_t)sizeof(MMVector) - 1));
    tcg_gen_movi_tl(hex_vstore_size[slot], sizeof(MMVector));

    /* Copy the data to the vstore buffer */
    tcg_gen_gvec_mov(MO_64, dstoff, srcoff, sizeof(MMVector), sizeof(MMVector));
    /* Copy the mask */
    tcg_gen_gvec_mov(MO_64, maskoff, bitsoff, sizeof(MMQReg), sizeof(MMQReg));
    if (invert) {
        tcg_gen_gvec_not(MO_64, maskoff, maskoff,
                         sizeof(MMQReg), sizeof(MMQReg));
    }
}

static void vec_to_qvec(size_t size, intptr_t dstoff, intptr_t srcoff)
{
    TCGv_i64 tmp = tcg_temp_new_i64();
    TCGv_i64 word = tcg_temp_new_i64();
    TCGv_i64 bits = tcg_temp_new_i64();
    TCGv_i64 mask = tcg_temp_new_i64();
    TCGv_i64 zero = tcg_constant_i64(0);
    TCGv_i64 ones = tcg_constant_i64(~0);

    for (int i = 0; i < sizeof(MMVector) / 8; i++) {
        tcg_gen_ld_i64(tmp, cpu_env, srcoff + i * 8);
        tcg_gen_movi_i64(mask, 0);

        for (int j = 0; j < 8; j += size) {
            tcg_gen_extract_i64(word, tmp, j * 8, size * 8);
            tcg_gen_movcond_i64(TCG_COND_NE, bits, word, zero, ones, zero);
            tcg_gen_deposit_i64(mask, mask, bits, j, size);
        }

        tcg_gen_st8_i64(mask, cpu_env, dstoff + i);
    }
}
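
/*
 * For example, with size == 2 (halfword elements), each 64-bit chunk of
 * the source vector contributes four elements; a nonzero halfword sets
 * both of its bits in the predicate byte, so a chunk whose halfwords are
 * {0, 7, 0, -1} (element 0 first) produces the mask byte 0b11001100.
 */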

void probe_noshuf_load(TCGv va, int s, int mi)
{
    TCGv size = tcg_constant_tl(s);
    TCGv mem_idx = tcg_constant_tl(mi);
    gen_helper_probe_noshuf_load(cpu_env, va, size, mem_idx);
}

/*
 * Note: Since this function might branch, `val` is
 * required to be a `tcg_temp_local`.
 */
void gen_set_usr_field_if(int field, TCGv val)
{
    /* Sets the USR field if `val` is non-zero */
    if (reg_field_info[field].width == 1) {
        TCGv tmp = tcg_temp_new();
        tcg_gen_extract_tl(tmp, val, 0, reg_field_info[field].width);
        tcg_gen_shli_tl(tmp, tmp, reg_field_info[field].offset);
        tcg_gen_or_tl(hex_new_value[HEX_REG_USR],
                      hex_new_value[HEX_REG_USR],
                      tmp);
    } else {
        TCGLabel *skip_label = gen_new_label();
        tcg_gen_brcondi_tl(TCG_COND_EQ, val, 0, skip_label);
        gen_set_usr_field(field, val);
        gen_set_label(skip_label);
    }
}

void gen_sat_i32(TCGv dest, TCGv source, int width)
{
    TCGv max_val = tcg_constant_tl((1 << (width - 1)) - 1);
    TCGv min_val = tcg_constant_tl(-(1 << (width - 1)));
    tcg_gen_smin_tl(dest, source, max_val);
    tcg_gen_smax_tl(dest, dest, min_val);
}
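
/*
 * For example, gen_sat_i32 with width == 8 clamps to the signed byte
 * range [-128, 127]: a source of 300 becomes 127 and a source of -200
 * becomes -128, while anything already in range passes through unchanged.
 */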

void gen_sat_i32_ovfl(TCGv ovfl, TCGv dest, TCGv source, int width)
{
    gen_sat_i32(dest, source, width);
    tcg_gen_setcond_tl(TCG_COND_NE, ovfl, source, dest);
}

void gen_satu_i32(TCGv dest, TCGv source, int width)
{
    TCGv max_val = tcg_constant_tl((1 << width) - 1);
    TCGv zero = tcg_constant_tl(0);
    tcg_gen_movcond_tl(TCG_COND_GTU, dest, source, max_val, max_val, source);
    tcg_gen_movcond_tl(TCG_COND_LT, dest, source, zero, zero, dest);
}

void gen_satu_i32_ovfl(TCGv ovfl, TCGv dest, TCGv source, int width)
{
    gen_satu_i32(dest, source, width);
    tcg_gen_setcond_tl(TCG_COND_NE, ovfl, source, dest);
}

void gen_sat_i64(TCGv_i64 dest, TCGv_i64 source, int width)
{
    TCGv_i64 max_val = tcg_constant_i64((1LL << (width - 1)) - 1LL);
    TCGv_i64 min_val = tcg_constant_i64(-(1LL << (width - 1)));
    tcg_gen_smin_i64(dest, source, max_val);
    tcg_gen_smax_i64(dest, dest, min_val);
}

void gen_sat_i64_ovfl(TCGv ovfl, TCGv_i64 dest, TCGv_i64 source, int width)
{
    TCGv_i64 ovfl_64;
    gen_sat_i64(dest, source, width);
    ovfl_64 = tcg_temp_new_i64();
    tcg_gen_setcond_i64(TCG_COND_NE, ovfl_64, dest, source);
    tcg_gen_trunc_i64_tl(ovfl, ovfl_64);
}

void gen_satu_i64(TCGv_i64 dest, TCGv_i64 source, int width)
{
    TCGv_i64 max_val = tcg_constant_i64((1LL << width) - 1LL);
    TCGv_i64 zero = tcg_constant_i64(0);
    tcg_gen_movcond_i64(TCG_COND_GTU, dest, source, max_val, max_val, source);
    tcg_gen_movcond_i64(TCG_COND_LT, dest, source, zero, zero, dest);
}

void gen_satu_i64_ovfl(TCGv ovfl, TCGv_i64 dest, TCGv_i64 source, int width)
{
    TCGv_i64 ovfl_64;
    gen_satu_i64(dest, source, width);
    ovfl_64 = tcg_temp_new_i64();
    tcg_gen_setcond_i64(TCG_COND_NE, ovfl_64, dest, source);
    tcg_gen_trunc_i64_tl(ovfl, ovfl_64);
}

/* Implements the fADDSAT64 macro in TCG */
void gen_add_sat_i64(TCGv_i64 ret, TCGv_i64 a, TCGv_i64 b)
{
    TCGv_i64 sum = tcg_temp_new_i64();
    TCGv_i64 xor = tcg_temp_new_i64();
    TCGv_i64 cond1 = tcg_temp_new_i64();
    TCGv_i64 cond2 = tcg_temp_new_i64();
    TCGv_i64 cond3 = tcg_temp_new_i64();
    TCGv_i64 mask = tcg_constant_i64(0x8000000000000000ULL);
    TCGv_i64 max_pos = tcg_constant_i64(0x7FFFFFFFFFFFFFFFLL);
    TCGv_i64 max_neg = tcg_constant_i64(0x8000000000000000LL);
    TCGv_i64 zero = tcg_constant_i64(0);
    TCGLabel *no_ovfl_label = gen_new_label();
    TCGLabel *ovfl_label = gen_new_label();
    TCGLabel *ret_label = gen_new_label();

    tcg_gen_add_i64(sum, a, b);
    tcg_gen_xor_i64(xor, a, b);

    /* if (xor & mask) */
    tcg_gen_and_i64(cond1, xor, mask);
    tcg_gen_brcondi_i64(TCG_COND_NE, cond1, 0, no_ovfl_label);

    /* else if ((a ^ sum) & mask) */
    tcg_gen_xor_i64(cond2, a, sum);
    tcg_gen_and_i64(cond2, cond2, mask);
    tcg_gen_brcondi_i64(TCG_COND_NE, cond2, 0, ovfl_label);
    /* fallthrough to no_ovfl_label branch */

    /* if branch */
    gen_set_label(no_ovfl_label);
    tcg_gen_mov_i64(ret, sum);
    tcg_gen_br(ret_label);

    /* else if branch */
    gen_set_label(ovfl_label);
    tcg_gen_and_i64(cond3, sum, mask);
    tcg_gen_movcond_i64(TCG_COND_NE, ret, cond3, zero, max_pos, max_neg);
    SET_USR_FIELD(USR_OVF, 1);

    gen_set_label(ret_label);
}
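
/*
 * Worked example: a = 0x7fffffffffffffff, b = 1.  The operands have the
 * same sign (the xor of their sign bits is 0) but the sum's sign differs
 * from a's, so this is an overflow: ret saturates to max_pos and
 * USR.OVF is set.  Mixed-sign operands can never overflow, which is why
 * the first branch goes straight to returning the raw sum.
 */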

#include "tcg_funcs_generated.c.inc"
#include "tcg_func_table_generated.c.inc"