@@ -991,24 +991,108 @@ xtensa_expand_conditional_move (rtx *operands, int isflt)
int
xtensa_expand_scc (rtx operands[4], machine_mode cmp_mode)
{
- rtx dest = operands[0];
- rtx cmp;
- rtx one_tmp, zero_tmp;
+ rtx dest = operands[0], op0 = operands[2], op1 = operands[3];
+ enum rtx_code code = GET_CODE (operands[1]);
+ rtx cmp, tmp0, tmp1;
rtx (*gen_fn) (rtx, rtx, rtx, rtx, rtx);
- if (!(cmp = gen_conditional_move (GET_CODE (operands[1]), cmp_mode,
- operands[2], operands[3])))
- return 0;
+ /* Dedicated optimizations for cstoresi4.
+ a. In a magnitude comparison operator, swapping both sides and
+ inverting magnitude does not change the result,
+ eg. '(x >= y) != (y <= x)' is a constant of zero
+ (GE is changed to LE, not LT).
+ b. Due to room for further optimization, we use subtraction rather
+ than XOR (the default for RTL expansion of EQ/NE) as the binary
+ operation which is zero if both sides are the same and non-zero
+ otherwise. */
+ if (cmp_mode == SImode)
+ switch (code)
+ {
+ /* EQ(op0, op1) := clz(op0 - op1) / 32 [requires TARGET_NSA] */
+ case EQ:
+ if (!TARGET_NSA)
+ break;
+ /* EQ to EQZ conversion by subtracting op1 from op0. */
+ emit_move_insn (dest,
+ expand_binop (SImode, sub_optab, op0, op1,
+ 0, 0, OPTAB_LIB_WIDEN));
+ /* NSAU instruction will return 32 iff the source is zero,
+ zero through 31 otherwise (See Xtensa ISA Reference Manual,
+ p. 462) */
+ emit_insn (gen_clzsi2 (dest, dest));
+ emit_insn (gen_lshrsi3 (dest, dest, GEN_INT (5)));
+ return 1;
+
+ /* NE(op0, op1) := (op0 - op1) == 0 ? 0 : 1 */
+ case NE:
+ /* NE to NEZ conversion by subtracting op1 from op0. */
+ emit_move_insn (tmp0 = gen_reg_rtx (SImode),
+ expand_binop (SImode, sub_optab, op0, op1,
+ 0, 0, OPTAB_LIB_WIDEN));
+ emit_move_insn (dest, const_true_rtx);
+ emit_move_insn (dest,
+ gen_rtx_fmt_eee (IF_THEN_ELSE, SImode,
+ gen_rtx_fmt_ee (EQ, VOIDmode,
+ tmp0, const0_rtx),
+ tmp0, dest));
+ return 1;
+
+ case LE:
+ if (REG_P (op1))
+ {
+ /* LE to GE conversion by swapping both sides. */
+ tmp0 = op0, op0 = op1, op1 = tmp0;
+ goto case_GE_reg;
+ }
+ /* LE to LT conversion by adding one to op1. */
+ op1 = GEN_INT (INTVAL (op1) + 1);
+ /* fallthru */
+
+ /* LT(op0, op1) := (unsigned)(op0 - op1) >> 31 */
+ case LT:
+case_LT:
+ /* LT to LTZ conversion by subtracting op1 from op0. */
+ emit_move_insn (dest,
+ expand_binop (SImode, sub_optab, op0, op1,
+ 0, 0, OPTAB_LIB_WIDEN));
+ emit_insn (gen_lshrsi3 (dest, dest, GEN_INT (31)));
+ return 1;
+
+ case GE:
+ if (REG_P (op1))
+ {
+case_GE_reg:
+ /* GE to GEZ conversion by subtracting op1 from op0. */
+ emit_move_insn (dest,
+ expand_binop (SImode, sub_optab, op0, op1,
+ 0, 0, OPTAB_LIB_WIDEN));
+ /* Emitting the dedicated insn pattern. */
+ emit_insn (gen_xtensa_ge_zero (dest, dest));
+ return 1;
+ }
+ /* GE to GT conversion by subtracting one from op1. */
+ op1 = GEN_INT (INTVAL (op1) - 1);
+ /* fallthru */
- one_tmp = gen_reg_rtx (SImode);
- zero_tmp = gen_reg_rtx (SImode);
- emit_insn (gen_movsi (one_tmp, const_true_rtx));
- emit_insn (gen_movsi (zero_tmp, const0_rtx));
+ case GT:
+ /* GT to LT conversion by swapping both sides. */
+ tmp0 = op0, op0 = op1, op1 = tmp0;
+ goto case_LT;
+ default:
+ break;
+ }
+
+ if (! (cmp = gen_conditional_move (code, cmp_mode, op0, op1)))
+ return 0;
+
+ tmp0 = force_reg (SImode, const0_rtx);
+ tmp1 = force_reg (SImode, const_true_rtx);
gen_fn = (cmp_mode == SImode
? gen_movsicc_internal0
: gen_movsicc_internal1);
- emit_insn (gen_fn (dest, XEXP (cmp, 0), one_tmp, zero_tmp, cmp));
+ emit_insn (gen_fn (dest, XEXP (cmp, 0), tmp1, tmp0, cmp));
+
return 1;
}
@@ -196,8 +196,8 @@
(match_operand:DI 2 "register_operand")))]
""
{
- rtx_code_label *label = gen_label_rtx ();
rtx lo_dest, hi_dest, lo_op0, hi_op0, lo_op1, hi_op1;
+ rtx_code_label *label;
lo_dest = gen_lowpart (SImode, operands[0]);
hi_dest = gen_highpart (SImode, operands[0]);
lo_op0 = gen_lowpart (SImode, operands[1]);
@@ -209,8 +209,8 @@
emit_clobber (operands[0]);
emit_insn (gen_addsi3 (lo_dest, lo_op0, lo_op1));
emit_insn (gen_addsi3 (hi_dest, hi_op0, hi_op1));
- emit_cmp_and_jump_insns (lo_dest, lo_op1, GEU,
- const0_rtx, SImode, true, label);
+ emit_cmp_and_jump_insns (lo_dest, lo_op1, GEU, const0_rtx,
+ SImode, true, label = gen_label_rtx ());
emit_insn (gen_addsi3 (hi_dest, hi_dest, const1_rtx));
emit_label (label);
DONE;
@@ -269,8 +269,8 @@
(match_operand:DI 2 "register_operand")))]
""
{
- rtx_code_label *label = gen_label_rtx ();
rtx lo_dest, hi_dest, lo_op0, hi_op0, lo_op1, hi_op1;
+ rtx_code_label *label;
lo_dest = gen_lowpart (SImode, operands[0]);
hi_dest = gen_highpart (SImode, operands[0]);
lo_op0 = gen_lowpart (SImode, operands[1]);
@@ -282,8 +282,8 @@
emit_clobber (operands[0]);
emit_insn (gen_subsi3 (lo_dest, lo_op0, lo_op1));
emit_insn (gen_subsi3 (hi_dest, hi_op0, hi_op1));
- emit_cmp_and_jump_insns (lo_op0, lo_op1, GEU,
- const0_rtx, SImode, true, label);
+ emit_cmp_and_jump_insns (lo_op0, lo_op1, GEU, const0_rtx,
+ SImode, true, label = gen_label_rtx ());
emit_insn (gen_addsi3 (hi_dest, hi_dest, constm1_rtx));
emit_label (label);
DONE;
@@ -3136,7 +3136,7 @@
(const_int 5)
(const_int 6)))])
-(define_insn_and_split "*signed_ge_zero"
+(define_insn_and_split "xtensa_ge_zero"
[(set (match_operand:SI 0 "register_operand" "=a")
(ge:SI (match_operand:SI 1 "register_operand" "r")
(const_int 0)))]