forked from cores/microwatt
217 lines
7.7 KiB
Diff
217 lines
7.7 KiB
Diff
[PATCH] Hack out ppc64le gcc fixed point divide instructions
|
|
|
|
This is a pretty horrible short term hack that removes hardware fixed
|
|
point divides from ppc64le gcc. It breaks VMX/VSX, but we aren't using
|
|
either on microwatt. We'll implement a hardware divide shortly and this
|
|
can go away. Please don't tell my toolchain team.
|
|
|
|
The firmware.hex file in this directory is a build of micropython using
|
|
a recent mainline gcc with this patch.
|
|
|
|
Signed-off-by: Anton Blanchard <anton@linux.ibm.com>
|
|
---
|
|
|
|
diff --git a/gcc/config/rs6000/rs6000-builtin.def b/gcc/config/rs6000/rs6000-builtin.def
|
|
index 0a2bdb79e15..02e325b73a9 100644
|
|
--- a/gcc/config/rs6000/rs6000-builtin.def
|
|
+++ b/gcc/config/rs6000/rs6000-builtin.def
|
|
@@ -1581,7 +1581,6 @@ BU_VSX_2 (VEC_MERGEH_V2DF, "mergeh_2df", CONST, vsx_mergeh_v2df)
|
|
BU_VSX_2 (VEC_MERGEH_V2DI, "mergeh_2di", CONST, vsx_mergeh_v2di)
|
|
BU_VSX_2 (XXSPLTD_V2DF, "xxspltd_2df", CONST, vsx_xxspltd_v2df)
|
|
BU_VSX_2 (XXSPLTD_V2DI, "xxspltd_2di", CONST, vsx_xxspltd_v2di)
|
|
-BU_VSX_2 (DIV_V2DI, "div_2di", CONST, vsx_div_v2di)
|
|
BU_VSX_2 (UDIV_V2DI, "udiv_2di", CONST, vsx_udiv_v2di)
|
|
BU_VSX_2 (MUL_V2DI, "mul_2di", CONST, vsx_mul_v2di)
|
|
|
|
diff --git a/gcc/config/rs6000/rs6000-c.c b/gcc/config/rs6000/rs6000-c.c
|
|
index 7f0cdc73d9b..ad0a8a74e63 100644
|
|
--- a/gcc/config/rs6000/rs6000-c.c
|
|
+++ b/gcc/config/rs6000/rs6000-c.c
|
|
@@ -1459,8 +1459,6 @@ const struct altivec_builtin_types altivec_overloaded_builtins[] = {
|
|
RS6000_BTI_V4SF, RS6000_BTI_V4SF, RS6000_BTI_V4SF, 0 },
|
|
{ VSX_BUILTIN_VEC_DIV, VSX_BUILTIN_XVDIVDP,
|
|
RS6000_BTI_V2DF, RS6000_BTI_V2DF, RS6000_BTI_V2DF, 0 },
|
|
- { VSX_BUILTIN_VEC_DIV, VSX_BUILTIN_DIV_V2DI,
|
|
- RS6000_BTI_V2DI, RS6000_BTI_V2DI, RS6000_BTI_V2DI, 0 },
|
|
{ VSX_BUILTIN_VEC_DIV, VSX_BUILTIN_UDIV_V2DI,
|
|
RS6000_BTI_unsigned_V2DI, RS6000_BTI_unsigned_V2DI, RS6000_BTI_unsigned_V2DI, 0 },
|
|
{ VSX_BUILTIN_VEC_DOUBLE, VSX_BUILTIN_XVCVSXDDP,
|
|
diff --git a/gcc/config/rs6000/rs6000-call.c b/gcc/config/rs6000/rs6000-call.c
|
|
index 832eda7cbad..1c5245c781b 100644
|
|
--- a/gcc/config/rs6000/rs6000-call.c
|
|
+++ b/gcc/config/rs6000/rs6000-call.c
|
|
@@ -5445,7 +5445,6 @@ rs6000_gimple_fold_builtin (gimple_stmt_iterator *gsi)
|
|
gsi_replace (gsi, g, true);
|
|
return true;
|
|
/* Flavors of vec_div (Integer). */
|
|
- case VSX_BUILTIN_DIV_V2DI:
|
|
case VSX_BUILTIN_UDIV_V2DI:
|
|
arg0 = gimple_call_arg (stmt, 0);
|
|
arg1 = gimple_call_arg (stmt, 1);
|
|
diff --git a/gcc/config/rs6000/rs6000.md b/gcc/config/rs6000/rs6000.md
|
|
index 9a7a1da987f..c443c2fe579 100644
|
|
--- a/gcc/config/rs6000/rs6000.md
|
|
+++ b/gcc/config/rs6000/rs6000.md
|
|
@@ -3071,45 +3071,6 @@
|
|
"maddld %0,%1,%2,%3"
|
|
[(set_attr "type" "mul")])
|
|
|
|
-(define_insn "udiv<mode>3"
|
|
- [(set (match_operand:GPR 0 "gpc_reg_operand" "=r")
|
|
- (udiv:GPR (match_operand:GPR 1 "gpc_reg_operand" "r")
|
|
- (match_operand:GPR 2 "gpc_reg_operand" "r")))]
|
|
- ""
|
|
- "div<wd>u %0,%1,%2"
|
|
- [(set_attr "type" "div")
|
|
- (set_attr "size" "<bits>")])
|
|
-
|
|
-
|
|
-;; For powers of two we can do sra[wd]i/addze for divide and then adjust for
|
|
-;; modulus. If it isn't a power of two, force operands into register and do
|
|
-;; a normal divide.
|
|
-(define_expand "div<mode>3"
|
|
- [(set (match_operand:GPR 0 "gpc_reg_operand")
|
|
- (div:GPR (match_operand:GPR 1 "gpc_reg_operand")
|
|
- (match_operand:GPR 2 "reg_or_cint_operand")))]
|
|
- ""
|
|
-{
|
|
- if (CONST_INT_P (operands[2])
|
|
- && INTVAL (operands[2]) > 0
|
|
- && exact_log2 (INTVAL (operands[2])) >= 0)
|
|
- {
|
|
- emit_insn (gen_div<mode>3_sra (operands[0], operands[1], operands[2]));
|
|
- DONE;
|
|
- }
|
|
-
|
|
- operands[2] = force_reg (<MODE>mode, operands[2]);
|
|
-})
|
|
-
|
|
-(define_insn "*div<mode>3"
|
|
- [(set (match_operand:GPR 0 "gpc_reg_operand" "=r")
|
|
- (div:GPR (match_operand:GPR 1 "gpc_reg_operand" "r")
|
|
- (match_operand:GPR 2 "gpc_reg_operand" "r")))]
|
|
- ""
|
|
- "div<wd> %0,%1,%2"
|
|
- [(set_attr "type" "div")
|
|
- (set_attr "size" "<bits>")])
|
|
-
|
|
(define_insn "div<mode>3_sra"
|
|
[(set (match_operand:GPR 0 "gpc_reg_operand" "=r")
|
|
(div:GPR (match_operand:GPR 1 "gpc_reg_operand" "r")
|
|
@@ -3170,37 +3131,6 @@
|
|
(set_attr "length" "8,12")
|
|
(set_attr "cell_micro" "not")])
|
|
|
|
-(define_expand "mod<mode>3"
|
|
- [(set (match_operand:GPR 0 "gpc_reg_operand")
|
|
- (mod:GPR (match_operand:GPR 1 "gpc_reg_operand")
|
|
- (match_operand:GPR 2 "reg_or_cint_operand")))]
|
|
- ""
|
|
-{
|
|
- int i;
|
|
- rtx temp1;
|
|
- rtx temp2;
|
|
-
|
|
- if (!CONST_INT_P (operands[2])
|
|
- || INTVAL (operands[2]) <= 0
|
|
- || (i = exact_log2 (INTVAL (operands[2]))) < 0)
|
|
- {
|
|
- if (!TARGET_MODULO)
|
|
- FAIL;
|
|
-
|
|
- operands[2] = force_reg (<MODE>mode, operands[2]);
|
|
- }
|
|
- else
|
|
- {
|
|
- temp1 = gen_reg_rtx (<MODE>mode);
|
|
- temp2 = gen_reg_rtx (<MODE>mode);
|
|
-
|
|
- emit_insn (gen_div<mode>3 (temp1, operands[1], operands[2]));
|
|
- emit_insn (gen_ashl<mode>3 (temp2, temp1, GEN_INT (i)));
|
|
- emit_insn (gen_sub<mode>3 (operands[0], operands[1], temp2));
|
|
- DONE;
|
|
- }
|
|
-})
|
|
-
|
|
;; In order to enable using a peephole2 for combining div/mod to eliminate the
|
|
;; mod, prefer putting the result of mod into a different register
|
|
(define_insn "*mod<mode>3"
|
|
diff --git a/gcc/config/rs6000/vsx.md b/gcc/config/rs6000/vsx.md
|
|
index 7633171df9c..1a2ac66bd43 100644
|
|
--- a/gcc/config/rs6000/vsx.md
|
|
+++ b/gcc/config/rs6000/vsx.md
|
|
@@ -1602,53 +1602,6 @@
|
|
"xvdiv<sd>p %x0,%x1,%x2"
|
|
[(set_attr "type" "<VStype_div>")])
|
|
|
|
-; Emulate vector with scalar for vec_div in V2DImode
|
|
-(define_insn_and_split "vsx_div_v2di"
|
|
- [(set (match_operand:V2DI 0 "vsx_register_operand" "=wa")
|
|
- (unspec:V2DI [(match_operand:V2DI 1 "vsx_register_operand" "wa")
|
|
- (match_operand:V2DI 2 "vsx_register_operand" "wa")]
|
|
- UNSPEC_VSX_DIVSD))]
|
|
- "VECTOR_MEM_VSX_P (V2DImode)"
|
|
- "#"
|
|
- "VECTOR_MEM_VSX_P (V2DImode) && !reload_completed"
|
|
- [(const_int 0)]
|
|
-{
|
|
- rtx op0 = operands[0];
|
|
- rtx op1 = operands[1];
|
|
- rtx op2 = operands[2];
|
|
- rtx op3 = gen_reg_rtx (DImode);
|
|
- rtx op4 = gen_reg_rtx (DImode);
|
|
- rtx op5 = gen_reg_rtx (DImode);
|
|
- emit_insn (gen_vsx_extract_v2di (op3, op1, GEN_INT (0)));
|
|
- emit_insn (gen_vsx_extract_v2di (op4, op2, GEN_INT (0)));
|
|
- if (TARGET_POWERPC64)
|
|
- emit_insn (gen_divdi3 (op5, op3, op4));
|
|
- else
|
|
- {
|
|
- rtx libfunc = optab_libfunc (sdiv_optab, DImode);
|
|
- rtx target = emit_library_call_value (libfunc,
|
|
- op5, LCT_NORMAL, DImode,
|
|
- op3, DImode,
|
|
- op4, DImode);
|
|
- emit_move_insn (op5, target);
|
|
- }
|
|
- emit_insn (gen_vsx_extract_v2di (op3, op1, GEN_INT (1)));
|
|
- emit_insn (gen_vsx_extract_v2di (op4, op2, GEN_INT (1)));
|
|
- if (TARGET_POWERPC64)
|
|
- emit_insn (gen_divdi3 (op3, op3, op4));
|
|
- else
|
|
- {
|
|
- rtx libfunc = optab_libfunc (sdiv_optab, DImode);
|
|
- rtx target = emit_library_call_value (libfunc,
|
|
- op3, LCT_NORMAL, DImode,
|
|
- op3, DImode,
|
|
- op4, DImode);
|
|
- emit_move_insn (op3, target);
|
|
- }
|
|
- emit_insn (gen_vsx_concat_v2di (op0, op5, op3));
|
|
- DONE;
|
|
-}
|
|
- [(set_attr "type" "div")])
|
|
|
|
(define_insn_and_split "vsx_udiv_v2di"
|
|
[(set (match_operand:V2DI 0 "vsx_register_operand" "=wa")
|
|
@@ -1668,9 +1621,6 @@
|
|
rtx op5 = gen_reg_rtx (DImode);
|
|
emit_insn (gen_vsx_extract_v2di (op3, op1, GEN_INT (0)));
|
|
emit_insn (gen_vsx_extract_v2di (op4, op2, GEN_INT (0)));
|
|
- if (TARGET_POWERPC64)
|
|
- emit_insn (gen_udivdi3 (op5, op3, op4));
|
|
- else
|
|
{
|
|
rtx libfunc = optab_libfunc (udiv_optab, DImode);
|
|
rtx target = emit_library_call_value (libfunc,
|
|
@@ -1681,9 +1631,6 @@
|
|
}
|
|
emit_insn (gen_vsx_extract_v2di (op3, op1, GEN_INT (1)));
|
|
emit_insn (gen_vsx_extract_v2di (op4, op2, GEN_INT (1)));
|
|
- if (TARGET_POWERPC64)
|
|
- emit_insn (gen_udivdi3 (op3, op3, op4));
|
|
- else
|
|
{
|
|
rtx libfunc = optab_libfunc (udiv_optab, DImode);
|
|
rtx target = emit_library_call_value (libfunc,
|