Use rem[u]_i32/div[u]_i32, drop div[u]2_i32


git-svn-id: svn://svn.savannah.nongnu.org/qemu/trunk@4722 c046a42c-6fe2-441c-8c8c-71466251a162
diff --git a/tcg/ppc/tcg-target.c b/tcg/ppc/tcg-target.c
index 9b5c6d6..0fd8e4b 100644
--- a/tcg/ppc/tcg-target.c
+++ b/tcg/ppc/tcg-target.c
@@ -23,8 +23,6 @@
  */
 
 static uint8_t *tb_ret_addr;
-static uint8_t *udiv_addr;
-static uint8_t *div_addr;
 
 #define FAST_PATH
 #if TARGET_PHYS_ADDR_BITS <= 32
@@ -137,22 +135,6 @@
     TCG_REG_R31
 };
 
-static const int div_save_regs[] = {
-    TCG_REG_R4,
-    TCG_REG_R5,
-    TCG_REG_R7,
-    TCG_REG_R8,
-    TCG_REG_R9,
-    TCG_REG_R10,
-    TCG_REG_R11,
-    TCG_REG_R12,
-    TCG_REG_R13,                /* should r13 be saved? */
-    TCG_REG_R24,
-    TCG_REG_R25,
-    TCG_REG_R26,
-    TCG_REG_R27,
-};
-
 static uint32_t reloc_pc24_val (void *pc, tcg_target_long target)
 {
     tcg_target_long disp;
@@ -817,22 +799,6 @@
 #endif
 }
 
-static uint64_t ppc_udiv_helper (uint64_t a, uint32_t b)
-{
-    uint64_t rem, quo;
-    quo = a / b;
-    rem = a % b;
-    return (rem << 32) | (uint32_t) quo;
-}
-
-static uint64_t ppc_div_helper (int64_t a, int32_t b)
-{
-    int64_t rem, quo;
-    quo = a / b;
-    rem = a % b;
-    return (rem << 32) | (uint32_t) quo;
-}
-
 void tcg_target_qemu_prologue (TCGContext *s)
 {
     int i, j, frame_size;
@@ -871,49 +837,6 @@
     tcg_out32 (s, MTSPR | RS (0) | LR);
     tcg_out32 (s, ADDI | RT (1) | RA (1) | frame_size);
     tcg_out32 (s, BCLR | BO_ALWAYS);
-
-    /* div trampolines */
-    for (j = 0; j < 2; ++j) {
-        tcg_target_long target;
-
-        frame_size = 8 + ARRAY_SIZE (div_save_regs) * 4;
-        frame_size = (frame_size + 15) & ~15;
-
-        if (j == 0) {
-            target = (tcg_target_long) ppc_udiv_helper;
-            udiv_addr = s->code_ptr;
-        }
-        else {
-            target = (tcg_target_long) ppc_div_helper;
-            div_addr = s->code_ptr;
-        }
-
-        tcg_out32 (s, MFSPR | RT (0) | LR);
-        tcg_out32 (s, STWU | RS (1) | RA (1) | (-frame_size & 0xffff));
-        for (i = 0; i < ARRAY_SIZE (div_save_regs); ++i)
-            tcg_out32 (s, (STW
-                           | RS (div_save_regs[i])
-                           | RA (1)
-                           | (i * 4 + 8)
-                           )
-                );
-        tcg_out32 (s, STW | RS (0) | RA (1) | (frame_size - 4));
-        tcg_out_mov (s, 4, 6);
-        tcg_out_b (s, LK, target);
-        tcg_out_mov (s, 6, 4);
-
-        for (i = 0; i < ARRAY_SIZE (div_save_regs); ++i)
-            tcg_out32 (s, (LWZ
-                           | RT (div_save_regs[i])
-                           | RA (1)
-                           | (i * 4 + 8)
-                           )
-                );
-        tcg_out32 (s, LWZ | RT (0) | RA (1) | (frame_size - 4));
-        tcg_out32 (s, MTSPR | RS (0) | LR);
-        tcg_out32 (s, ADDI | RT (1) | RA (1) | frame_size);
-        tcg_out32 (s, BCLR | BO_ALWAYS);
-    }
 }
 
 static void tcg_out_ld (TCGContext *s, TCGType type, int ret, int arg1,
@@ -1095,34 +1018,6 @@
     tcg_out_label(s, label_next, (tcg_target_long)s->code_ptr);
 }
 
-static void tcg_out_div2 (TCGContext *s, int uns)
-{
-    void *label1_ptr, *label2_ptr;
-
-    if (uns)
-        tcg_out32 (s, CMPLI | BF (7) | RA (3));
-    else {
-        tcg_out32 (s, SRAWI | RS (4) | RA (0) | 31);
-        tcg_out32 (s, CMPL | BF (7) | RA (3) | RB (4));
-    }
-
-    label1_ptr = s->code_ptr;
-    tcg_out32 (s, BC | BI (7, CR_EQ) | BO_COND_TRUE);
-
-    tcg_out_b (s, LK, (tcg_target_long) (uns ? udiv_addr : div_addr));
-
-    label2_ptr = s->code_ptr;
-    tcg_out32 (s, B);
-
-    reloc_pc14 (label1_ptr, (tcg_target_long) s->code_ptr);
-
-    tcg_out32 (s, (uns ? DIVWU : DIVW) | TAB (6, 4, 5));
-    tcg_out32 (s, MULLW | TAB (0, 6, 5));
-    tcg_out32 (s, SUBF | TAB (3, 0, 4));
-
-    reloc_pc24 (label2_ptr, (tcg_target_long) s->code_ptr);
-}
-
 static void tcg_out_op(TCGContext *s, int opc, const TCGArg *args,
                        const int *const_args)
 {
@@ -1301,6 +1196,27 @@
         else
             tcg_out32 (s, MULLW | TAB (args[0], args[1], args[2]));
         break;
+
+    case INDEX_op_div_i32:
+        tcg_out32 (s, DIVW | TAB (args[0], args[1], args[2]));
+        break;
+
+    case INDEX_op_divu_i32:
+        tcg_out32 (s, DIVWU | TAB (args[0], args[1], args[2]));
+        break;
+
+    case INDEX_op_rem_i32:
+        tcg_out32 (s, DIVW | TAB (0, args[1], args[2]));
+        tcg_out32 (s, MULLW | TAB (0, 0, args[2]));
+        tcg_out32 (s, SUBF | TAB (args[0], 0, args[1]));
+        break;
+
+    case INDEX_op_remu_i32:
+        tcg_out32 (s, DIVWU | TAB (0, args[1], args[2]));
+        tcg_out32 (s, MULLW | TAB (0, 0, args[2]));
+        tcg_out32 (s, SUBF | TAB (args[0], 0, args[1]));
+        break;
+
     case INDEX_op_mulu2_i32:
         if (args[0] == args[2] || args[0] == args[3]) {
             tcg_out32 (s, MULLW | TAB (0, args[2], args[3]));
@@ -1312,12 +1228,6 @@
             tcg_out32 (s, MULHWU | TAB (args[1], args[2], args[3]));
         }
         break;
-    case INDEX_op_div2_i32:
-        tcg_out_div2 (s, 0);
-        break;
-    case INDEX_op_divu2_i32:
-        tcg_out_div2 (s, 1);
-        break;
 
     case INDEX_op_shl_i32:
         if (const_args[2]) {
@@ -1458,9 +1368,11 @@
 
     { INDEX_op_add_i32, { "r", "r", "ri" } },
     { INDEX_op_mul_i32, { "r", "r", "ri" } },
+    { INDEX_op_div_i32, { "r", "r", "r" } },
+    { INDEX_op_divu_i32, { "r", "r", "r" } },
+    { INDEX_op_rem_i32, { "r", "r", "r" } },
+    { INDEX_op_remu_i32, { "r", "r", "r" } },
     { INDEX_op_mulu2_i32, { "r", "r", "r", "r" } },
-    { INDEX_op_div2_i32, { "D", "A", "B", "1", "C" } },
-    { INDEX_op_divu2_i32, { "D", "A", "B", "1", "C" } },
     { INDEX_op_sub_i32, { "r", "r", "ri" } },
     { INDEX_op_and_i32, { "r", "r", "ri" } },
     { INDEX_op_or_i32, { "r", "r", "ri" } },
diff --git a/tcg/ppc/tcg-target.h b/tcg/ppc/tcg-target.h
index e7a1c2a..db1b121 100644
--- a/tcg/ppc/tcg-target.h
+++ b/tcg/ppc/tcg-target.h
@@ -70,6 +70,7 @@
 
 /* optional instructions */
 #define TCG_TARGET_HAS_neg_i32
+#define TCG_TARGET_HAS_div_i32
 
 #define TCG_AREG0 TCG_REG_R27
 #define TCG_AREG1 TCG_REG_R24