Commit 9259f3b0 by David Edelsohn Committed by David Edelsohn

{40x.md,603.md,6xx.md,7450.md,7xx.md,mpc.md, [...]: Change mult_compare to imul_compare.

        * config/rs6000/{40x.md,603.md,6xx.md,7450.md,7xx.md,mpc.md,
        power4.md,rios1.md,rios2.md,rs64.md}: Change mult_compare to
        imul_compare.  Add lmul_compare.
        * config/rs6000/power4.md: Bump some latencies.  Model extra cycle
        in second pair of dispatch slots.  Model stores more accurately.
        Tweak multiply model.  Add bypasses for CR instructions dependent
        on complicated compares.
        * config/rs6000/rs6000.md (mulsi3): Name imul_compare patterns.
        (muldi3): Add lmul_compare patterns.
        * config/rs6000/rs6000.c (rs6000_variable_issue): Move FPLOAD_UX
        and FPSTORE_UX to split instructions and add COMPARE,
        DELAYED_COMPARE, IMUL_COMPARE, LMUL_COMPARE, IDIV, LDIV.
        (rs6000_adjust_cost): Add IMUL_COMPARE and LMUL_COMPARE.
        (rs6000_rtx_costs): Separate POWER4 multiply case.

From-SVN: r65135
parent 7fe317e4
2003-04-01 David Edelsohn <edelsohn@gnu.org>
* config/rs6000/{40x.md,603.md,6xx.md,7450.md,7xx.md,mpc.md,
power4.md,rios1.md,rios2.md,rs64.md}: Change mult_compare to
imul_compare. Add lmul_compare.
* config/rs6000/power4.md: Bump some latencies. Model extra cycle
in second pair of dispatch slots. Model stores more accurately.
Tweak multiply model. Add bypasses for CR instructions dependent
on complicated compares.
* config/rs6000/rs6000.md (mulsi3): Name imul_compare patterns.
(muldi3): Add lmul_compare patterns.
* config/rs6000/rs6000.c (rs6000_variable_issue): Move FPLOAD_UX
and FPSTORE_UX to split instructions and add COMPARE,
DELAYED_COMPARE, IMUL_COMPARE, LMUL_COMPARE, IDIV, LDIV.
(rs6000_adjust_cost): Add IMUL_COMPARE and LMUL_COMPARE.
(rs6000_rtx_costs): Separate POWER4 multiply case.
2003-04-01 Ulrich Weigand <uweigand@de.ibm.com> 2003-04-01 Ulrich Weigand <uweigand@de.ibm.com>
* config/s390/s390.c (s390_fixup_clobbered_return_reg): * config/s390/s390.c (s390_fixup_clobbered_return_reg):
......
...@@ -46,12 +46,12 @@ ...@@ -46,12 +46,12 @@
"iu_40x,nothing,bpu_40x") "iu_40x,nothing,bpu_40x")
(define_insn_reservation "ppc403-imul" 4 (define_insn_reservation "ppc403-imul" 4
(and (eq_attr "type" "imul,imul2,imul3,mult_compare") (and (eq_attr "type" "imul,imul2,imul3,imul_compare")
(eq_attr "cpu" "ppc403")) (eq_attr "cpu" "ppc403"))
"iu_40x*4") "iu_40x*4")
(define_insn_reservation "ppc405-imul" 5 (define_insn_reservation "ppc405-imul" 5
(and (eq_attr "type" "imul,mult_compare") (and (eq_attr "type" "imul,imul_compare")
(eq_attr "cpu" "ppc405")) (eq_attr "cpu" "ppc405"))
"iu_40x*4") "iu_40x*4")
......
...@@ -60,7 +60,7 @@ ...@@ -60,7 +60,7 @@
; This takes 2 or 3 cycles ; This takes 2 or 3 cycles
(define_insn_reservation "ppc603-imul" 3 (define_insn_reservation "ppc603-imul" 3
(and (eq_attr "type" "imul,mult_compare") (and (eq_attr "type" "imul,imul_compare")
(eq_attr "cpu" "ppc603")) (eq_attr "cpu" "ppc603"))
"iu_603*2") "iu_603*2")
......
...@@ -69,17 +69,17 @@ ...@@ -69,17 +69,17 @@
"iu1_6xx|iu2_6xx") "iu1_6xx|iu2_6xx")
(define_insn_reservation "ppc604-imul" 4 (define_insn_reservation "ppc604-imul" 4
(and (eq_attr "type" "imul,imul2,imul3,mult_compare") (and (eq_attr "type" "imul,imul2,imul3,imul_compare")
(eq_attr "cpu" "ppc604")) (eq_attr "cpu" "ppc604"))
"mciu_6xx*2") "mciu_6xx*2")
(define_insn_reservation "ppc604e-imul" 2 (define_insn_reservation "ppc604e-imul" 2
(and (eq_attr "type" "imul,imul2,imul3,mult_compare") (and (eq_attr "type" "imul,imul2,imul3,imul_compare")
(eq_attr "cpu" "ppc604e")) (eq_attr "cpu" "ppc604e"))
"mciu_6xx") "mciu_6xx")
(define_insn_reservation "ppc620-imul" 5 (define_insn_reservation "ppc620-imul" 5
(and (eq_attr "type" "imul,mult_compare") (and (eq_attr "type" "imul,imul_compare")
(eq_attr "cpu" "ppc620,ppc630")) (eq_attr "cpu" "ppc620,ppc630"))
"mciu_6xx*3") "mciu_6xx*3")
...@@ -94,7 +94,7 @@ ...@@ -94,7 +94,7 @@
"mciu_6xx*3") "mciu_6xx*3")
(define_insn_reservation "ppc620-lmul" 7 (define_insn_reservation "ppc620-lmul" 7
(and (eq_attr "type" "lmul") (and (eq_attr "type" "lmul,lmul_compare")
(eq_attr "cpu" "ppc620,ppc630")) (eq_attr "cpu" "ppc620,ppc630"))
"mciu_6xx*5") "mciu_6xx*5")
......
...@@ -69,7 +69,7 @@ ...@@ -69,7 +69,7 @@
"ppc7450_du,(iu1_7450|iu2_7450|iu3_7450)") "ppc7450_du,(iu1_7450|iu2_7450|iu3_7450)")
(define_insn_reservation "ppc7450-imul" 4 (define_insn_reservation "ppc7450-imul" 4
(and (eq_attr "type" "imul,mult_compare") (and (eq_attr "type" "imul,imul_compare")
(eq_attr "cpu" "ppc7450")) (eq_attr "cpu" "ppc7450"))
"ppc7450_du,mciu_7450*2") "ppc7450_du,mciu_7450*2")
......
...@@ -64,7 +64,7 @@ ...@@ -64,7 +64,7 @@
"ppc750_du,(iu1_7xx|iu2_7xx)") "ppc750_du,(iu1_7xx|iu2_7xx)")
(define_insn_reservation "ppc750-imul" 4 (define_insn_reservation "ppc750-imul" 4
(and (eq_attr "type" "imul,mult_compare") (and (eq_attr "type" "imul,imul_compare")
(eq_attr "cpu" "ppc750,ppc7400")) (eq_attr "cpu" "ppc750,ppc7400"))
"ppc750_du,iu1_7xx*4") "ppc750_du,iu1_7xx*4")
......
...@@ -90,7 +90,7 @@ ...@@ -90,7 +90,7 @@
;; Multiply ;; Multiply
(define_insn_reservation "ppc8540_multiply" 4 (define_insn_reservation "ppc8540_multiply" 4
(and (eq_attr "type" "imul,imul2,imul3,mult_compare") (and (eq_attr "type" "imul,imul2,imul3,imul_compare")
(eq_attr "cpu" "ppc8540")) (eq_attr "cpu" "ppc8540"))
"ppc8540_decode,ppc8540_issue+ppc8540_miu_stage0,ppc8540_miu_stage1,\ "ppc8540_decode,ppc8540_issue+ppc8540_miu_stage0,ppc8540_miu_stage1,\
ppc8540_miu_stage2,ppc8540_miu_stage3,ppc8540_retire") ppc8540_miu_stage2,ppc8540_miu_stage3,ppc8540_retire")
......
...@@ -47,7 +47,7 @@ ...@@ -47,7 +47,7 @@
"iu_mpc") "iu_mpc")
(define_insn_reservation "mpccore-imul" 2 (define_insn_reservation "mpccore-imul" 2
(and (eq_attr "type" "imul,imul2,imul3,mult_compare") (and (eq_attr "type" "imul,imul2,imul3,imul_compare")
(eq_attr "cpu" "mpccore")) (eq_attr "cpu" "mpccore"))
"mciu_mpc") "mciu_mpc")
......
...@@ -35,12 +35,9 @@ ...@@ -35,12 +35,9 @@
(define_cpu_unit "du1_power4,du2_power4,du3_power4,du4_power4,du5_power4" (define_cpu_unit "du1_power4,du2_power4,du3_power4,du4_power4,du5_power4"
"power4disp") "power4disp")
(define_reservation "q1_power4" "du1_power4|du4_power4") (define_reservation "lsq_power4"
(define_reservation "q2_power4" "du2_power4|du3_power4") "(du1_power4,lsu1_power4)\
(define_reservation "q4_power4" "du1_power4|du2_power4|du3_power4|du4_power4") |(du2_power4,lsu2_power4)\
(define_reservation "lsq_power4" "(q1_power4,lsu1_power4)\
|(q2_power4,lsu2_power4)\
|(du3_power4,nothing,lsu2_power4)\ |(du3_power4,nothing,lsu2_power4)\
|(du4_power4,nothing,lsu1_power4)") |(du4_power4,nothing,lsu1_power4)")
...@@ -48,27 +45,31 @@ ...@@ -48,27 +45,31 @@
"((du1_power4+du2_power4),lsu1_power4+iu2_power4)\ "((du1_power4+du2_power4),lsu1_power4+iu2_power4)\
|((du2_power4+du3_power4),lsu2_power4+iu2_power4)\ |((du2_power4+du3_power4),lsu2_power4+iu2_power4)\
|((du3_power4+du4_power4),lsu2_power4+iu1_power4)") |((du3_power4+du4_power4),lsu2_power4+iu1_power4)")
;;; |((du2_power4+du3_power4),lsu2_power4,iu2_power4) ; |((du2_power4+du3_power4),nothing,lsu2_power4,iu2_power4)
(define_reservation "lsuxq_power4"
"(du1_power4+du2_power4+du3_power4+du4_power4),\
iu1_power4,(lsu2_power4+iu2_power4)")
(define_reservation "iq_power4" "(q1_power4,iu1_power4)\ (define_reservation "iq_power4"
|(q2_power4,iu2_power4)\ "(du1_power4,iu1_power4)\
|(du2_power4,iu2_power4)\
|(du3_power4,nothing,iu2_power4)\ |(du3_power4,nothing,iu2_power4)\
|(du4_power4,nothing,iu1_power4)") |(du4_power4,nothing,iu1_power4)")
(define_reservation "fpq_power4" "(q1_power4,fpu1_power4)\ (define_reservation "fpq_power4"
|(q2_power4,fpu2_power4)\ "(du1_power4,fpu1_power4)\
|(du2_power4,fpu2_power4)\
|(du3_power4,nothing,fpu2_power4)\ |(du3_power4,nothing,fpu2_power4)\
|(du4_power4,nothing,fpu1_power4)") |(du4_power4,nothing,fpu1_power4)")
(define_reservation "vq_power4" (define_reservation "vq_power4"
"(q4_power4,vec_power4)|(q4_power4,nothing,vec_power4)") "(du1_power4,vec_power4)\
|(du2_power4,vec_power4)\
|(du3_power4,nothing,vec_power4)\
|(du4_power4,nothing,vec_power4)")
(define_reservation "vpq_power4" (define_reservation "vpq_power4"
"(q4_power4,vecperm_power4)\ "(du1_power4,vecperm_power4)\
|(q4_power4,nothing,vecperm_power4)") |(du2_power4,vecperm_power4)\
|(du3_power4,nothing,vecperm_power4)\
|(du4_power4,nothing,vecperm_power4)")
; Dispatch slots are allocated in order conforming to program order. ; Dispatch slots are allocated in order conforming to program order.
...@@ -79,7 +80,7 @@ ...@@ -79,7 +80,7 @@
; Load/store ; Load/store
(define_insn_reservation "power4-load" 3 (define_insn_reservation "power4-load" 4 ; 3
(and (eq_attr "type" "load") (and (eq_attr "type" "load")
(eq_attr "cpu" "power4")) (eq_attr "cpu" "power4"))
"lsq_power4") "lsq_power4")
...@@ -87,9 +88,9 @@ ...@@ -87,9 +88,9 @@
(define_insn_reservation "power4-load-ext" 5 (define_insn_reservation "power4-load-ext" 5
(and (eq_attr "type" "load_ext") (and (eq_attr "type" "load_ext")
(eq_attr "cpu" "power4")) (eq_attr "cpu" "power4"))
"((du1_power4+du2_power4),lsu1_power4,nothing,nothing,iu2_power4)\ "(du1_power4+du2_power4,lsu1_power4,nothing,nothing,iu2_power4)\
|((du2_power4+du3_power4),lsu2_power4,nothing,nothing,iu2_power4)\ |(du2_power4+du3_power4,lsu2_power4,nothing,nothing,iu2_power4)\
|((du3_power4+du4_power4),lsu2_power4,nothing,nothing,iu1_power4)") |(du3_power4+du4_power4,lsu2_power4,nothing,nothing,iu1_power4)")
(define_insn_reservation "power4-load-ext-update" 5 (define_insn_reservation "power4-load-ext-update" 5
(and (eq_attr "type" "load_ext_u") (and (eq_attr "type" "load_ext_u")
...@@ -101,34 +102,30 @@ ...@@ -101,34 +102,30 @@
(and (eq_attr "type" "load_ext_ux") (and (eq_attr "type" "load_ext_ux")
(eq_attr "cpu" "power4")) (eq_attr "cpu" "power4"))
"(du1_power4+du2_power4+du3_power4+du4_power4),\ "(du1_power4+du2_power4+du3_power4+du4_power4),\
iu1_power4,(lsu2_power4+iu1_power4),nothing,nothing,iu2_power4") iu1_power4,lsu2_power4+iu1_power4,nothing,nothing,iu2_power4")
(define_insn_reservation "power4-load-update-indexed" 3 (define_insn_reservation "power4-load-update-indexed" 4 ; 3
(and (eq_attr "type" "load_ux") (and (eq_attr "type" "load_ux")
(eq_attr "cpu" "power4")) (eq_attr "cpu" "power4"))
"lsuxq_power4") "du1_power4+du2_power4+du3_power4+du4_power4,\
iu1_power4,lsu2_power4+iu2_power4")
(define_insn_reservation "power4-load-update" 3 (define_insn_reservation "power4-load-update" 4 ; 3
(and (eq_attr "type" "load_u") (and (eq_attr "type" "load_u")
(eq_attr "cpu" "power4")) (eq_attr "cpu" "power4"))
"lsuq_power4") "lsuq_power4")
(define_insn_reservation "power4-fpload" 5 (define_insn_reservation "power4-fpload" 6 ; 5
(and (eq_attr "type" "fpload") (and (eq_attr "type" "fpload")
(eq_attr "cpu" "power4")) (eq_attr "cpu" "power4"))
"lsq_power4") "lsq_power4")
(define_insn_reservation "power4-fpload-update" 5 (define_insn_reservation "power4-fpload-update" 6 ; 5
(and (eq_attr "type" "fpload_u") (and (eq_attr "type" "fpload_u,fpload_ux")
(eq_attr "cpu" "power4")) (eq_attr "cpu" "power4"))
"lsuq_power4") "lsuq_power4")
(define_insn_reservation "power4-fpload-update-indexed" 5 (define_insn_reservation "power4-vecload" 6 ; 5
(and (eq_attr "type" "fpload_ux")
(eq_attr "cpu" "power4"))
"lsuxq_power4")
(define_insn_reservation "power4-vecload" 5
(and (eq_attr "type" "vecload") (and (eq_attr "type" "vecload")
(eq_attr "cpu" "power4")) (eq_attr "cpu" "power4"))
"lsq_power4") "lsq_power4")
...@@ -136,44 +133,48 @@ ...@@ -136,44 +133,48 @@
(define_insn_reservation "power4-store" 1 (define_insn_reservation "power4-store" 1
(and (eq_attr "type" "store") (and (eq_attr "type" "store")
(eq_attr "cpu" "power4")) (eq_attr "cpu" "power4"))
"(q1_power4,lsu1_power4,iu1_power4)\ "(du1_power4,lsu1_power4,iu1_power4)\
|(q2_power4,lsu2_power4,iu2_power4)") |(du2_power4,lsu2_power4,iu2_power4)\
|(du3_power4,lsu2_power4,nothing,iu2_power4)\
|(du4_power4,lsu1_power4,nothing,iu1_power4)")
(define_insn_reservation "power4-store-update" 1 (define_insn_reservation "power4-store-update" 1
(and (eq_attr "type" "store_u") (and (eq_attr "type" "store_u")
(eq_attr "cpu" "power4")) (eq_attr "cpu" "power4"))
"lsuq_power4") "(du1_power4+du2_power4,lsu1_power4+iu2_power4,iu1_power4)\
|(du2_power4+du3_power4,lsu2_power4+iu2_power4,iu2_power4)\
|(du3_power4+du4_power4,lsu2_power4+iu1_power4,iu2_power4)\
|(du3_power4+du4_power4,lsu2_power4,iu1_power4,iu2_power4)")
(define_insn_reservation "power4-store-update-indexed" 1 (define_insn_reservation "power4-store-update-indexed" 1
(and (eq_attr "type" "store_ux") (and (eq_attr "type" "store_ux")
(eq_attr "cpu" "power4")) (eq_attr "cpu" "power4"))
"lsuxq_power4") "du1_power4+du2_power4+du3_power4+du4_power4,\
iu1_power4,lsu2_power4+iu2_power4,iu2_power4")
(define_insn_reservation "power4-fpstore" 1 (define_insn_reservation "power4-fpstore" 1
(and (eq_attr "type" "fpstore") (and (eq_attr "type" "fpstore")
(eq_attr "cpu" "power4")) (eq_attr "cpu" "power4"))
"(q1_power4,lsu1_power4,fpu1_power4)\ "(du1_power4,lsu1_power4,fpu1_power4)\
|(q2_power4,lsu2_power4,fpu2_power4)") |(du2_power4,lsu2_power4,fpu2_power4)\
|(du3_power4,lsu2_power4,nothing,fpu2_power4)\
|(du4_power4,lsu1_power4,nothing,fpu1_power4)")
(define_insn_reservation "power4-fpstore-update" 1 (define_insn_reservation "power4-fpstore-update" 1
(and (eq_attr "type" "fpstore_u") (and (eq_attr "type" "fpstore_u,fpstore_ux")
(eq_attr "cpu" "power4"))
"((du1_power4+du2_power4),(fpu1_power4+iu2_power4),lsu1_power4)\
|((du2_power4+du3_power4),(fpu2_power4+iu2_power4),lsu2_power4)\
|((du3_power4+du4_power4),(fpu2_power4+iu1_power4),lsu2_power4)")
;;;((du2_power4+du3_power4),fpu2_power4,(iu2_power4+lsu2_power4))
(define_insn_reservation "power4-fpstore-update-indexed" 1
(and (eq_attr "type" "fpstore_ux")
(eq_attr "cpu" "power4")) (eq_attr "cpu" "power4"))
"(du1_power4+du2_power4+du3_power4+du4_power4), "(du1_power4+du2_power4,lsu1_power4+iu2_power4,fpu1_power4)\
iu1_power4,fpu2_power4,(iu2_power4+lsu2_power4)") |(du2_power4+du3_power4,lsu2_power4+iu2_power4,fpu2_power4)\
|(du3_power4+du4_power4,lsu2_power4+iu1_power4,fpu2_power4)")
; |(du3_power4+du4_power4,nothing,lsu2_power4+iu1_power4,fpu2_power4)")
(define_insn_reservation "power4-vecstore" 1 (define_insn_reservation "power4-vecstore" 1
(and (eq_attr "type" "vecstore") (and (eq_attr "type" "vecstore")
(eq_attr "cpu" "power4")) (eq_attr "cpu" "power4"))
"(q1_power4,lsu1_power4,vec_power4)\ "(du1_power4,lsu1_power4,vec_power4)\
|(q2_power4,lsu2_power4,vec_power4)") |(du2_power4,lsu2_power4,vec_power4)\
|(du3_power4,lsu2_power4,nothing,vec_power4)\
|(du4_power4,lsu1_power4,nothing,vec_power4)")
; Integer latency is 2 cycles ; Integer latency is 2 cycles
...@@ -187,29 +188,65 @@ ...@@ -187,29 +188,65 @@
(eq_attr "cpu" "power4")) (eq_attr "cpu" "power4"))
"iq_power4") "iq_power4")
(define_insn_reservation "power4-compare" 4 (define_insn_reservation "power4-compare" 2
(and (eq_attr "type" "compare,delayed_compare") (and (eq_attr "type" "compare,delayed_compare")
(eq_attr "cpu" "power4")) (eq_attr "cpu" "power4"))
"((du1_power4+du2_power4),iu1_power4,iu2_power4)\ "(du1_power4+du2_power4,iu1_power4,iu2_power4)\
|((du2_power4+du3_power4),iu2_power4,iu2_power4)\ |(du2_power4+du3_power4,iu2_power4,iu2_power4)\
|((du3_power4+du4_power4),iu2_power4,iu1_power4)") |(du3_power4+du4_power4,nothing,iu2_power4,iu1_power4)")
(define_bypass 4 "power4-compare" "power4-branch,power4-crlogical,power4-delayedcr,power4-mfcr")
(define_insn_reservation "power4-lmul-cmp" 8 ; 7
(and (eq_attr "type" "lmul_compare")
(eq_attr "cpu" "power4"))
"(du1_power4+du2_power4,iu1_power4*6,iu2_power4)\
|(du2_power4+du3_power4,iu2_power4*6,iu2_power4)\
|(du3_power4+du4_power4,iu2_power4*6,iu1_power4)")
; |(du3_power4+du4_power4,nothing,iu2_power4*6,iu1_power4)")
(define_bypass 2 "power4-compare" "power4-integer") (define_bypass 10 "power4-lmul-cmp" "power4-branch,power4-crlogical,power4-delayedcr,power4-mfcr")
(define_insn_reservation "power4-imul" 7 (define_insn_reservation "power4-imul-cmp" 6 ; 5
(and (eq_attr "type" "imul,lmul,mult_compare") (and (eq_attr "type" "imul_compare")
(eq_attr "cpu" "power4")) (eq_attr "cpu" "power4"))
"(q1_power4,iu1_power4*6)|(q2_power4,iu2_power4*6)") "(du1_power4+du2_power4,iu1_power4*4,iu2_power4)\
|(du2_power4+du3_power4,iu2_power4*4,iu2_power4)\
|(du3_power4+du4_power4,iu2_power4*4,iu1_power4)")
; |(du3_power4+du4_power4,nothing,iu2_power4*4,iu1_power4)")
(define_insn_reservation "power4-imul2" 5 (define_bypass 8 "power4-imul-cmp" "power4-branch,power4-crlogical,power4-delayedcr,power4-mfcr")
(and (eq_attr "type" "imul2")
(define_insn_reservation "power4-lmul" 8 ; 7
(and (eq_attr "type" "lmul")
(eq_attr "cpu" "power4"))
"(du1_power4,iu1_power4*6)\
|(du2_power4,iu2_power4*6)\
|(du3_power4,iu2_power4*6)\
|(du4_power4,iu2_power4*6)")
; |(du3_power4,nothing,iu2_power4*6)\
; |(du4_power4,nothing,iu2_power4*6)")
(define_insn_reservation "power4-imul" 6 ; 5
(and (eq_attr "type" "imul")
(eq_attr "cpu" "power4")) (eq_attr "cpu" "power4"))
"(q1_power4,iu1_power4*4)|(q2_power4,iu2_power4*4)") "(du1_power4,iu1_power4*4)\
|(du2_power4,iu2_power4*4)\
|(du3_power4,iu2_power4*4)\
|(du4_power4,iu1_power4*4)")
; |(du3_power4,nothing,iu2_power4*4)\
; |(du4_power4,nothing,iu1_power4*4)")
(define_insn_reservation "power4-imul3" 4 (define_insn_reservation "power4-imul3" 5 ; 4
(and (eq_attr "type" "imul3") (and (eq_attr "type" "imul2,imul3")
(eq_attr "cpu" "power4")) (eq_attr "cpu" "power4"))
"(q1_power4,iu1_power4*3)|(q2_power4,iu2_power4*3)") "(du1_power4,iu1_power4*3)\
|(du2_power4,iu2_power4*3)\
|(du3_power4,iu2_power4*3)\
|(du4_power4,iu1_power4*3)")
; |(du3_power4,nothing,iu2_power4*3)\
; |(du4_power4,nothing,iu1_power4*3)")
; SPR move only executes in first IU. ; SPR move only executes in first IU.
; Integer division only executes in second IU. ; Integer division only executes in second IU.
...@@ -268,7 +305,7 @@ ...@@ -268,7 +305,7 @@
"du1_power4,iu1_power4") "du1_power4,iu1_power4")
; Basic FP latency is 6 cycles ; Basic FP latency is 6 cycles
(define_insn_reservation "power4-fp" 6 (define_insn_reservation "power4-fp" 7 ; 6
(and (eq_attr "type" "fp,dmul") (and (eq_attr "type" "fp,dmul")
(eq_attr "cpu" "power4")) (eq_attr "cpu" "power4"))
"fpq_power4") "fpq_power4")
...@@ -281,12 +318,22 @@ ...@@ -281,12 +318,22 @@
(define_insn_reservation "power4-sdiv" 33 (define_insn_reservation "power4-sdiv" 33
(and (eq_attr "type" "sdiv,ddiv") (and (eq_attr "type" "sdiv,ddiv")
(eq_attr "cpu" "power4")) (eq_attr "cpu" "power4"))
"(q1_power4,fpu1_power4*28)|(q2_power4,fpu2_power4*28)") "(du1_power4,fpu1_power4*28)\
|(du2_power4,fpu2_power4*28)\
|(du3_power4,fpu2_power4*28)\
|(du4_power4,fpu1_power4*28)")
; |(du3_power4,nothing,fpu2_power4*28)\
; |(du4_power4,nothing,fpu1_power4*28)")
(define_insn_reservation "power4-sqrt" 40 (define_insn_reservation "power4-sqrt" 40
(and (eq_attr "type" "ssqrt,dsqrt") (and (eq_attr "type" "ssqrt,dsqrt")
(eq_attr "cpu" "power4")) (eq_attr "cpu" "power4"))
"(q1_power4,fpu1_power4*35)|(q2_power4,fpu2_power4*35)") "(du1_power4,fpu1_power4*35)\
|(du2_power4,fpu2_power4*35)\
|(du3_power4,fpu2_power4*35)\
|(du4_power4,fpu2_power4*35)")
; |(du3_power4,nothing,fpu2_power4*35)\
; |(du4_power4,nothing,fpu2_power4*35)")
; VMX ; VMX
......
...@@ -56,7 +56,7 @@ ...@@ -56,7 +56,7 @@
"iu_rios1") "iu_rios1")
(define_insn_reservation "rios1-imul" 5 (define_insn_reservation "rios1-imul" 5
(and (eq_attr "type" "imul,mult_compare") (and (eq_attr "type" "imul,imul_compare")
(eq_attr "cpu" "rios1")) (eq_attr "cpu" "rios1"))
"iu_rios1*5") "iu_rios1*5")
...@@ -66,12 +66,12 @@ ...@@ -66,12 +66,12 @@
"iu_rios1*4") "iu_rios1*4")
(define_insn_reservation "rios1-imul3" 3 (define_insn_reservation "rios1-imul3" 3
(and (eq_attr "type" "imul,mult_compare") (and (eq_attr "type" "imul")
(eq_attr "cpu" "rios1")) (eq_attr "cpu" "rios1"))
"iu_rios1*3") "iu_rios1*3")
(define_insn_reservation "ppc601-imul" 5 (define_insn_reservation "ppc601-imul" 5
(and (eq_attr "type" "imul,imul2,imul3,mult_compare") (and (eq_attr "type" "imul,imul2,imul3,imul_compare")
(eq_attr "cpu" "ppc601")) (eq_attr "cpu" "ppc601"))
"iu_rios1*5") "iu_rios1*5")
......
...@@ -44,7 +44,7 @@ ...@@ -44,7 +44,7 @@
"iu1_rios2|iu2_rios2") "iu1_rios2|iu2_rios2")
(define_insn_reservation "rios2-imul" 2 (define_insn_reservation "rios2-imul" 2
(and (eq_attr "type" "imul,imul2,imul3,mult_compare") (and (eq_attr "type" "imul,imul2,imul3,imul_compare")
(eq_attr "cpu" "rios2")) (eq_attr "cpu" "rios2"))
"iu1_rios2*2") "iu1_rios2*2")
......
...@@ -12522,12 +12522,15 @@ rs6000_variable_issue (stream, verbose, insn, more) ...@@ -12522,12 +12522,15 @@ rs6000_variable_issue (stream, verbose, insn, more)
{ {
enum attr_type type = get_attr_type (insn); enum attr_type type = get_attr_type (insn);
if (type == TYPE_LOAD_EXT_U || type == TYPE_LOAD_EXT_UX if (type == TYPE_LOAD_EXT_U || type == TYPE_LOAD_EXT_UX
|| type == TYPE_LOAD_UX || type == TYPE_STORE_UX || type == TYPE_LOAD_UX || type == TYPE_STORE_UX)
|| type == TYPE_FPLOAD_UX || type == TYPE_FPSTORE_UX)
return 0; return 0;
else if (type == TYPE_LOAD_U || type == TYPE_STORE_U else if (type == TYPE_LOAD_U || type == TYPE_STORE_U
|| type == TYPE_FPLOAD_U || type == TYPE_FPSTORE_U || type == TYPE_FPLOAD_U || type == TYPE_FPSTORE_U
|| type == TYPE_LOAD_EXT || type == TYPE_DELAYED_CR) || type == TYPE_FPLOAD_UX || type == TYPE_FPSTORE_UX
|| type == TYPE_LOAD_EXT || type == TYPE_DELAYED_CR
|| type == TYPE_COMPARE || type == TYPE_DELAYED_COMPARE
|| type == TYPE_IMUL_COMPARE || type == TYPE_LMUL_COMPARE
|| type == TYPE_IDIV || type == TYPE_LDIV)
return more > 2 ? more - 2 : 0; return more > 2 ? more - 2 : 0;
} }
...@@ -12580,6 +12583,8 @@ rs6000_adjust_cost (insn, link, dep_insn, cost) ...@@ -12580,6 +12583,8 @@ rs6000_adjust_cost (insn, link, dep_insn, cost)
&& (get_attr_type (dep_insn) == TYPE_CMP && (get_attr_type (dep_insn) == TYPE_CMP
|| get_attr_type (dep_insn) == TYPE_COMPARE || get_attr_type (dep_insn) == TYPE_COMPARE
|| get_attr_type (dep_insn) == TYPE_DELAYED_COMPARE || get_attr_type (dep_insn) == TYPE_DELAYED_COMPARE
|| get_attr_type (dep_insn) == TYPE_IMUL_COMPARE
|| get_attr_type (dep_insn) == TYPE_LMUL_COMPARE
|| get_attr_type (dep_insn) == TYPE_FPCOMPARE || get_attr_type (dep_insn) == TYPE_FPCOMPARE
|| get_attr_type (dep_insn) == TYPE_CR_LOGICAL || get_attr_type (dep_insn) == TYPE_CR_LOGICAL
|| get_attr_type (dep_insn) == TYPE_DELAYED_CR)) || get_attr_type (dep_insn) == TYPE_DELAYED_CR))
...@@ -13712,7 +13717,6 @@ rs6000_rtx_costs (x, code, outer_code, total) ...@@ -13712,7 +13717,6 @@ rs6000_rtx_costs (x, code, outer_code, total)
case PROCESSOR_PPC620: case PROCESSOR_PPC620:
case PROCESSOR_PPC630: case PROCESSOR_PPC630:
case PROCESSOR_POWER4:
*total = (GET_CODE (XEXP (x, 1)) != CONST_INT *total = (GET_CODE (XEXP (x, 1)) != CONST_INT
? GET_MODE (XEXP (x, 1)) != DImode ? GET_MODE (XEXP (x, 1)) != DImode
? COSTS_N_INSNS (5) : COSTS_N_INSNS (7) ? COSTS_N_INSNS (5) : COSTS_N_INSNS (7)
...@@ -13721,6 +13725,13 @@ rs6000_rtx_costs (x, code, outer_code, total) ...@@ -13721,6 +13725,13 @@ rs6000_rtx_costs (x, code, outer_code, total)
? COSTS_N_INSNS (3) : COSTS_N_INSNS (4)); ? COSTS_N_INSNS (3) : COSTS_N_INSNS (4));
return true; return true;
case PROCESSOR_POWER4:
*total = (GET_CODE (XEXP (x, 1)) != CONST_INT
? GET_MODE (XEXP (x, 1)) != DImode
? COSTS_N_INSNS (5) : COSTS_N_INSNS (7)
: COSTS_N_INSNS (4));
return true;
default: default:
abort (); abort ();
} }
......
...@@ -39,7 +39,7 @@ ...@@ -39,7 +39,7 @@
;; Define an insn type attribute. This is used in function unit delay ;; Define an insn type attribute. This is used in function unit delay
;; computations. ;; computations.
(define_attr "type" "integer,load,load_ext,load_ext_u,load_ext_ux,load_ux,load_u,store,store_ux,store_u,fpload,fpload_ux,fpload_u,fpstore,fpstore_ux,fpstore_u,vecload,vecstore,imul,imul2,imul3,lmul,idiv,ldiv,branch,cmp,fast_compare,compare,delayed_compare,mult_compare,fpcompare,cr_logical,delayed_cr,mfcr,mtcr,mtjmpr,fp,fpsimple,dmul,sdiv,ddiv,ssqrt,dsqrt,jmpreg,brinc,vecsimple,veccomplex,vecdiv,veccmp,veccmpsimple,vecperm,vecfloat,vecfdiv" (define_attr "type" "integer,load,load_ext,load_ext_u,load_ext_ux,load_ux,load_u,store,store_ux,store_u,fpload,fpload_ux,fpload_u,fpstore,fpstore_ux,fpstore_u,vecload,vecstore,imul,imul2,imul3,lmul,idiv,ldiv,branch,cmp,fast_compare,compare,delayed_compare,imul_compare,lmul_compare,fpcompare,cr_logical,delayed_cr,mfcr,mtcr,mtjmpr,fp,fpsimple,dmul,sdiv,ddiv,ssqrt,dsqrt,jmpreg,brinc,vecsimple,veccomplex,vecdiv,veccmp,veccmpsimple,vecperm,vecfloat,vecfdiv"
(const_string "integer")) (const_string "integer"))
;; Length (in bytes). ;; Length (in bytes).
...@@ -1669,7 +1669,7 @@ ...@@ -1669,7 +1669,7 @@
(const_string "imul2")] (const_string "imul2")]
(const_string "imul")))]) (const_string "imul")))])
(define_insn "" (define_insn "*mulsi3_mq_internal1"
[(set (match_operand:CC 0 "cc_reg_operand" "=x,?y") [(set (match_operand:CC 0 "cc_reg_operand" "=x,?y")
(compare:CC (mult:SI (match_operand:SI 1 "gpc_reg_operand" "%r,r") (compare:CC (mult:SI (match_operand:SI 1 "gpc_reg_operand" "%r,r")
(match_operand:SI 2 "gpc_reg_operand" "r,r")) (match_operand:SI 2 "gpc_reg_operand" "r,r"))
...@@ -1680,7 +1680,7 @@ ...@@ -1680,7 +1680,7 @@
"@ "@
{muls.|mullw.} %3,%1,%2 {muls.|mullw.} %3,%1,%2
#" #"
[(set_attr "type" "mult_compare") [(set_attr "type" "imul_compare")
(set_attr "length" "4,8")]) (set_attr "length" "4,8")])
(define_split (define_split
...@@ -1699,7 +1699,7 @@ ...@@ -1699,7 +1699,7 @@
(const_int 0)))] (const_int 0)))]
"") "")
(define_insn "" (define_insn "*mulsi3_no_mq_internal1"
[(set (match_operand:CC 0 "cc_reg_operand" "=x,?y") [(set (match_operand:CC 0 "cc_reg_operand" "=x,?y")
(compare:CC (mult:SI (match_operand:SI 1 "gpc_reg_operand" "%r,r") (compare:CC (mult:SI (match_operand:SI 1 "gpc_reg_operand" "%r,r")
(match_operand:SI 2 "gpc_reg_operand" "r,r")) (match_operand:SI 2 "gpc_reg_operand" "r,r"))
...@@ -1709,7 +1709,7 @@ ...@@ -1709,7 +1709,7 @@
"@ "@
{muls.|mullw.} %3,%1,%2 {muls.|mullw.} %3,%1,%2
#" #"
[(set_attr "type" "mult_compare") [(set_attr "type" "imul_compare")
(set_attr "length" "4,8")]) (set_attr "length" "4,8")])
(define_split (define_split
...@@ -1726,7 +1726,7 @@ ...@@ -1726,7 +1726,7 @@
(const_int 0)))] (const_int 0)))]
"") "")
(define_insn "" (define_insn "*mulsi3_mq_internal2"
[(set (match_operand:CC 3 "cc_reg_operand" "=x,?y") [(set (match_operand:CC 3 "cc_reg_operand" "=x,?y")
(compare:CC (mult:SI (match_operand:SI 1 "gpc_reg_operand" "%r,r") (compare:CC (mult:SI (match_operand:SI 1 "gpc_reg_operand" "%r,r")
(match_operand:SI 2 "gpc_reg_operand" "r,r")) (match_operand:SI 2 "gpc_reg_operand" "r,r"))
...@@ -1738,7 +1738,7 @@ ...@@ -1738,7 +1738,7 @@
"@ "@
{muls.|mullw.} %0,%1,%2 {muls.|mullw.} %0,%1,%2
#" #"
[(set_attr "type" "mult_compare") [(set_attr "type" "imul_compare")
(set_attr "length" "4,8")]) (set_attr "length" "4,8")])
(define_split (define_split
...@@ -1758,7 +1758,7 @@ ...@@ -1758,7 +1758,7 @@
(const_int 0)))] (const_int 0)))]
"") "")
(define_insn "" (define_insn "*mulsi3_no_mq_internal2"
[(set (match_operand:CC 3 "cc_reg_operand" "=x,?y") [(set (match_operand:CC 3 "cc_reg_operand" "=x,?y")
(compare:CC (mult:SI (match_operand:SI 1 "gpc_reg_operand" "%r,r") (compare:CC (mult:SI (match_operand:SI 1 "gpc_reg_operand" "%r,r")
(match_operand:SI 2 "gpc_reg_operand" "r,r")) (match_operand:SI 2 "gpc_reg_operand" "r,r"))
...@@ -1769,7 +1769,7 @@ ...@@ -1769,7 +1769,7 @@
"@ "@
{muls.|mullw.} %0,%1,%2 {muls.|mullw.} %0,%1,%2
#" #"
[(set_attr "type" "mult_compare") [(set_attr "type" "imul_compare")
(set_attr "length" "4,8")]) (set_attr "length" "4,8")])
(define_split (define_split
...@@ -6023,6 +6023,62 @@ ...@@ -6023,6 +6023,62 @@
"mulld %0,%1,%2" "mulld %0,%1,%2"
[(set_attr "type" "lmul")]) [(set_attr "type" "lmul")])
(define_insn "*muldi3_internal1"
[(set (match_operand:CC 0 "cc_reg_operand" "=x,?y")
(compare:CC (mult:DI (match_operand:DI 1 "gpc_reg_operand" "%r,r")
(match_operand:DI 2 "gpc_reg_operand" "r,r"))
(const_int 0)))
(clobber (match_scratch:DI 3 "=r,r"))]
"TARGET_POWERPC64"
"@
mulld. %3,%1,%2
#"
[(set_attr "type" "lmul_compare")
(set_attr "length" "4,8")])
(define_split
[(set (match_operand:CC 0 "cc_reg_not_cr0_operand" "")
(compare:CC (mult:DI (match_operand:DI 1 "gpc_reg_operand" "")
(match_operand:DI 2 "gpc_reg_operand" ""))
(const_int 0)))
(clobber (match_scratch:DI 3 ""))]
"TARGET_POWERPC64 && reload_completed"
[(set (match_dup 3)
(mult:DI (match_dup 1) (match_dup 2)))
(set (match_dup 0)
(compare:CC (match_dup 3)
(const_int 0)))]
"")
(define_insn "*muldi3_internal2"
[(set (match_operand:CC 3 "cc_reg_operand" "=x,?y")
(compare:CC (mult:DI (match_operand:DI 1 "gpc_reg_operand" "%r,r")
(match_operand:DI 2 "gpc_reg_operand" "r,r"))
(const_int 0)))
(set (match_operand:DI 0 "gpc_reg_operand" "=r,r")
(mult:DI (match_dup 1) (match_dup 2)))]
"TARGET_POWERPC64"
"@
mulld. %0,%1,%2
#"
[(set_attr "type" "lmul_compare")
(set_attr "length" "4,8")])
(define_split
[(set (match_operand:CC 3 "cc_reg_not_cr0_operand" "")
(compare:CC (mult:DI (match_operand:DI 1 "gpc_reg_operand" "")
(match_operand:DI 2 "gpc_reg_operand" ""))
(const_int 0)))
(set (match_operand:DI 0 "gpc_reg_operand" "")
(mult:DI (match_dup 1) (match_dup 2)))]
"TARGET_POWERPC64 && reload_completed"
[(set (match_dup 0)
(mult:DI (match_dup 1) (match_dup 2)))
(set (match_dup 3)
(compare:CC (match_dup 0)
(const_int 0)))]
"")
(define_insn "smuldi3_highpart" (define_insn "smuldi3_highpart"
[(set (match_operand:DI 0 "gpc_reg_operand" "=r") [(set (match_operand:DI 0 "gpc_reg_operand" "=r")
(truncate:DI (truncate:DI
......
...@@ -47,7 +47,7 @@ ...@@ -47,7 +47,7 @@
"iu_rs64") "iu_rs64")
(define_insn_reservation "rs64a-imul" 20 (define_insn_reservation "rs64a-imul" 20
(and (eq_attr "type" "imul,mult_compare") (and (eq_attr "type" "imul,imul_compare")
(eq_attr "cpu" "rs64a")) (eq_attr "cpu" "rs64a"))
"mciu_rs64*13") "mciu_rs64*13")
...@@ -62,7 +62,7 @@ ...@@ -62,7 +62,7 @@
"mciu_rs64*2") "mciu_rs64*2")
(define_insn_reservation "rs64a-lmul" 34 (define_insn_reservation "rs64a-lmul" 34
(and (eq_attr "type" "lmul") (and (eq_attr "type" "lmul,lmul_compare")
(eq_attr "cpu" "rs64a")) (eq_attr "cpu" "rs64a"))
"mciu_rs64*34") "mciu_rs64*34")
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment