mirror of
https://github.com/RPCS3/llvm.git
synced 2025-01-09 05:31:37 +00:00
38b2a0bfdd
Summary: The accumulator-based (HI/LO) multiplies and divides from earlier ISA's have been removed and replaced with GPR-based equivalents. For example: div $1, $2 mflo $3 is now: div $3, $1, $2 This patch disables the accumulator-based multiplies and divides for MIPS32r6/MIPS64r6 and uses the GPR-based equivalents instead. Renamed expandPseudoDiv to insertDivByZeroTrap to better describe the behaviour of the function. MipsDelaySlotFiller now invalidates the liveness information when moving instructions to the delay slot. Without this, divrem.ll will abort since %GP ends up used before it is defined. Reviewers: vmedic, zoran.jovanovic, jkolek Reviewed By: jkolek Differential Revision: http://reviews.llvm.org/D3896 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@210760 91177308-0d34-0410-b5e6-96231b3b80d8
389 lines
9.9 KiB
LLVM
389 lines
9.9 KiB
LLVM
; RUN: llc -march=mips -mcpu=mips32 -verify-machineinstrs < %s | FileCheck %s -check-prefix=ALL -check-prefix=ACC32 -check-prefix=ACC32-TRAP
|
|
; RUN: llc -march=mips -mcpu=mips32r2 -verify-machineinstrs < %s | FileCheck %s -check-prefix=ALL -check-prefix=ACC32 -check-prefix=ACC32-TRAP
|
|
; RUN: llc -march=mips -mcpu=mips32r6 -verify-machineinstrs < %s | FileCheck %s -check-prefix=ALL -check-prefix=GPR32 -check-prefix=GPR32-TRAP
|
|
; RUN: llc -march=mips64 -mcpu=mips64 -verify-machineinstrs < %s | FileCheck %s -check-prefix=ALL -check-prefix=ACC64 -check-prefix=ACC64-TRAP
|
|
; RUN: llc -march=mips64 -mcpu=mips64r2 -verify-machineinstrs < %s | FileCheck %s -check-prefix=ALL -check-prefix=ACC64 -check-prefix=ACC64-TRAP
|
|
; RUN: llc -march=mips64 -mcpu=mips64r6 -verify-machineinstrs < %s | FileCheck %s -check-prefix=ALL -check-prefix=GPR64 -check-prefix=GPR64-TRAP
|
|
|
|
; RUN: llc -march=mips -mcpu=mips32 -mno-check-zero-division < %s | FileCheck %s -check-prefix=ALL -check-prefix=ACC32 -check-prefix=NOCHECK
|
|
; RUN: llc -march=mips -mcpu=mips32r2 -mno-check-zero-division < %s | FileCheck %s -check-prefix=ALL -check-prefix=ACC32 -check-prefix=NOCHECK
|
|
; RUN: llc -march=mips -mcpu=mips32r6 -mno-check-zero-division < %s | FileCheck %s -check-prefix=ALL -check-prefix=GPR32 -check-prefix=NOCHECK
|
|
; RUN: llc -march=mips64 -mcpu=mips64 -mno-check-zero-division < %s | FileCheck %s -check-prefix=ALL -check-prefix=ACC64 -check-prefix=NOCHECK
|
|
; RUN: llc -march=mips64 -mcpu=mips64r2 -mno-check-zero-division < %s | FileCheck %s -check-prefix=ALL -check-prefix=ACC64 -check-prefix=NOCHECK
|
|
; RUN: llc -march=mips64 -mcpu=mips64r6 -mno-check-zero-division < %s | FileCheck %s -check-prefix=ALL -check-prefix=GPR64 -check-prefix=NOCHECK
|
|
|
|
; FileCheck Prefixes:
|
|
; ALL - All targets
|
|
; ACC32 - Accumulator based multiply/divide on 32-bit targets
|
|
; ACC64 - Same as ACC32 but only for 64-bit targets
|
|
; GPR32 - GPR based multiply/divide on 32-bit targets
|
|
; GPR64 - Same as GPR32 but only for 64-bit targets
|
|
; ACC32-TRAP - Same as TRAP and ACC32 combined
|
|
; ACC64-TRAP - Same as TRAP and ACC64 combined
|
|
; GPR32-TRAP - Same as TRAP and GPR32 combined
|
|
; GPR64-TRAP - Same as TRAP and GPR64 combined
|
|
; NOCHECK - Division by zero will not be detected
|
|
|
|
@g0 = common global i32 0, align 4
|
|
@g1 = common global i32 0, align 4
|
|
|
|
define i32 @sdiv1(i32 %a0, i32 %a1) nounwind readnone {
|
|
entry:
|
|
; ALL-LABEL: sdiv1:
|
|
|
|
; ACC32: div $zero, $4, $5
|
|
; ACC32-TRAP: teq $5, $zero, 7
|
|
|
|
; ACC64: div $zero, $4, $5
|
|
; ACC64-TRAP: teq $5, $zero, 7
|
|
|
|
; GPR32: div $2, $4, $5
|
|
; GPR32-TRAP: teq $5, $zero, 7
|
|
|
|
; GPR64: div $2, $4, $5
|
|
; GPR64-TRAP: teq $5, $zero, 7
|
|
|
|
; NOCHECK-NOT: teq
|
|
|
|
; ACC32: mflo $2
|
|
; ACC64: mflo $2
|
|
|
|
; ALL: .end sdiv1
|
|
|
|
%div = sdiv i32 %a0, %a1
|
|
ret i32 %div
|
|
}
|
|
|
|
define i32 @srem1(i32 %a0, i32 %a1) nounwind readnone {
|
|
entry:
|
|
; ALL-LABEL: srem1:
|
|
|
|
; ACC32: div $zero, $4, $5
|
|
; ACC32-TRAP: teq $5, $zero, 7
|
|
|
|
; ACC64: div $zero, $4, $5
|
|
; ACC64-TRAP: teq $5, $zero, 7
|
|
|
|
; GPR32: mod $2, $4, $5
|
|
; GPR32-TRAP: teq $5, $zero, 7
|
|
|
|
; GPR64: mod $2, $4, $5
|
|
; GPR64-TRAP: teq $5, $zero, 7
|
|
|
|
; NOCHECK-NOT: teq
|
|
|
|
; ACC32: mfhi $2
|
|
; ACC64: mfhi $2
|
|
|
|
; ALL: .end srem1
|
|
|
|
%rem = srem i32 %a0, %a1
|
|
ret i32 %rem
|
|
}
|
|
|
|
define i32 @udiv1(i32 %a0, i32 %a1) nounwind readnone {
|
|
entry:
|
|
; ALL-LABEL: udiv1:
|
|
|
|
; ACC32: divu $zero, $4, $5
|
|
; ACC32-TRAP: teq $5, $zero, 7
|
|
|
|
; ACC64: divu $zero, $4, $5
|
|
; ACC64-TRAP: teq $5, $zero, 7
|
|
|
|
; GPR32: divu $2, $4, $5
|
|
; GPR32-TRAP: teq $5, $zero, 7
|
|
|
|
; GPR64: divu $2, $4, $5
|
|
; GPR64-TRAP: teq $5, $zero, 7
|
|
|
|
; NOCHECK-NOT: teq
|
|
|
|
; ACC32: mflo $2
|
|
; ACC64: mflo $2
|
|
|
|
; ALL: .end udiv1
|
|
%div = udiv i32 %a0, %a1
|
|
ret i32 %div
|
|
}
|
|
|
|
define i32 @urem1(i32 %a0, i32 %a1) nounwind readnone {
|
|
entry:
|
|
; ALL-LABEL: urem1:
|
|
|
|
; ACC32: divu $zero, $4, $5
|
|
; ACC32-TRAP: teq $5, $zero, 7
|
|
|
|
; ACC64: divu $zero, $4, $5
|
|
; ACC64-TRAP: teq $5, $zero, 7
|
|
|
|
; GPR32: modu $2, $4, $5
|
|
; GPR32-TRAP: teq $5, $zero, 7
|
|
|
|
; GPR64: modu $2, $4, $5
|
|
; GPR64-TRAP: teq $5, $zero, 7
|
|
|
|
; NOCHECK-NOT: teq
|
|
|
|
; ACC32: mfhi $2
|
|
; ACC64: mfhi $2
|
|
|
|
; ALL: .end urem1
|
|
|
|
%rem = urem i32 %a0, %a1
|
|
ret i32 %rem
|
|
}
|
|
|
|
define i32 @sdivrem1(i32 %a0, i32 %a1, i32* nocapture %r) nounwind {
|
|
entry:
|
|
; ALL-LABEL: sdivrem1:
|
|
|
|
; ACC32: div $zero, $4, $5
|
|
; ACC32-TRAP: teq $5, $zero, 7
|
|
; NOCHECK-NOT: teq
|
|
; ACC32: mflo $2
|
|
; ACC32: mfhi $[[R0:[0-9]+]]
|
|
; ACC32: sw $[[R0]], 0(${{[0-9]+}})
|
|
|
|
; ACC64: div $zero, $4, $5
|
|
; ACC64-TRAP: teq $5, $zero, 7
|
|
; NOCHECK-NOT: teq
|
|
; ACC64: mflo $2
|
|
; ACC64: mfhi $[[R0:[0-9]+]]
|
|
; ACC64: sw $[[R0]], 0(${{[0-9]+}})
|
|
|
|
; GPR32: mod $[[R0:[0-9]+]], $4, $5
|
|
; GPR32-TRAP: teq $5, $zero, 7
|
|
; NOCHECK-NOT: teq
|
|
; GPR32: sw $[[R0]], 0(${{[0-9]+}})
|
|
; GPR32-DAG: div $2, $4, $5
|
|
; GPR32-TRAP: teq $5, $zero, 7
|
|
|
|
; GPR64: mod $[[R0:[0-9]+]], $4, $5
|
|
; GPR64-TRAP: teq $5, $zero, 7
|
|
; NOCHECK-NOT: teq
|
|
; GPR64: sw $[[R0]], 0(${{[0-9]+}})
|
|
; GPR64-DAG: div $2, $4, $5
|
|
; GPR64-TRAP: teq $5, $zero, 7
|
|
; NOCHECK-NOT: teq
|
|
|
|
; ALL: .end sdivrem1
|
|
|
|
%rem = srem i32 %a0, %a1
|
|
store i32 %rem, i32* %r, align 4
|
|
%div = sdiv i32 %a0, %a1
|
|
ret i32 %div
|
|
}
|
|
|
|
define i32 @udivrem1(i32 %a0, i32 %a1, i32* nocapture %r) nounwind {
|
|
entry:
|
|
; ALL-LABEL: udivrem1:
|
|
|
|
; ACC32: divu $zero, $4, $5
|
|
; ACC32-TRAP: teq $5, $zero, 7
|
|
; NOCHECK-NOT: teq
|
|
; ACC32: mflo $2
|
|
; ACC32: mfhi $[[R0:[0-9]+]]
|
|
; ACC32: sw $[[R0]], 0(${{[0-9]+}})
|
|
|
|
; ACC64: divu $zero, $4, $5
|
|
; ACC64-TRAP: teq $5, $zero, 7
|
|
; NOCHECK-NOT: teq
|
|
; ACC64: mflo $2
|
|
; ACC64: mfhi $[[R0:[0-9]+]]
|
|
; ACC64: sw $[[R0]], 0(${{[0-9]+}})
|
|
|
|
; GPR32: modu $[[R0:[0-9]+]], $4, $5
|
|
; GPR32-TRAP: teq $5, $zero, 7
|
|
; NOCHECK-NOT: teq
|
|
; GPR32: sw $[[R0]], 0(${{[0-9]+}})
|
|
; GPR32-DAG: divu $2, $4, $5
|
|
; GPR32-TRAP: teq $5, $zero, 7
|
|
; NOCHECK-NOT: teq
|
|
|
|
; GPR64: modu $[[R0:[0-9]+]], $4, $5
|
|
; GPR64-TRAP: teq $5, $zero, 7
|
|
; NOCHECK-NOT: teq
|
|
; GPR64: sw $[[R0]], 0(${{[0-9]+}})
|
|
; GPR64-DAG: divu $2, $4, $5
|
|
; GPR64-TRAP: teq $5, $zero, 7
|
|
; NOCHECK-NOT: teq
|
|
|
|
; ALL: .end udivrem1
|
|
|
|
%rem = urem i32 %a0, %a1
|
|
store i32 %rem, i32* %r, align 4
|
|
%div = udiv i32 %a0, %a1
|
|
ret i32 %div
|
|
}
|
|
|
|
; FIXME: It's not clear what this is supposed to test.
|
|
define i32 @killFlags() {
|
|
entry:
|
|
%0 = load i32* @g0, align 4
|
|
%1 = load i32* @g1, align 4
|
|
%div = sdiv i32 %0, %1
|
|
ret i32 %div
|
|
}
|
|
|
|
define i64 @sdiv2(i64 %a0, i64 %a1) nounwind readnone {
|
|
entry:
|
|
; ALL-LABEL: sdiv2:
|
|
|
|
; ACC32: lw $25, %call16(__divdi3)(
|
|
; ACC32: jalr $25
|
|
|
|
; ACC64: ddiv $zero, $4, $5
|
|
; ACC64-TRAP: teq $5, $zero, 7
|
|
|
|
; GPR64: ddiv $2, $4, $5
|
|
; GPR64-TRAP: teq $5, $zero, 7
|
|
|
|
; NOCHECK-NOT: teq
|
|
|
|
; ACC64: mflo $2
|
|
|
|
; ALL: .end sdiv2
|
|
|
|
%div = sdiv i64 %a0, %a1
|
|
ret i64 %div
|
|
}
|
|
|
|
define i64 @srem2(i64 %a0, i64 %a1) nounwind readnone {
|
|
entry:
|
|
; ALL-LABEL: srem2:
|
|
|
|
; ACC32: lw $25, %call16(__moddi3)(
|
|
; ACC32: jalr $25
|
|
|
|
; ACC64: div $zero, $4, $5
|
|
; ACC64-TRAP: teq $5, $zero, 7
|
|
|
|
; GPR64: dmod $2, $4, $5
|
|
; GPR64-TRAP: teq $5, $zero, 7
|
|
|
|
; NOCHECK-NOT: teq
|
|
|
|
; ACC64: mfhi $2
|
|
|
|
; ALL: .end srem2
|
|
|
|
%rem = srem i64 %a0, %a1
|
|
ret i64 %rem
|
|
}
|
|
|
|
define i64 @udiv2(i64 %a0, i64 %a1) nounwind readnone {
|
|
entry:
|
|
; ALL-LABEL: udiv2:
|
|
|
|
; ACC32: lw $25, %call16(__udivdi3)(
|
|
; ACC32: jalr $25
|
|
|
|
; ACC64: divu $zero, $4, $5
|
|
; ACC64-TRAP: teq $5, $zero, 7
|
|
|
|
; GPR64: ddivu $2, $4, $5
|
|
; GPR64-TRAP: teq $5, $zero, 7
|
|
|
|
; NOCHECK-NOT: teq
|
|
|
|
; ACC64: mflo $2
|
|
|
|
; ALL: .end udiv2
|
|
%div = udiv i64 %a0, %a1
|
|
ret i64 %div
|
|
}
|
|
|
|
define i64 @urem2(i64 %a0, i64 %a1) nounwind readnone {
|
|
entry:
|
|
; ALL-LABEL: urem2:
|
|
|
|
; ACC32: lw $25, %call16(__umoddi3)(
|
|
; ACC32: jalr $25
|
|
|
|
; ACC64: divu $zero, $4, $5
|
|
; ACC64-TRAP: teq $5, $zero, 7
|
|
|
|
; GPR64: dmodu $2, $4, $5
|
|
; GPR64-TRAP: teq $5, $zero, 7
|
|
|
|
; NOCHECK-NOT: teq
|
|
|
|
; ACC64: mfhi $2
|
|
|
|
; ALL: .end urem2
|
|
|
|
%rem = urem i64 %a0, %a1
|
|
ret i64 %rem
|
|
}
|
|
|
|
define i64 @sdivrem2(i64 %a0, i64 %a1, i64* nocapture %r) nounwind {
|
|
entry:
|
|
; ALL-LABEL: sdivrem2:
|
|
|
|
; sdivrem2 is too complex to effectively check. We can at least check for the
|
|
; calls though.
|
|
; ACC32: lw $25, %call16(__moddi3)(
|
|
; ACC32: jalr $25
|
|
; ACC32: lw $25, %call16(__divdi3)(
|
|
; ACC32: jalr $25
|
|
|
|
; ACC64: ddiv $zero, $4, $5
|
|
; ACC64-TRAP: teq $5, $zero, 7
|
|
; NOCHECK-NOT: teq
|
|
; ACC64: mflo $2
|
|
; ACC64: mfhi $[[R0:[0-9]+]]
|
|
; ACC64: sd $[[R0]], 0(${{[0-9]+}})
|
|
|
|
; GPR64: dmod $[[R0:[0-9]+]], $4, $5
|
|
; GPR64-TRAP: teq $5, $zero, 7
|
|
; NOCHECK-NOT: teq
|
|
; GPR64: sd $[[R0]], 0(${{[0-9]+}})
|
|
|
|
; GPR64-DAG: ddiv $2, $4, $5
|
|
; GPR64-TRAP: teq $5, $zero, 7
|
|
; NOCHECK-NOT: teq
|
|
|
|
; ALL: .end sdivrem2
|
|
|
|
%rem = srem i64 %a0, %a1
|
|
store i64 %rem, i64* %r, align 8
|
|
%div = sdiv i64 %a0, %a1
|
|
ret i64 %div
|
|
}
|
|
|
|
define i64 @udivrem2(i64 %a0, i64 %a1, i64* nocapture %r) nounwind {
|
|
entry:
|
|
; ALL-LABEL: udivrem2:
|
|
|
|
; udivrem2 is too complex to effectively check. We can at least check for the
|
|
; calls though.
|
|
; ACC32: lw $25, %call16(__umoddi3)(
|
|
; ACC32: jalr $25
|
|
; ACC32: lw $25, %call16(__udivdi3)(
|
|
; ACC32: jalr $25
|
|
|
|
; ACC64: ddivu $zero, $4, $5
|
|
; ACC64-TRAP: teq $5, $zero, 7
|
|
; NOCHECK-NOT: teq
|
|
; ACC64: mflo $2
|
|
; ACC64: mfhi $[[R0:[0-9]+]]
|
|
; ACC64: sd $[[R0]], 0(${{[0-9]+}})
|
|
|
|
; GPR64: dmodu $[[R0:[0-9]+]], $4, $5
|
|
; GPR64-TRAP: teq $5, $zero, 7
|
|
; NOCHECK-NOT: teq
|
|
; GPR64: sd $[[R0]], 0(${{[0-9]+}})
|
|
|
|
; GPR64-DAG: ddivu $2, $4, $5
|
|
; GPR64-TRAP: teq $5, $zero, 7
|
|
; NOCHECK-NOT: teq
|
|
|
|
; ALL: .end udivrem2
|
|
|
|
%rem = urem i64 %a0, %a1
|
|
store i64 %rem, i64* %r, align 8
|
|
%div = udiv i64 %a0, %a1
|
|
ret i64 %div
|
|
}
|