llvm/test/CodeGen/ARM/arm-and-tst-peephole.ll

; RUN: llc < %s -march=arm | FileCheck -check-prefix=ARM %s
; RUN: llc < %s -march=thumb | FileCheck -check-prefix=THUMB %s
; RUN: llc < %s -march=thumb -mattr=+thumb2 | FileCheck -check-prefix=T2 %s

; FIXME: The -march=thumb test doesn't change if -disable-peephole is specified.

; Test case 1: an AND with an immediate whose result is both compared against
; zero and reused afterwards (by the switch and by the OR in %sw.bb).
; The checks below expect the ARM and Thumb2 runs to emit a flag-setting
; "ands ..., #3" directly followed by "beq", while the Thumb1 run is expected
; to keep an explicit "cmp ..., #0" between the "ands" and the "beq".
%struct.Foo = type { i8* }

; ARM:   foo
; THUMB: foo
; T2:    foo
define %struct.Foo* @foo(%struct.Foo* %this, i32 %acc) nounwind readonly align 2 {
entry:
  ; %scevgep points one element past %this; the loop reads the element just
  ; before its current pointer (see %scevgep5), i.e. it starts at %this[0].
  %scevgep = getelementptr %struct.Foo* %this, i32 1
  br label %tailrecurse

tailrecurse:                                      ; preds = %sw.bb, %entry
  ; Loop-carried values: the element pointer, a counter starting at 1, and the
  ; accumulator seeded from the %acc argument.
  %lsr.iv2 = phi %struct.Foo* [ %scevgep3, %sw.bb ], [ %scevgep, %entry ]
  %lsr.iv = phi i32 [ %lsr.iv.next, %sw.bb ], [ 1, %entry ]
  %acc.tr = phi i32 [ %or, %sw.bb ], [ %acc, %entry ]
  ; Load the i8* stored in the element preceding %lsr.iv2 and view it as an
  ; integer so that its low bits can be inspected.
  %lsr.iv24 = bitcast %struct.Foo* %lsr.iv2 to i8**
  %scevgep5 = getelementptr i8** %lsr.iv24, i32 -1
  %tmp2 = load i8** %scevgep5
  %0 = ptrtoint i8* %tmp2 to i32

; ARM:      ands {{r[0-9]+}}, {{r[0-9]+}}, #3
; ARM-NEXT: beq

; THUMB:      movs r[[R0:[0-9]+]], #3
; THUMB-NEXT: ands r[[R0]], r
; THUMB-NEXT: cmp r[[R0]], #0
; THUMB-NEXT: beq

; T2:      ands {{r[0-9]+}}, {{r[0-9]+}}, #3
; T2-NEXT: beq

  ; Keep only the two low bits; %and is tested against zero here and is also
  ; used later by the switch and by %or, so the AND result must stay live.
  %and = and i32 %0, 3
  %tst = icmp eq i32 %and, 0
  br i1 %tst, label %sw.bb, label %tailrecurse.switch

tailrecurse.switch:                               ; preds = %tailrecurse
  ; Dispatch on the non-zero masked value. Since %and is in 0..3 and 0 was
  ; branched away above, the three cases cover every value that reaches here.
  switch i32 %and, label %sw.epilog [
    i32 1, label %sw.bb
    i32 3, label %sw.bb6
    i32 2, label %sw.bb8
  ]

sw.bb:                                            ; preds = %tailrecurse.switch, %tailrecurse
  ; Continue the loop: shift the accumulator left by one, OR in the masked
  ; bits, bump the counter and advance to the next element.
  %shl = shl i32 %acc.tr, 1
  %or = or i32 %and, %shl
  %lsr.iv.next = add i32 %lsr.iv, 1
  %scevgep3 = getelementptr %struct.Foo* %lsr.iv2, i32 1
  br label %tailrecurse

sw.bb6:                                           ; preds = %tailrecurse.switch
  ; Masked value 3: return the current loop pointer.
  ret %struct.Foo* %lsr.iv2

sw.bb8:                                           ; preds = %tailrecurse.switch
  ; Masked value 2: return %this indexed by (accumulator + counter).
  %tmp1 = add i32 %acc.tr, %lsr.iv
  %add.ptr11 = getelementptr inbounds %struct.Foo* %this, i32 %tmp1
  ret %struct.Foo* %add.ptr11

sw.epilog:                                        ; preds = %tailrecurse.switch
  ; Default switch destination; returns undef.
  ret %struct.Foo* undef
}

; Another test that exercises the AND/TST peephole optimization and also
; generates a predicated ANDS instruction. Check that the predicate is printed
; after the "S" modifier on the instruction.

; Test case 2: two byte loads are each masked with 112 (0x70) and compared
; against zero, and both masked values are reused in %bb2. The checks expect
; a flag-setting "ands" for the first mask in every run, and for the second
; mask a predicated "andsne" in the ARM and Thumb2 runs (plain "ands" in the
; Thumb1 run).
%struct.S = type { i8* (i8*)*, [1 x i8] }

; ARM: bar
; THUMB: bar
; T2: bar
define internal zeroext i8 @bar(%struct.S* %x, %struct.S* nocapture %y) nounwind readonly {
entry:
  ; Load the first byte of the array field (field 1) of %x and widen it.
  %0 = getelementptr inbounds %struct.S* %x, i32 0, i32 1, i32 0
  %1 = load i8* %0, align 1
  %2 = zext i8 %1 to i32
; ARM: ands
; THUMB: ands
; T2: ands
  ; Mask with 112; return 1 early when no masked bit is set. %3 is used again
  ; in %bb2, so the AND result has to be kept, not just the flags.
  %3 = and i32 %2, 112
  %4 = icmp eq i32 %3, 0
  br i1 %4, label %return, label %bb

bb:                                               ; preds = %entry
  ; Same load/mask/test sequence for %y; only reached when %3 was non-zero.
  %5 = getelementptr inbounds %struct.S* %y, i32 0, i32 1, i32 0
  %6 = load i8* %5, align 1
  %7 = zext i8 %6 to i32
; ARM: andsne
; THUMB: ands
; T2: andsne
  %8 = and i32 %7, 112
  %9 = icmp eq i32 %8, 0
  br i1 %9, label %return, label %bb2

bb2:                                              ; preds = %bb
  ; Both masked values are non-zero here; go to %bb4 if either equals 16.
  %10 = icmp eq i32 %3, 16
  %11 = icmp eq i32 %8, 16
  %or.cond = or i1 %10, %11
  br i1 %or.cond, label %bb4, label %return

bb4:                                              ; preds = %bb2
  ; Return the low 8 bits of the address held in %x.
  %12 = ptrtoint %struct.S* %x to i32
  %phitmp = trunc i32 %12 to i8
  ret i8 %phitmp

return:                                           ; preds = %bb2, %bb, %entry
  ; Common exit for all other paths: return the constant 1.
  ret i8 1
}
When we look at instructions to convert to setting the 's' flag, we need to look at more than those which define CPSR. You can have this situation: (1) subs ... (2) sub r6, r5, r4 (3) movge ... (4) cmp r6, 0 (5) movge ... We cannot convert (2) to "subs" because (3) is using the CPSR set by (1). There's an analogous situation here: (1) sub r1, r2, r3 (2) sub r4, r5, r6 (3) cmp r4, ... (5) movge ... (6) cmp r1, ... (7) movge ... We cannot convert (1) to "subs" because of the intervening use of CPSR. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@117950 91177308-0d34-0410-b5e6-96231b3b80d8 2010-11-01 20:41:43 +00:00			`; RUN: llc < %s -march=arm | FileCheck -check-prefix=ARM %s`
			`; RUN: llc < %s -march=thumb | FileCheck -check-prefix=THUMB %s`
			`; RUN: llc < %s -march=thumb -mattr=+thumb2 | FileCheck -check-prefix=T2 %s`

			`; FIXME: The -march=thumb test doesn't change if -disable-peephole is specified.`
test for and-tst peephole optimization documents the status-quo with its opportunities git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@113838 91177308-0d34-0410-b5e6-96231b3b80d8 2010-09-14 08:50:43 +00:00
			`%struct.Foo = type { i8* }`

When we look at instructions to convert to setting the 's' flag, we need to look at more than those which define CPSR. You can have this situation: (1) subs ... (2) sub r6, r5, r4 (3) movge ... (4) cmp r6, 0 (5) movge ... We cannot convert (2) to "subs" because (3) is using the CPSR set by (1). There's an analogous situation here: (1) sub r1, r2, r3 (2) sub r4, r5, r6 (3) cmp r4, ... (5) movge ... (6) cmp r1, ... (7) movge ... We cannot convert (1) to "subs" because of the intervening use of CPSR. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@117950 91177308-0d34-0410-b5e6-96231b3b80d8 2010-11-01 20:41:43 +00:00			`; ARM: foo`
			`; THUMB: foo`
			`; T2: foo`
			`define %struct.Foo* @foo(%struct.Foo* %this, i32 %acc) nounwind readonly align 2 {`
test for and-tst peephole optimization documents the status-quo with its opportunities git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@113838 91177308-0d34-0410-b5e6-96231b3b80d8 2010-09-14 08:50:43 +00:00			`entry:`
			`%scevgep = getelementptr %struct.Foo* %this, i32 1`
			`br label %tailrecurse`

			`tailrecurse: ; preds = %sw.bb, %entry`
			`%lsr.iv2 = phi %struct.Foo* [ %scevgep3, %sw.bb ], [ %scevgep, %entry ]`
			`%lsr.iv = phi i32 [ %lsr.iv.next, %sw.bb ], [ 1, %entry ]`
			`%acc.tr = phi i32 [ %or, %sw.bb ], [ %acc, %entry ]`
			`%lsr.iv24 = bitcast %struct.Foo* %lsr.iv2 to i8**`
			`%scevgep5 = getelementptr i8** %lsr.iv24, i32 -1`
			`%tmp2 = load i8** %scevgep5`
			`%0 = ptrtoint i8* %tmp2 to i32`

Weekly fix of register allocation dependent unit tests. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@130567 91177308-0d34-0410-b5e6-96231b3b80d8 2011-04-30 01:37:52 +00:00			`; ARM: ands {{r[0-9]+}}, {{r[0-9]+}}, #3`
When we look at instructions to convert to setting the 's' flag, we need to look at more than those which define CPSR. You can have this situation: (1) subs ... (2) sub r6, r5, r4 (3) movge ... (4) cmp r6, 0 (5) movge ... We cannot convert (2) to "subs" because (3) is using the CPSR set by (1). There's an analogous situation here: (1) sub r1, r2, r3 (2) sub r4, r5, r6 (3) cmp r4, ... (5) movge ... (6) cmp r1, ... (7) movge ... We cannot convert (1) to "subs" because of the intervening use of CPSR. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@117950 91177308-0d34-0410-b5e6-96231b3b80d8 2010-11-01 20:41:43 +00:00			`; ARM-NEXT: beq`
test for and-tst peephole optimization documents the status-quo with its opportunities git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@113838 91177308-0d34-0410-b5e6-96231b3b80d8 2010-09-14 08:50:43 +00:00
Fix ARM tests to be register allocator independent. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@128680 91177308-0d34-0410-b5e6-96231b3b80d8 2011-03-31 22:14:03 +00:00			`; THUMB: movs r[[R0:[0-9]+]], #3`
			`; THUMB-NEXT: ands r[[R0]], r`
			`; THUMB-NEXT: cmp r[[R0]], #0`
do not compare actual branch labels; this may fix llvm-gcc-x86_64-darwin10-cross-mingw32 buildbot too git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@115034 91177308-0d34-0410-b5e6-96231b3b80d8 2010-09-29 10:45:43 +00:00			`; THUMB-NEXT: beq`
improve heuristics to find the 'and' corresponding to 'tst' to also catch opportunities on thumb2 added some doxygen on the way git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@115033 91177308-0d34-0410-b5e6-96231b3b80d8 2010-09-29 10:12:08 +00:00
Weekly fix of register allocation dependent unit tests. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@130567 91177308-0d34-0410-b5e6-96231b3b80d8 2011-04-30 01:37:52 +00:00			`; T2: ands {{r[0-9]+}}, {{r[0-9]+}}, #3`
do not compare actual branch labels; this may fix llvm-gcc-x86_64-darwin10-cross-mingw32 buildbot too git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@115034 91177308-0d34-0410-b5e6-96231b3b80d8 2010-09-29 10:45:43 +00:00			`; T2-NEXT: beq`
test for and-tst peephole optimization documents the status-quo with its opportunities git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@113838 91177308-0d34-0410-b5e6-96231b3b80d8 2010-09-14 08:50:43 +00:00
			`%and = and i32 %0, 3`
			`%tst = icmp eq i32 %and, 0`
			`br i1 %tst, label %sw.bb, label %tailrecurse.switch`

			`tailrecurse.switch: ; preds = %tailrecurse`
			`switch i32 %and, label %sw.epilog [`
			`i32 1, label %sw.bb`
			`i32 3, label %sw.bb6`
			`i32 2, label %sw.bb8`
			`]`

			`sw.bb: ; preds = %tailrecurse.switch, %tailrecurse`
			`%shl = shl i32 %acc.tr, 1`
			`%or = or i32 %and, %shl`
			`%lsr.iv.next = add i32 %lsr.iv, 1`
			`%scevgep3 = getelementptr %struct.Foo* %lsr.iv2, i32 1`
			`br label %tailrecurse`

			`sw.bb6: ; preds = %tailrecurse.switch`
			`ret %struct.Foo* %lsr.iv2`

			`sw.bb8: ; preds = %tailrecurse.switch`
			`%tmp1 = add i32 %acc.tr, %lsr.iv`
			`%add.ptr11 = getelementptr inbounds %struct.Foo* %this, i32 %tmp1`
			`ret %struct.Foo* %add.ptr11`

			`sw.epilog: ; preds = %tailrecurse.switch`
			`ret %struct.Foo* undef`
			`}`
ARM instructions that are both predicated and set the condition codes have been printed with the "S" modifier after the predicate. With ARM's unified syntax, they are supposed to go in the other order. We fixed this for Thumb when we switched to unified syntax but missed changing it for ARM. Apparently we don't generate these instructions often because no one noticed until now. Thanks to Bill Wendling for the testcase! git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@116563 91177308-0d34-0410-b5e6-96231b3b80d8 2010-10-15 03:23:44 +00:00
			`; Another test that exercises the AND/TST peephole optimization and also`
			`; generates a predicated ANDS instruction. Check that the predicate is printed`
			`; after the "S" modifier on the instruction.`

			`%struct.S = type { i8* (i8*)*, [1 x i8] }`

When we look at instructions to convert to setting the 's' flag, we need to look at more than those which define CPSR. You can have this situation: (1) subs ... (2) sub r6, r5, r4 (3) movge ... (4) cmp r6, 0 (5) movge ... We cannot convert (2) to "subs" because (3) is using the CPSR set by (1). There's an analogous situation here: (1) sub r1, r2, r3 (2) sub r4, r5, r6 (3) cmp r4, ... (5) movge ... (6) cmp r1, ... (7) movge ... We cannot convert (1) to "subs" because of the intervening use of CPSR. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@117950 91177308-0d34-0410-b5e6-96231b3b80d8 2010-11-01 20:41:43 +00:00			`; ARM: bar`
ARM instructions that are both predicated and set the condition codes have been printed with the "S" modifier after the predicate. With ARM's unified syntax, they are supposed to go in the other order. We fixed this for Thumb when we switched to unified syntax but missed changing it for ARM. Apparently we don't generate these instructions often because no one noticed until now. Thanks to Bill Wendling for the testcase! git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@116563 91177308-0d34-0410-b5e6-96231b3b80d8 2010-10-15 03:23:44 +00:00			`; THUMB: bar`
			`; T2: bar`
			`define internal zeroext i8 @bar(%struct.S* %x, %struct.S* nocapture %y) nounwind readonly {`
			`entry:`
			`%0 = getelementptr inbounds %struct.S* %x, i32 0, i32 1, i32 0`
			`%1 = load i8* %0, align 1`
			`%2 = zext i8 %1 to i32`
When we look at instructions to convert to setting the 's' flag, we need to look at more than those which define CPSR. You can have this situation: (1) subs ... (2) sub r6, r5, r4 (3) movge ... (4) cmp r6, 0 (5) movge ... We cannot convert (2) to "subs" because (3) is using the CPSR set by (1). There's an analogous situation here: (1) sub r1, r2, r3 (2) sub r4, r5, r6 (3) cmp r4, ... (5) movge ... (6) cmp r1, ... (7) movge ... We cannot convert (1) to "subs" because of the intervening use of CPSR. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@117950 91177308-0d34-0410-b5e6-96231b3b80d8 2010-11-01 20:41:43 +00:00			`; ARM: ands`
ARM instructions that are both predicated and set the condition codes have been printed with the "S" modifier after the predicate. With ARM's unified syntax, they are supposed to go in the other order. We fixed this for Thumb when we switched to unified syntax but missed changing it for ARM. Apparently we don't generate these instructions often because no one noticed until now. Thanks to Bill Wendling for the testcase! git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@116563 91177308-0d34-0410-b5e6-96231b3b80d8 2010-10-15 03:23:44 +00:00			`; THUMB: ands`
			`; T2: ands`
			`%3 = and i32 %2, 112`
			`%4 = icmp eq i32 %3, 0`
			`br i1 %4, label %return, label %bb`

			`bb: ; preds = %entry`
			`%5 = getelementptr inbounds %struct.S* %y, i32 0, i32 1, i32 0`
			`%6 = load i8* %5, align 1`
			`%7 = zext i8 %6 to i32`
When we look at instructions to convert to setting the 's' flag, we need to look at more than those which define CPSR. You can have this situation: (1) subs ... (2) sub r6, r5, r4 (3) movge ... (4) cmp r6, 0 (5) movge ... We cannot convert (2) to "subs" because (3) is using the CPSR set by (1). There's an analogous situation here: (1) sub r1, r2, r3 (2) sub r4, r5, r6 (3) cmp r4, ... (5) movge ... (6) cmp r1, ... (7) movge ... We cannot convert (1) to "subs" because of the intervening use of CPSR. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@117950 91177308-0d34-0410-b5e6-96231b3b80d8 2010-11-01 20:41:43 +00:00			`; ARM: andsne`
ARM instructions that are both predicated and set the condition codes have been printed with the "S" modifier after the predicate. With ARM's unified syntax, they are supposed to go in the other order. We fixed this for Thumb when we switched to unified syntax but missed changing it for ARM. Apparently we don't generate these instructions often because no one noticed until now. Thanks to Bill Wendling for the testcase! git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@116563 91177308-0d34-0410-b5e6-96231b3b80d8 2010-10-15 03:23:44 +00:00			`; THUMB: ands`
			`; T2: andsne`
			`%8 = and i32 %7, 112`
			`%9 = icmp eq i32 %8, 0`
			`br i1 %9, label %return, label %bb2`

			`bb2: ; preds = %bb`
			`%10 = icmp eq i32 %3, 16`
			`%11 = icmp eq i32 %8, 16`
			`%or.cond = or i1 %10, %11`
			`br i1 %or.cond, label %bb4, label %return`

			`bb4: ; preds = %bb2`
			`%12 = ptrtoint %struct.S* %x to i32`
			`%phitmp = trunc i32 %12 to i8`
			`ret i8 %phitmp`

			`return: ; preds = %bb2, %bb, %entry`
			`ret i8 1`
			`}`