llvm/test/CodeGen/R600/loop-idiom.ll
Tom Stellard 40e455d992 R600/SI: Custom lower SI_IF and SI_ELSE to avoid machine verifier errors
SI_IF and SI_ELSE are terminators which also produce a value.  For
these instructions ISel always inserts a COPY to move their value
to another basic block.  This COPY ends up between SI_(IF|ELSE)
and the S_BRANCH* instruction at the end of the block.

This breaks MachineBasicBlock::getFirstTerminator() and also the
machine verifier which assumes that terminators are grouped together at
the end of blocks.

To solve this we coalesce the copy away right after ISel to make sure
there are no instructions in between terminators at the end of blocks.

git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@207591 91177308-0d34-0410-b5e6-96231b3b80d8
2014-04-29 23:12:53 +00:00

55 lines
1.5 KiB
LLVM

; Run the loop-idiom pass (with basicaa) over this file twice, once with
; -mcpu=redwood and once with -mcpu=SI. The first invocation is checked with
; the R600 and FUNC prefixes, the second with the SI and FUNC prefixes.
; RUN: opt -basicaa -loop-idiom -S < %s -march=r600 -mcpu=redwood | FileCheck --check-prefix=R600 --check-prefix=FUNC %s
; RUN: opt -basicaa -loop-idiom -S < %s -march=r600 -mcpu=SI -verify-machineinstrs| FileCheck --check-prefix=SI --check-prefix=FUNC %s
; Data layout and triple shared by both invocations.
target datalayout = "e-p:32:32-p1:64:64-p2:64:64-p3:32:32-p4:32:32-p5:64:64-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64"
target triple = "r600--"
; Make sure loop-idiom doesn't create memcpy or memset. There are no library
; implementations of these for R600.
; Byte-at-a-time copy loop from %in (address space 3) into a 32-byte alloca.
; The output for this function must not contain a call to the memcpy
; intrinsic for either -mcpu value. The -LABEL anchor scopes the negative
; checks below to this function's output.
; FUNC-LABEL: @no_memcpy
; R600-NOT: @llvm.memcpy
; SI-NOT: @llvm.memcpy
define void @no_memcpy(i8 addrspace(3)* %in, i32 %size) {
entry:
  %dest = alloca i8, i32 32
  br label %for.body

for.body:
  ; %idx starts at 0 and advances by one per iteration.
  %idx = phi i32 [0, %entry], [%idx.next, %for.body]
  %src.ptr = getelementptr i8 addrspace(3)* %in, i32 %idx
  %dst.ptr = getelementptr i8* %dest, i32 %idx
  ; Copy a single byte from the source to the stack buffer.
  %byte = load i8 addrspace(3)* %src.ptr
  store i8 %byte, i8* %dst.ptr
  %idx.next = add i32 %idx, 1
  ; Leave the loop once the incremented index equals %size; the body has
  ; always executed at least once by the time this is tested.
  %done = icmp eq i32 %idx.next, %size
  br i1 %done, label %for.end, label %for.body

for.end:
  ret void
}
; Byte-at-a-time zero-fill loop over a 32-byte alloca. The output for this
; function must not contain a call to the memset intrinsic or to
; memset_pattern16 for either -mcpu value. The -LABEL anchor scopes the
; negative checks below to this function's output.
; FUNC-LABEL: @no_memset
; R600-NOT: @llvm.memset
; R600-NOT: @memset_pattern16
; SI-NOT: @llvm.memset
; SI-NOT: @memset_pattern16
define void @no_memset(i32 %size) {
entry:
  %dest = alloca i8, i32 32
  br label %for.body

for.body:
  ; %idx starts at 0 and advances by one per iteration.
  %idx = phi i32 [0, %entry], [%idx.next, %for.body]
  %dst.ptr = getelementptr i8* %dest, i32 %idx
  ; Store a zero byte at the current index.
  store i8 0, i8* %dst.ptr
  %idx.next = add i32 %idx, 1
  ; Leave the loop once the incremented index equals %size; the body has
  ; always executed at least once by the time this is tested.
  %done = icmp eq i32 %idx.next, %size
  br i1 %done, label %for.end, label %for.body

for.end:
  ret void
}