mirror of
https://github.com/RPCS3/llvm.git
synced 2024-12-15 07:59:57 +00:00
707e018423
on any current target and aren't optimized in DAGCombiner. Instead of using intermediate nodes, expand the operations, choosing between simple loads/stores, target-specific code, and library calls, immediately.

Previously, the code to emit optimized code for these operations was only used at initial SelectionDAG construction time; now it is used at all times. This fixes some cases where rep;movs was being used for small copies where simple loads/stores would be better.

This also cleans up code that checks for alignments less than 4; let the targets make that decision instead of doing it in target-independent code. This allows x86 to use rep;movs in low-alignment cases.

Also, this fixes a bug that resulted in the use of rep;stos for memsets of 0 with non-constant memory size when the alignment was at least 4. It's better to use the library in this case, which can be significantly faster when the size is large.

This also preserves more SourceValue information when memory intrinsics are lowered into simple loads/stores.

git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@49572 91177308-0d34-0410-b5e6-96231b3b80d8
31 lines
1.2 KiB
LLVM
31 lines
1.2 KiB
LLVM
; RUN: llvm-as < %s | llc -march=x86-64 | grep rep.movsl | count 2
|
|
; RUN: llvm-as < %s | llc -march=x86 | grep rep.movsl | count 2
|
|
|
|
; %struct.s is a plain aggregate of 33 i32 fields and nothing else.
%struct.s = type {
  i32, i32, i32, i32, i32, i32, i32, i32, i32, i32, i32,   ; fields  0-10
  i32, i32, i32, i32, i32, i32, i32, i32, i32, i32, i32,   ; fields 11-21
  i32, i32, i32, i32, i32, i32, i32, i32, i32, i32, i32    ; fields 22-32
}
|
|
|
|
; @g stores its six i32 arguments into fields 0-5 of a stack-allocated
; %struct.s and then passes that struct byval to @f twice.
;
; The alloca is 16-byte aligned and every field is an i32, so field N sits at
; byte offset 4*N. Each store states only the alignment that offset actually
; guarantees; claiming more than that is undefined behaviour per the LLVM
; Language Reference.
define void @g(i32 %a1, i32 %a2, i32 %a3, i32 %a4, i32 %a5, i32 %a6) {
entry:
  %d = alloca %struct.s, align 16

  ; field 0, offset 0: shares the alloca's 16-byte alignment
  %tmp = getelementptr %struct.s* %d, i32 0, i32 0
  store i32 %a1, i32* %tmp, align 16

  ; field 1, offset 4
  %tmp2 = getelementptr %struct.s* %d, i32 0, i32 1
  store i32 %a2, i32* %tmp2, align 4

  ; field 2, offset 8
  %tmp4 = getelementptr %struct.s* %d, i32 0, i32 2
  store i32 %a3, i32* %tmp4, align 8

  ; field 3, offset 12
  %tmp6 = getelementptr %struct.s* %d, i32 0, i32 3
  store i32 %a4, i32* %tmp6, align 4

  ; field 4, offset 16: a multiple of 16 from a 16-byte-aligned base
  %tmp8 = getelementptr %struct.s* %d, i32 0, i32 4
  store i32 %a5, i32* %tmp8, align 16

  ; field 5, offset 20
  %tmp10 = getelementptr %struct.s* %d, i32 0, i32 5
  store i32 %a6, i32* %tmp10, align 4

  ; Two byval calls with the same struct; the RUN lines at the top of the
  ; file grep for exactly two rep.movsl matches (presumably one copy per call).
  call void @f( %struct.s* %d byval)
  call void @f( %struct.s* %d byval)
  ret void
}
|
|
|
|
; External function with no body in this file; its single parameter is a
; %struct.s pointer carrying the byval attribute.
declare void @f(%struct.s* byval)
|