mirror of
https://github.com/RPCSX/llvm.git
synced 2025-01-27 15:22:29 +00:00
47f0e3f434
[…] its own variable. This is needed so that we can explicitly turn off MMX without turning off SSE, and also so that we can diagnose feature-set incompatibilities that involve MMX without SSE.

Rationale:

// sse3
__m128d test_mm_addsub_pd(__m128d A, __m128d B) {
  return _mm_addsub_pd(A, B);
}

// mmx
void shift(__m64 a, __m64 b, int c) {
  _mm_slli_pi16(a, c);
  _mm_slli_pi32(a, c);
  _mm_slli_si64(a, c);
  _mm_srli_pi16(a, c);
  _mm_srli_pi32(a, c);
  _mm_srli_si64(a, c);
  _mm_srai_pi16(a, c);
  _mm_srai_pi32(a, c);
}

clang -msse3 -mno-mmx file.c -c

For this code we should be able to explicitly turn off MMX without affecting the compilation of the SSE3 function, and then diagnose and report an error when compiling the MMX function. This matches the existing gcc behavior and follows the spirit of the SSE/MMX separation in llvm, where we can (and do) turn off MMX code generation except in the presence of intrinsics.

Updated a couple of tests, but primarily tested with a couple of tests for turning on only mmx and only sse.

This is paired with a patch to clang to take advantage of this behavior.

git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@249731 91177308-0d34-0410-b5e6-96231b3b80d8
22 lines
767 B
LLVM
22 lines
767 B
LLVM
; First invocation: MMX is explicitly enabled; SSE is not mentioned in the
; attribute list.
; RUN: llc < %s -march=x86 -mattr=+mmx | FileCheck %s
|
|
; Second invocation: MMX is enabled while SSE is explicitly disabled. The same
; FileCheck expectations are applied to this output.
; RUN: llc < %s -march=x86 -mattr=+mmx,-sse | FileCheck %s
|
|
|
|
; Test that turning off SSE (-sse) doesn't also turn off MMX: the MMX compare
; intrinsic below must still be selected as pcmpgtd.
|
|
|
|
; MMX intrinsic taking two x86_mmx operands and returning an x86_mmx result.
; The test function in this file calls it and expects the generated assembly
; to contain a pcmpgtd instruction.
declare x86_mmx @llvm.x86.mmx.pcmpgt.d(x86_mmx, x86_mmx) nounwind readnone
|
|
|
|
; test88: reinterpret both <1 x i64> arguments as x86_mmx (via <2 x i32>),
; pass them to the MMX pcmpgt.d intrinsic, then convert the x86_mmx result
; back to <1 x i64> and return its single element as an i64.
define i64 @test88(<1 x i64> %a, <1 x i64> %b) nounwind readnone {
; CHECK-LABEL: @test88
; CHECK: pcmpgtd
entry:
  ; View each 64-bit argument as two 32-bit lanes.
  %b.v2i32 = bitcast <1 x i64> %b to <2 x i32>
  %a.v2i32 = bitcast <1 x i64> %a to <2 x i32>

  ; Move both operands into the x86_mmx type expected by the intrinsic.
  %a.mmx = bitcast <2 x i32> %a.v2i32 to x86_mmx
  %b.mmx = bitcast <2 x i32> %b.v2i32 to x86_mmx

  ; The call that must be selected as pcmpgtd.
  %cmp.mmx = tail call x86_mmx @llvm.x86.mmx.pcmpgt.d(x86_mmx %a.mmx, x86_mmx %b.mmx) nounwind

  ; Convert the result back to a scalar i64 for the return value.
  %cmp.v2i32 = bitcast x86_mmx %cmp.mmx to <2 x i32>
  %cmp.v1i64 = bitcast <2 x i32> %cmp.v2i32 to <1 x i64>
  %cmp.i64 = extractelement <1 x i64> %cmp.v1i64, i32 0
  ret i64 %cmp.i64
}
|