diff options
author | Chris Lattner <sabre@nondot.org> | 2008-03-09 05:42:06 +0000 |
---|---|---|
committer | Chris Lattner <sabre@nondot.org> | 2008-03-09 05:42:06 +0000 |
commit | 66a4ddacc25835471cca23ae48b13e9b6e9486e7 (patch) | |
tree | 7a7fd9ea19992b97cc52890188a1cdab8940c738 /lib/Target/X86/README-SSE.txt | |
parent | 95a0d76b1a4d17d4c1bef4d83cfb307352751e75 (diff) | |
download | external_llvm-66a4ddacc25835471cca23ae48b13e9b6e9486e7.zip external_llvm-66a4ddacc25835471cca23ae48b13e9b6e9486e7.tar.gz external_llvm-66a4ddacc25835471cca23ae48b13e9b6e9486e7.tar.bz2 |
Finish implementing a readme entry: when inserting an i64 variable
into a vector of zeros or undef, and when the top part is obviously
zero, we can just use movd + shuffle. This allows us to compile
vec_set-B.ll into:
_test3:
movl $1234567, %eax
andl 4(%esp), %eax
movd %eax, %xmm0
ret
instead of:
_test3:
subl $28, %esp
movl $1234567, %eax
andl 32(%esp), %eax
movl %eax, (%esp)
movl $0, 4(%esp)
movq (%esp), %xmm0
addl $28, %esp
ret
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@48090 91177308-0d34-0410-b5e6-96231b3b80d8
Diffstat (limited to 'lib/Target/X86/README-SSE.txt')
-rw-r--r-- | lib/Target/X86/README-SSE.txt | 38 |
1 files changed, 0 insertions, 38 deletions
diff --git a/lib/Target/X86/README-SSE.txt b/lib/Target/X86/README-SSE.txt index 7087c68..4d72245 100644 --- a/lib/Target/X86/README-SSE.txt +++ b/lib/Target/X86/README-SSE.txt @@ -781,41 +781,3 @@ LLVM should be able to generate the same thing as gcc. This looks like it is just a matter of matching (scalar_to_vector (load x)) to movd. //===---------------------------------------------------------------------===// - -These two functions should compile to identical code on x86-32: - -define <2 x i64> @test2(i64 %arg) { -entry: - %A = and i64 %arg, 1234567 - %B = insertelement <2 x i64> undef, i64 %A, i32 0 - ret <2 x i64> %B -} - -define <2 x i64> @test2(i64 %arg) { -entry: - %A = and i64 %arg, 1234567 - %B = insertelement <2 x i64> zeroinitializer, i64 %A, i32 0 - ret <2 x i64> %B -} - -The later compiles to: - -_test2: - movl $1234567, %eax - andl 4(%esp), %eax - movd %eax, %xmm0 - ret - -the former compiles to: - -_test2: - subl $28, %esp - movl $1234567, %eax - andl 32(%esp), %eax - movl %eax, (%esp) - movl $0, 4(%esp) - movaps (%esp), %xmm0 - addl $28, %esp - ret - -//===---------------------------------------------------------------------===// |