diff options
author | Bruno Cardoso Lopes <bruno.cardoso@gmail.com> | 2011-07-28 01:26:50 +0000 |
---|---|---|
committer | Bruno Cardoso Lopes <bruno.cardoso@gmail.com> | 2011-07-28 01:26:50 +0000 |
commit | 76bc28bac6625b4eaf585a0198f44e642251aed9 (patch) | |
tree | 5b44010c8e233c6b5c44bb515afda769ef44039d | |
parent | 3fb0b635bd41ede64765d3cc2bd99ee3f82cc0c0 (diff) | |
download | bcm5719-llvm-76bc28bac6625b4eaf585a0198f44e642251aed9.tar.gz bcm5719-llvm-76bc28bac6625b4eaf585a0198f44e642251aed9.zip |
Add patterns to generate copies for extract_subvector instead of
using vextractf128. This will reduce the number of issued instruction
for several avx codes.
llvm-svn: 136323
-rw-r--r-- | llvm/lib/Target/X86/X86InstrSSE.td | 12 | ||||
-rw-r--r-- | llvm/test/CodeGen/X86/avx-cast.ll | 6 |
2 files changed, 15 insertions, 3 deletions
diff --git a/llvm/lib/Target/X86/X86InstrSSE.td b/llvm/lib/Target/X86/X86InstrSSE.td index a3e8c4065d4..db1ab527f4f 100644 --- a/llvm/lib/Target/X86/X86InstrSSE.td +++ b/llvm/lib/Target/X86/X86InstrSSE.td @@ -5452,6 +5452,18 @@ def : Pat<(vextractf128_extract:$ext VR256:$src1, (i32 imm)), (v32i8 VR256:$src1), (EXTRACT_get_vextractf128_imm VR128:$ext)))>; +// Special COPY patterns +def : Pat<(v4i32 (extract_subvector (v8i32 VR256:$src), (i32 0))), + (v4i32 (EXTRACT_SUBREG (v8i32 VR256:$src), sub_xmm))>; +def : Pat<(v4f32 (extract_subvector (v8f32 VR256:$src), (i32 0))), + (v4f32 (EXTRACT_SUBREG (v8f32 VR256:$src), sub_xmm))>; + +def : Pat<(v2i64 (extract_subvector (v4i64 VR256:$src), (i32 0))), + (v2i64 (EXTRACT_SUBREG (v4i64 VR256:$src), sub_xmm))>; +def : Pat<(v2f64 (extract_subvector (v4f64 VR256:$src), (i32 0))), + (v2f64 (EXTRACT_SUBREG (v4f64 VR256:$src), sub_xmm))>; + + //===----------------------------------------------------------------------===// // VMASKMOV - Conditional SIMD Packed Loads and Stores // diff --git a/llvm/test/CodeGen/X86/avx-cast.ll b/llvm/test/CodeGen/X86/avx-cast.ll index 7e368b3d9ee..d6d2415ea05 100644 --- a/llvm/test/CodeGen/X86/avx-cast.ll +++ b/llvm/test/CodeGen/X86/avx-cast.ll @@ -24,21 +24,21 @@ entry: ret <4 x i64> %shuffle.i } -; CHECK: vextractf128 $0 +; CHECK-NOT: vextractf128 $0 define <4 x float> @castD(<8 x float> %m) nounwind uwtable readnone ssp { entry: %shuffle.i = shufflevector <8 x float> %m, <8 x float> %m, <4 x i32> <i32 0, i32 1, i32 2, i32 3> ret <4 x float> %shuffle.i } -; CHECK: vextractf128 $0 +; CHECK-NOT: vextractf128 $0 define <2 x i64> @castE(<4 x i64> %m) nounwind uwtable readnone ssp { entry: %shuffle.i = shufflevector <4 x i64> %m, <4 x i64> %m, <2 x i32> <i32 0, i32 1> ret <2 x i64> %shuffle.i } -; CHECK: vextractf128 $0 +; CHECK-NOT: vextractf128 $0 define <2 x double> @castF(<4 x double> %m) nounwind uwtable readnone ssp { entry: %shuffle.i = shufflevector <4 x double> %m, <4 x double> %m, <2 x i32> <i32 0, i32 1> |