diff options
| author | Craig Topper <craig.topper@gmail.com> | 2016-05-08 07:10:50 +0000 |
|---|---|---|
| committer | Craig Topper <craig.topper@gmail.com> | 2016-05-08 07:10:50 +0000 |
| commit | 3d6722910c6284b4bb28cfec0680741a2259faa4 (patch) | |
| tree | a3a41784c34e26c956b745fc98fe0d7a0ced19a9 /llvm/lib/Target | |
| parent | d7884984119a1492181e31f7ff51c5f6e2534049 (diff) | |
| download | bcm5719-llvm-3d6722910c6284b4bb28cfec0680741a2259faa4.tar.gz bcm5719-llvm-3d6722910c6284b4bb28cfec0680741a2259faa4.zip | |
[X86] Add patterns for 256-bit non-temporal stores when only AVX1 is supported. While there, add a predicate to the SSE2 patterns to avoid an ordering dependency.
llvm-svn: 268872
Diffstat (limited to 'llvm/lib/Target')
| -rw-r--r-- | llvm/lib/Target/X86/X86InstrSSE.td | 26 |
1 files changed, 20 insertions, 6 deletions
diff --git a/llvm/lib/Target/X86/X86InstrSSE.td b/llvm/lib/Target/X86/X86InstrSSE.td index 1490fd03fe5..587d500dc56 100644 --- a/llvm/lib/Target/X86/X86InstrSSE.td +++ b/llvm/lib/Target/X86/X86InstrSSE.td @@ -3648,6 +3648,18 @@ let Predicates = [HasAVX2, NoVLX] in { (VMOVNTDQYmr addr:$dst, VR256:$src)>; } +// If integer type isn't available, use the floating point type. +let Predicates = [HasAVX1Only] in { + def : Pat<(alignednontemporalstore (v4i64 VR256:$src), addr:$dst), + (VMOVNTPSYmr addr:$dst, VR256:$src)>; + def : Pat<(alignednontemporalstore (v8i32 VR256:$src), addr:$dst), + (VMOVNTPSYmr addr:$dst, VR256:$src)>; + def : Pat<(alignednontemporalstore (v16i16 VR256:$src), addr:$dst), + (VMOVNTPSYmr addr:$dst, VR256:$src)>; + def : Pat<(alignednontemporalstore (v32i8 VR256:$src), addr:$dst), + (VMOVNTPSYmr addr:$dst, VR256:$src)>; +} + let Predicates = [HasAVX, NoVLX] in { def : Pat<(alignednontemporalstore (v4i32 VR128:$src), addr:$dst), (VMOVNTDQmr addr:$dst, VR128:$src)>; @@ -3657,12 +3669,14 @@ let Predicates = [HasAVX, NoVLX] in { (VMOVNTDQmr addr:$dst, VR128:$src)>; } -def : Pat<(alignednontemporalstore (v4i32 VR128:$src), addr:$dst), - (MOVNTDQmr addr:$dst, VR128:$src)>; -def : Pat<(alignednontemporalstore (v8i16 VR128:$src), addr:$dst), - (MOVNTDQmr addr:$dst, VR128:$src)>; -def : Pat<(alignednontemporalstore (v16i8 VR128:$src), addr:$dst), - (MOVNTDQmr addr:$dst, VR128:$src)>; +let Predicates = [UseSSE2] in { + def : Pat<(alignednontemporalstore (v4i32 VR128:$src), addr:$dst), + (MOVNTDQmr addr:$dst, VR128:$src)>; + def : Pat<(alignednontemporalstore (v8i16 VR128:$src), addr:$dst), + (MOVNTDQmr addr:$dst, VR128:$src)>; + def : Pat<(alignednontemporalstore (v16i8 VR128:$src), addr:$dst), + (MOVNTDQmr addr:$dst, VR128:$src)>; +} } // AddedComplexity |

