[AArch64] Prefer DUP/MOV ("CPY") to INS for vector_extract.

This avoids a partial false dependency on the previous content of the upper lanes of the destination vector register. Differential Revision: http://reviews.llvm.org/D7307 llvm-svn: 227820
author: Ahmed Bougacha <ahmed.bougacha@gmail.com> 2015-02-02 17:55:57 +0000
committer: Ahmed Bougacha <ahmed.bougacha@gmail.com> 2015-02-02 17:55:57 +0000
commit: dff57a61432da0c27869759581c1009d09f40e49 (patch)
tree: b613a98b3a9c6c5f942bed327913dbf279775dac /llvm/lib/Target/AArch64
parent: 8341358adc05877750543fcf2dbbb7e1d60fe645 (diff)
download: bcm5719-llvm-dff57a61432da0c27869759581c1009d09f40e49.tar.gz
bcm5719-llvm-dff57a61432da0c27869759581c1009d09f40e49.zip
1 files changed, 6 insertions, 14 deletions
diff --git a/llvm/lib/Target/AArch64/AArch64InstrInfo.td b/llvm/lib/Target/AArch64/AArch64InstrInfo.td
index e0fb90a9f62..6e4c0b006f2 100644
--- a/llvm/lib/Target/AArch64/AArch64InstrInfo.td
+++ b/llvm/lib/Target/AArch64/AArch64InstrInfo.td
@@ -3716,29 +3716,21 @@ defm : Neon_INS_elt_pattern<v2i64, v1i64, i64, INSvi32lane>;
 
 
 // Floating point vector extractions are codegen'd as either a sequence of
-// subregister extractions, possibly fed by an INS if the lane number is
-// anything other than zero.
+// subregister extractions, or a MOV (aka CPY here, alias for DUP) if
+// the lane number is anything other than zero.
 def : Pat<(vector_extract (v2f64 V128:$Rn), 0),
           (f64 (EXTRACT_SUBREG V128:$Rn, dsub))>;
 def : Pat<(vector_extract (v4f32 V128:$Rn), 0),
           (f32 (EXTRACT_SUBREG V128:$Rn, ssub))>;
 def : Pat<(vector_extract (v8f16 V128:$Rn), 0),
           (f16 (EXTRACT_SUBREG V128:$Rn, hsub))>;
+
 def : Pat<(vector_extract (v2f64 V128:$Rn), VectorIndexD:$idx),
-          (f64 (EXTRACT_SUBREG
-            (INSvi64lane (v2f64 (IMPLICIT_DEF)), 0,
-                         V128:$Rn, VectorIndexD:$idx),
-            dsub))>;
+          (f64 (CPYi64 V128:$Rn, VectorIndexD:$idx))>;
 def : Pat<(vector_extract (v4f32 V128:$Rn), VectorIndexS:$idx),
-          (f32 (EXTRACT_SUBREG
-            (INSvi32lane (v4f32 (IMPLICIT_DEF)), 0,
-                         V128:$Rn, VectorIndexS:$idx),
-            ssub))>;
+          (f32 (CPYi32 V128:$Rn, VectorIndexS:$idx))>;
 def : Pat<(vector_extract (v8f16 V128:$Rn), VectorIndexH:$idx),
-          (f16 (EXTRACT_SUBREG
-            (INSvi16lane (v8f16 (IMPLICIT_DEF)), 0,
-                         V128:$Rn, VectorIndexH:$idx),
-            hsub))>;
+          (f16 (CPYi16 V128:$Rn, VectorIndexH:$idx))>;
 
 // All concat_vectors operations are canonicalised to act on i64 vectors for
 // AArch64. In the general case we need an instruction, which had just as well be
author	Ahmed Bougacha <ahmed.bougacha@gmail.com>	2015-02-02 17:55:57 +0000
committer	Ahmed Bougacha <ahmed.bougacha@gmail.com>	2015-02-02 17:55:57 +0000
commit	dff57a61432da0c27869759581c1009d09f40e49 (patch)
tree	b613a98b3a9c6c5f942bed327913dbf279775dac /llvm/lib/Target/AArch64
parent	8341358adc05877750543fcf2dbbb7e1d60fe645 (diff)
download	bcm5719-llvm-dff57a61432da0c27869759581c1009d09f40e49.tar.gz bcm5719-llvm-dff57a61432da0c27869759581c1009d09f40e49.zip