ARM: add cyclone CPU with ZeroCycleZeroing feature.

The Cyclone CPU is similar to swift for most LLVM purposes, but does have two preferred instructions for zeroing a VFP register. This teaches LLVM about them. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@205309 91177308-0d34-0410-b5e6-96231b3b80d8
author: Tim Northover <tnorthover@apple.com> 2014-04-01 13:22:02 +0000
committer: Tim Northover <tnorthover@apple.com> 2014-04-01 13:22:02 +0000
commit: c077472250ef27e514f5ad44f3b258a18a70f065 (patch)
tree: 29202ba7c1bc69f0b720c6d9a43168d066b1aa78 /lib/Target/ARM/ARMInstrNEON.td
parent: 279edf967edc1b2dcaaad3e263972cb4fe83b35d (diff)
download: llvm-c077472250ef27e514f5ad44f3b258a18a70f065.tar.gz
llvm-c077472250ef27e514f5ad44f3b258a18a70f065.tar.bz2
llvm-c077472250ef27e514f5ad44f3b258a18a70f065.tar.xz
1 files changed, 20 insertions, 0 deletions
diff --git a/lib/Target/ARM/ARMInstrNEON.td b/lib/Target/ARM/ARMInstrNEON.td
index b18eac55d8..0d46c49bcf 100644
--- a/lib/Target/ARM/ARMInstrNEON.td
+++ b/lib/Target/ARM/ARMInstrNEON.td
@@ -5245,6 +5245,26 @@ def VMOVv4f32 : N1ModImm<1, 0b000, 0b1111, 0, 1, 0, 1, (outs QPR:$Vd),
                          [(set QPR:$Vd, (v4f32 (NEONvmovFPImm timm:$SIMM)))]>;
 } // isReMaterializable
 
+
+// On some CPUs the two instructions "vmov.i32 dD, #0" and "vmov.i32 qD, #0"
+// require zero cycles to execute so they should be used wherever possible for
+// setting a register to zero.
+
+// Even without these pseudo-insts we would probably end up with the correct
+// instruction, but we could not mark the general ones with "isAsCheapAsAMove"
+// since they are sometimes rather expensive (in general).
+
+let AddedComplexity = 50, isAsCheapAsAMove = 1, isReMaterializable = 1 in {
+  def VMOVD0 : ARMPseudoExpand<(outs DPR:$Vd), (ins), 4, IIC_VMOVImm,
+                               [(set DPR:$Vd, (v2i32 NEONimmAllZerosV))],
+                               (VMOVv2i32 DPR:$Vd, 0, (ops 14, zero_reg))>,
+               Requires<[HasZCZ]>;
+  def VMOVQ0 : ARMPseudoExpand<(outs QPR:$Vd), (ins), 4, IIC_VMOVImm,
+                               [(set QPR:$Vd, (v4i32 NEONimmAllZerosV))],
+                               (VMOVv4i32 QPR:$Vd, 0, (ops 14, zero_reg))>,
+               Requires<[HasZCZ]>;
+}
+
 //   VMOV     : Vector Get Lane (move scalar to ARM core register)
 
 def VGETLNs8  : NVGetLane<{1,1,1,0,0,1,?,1}, 0b1011, {?,?},
author	Tim Northover <tnorthover@apple.com>	2014-04-01 13:22:02 +0000
committer	Tim Northover <tnorthover@apple.com>	2014-04-01 13:22:02 +0000
commit	c077472250ef27e514f5ad44f3b258a18a70f065 (patch)
tree	29202ba7c1bc69f0b720c6d9a43168d066b1aa78 /lib/Target/ARM/ARMInstrNEON.td
parent	279edf967edc1b2dcaaad3e263972cb4fe83b35d (diff)
download	llvm-c077472250ef27e514f5ad44f3b258a18a70f065.tar.gz llvm-c077472250ef27e514f5ad44f3b258a18a70f065.tar.bz2 llvm-c077472250ef27e514f5ad44f3b258a18a70f065.tar.xz