Add new intrinsics for Neon VTRN, VZIP and VUZP operations. Modeling these

as vector shuffles did not work out well. Shuffles that produce double-wide vectors accurately represent the operation but make it hard to do anything with the results. I considered splitting them up into 2 shuffles, one to write each register separately, but there doesn't seem to be a good way to reunite them for codegen. git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@78437 91177308-0d34-0410-b5e6-96231b3b80d8
author: Bob Wilson <bob.wilson@apple.com> 2009-08-07 23:53:05 +0000
committer: Bob Wilson <bob.wilson@apple.com> 2009-08-07 23:53:05 +0000
commit: 9e699cc72639f25b20e73f51ab06ab7a0884ea62 (patch)
tree: 8e0082e7544b47805f1f4cad5ba444dd66308f26 /include/llvm/IntrinsicsARM.td
parent: c3c9239d76e2acb01dac8c72323a0b28fadebe4b (diff)
download: llvm-9e699cc72639f25b20e73f51ab06ab7a0884ea62.tar.gz
llvm-9e699cc72639f25b20e73f51ab06ab7a0884ea62.tar.bz2
llvm-9e699cc72639f25b20e73f51ab06ab7a0884ea62.tar.xz
1 files changed, 18 insertions, 0 deletions
diff --git a/include/llvm/IntrinsicsARM.td b/include/llvm/IntrinsicsARM.td
index efe5bff437..e9a7e2e91d 100644
--- a/include/llvm/IntrinsicsARM.td
+++ b/include/llvm/IntrinsicsARM.td
@@ -66,6 +66,12 @@ let TargetPrefix = "arm" in {  // All intrinsics start with "llvm.arm.".
                  LLVMTruncatedElementVectorType<0>,
                  LLVMTruncatedElementVectorType<0>],
                 [IntrNoMem]>;
+  class Neon_2Result_Intrinsic
+    : Intrinsic<[llvm_anyint_ty, LLVMMatchType<0>],
+                [LLVMMatchType<0>, LLVMMatchType<0>], [IntrNoMem]>;
+  class Neon_2Result_Float_Intrinsic
+    : Intrinsic<[llvm_anyfloat_ty, LLVMMatchType<0>],
+                [LLVMMatchType<0>, LLVMMatchType<0>], [IntrNoMem]>;
   class Neon_CvtFxToFP_Intrinsic
     : Intrinsic<[llvm_anyfloat_ty], [llvm_anyint_ty, llvm_i32_ty], [IntrNoMem]>;
   class Neon_CvtFPToFx_Intrinsic
@@ -288,6 +294,18 @@ def int_arm_neon_vqmovnsu : Neon_1Arg_Narrow_Intrinsic;
 def int_arm_neon_vmovls : Neon_1Arg_Long_Intrinsic;
 def int_arm_neon_vmovlu : Neon_1Arg_Long_Intrinsic;
 
+// Vector Transpose.
+def int_arm_neon_vtrni : Neon_2Result_Intrinsic;
+def int_arm_neon_vtrnf : Neon_2Result_Float_Intrinsic;
+
+// Vector Interleave (vzip).
+def int_arm_neon_vzipi : Neon_2Result_Intrinsic;
+def int_arm_neon_vzipf : Neon_2Result_Float_Intrinsic;
+
+// Vector Deinterleave (vuzp).
+def int_arm_neon_vuzpi : Neon_2Result_Intrinsic;
+def int_arm_neon_vuzpf : Neon_2Result_Float_Intrinsic;
+
 let TargetPrefix = "arm" in {
 
   // De-interleaving vector loads from N-element structures.
author	Bob Wilson <bob.wilson@apple.com>	2009-08-07 23:53:05 +0000
committer	Bob Wilson <bob.wilson@apple.com>	2009-08-07 23:53:05 +0000
commit	9e699cc72639f25b20e73f51ab06ab7a0884ea62 (patch)
tree	8e0082e7544b47805f1f4cad5ba444dd66308f26 /include/llvm/IntrinsicsARM.td
parent	c3c9239d76e2acb01dac8c72323a0b28fadebe4b (diff)
download	llvm-9e699cc72639f25b20e73f51ab06ab7a0884ea62.tar.gz llvm-9e699cc72639f25b20e73f51ab06ab7a0884ea62.tar.bz2 llvm-9e699cc72639f25b20e73f51ab06ab7a0884ea62.tar.xz