diff options
author | Bob Wilson <bob.wilson@apple.com> | 2009-08-08 05:53:00 +0000 |
---|---|---|
committer | Bob Wilson <bob.wilson@apple.com> | 2009-08-08 05:53:00 +0000 |
commit | 64efd90f8c878214abc29afa3d1c1e7bfe854a49 (patch) | |
tree | 9be36b26d6b2d9f2b20600577471d4b6d4d02bd6 /lib/Target/ARM/ARMInstrNEON.td | |
parent | b7479c035534b1c240117cd0aea8342393160da8 (diff) | |
download | external_llvm-64efd90f8c878214abc29afa3d1c1e7bfe854a49.zip external_llvm-64efd90f8c878214abc29afa3d1c1e7bfe854a49.tar.gz external_llvm-64efd90f8c878214abc29afa3d1c1e7bfe854a49.tar.bz2 |
Implement Neon VTRN instructions. For now, anyway, these are selected
directly from the intrinsics produced by the frontend. If it is more
convenient to have a custom DAG node for using these to implement shuffles,
we can add that later.
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@78459 91177308-0d34-0410-b5e6-96231b3b80d8
Diffstat (limited to 'lib/Target/ARM/ARMInstrNEON.td')
-rw-r--r-- | lib/Target/ARM/ARMInstrNEON.td | 21 |
1 files changed, 21 insertions, 0 deletions
diff --git a/lib/Target/ARM/ARMInstrNEON.td b/lib/Target/ARM/ARMInstrNEON.td index d7b132c..a69ef12 100644 --- a/lib/Target/ARM/ARMInstrNEON.td +++ b/lib/Target/ARM/ARMInstrNEON.td @@ -1917,6 +1917,27 @@ class VREV16Q<bits<2> op19_18, string OpcodeStr, ValueType Ty> def VREV16d8 : VREV16D<0b00, "vrev16.8", v8i8>; def VREV16q8 : VREV16Q<0b00, "vrev16.8", v16i8>; +// VTRN : Vector Transpose + +class VTRND<bits<2> op19_18, string OpcodeStr> + : N2V<0b11, 0b11, op19_18, 0b10, 0b00001, 0, 0, (outs DPR:$dst1, DPR:$dst2), + (ins DPR:$src1, DPR:$src2), NoItinerary, + !strconcat(OpcodeStr, "\t$dst1, $dst2"), + "$src1 = $dst1, $src2 = $dst2", []>; +class VTRNQ<bits<2> op19_18, string OpcodeStr> + : N2V<0b11, 0b11, op19_18, 0b10, 0b00001, 1, 0, (outs QPR:$dst1, QPR:$dst2), + (ins QPR:$src1, QPR:$src2), NoItinerary, + !strconcat(OpcodeStr, "\t$dst1, $dst2"), + "$src1 = $dst1, $src2 = $dst2", []>; + +def VTRNd8 : VTRND<0b00, "vtrn.8">; +def VTRNd16 : VTRND<0b01, "vtrn.16">; +def VTRNd32 : VTRND<0b10, "vtrn.32">; + +def VTRNq8 : VTRNQ<0b00, "vtrn.8">; +def VTRNq16 : VTRNQ<0b01, "vtrn.16">; +def VTRNq32 : VTRNQ<0b10, "vtrn.32">; + //===----------------------------------------------------------------------===// // NEON instructions for single-precision FP math //===----------------------------------------------------------------------===// |