diff options
author | Bruno Cardoso Lopes <bruno.cardoso@gmail.com> | 2010-06-19 00:37:31 +0000 |
---|---|---|
committer | Bruno Cardoso Lopes <bruno.cardoso@gmail.com> | 2010-06-19 00:37:31 +0000 |
commit | be4d595afd6e0d1a1c0a511dabf2c5a724bdf366 (patch) | |
tree | 5999f608fcf3bd19475aa6c2c52803ff10f08524 /lib | |
parent | 617e595022504652c083421dbb49a9c5d95aba23 (diff) | |
download | external_llvm-be4d595afd6e0d1a1c0a511dabf2c5a724bdf366.zip external_llvm-be4d595afd6e0d1a1c0a511dabf2c5a724bdf366.tar.gz external_llvm-be4d595afd6e0d1a1c0a511dabf2c5a724bdf366.tar.bz2 |
Shrink down code and add for free AVX {MIN,MAX}P{S,D}{rm,rr} instructions
git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@106366 91177308-0d34-0410-b5e6-96231b3b80d8
Diffstat (limited to 'lib')
-rw-r--r-- | lib/Target/X86/X86InstrSSE.td | 87 |
1 files changed, 28 insertions, 59 deletions
diff --git a/lib/Target/X86/X86InstrSSE.td b/lib/Target/X86/X86InstrSSE.td index 1c84cc7..88c4771 100644 --- a/lib/Target/X86/X86InstrSSE.td +++ b/lib/Target/X86/X86InstrSSE.td @@ -788,6 +788,24 @@ multiclass sse12_fp_binop_rm<bits<8> opc, string OpcodeStr, defm V#NAME#SD : sse12_fp_scalar<opc, !strconcat(OpcodeStr, "sd\t{$src2, $src1, $dst|$dst, $src1, $src2}"), OpNode, FR64, f64mem>, XD, VEX_4V; + + defm V#NAME#PS : sse12_fp_packed<opc, !strconcat(OpcodeStr, + "ps\t{$src2, $src1, $dst|$dst, $src1, $src2}"), OpNode, + VR128, v4f32, f128mem, memopv4f32, SSEPackedSingle>, + VEX_4V; + + defm V#NAME#PD : sse12_fp_packed<opc, !strconcat(OpcodeStr, + "pd\t{$src2, $src1, $dst|$dst, $src1, $src2}"), OpNode, + VR128, v2f64, f128mem, memopv2f64, SSEPackedDouble>, + OpSize, VEX_4V; + + defm V#NAME#SS : sse12_fp_scalar_int<opc, OpcodeStr, VR128, + !strconcat(OpcodeStr, "ss\t{$src2, $src1, $dst|$dst, $src1, $src2}"), + "", "_ss", ssmem, sse_load_f32>, XS, VEX_4V; + + defm V#NAME#SD : sse12_fp_scalar_int<opc, OpcodeStr, VR128, + !strconcat(OpcodeStr, "sd\t{$src2, $src1, $dst|$dst, $src1, $src2}"), + "2", "_sd", sdmem, sse_load_f64>, XD, VEX_4V; } let Constraints = "$src1 = $dst" in { @@ -798,72 +816,23 @@ multiclass sse12_fp_binop_rm<bits<8> opc, string OpcodeStr, defm SD : sse12_fp_scalar<opc, !strconcat(OpcodeStr, "sd\t{$src2, $dst|$dst, $src2}"), OpNode, FR64, f64mem>, XD; - } - - // Vector operation, reg+reg. - def PSrr : PSI<opc, MRMSrcReg, (outs VR128:$dst), - (ins VR128:$src1, VR128:$src2), - !strconcat(OpcodeStr, "ps\t{$src2, $dst|$dst, $src2}"), - [(set VR128:$dst, (v4f32 (OpNode VR128:$src1, VR128:$src2)))]> { - let isCommutable = Commutable; - } - - def PDrr : PDI<opc, MRMSrcReg, (outs VR128:$dst), - (ins VR128:$src1, VR128:$src2), - !strconcat(OpcodeStr, "pd\t{$src2, $dst|$dst, $src2}"), - [(set VR128:$dst, (v2f64 (OpNode VR128:$src1, VR128:$src2)))]> { - let isCommutable = Commutable; - } - - // Vector operation, reg+mem. - def PSrm : PSI<opc, MRMSrcMem, (outs VR128:$dst), - (ins VR128:$src1, f128mem:$src2), - !strconcat(OpcodeStr, "ps\t{$src2, $dst|$dst, $src2}"), - [(set VR128:$dst, (OpNode VR128:$src1, (memopv4f32 addr:$src2)))]>; + defm PS : sse12_fp_packed<opc, !strconcat(OpcodeStr, + "ps\t{$src2, $dst|$dst, $src2}"), OpNode, VR128, v4f32, + f128mem, memopv4f32, SSEPackedSingle>, TB; - def PDrm : PDI<opc, MRMSrcMem, (outs VR128:$dst), - (ins VR128:$src1, f128mem:$src2), - !strconcat(OpcodeStr, "pd\t{$src2, $dst|$dst, $src2}"), - [(set VR128:$dst, (OpNode VR128:$src1, (memopv2f64 addr:$src2)))]>; + defm PD : sse12_fp_packed<opc, !strconcat(OpcodeStr, + "pd\t{$src2, $dst|$dst, $src2}"), OpNode, VR128, v2f64, + f128mem, memopv2f64, SSEPackedDouble>, TB, OpSize; - // Intrinsic operation, reg+reg. - def SSrr_Int : SSI<opc, MRMSrcReg, (outs VR128:$dst), - (ins VR128:$src1, VR128:$src2), + defm SS : sse12_fp_scalar_int<opc, OpcodeStr, VR128, !strconcat(OpcodeStr, "ss\t{$src2, $dst|$dst, $src2}"), - [(set VR128:$dst, (!nameconcat<Intrinsic>("int_x86_sse_", - !strconcat(OpcodeStr, "_ss")) VR128:$src1, - VR128:$src2))]> { - // int_x86_sse_xxx_ss - let isCommutable = Commutable; - } + "", "_ss", ssmem, sse_load_f32>, XS; - def SDrr_Int : SDI<opc, MRMSrcReg, (outs VR128:$dst), - (ins VR128:$src1, VR128:$src2), + defm SD : sse12_fp_scalar_int<opc, OpcodeStr, VR128, !strconcat(OpcodeStr, "sd\t{$src2, $dst|$dst, $src2}"), - [(set VR128:$dst, (!nameconcat<Intrinsic>("int_x86_sse2_", - !strconcat(OpcodeStr, "_sd")) VR128:$src1, - VR128:$src2))]> { - // int_x86_sse2_xxx_sd - let isCommutable = Commutable; + "2", "_sd", sdmem, sse_load_f64>, XD; } - // Intrinsic operation, reg+mem. - def SSrm_Int : SSI<opc, MRMSrcMem, (outs VR128:$dst), - (ins VR128:$src1, ssmem:$src2), - !strconcat(OpcodeStr, "ss\t{$src2, $dst|$dst, $src2}"), - [(set VR128:$dst, (!nameconcat<Intrinsic>("int_x86_sse_", - !strconcat(OpcodeStr, "_ss")) VR128:$src1, - sse_load_f32:$src2))]>; - // int_x86_sse_xxx_ss - - def SDrm_Int : SDI<opc, MRMSrcMem, (outs VR128:$dst), - (ins VR128:$src1, sdmem:$src2), - !strconcat(OpcodeStr, "sd\t{$src2, $dst|$dst, $src2}"), - [(set VR128:$dst, (!nameconcat<Intrinsic>("int_x86_sse2_", - !strconcat(OpcodeStr, "_sd")) VR128:$src1, - sse_load_f64:$src2))]>; - // int_x86_sse2_xxx_sd - // Vector intrinsic operation, reg+reg. def PSrr_Int : PSI<opc, MRMSrcReg, (outs VR128:$dst), (ins VR128:$src1, VR128:$src2), |