forked from OSchip/llvm-project
VST2 four-register with-update (writeback) pseudos for fixed/register update.
rdar://10724489 llvm-svn: 148560
This commit is contained in:
parent
9652adf2af
commit
90f5780fc1
|
@ -1409,6 +1409,15 @@ class VSTQQWBPseudo<InstrItinClass itin>
|
|||
: PseudoNLdSt<(outs GPR:$wb),
|
||||
(ins addrmode6:$addr, am6offset:$offset, QQPR:$src), itin,
|
||||
"$addr.addr = $wb">;
|
||||
// Writeback store pseudo over a QQPR source, "fixed" variant: unlike
// VSTQQWBPseudo it takes no offset operand, only the address and the source
// registers. Produces the updated base in GPR:$wb; the trailing string ties
// $wb to $addr.addr (presumably the operand-constraint argument of
// PseudoNLdSt -- confirm against that class's definition).
class VSTQQWBfixedPseudo<InstrItinClass itin>
|
||||
: PseudoNLdSt<(outs GPR:$wb),
|
||||
(ins addrmode6:$addr, QQPR:$src), itin,
|
||||
"$addr.addr = $wb">;
|
||||
// Writeback store pseudo over a QQPR source, "register" variant: the update
// amount is supplied as an explicit rGPR:$offset operand (VSTQQWBPseudo uses
// am6offset:$offset instead). Produces the updated base in GPR:$wb; the
// trailing string ties $wb to $addr.addr (presumably the operand-constraint
// argument of PseudoNLdSt -- confirm against that class's definition).
class VSTQQWBregisterPseudo<InstrItinClass itin>
|
||||
: PseudoNLdSt<(outs GPR:$wb),
|
||||
(ins addrmode6:$addr, rGPR:$offset, QQPR:$src), itin,
|
||||
"$addr.addr = $wb">;
|
||||
|
||||
// Store pseudo over a QQQQPR source with no writeback: it has no outputs,
// takes only the address and the source registers, and passes an empty
// trailing string to PseudoNLdSt.
class VSTQQQQPseudo<InstrItinClass itin>
|
||||
: PseudoNLdSt<(outs), (ins addrmode6:$addr, QQQQPR:$src), itin, "">;
|
||||
class VSTQQQQWBPseudo<InstrItinClass itin>
|
||||
|
@ -1680,12 +1689,12 @@ def VST2d8PseudoWB_register : VSTQWBregisterPseudo<IIC_VST2u>;
|
|||
def VST2d16PseudoWB_register : VSTQWBregisterPseudo<IIC_VST2u>;
|
||||
def VST2d32PseudoWB_register : VSTQWBregisterPseudo<IIC_VST2u>;
|
||||
|
||||
def VST2q8PseudoWB_fixed : VSTQQWBPseudo<IIC_VST2x2u>;
|
||||
def VST2q16PseudoWB_fixed : VSTQQWBPseudo<IIC_VST2x2u>;
|
||||
def VST2q32PseudoWB_fixed : VSTQQWBPseudo<IIC_VST2x2u>;
|
||||
def VST2q8PseudoWB_register : VSTQQWBPseudo<IIC_VST2x2u>;
|
||||
def VST2q16PseudoWB_register : VSTQQWBPseudo<IIC_VST2x2u>;
|
||||
def VST2q32PseudoWB_register : VSTQQWBPseudo<IIC_VST2x2u>;
|
||||
// VST2q{8,16,32} writeback pseudos. The _fixed defs instantiate
// VSTQQWBfixedPseudo (no offset operand) and the _register defs instantiate
// VSTQQWBregisterPseudo (rGPR offset operand); all six share the
// IIC_VST2x2u itinerary.
def VST2q8PseudoWB_fixed : VSTQQWBfixedPseudo<IIC_VST2x2u>;
|
||||
def VST2q16PseudoWB_fixed : VSTQQWBfixedPseudo<IIC_VST2x2u>;
|
||||
def VST2q32PseudoWB_fixed : VSTQQWBfixedPseudo<IIC_VST2x2u>;
|
||||
def VST2q8PseudoWB_register : VSTQQWBregisterPseudo<IIC_VST2x2u>;
|
||||
def VST2q16PseudoWB_register : VSTQQWBregisterPseudo<IIC_VST2x2u>;
|
||||
def VST2q32PseudoWB_register : VSTQQWBregisterPseudo<IIC_VST2x2u>;
|
||||
|
||||
// ...with double-spaced registers
|
||||
def VST2b8 : VST2<0b1001, {0,0,?,?}, "8", VecListTwoQ, IIC_VST2>;
|
||||
|
|
|
@ -119,6 +119,15 @@ define i8* @vst2update(i8* %out, <4 x i16>* %B) nounwind {
|
|||
ret i8* %t5
|
||||
}
|
||||
|
||||
; Test for a vst2 of two <4 x float> values followed by a pointer bump.
; Loads one <4 x float> from %this, passes it as both vector operands of
; llvm.arm.neon.vst2.v4f32 storing to %out, then returns %out advanced by
; 32 bytes (the combined size of the two 16-byte vectors). The FileCheck
; directives below expect a single four-D-register vst2.32 using the
; post-increment address form "[r0]!".
define i8* @vst2update2(i8 * %out, <4 x float> * %this) nounwind optsize ssp align 2 {
|
||||
;CHECK: vst2update2
|
||||
;CHECK: vst2.32 {d16, d17, d18, d19}, [r0]!
|
||||
%tmp1 = load <4 x float>* %this
|
||||
call void @llvm.arm.neon.vst2.v4f32(i8* %out, <4 x float> %tmp1, <4 x float> %tmp1, i32 4) nounwind
|
||||
%tmp2 = getelementptr inbounds i8* %out, i32 32
|
||||
ret i8* %tmp2
|
||||
}
|
||||
|
||||
declare void @llvm.arm.neon.vst2.v8i8(i8*, <8 x i8>, <8 x i8>, i32) nounwind
|
||||
declare void @llvm.arm.neon.vst2.v4i16(i8*, <4 x i16>, <4 x i16>, i32) nounwind
|
||||
declare void @llvm.arm.neon.vst2.v2i32(i8*, <2 x i32>, <2 x i32>, i32) nounwind
|
||||
|
|
Loading…
Reference in New Issue