26 lines
1.5 KiB
LLVM
26 lines
1.5 KiB
LLVM
; RUN: llc < %s -march=x86 -mattr=+sse2 -mtriple=i686-apple-darwin8.8.0 | grep mov | count 7
|
|
|
|
%struct.vector4_t = type { <4 x float> }
|
|
|
|
define void @swizzle(i8* %a, %struct.vector4_t* %b, %struct.vector4_t* %c) nounwind {
|
|
entry:
|
|
%tmp9 = getelementptr %struct.vector4_t* %b, i32 0, i32 0 ; <<4 x float>*> [#uses=2]
|
|
%tmp10 = load <4 x float>* %tmp9, align 16 ; <<4 x float>> [#uses=1]
|
|
%tmp14 = bitcast i8* %a to double* ; <double*> [#uses=1]
|
|
%tmp15 = load double* %tmp14 ; <double> [#uses=1]
|
|
%tmp16 = insertelement <2 x double> undef, double %tmp15, i32 0 ; <<2 x double>> [#uses=1]
|
|
%tmp18 = bitcast <2 x double> %tmp16 to <4 x float> ; <<4 x float>> [#uses=1]
|
|
%tmp19 = shufflevector <4 x float> %tmp10, <4 x float> %tmp18, <4 x i32> < i32 4, i32 5, i32 2, i32 3 > ; <<4 x float>> [#uses=1]
|
|
store <4 x float> %tmp19, <4 x float>* %tmp9, align 16
|
|
%tmp28 = getelementptr %struct.vector4_t* %c, i32 0, i32 0 ; <<4 x float>*> [#uses=2]
|
|
%tmp29 = load <4 x float>* %tmp28, align 16 ; <<4 x float>> [#uses=1]
|
|
%tmp26 = getelementptr i8* %a, i32 8 ; <i8*> [#uses=1]
|
|
%tmp33 = bitcast i8* %tmp26 to double* ; <double*> [#uses=1]
|
|
%tmp34 = load double* %tmp33 ; <double> [#uses=1]
|
|
%tmp35 = insertelement <2 x double> undef, double %tmp34, i32 0 ; <<2 x double>> [#uses=1]
|
|
%tmp37 = bitcast <2 x double> %tmp35 to <4 x float> ; <<4 x float>> [#uses=1]
|
|
%tmp38 = shufflevector <4 x float> %tmp29, <4 x float> %tmp37, <4 x i32> < i32 4, i32 5, i32 2, i32 3 > ; <<4 x float>> [#uses=1]
|
|
store <4 x float> %tmp38, <4 x float>* %tmp28, align 16
|
|
ret void
|
|
}
|