; third_party/LLVM/test/Transforms/ScalarRepl/vector_memcpy.ll - SwiftShader - Git at Google

 ; Test driver: runs this file through opt with the -scalarrepl pass and writes
 ; the textual IR to a temporary file, then greps that output for two return
 ; instructions:
 ;   * `ret <16 x float> %A`              - expected from @foo (memcpy case)
 ;   * `ret <16 x float> zeroinitializer` - expected from @foo2 (memset case)
 ; RUN: opt < %s -scalarrepl -S > %t
 ; RUN: grep {ret <16 x float> %A} %t
 ; RUN: grep {ret <16 x float> zeroinitializer} %t
 ; Data layout: big-endian ("E") with 64-bit pointers; 128-bit vectors are
 ; 128-bit aligned (v128:128:128).
 target datalayout = "E-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:32:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64"

 ; @foo: round-trips the vector argument %A through two stack slots.
 ; %A is stored to %tmp, the whole 64-byte slot (16 floats x 4 bytes) is copied
 ; to %tmp2 with memcpy, and %tmp2 is loaded and returned. The grep lines at the
 ; top of this file expect -scalarrepl to reduce this to `ret <16 x float> %A`.
 define <16 x float> @foo(<16 x float> %A) nounwind {
 	; Two 16-byte-aligned stack slots, each holding one <16 x float>.
 	%tmp = alloca <16 x float>, align 16
 	%tmp2 = alloca <16 x float>, align 16
 	; Spill the incoming vector into the source slot.
 	store <16 x float> %A, <16 x float>* %tmp
 	; memcpy takes i8* operands, so view both slots as byte pointers.
 	%s = bitcast <16 x float>* %tmp to i8*
 	%s2 = bitcast <16 x float>* %tmp2 to i8*
 	; Copy 64 bytes from %tmp (%s) to %tmp2 (%s2); the trailing i32 16 is the
 	; alignment operand of this legacy intrinsic form.
 	call void @llvm.memcpy.i64(i8* %s2, i8* %s, i64 64, i32 16)

 	; Read the copied vector back from the destination slot and return it.
 	%R = load <16 x float>* %tmp2
 	ret <16 x float> %R
 }

 ; @foo2: zero-fills a <16 x float> stack slot with memset and returns its
 ; contents. The argument %A is not used in the body. The grep lines at the top
 ; of this file expect -scalarrepl to reduce this to
 ; `ret <16 x float> zeroinitializer`.
 define <16 x float> @foo2(<16 x float> %A) nounwind {
 	; One 16-byte-aligned stack slot holding a <16 x float>.
 	%tmp2 = alloca <16 x float>, align 16

 	; memset takes an i8* operand, so view the slot as a byte pointer.
 	%s2 = bitcast <16 x float>* %tmp2 to i8*
 	; Write 64 zero bytes (the full 16 x 4-byte vector); the trailing i32 16 is
 	; the alignment operand of this legacy intrinsic form.
 	call void @llvm.memset.i64(i8* %s2, i8 0, i64 64, i32 16)

 	; Load the zero-filled vector and return it.
 	%R = load <16 x float>* %tmp2
 	ret <16 x float> %R
 }


 ; Legacy (pre-overloaded-pointer) memory intrinsics used by @foo and @foo2.
 ; Operands: memcpy(dest, src, length, alignment); memset(dest, byte value,
 ; length, alignment). Pointer operands are marked nocapture.
 declare void @llvm.memcpy.i64(i8* nocapture, i8* nocapture, i64, i32) nounwind
 declare void @llvm.memset.i64(i8* nocapture, i8, i64, i32) nounwind
	; NOTE(review): these directives and the datalayout repeat the ones at the
	; top of this file verbatim (only the indentation differs) - confirm whether
	; this second copy is an extraction artifact.
	; Test driver: runs this file through opt with the -scalarrepl pass, then
	; greps the output for `ret <16 x float> %A` and
	; `ret <16 x float> zeroinitializer`.
	; RUN: opt < %s -scalarrepl -S > %t
	; RUN: grep {ret <16 x float> %A} %t
	; RUN: grep {ret <16 x float> zeroinitializer} %t
	; Data layout: big-endian ("E") with 64-bit pointers; 128-bit vectors are
	; 128-bit aligned (v128:128:128).
	target datalayout = "E-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:32:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64"

	; NOTE(review): @foo is already defined earlier in this file with an
	; identical body; a second definition of the same function is rejected by
	; the IR parser - confirm whether this copy is an extraction artifact.
	; @foo: stores %A to %tmp, copies the 64-byte slot to %tmp2 with memcpy,
	; then loads and returns %tmp2. The grep lines in this file expect
	; -scalarrepl to reduce this to `ret <16 x float> %A`.
	define <16 x float> @foo(<16 x float> %A) nounwind {
	; Two 16-byte-aligned stack slots, each holding one <16 x float>.
	%tmp = alloca <16 x float>, align 16
	%tmp2 = alloca <16 x float>, align 16
	; Spill the incoming vector into the source slot.
	store <16 x float> %A, <16 x float>* %tmp
	; memcpy takes i8* operands, so view both slots as byte pointers.
	%s = bitcast <16 x float>* %tmp to i8*
	%s2 = bitcast <16 x float>* %tmp2 to i8*
	; Copy 64 bytes (16 floats x 4 bytes) from %tmp to %tmp2; the trailing
	; i32 16 is the alignment operand of this legacy intrinsic form.
	call void @llvm.memcpy.i64(i8* %s2, i8* %s, i64 64, i32 16)

	; Read the copied vector back from the destination slot and return it.
	%R = load <16 x float>* %tmp2
	ret <16 x float> %R
	}

	; NOTE(review): @foo2 is already defined earlier in this file with an
	; identical body; a second definition of the same function is rejected by
	; the IR parser - confirm whether this copy is an extraction artifact.
	; @foo2: zero-fills a <16 x float> stack slot with memset and returns its
	; contents; %A is not used in the body. The grep lines in this file expect
	; -scalarrepl to reduce this to `ret <16 x float> zeroinitializer`.
	define <16 x float> @foo2(<16 x float> %A) nounwind {
	; One 16-byte-aligned stack slot holding a <16 x float>.
	%tmp2 = alloca <16 x float>, align 16

	; memset takes an i8* operand, so view the slot as a byte pointer.
	%s2 = bitcast <16 x float>* %tmp2 to i8*
	; Write 64 zero bytes (the full 16 x 4-byte vector); the trailing i32 16
	; is the alignment operand of this legacy intrinsic form.
	call void @llvm.memset.i64(i8* %s2, i8 0, i64 64, i32 16)

	; Load the zero-filled vector and return it.
	%R = load <16 x float>* %tmp2
	ret <16 x float> %R
	}


	; NOTE(review): these declarations repeat the ones earlier in this file -
	; confirm whether this copy is an extraction artifact.
	; Legacy memory intrinsics used by @foo and @foo2.
	; Operands: memcpy(dest, src, length, alignment); memset(dest, byte value,
	; length, alignment). Pointer operands are marked nocapture.
	declare void @llvm.memcpy.i64(i8* nocapture, i8* nocapture, i64, i32) nounwind
	declare void @llvm.memset.i64(i8* nocapture, i8, i64, i32) nounwind