; File: vector_memcpy.ll

  ; Runs the scalarrepl pass over this file and greps the printed IR for the
  ; two return instructions expected once the stack temporaries in @foo and
  ; @foo2 have been eliminated.
  ; RUN: opt < %s -scalarrepl -S > %t
  ; RUN: grep "ret <16 x float> %A" %t
  ; RUN: grep "ret <16 x float> zeroinitializer" %t

  ; Leading "E" selects big-endian; "p:64:64:64" gives 64-bit pointers.
  target datalayout = "E-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:32:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64"
  ; @foo: round-trips %A through two stack slots joined by a memcpy.
  ;
  ; %A is stored to the first slot, all 64 bytes (16 x 4-byte float) are
  ; copied to the second slot with llvm.memcpy, and the vector loaded back
  ; from the second slot is returned. The lit lines at the top of the file
  ; expect scalarrepl to reduce this to a direct return of %A.
  define <16 x float> @foo(<16 x float> %A) nounwind {
    %src.slot = alloca <16 x float>, align 16
    %dst.slot = alloca <16 x float>, align 16

    ; Spill the incoming vector so the memcpy has a source in memory.
    store <16 x float> %A, <16 x float>* %src.slot

    ; The memcpy intrinsic takes i8* operands, so view both slots as bytes.
    %src.raw = bitcast <16 x float>* %src.slot to i8*
    %dst.raw = bitcast <16 x float>* %dst.slot to i8*

    ; Copy the whole vector: length 64 covers the full <16 x float>.
    call void @llvm.memcpy.p0i8.p0i8.i64(i8* %dst.raw, i8* %src.raw, i64 64, i32 16, i1 false)

    ; Read the copy back as a vector and return it.
    %copy = load <16 x float>, <16 x float>* %dst.slot
    ret <16 x float> %copy
  }
  ; @foo2: zero-fills a stack slot with memset and returns it as a vector.
  ;
  ; The parameter %A is not used in the body. All 64 bytes of the slot are
  ; set to 0 via llvm.memset and then loaded as <16 x float>. The lit lines
  ; at the top of the file expect scalarrepl to reduce this to a return of
  ; zeroinitializer.
  define <16 x float> @foo2(<16 x float> %A) nounwind {
    %zero.slot = alloca <16 x float>, align 16

    ; The memset intrinsic takes an i8* destination.
    %zero.raw = bitcast <16 x float>* %zero.slot to i8*

    ; Fill value 0, length 64: every byte of the vector slot is cleared.
    call void @llvm.memset.p0i8.i64(i8* %zero.raw, i8 0, i64 64, i32 16, i1 false)

    %filled = load <16 x float>, <16 x float>* %zero.slot
    ret <16 x float> %filled
  }
  ; Intrinsics called by @foo and @foo2. Both use the five-/five-operand form
  ; seen at the call sites in this file: pointer operand(s), a fill byte for
  ; memset, an i64 length, then an i32 and an i1 (passed as 16 and false).
  ; NOTE(review): per the LLVM LangRef of this era the trailing i32/i1 are the
  ; alignment and the volatile flag; confirm against the LLVM version in use.
  declare void @llvm.memset.p0i8.i64(i8* nocapture, i8, i64, i32, i1) nounwind
  declare void @llvm.memcpy.p0i8.p0i8.i64(i8* nocapture, i8* nocapture, i64, i32, i1) nounwind