; OverwriteStoreEnd.ll

  ; Test driver line: opt is run on this file with -basicaa -dse and its textual
  ; output (-S) is piped into FileCheck, which matches it against the patterns
  ; embedded in the functions below.
  ; RUN: opt < %s -basicaa -dse -S | FileCheck %s

  target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128-n8:16:32:64-S128"

  ; Two <4 x i32> vectors back to back. With the v128:128:128 layout above the
  ; second vector starts at byte offset 16.
  %struct.vec2 = type { <4 x i32>, <4 x i32> }
  ; The same two vectors followed by a single i32 at byte offset 32.
  %struct.vec2plusi = type { <4 x i32>, <4 x i32>, i32 }

  ; Zero-initialised globals used as the memcpy sources in the tests below.
  @glob1 = global %struct.vec2 zeroinitializer, align 16
  @glob2 = global %struct.vec2plusi zeroinitializer, align 16
  ; memset whose tail is rewritten by a later store, with the memset starting
  ; 4 bytes into %p.
  ; The memset fills 28 bytes beginning at i32 index 1 of %p, i.e. bytes [4, 32).
  ; The following i32 store to index 7 rewrites bytes [28, 32), the last four
  ; bytes of that range, so the FileCheck pattern expects the memset length to
  ; drop from 28 to 24.
  define void @write24to28(i32* nocapture %p) nounwind uwtable ssp {
  ; CHECK-LABEL: @write24to28(
  entry:
    %arrayidx0 = getelementptr inbounds i32, i32* %p, i64 1
    %p3 = bitcast i32* %arrayidx0 to i8*
  ; CHECK: call void @llvm.memset.p0i8.i64(i8* %p3, i8 0, i64 24, i32 4, i1 false)
    call void @llvm.memset.p0i8.i64(i8* %p3, i8 0, i64 28, i32 4, i1 false)
    %arrayidx1 = getelementptr inbounds i32, i32* %p, i64 7
    store i32 1, i32* %arrayidx1, align 4
    ret void
  }
  ; memset whose tail is rewritten by a later store, with the memset starting
  ; at %p itself.
  ; The memset fills bytes [0, 32) of %p; the i32 store to index 7 rewrites
  ; bytes [28, 32). The FileCheck pattern expects the memset length to drop
  ; from 32 to 28 (the i32 alignment operand is 4).
  define void @write28to32(i32* nocapture %p) nounwind uwtable ssp {
  ; CHECK-LABEL: @write28to32(
  entry:
    %p3 = bitcast i32* %p to i8*
  ; CHECK: call void @llvm.memset.p0i8.i64(i8* %p3, i8 0, i64 28, i32 4, i1 false)
    call void @llvm.memset.p0i8.i64(i8* %p3, i8 0, i64 32, i32 4, i1 false)
    %arrayidx1 = getelementptr inbounds i32, i32* %p, i64 7
    store i32 1, i32* %arrayidx1, align 4
    ret void
  }
  ; Negative test: same byte ranges as @write28to32 (memset of [0, 32), store to
  ; [28, 32)), but the memset's i32 alignment operand is 16 instead of 4.
  ; The FileCheck pattern expects the memset to stay at length 32.
  ; NOTE(review): presumably the trim is rejected because a 28-byte length is
  ; not a multiple of the 16-byte alignment - confirm against the DSE pass.
  define void @dontwrite28to32memset(i32* nocapture %p) nounwind uwtable ssp {
  ; CHECK-LABEL: @dontwrite28to32memset(
  entry:
    %p3 = bitcast i32* %p to i8*
  ; CHECK: call void @llvm.memset.p0i8.i64(i8* %p3, i8 0, i64 32, i32 16, i1 false)
    call void @llvm.memset.p0i8.i64(i8* %p3, i8 0, i64 32, i32 16, i1 false)
    %arrayidx1 = getelementptr inbounds i32, i32* %p, i64 7
    store i32 1, i32* %arrayidx1, align 4
    ret void
  }
  ; memcpy whose tail is rewritten by a later store.
  ; 36 bytes are copied from @glob2 into %p; the i32 store then rewrites field 2
  ; of %struct.vec2plusi, i.e. bytes [32, 36). The FileCheck pattern expects the
  ; memcpy length to drop from 36 to 32 (the i32 alignment operand is 16).
  define void @write32to36(%struct.vec2plusi* nocapture %p) nounwind uwtable ssp {
  ; CHECK-LABEL: @write32to36(
  entry:
    %0 = bitcast %struct.vec2plusi* %p to i8*
  ; CHECK: tail call void @llvm.memcpy.p0i8.p0i8.i64(i8* %0, i8* bitcast (%struct.vec2plusi* @glob2 to i8*), i64 32, i32 16, i1 false)
    tail call void @llvm.memcpy.p0i8.p0i8.i64(i8* %0, i8* bitcast (%struct.vec2plusi* @glob2 to i8*), i64 36, i32 16, i1 false)
    %c = getelementptr inbounds %struct.vec2plusi, %struct.vec2plusi* %p, i64 0, i32 2
    store i32 1, i32* %c, align 4
    ret void
  }
  ; memcpy whose whole second half is rewritten by a vector store.
  ; 32 bytes are copied from @glob1 into %p; the <4 x i32> store then rewrites
  ; field 1 of %struct.vec2, i.e. bytes [16, 32). The FileCheck pattern expects
  ; the memcpy length to drop from 32 to 16 (the i32 alignment operand is 16).
  define void @write16to32(%struct.vec2* nocapture %p) nounwind uwtable ssp {
  ; CHECK-LABEL: @write16to32(
  entry:
    %0 = bitcast %struct.vec2* %p to i8*
  ; CHECK: tail call void @llvm.memcpy.p0i8.p0i8.i64(i8* %0, i8* bitcast (%struct.vec2* @glob1 to i8*), i64 16, i32 16, i1 false)
    tail call void @llvm.memcpy.p0i8.p0i8.i64(i8* %0, i8* bitcast (%struct.vec2* @glob1 to i8*), i64 32, i32 16, i1 false)
    %c = getelementptr inbounds %struct.vec2, %struct.vec2* %p, i64 0, i32 1
    store <4 x i32> <i32 1, i32 2, i32 3, i32 4>, <4 x i32>* %c, align 4
    ret void
  }
  ; Negative test: 32 bytes are copied from @glob1 into %p with an i32 alignment
  ; operand of 16, then a single i32 is stored at element 7 counted from the
  ; first <4 x i32> field, i.e. bytes [28, 32).
  ; The FileCheck pattern expects the memcpy to stay at length 32.
  ; NOTE(review): presumably the trim is rejected because a 28-byte length is
  ; not a multiple of the 16-byte alignment - confirm against the DSE pass.
  define void @dontwrite28to32memcpy(%struct.vec2* nocapture %p) nounwind uwtable ssp {
  ; CHECK-LABEL: @dontwrite28to32memcpy(
  entry:
    %0 = bitcast %struct.vec2* %p to i8*
  ; CHECK: tail call void @llvm.memcpy.p0i8.p0i8.i64(i8* %0, i8* bitcast (%struct.vec2* @glob1 to i8*), i64 32, i32 16, i1 false)
    tail call void @llvm.memcpy.p0i8.p0i8.i64(i8* %0, i8* bitcast (%struct.vec2* @glob1 to i8*), i64 32, i32 16, i1 false)
    %arrayidx1 = getelementptr inbounds %struct.vec2, %struct.vec2* %p, i64 0, i32 0, i64 7
    store i32 1, i32* %arrayidx1, align 4
    ret void
  }
  ; Intrinsics called by the tests in this file. In every call the i64 operand
  ; is the byte length that the FileCheck patterns expect to shrink or to stay
  ; unchanged. The trailing i32 and i1 operands are the alignment and volatile
  ; flag of this older intrinsic signature - confirm against the LangRef of the
  ; LLVM version under test.
  declare void @llvm.memcpy.p0i8.p0i8.i64(i8* nocapture, i8* nocapture, i64, i32, i1) nounwind
  declare void @llvm.memset.p0i8.i64(i8* nocapture, i8, i64, i32, i1) nounwind

  ; Record of three i64 fields (24 bytes) used by @cpu_lwp_fork.
  %struct.trapframe = type { i64, i64, i64 }
  ; bugzilla 11455 - make sure negative GEPs don't break this optimisation.
  ; %pcb_rsp0 is converted to a trapframe pointer and both the memcpy
  ; destination and the store address are formed with a GEP index of -1 from it.
  ; The memcpy writes the 24 bytes of that trapframe; the i64 store then
  ; rewrites its field 1, i.e. bytes [8, 16) of the copied range, which is
  ; neither its start nor its end. The FileCheck pattern expects the memcpy to
  ; be left unchanged at length 24.
  ; CHECK-LABEL: @cpu_lwp_fork(
  define void @cpu_lwp_fork(%struct.trapframe* %md_regs, i64 %pcb_rsp0) nounwind uwtable noinline ssp {
  entry:
    %0 = inttoptr i64 %pcb_rsp0 to %struct.trapframe*
    %add.ptr = getelementptr inbounds %struct.trapframe, %struct.trapframe* %0, i64 -1
    %1 = bitcast %struct.trapframe* %add.ptr to i8*
    %2 = bitcast %struct.trapframe* %md_regs to i8*
  ; CHECK: call void @llvm.memcpy.p0i8.p0i8.i64(i8* %1, i8* %2, i64 24, i32 1, i1 false)
    call void @llvm.memcpy.p0i8.p0i8.i64(i8* %1, i8* %2, i64 24, i32 1, i1 false)
    %tf_trapno = getelementptr inbounds %struct.trapframe, %struct.trapframe* %0, i64 -1, i32 1
    store i64 3, i64* %tf_trapno, align 8
    ret void
  }