cycle.ll 5.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112
  ; Module data layout: leading "e" selects little-endian, "p:64:64:64" gives
  ; 64-bit pointers with 64-bit ABI and preferred alignment; the remaining
  ; fields set per-type alignments.
  1. target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128"
  2. ; RUN: opt < %s -bb-vectorize -bb-vectorize-req-chain-depth=3 -bb-vectorize-ignore-target-info -instcombine -gvn -S | FileCheck %s
  3. ; This test checks the non-trivial pairing-induced cycle avoidance. Without this cycle avoidance, the algorithm would
  4. ; want to select the following pairs:
  5. ; %div77 = fdiv double %sub74, %mul76.v.r1 <-> %div125 = fdiv double %mul121, %mul76.v.r2 (div125 depends on mul117)
  6. ; %add84 = fadd double %sub83, 2.000000e+00 <-> %add127 = fadd double %mul126, 1.000000e+00 (add127 depends on div77)
  7. ; %mul95 = fmul double %sub45.v.r1, %sub36.v.r1 <-> %mul88 = fmul double %sub36.v.r1, %sub87 (mul88 depends on add84)
  8. ; %mul117 = fmul double %sub39.v.r1, %sub116 <-> %mul97 = fmul double %mul96, %sub39.v.r1 (mul97 depends on mul95)
  9. ; and so a dependency cycle would be created.
  ; External declaration of @fabs (double -> double), marked nounwind readnone.
  ; It is called once, at the end of the %go block in @test1, on the value that
  ; feeds the loop-exit comparison.
  10. declare double @fabs(double) nounwind readnone
  11. define void @test1(double %a, double %b, double %c, double %add80, double %mul1, double %mul2.v.r1, double %mul73, double %sub, double %sub65, double %F.0, i32 %n.0, double %Bnm3.0, double %Bnm2.0, double %Bnm1.0, double %Anm3.0, double %Anm2.0, double %Anm1.0) {
  ; @test1 is the input for the cycle-avoidance check described in the file
  ; header. It returns void and stores nothing; the only call is to @fabs.
  ; The function consists of a single self-looping block (%go) holding one long
  ; chain of scalar double arithmetic. There are no phi nodes, so every value in
  ; %go is computed from the function arguments and constants only.
  ; NOTE(review): the instruction order and value names below are presumably
  ; significant to which pairs the vectorizer considers - do not reorder or
  ; rename without re-validating the test.
  12. entry:
  13. br label %go
  14. go:
  ; %conv is %n.0 as a double. %sub36/%sub39/%sub42 are conv+a-1, conv+b-1 and
  ; conv+c-1; %sub45/%sub48/%sub51 are the same sums minus 2 instead of 1.
  15. %conv = sitofp i32 %n.0 to double
  16. %add35 = fadd double %conv, %a
  17. %sub36 = fadd double %add35, -1.000000e+00
  18. %add38 = fadd double %conv, %b
  19. %sub39 = fadd double %add38, -1.000000e+00
  20. %add41 = fadd double %conv, %c
  21. %sub42 = fadd double %add41, -1.000000e+00
  22. %sub45 = fadd double %add35, -2.000000e+00
  23. %sub48 = fadd double %add38, -2.000000e+00
  24. %sub51 = fadd double %add41, -2.000000e+00
  ; Integer side: %mul52 = n << 1, then 2n-1, 2n-3 and 2n-5 are each converted
  ; to double (%conv54, %conv57, %conv60); %conv62 is n*n as a double.
  25. %mul52 = shl nsw i32 %n.0, 1
  26. %sub53 = add nsw i32 %mul52, -1
  27. %conv54 = sitofp i32 %sub53 to double
  28. %sub56 = add nsw i32 %mul52, -3
  29. %conv57 = sitofp i32 %sub56 to double
  30. %sub59 = add nsw i32 %mul52, -5
  31. %conv60 = sitofp i32 %sub59 to double
  32. %mul61 = mul nsw i32 %n.0, %n.0
  33. %conv62 = sitofp i32 %mul61 to double
  34. %mul63 = fmul double %conv62, 3.000000e+00
  ; First quotient. %div77 is one half of the first pair named in the file
  ; header (its partner there is %div125).
  35. %mul67 = fmul double %sub65, %conv
  36. %add68 = fadd double %mul63, %mul67
  37. %add69 = fadd double %add68, 2.000000e+00
  38. %sub71 = fsub double %add69, %mul2.v.r1
  39. %sub74 = fsub double %sub71, %mul73
  40. %mul75 = fmul double %conv57, 2.000000e+00
  41. %mul76 = fmul double %mul75, %sub42
  42. %div77 = fdiv double %sub74, %mul76
  ; Second quotient (%div94). %add84 and %mul88 are named in the header's second
  ; and third pairs; %mul88 uses %sub87, which is computed from %add84.
  ; "fsub -0.0, x" is a floating-point negation of x.
  43. %mul82 = fmul double %add80, %conv
  44. %sub83 = fsub double %mul63, %mul82
  45. %add84 = fadd double %sub83, 2.000000e+00
  46. %sub86 = fsub double %add84, %mul2.v.r1
  47. %sub87 = fsub double -0.000000e+00, %sub86
  48. %mul88 = fmul double %sub36, %sub87
  49. %mul89 = fmul double %mul88, %sub39
  50. %mul90 = fmul double %conv54, 4.000000e+00
  51. %mul91 = fmul double %mul90, %conv57
  52. %mul92 = fmul double %mul91, %sub51
  53. %mul93 = fmul double %mul92, %sub42
  54. %div94 = fdiv double %mul89, %mul93
  ; Third quotient (%div115). %mul95 and %mul97 are named in the header's third
  ; and fourth pairs; %mul97 is computed from %mul95 via %mul96.
  55. %mul95 = fmul double %sub45, %sub36
  56. %mul96 = fmul double %mul95, %sub48
  57. %mul97 = fmul double %mul96, %sub39
  58. %sub99 = fsub double %conv, %a
  59. %sub100 = fadd double %sub99, -2.000000e+00
  60. %mul101 = fmul double %mul97, %sub100
  61. %sub103 = fsub double %conv, %b
  62. %sub104 = fadd double %sub103, -2.000000e+00
  63. %mul105 = fmul double %mul101, %sub104
  64. %mul106 = fmul double %conv57, 8.000000e+00
  65. %mul107 = fmul double %mul106, %conv57
  66. %mul108 = fmul double %mul107, %conv60
  67. %sub111 = fadd double %add41, -3.000000e+00
  68. %mul112 = fmul double %mul108, %sub111
  69. %mul113 = fmul double %mul112, %sub51
  70. %mul114 = fmul double %mul113, %sub42
  71. %div115 = fdiv double %mul105, %mul114
  ; Fourth quotient (%div125). %mul117 is named in the header's fourth pair and
  ; feeds %div125 through %mul121, which closes the chain listed in the header:
  ; div125 <- mul117, mul97 <- mul95, mul88 <- add84, add127 <- div77.
  72. %sub116 = fsub double -0.000000e+00, %sub36
  73. %mul117 = fmul double %sub39, %sub116
  74. %sub119 = fsub double %conv, %c
  75. %sub120 = fadd double %sub119, -1.000000e+00
  76. %mul121 = fmul double %mul117, %sub120
  77. %mul123 = fmul double %mul75, %sub51
  78. %mul124 = fmul double %mul123, %sub42
  79. %div125 = fdiv double %mul121, %mul124
  ; Combine the quotients. %add127 (header's second pair) is computed from
  ; %div77. %add136 sums three terms weighted by %Anm1.0/%Anm2.0/%Anm3.0 and
  ; %add147 sums the same three factors weighted by %Bnm1.0/%Bnm2.0/%Bnm3.0.
  80. %mul126 = fmul double %div77, %sub
  81. %add127 = fadd double %mul126, 1.000000e+00
  82. %mul128 = fmul double %add127, %Anm1.0
  83. %mul129 = fmul double %div94, %sub
  84. %add130 = fadd double %div125, %mul129
  85. %mul131 = fmul double %add130, %sub
  86. %mul132 = fmul double %mul131, %Anm2.0
  87. %add133 = fadd double %mul128, %mul132
  88. %mul134 = fmul double %div115, %mul1
  89. %mul135 = fmul double %mul134, %Anm3.0
  90. %add136 = fadd double %add133, %mul135
  91. %mul139 = fmul double %add127, %Bnm1.0
  92. %mul143 = fmul double %mul131, %Bnm2.0
  93. %add144 = fadd double %mul139, %mul143
  94. %mul146 = fmul double %mul134, %Bnm3.0
  95. %add147 = fadd double %add144, %mul146
  ; Loop exit test: leave when |(F.0 - add136/add147) / F.0| is below
  ; 0x3CB0000000000000 (the double 2^-52), or when %n.0 > 20000 (signed);
  ; otherwise branch back to %go.
  96. %div148 = fdiv double %add136, %add147
  97. %sub149 = fsub double %F.0, %div148
  98. %div150 = fdiv double %sub149, %F.0
  99. %call = tail call double @fabs(double %div150) nounwind readnone
  100. %cmp = fcmp olt double %call, 0x3CB0000000000000
  101. %cmp152 = icmp sgt i32 %n.0, 20000
  102. %or.cond = or i1 %cmp, %cmp152
  103. br i1 %or.cond, label %done, label %go
  104. done:
  105. ret void
  ; The FileCheck directives below only require the function label, the go:
  ; label, and an insertelement placing %n.0 into lane 0 of a <2 x i32>.
  ; NOTE(review): the expected name %conv.v.i0.1 presumably derives from %conv,
  ; so renaming %conv would likely break the match - confirm before changing.
  106. ; CHECK-LABEL: @test1(
  107. ; CHECK: go:
  108. ; CHECK: %conv.v.i0.1 = insertelement <2 x i32> undef, i32 %n.0, i32 0
  109. ; FIXME: When tree pruning is deterministic, include the entire output.
  110. }