profitability.ll 8.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205
  1. ; RUN: opt < %s -basicaa -loop-interchange -S | FileCheck %s
  2. ;; These test cases exercise the profitability model.
  3. target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128"
  4. target triple = "x86_64-unknown-linux-gnu"
  5. @A = common global [100 x [100 x i32]] zeroinitializer
  6. @B = common global [100 x [100 x i32]] zeroinitializer
  7. ;;---------------------------------------Test case 01---------------------------------
  8. ;; Loop interchange will result in code vectorization and is hence profitable. Check for interchange.
  9. ;; for(int i=1;i<N;i++)
  10. ;; for(int j=1;j<N;j++)
  11. ;; A[j][i] = A[j - 1][i] + B[j][i];
  ;; Test input for case 01: a two-deep loop nest over the globals @A and @B that
  ;; computes A[j][i] = A[j-1][i] + B[j][i], with i as the outer loop and j as the
  ;; inner loop. Takes the i32 bound %N and returns nothing.
  ;; NOTE: the FileCheck patterns that follow this function match its block labels
  ;; and value names textually, so names and instruction order must stay as they are.
  12. define void @interchange_01(i32 %N) {
  13. entry:
  ;; Guard: the nest runs only when %N > 1 (signed compare); otherwise go straight to the return.
  14. %cmp27 = icmp sgt i32 %N, 1
  15. br i1 %cmp27, label %for.cond1.preheader.lr.ph, label %for.end16
  16. for.cond1.preheader.lr.ph:
  ;; %0 = %N - 1, the value both loop exit compares test against.
  17. %0 = add i32 %N, -1
  18. br label %for.body3.preheader
  19. for.body3.preheader:
  ;; Outer loop header: %indvars.iv30 is the outer induction variable (i), starting at 1
  ;; and advanced in %for.inc14.
  20. %indvars.iv30 = phi i64 [ 1, %for.cond1.preheader.lr.ph ], [ %indvars.iv.next31, %for.inc14 ]
  21. br label %for.body3
  22. for.body3:
  ;; Inner loop body: %indvars.iv is the inner induction variable (j), starting at 1.
  ;; It is used as the first array subscript in every access below, so consecutive
  ;; inner iterations are one 100-element row apart.
  23. %indvars.iv = phi i64 [ %indvars.iv.next, %for.body3 ], [ 1, %for.body3.preheader ]
  ;; %1 = j - 1, the row index of the A[j-1][i] load.
  24. %1 = add nsw i64 %indvars.iv, -1
  25. %arrayidx5 = getelementptr inbounds [100 x [100 x i32]], [100 x [100 x i32]]* @A, i64 0, i64 %1, i64 %indvars.iv30
  26. %2 = load i32, i32* %arrayidx5
  27. %arrayidx9 = getelementptr inbounds [100 x [100 x i32]], [100 x [100 x i32]]* @B, i64 0, i64 %indvars.iv, i64 %indvars.iv30
  28. %3 = load i32, i32* %arrayidx9
  29. %add = add nsw i32 %3, %2
  ;; Store the sum to A[j][i].
  30. %arrayidx13 = getelementptr inbounds [100 x [100 x i32]], [100 x [100 x i32]]* @A, i64 0, i64 %indvars.iv, i64 %indvars.iv30
  31. store i32 %add, i32* %arrayidx13
  32. %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
  ;; Inner exit test: compare the pre-increment j, truncated to i32, with %N - 1;
  ;; the loop is left after the iteration where they are equal.
  33. %lftr.wideiv = trunc i64 %indvars.iv to i32
  34. %exitcond = icmp eq i32 %lftr.wideiv, %0
  35. br i1 %exitcond, label %for.inc14, label %for.body3
  36. for.inc14:
  ;; Outer latch: advance i and apply the same form of exit test against %N - 1.
  37. %indvars.iv.next31 = add nuw nsw i64 %indvars.iv30, 1
  38. %lftr.wideiv32 = trunc i64 %indvars.iv30 to i32
  39. %exitcond33 = icmp eq i32 %lftr.wideiv32, %0
  40. br i1 %exitcond33, label %for.end16, label %for.body3.preheader
  41. for.end16:
  42. ret void
  43. }
  44. ;; Here we check only part of the output .ll to verify that the loops are interchanged.
  45. ; CHECK-LABEL: @interchange_01
  46. ; CHECK: for.body3.preheader: ; preds = %for.inc14, %for.cond1.preheader.lr.ph
  47. ; CHECK: %indvars.iv30 = phi i64 [ 1, %for.cond1.preheader.lr.ph ], [ %indvars.iv.next31, %for.inc14 ]
  48. ; CHECK: br label %for.body3.split2
  49. ; CHECK: for.body3.preheader1: ; preds = %entry
  50. ; CHECK: br label %for.body3
  51. ; CHECK: for.body3: ; preds = %for.body3.preheader1, %for.body3.split
  52. ; CHECK: %indvars.iv = phi i64 [ %indvars.iv.next, %for.body3.split ], [ 1, %for.body3.preheader1 ]
  53. ; CHECK: br label %for.cond1.preheader.lr.ph
  54. ; CHECK: for.body3.split2: ; preds = %for.body3.preheader
  55. ; CHECK: %1 = add nsw i64 %indvars.iv, -1
  56. ; CHECK: %arrayidx5 = getelementptr inbounds [100 x [100 x i32]], [100 x [100 x i32]]* @A, i64 0, i64 %1, i64 %indvars.iv30
  57. ; CHECK: %2 = load i32, i32* %arrayidx5
  58. ; CHECK: %arrayidx9 = getelementptr inbounds [100 x [100 x i32]], [100 x [100 x i32]]* @B, i64 0, i64 %indvars.iv, i64 %indvars.iv30
  59. ; CHECK: %3 = load i32, i32* %arrayidx9
  60. ; CHECK: %add = add nsw i32 %3, %2
  61. ; CHECK: %arrayidx13 = getelementptr inbounds [100 x [100 x i32]], [100 x [100 x i32]]* @A, i64 0, i64 %indvars.iv, i64 %indvars.iv30
  62. ; CHECK: store i32 %add, i32* %arrayidx13
  63. ; CHECK: br label %for.inc14
  64. ;; ---------------------------------------Test case 02---------------------------------
  65. ;; Check the loop interchange profitability model.
  66. ;; This tests the profitability model when the operands of getelementptr are not exactly the induction variables but some
  67. ;; arithmetic operation on them.
  68. ;; for(int i=1;i<N;i++)
  69. ;; for(int j=1;j<N;j++)
  70. ;; A[j-1][i-1] = A[j - 1][i-1] + B[j-1][i-1];
  ;; Test input for case 02: a two-deep loop nest over the globals @A and @B that
  ;; computes A[j-1][i-1] = A[j-1][i-1] + B[j-1][i-1], with i as the outer loop and
  ;; j as the inner loop. Every subscript is an induction variable minus one rather
  ;; than the induction variable itself. Takes the i32 bound %N and returns nothing.
  ;; NOTE: the FileCheck patterns that follow this function match its block labels
  ;; and value names textually, so names and instruction order must stay as they are.
  71. define void @interchange_02(i32 %N) {
  72. entry:
  ;; Guard: the nest runs only when %N > 1 (signed compare); otherwise go straight to the return.
  73. %cmp32 = icmp sgt i32 %N, 1
  74. br i1 %cmp32, label %for.cond1.preheader.lr.ph, label %for.end21
  75. for.cond1.preheader.lr.ph:
  ;; %0 = %N - 1, the value both loop exit compares test against.
  76. %0 = add i32 %N, -1
  77. br label %for.body3.lr.ph
  78. for.body3.lr.ph:
  ;; Outer loop header: %indvars.iv35 is the outer induction variable (i), starting at 1.
  79. %indvars.iv35 = phi i64 [ 1, %for.cond1.preheader.lr.ph ], [ %indvars.iv.next36, %for.inc19 ]
  ;; %1 = i - 1, computed here in the outer block, outside the inner loop body.
  80. %1 = add nsw i64 %indvars.iv35, -1
  81. br label %for.body3
  82. for.body3:
  ;; Inner loop body: %indvars.iv is the inner induction variable (j), starting at 1.
  83. %indvars.iv = phi i64 [ 1, %for.body3.lr.ph ], [ %indvars.iv.next, %for.body3 ]
  ;; %2 = j - 1. It is the first array subscript of both accesses below, so
  ;; consecutive inner iterations are one 100-element row apart.
  84. %2 = add nsw i64 %indvars.iv, -1
  85. %arrayidx6 = getelementptr inbounds [100 x [100 x i32]], [100 x [100 x i32]]* @A, i64 0, i64 %2, i64 %1
  86. %3 = load i32, i32* %arrayidx6
  87. %arrayidx12 = getelementptr inbounds [100 x [100 x i32]], [100 x [100 x i32]]* @B, i64 0, i64 %2, i64 %1
  88. %4 = load i32, i32* %arrayidx12
  89. %add = add nsw i32 %4, %3
  ;; The store reuses %arrayidx6, i.e. it writes the same A element that was loaded above.
  90. store i32 %add, i32* %arrayidx6
  91. %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
  ;; Inner exit test: compare the pre-increment j, truncated to i32, with %N - 1;
  ;; the loop is left after the iteration where they are equal.
  92. %lftr.wideiv = trunc i64 %indvars.iv to i32
  93. %exitcond = icmp eq i32 %lftr.wideiv, %0
  94. br i1 %exitcond, label %for.inc19, label %for.body3
  95. for.inc19:
  ;; Outer latch: advance i and apply the same form of exit test against %N - 1.
  96. %indvars.iv.next36 = add nuw nsw i64 %indvars.iv35, 1
  97. %lftr.wideiv38 = trunc i64 %indvars.iv35 to i32
  98. %exitcond39 = icmp eq i32 %lftr.wideiv38, %0
  99. br i1 %exitcond39, label %for.end21, label %for.body3.lr.ph
  100. for.end21:
  101. ret void
  102. }
  103. ; CHECK-LABEL: @interchange_02
  104. ; CHECK: for.body3.lr.ph: ; preds = %for.inc19, %for.cond1.preheader.lr.ph
  105. ; CHECK: %indvars.iv35 = phi i64 [ 1, %for.cond1.preheader.lr.ph ], [ %indvars.iv.next36, %for.inc19 ]
  106. ; CHECK: %0 = add nsw i64 %indvars.iv35, -1
  107. ; CHECK: br label %for.body3.split1
  108. ; CHECK: for.body3.preheader: ; preds = %entry
  109. ; CHECK: %1 = add i32 %N, -1
  110. ; CHECK: br label %for.body3
  111. ; CHECK: for.body3: ; preds = %for.body3.preheader, %for.body3.split
  112. ; CHECK: %indvars.iv = phi i64 [ %indvars.iv.next, %for.body3.split ], [ 1, %for.body3.preheader ]
  113. ; CHECK: br label %for.cond1.preheader.lr.ph
  114. ; CHECK: for.body3.split1: ; preds = %for.body3.lr.ph
  115. ; CHECK: %2 = add nsw i64 %indvars.iv, -1
  116. ; CHECK: %arrayidx6 = getelementptr inbounds [100 x [100 x i32]], [100 x [100 x i32]]* @A, i64 0, i64 %2, i64 %0
  117. ; CHECK: %3 = load i32, i32* %arrayidx6
  118. ; CHECK: %arrayidx12 = getelementptr inbounds [100 x [100 x i32]], [100 x [100 x i32]]* @B, i64 0, i64 %2, i64 %0
  119. ; CHECK: %4 = load i32, i32* %arrayidx12
  120. ; CHECK: %add = add nsw i32 %4, %3
  121. ; CHECK: store i32 %add, i32* %arrayidx6
  122. ; CHECK: br label %for.inc19
  123. ;;---------------------------------------Test case 03---------------------------------
  124. ;; Loop interchange is not profitable here. Check that the loops are not interchanged.
  125. ;; for(int i=1;i<N;i++)
  126. ;; for(int j=1;j<N;j++)
  127. ;; A[i-1][j-1] = A[i - 1][j-1] + B[i][j];
  ;; Test input for case 03: a two-deep loop nest over the globals @A and @B that
  ;; computes A[i-1][j-1] = A[i-1][j-1] + B[i][j], with i as the outer loop and j as
  ;; the inner loop. Takes the i32 bound %N and returns nothing.
  ;; NOTE: the FileCheck patterns that follow this function match its block labels
  ;; and value names textually, so names and instruction order must stay as they are.
  128. define void @interchange_03(i32 %N){
  129. entry:
  ;; Guard: the nest runs only when %N > 1 (signed compare); otherwise go straight to the return.
  130. %cmp31 = icmp sgt i32 %N, 1
  131. br i1 %cmp31, label %for.cond1.preheader.lr.ph, label %for.end19
  132. for.cond1.preheader.lr.ph:
  ;; %0 = %N - 1, the value both loop exit compares test against.
  133. %0 = add i32 %N, -1
  134. br label %for.body3.lr.ph
  135. for.body3.lr.ph:
  ;; Outer loop header: %indvars.iv34 is the outer induction variable (i), starting at 1.
  136. %indvars.iv34 = phi i64 [ 1, %for.cond1.preheader.lr.ph ], [ %indvars.iv.next35, %for.inc17 ]
  ;; %1 = i - 1, computed here in the outer block, outside the inner loop body.
  137. %1 = add nsw i64 %indvars.iv34, -1
  138. br label %for.body3
  139. for.body3:
  ;; Inner loop body: %indvars.iv is the inner induction variable (j), starting at 1.
  140. %indvars.iv = phi i64 [ 1, %for.body3.lr.ph ], [ %indvars.iv.next, %for.body3 ]
  ;; %2 = j - 1. In both accesses below the inner variable supplies the last array
  ;; subscript, so consecutive inner iterations touch adjacent i32 elements of a row.
  141. %2 = add nsw i64 %indvars.iv, -1
  142. %arrayidx6 = getelementptr inbounds [100 x [100 x i32]], [100 x [100 x i32]]* @A, i64 0, i64 %1, i64 %2
  143. %3 = load i32, i32* %arrayidx6
  144. %arrayidx10 = getelementptr inbounds [100 x [100 x i32]], [100 x [100 x i32]]* @B, i64 0, i64 %indvars.iv34, i64 %indvars.iv
  145. %4 = load i32, i32* %arrayidx10
  146. %add = add nsw i32 %4, %3
  ;; The store reuses %arrayidx6, i.e. it writes the same A element that was loaded above.
  147. store i32 %add, i32* %arrayidx6
  148. %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
  ;; Inner exit test: compare the pre-increment j, truncated to i32, with %N - 1;
  ;; the loop is left after the iteration where they are equal.
  149. %lftr.wideiv = trunc i64 %indvars.iv to i32
  150. %exitcond = icmp eq i32 %lftr.wideiv, %0
  151. br i1 %exitcond, label %for.inc17, label %for.body3
  152. for.inc17:
  ;; Outer latch: advance i and apply the same form of exit test against %N - 1.
  153. %indvars.iv.next35 = add nuw nsw i64 %indvars.iv34, 1
  154. %lftr.wideiv37 = trunc i64 %indvars.iv34 to i32
  155. %exitcond38 = icmp eq i32 %lftr.wideiv37, %0
  156. br i1 %exitcond38, label %for.end19, label %for.body3.lr.ph
  157. for.end19:
  158. ret void
  159. }
  160. ; CHECK-LABEL: @interchange_03
  161. ; CHECK: for.body3.lr.ph:
  162. ; CHECK: %indvars.iv34 = phi i64 [ 1, %for.cond1.preheader.lr.ph ], [ %indvars.iv.next35, %for.inc17 ]
  163. ; CHECK: %1 = add nsw i64 %indvars.iv34, -1
  164. ; CHECK: br label %for.body3.preheader
  165. ; CHECK: for.body3.preheader:
  166. ; CHECK: br label %for.body3
  167. ; CHECK: for.body3:
  168. ; CHECK: %indvars.iv = phi i64 [ %indvars.iv.next, %for.body3 ], [ 1, %for.body3.preheader ]
  169. ; CHECK: %2 = add nsw i64 %indvars.iv, -1
  170. ; CHECK: %arrayidx6 = getelementptr inbounds [100 x [100 x i32]], [100 x [100 x i32]]* @A, i64 0, i64 %1, i64 %2
  171. ; CHECK: %3 = load i32, i32* %arrayidx6
  172. ; CHECK: %arrayidx10 = getelementptr inbounds [100 x [100 x i32]], [100 x [100 x i32]]* @B, i64 0, i64 %indvars.iv34, i64 %indvars.iv
  173. ; CHECK: %4 = load i32, i32* %arrayidx10