; vector-casts.ll
; RUN: opt < %s -instcombine -S | FileCheck %s
  2. ; This turns into a&1 != 0
  3. define <2 x i1> @test1(<2 x i64> %a) {
  4. %t = trunc <2 x i64> %a to <2 x i1>
  5. ret <2 x i1> %t
  6. ; CHECK-LABEL: @test1(
  7. ; CHECK: and <2 x i64> %a, <i64 1, i64 1>
  8. ; CHECK: icmp ne <2 x i64> %1, zeroinitializer
  9. }
  10. ; The ashr turns into an lshr.
  11. define <2 x i64> @test2(<2 x i64> %a) {
  12. %b = and <2 x i64> %a, <i64 65535, i64 65535>
  13. %t = ashr <2 x i64> %b, <i64 1, i64 1>
  14. ret <2 x i64> %t
  15. ; CHECK-LABEL: @test2(
  16. ; CHECK: and <2 x i64> %a, <i64 65535, i64 65535>
  17. ; CHECK: lshr <2 x i64> %b, <i64 1, i64 1>
  18. }
  19. define <2 x i64> @test3(<4 x float> %a, <4 x float> %b) nounwind readnone {
  20. entry:
  21. %cmp = fcmp ord <4 x float> %a, zeroinitializer
  22. %sext = sext <4 x i1> %cmp to <4 x i32>
  23. %cmp4 = fcmp ord <4 x float> %b, zeroinitializer
  24. %sext5 = sext <4 x i1> %cmp4 to <4 x i32>
  25. %and = and <4 x i32> %sext, %sext5
  26. %conv = bitcast <4 x i32> %and to <2 x i64>
  27. ret <2 x i64> %conv
  28. ; CHECK-LABEL: @test3(
  29. ; CHECK: fcmp ord <4 x float> %a, %b
  30. }
  31. define <2 x i64> @test4(<4 x float> %a, <4 x float> %b) nounwind readnone {
  32. entry:
  33. %cmp = fcmp uno <4 x float> %a, zeroinitializer
  34. %sext = sext <4 x i1> %cmp to <4 x i32>
  35. %cmp4 = fcmp uno <4 x float> %b, zeroinitializer
  36. %sext5 = sext <4 x i1> %cmp4 to <4 x i32>
  37. %or = or <4 x i32> %sext, %sext5
  38. %conv = bitcast <4 x i32> %or to <2 x i64>
  39. ret <2 x i64> %conv
  40. ; CHECK-LABEL: @test4(
  41. ; CHECK: fcmp uno <4 x float> %a, %b
  42. }
  43. ; rdar://7434900
  44. define <2 x i64> @test5(<4 x float> %a, <4 x float> %b) nounwind readnone {
  45. entry:
  46. %cmp = fcmp ult <4 x float> %a, zeroinitializer
  47. %sext = sext <4 x i1> %cmp to <4 x i32>
  48. %cmp4 = fcmp ult <4 x float> %b, zeroinitializer
  49. %sext5 = sext <4 x i1> %cmp4 to <4 x i32>
  50. %and = and <4 x i32> %sext, %sext5
  51. %conv = bitcast <4 x i32> %and to <2 x i64>
  52. ret <2 x i64> %conv
  53. ; CHECK-LABEL: @test5(
  54. ; CHECK: sext <4 x i1> %cmp to <4 x i32>
  55. ; The sext-and pair is canonicalized to a select.
  56. ; CHECK: select <4 x i1> %cmp4, <4 x i32> %sext, <4 x i32> zeroinitializer
  57. }
  58. define void @convert(<2 x i32>* %dst.addr, <2 x i64> %src) nounwind {
  59. entry:
  60. %val = trunc <2 x i64> %src to <2 x i32>
  61. %add = add <2 x i32> %val, <i32 1, i32 1>
  62. store <2 x i32> %add, <2 x i32>* %dst.addr
  63. ret void
  64. }
  65. define <2 x i65> @foo(<2 x i64> %t) {
  66. %a = trunc <2 x i64> %t to <2 x i32>
  67. %b = zext <2 x i32> %a to <2 x i65>
  68. ret <2 x i65> %b
  69. }
  70. define <2 x i64> @bar(<2 x i65> %t) {
  71. %a = trunc <2 x i65> %t to <2 x i32>
  72. %b = zext <2 x i32> %a to <2 x i64>
  73. ret <2 x i64> %b
  74. }
  75. define <2 x i65> @foos(<2 x i64> %t) {
  76. %a = trunc <2 x i64> %t to <2 x i32>
  77. %b = sext <2 x i32> %a to <2 x i65>
  78. ret <2 x i65> %b
  79. }
  80. define <2 x i64> @bars(<2 x i65> %t) {
  81. %a = trunc <2 x i65> %t to <2 x i32>
  82. %b = sext <2 x i32> %a to <2 x i64>
  83. ret <2 x i64> %b
  84. }
  85. define <2 x i64> @quxs(<2 x i64> %t) {
  86. %a = trunc <2 x i64> %t to <2 x i32>
  87. %b = sext <2 x i32> %a to <2 x i64>
  88. ret <2 x i64> %b
  89. }
  90. define <2 x i64> @quxt(<2 x i64> %t) {
  91. %a = shl <2 x i64> %t, <i64 32, i64 32>
  92. %b = ashr <2 x i64> %a, <i64 32, i64 32>
  93. ret <2 x i64> %b
  94. }
  95. define <2 x double> @fa(<2 x double> %t) {
  96. %a = fptrunc <2 x double> %t to <2 x float>
  97. %b = fpext <2 x float> %a to <2 x double>
  98. ret <2 x double> %b
  99. }
  100. define <2 x double> @fb(<2 x double> %t) {
  101. %a = fptoui <2 x double> %t to <2 x i64>
  102. %b = uitofp <2 x i64> %a to <2 x double>
  103. ret <2 x double> %b
  104. }
  105. define <2 x double> @fc(<2 x double> %t) {
  106. %a = fptosi <2 x double> %t to <2 x i64>
  107. %b = sitofp <2 x i64> %a to <2 x double>
  108. ret <2 x double> %b
  109. }
  110. ; PR9228
  111. ; This was a crasher, so no CHECK statements.
  112. define <4 x float> @f(i32 %a) nounwind alwaysinline {
  113. ; CHECK-LABEL: @f(
  114. entry:
  115. %dim = insertelement <4 x i32> undef, i32 %a, i32 0
  116. %dim30 = insertelement <4 x i32> %dim, i32 %a, i32 1
  117. %dim31 = insertelement <4 x i32> %dim30, i32 %a, i32 2
  118. %dim32 = insertelement <4 x i32> %dim31, i32 %a, i32 3
  119. %offset_ptr = getelementptr <4 x float>, <4 x float>* null, i32 1
  120. %offset_int = ptrtoint <4 x float>* %offset_ptr to i64
  121. %sizeof32 = trunc i64 %offset_int to i32
  122. %smearinsert33 = insertelement <4 x i32> undef, i32 %sizeof32, i32 0
  123. %smearinsert34 = insertelement <4 x i32> %smearinsert33, i32 %sizeof32, i32 1
  124. %smearinsert35 = insertelement <4 x i32> %smearinsert34, i32 %sizeof32, i32 2
  125. %smearinsert36 = insertelement <4 x i32> %smearinsert35, i32 %sizeof32, i32 3
  126. %delta_scale = mul <4 x i32> %dim32, %smearinsert36
  127. %offset_delta = add <4 x i32> zeroinitializer, %delta_scale
  128. %offset_varying_delta = add <4 x i32> %offset_delta, undef
  129. ret <4 x float> undef
  130. }
  131. define <8 x i32> @pr24458(<8 x float> %n) {
  132. ; CHECK-LABEL: @pr24458
  133. %notequal_b_load_.i = fcmp une <8 x float> %n, zeroinitializer
  134. %equal_a_load72_.i = fcmp ueq <8 x float> %n, zeroinitializer
  135. %notequal_b_load__to_boolvec.i = sext <8 x i1> %notequal_b_load_.i to <8 x i32>
  136. %equal_a_load72__to_boolvec.i = sext <8 x i1> %equal_a_load72_.i to <8 x i32>
  137. %wrong = or <8 x i32> %notequal_b_load__to_boolvec.i, %equal_a_load72__to_boolvec.i
  138. ret <8 x i32> %wrong
  139. ; CHECK-NEXT: ret <8 x i32> <i32 -1, i32 -1, i32 -1, i32 -1, i32 -1, i32 -1, i32 -1, i32 -1>
  140. }