cs4.ref 6.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152
  1. %dx.types.Handle = type { i8* }
  2. %dx.types.ResRet.i32 = type { i32, i32, i32, i32, i32 }
  3. %dx.types.CBufRet.i32 = type { i32, i32, i32, i32 }
  4. %dx.types.u32 = type { i32 }
  5. %dx.types.i8x16 = type { [16 x i8] }
  6. @TGSM0 = internal addrspace(3) global [7680 x i8] undef, align 4
  7. @llvm.used = appending global [1 x i8*] [i8* addrspacecast (i8 addrspace(3)* getelementptr inbounds ([7680 x i8], [7680 x i8] addrspace(3)* @TGSM0, i32 0, i32 0) to i8*)], section "llvm.metadata"
  8. define void @main() {
  9. entry:
  10. %0 = call %dx.types.Handle @dx.op.createHandle(i32 57, i8 1, i32 0, i32 0, i1 false)
  11. %1 = call %dx.types.Handle @dx.op.createHandle(i32 57, i8 2, i32 0, i32 0, i1 false)
  12. %2 = call i32 @dx.op.threadId.i32(i32 93, i32 0)
  13. %3 = shl i32 %2, 7
  14. %4 = call i32 @dx.op.groupId.i32(i32 94, i32 1)
  15. %5 = shl i32 %4, 10
  16. %6 = add i32 %5, %3
  17. %7 = call i32 @dx.op.threadIdInGroup.i32(i32 95, i32 2)
  18. %8 = add i32 %6, %7
  19. %9 = call i32 @dx.op.flattenedThreadIdInGroup.i32(i32 96)
  20. %10 = add i32 %8, %9
  21. %11 = call %dx.types.ResRet.i32 @dx.op.bufferLoad.i32(i32 68, %dx.types.Handle %0, i32 %10, i32 undef)
  22. %12 = extractvalue %dx.types.ResRet.i32 %11, 0
  23. %13 = call float @dx.op.bitcastI32toF32(i32 126, i32 %12)
  24. %14 = fptoui float %13 to i32
  25. %15 = call float @dx.op.bitcastI32toF32(i32 126, i32 %14)
  26. %16 = call i32 @dx.op.flattenedThreadIdInGroup.i32(i32 96)
  27. %17 = mul i32 %16, 20
  28. %18 = add i32 %17, 16
  29. %19 = getelementptr [7680 x i8], [7680 x i8] addrspace(3)* @TGSM0, i32 0, i32 %18
  30. %20 = bitcast i8 addrspace(3)* %19 to float addrspace(3)*
  31. store float %15, float addrspace(3)* %20, align 4
  32. %21 = call i32 @dx.op.flattenedThreadIdInGroup.i32(i32 96)
  33. %22 = mul i32 %21, 20
  34. %23 = add i32 %22, 16
  35. %24 = call i32 @dx.op.threadId.i32(i32 93, i32 0)
  36. %25 = getelementptr [7680 x i8], [7680 x i8] addrspace(3)* @TGSM0, i32 0, i32 %23
  37. %26 = bitcast i8 addrspace(3)* %25 to i32 addrspace(3)*
  38. %27 = atomicrmw add i32 addrspace(3)* %26, i32 %24 monotonic
  39. %28 = mul i32 %21, 20
  40. %29 = add i32 %28, 16
  41. %30 = call i32 @dx.op.threadId.i32(i32 93, i32 0)
  42. %31 = getelementptr [7680 x i8], [7680 x i8] addrspace(3)* @TGSM0, i32 0, i32 %29
  43. %32 = bitcast i8 addrspace(3)* %31 to i32 addrspace(3)*
  44. %33 = atomicrmw or i32 addrspace(3)* %32, i32 %30 monotonic
  45. %34 = uitofp i32 %27 to float
  46. %35 = fadd fast float %34, %13
  47. %36 = mul i32 %21, 20
  48. %37 = add i32 %36, 16
  49. %38 = call i32 @dx.op.groupId.i32(i32 94, i32 1)
  50. %39 = call i32 @dx.op.threadId.i32(i32 93, i32 0)
  51. %40 = getelementptr [7680 x i8], [7680 x i8] addrspace(3)* @TGSM0, i32 0, i32 %37
  52. %41 = bitcast i8 addrspace(3)* %40 to i32 addrspace(3)*
  53. %42 = cmpxchg i32 addrspace(3)* %41, i32 %38, i32 %39 monotonic monotonic
  54. %43 = mul i32 %21, 20
  55. %44 = add i32 %43, 16
  56. %45 = call i32 @dx.op.groupId.i32(i32 94, i32 1)
  57. %46 = call i32 @dx.op.threadId.i32(i32 93, i32 0)
  58. %47 = getelementptr [7680 x i8], [7680 x i8] addrspace(3)* @TGSM0, i32 0, i32 %44
  59. %48 = bitcast i8 addrspace(3)* %47 to i32 addrspace(3)*
  60. %49 = cmpxchg i32 addrspace(3)* %48, i32 %45, i32 %46 monotonic monotonic
  61. %50 = extractvalue { i32, i1 } %49, 0
  62. call void @dx.op.barrier(i32 80, i32 11)
  63. %51 = uitofp i32 %50 to float
  64. %52 = fadd fast float %51, %35
  65. %53 = call i32 @dx.op.flattenedThreadIdInGroup.i32(i32 96)
  66. %54 = call %dx.types.CBufRet.i32 @dx.op.cbufferLoadLegacy.i32(i32 59, %dx.types.Handle %1, i32 0)
  67. %55 = extractvalue %dx.types.CBufRet.i32 %54, 0
  68. %56 = add i32 %53, %55
  69. %57 = mul i32 %56, 20
  70. %58 = add i32 %57, 16
  71. %59 = getelementptr [7680 x i8], [7680 x i8] addrspace(3)* @TGSM0, i32 0, i32 %58
  72. %60 = bitcast i8 addrspace(3)* %59 to float addrspace(3)*
  73. %61 = load float, float addrspace(3)* %60, align 4
  74. %62 = call i32 @dx.op.bitcastF32toI32(i32 127, float %61)
  75. %63 = uitofp i32 %62 to float
  76. %64 = fadd fast float %63, %52
  77. %65 = call i32 @dx.op.bitcastF32toI32(i32 127, float %64)
  78. call void @dx.op.bufferStore.i32(i32 69, %dx.types.Handle %0, i32 %10, i32 undef, i32 %65, i32 undef, i32 undef, i32 undef, i8 1)
  79. ret void
  80. }
  81. ; Function Attrs: nounwind readonly
  82. declare %dx.types.Handle @dx.op.createHandle(i32, i8, i32, i32, i1) #0
  83. ; Function Attrs: nounwind readnone
  84. declare i32 @dx.op.threadId.i32(i32, i32) #1
  85. ; Function Attrs: nounwind
  86. declare void @dx.op.tempRegStore.i32(i32, i32, i32) #2
  87. ; Function Attrs: nounwind readnone
  88. declare i32 @dx.op.groupId.i32(i32, i32) #1
  89. ; Function Attrs: nounwind readonly
  90. declare i32 @dx.op.tempRegLoad.i32(i32, i32) #0
  91. ; Function Attrs: nounwind readnone
  92. declare i32 @dx.op.threadIdInGroup.i32(i32, i32) #1
  93. ; Function Attrs: nounwind readnone
  94. declare i32 @dx.op.flattenedThreadIdInGroup.i32(i32) #1
  95. ; Function Attrs: nounwind readonly
  96. declare %dx.types.ResRet.i32 @dx.op.bufferLoad.i32(i32, %dx.types.Handle, i32, i32) #0
  97. ; Function Attrs: nounwind readonly
  98. declare float @dx.op.tempRegLoad.f32(i32, i32) #0
  99. ; Function Attrs: nounwind
  100. declare void @dx.op.tempRegStore.f32(i32, i32, float) #2
  101. ; Function Attrs: noduplicate nounwind
  102. declare void @dx.op.barrier(i32, i32) #3
  103. ; Function Attrs: nounwind readonly
  104. declare %dx.types.CBufRet.i32 @dx.op.cbufferLoadLegacy.i32(i32, %dx.types.Handle, i32) #0
  105. ; Function Attrs: nounwind
  106. declare void @dx.op.bufferStore.i32(i32, %dx.types.Handle, i32, i32, i32, i32, i32, i32, i8) #2
  107. ; Function Attrs: nounwind readnone
  108. declare float @dx.op.bitcastI32toF32(i32, i32) #1
  109. ; Function Attrs: nounwind readnone
  110. declare i32 @dx.op.bitcastF32toI32(i32, float) #1
  111. attributes #0 = { nounwind readonly }
  112. attributes #1 = { nounwind readnone }
  113. attributes #2 = { nounwind }
  114. attributes #3 = { noduplicate nounwind }
  115. !dx.version = !{!0}
  116. !dx.valver = !{!0}
  117. !dx.shaderModel = !{!1}
  118. !dx.resources = !{!2}
  119. !dx.entryPoints = !{!7}
  120. !llvm.ident = !{!10}
  121. !0 = !{i32 1, i32 0}
  122. !1 = !{!"cs", i32 6, i32 0}
  123. !2 = !{null, !3, !5, null}
  124. !3 = !{!4}
  125. !4 = !{i32 0, %dx.types.u32 addrspace(1)* undef, !"U0", i32 0, i32 0, i32 1, i32 11, i1 false, i1 false, i1 false, null}
  126. !5 = !{!6}
  127. !6 = !{i32 0, %dx.types.i8x16 addrspace(2)* undef, !"CB0", i32 0, i32 0, i32 1, i32 16, null}
  128. !7 = !{void ()* @main, !"main", null, !2, !8}
  129. !8 = !{i32 0, i64 256, i32 4, !9}
  130. !9 = !{i32 16, i32 8, i32 3}
  131. !10 = !{!"dxbc2dxil 1.2"}