cs2.ref 6.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167
  1. %dx.types.Handle = type { i8* }
  2. %dx.types.ResRet.i32 = type { i32, i32, i32, i32, i32 }
  3. %dx.types.CBufRet.i32 = type { i32, i32, i32, i32 }
  4. %dx.types.u32 = type { i32 }
  5. %dx.types.i8x16 = type { [16 x i8] }
  6. @TGSM0 = internal addrspace(3) global [6144 x i8] undef, align 4
  7. @llvm.used = appending global [1 x i8*] [i8* addrspacecast (i8 addrspace(3)* getelementptr inbounds ([6144 x i8], [6144 x i8] addrspace(3)* @TGSM0, i32 0, i32 0) to i8*)], section "llvm.metadata"
  8. define void @main() {
  9. entry:
  10. %0 = call %dx.types.Handle @dx.op.createHandle(i32 57, i8 1, i32 0, i32 0, i1 false)
  11. %1 = call %dx.types.Handle @dx.op.createHandle(i32 57, i8 2, i32 0, i32 0, i1 false)
  12. %2 = call i32 @dx.op.threadId.i32(i32 93, i32 0)
  13. %3 = shl i32 %2, 7
  14. %4 = call i32 @dx.op.groupId.i32(i32 94, i32 1)
  15. %5 = shl i32 %4, 10
  16. %6 = add i32 %5, %3
  17. %7 = call i32 @dx.op.threadIdInGroup.i32(i32 95, i32 2)
  18. %8 = add i32 %6, %7
  19. %9 = call i32 @dx.op.flattenedThreadIdInGroup.i32(i32 96)
  20. %10 = add i32 %8, %9
  21. %11 = call %dx.types.ResRet.i32 @dx.op.bufferLoad.i32(i32 68, %dx.types.Handle %0, i32 %10, i32 undef)
  22. %12 = extractvalue %dx.types.ResRet.i32 %11, 0
  23. %13 = call float @dx.op.bitcastI32toF32(i32 126, i32 %12)
  24. %14 = fptrunc float %13 to half
  25. %15 = fadd fast half %14, 0xH4000
  26. %16 = call i32 @dx.op.flattenedThreadIdInGroup.i32(i32 96)
  27. %17 = mul i32 %16, 16
  28. %18 = add i32 %17, 4
  29. %19 = fpext half %15 to float
  30. %20 = getelementptr [6144 x i8], [6144 x i8] addrspace(3)* @TGSM0, i32 0, i32 %18
  31. %21 = bitcast i8 addrspace(3)* %20 to float addrspace(3)*
  32. store float %19, float addrspace(3)* %21, align 4
  33. %22 = call i32 @dx.op.flattenedThreadIdInGroup.i32(i32 96)
  34. %23 = mul i32 %22, 16
  35. %24 = add i32 %23, 8
  36. %25 = getelementptr [6144 x i8], [6144 x i8] addrspace(3)* @TGSM0, i32 0, i32 %24
  37. %26 = bitcast i8 addrspace(3)* %25 to float addrspace(3)*
  38. store float %13, float addrspace(3)* %26, align 4
  39. %27 = fptosi float %13 to i32
  40. %28 = trunc i32 %27 to i16
  41. %29 = call i32 @dx.op.flattenedThreadIdInGroup.i32(i32 96)
  42. %30 = mul i32 %29, 16
  43. %31 = add i32 %30, 12
  44. %32 = sext i16 %28 to i32
  45. %33 = call float @dx.op.bitcastI32toF32(i32 126, i32 %32)
  46. %34 = getelementptr [6144 x i8], [6144 x i8] addrspace(3)* @TGSM0, i32 0, i32 %31
  47. %35 = bitcast i8 addrspace(3)* %34 to float addrspace(3)*
  48. store float %33, float addrspace(3)* %35, align 4
  49. call void @dx.op.barrier(i32 80, i32 11)
  50. %36 = call i32 @dx.op.flattenedThreadIdInGroup.i32(i32 96)
  51. %37 = call %dx.types.CBufRet.i32 @dx.op.cbufferLoadLegacy.i32(i32 59, %dx.types.Handle %1, i32 0)
  52. %38 = extractvalue %dx.types.CBufRet.i32 %37, 0
  53. %39 = add i32 %36, %38
  54. %40 = mul i32 %39, 16
  55. %41 = add i32 %40, 8
  56. %42 = getelementptr [6144 x i8], [6144 x i8] addrspace(3)* @TGSM0, i32 0, i32 %41
  57. %43 = bitcast i8 addrspace(3)* %42 to float addrspace(3)*
  58. %44 = load float, float addrspace(3)* %43, align 4
  59. %45 = fadd fast float %44, %13
  60. %46 = mul i32 %39, 16
  61. %47 = add i32 %46, 12
  62. %48 = getelementptr [6144 x i8], [6144 x i8] addrspace(3)* @TGSM0, i32 0, i32 %47
  63. %49 = bitcast i8 addrspace(3)* %48 to float addrspace(3)*
  64. %50 = load float, float addrspace(3)* %49, align 4
  65. %51 = call i32 @dx.op.bitcastF32toI32(i32 127, float %50)
  66. %52 = trunc i32 %51 to i16
  67. %53 = sext i16 %52 to i32
  68. %54 = sitofp i32 %53 to float
  69. %55 = fadd fast float %54, %45
  70. call void @dx.op.barrier(i32 80, i32 9)
  71. call void @dx.op.barrier(i32 80, i32 2)
  72. %56 = mul i32 %39, 16
  73. %57 = add i32 %56, 4
  74. %58 = getelementptr [6144 x i8], [6144 x i8] addrspace(3)* @TGSM0, i32 0, i32 %57
  75. %59 = bitcast i8 addrspace(3)* %58 to float addrspace(3)*
  76. %60 = load float, float addrspace(3)* %59, align 4
  77. %61 = fptrunc float %60 to half
  78. %62 = fpext half %61 to float
  79. %63 = fadd fast float %55, %62
  80. %64 = call i32 @dx.op.bitcastF32toI32(i32 127, float %63)
  81. call void @dx.op.bufferStore.i32(i32 69, %dx.types.Handle %0, i32 %10, i32 undef, i32 %64, i32 undef, i32 undef, i32 undef, i8 1)
  82. ret void
  83. }
  84. ; Function Attrs: nounwind readonly
  85. declare %dx.types.Handle @dx.op.createHandle(i32, i8, i32, i32, i1) #0
  86. ; Function Attrs: nounwind readnone
  87. declare i32 @dx.op.threadId.i32(i32, i32) #1
  88. ; Function Attrs: nounwind
  89. declare void @dx.op.tempRegStore.i32(i32, i32, i32) #2
  90. ; Function Attrs: nounwind readnone
  91. declare i32 @dx.op.groupId.i32(i32, i32) #1
  92. ; Function Attrs: nounwind readonly
  93. declare i32 @dx.op.tempRegLoad.i32(i32, i32) #0
  94. ; Function Attrs: nounwind readnone
  95. declare i32 @dx.op.threadIdInGroup.i32(i32, i32) #1
  96. ; Function Attrs: nounwind readnone
  97. declare i32 @dx.op.flattenedThreadIdInGroup.i32(i32) #1
  98. ; Function Attrs: nounwind readonly
  99. declare %dx.types.ResRet.i32 @dx.op.bufferLoad.i32(i32, %dx.types.Handle, i32, i32) #0
  100. ; Function Attrs: nounwind readonly
  101. declare float @dx.op.tempRegLoad.f32(i32, i32) #0
  102. ; Function Attrs: nounwind
  103. declare void @dx.op.tempRegStore.f16(i32, i32, half) #2
  104. ; Function Attrs: nounwind readonly
  105. declare half @dx.op.tempRegLoad.f16(i32, i32) #0
  106. ; Function Attrs: nounwind
  107. declare void @dx.op.tempRegStore.i16(i32, i32, i16) #2
  108. ; Function Attrs: nounwind readonly
  109. declare i16 @dx.op.tempRegLoad.i16(i32, i32) #0
  110. ; Function Attrs: nounwind readnone
  111. declare float @dx.op.bitcastI32toF32(i32, i32) #1
  112. ; Function Attrs: noduplicate nounwind
  113. declare void @dx.op.barrier(i32, i32) #3
  114. ; Function Attrs: nounwind readonly
  115. declare %dx.types.CBufRet.i32 @dx.op.cbufferLoadLegacy.i32(i32, %dx.types.Handle, i32) #0
  116. ; Function Attrs: nounwind
  117. declare void @dx.op.tempRegStore.f32(i32, i32, float) #2
  118. ; Function Attrs: nounwind readnone
  119. declare i32 @dx.op.bitcastF32toI32(i32, float) #1
  120. ; Function Attrs: nounwind
  121. declare void @dx.op.bufferStore.i32(i32, %dx.types.Handle, i32, i32, i32, i32, i32, i32, i8) #2
  122. attributes #0 = { nounwind readonly }
  123. attributes #1 = { nounwind readnone }
  124. attributes #2 = { nounwind }
  125. attributes #3 = { noduplicate nounwind }
  126. !dx.version = !{!0}
  127. !dx.valver = !{!0}
  128. !dx.shaderModel = !{!1}
  129. !dx.resources = !{!2}
  130. !dx.entryPoints = !{!7}
  131. !llvm.ident = !{!10}
  132. !0 = !{i32 1, i32 0}
  133. !1 = !{!"cs", i32 6, i32 0}
  134. !2 = !{null, !3, !5, null}
  135. !3 = !{!4}
  136. !4 = !{i32 0, %dx.types.u32 addrspace(1)* undef, !"U0", i32 0, i32 0, i32 1, i32 11, i1 false, i1 false, i1 false, null}
  137. !5 = !{!6}
  138. !6 = !{i32 0, %dx.types.i8x16 addrspace(2)* undef, !"CB0", i32 0, i32 0, i32 1, i32 16, null}
  139. !7 = !{void ()* @main, !"main", null, !2, !8}
  140. !8 = !{i32 0, i64 288, i32 4, !9}
  141. !9 = !{i32 16, i32 8, i32 3}
  142. !10 = !{!"dxbc2dxil 1.2"}