ComputeShaderSort11.hlsl 2.4 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970
  1. // RUN: %dxc -E main -T cs_6_0 %s | FileCheck %s
  2. // CHECK: threadId
  3. // CHECK: flattenedThreadIdInGroup
  4. // CHECK: bufferLoad
  5. // CHECK: addrspace(3)
  6. // CHECK: barrier
  7. // CHECK: addrspace(3)
  8. // CHECK: barrier
  9. // CHECK: addrspace(3)
  10. // CHECK: barrier
  11. // CHECK: addrspace(3)
  12. // CHECK: bufferStore
  13. //--------------------------------------------------------------------------------------
  14. // File: ComputeShaderSort11.hlsl
  15. //
  16. // This file contains the compute shaders to perform GPU sorting using DirectX 11.
  17. //
  18. // Copyright (c) Microsoft Corporation. All rights reserved.
  19. //--------------------------------------------------------------------------------------
  20. #define BITONIC_BLOCK_SIZE 512
  21. #define TRANSPOSE_BLOCK_SIZE 16
  22. //--------------------------------------------------------------------------------------
  23. // Constant Buffers
  24. //--------------------------------------------------------------------------------------
  25. cbuffer CB : register( b0 )
  26. {
  27. unsigned int g_iLevel;
  28. unsigned int g_iLevelMask;
  29. unsigned int g_iWidth;
  30. unsigned int g_iHeight;
  31. };
  32. //--------------------------------------------------------------------------------------
  33. // Structured Buffers
  34. //--------------------------------------------------------------------------------------
  35. StructuredBuffer<unsigned int> Input : register( t0 );
  36. RWStructuredBuffer<unsigned int> Data : register( u0 );
  37. //--------------------------------------------------------------------------------------
  38. // Bitonic Sort Compute Shader
  39. //--------------------------------------------------------------------------------------
  40. groupshared unsigned int shared_data[BITONIC_BLOCK_SIZE];
  41. [numthreads(BITONIC_BLOCK_SIZE, 1, 1)]
  42. void main( uint3 Gid : SV_GroupID,
  43. uint3 DTid : SV_DispatchThreadID,
  44. uint3 GTid : SV_GroupThreadID,
  45. uint GI : SV_GroupIndex )
  46. {
  47. // Load shared data
  48. shared_data[GI] = Data[DTid.x];
  49. GroupMemoryBarrierWithGroupSync();
  50. // Sort the shared data
  51. for (unsigned int j = g_iLevel >> 1 ; j > 0 ; j >>= 1)
  52. {
  53. unsigned int result = ((shared_data[GI & ~j] <= shared_data[GI | j]) == (bool)(g_iLevelMask & DTid.x))? shared_data[GI ^ j] : shared_data[GI];
  54. GroupMemoryBarrierWithGroupSync();
  55. shared_data[GI] = result;
  56. GroupMemoryBarrierWithGroupSync();
  57. }
  58. // Store shared data
  59. Data[DTid.x] = shared_data[GI];
  60. }