spv.subgroupShuffle.comp 3.6 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869
  // Shader preamble: GLSL 4.50 with the KHR subgroup shuffle extension enabled;
  // main() below calls subgroupShuffle() and subgroupShuffleXor().
  1. #version 450
  2. #extension GL_KHR_shader_subgroup_shuffle: enable
  // Compute work-group size: 8 x 8 x 1 invocations.
  3. layout (local_size_x = 8, local_size_y = 8, local_size_z = 1) in;
  // Storage block holding one 4-component vector per operand type used by
  // main(). It is instanced as an array of four blocks, data[0]..data[3],
  // declared with binding = 0.
  4. layout(binding = 0) buffer Buffers
  5. {
  6. vec4 f4; // float operands / results
  7. ivec4 i4; // signed int operands / results (also receives the bool-case results)
  8. uvec4 u4; // unsigned int operands / results
  9. dvec4 d4; // double operands / results
  10. } data[4];
  // Entry point: calls subgroupShuffle and then subgroupShuffleXor on scalar and
  // 2/3/4-component float, int, uint, double and bool operands, storing each
  // result into the `data` block selected by `invocation`.
  // The 1-, 2-, 3- and 4-component cases read data[0], data[1], data[2] and
  // data[3] respectively, except in the bool groups (see notes below).
  11. void main()
  12. {
  // Reduced modulo 4, so the value is always 0..3 and is a valid index into
  // data[4]. The same value is also passed as the second argument (id / mask)
  // of every shuffle call below.
  13. uint invocation = (gl_SubgroupInvocationID + gl_SubgroupSize) % 4;
  // subgroupShuffle: float, vec2, vec3, vec4.
  14. data[invocation].f4.x = subgroupShuffle(data[0].f4.x, invocation);
  15. data[invocation].f4.xy = subgroupShuffle(data[1].f4.xy, invocation);
  16. data[invocation].f4.xyz = subgroupShuffle(data[2].f4.xyz, invocation);
  17. data[invocation].f4 = subgroupShuffle(data[3].f4, invocation);
  // subgroupShuffle: int, ivec2, ivec3, ivec4.
  18. data[invocation].i4.x = subgroupShuffle(data[0].i4.x, invocation);
  19. data[invocation].i4.xy = subgroupShuffle(data[1].i4.xy, invocation);
  20. data[invocation].i4.xyz = subgroupShuffle(data[2].i4.xyz, invocation);
  21. data[invocation].i4 = subgroupShuffle(data[3].i4, invocation);
  // subgroupShuffle: uint, uvec2, uvec3, uvec4.
  22. data[invocation].u4.x = subgroupShuffle(data[0].u4.x, invocation);
  23. data[invocation].u4.xy = subgroupShuffle(data[1].u4.xy, invocation);
  24. data[invocation].u4.xyz = subgroupShuffle(data[2].u4.xyz, invocation);
  25. data[invocation].u4 = subgroupShuffle(data[3].u4, invocation);
  // subgroupShuffle: double, dvec2, dvec3, dvec4.
  26. data[invocation].d4.x = subgroupShuffle(data[0].d4.x, invocation);
  27. data[invocation].d4.xy = subgroupShuffle(data[1].d4.xy, invocation);
  28. data[invocation].d4.xyz = subgroupShuffle(data[2].d4.xyz, invocation);
  29. data[invocation].d4 = subgroupShuffle(data[3].d4, invocation);
  // subgroupShuffle: bool, bvec2, bvec3, bvec4. The bool operands come from
  // `< 0` / lessThan() comparisons on i4, and the shuffled result is converted
  // back with int()/ivecN() so it can be stored in i4.
  // NOTE(review): the bvec3 and bvec4 cases read data[1], not data[2]/data[3]
  // as the groups above do - presumably intentional; confirm before changing.
  30. data[invocation].i4.x = int(subgroupShuffle(data[0].i4.x < 0, invocation));
  31. data[invocation].i4.xy = ivec2(subgroupShuffle(lessThan(data[1].i4.xy, ivec2(0)), invocation));
  32. data[invocation].i4.xyz = ivec3(subgroupShuffle(lessThan(data[1].i4.xyz, ivec3(0)), invocation));
  33. data[invocation].i4 = ivec4(subgroupShuffle(lessThan(data[1].i4, ivec4(0)), invocation));
  // subgroupShuffleXor: float, vec2, vec3, vec4.
  34. data[invocation].f4.x = subgroupShuffleXor(data[0].f4.x, invocation);
  35. data[invocation].f4.xy = subgroupShuffleXor(data[1].f4.xy, invocation);
  36. data[invocation].f4.xyz = subgroupShuffleXor(data[2].f4.xyz, invocation);
  37. data[invocation].f4 = subgroupShuffleXor(data[3].f4, invocation);
  // subgroupShuffleXor: int, ivec2, ivec3, ivec4.
  38. data[invocation].i4.x = subgroupShuffleXor(data[0].i4.x, invocation);
  39. data[invocation].i4.xy = subgroupShuffleXor(data[1].i4.xy, invocation);
  40. data[invocation].i4.xyz = subgroupShuffleXor(data[2].i4.xyz, invocation);
  41. data[invocation].i4 = subgroupShuffleXor(data[3].i4, invocation);
  // subgroupShuffleXor: uint, uvec2, uvec3, uvec4.
  42. data[invocation].u4.x = subgroupShuffleXor(data[0].u4.x, invocation);
  43. data[invocation].u4.xy = subgroupShuffleXor(data[1].u4.xy, invocation);
  44. data[invocation].u4.xyz = subgroupShuffleXor(data[2].u4.xyz, invocation);
  45. data[invocation].u4 = subgroupShuffleXor(data[3].u4, invocation);
  // subgroupShuffleXor: double, dvec2, dvec3, dvec4.
  46. data[invocation].d4.x = subgroupShuffleXor(data[0].d4.x, invocation);
  47. data[invocation].d4.xy = subgroupShuffleXor(data[1].d4.xy, invocation);
  48. data[invocation].d4.xyz = subgroupShuffleXor(data[2].d4.xyz, invocation);
  49. data[invocation].d4 = subgroupShuffleXor(data[3].d4, invocation);
  // subgroupShuffleXor: bool, bvec2, bvec3, bvec4, using the same
  // compare-then-convert pattern as the subgroupShuffle bool group.
  // NOTE(review): as in that group, the bvec3/bvec4 cases read data[1] -
  // confirm this is intended.
  50. data[invocation].i4.x = int(subgroupShuffleXor(data[0].i4.x < 0, invocation));
  51. data[invocation].i4.xy = ivec2(subgroupShuffleXor(lessThan(data[1].i4.xy, ivec2(0)), invocation));
  52. data[invocation].i4.xyz = ivec3(subgroupShuffleXor(lessThan(data[1].i4.xyz, ivec3(0)), invocation));
  53. data[invocation].i4 = ivec4(subgroupShuffleXor(lessThan(data[1].i4, ivec4(0)), invocation));
  54. }