spv.coopmat_Error.comp 1.9 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677
  1. #version 450 core
  2. #extension GL_KHR_memory_scope_semantics : enable
  3. #extension GL_NV_cooperative_matrix : enable
  4. #extension GL_EXT_shader_explicit_arithmetic_types_float16 : enable
  5. layout (local_size_x = 64, local_size_y = 1, local_size_z = 1) in; // workgroup size: 64 x 1 x 1 invocations
  6. float<16> ftemplate16; // angle-bracket type parameter applied to plain float. NOTE(review): the file name suggests the declarations below are meant to be rejected by the compiler - confirm against the expected output
  7. fcoopmatNV fnoparams; // fcoopmatNV written with no type parameters at all
  8. fcoopmatNV<8, gl_ScopeSubgroup, 8, 8> fbadbits; // first parameter is 8; every other fcoopmatNV in this file uses 16 or 32 there (presumably the component bit width, going by the name - confirm)
  9. fcoopmatNV<16, gl_ScopeSubgroup, 8> fbadnumparams; // three type parameters; every other parameterized fcoopmatNV in this file has four
  10. int X = 8; // ordinary non-const global, used as a type parameter on the next line
  11. fcoopmatNV<16, gl_ScopeSubgroup, 8, X> fbadparam; // last type parameter is the non-const global X
  12. layout(constant_id = 0) int Y = 1; // declared with constant_id = 0; used as a type parameter inside main()
  13. shared fcoopmatNV<16, gl_ScopeSubgroup, 16, 16> sharedmat; // cooperative matrix declared with the shared qualifier. NOTE(review): presumably a disallowed storage class for this type - confirm
  14. layout(set = 0, binding = 0) buffer InvBlock { // buffer block at set 0, binding 0, whose only member is a cooperative matrix. NOTE(review): presumably disallowed as a block member - confirm
  15. fcoopmatNV<16, gl_ScopeSubgroup, 16, 16> bufmat;
  16. } invblock;
  17. void main() // Entry point: a list of cooperative-matrix statements, grouped by the comments below. NOTE(review): judging by the file name, each group is meant to be diagnosed as an error - confirm against the expected output
  18. {
  19. fcoopmatNV<32, gl_ScopeSubgroup, 16, 8> f32_16_8; // first parameter 32, remaining dimensions 16 and 8
  20. fcoopmatNV<16, gl_ScopeSubgroup, 16, 8> f16_16_8; // same dimensions as above, first parameter 16
  21. // invalid implicit conversions: a <16, ...> value is assigned to the <32, ...> variable
  22. f32_16_8 = f16_16_8;
  23. f32_16_8 = f16_16_8 + f16_16_8;
  24. fcoopmatNV<16, gl_ScopeSubgroup, 8, 8> f16_8_8; // 8 x 8, first parameter 16
  25. // mismatching dimensions: <..., 8, 8> assigned to <..., 16, 8>
  26. f16_16_8 = f16_8_8;
  27. fcoopmatNV<16, gl_ScopeSubgroup, 8, Y> f16_8_Y; // last dimension taken from the constant_id = 0 global Y
  28. fcoopmatNV<16, gl_ScopeSubgroup, 8, (Y+1)> f16_8_Y1; // last dimension is the expression Y+1
  29. // mismatching dimensions with specialization constants: last dimension Y on the left, (Y+1) on the right
  30. f16_8_Y = f16_8_Y1;
  31. // wrong arguments for constructor: two arguments are passed
  32. f16_8_8 = fcoopmatNV<16, gl_ScopeSubgroup, 8, 8>(1, 1);
  33. // can't construct from a builtin type: the constructor argument is a mat4
  34. mat4 m4;
  35. fcoopmatNV<32, gl_ScopeSubgroup, 4, 4> f32_4_4 = fcoopmatNV<32, gl_ScopeSubgroup, 4, 4>(m4);
  36. // only support a single array subscript: two subscripts are chained here
  37. f16_16_8[0][0];
  38. // don't support scalar component selection: .x is applied to a cooperative matrix
  39. f16_16_8.x;
  40. f16_16_8 * f16_16_8; // matrix * matrix. NOTE(review): lines 40-51 have no comment in the original; presumably each is an unsupported operation or operand-type mismatch - confirm
  41. f16_16_8 + 1.0; // matrix + float literal
  42. f16_16_8 - 1.0; // matrix - float literal
  43. f16_16_8 / 1.0; // matrix / float literal
  44. f16_16_8 += 1.0; // compound add with a float literal
  45. f16_16_8 -= 1.0; // compound subtract with a float literal
  46. f16_16_8 /= 1.0; // compound divide with a float literal
  47. f16_16_8*2.0; // <16, ...> matrix times an unsuffixed float literal (matrix on the left)
  48. 2.0*f16_16_8; // same operands, literal on the left
  49. f32_16_8*float16_t(2.0); // <32, ...> matrix times a float16_t scalar (matrix on the left)
  50. float16_t(2.0)*f32_16_8; // same operands, scalar on the left
  51. transpose(f16_8_8); // built-in transpose() called on a cooperative matrix
  52. }