dequant_f32.comp 442 B

1234567891011121314151617181920
  1. #version 450
  2. #include "dequant_head.comp"
  // Workgroup shape: 256 invocations along x. The y and z sizes are left
  // unspecified and therefore default to 1.
  layout(local_size_x = 256) in;

  // Binding 0: source values, only ever read by this shader.
  layout(binding = 0) readonly buffer A {
      float data_a[];
  };

  // Binding 1: destination values, only ever written by this shader.
  // D_TYPE is not defined in this file; presumably it is supplied by
  // "dequant_head.comp" or by a build-time define (confirm against the build).
  layout(binding = 1) writeonly buffer D {
      D_TYPE data_b[];
  };
  // Converts elements of data_a to D_TYPE and stores them in data_b.
  //
  // Each invocation handles up to 16 consecutive elements, starting at
  // gl_GlobalInvocationID.x * 16. p.nel is declared outside this file
  // (presumably a push constant from "dequant_head.comp") and is used here
  // as the exclusive upper bound on element indices.
  void main() {
      const uint base = gl_GlobalInvocationID.x * 16;

      // Invocations whose whole 16-element slice lies past the end do nothing.
      if (base >= p.nel) {
          return;
      }

      [[unroll]] for (uint l = 0; l < 16; l++) {
          const uint idx = base + l;
          // Guard every element, not just the first one of the slice: when
          // p.nel is not a multiple of 16 the final slice is only partially
          // in range, and touching the remainder would read and write past
          // the intended end of both buffers.
          if (idx < p.nel) {
              data_b[idx] = D_TYPE(data_a[idx]);
          }
      }
  }