llama-cpp-turboquant/shaders/glsl/opmult.comp

27 lines
573 B
Text

#version 450
layout(set = 0, binding = 0) buffer tensorLhs {
uint valuesLhs[ ];
};
layout(set = 0, binding = 1) buffer tensorRhs {
uint valuesRhs[ ];
};
layout(set = 0, binding = 2) buffer tensorOutput {
uint valuesOutput[ ];
};
// TODO: Explore how to make layout inside shader dynamic
layout (local_size_x = 1, local_size_y = 1, local_size_z = 1) in;
void main()
{
uint index = gl_GlobalInvocationID.x;
//valuesOutput[index] = valuesLhs[index] * valuesRhs[index];
// FOR TESTING
valuesOutput[index] = valuesLhs[index] + valuesRhs[index];
}