[ET-VK][qconv] Read weight buffer as int in pack_q8_conv2d_weights shader

ssjia · ssjia · commit bace537be99a · 2026-02-25T06:17:58.000-08:00
The shader previously declared the input weight buffer as int8, which requires the GL_EXT_shader_8bit_storage extension; that extension is not supported on all devices. Replace it with an int (int32) buffer and extract individual bytes via shift-and-mask (word index is byte_idx >> 2, byte position within the word is byte_idx & 3), the same technique used in nchw_to_int8x4_buffer.glsl. This makes the shader functional on devices without 8-bit buffer support. Differential Revision: [D94314255](https://our.internmc.facebook.com/intern/diff/D94314255/) [ghstack-poisoned]
diff --git a/backends/vulkan/runtime/graph/ops/glsl/pack_q8_conv2d_weights.glsl b/backends/vulkan/runtime/graph/ops/glsl/pack_q8_conv2d_weights.glsl
@@ -8,8 +8,6 @@
 
 #version 450 core
 
-${define_required_extensions("buffer", "int8")}
-
 #define PRECISION ${PRECISION}
 
 ${define_active_storage_type(STORAGE)}
@@ -19,7 +17,7 @@ ${define_active_storage_type(STORAGE)}
 layout(std430) buffer;
 
 ${layout_declare_tensor(B, "w", "t_packed_int8_weight", "int", STORAGE, is_scalar_array=False)}
-${layout_declare_tensor(B, "r", "t_int8_weight", "int8", "buffer")}
+${layout_declare_tensor(B, "r", "t_int8_weight", "int", "buffer")}
 
 layout(push_constant) uniform restrict Block {
   ivec4 qmat2_sizes;
@@ -65,7 +63,9 @@ void main() {
       ivec4 weight_vals = ivec4(0);
       for (int col = 0; col < 4; col++) {
         if (ic + col < orig_sizes.w) {
-          weight_vals[col] = int(t_int8_weight[buf_idx + col]);
+          const int byte_idx = buf_idx + col;
+          const int byte_pos = byte_idx & 3;
+          weight_vals[col] = (t_int8_weight[byte_idx >> 2] >> (byte_pos * 8)) & 0xFF;
         }
       }
       packed_block[row] = pack_into_int32(weight_vals);