Skip to content

Commit aa17d32

Browse files
vulkan: avoid using workgroup size before it is referenced
1 parent: 118b4f0; commit: aa17d32

14 files changed, with 26 additions (+26) and 26 deletions (-26).

ggml/src/ggml-vulkan/vulkan-shaders/copy_from_quant.comp

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -13,7 +13,7 @@ layout(local_size_x = 1, local_size_y = 1, local_size_z = 1) in;
1313

1414
void main() {
1515
#if defined(DATA_A_IQ2_XXS) || defined(DATA_A_IQ2_XS) || defined(DATA_A_IQ2_S) || defined(DATA_A_IQ3_XXS) || defined(DATA_A_IQ3_S) || defined(DATA_A_IQ4_NL)
16-
init_iq_shmem();
16+
init_iq_shmem(gl_WorkGroupSize);
1717
if (gl_LocalInvocationIndex.x != 0) {
1818
return;
1919
}

ggml/src/ggml-vulkan/vulkan-shaders/copy_to_quant.comp

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -218,7 +218,7 @@ void quantize(uint dst_idx, uint src_idx)
218218

219219
void main() {
220220
#if defined(DATA_A_IQ2_XXS) || defined(DATA_A_IQ2_XS) || defined(DATA_A_IQ2_S) || defined(DATA_A_IQ3_XXS) || defined(DATA_A_IQ3_S) || defined(DATA_A_IQ4_NL)
221-
init_iq_shmem();
221+
init_iq_shmem(gl_WorkGroupSize);
222222
if (gl_LocalInvocationIndex.x != 0) {
223223
return;
224224
}

ggml/src/ggml-vulkan/vulkan-shaders/dequant_iq2_s.comp

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -11,7 +11,7 @@ void main() {
1111
// Each thread handles 1 subblock (32 values with 2 scales)
1212
const uint ib = gl_WorkGroupID.x * 32 + gl_LocalInvocationID.x / 8;
1313

14-
init_iq_shmem();
14+
init_iq_shmem(gl_WorkGroupSize);
1515

1616
if (ib >= p.nel / 256) {
1717
return;

ggml/src/ggml-vulkan/vulkan-shaders/dequant_iq2_xs.comp

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -11,7 +11,7 @@ void main() {
1111
// Each thread handles 1 subblock (32 values with 2 scales)
1212
const uint ib = gl_WorkGroupID.x * 32 + gl_LocalInvocationID.x / 8;
1313

14-
init_iq_shmem();
14+
init_iq_shmem(gl_WorkGroupSize);
1515

1616
if (ib >= p.nel / 256) {
1717
return;

ggml/src/ggml-vulkan/vulkan-shaders/dequant_iq2_xxs.comp

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -12,7 +12,7 @@ void main() {
1212
// Each block is described by 4 lattice indices, 4x7 sign bits and 4 scale bits
1313
const uint ib = gl_WorkGroupID.x * 32 + gl_LocalInvocationID.x / 8;
1414

15-
init_iq_shmem();
15+
init_iq_shmem(gl_WorkGroupSize);
1616

1717
if (ib >= p.nel / 256) {
1818
return;

ggml/src/ggml-vulkan/vulkan-shaders/dequant_iq3_s.comp

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -12,7 +12,7 @@ void main() {
1212
// Each block contains 4 scale bytes (8 scales) for 256 output values.
1313
const uint ib = gl_WorkGroupID.x * 32 + gl_LocalInvocationID.x / 8;
1414

15-
init_iq_shmem();
15+
init_iq_shmem(gl_WorkGroupSize);
1616

1717
if (ib >= p.nel / 256) {
1818
return;

ggml/src/ggml-vulkan/vulkan-shaders/dequant_iq3_xxs.comp

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -12,7 +12,7 @@ void main() {
1212
// 8 threads handle 1 superblock
1313
const uint ib = gl_WorkGroupID.x * 32 + gl_LocalInvocationID.x / 8;
1414

15-
init_iq_shmem();
15+
init_iq_shmem(gl_WorkGroupSize);
1616

1717
if (ib >= p.nel / 256) {
1818
return;

ggml/src/ggml-vulkan/vulkan-shaders/dequant_iq4_nl.comp

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -10,7 +10,7 @@ layout (binding = 1) writeonly buffer D {D_TYPE data_b[];};
1010
void main() {
1111
const uint i = gl_WorkGroupID.x * 4 + gl_LocalInvocationID.x / 64;
1212

13-
init_iq_shmem();
13+
init_iq_shmem(gl_WorkGroupSize);
1414

1515
const uint tid = gl_LocalInvocationID.x % 64;
1616
const uint il = tid/32;

ggml/src/ggml-vulkan/vulkan-shaders/flash_attn_cm2.comp

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -105,7 +105,7 @@ ACC_TYPE Max(const in uint32_t row, const in uint32_t col, const in ACC_TYPE ele
105105

106106
void main() {
107107
#if defined(DATA_A_IQ2_XXS) || defined(DATA_A_IQ2_XS) || defined(DATA_A_IQ2_S) || defined(DATA_A_IQ3_XXS) || defined(DATA_A_IQ3_S) || defined(DATA_A_IQ4_NL)
108-
init_iq_shmem();
108+
init_iq_shmem(gl_WorkGroupSize);
109109
#endif
110110

111111
const uint32_t N = p.N;

ggml/src/ggml-vulkan/vulkan-shaders/get_rows_quant.comp

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -13,7 +13,7 @@ void main() {
1313
const uint i12 = (gl_GlobalInvocationID.z)%p.ne12;
1414

1515
#if defined(DATA_A_IQ2_XXS) || defined(DATA_A_IQ2_XS) || defined(DATA_A_IQ2_S) || defined(DATA_A_IQ3_XXS) || defined(DATA_A_IQ3_S) || defined(DATA_A_IQ4_NL)
16-
init_iq_shmem();
16+
init_iq_shmem(gl_WorkGroupSize);
1717
#endif
1818

1919
if (i00 >= p.ne00) {

0 commit comments

Comments
 (0)