vulkan: add missing clamps in new mul_mat_id paths (llama/15702)

This fixes a missing interaction between #15546 and #15652.
This commit is contained in:
Jeff Bolz 2025-09-01 14:01:10 -05:00 committed by Georgi Gerganov
parent d5f80a2982
commit 7a5e7368a3
No known key found for this signature in database
GPG Key ID: 449E073F9DC10735
1 changed file with 6 additions and 0 deletions

View File

@@ -494,6 +494,9 @@ void main() {
sum = coopMatMulAdd(mat_a, mat_b, sum);
}
}
#if defined(ACC_TYPE_MAX)
[[unroll]] for (uint i = 0; i < sum.length(); ++i) { sum[i] = clamp(sum[i], -ACC_TYPE_MAX, ACC_TYPE_MAX); }
#endif
// Convert from ACC_TYPE to D_TYPE
coopmat<D_TYPE, gl_ScopeWorkgroup, BM, BNover4, gl_MatrixUseAccumulator> mat_d;
@@ -535,6 +538,9 @@ void main() {
sum = coopMatMulAdd(mat_a, mat_b, sum);
}
}
#if defined(ACC_TYPE_MAX)
[[unroll]] for (uint i = 0; i < sum.length(); ++i) { sum[i] = clamp(sum[i], -ACC_TYPE_MAX, ACC_TYPE_MAX); }
#endif
// Convert from ACC_TYPE to D_TYPE
coopmat<D_TYPE, gl_ScopeWorkgroup, BM, BNover2, gl_MatrixUseAccumulator> mat_d;