vulkan: Apply bias before softmax in FA, to avoid overflow (#24909)

This commit is contained in:
Jeff Bolz 2026-06-23 22:34:00 -05:00 committed by GitHub
parent be4a6a63eb
commit ac4105d68b
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
2 changed files with 2 additions and 0 deletions

View File

@@ -463,6 +463,7 @@ void main() {
} }
rowmaxf = max(rowmaxf, float(Sf[r][c])); rowmaxf = max(rowmaxf, float(Sf[r][c]));
} }
rowmaxf += FATTN_KQ_MAX_OFFSET;
float Moldf = Mf[r]; float Moldf = Mf[r];
// M = max(rowmax, Mold) // M = max(rowmax, Mold)

View File

@@ -352,6 +352,7 @@ void main() {
} }
rowmaxf = max(rowmaxf, float(sfsh[r_vec + (c * cols_per_iter + col_tid) * sfshstride][r_comp])); rowmaxf = max(rowmaxf, float(sfsh[r_vec + (c * cols_per_iter + col_tid) * sfshstride][r_comp]));
} }
rowmaxf += FATTN_KQ_MAX_OFFSET;
float Moldf = Mf[r]; float Moldf = Mf[r];
// Compute max across the row // Compute max across the row