We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 0b8040d, commit 2f60f37 (Copy full SHA for 2f60f37)
1 file changed
dpctl/tensor/libtensor/include/kernels/linalg_functions/gemm.hpp
@@ -2190,7 +2190,7 @@ class GemmBatchNoAtomicFunctorThreadK
2190
for (size_t vec_id = 1; vec_id < m_groups; ++vec_id) {
2191
if (j + vec_id < m) {
2192
res[total_offset + res_indexer(i * m + j + vec_id)] =
2193
- local_sum[1];
+ local_sum[vec_id];
2194
}
2195
2196
0 commit comments