bug fix from commit 3c108d4232

This commit is contained in:
PanQiWei 2023-05-04 22:34:16 +08:00
parent e4d476be16
commit fe3456100c

View file

@ -291,6 +291,7 @@ __global__ void VecQuant2MatMulKernel(
res += weight[k] * blockvec[k];
}
atomicAdd(&mul[b * width + w], res);
__syncthreads();
}
}
@ -435,6 +436,7 @@ __global__ void VecQuant3MatMulKernel(
res += weight[k] * blockvec[k];
}
atomicAdd(&mul[b * width + w], res);
__syncthreads();
}
}
@ -522,6 +524,7 @@ __global__ void VecQuant4MatMulKernel(
res += weight[k] * blockvec[k];
}
atomicAdd(&mul[b * width + w], res);
__syncthreads();
}
}
@ -608,6 +611,7 @@ __global__ void VecQuant8MatMulKernel(
res += weight[k] * blockvec[k];
}
atomicAdd(&mul[b * width + w], res);
__syncthreads();
}
}