Skip to content

Commit

Permalink
Fix debug Turing switch
Browse files Browse the repository at this point in the history
  • Loading branch information
ZeronSix committed Feb 26, 2025
1 parent a24ba57 commit 4772f2c
Showing 1 changed file with 2 additions and 2 deletions.
4 changes: 2 additions & 2 deletions inference_lib/src/aqlm/inference_kernels/cuda_kernel.cu
Original file line number Diff line number Diff line change
Expand Up @@ -589,7 +589,7 @@ void code2x8_matvec_cuda(
int threads = 32 * thread_m;
cudaStream_t stream = at::cuda::getCurrentCUDAStream().stream();
const bool is_turing = cc_major == 7 && cc_minor == 5;
- if (is_turing) {
+ if (!is_turing) {
int shared = 16 * (2 * 256 * 8 + 32 * 9);
cudaFuncSetAttribute(
Code2x8MatVec<use_bfloat16>, cudaFuncAttributeMaxDynamicSharedMemorySize, shared
Expand Down Expand Up @@ -655,7 +655,7 @@ void code2x8_dequant_cuda(
int threads = 32 * thread_m;
cudaStream_t stream = at::cuda::getCurrentCUDAStream().stream();
const bool is_turing = cc_major == 7 && cc_minor == 5;
- if (is_turing) {
+ if (!is_turing) {
int shared = 16 * (2 * 256 * 8 + 32 * 9);
if (use_bfloat16) {
cudaFuncSetAttribute(
Expand Down

0 comments on commit 4772f2c

Please sign in to comment.