From c059bd284832d09bc51cf82c377642b26a48ef28 Mon Sep 17 00:00:00 2001
From: Tim Dettmers
Date: Sun, 20 Nov 2022 14:18:15 -0800
Subject: Added additional blocksizes: {64, 128, 256}.

---
 csrc/ops.cu | 12 ++++++++++++
 1 file changed, 12 insertions(+)

(limited to 'csrc/ops.cu')

diff --git a/csrc/ops.cu b/csrc/ops.cu
index b121fc2..30079e6 100644
--- a/csrc/ops.cu
+++ b/csrc/ops.cu
@@ -65,6 +65,12 @@ template void quantizeBlockwise(float * code, T *A,
     kQuantizeBlockwise<<>>(code, A, absmax, out, rand, rand_offset, n);
   else if(blocksize == 512)
     kQuantizeBlockwise<<>>(code, A, absmax, out, rand, rand_offset, n);
+  else if(blocksize == 256)
+    kQuantizeBlockwise<<>>(code, A, absmax, out, rand, rand_offset, n);
+  else if(blocksize == 128)
+    kQuantizeBlockwise<<>>(code, A, absmax, out, rand, rand_offset, n);
+  else if(blocksize == 64)
+    kQuantizeBlockwise<<>>(code, A, absmax, out, rand, rand_offset, n);

   CUDA_CHECK_RETURN(cudaPeekAtLastError());

@@ -82,6 +88,12 @@ template void dequantizeBlockwise(float *code, unsigned char *A, flo
     kDequantizeBlockwise<<>>(code, A, absmax, out, n);
   else if(blocksize == 512)
     kDequantizeBlockwise<<>>(code, A, absmax, out, n);
+  else if(blocksize == 256)
+    kDequantizeBlockwise<<>>(code, A, absmax, out, n);
+  else if(blocksize == 128)
+    kDequantizeBlockwise<<>>(code, A, absmax, out, n);
+  else if(blocksize == 64)
+    kDequantizeBlockwise<<>>(code, A, absmax, out, n);

   CUDA_CHECK_RETURN(cudaPeekAtLastError());
 }
--
cgit v1.2.3