template spacing

microsoft · Oct 23, 2023 · 2ad5689 · 2ad5689
1 parent 7f1d345
commit 2ad5689
Show file tree

Hide file tree

Showing 2 changed files with 19 additions and 19 deletions.
diff --git a/onnxruntime/contrib_ops/cuda/quantization/dequantize_blockwise_bnb4.cu b/onnxruntime/contrib_ops/cuda/quantization/dequantize_blockwise_bnb4.cu
@@ -111,13 +111,13 @@ template Status DequantizeBnb4<float>(
     cudaStream_t stream);
 
 template Status DequantizeBnb4<half>(
-  const half* quant_map, 
-  half *output, 
-  const uint8_t *quant_data, 
-  const half *absmax, 
-  int block_size, 
-  int numel, 
-  cudaStream_t stream);
+    const half* quant_map, 
+    half *output, 
+    const uint8_t *quant_data, 
+    const half *absmax, 
+    int block_size, 
+    int numel, 
+    cudaStream_t stream);
 
 }  // namespace cuda
 }  // namespace contrib

diff --git a/onnxruntime/contrib_ops/cuda/quantization/matmul_bnb4.cu b/onnxruntime/contrib_ops/cuda/quantization/matmul_bnb4.cu
@@ -13,18 +13,18 @@ namespace cuda {
 #define num_values_4bit 32
 template <typename T, int THREADS, int BITS>
 __global__ void kgemm_4bit_inference_naive(
-  int M,
-  int N,
-  int K,
-  const T* __restrict__ A,
-  const uint8_t *B,
-  const T *absmax,
-  const T *datatype,
-  T * out,
-  int lda,
-  int ldb,
-  int ldc,
-  int block_size) {
+    int M,
+    int N,
+    int K,
+    const T* __restrict__ A,
+    const uint8_t *B,
+    const T *absmax,
+    const T *datatype,
+    T * out,
+    int lda,
+    int ldb,
+    int ldc,
+    int block_size) {
   // per threadblock:
   // load step-by-step in chunks of [32,warps]: 1x32 * [32,warps] -> [1,warps]
   // 4 warps -> 4 loads per iter