[CPU] Fix MatMulNBits accuracy level (microsoft#22963)

### Description Fix MatMulNBits accuracy level ### Motivation and Context
intel · Dec 11, 2024 · 3828c33 · 3828c33
1 parent 14950cc
commit 3828c33
Show file tree

Hide file tree

Showing 2 changed files with 5 additions and 3 deletions.
diff --git a/onnxruntime/contrib_ops/cpu/quantization/matmul_nbits.cc b/onnxruntime/contrib_ops/cpu/quantization/matmul_nbits.cc
@@ -33,6 +33,7 @@ constexpr size_t A = 0,
 };
 
 typedef enum {
+  Level0, /*!< input fp32, accumulator fp32 */
   Level1, /*!< input fp32, accumulator fp32 */
   Level2, /*!< input fp16, accumulator fp16 */
   Level3, /*!< input bf16, accumulator fp32 */

diff --git a/onnxruntime/test/contrib_ops/matmul_4bits_test.cc b/onnxruntime/test/contrib_ops/matmul_4bits_test.cc
@@ -274,11 +274,12 @@ void TestMatMulNBitsTyped() {
   base_opts.block_size = block_size;
   base_opts.accuracy_level = accuracy_level;
 
-  if constexpr (std::is_same<AType, MLFloat16>::value) {
+  if (base_opts.accuracy_level == 4) {
+    base_opts.output_abs_error = 0.1f;
+    base_opts.output_rel_error = 0.02f;
+  } else if constexpr (std::is_same<AType, MLFloat16>::value) {
     base_opts.output_abs_error = 0.055f;
     base_opts.output_rel_error = 0.02f;
-  } else if (base_opts.accuracy_level == 4) {
-    base_opts.output_abs_error = 0.1f;
   }
 
   {