From 9acf19413d6326d88b8389d2b0c48928f787f5eb Mon Sep 17 00:00:00 2001 From: Sushanth Rajasankar Date: Tue, 10 Dec 2024 15:14:14 -0800 Subject: [PATCH] fix typo --- onnxruntime/contrib_ops/webgpu/quantization/matmul_nbits.cc | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/onnxruntime/contrib_ops/webgpu/quantization/matmul_nbits.cc b/onnxruntime/contrib_ops/webgpu/quantization/matmul_nbits.cc index 919054796d42c..4e2429c7c2964 100644 --- a/onnxruntime/contrib_ops/webgpu/quantization/matmul_nbits.cc +++ b/onnxruntime/contrib_ops/webgpu/quantization/matmul_nbits.cc @@ -502,7 +502,7 @@ Status MatMulNBits::ComputeInternal(onnxruntime::webgpu::ComputeContext& context constexpr int32_t subgroup_size = 16; // How many times each workgroup reloads A sharing B. This is tuneable, // 8 produces a good performance for sequence length of 256/512, 16 will give - // slightly better performance for seqeengths of 1024. + // slightly better performance for sequence lengths of 1024. // Note: This should match A_REPEAT in the shader. constexpr unsigned int kMatMulPrefillARepeat = 8; program.SetWorkgroupSize(tile_size * subgroup_size);