From 8e7b193a1f5e9c7be38e09727af6704858744416 Mon Sep 17 00:00:00 2001 From: cryscan Date: Thu, 20 Jun 2024 21:28:20 +0800 Subject: [PATCH] Fix no subgroups quant GEMV. --- Cargo.toml | 2 +- src/tensor/ops.rs | 2 ++ 2 files changed, 3 insertions(+), 1 deletion(-) diff --git a/Cargo.toml b/Cargo.toml index 418e125..451d44b 100644 --- a/Cargo.toml +++ b/Cargo.toml @@ -9,7 +9,7 @@ keywords = ["deep-learning", "language", "model", "rwkv"] license = "MIT OR Apache-2.0" name = "web-rwkv" repository = "https://github.com/cryscan/web-rwkv" -version = "0.8.14" +version = "0.8.15" [dependencies] ahash = "0.8" diff --git a/src/tensor/ops.rs b/src/tensor/ops.rs index 8daccd6..973c89f 100644 --- a/src/tensor/ops.rs +++ b/src/tensor/ops.rs @@ -740,6 +740,7 @@ impl TensorOp { None, Macros::new() .u32("BLOCK_SIZE", BLOCK_SIZE) + .int8(Self::INT8_BLOCK_SIZE) .tensor(&input, Some("IN")) .tensor(&output, Some("OUT")) .custom(active, Some("ACT")), @@ -833,6 +834,7 @@ impl TensorOp { None, Macros::new() .u32("BLOCK_SIZE", BLOCK_SIZE) + .nf4(Self::NF4_BLOCK_SIZE) .tensor(&input, Some("IN")) .tensor(&output, Some("OUT")) .custom(active, Some("ACT")),