From 6bc1eab1cde90f025ab02f89034334e46e5c7f9a Mon Sep 17 00:00:00 2001 From: Gabriele Oliaro Date: Sun, 29 Sep 2024 15:40:30 +0000 Subject: [PATCH] support llama3.2 --- python/flexflow/serve/models/llama.py | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/python/flexflow/serve/models/llama.py b/python/flexflow/serve/models/llama.py index 53209298a5..7d67ccbed6 100644 --- a/python/flexflow/serve/models/llama.py +++ b/python/flexflow/serve/models/llama.py @@ -281,3 +281,7 @@ def convert_hf_model(model, dst_folder): for name, params in model.named_parameters(): name = FlexFlowLLAMA.convert_hf_weight_name(name) params.detach().cpu().numpy().tofile(f"{dst_folder}/{name}") + # LM head weight + model.lm_head.weight.detach().cpu().numpy().tofile( + os.path.join(dst_folder, "lm_head.weight") + )