From 896cbab669fe2be574571275ffea64942812e587 Mon Sep 17 00:00:00 2001
From: Xida <xidaren2@amd.com>
Date: Thu, 26 Dec 2024 19:14:08 +0000
Subject: [PATCH] fix prefix_sharing_algorithm config write

---
 .../llm/server_management.py                  | 20 ++++++-------------
 1 file changed, 6 insertions(+), 14 deletions(-)

diff --git a/app_tests/integration_tests/llm/server_management.py b/app_tests/integration_tests/llm/server_management.py
index 7cbfc390b..cf7211655 100644
--- a/app_tests/integration_tests/llm/server_management.py
+++ b/app_tests/integration_tests/llm/server_management.py
@@ -40,8 +40,9 @@ def find_available_port() -> int:
     def __init__(self, config: ServerConfig):
         self.config = config
 
-    def write_config(self) -> Path:
+    def _write_config(self) -> Path:
         """Creates server config by extending the exported model config."""
+        # TODO: drop this config rewrite once prefix_sharing_algorithm is a cmdline arg of server.py
         source_config_path = self.config.artifacts.config_path
         server_config_path = (
             source_config_path.parent
@@ -51,25 +52,16 @@ def write_config(self) -> Path:
         # Read the exported config as base
         with open(source_config_path) as f:
             config = json.load(f)
-
-        # Update with server-specific settings
-        config.update(
-            {
-                "paged_kv_cache": {
-                    "prefix_sharing_algorithm": self.config.prefix_sharing_algorithm
-                }
-            }
-        )
-
-        # Write the extended config
+        config["paged_kv_cache"][
+            "prefix_sharing_algorithm"
+        ] = self.config.prefix_sharing_algorithm
         with open(server_config_path, "w") as f:
             json.dump(config, f)
-        6
         return server_config_path
 
     def start(self) -> subprocess.Popen:
         """Starts the server process."""
-        config_path = self.write_config()
+        config_path = self._write_config()
         cmd = [
             sys.executable,
             "-m",