From 7544d304bfb5343ead8e2d2993aedb5a5be6b6dc Mon Sep 17 00:00:00 2001
From: sd109
Date: Thu, 29 Aug 2024 16:33:22 +0100
Subject: [PATCH 1/2] Update vLLM to v0.5.5

---
 chart/values.yaml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/chart/values.yaml b/chart/values.yaml
index 6fd3841..d37d5fc 100644
--- a/chart/values.yaml
+++ b/chart/values.yaml
@@ -35,7 +35,7 @@ api:
   # Container image config
   image:
     repository: vllm/vllm-openai
-    version: v0.5.4
+    version: v0.5.5
   monitoring:
     enabled: true
   # The number of replicas for the backend deployment

From 3dc68bce938fe72d602d2162a4714da2cd54308c Mon Sep 17 00:00:00 2001
From: sd109
Date: Thu, 29 Aug 2024 16:33:47 +0100
Subject: [PATCH 2/2] Update default model to a newer open-access LLM

---
 chart/values.yaml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/chart/values.yaml b/chart/values.yaml
index d37d5fc..626b265 100644
--- a/chart/values.yaml
+++ b/chart/values.yaml
@@ -5,7 +5,7 @@ huggingface:
   # The name of the HuggingFace model to use
   # Use a yaml anchor to avoid duplication elsewhere
-  model: &model-name ise-uiuc/Magicoder-S-DS-6.7B
+  model: &model-name microsoft/Phi-3.5-mini-instruct
   # A Jinja formatted chat template to provide to the language model.
   # See https://huggingface.co/blog/chat-templates for background info.
   # If not provided, the default template specified in the HuggingFace