diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/README.md b/bentoml/bentos/gemma/2b-instruct-fp16-0856/README.md similarity index 97% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/README.md rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/README.md index b94fda3..d8b48b3 100644 --- a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/README.md +++ b/bentoml/bentos/gemma/2b-instruct-fp16-0856/README.md @@ -1,4 +1,4 @@ -# gemma:2b-instruct-fp16-26b3 +# gemma:2b-instruct-fp16-0856 [![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) [![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/apis/openapi.yaml b/bentoml/bentos/gemma/2b-instruct-fp16-0856/apis/openapi.yaml similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/apis/openapi.yaml rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/apis/openapi.yaml diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/apis/schema.json b/bentoml/bentos/gemma/2b-instruct-fp16-0856/apis/schema.json similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/apis/schema.json rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/apis/schema.json diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/bento.yaml b/bentoml/bentos/gemma/2b-instruct-fp16-0856/bento.yaml similarity index 95% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/bento.yaml rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/bento.yaml index 31cfc63..b7fbee6 100644 --- a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/bento.yaml +++ b/bentoml/bentos/gemma/2b-instruct-fp16-0856/bento.yaml @@ -1,12 +1,11 @@ service: service:VLLM name: gemma -version: 2b-instruct-fp16-26b3 +version: 2b-instruct-fp16-0856 bentoml_version: 1.2.19 -creation_time: '2024-07-08T07:57:26.100524+00:00' +creation_time: '2024-07-12T13:40:09.050778+00:00' labels: + model_name: google/gemma-2b-it openllm_alias: 2b,2b-instruct - openllm_hf_model_id: google/gemma-2b-it - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/env/docker/Dockerfile b/bentoml/bentos/gemma/2b-instruct-fp16-0856/env/docker/Dockerfile similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/env/docker/Dockerfile rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/env/docker/Dockerfile diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/env/docker/entrypoint.sh b/bentoml/bentos/gemma/2b-instruct-fp16-0856/env/docker/entrypoint.sh similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/env/docker/entrypoint.sh rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/env/docker/entrypoint.sh diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/env/python/install.sh b/bentoml/bentos/gemma/2b-instruct-fp16-0856/env/python/install.sh similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/env/python/install.sh rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/env/python/install.sh diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/env/python/requirements.lock.txt b/bentoml/bentos/gemma/2b-instruct-fp16-0856/env/python/requirements.lock.txt similarity index 96% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/env/python/requirements.lock.txt rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/env/python/requirements.lock.txt index 925ce19..f6acdf5 100644 --- a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/env/python/requirements.lock.txt +++ b/bentoml/bentos/gemma/2b-instruct-fp16-0856/env/python/requirements.lock.txt @@ -41,7 +41,7 @@ inflection==0.5.1 interegular==0.3.3 jinja2==3.1.4 joblib==1.4.2 -jsonschema==4.22.0 +jsonschema==4.23.0 jsonschema-specifications==2023.12.1 lark==1.1.9 llvmlite==0.43.0 @@ -70,7 +70,7 @@ nvidia-ml-py==11.525.150 nvidia-nccl-cu12==2.20.5 nvidia-nvjitlink-cu12==12.5.82 nvidia-nvtx-cu12==12.1.105 -openai==1.35.10 +openai==1.35.13 opentelemetry-api==1.20.0 opentelemetry-instrumentation==0.41b0 opentelemetry-instrumentation-aiohttp-client==0.41b0 @@ -100,12 +100,12 @@ python-json-logger==2.0.7 python-multipart==0.0.9 pyyaml==6.0.1 pyzmq==26.0.3 -ray==2.31.0 +ray==2.32.0 referencing==0.35.1 regex==2024.5.15 requests==2.32.3 rich==13.7.1 -rpds-py==0.18.1 +rpds-py==0.19.0 safetensors==0.4.3 schema==0.7.7 scipy==1.13.1 @@ -115,7 +115,7 @@ simple-di==0.1.5 six==1.16.0 sniffio==1.3.1 starlette==0.37.2 -sympy==1.12.1 +sympy==1.13.0 tiktoken==0.7.0 tokenizers==0.19.1 tomli==2.0.1 @@ -144,4 +144,4 @@ zipp==3.19.2 # The following packages are considered to be unsafe in a requirements file: pip==24.1.2 -setuptools==70.2.0 +setuptools==70.3.0 diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/env/python/requirements.txt b/bentoml/bentos/gemma/2b-instruct-fp16-0856/env/python/requirements.txt similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/env/python/requirements.txt rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/env/python/requirements.txt diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/env/python/version.txt b/bentoml/bentos/gemma/2b-instruct-fp16-0856/env/python/version.txt similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/env/python/version.txt rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/env/python/version.txt diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/bento_constants.py b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/bento_constants.py similarity index 87% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/bento_constants.py rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/bento_constants.py index f408ae0..0414c91 100644 --- a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/bento_constants.py +++ b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/bento_constants.py @@ -5,8 +5,8 @@ max_model_len: 2048 model: google/gemma-2b-it extra_labels: + model_name: google/gemma-2b-it openllm_alias: 2b,2b-instruct - openllm_hf_model_id: google/gemma-2b-it project: vllm-chat service_config: name: gemma diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/bentofile.yaml b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/bentofile.yaml similarity index 93% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/bentofile.yaml rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/bentofile.yaml index 49d283b..ce465e0 100644 --- a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/bentofile.yaml +++ b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/bentofile.yaml @@ -28,9 +28,8 @@ include: - chat_templates/chat_templates/*.jinja - chat_templates/generation_configs/*.json labels: + model_name: google/gemma-2b-it openllm_alias: 2b,2b-instruct - openllm_hf_model_id: google/gemma-2b-it - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/chat_templates/alpaca.jinja b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/chat_templates/alpaca.jinja similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/chat_templates/alpaca.jinja rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/chat_templates/alpaca.jinja diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/chat_templates/amberchat.jinja b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/chat_templates/amberchat.jinja similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/chat_templates/amberchat.jinja rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/chat_templates/amberchat.jinja diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/chat_templates/chatml.jinja b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/chat_templates/chatml.jinja similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/chat_templates/chatml.jinja rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/chat_templates/chatml.jinja diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/chat_templates/chatqa.jinja b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/chat_templates/chatqa.jinja similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/chat_templates/chatqa.jinja rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/chat_templates/chatqa.jinja diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/chat_templates/falcon-instruct.jinja b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/chat_templates/falcon-instruct.jinja similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/chat_templates/falcon-instruct.jinja rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/chat_templates/falcon-instruct.jinja diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/chat_templates/gemma-it.jinja b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/chat_templates/gemma-it.jinja similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/chat_templates/gemma-it.jinja rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/chat_templates/gemma-it.jinja diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/chat_templates/llama-2-chat.jinja b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/chat_templates/llama-2-chat.jinja similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/chat_templates/llama-2-chat.jinja rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/chat_templates/llama-2-chat.jinja diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/chat_templates/llama-3-chat.jinja b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/chat_templates/llama-3-chat.jinja similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/chat_templates/llama-3-chat.jinja rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/chat_templates/llama-3-chat.jinja diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/chat_templates/mistral-instruct.jinja b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/chat_templates/mistral-instruct.jinja similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/chat_templates/mistral-instruct.jinja rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/chat_templates/mistral-instruct.jinja diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/chat_templates/openchat.jinja b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/chat_templates/openchat.jinja similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/chat_templates/openchat.jinja rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/chat_templates/openchat.jinja diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/chat_templates/phi-3.jinja b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/chat_templates/phi-3.jinja similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/chat_templates/phi-3.jinja rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/chat_templates/phi-3.jinja diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/chat_templates/saiga.jinja b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/chat_templates/saiga.jinja similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/chat_templates/saiga.jinja rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/chat_templates/saiga.jinja diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/chat_templates/solar-instruct.jinja b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/chat_templates/solar-instruct.jinja similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/chat_templates/solar-instruct.jinja rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/chat_templates/solar-instruct.jinja diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/chat_templates/vicuna.jinja b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/chat_templates/vicuna.jinja similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/chat_templates/vicuna.jinja rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/chat_templates/vicuna.jinja diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/chat_templates/zephyr.jinja b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/chat_templates/zephyr.jinja similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/chat_templates/zephyr.jinja rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/chat_templates/zephyr.jinja diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/generation_configs/alpaca.json b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/generation_configs/alpaca.json similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/generation_configs/alpaca.json rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/generation_configs/alpaca.json diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/generation_configs/amberchat.json b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/generation_configs/amberchat.json similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/generation_configs/amberchat.json rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/generation_configs/amberchat.json diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/generation_configs/chatqa.json b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/generation_configs/chatqa.json similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/generation_configs/chatqa.json rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/generation_configs/chatqa.json diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/generation_configs/gemma-it.json b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/generation_configs/gemma-it.json similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/generation_configs/gemma-it.json rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/generation_configs/gemma-it.json diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/generation_configs/llama-2-chat.json b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/generation_configs/llama-2-chat.json similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/generation_configs/llama-2-chat.json rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/generation_configs/llama-2-chat.json diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/generation_configs/llama-3-chat.json b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/generation_configs/llama-3-chat.json similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/generation_configs/llama-3-chat.json rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/generation_configs/llama-3-chat.json diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/generation_configs/mistral-instruct.json b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/generation_configs/mistral-instruct.json similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/generation_configs/mistral-instruct.json rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/generation_configs/mistral-instruct.json diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/generation_configs/openchat.json b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/generation_configs/openchat.json similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/generation_configs/openchat.json rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/generation_configs/openchat.json diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/generation_configs/orca-2.json b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/generation_configs/orca-2.json similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/generation_configs/orca-2.json rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/generation_configs/orca-2.json diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/generation_configs/phi-3.json b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/generation_configs/phi-3.json similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/generation_configs/phi-3.json rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/generation_configs/phi-3.json diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/generation_configs/qwen2-chat.json b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/generation_configs/qwen2-chat.json similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/generation_configs/qwen2-chat.json rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/generation_configs/qwen2-chat.json diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/generation_configs/saiga.json b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/generation_configs/saiga.json similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/generation_configs/saiga.json rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/generation_configs/saiga.json diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/generation_configs/solar-instruct.json b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/generation_configs/solar-instruct.json similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/generation_configs/solar-instruct.json rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/generation_configs/solar-instruct.json diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/generation_configs/vicuna.json b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/generation_configs/vicuna.json similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/generation_configs/vicuna.json rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/generation_configs/vicuna.json diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/generation_configs/yi-chat.json b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/generation_configs/yi-chat.json similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/generation_configs/yi-chat.json rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/generation_configs/yi-chat.json diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/generation_configs/zephyr.json b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/generation_configs/zephyr.json similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/chat_templates/generation_configs/zephyr.json rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/chat_templates/generation_configs/zephyr.json diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/service.py b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/service.py similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/service.py rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/service.py diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/404.html b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/404.html similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/404.html rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/404.html diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/700-532b1fe2415e5859.js b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/700-532b1fe2415e5859.js similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/700-532b1fe2415e5859.js rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/700-532b1fe2415e5859.js diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/995-34374f39bb210839.js b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/995-34374f39bb210839.js similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/995-34374f39bb210839.js rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/995-34374f39bb210839.js diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/css/429544bd3cd8ce3a.css b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/css/429544bd3cd8ce3a.css similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/css/429544bd3cd8ce3a.css rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/css/429544bd3cd8ce3a.css diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/css/5b67f082b31cfc7b.css b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/css/5b67f082b31cfc7b.css similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/css/5b67f082b31cfc7b.css rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/css/5b67f082b31cfc7b.css diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/css/9e63023b20ddb15e.css b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/css/9e63023b20ddb15e.css similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/_next/static/css/9e63023b20ddb15e.css rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/_next/static/css/9e63023b20ddb15e.css diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/apple-touch-icon.png b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/apple-touch-icon.png similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/apple-touch-icon.png rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/apple-touch-icon.png diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/chat.html b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/chat.html similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/chat.html rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/chat.html diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/chat.txt b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/chat.txt similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/chat.txt rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/chat.txt diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/favicon-16x16.png b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/favicon-16x16.png similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/favicon-16x16.png rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/favicon-16x16.png diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/favicon.ico b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/favicon.ico similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/favicon.ico rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/favicon.ico diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/index.html b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/index.html similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/index.html rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/index.html diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/index.txt b/bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/index.txt similarity index 100% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/ui/index.txt rename to bentoml/bentos/gemma/2b-instruct-fp16-0856/src/ui/index.txt diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/README.md b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/README.md similarity index 96% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/README.md rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/README.md index 141fc9b..1145507 100644 --- a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/README.md +++ b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/README.md @@ -1,4 +1,4 @@ -# gemma:7b-instruct-awq-4bit-d670 +# gemma:7b-instruct-awq-4bit-d11b [![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) [![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/apis/openapi.yaml b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/apis/openapi.yaml similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/apis/openapi.yaml rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/apis/openapi.yaml diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/apis/schema.json b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/apis/schema.json similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/apis/schema.json rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/apis/schema.json diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/bento.yaml b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/bento.yaml similarity index 94% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/bento.yaml rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/bento.yaml index 4284021..3ede09f 100644 --- a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/bento.yaml +++ b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/bento.yaml @@ -1,12 +1,11 @@ service: service:VLLM name: gemma -version: 7b-instruct-awq-4bit-d670 +version: 7b-instruct-awq-4bit-d11b bentoml_version: 1.2.19 -creation_time: '2024-07-08T07:59:18.619602+00:00' +creation_time: '2024-07-12T13:42:23.707025+00:00' labels: + model_name: casperhansen/gemma-7b-it-awq openllm_alias: 7b-4bit,7b-instruct-4bit - openllm_hf_model_id: casperhansen/gemma-7b-it-awq - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/env/docker/Dockerfile b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/env/docker/Dockerfile similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/env/docker/Dockerfile rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/env/docker/Dockerfile diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/env/docker/entrypoint.sh b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/env/docker/entrypoint.sh similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/env/docker/entrypoint.sh rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/env/docker/entrypoint.sh diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/env/python/install.sh b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/env/python/install.sh similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/env/python/install.sh rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/env/python/install.sh diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/env/python/requirements.lock.txt b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/env/python/requirements.lock.txt similarity index 96% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/env/python/requirements.lock.txt rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/env/python/requirements.lock.txt index 925ce19..f6acdf5 100644 --- a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/env/python/requirements.lock.txt +++ b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/env/python/requirements.lock.txt @@ -41,7 +41,7 @@ inflection==0.5.1 interegular==0.3.3 jinja2==3.1.4 joblib==1.4.2 -jsonschema==4.22.0 +jsonschema==4.23.0 jsonschema-specifications==2023.12.1 lark==1.1.9 llvmlite==0.43.0 @@ -70,7 +70,7 @@ nvidia-ml-py==11.525.150 nvidia-nccl-cu12==2.20.5 nvidia-nvjitlink-cu12==12.5.82 nvidia-nvtx-cu12==12.1.105 -openai==1.35.10 +openai==1.35.13 opentelemetry-api==1.20.0 opentelemetry-instrumentation==0.41b0 opentelemetry-instrumentation-aiohttp-client==0.41b0 @@ -100,12 +100,12 @@ python-json-logger==2.0.7 python-multipart==0.0.9 pyyaml==6.0.1 pyzmq==26.0.3 -ray==2.31.0 +ray==2.32.0 referencing==0.35.1 regex==2024.5.15 requests==2.32.3 rich==13.7.1 -rpds-py==0.18.1 +rpds-py==0.19.0 safetensors==0.4.3 schema==0.7.7 scipy==1.13.1 @@ -115,7 +115,7 @@ simple-di==0.1.5 six==1.16.0 sniffio==1.3.1 starlette==0.37.2 -sympy==1.12.1 +sympy==1.13.0 tiktoken==0.7.0 tokenizers==0.19.1 tomli==2.0.1 @@ -144,4 +144,4 @@ zipp==3.19.2 # The following packages are considered to be unsafe in a requirements file: pip==24.1.2 -setuptools==70.2.0 +setuptools==70.3.0 diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/env/python/requirements.txt b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/env/python/requirements.txt similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/env/python/requirements.txt rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/env/python/requirements.txt diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/env/python/version.txt b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/env/python/version.txt similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/env/python/version.txt rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/env/python/version.txt diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/bento_constants.py b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/bento_constants.py similarity index 86% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/bento_constants.py rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/bento_constants.py index 6b6891f..c379bb9 100644 --- a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/bento_constants.py +++ b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/bento_constants.py @@ -6,8 +6,8 @@ model: casperhansen/gemma-7b-it-awq quantization: awq extra_labels: + model_name: casperhansen/gemma-7b-it-awq openllm_alias: 7b-4bit,7b-instruct-4bit - openllm_hf_model_id: casperhansen/gemma-7b-it-awq project: vllm-chat service_config: name: gemma diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/bentofile.yaml b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/bentofile.yaml similarity index 92% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/bentofile.yaml rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/bentofile.yaml index 1ba06a4..9fdf522 100644 --- a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/bentofile.yaml +++ b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/bentofile.yaml @@ -28,9 +28,8 @@ include: - chat_templates/chat_templates/*.jinja - chat_templates/generation_configs/*.json labels: + model_name: casperhansen/gemma-7b-it-awq openllm_alias: 7b-4bit,7b-instruct-4bit - openllm_hf_model_id: Qwen/Qwen2-7B-Instruct-AWQ - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/chat_templates/alpaca.jinja b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/chat_templates/alpaca.jinja similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/chat_templates/alpaca.jinja rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/chat_templates/alpaca.jinja diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/chat_templates/amberchat.jinja b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/chat_templates/amberchat.jinja similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/chat_templates/amberchat.jinja rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/chat_templates/amberchat.jinja diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/chat_templates/chatml.jinja b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/chat_templates/chatml.jinja similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/chat_templates/chatml.jinja rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/chat_templates/chatml.jinja diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/chat_templates/chatqa.jinja b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/chat_templates/chatqa.jinja similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/chat_templates/chatqa.jinja rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/chat_templates/chatqa.jinja diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/chat_templates/falcon-instruct.jinja b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/chat_templates/falcon-instruct.jinja similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/chat_templates/falcon-instruct.jinja rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/chat_templates/falcon-instruct.jinja diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/chat_templates/gemma-it.jinja b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/chat_templates/gemma-it.jinja similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/chat_templates/gemma-it.jinja rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/chat_templates/gemma-it.jinja diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/chat_templates/llama-2-chat.jinja b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/chat_templates/llama-2-chat.jinja similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/chat_templates/llama-2-chat.jinja rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/chat_templates/llama-2-chat.jinja diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/chat_templates/llama-3-chat.jinja b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/chat_templates/llama-3-chat.jinja similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/chat_templates/llama-3-chat.jinja rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/chat_templates/llama-3-chat.jinja diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/chat_templates/mistral-instruct.jinja b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/chat_templates/mistral-instruct.jinja similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/chat_templates/mistral-instruct.jinja rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/chat_templates/mistral-instruct.jinja diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/chat_templates/openchat.jinja b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/chat_templates/openchat.jinja similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/chat_templates/openchat.jinja rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/chat_templates/openchat.jinja diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/chat_templates/phi-3.jinja b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/chat_templates/phi-3.jinja similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/chat_templates/phi-3.jinja rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/chat_templates/phi-3.jinja diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/chat_templates/saiga.jinja b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/chat_templates/saiga.jinja similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/chat_templates/saiga.jinja rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/chat_templates/saiga.jinja diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/chat_templates/solar-instruct.jinja b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/chat_templates/solar-instruct.jinja similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/chat_templates/solar-instruct.jinja rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/chat_templates/solar-instruct.jinja diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/chat_templates/vicuna.jinja b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/chat_templates/vicuna.jinja similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/chat_templates/vicuna.jinja rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/chat_templates/vicuna.jinja diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/chat_templates/zephyr.jinja b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/chat_templates/zephyr.jinja similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/chat_templates/zephyr.jinja rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/chat_templates/zephyr.jinja diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/generation_configs/alpaca.json b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/generation_configs/alpaca.json similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/generation_configs/alpaca.json rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/generation_configs/alpaca.json diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/generation_configs/amberchat.json b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/generation_configs/amberchat.json similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/generation_configs/amberchat.json rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/generation_configs/amberchat.json diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/generation_configs/chatqa.json b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/generation_configs/chatqa.json similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/generation_configs/chatqa.json rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/generation_configs/chatqa.json diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/generation_configs/gemma-it.json b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/generation_configs/gemma-it.json similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/generation_configs/gemma-it.json rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/generation_configs/gemma-it.json diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/generation_configs/llama-2-chat.json b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/generation_configs/llama-2-chat.json similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/generation_configs/llama-2-chat.json rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/generation_configs/llama-2-chat.json diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/generation_configs/llama-3-chat.json b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/generation_configs/llama-3-chat.json similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/generation_configs/llama-3-chat.json rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/generation_configs/llama-3-chat.json diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/generation_configs/mistral-instruct.json b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/generation_configs/mistral-instruct.json similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/generation_configs/mistral-instruct.json rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/generation_configs/mistral-instruct.json diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/generation_configs/openchat.json b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/generation_configs/openchat.json similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/generation_configs/openchat.json rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/generation_configs/openchat.json diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/generation_configs/orca-2.json b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/generation_configs/orca-2.json similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/generation_configs/orca-2.json rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/generation_configs/orca-2.json diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/generation_configs/phi-3.json b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/generation_configs/phi-3.json similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/generation_configs/phi-3.json rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/generation_configs/phi-3.json diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/generation_configs/qwen2-chat.json b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/generation_configs/qwen2-chat.json similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/generation_configs/qwen2-chat.json rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/generation_configs/qwen2-chat.json diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/generation_configs/saiga.json b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/generation_configs/saiga.json similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/generation_configs/saiga.json rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/generation_configs/saiga.json diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/generation_configs/solar-instruct.json b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/generation_configs/solar-instruct.json similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/generation_configs/solar-instruct.json rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/generation_configs/solar-instruct.json diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/generation_configs/vicuna.json b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/generation_configs/vicuna.json similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/generation_configs/vicuna.json rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/generation_configs/vicuna.json diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/generation_configs/yi-chat.json b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/generation_configs/yi-chat.json similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/generation_configs/yi-chat.json rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/generation_configs/yi-chat.json diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/generation_configs/zephyr.json b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/generation_configs/zephyr.json similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/chat_templates/generation_configs/zephyr.json rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/chat_templates/generation_configs/zephyr.json diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/service.py b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/service.py similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/service.py rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/service.py diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/404.html b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/404.html similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/404.html rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/404.html diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/700-532b1fe2415e5859.js b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/700-532b1fe2415e5859.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/700-532b1fe2415e5859.js rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/700-532b1fe2415e5859.js diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/995-34374f39bb210839.js b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/995-34374f39bb210839.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/995-34374f39bb210839.js rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/995-34374f39bb210839.js diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/css/429544bd3cd8ce3a.css b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/css/429544bd3cd8ce3a.css similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/css/429544bd3cd8ce3a.css rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/css/429544bd3cd8ce3a.css diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/css/5b67f082b31cfc7b.css b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/css/5b67f082b31cfc7b.css similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/css/5b67f082b31cfc7b.css rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/css/5b67f082b31cfc7b.css diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/css/9e63023b20ddb15e.css b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/css/9e63023b20ddb15e.css similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/_next/static/css/9e63023b20ddb15e.css rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/_next/static/css/9e63023b20ddb15e.css diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/apple-touch-icon.png b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/apple-touch-icon.png similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/apple-touch-icon.png rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/apple-touch-icon.png diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/chat.html b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/chat.html similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/chat.html rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/chat.html diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/chat.txt b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/chat.txt similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/chat.txt rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/chat.txt diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/favicon-16x16.png b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/favicon-16x16.png similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/favicon-16x16.png rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/favicon-16x16.png diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/favicon.ico b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/favicon.ico similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/favicon.ico rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/favicon.ico diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/index.html b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/index.html similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/index.html rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/index.html diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/index.txt b/bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/index.txt similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/ui/index.txt rename to bentoml/bentos/gemma/7b-instruct-awq-4bit-d11b/src/ui/index.txt diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/README.md b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/README.md similarity index 97% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/README.md rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/README.md index 8b67b93..4fb0a30 100644 --- a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/README.md +++ b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/README.md @@ -1,4 +1,4 @@ -# gemma:7b-instruct-fp16-ae3e +# gemma:7b-instruct-fp16-3e1c [![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) [![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/apis/openapi.yaml b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/apis/openapi.yaml similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/apis/openapi.yaml rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/apis/openapi.yaml diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/apis/schema.json b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/apis/schema.json similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/apis/schema.json rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/apis/schema.json diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/bento.yaml b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/bento.yaml similarity index 95% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/bento.yaml rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/bento.yaml index d34ccd6..60b4c26 100644 --- a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/bento.yaml +++ b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/bento.yaml @@ -1,12 +1,11 @@ service: service:VLLM name: gemma -version: 7b-instruct-fp16-ae3e +version: 7b-instruct-fp16-3e1c bentoml_version: 1.2.19 -creation_time: '2024-07-08T07:58:22.853090+00:00' +creation_time: '2024-07-12T13:41:08.692955+00:00' labels: + model_name: google/gemma-7b-it openllm_alias: 7b,7b-instruct - openllm_hf_model_id: google/gemma-7b-it - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/env/docker/Dockerfile b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/env/docker/Dockerfile similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/env/docker/Dockerfile rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/env/docker/Dockerfile diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/env/docker/entrypoint.sh b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/env/docker/entrypoint.sh similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/env/docker/entrypoint.sh rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/env/docker/entrypoint.sh diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/env/python/install.sh b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/env/python/install.sh similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/env/python/install.sh rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/env/python/install.sh diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/env/python/requirements.lock.txt b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/env/python/requirements.lock.txt similarity index 96% rename from bentoml/bentos/gemma/2b-instruct-fp16-26b3/env/python/requirements.lock.txt rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/env/python/requirements.lock.txt index 925ce19..f6acdf5 100644 --- a/bentoml/bentos/gemma/2b-instruct-fp16-26b3/env/python/requirements.lock.txt +++ b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/env/python/requirements.lock.txt @@ -41,7 +41,7 @@ inflection==0.5.1 interegular==0.3.3 jinja2==3.1.4 joblib==1.4.2 -jsonschema==4.22.0 +jsonschema==4.23.0 jsonschema-specifications==2023.12.1 lark==1.1.9 llvmlite==0.43.0 @@ -70,7 +70,7 @@ nvidia-ml-py==11.525.150 nvidia-nccl-cu12==2.20.5 nvidia-nvjitlink-cu12==12.5.82 nvidia-nvtx-cu12==12.1.105 -openai==1.35.10 +openai==1.35.13 opentelemetry-api==1.20.0 opentelemetry-instrumentation==0.41b0 opentelemetry-instrumentation-aiohttp-client==0.41b0 @@ -100,12 +100,12 @@ python-json-logger==2.0.7 python-multipart==0.0.9 pyyaml==6.0.1 pyzmq==26.0.3 -ray==2.31.0 +ray==2.32.0 referencing==0.35.1 regex==2024.5.15 requests==2.32.3 rich==13.7.1 -rpds-py==0.18.1 +rpds-py==0.19.0 safetensors==0.4.3 schema==0.7.7 scipy==1.13.1 @@ -115,7 +115,7 @@ simple-di==0.1.5 six==1.16.0 sniffio==1.3.1 starlette==0.37.2 -sympy==1.12.1 +sympy==1.13.0 tiktoken==0.7.0 tokenizers==0.19.1 tomli==2.0.1 @@ -144,4 +144,4 @@ zipp==3.19.2 # The following packages are considered to be unsafe in a requirements file: pip==24.1.2 -setuptools==70.2.0 +setuptools==70.3.0 diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/env/python/requirements.txt b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/env/python/requirements.txt similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/env/python/requirements.txt rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/env/python/requirements.txt diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/env/python/version.txt b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/env/python/version.txt similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/env/python/version.txt rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/env/python/version.txt diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/bento_constants.py b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/bento_constants.py similarity index 87% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/bento_constants.py rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/bento_constants.py index 580d3d5..1806249 100644 --- a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/bento_constants.py +++ b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/bento_constants.py @@ -5,8 +5,8 @@ max_model_len: 2048 model: google/gemma-7b-it extra_labels: + model_name: google/gemma-7b-it openllm_alias: 7b,7b-instruct - openllm_hf_model_id: google/gemma-7b-it project: vllm-chat service_config: name: gemma diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/bentofile.yaml b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/bentofile.yaml similarity index 93% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/bentofile.yaml rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/bentofile.yaml index 68015cf..7aa404d 100644 --- a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/bentofile.yaml +++ b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/bentofile.yaml @@ -28,9 +28,8 @@ include: - chat_templates/chat_templates/*.jinja - chat_templates/generation_configs/*.json labels: + model_name: google/gemma-7b-it openllm_alias: 7b,7b-instruct - openllm_hf_model_id: google/gemma-7b-it - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/chat_templates/alpaca.jinja b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/chat_templates/alpaca.jinja similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/chat_templates/alpaca.jinja rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/chat_templates/alpaca.jinja diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/chat_templates/amberchat.jinja b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/chat_templates/amberchat.jinja similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/chat_templates/amberchat.jinja rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/chat_templates/amberchat.jinja diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/chat_templates/chatml.jinja b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/chat_templates/chatml.jinja similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/chat_templates/chatml.jinja rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/chat_templates/chatml.jinja diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/chat_templates/chatqa.jinja b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/chat_templates/chatqa.jinja similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/chat_templates/chatqa.jinja rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/chat_templates/chatqa.jinja diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/chat_templates/falcon-instruct.jinja b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/chat_templates/falcon-instruct.jinja similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/chat_templates/falcon-instruct.jinja rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/chat_templates/falcon-instruct.jinja diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/chat_templates/gemma-it.jinja b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/chat_templates/gemma-it.jinja similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/chat_templates/gemma-it.jinja rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/chat_templates/gemma-it.jinja diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/chat_templates/llama-2-chat.jinja b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/chat_templates/llama-2-chat.jinja similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/chat_templates/llama-2-chat.jinja rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/chat_templates/llama-2-chat.jinja diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/chat_templates/llama-3-chat.jinja b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/chat_templates/llama-3-chat.jinja similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/chat_templates/llama-3-chat.jinja rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/chat_templates/llama-3-chat.jinja diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/chat_templates/mistral-instruct.jinja b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/chat_templates/mistral-instruct.jinja similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/chat_templates/mistral-instruct.jinja rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/chat_templates/mistral-instruct.jinja diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/chat_templates/openchat.jinja b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/chat_templates/openchat.jinja similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/chat_templates/openchat.jinja rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/chat_templates/openchat.jinja diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/chat_templates/phi-3.jinja b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/chat_templates/phi-3.jinja similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/chat_templates/phi-3.jinja rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/chat_templates/phi-3.jinja diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/chat_templates/saiga.jinja b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/chat_templates/saiga.jinja similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/chat_templates/saiga.jinja rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/chat_templates/saiga.jinja diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/chat_templates/solar-instruct.jinja b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/chat_templates/solar-instruct.jinja similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/chat_templates/solar-instruct.jinja rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/chat_templates/solar-instruct.jinja diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/chat_templates/vicuna.jinja b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/chat_templates/vicuna.jinja similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/chat_templates/vicuna.jinja rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/chat_templates/vicuna.jinja diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/chat_templates/zephyr.jinja b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/chat_templates/zephyr.jinja similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/chat_templates/zephyr.jinja rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/chat_templates/zephyr.jinja diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/generation_configs/alpaca.json b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/generation_configs/alpaca.json similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/generation_configs/alpaca.json rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/generation_configs/alpaca.json diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/generation_configs/amberchat.json b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/generation_configs/amberchat.json similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/generation_configs/amberchat.json rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/generation_configs/amberchat.json diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/generation_configs/chatqa.json b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/generation_configs/chatqa.json similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/generation_configs/chatqa.json rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/generation_configs/chatqa.json diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/generation_configs/gemma-it.json b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/generation_configs/gemma-it.json similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/generation_configs/gemma-it.json rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/generation_configs/gemma-it.json diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/generation_configs/llama-2-chat.json b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/generation_configs/llama-2-chat.json similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/generation_configs/llama-2-chat.json rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/generation_configs/llama-2-chat.json diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/generation_configs/llama-3-chat.json b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/generation_configs/llama-3-chat.json similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/generation_configs/llama-3-chat.json rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/generation_configs/llama-3-chat.json diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/generation_configs/mistral-instruct.json b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/generation_configs/mistral-instruct.json similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/generation_configs/mistral-instruct.json rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/generation_configs/mistral-instruct.json diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/generation_configs/openchat.json b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/generation_configs/openchat.json similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/generation_configs/openchat.json rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/generation_configs/openchat.json diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/generation_configs/orca-2.json b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/generation_configs/orca-2.json similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/generation_configs/orca-2.json rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/generation_configs/orca-2.json diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/generation_configs/phi-3.json b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/generation_configs/phi-3.json similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/generation_configs/phi-3.json rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/generation_configs/phi-3.json diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/generation_configs/qwen2-chat.json b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/generation_configs/qwen2-chat.json similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/generation_configs/qwen2-chat.json rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/generation_configs/qwen2-chat.json diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/generation_configs/saiga.json b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/generation_configs/saiga.json similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/generation_configs/saiga.json rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/generation_configs/saiga.json diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/generation_configs/solar-instruct.json b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/generation_configs/solar-instruct.json similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/generation_configs/solar-instruct.json rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/generation_configs/solar-instruct.json diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/generation_configs/vicuna.json b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/generation_configs/vicuna.json similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/generation_configs/vicuna.json rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/generation_configs/vicuna.json diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/generation_configs/yi-chat.json b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/generation_configs/yi-chat.json similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/generation_configs/yi-chat.json rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/generation_configs/yi-chat.json diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/generation_configs/zephyr.json b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/generation_configs/zephyr.json similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/chat_templates/generation_configs/zephyr.json rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/chat_templates/generation_configs/zephyr.json diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/service.py b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/service.py similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/service.py rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/service.py diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/404.html b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/404.html similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/404.html rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/404.html diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/700-532b1fe2415e5859.js b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/700-532b1fe2415e5859.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/700-532b1fe2415e5859.js rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/700-532b1fe2415e5859.js diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/995-34374f39bb210839.js b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/995-34374f39bb210839.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/995-34374f39bb210839.js rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/995-34374f39bb210839.js diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/css/429544bd3cd8ce3a.css b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/css/429544bd3cd8ce3a.css similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/css/429544bd3cd8ce3a.css rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/css/429544bd3cd8ce3a.css diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/css/5b67f082b31cfc7b.css b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/css/5b67f082b31cfc7b.css similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/css/5b67f082b31cfc7b.css rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/css/5b67f082b31cfc7b.css diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/css/9e63023b20ddb15e.css b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/css/9e63023b20ddb15e.css similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/_next/static/css/9e63023b20ddb15e.css rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/_next/static/css/9e63023b20ddb15e.css diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/apple-touch-icon.png b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/apple-touch-icon.png similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/apple-touch-icon.png rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/apple-touch-icon.png diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/chat.html b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/chat.html similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/chat.html rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/chat.html diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/chat.txt b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/chat.txt similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/chat.txt rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/chat.txt diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/favicon-16x16.png b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/favicon-16x16.png similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/favicon-16x16.png rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/favicon-16x16.png diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/favicon.ico b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/favicon.ico similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/favicon.ico rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/favicon.ico diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/index.html b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/index.html similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/index.html rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/index.html diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/index.txt b/bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/index.txt similarity index 100% rename from bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/ui/index.txt rename to bentoml/bentos/gemma/7b-instruct-fp16-3e1c/src/ui/index.txt diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/README.md b/bentoml/bentos/llama2/13b-chat-fp16-921b/README.md similarity index 97% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/README.md rename to bentoml/bentos/llama2/13b-chat-fp16-921b/README.md index 6e491b0..d5a7312 100644 --- a/bentoml/bentos/llama2/70b-chat-fp16-b0de/README.md +++ b/bentoml/bentos/llama2/13b-chat-fp16-921b/README.md @@ -1,4 +1,4 @@ -# llama2:70b-chat-fp16-b0de +# llama2:13b-chat-fp16-921b [![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) [![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/apis/openapi.yaml b/bentoml/bentos/llama2/13b-chat-fp16-921b/apis/openapi.yaml similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/apis/openapi.yaml rename to bentoml/bentos/llama2/13b-chat-fp16-921b/apis/openapi.yaml diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/apis/schema.json b/bentoml/bentos/llama2/13b-chat-fp16-921b/apis/schema.json similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/apis/schema.json rename to bentoml/bentos/llama2/13b-chat-fp16-921b/apis/schema.json diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/bento.yaml b/bentoml/bentos/llama2/13b-chat-fp16-921b/bento.yaml similarity index 95% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/bento.yaml rename to bentoml/bentos/llama2/13b-chat-fp16-921b/bento.yaml index b7ac776..ab2001d 100644 --- a/bentoml/bentos/llama2/13b-chat-fp16-4059/bento.yaml +++ b/bentoml/bentos/llama2/13b-chat-fp16-921b/bento.yaml @@ -1,12 +1,11 @@ service: service:VLLM name: llama2 -version: 13b-chat-fp16-4059 +version: 13b-chat-fp16-921b bentoml_version: 1.2.19 -creation_time: '2024-07-08T07:49:27.527664+00:00' +creation_time: '2024-07-12T13:30:51.101256+00:00' labels: + model_name: meta-llama/Llama-2-13b-chat-hf openllm_alias: 13b,13b-chat - openllm_hf_model_id: meta-llama/Llama-2-13b-chat-hf - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/env/docker/Dockerfile b/bentoml/bentos/llama2/13b-chat-fp16-921b/env/docker/Dockerfile similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/env/docker/Dockerfile rename to bentoml/bentos/llama2/13b-chat-fp16-921b/env/docker/Dockerfile diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/env/docker/entrypoint.sh b/bentoml/bentos/llama2/13b-chat-fp16-921b/env/docker/entrypoint.sh similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/env/docker/entrypoint.sh rename to bentoml/bentos/llama2/13b-chat-fp16-921b/env/docker/entrypoint.sh diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/env/python/install.sh b/bentoml/bentos/llama2/13b-chat-fp16-921b/env/python/install.sh similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/env/python/install.sh rename to bentoml/bentos/llama2/13b-chat-fp16-921b/env/python/install.sh diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/env/python/requirements.lock.txt b/bentoml/bentos/llama2/13b-chat-fp16-921b/env/python/requirements.lock.txt similarity index 96% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/env/python/requirements.lock.txt rename to bentoml/bentos/llama2/13b-chat-fp16-921b/env/python/requirements.lock.txt index 925ce19..f6acdf5 100644 --- a/bentoml/bentos/llama2/13b-chat-fp16-4059/env/python/requirements.lock.txt +++ b/bentoml/bentos/llama2/13b-chat-fp16-921b/env/python/requirements.lock.txt @@ -41,7 +41,7 @@ inflection==0.5.1 interegular==0.3.3 jinja2==3.1.4 joblib==1.4.2 -jsonschema==4.22.0 +jsonschema==4.23.0 jsonschema-specifications==2023.12.1 lark==1.1.9 llvmlite==0.43.0 @@ -70,7 +70,7 @@ nvidia-ml-py==11.525.150 nvidia-nccl-cu12==2.20.5 nvidia-nvjitlink-cu12==12.5.82 nvidia-nvtx-cu12==12.1.105 -openai==1.35.10 +openai==1.35.13 opentelemetry-api==1.20.0 opentelemetry-instrumentation==0.41b0 opentelemetry-instrumentation-aiohttp-client==0.41b0 @@ -100,12 +100,12 @@ python-json-logger==2.0.7 python-multipart==0.0.9 pyyaml==6.0.1 pyzmq==26.0.3 -ray==2.31.0 +ray==2.32.0 referencing==0.35.1 regex==2024.5.15 requests==2.32.3 rich==13.7.1 -rpds-py==0.18.1 +rpds-py==0.19.0 safetensors==0.4.3 schema==0.7.7 scipy==1.13.1 @@ -115,7 +115,7 @@ simple-di==0.1.5 six==1.16.0 sniffio==1.3.1 starlette==0.37.2 -sympy==1.12.1 +sympy==1.13.0 tiktoken==0.7.0 tokenizers==0.19.1 tomli==2.0.1 @@ -144,4 +144,4 @@ zipp==3.19.2 # The following packages are considered to be unsafe in a requirements file: pip==24.1.2 -setuptools==70.2.0 +setuptools==70.3.0 diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/env/python/requirements.txt b/bentoml/bentos/llama2/13b-chat-fp16-921b/env/python/requirements.txt similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/env/python/requirements.txt rename to bentoml/bentos/llama2/13b-chat-fp16-921b/env/python/requirements.txt diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/env/python/version.txt b/bentoml/bentos/llama2/13b-chat-fp16-921b/env/python/version.txt similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/env/python/version.txt rename to bentoml/bentos/llama2/13b-chat-fp16-921b/env/python/version.txt diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/bento_constants.py b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/bento_constants.py similarity index 85% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/bento_constants.py rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/bento_constants.py index 309abd4..64bce5f 100644 --- a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/bento_constants.py +++ b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/bento_constants.py @@ -6,8 +6,8 @@ max_model_len: 1024 model: meta-llama/Llama-2-13b-chat-hf extra_labels: + model_name: meta-llama/Llama-2-13b-chat-hf openllm_alias: 13b,13b-chat - openllm_hf_model_id: meta-llama/Llama-2-13b-chat-hf project: vllm-chat service_config: name: llama2 diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/bentofile.yaml b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/bentofile.yaml similarity index 92% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/bentofile.yaml rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/bentofile.yaml index 6ca0ed1..b9b4bd3 100644 --- a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/bentofile.yaml +++ b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/bentofile.yaml @@ -28,9 +28,8 @@ include: - chat_templates/chat_templates/*.jinja - chat_templates/generation_configs/*.json labels: + model_name: meta-llama/Llama-2-13b-chat-hf openllm_alias: 13b,13b-chat - openllm_hf_model_id: meta-llama/Llama-2-13b-chat-hf - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/chat_templates/alpaca.jinja b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/chat_templates/alpaca.jinja similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/chat_templates/alpaca.jinja rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/chat_templates/alpaca.jinja diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/chat_templates/amberchat.jinja b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/chat_templates/amberchat.jinja similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/chat_templates/amberchat.jinja rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/chat_templates/amberchat.jinja diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/chat_templates/chatml.jinja b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/chat_templates/chatml.jinja similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/chat_templates/chatml.jinja rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/chat_templates/chatml.jinja diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/chat_templates/chatqa.jinja b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/chat_templates/chatqa.jinja similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/chat_templates/chatqa.jinja rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/chat_templates/chatqa.jinja diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/chat_templates/falcon-instruct.jinja b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/chat_templates/falcon-instruct.jinja similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/chat_templates/falcon-instruct.jinja rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/chat_templates/falcon-instruct.jinja diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/chat_templates/gemma-it.jinja b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/chat_templates/gemma-it.jinja similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/chat_templates/gemma-it.jinja rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/chat_templates/gemma-it.jinja diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/chat_templates/llama-2-chat.jinja b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/chat_templates/llama-2-chat.jinja similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/chat_templates/llama-2-chat.jinja rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/chat_templates/llama-2-chat.jinja diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/chat_templates/llama-3-chat.jinja b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/chat_templates/llama-3-chat.jinja similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/chat_templates/llama-3-chat.jinja rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/chat_templates/llama-3-chat.jinja diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/chat_templates/mistral-instruct.jinja b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/chat_templates/mistral-instruct.jinja similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/chat_templates/mistral-instruct.jinja rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/chat_templates/mistral-instruct.jinja diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/chat_templates/openchat.jinja b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/chat_templates/openchat.jinja similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/chat_templates/openchat.jinja rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/chat_templates/openchat.jinja diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/chat_templates/phi-3.jinja b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/chat_templates/phi-3.jinja similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/chat_templates/phi-3.jinja rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/chat_templates/phi-3.jinja diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/chat_templates/saiga.jinja b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/chat_templates/saiga.jinja similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/chat_templates/saiga.jinja rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/chat_templates/saiga.jinja diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/chat_templates/solar-instruct.jinja b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/chat_templates/solar-instruct.jinja similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/chat_templates/solar-instruct.jinja rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/chat_templates/solar-instruct.jinja diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/chat_templates/vicuna.jinja b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/chat_templates/vicuna.jinja similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/chat_templates/vicuna.jinja rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/chat_templates/vicuna.jinja diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/chat_templates/zephyr.jinja b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/chat_templates/zephyr.jinja similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/chat_templates/zephyr.jinja rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/chat_templates/zephyr.jinja diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/generation_configs/alpaca.json b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/generation_configs/alpaca.json similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/generation_configs/alpaca.json rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/generation_configs/alpaca.json diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/generation_configs/amberchat.json b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/generation_configs/amberchat.json similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/generation_configs/amberchat.json rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/generation_configs/amberchat.json diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/generation_configs/chatqa.json b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/generation_configs/chatqa.json similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/generation_configs/chatqa.json rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/generation_configs/chatqa.json diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/generation_configs/gemma-it.json b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/generation_configs/gemma-it.json similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/generation_configs/gemma-it.json rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/generation_configs/gemma-it.json diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/generation_configs/llama-2-chat.json b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/generation_configs/llama-2-chat.json similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/generation_configs/llama-2-chat.json rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/generation_configs/llama-2-chat.json diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/generation_configs/llama-3-chat.json b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/generation_configs/llama-3-chat.json similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/generation_configs/llama-3-chat.json rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/generation_configs/llama-3-chat.json diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/generation_configs/mistral-instruct.json b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/generation_configs/mistral-instruct.json similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/generation_configs/mistral-instruct.json rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/generation_configs/mistral-instruct.json diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/generation_configs/openchat.json b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/generation_configs/openchat.json similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/generation_configs/openchat.json rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/generation_configs/openchat.json diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/generation_configs/orca-2.json b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/generation_configs/orca-2.json similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/generation_configs/orca-2.json rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/generation_configs/orca-2.json diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/generation_configs/phi-3.json b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/generation_configs/phi-3.json similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/generation_configs/phi-3.json rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/generation_configs/phi-3.json diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/generation_configs/qwen2-chat.json b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/generation_configs/qwen2-chat.json similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/generation_configs/qwen2-chat.json rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/generation_configs/qwen2-chat.json diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/generation_configs/saiga.json b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/generation_configs/saiga.json similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/generation_configs/saiga.json rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/generation_configs/saiga.json diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/generation_configs/solar-instruct.json b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/generation_configs/solar-instruct.json similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/generation_configs/solar-instruct.json rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/generation_configs/solar-instruct.json diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/generation_configs/vicuna.json b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/generation_configs/vicuna.json similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/generation_configs/vicuna.json rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/generation_configs/vicuna.json diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/generation_configs/yi-chat.json b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/generation_configs/yi-chat.json similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/generation_configs/yi-chat.json rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/generation_configs/yi-chat.json diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/generation_configs/zephyr.json b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/generation_configs/zephyr.json similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/chat_templates/generation_configs/zephyr.json rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/chat_templates/generation_configs/zephyr.json diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/service.py b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/service.py similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/service.py rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/service.py diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/404.html b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/404.html similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/404.html rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/404.html diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/700-532b1fe2415e5859.js b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/700-532b1fe2415e5859.js similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/700-532b1fe2415e5859.js rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/700-532b1fe2415e5859.js diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/995-34374f39bb210839.js b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/995-34374f39bb210839.js similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/995-34374f39bb210839.js rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/995-34374f39bb210839.js diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/css/429544bd3cd8ce3a.css b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/css/429544bd3cd8ce3a.css similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/css/429544bd3cd8ce3a.css rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/css/429544bd3cd8ce3a.css diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/css/5b67f082b31cfc7b.css b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/css/5b67f082b31cfc7b.css similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/css/5b67f082b31cfc7b.css rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/css/5b67f082b31cfc7b.css diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/css/9e63023b20ddb15e.css b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/css/9e63023b20ddb15e.css similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/_next/static/css/9e63023b20ddb15e.css rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/_next/static/css/9e63023b20ddb15e.css diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/apple-touch-icon.png b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/apple-touch-icon.png similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/apple-touch-icon.png rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/apple-touch-icon.png diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/chat.html b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/chat.html similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/chat.html rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/chat.html diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/chat.txt b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/chat.txt similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/chat.txt rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/chat.txt diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/favicon-16x16.png b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/favicon-16x16.png similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/favicon-16x16.png rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/favicon-16x16.png diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/favicon.ico b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/favicon.ico similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/favicon.ico rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/favicon.ico diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/index.html b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/index.html similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/index.html rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/index.html diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/index.txt b/bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/index.txt similarity index 100% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/src/ui/index.txt rename to bentoml/bentos/llama2/13b-chat-fp16-921b/src/ui/index.txt diff --git a/bentoml/bentos/llama2/13b-chat-fp16-4059/README.md b/bentoml/bentos/llama2/70b-chat-fp16-258c/README.md similarity index 97% rename from bentoml/bentos/llama2/13b-chat-fp16-4059/README.md rename to bentoml/bentos/llama2/70b-chat-fp16-258c/README.md index 13f594c..8954351 100644 --- a/bentoml/bentos/llama2/13b-chat-fp16-4059/README.md +++ b/bentoml/bentos/llama2/70b-chat-fp16-258c/README.md @@ -1,4 +1,4 @@ -# llama2:13b-chat-fp16-4059 +# llama2:70b-chat-fp16-258c [![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) [![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/apis/openapi.yaml b/bentoml/bentos/llama2/70b-chat-fp16-258c/apis/openapi.yaml similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/apis/openapi.yaml rename to bentoml/bentos/llama2/70b-chat-fp16-258c/apis/openapi.yaml diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/apis/schema.json b/bentoml/bentos/llama2/70b-chat-fp16-258c/apis/schema.json similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/apis/schema.json rename to bentoml/bentos/llama2/70b-chat-fp16-258c/apis/schema.json diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/bento.yaml b/bentoml/bentos/llama2/70b-chat-fp16-258c/bento.yaml similarity index 95% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/bento.yaml rename to bentoml/bentos/llama2/70b-chat-fp16-258c/bento.yaml index 8bcf39e..cac20d1 100644 --- a/bentoml/bentos/llama2/70b-chat-fp16-b0de/bento.yaml +++ b/bentoml/bentos/llama2/70b-chat-fp16-258c/bento.yaml @@ -1,12 +1,11 @@ service: service:VLLM name: llama2 -version: 70b-chat-fp16-b0de +version: 70b-chat-fp16-258c bentoml_version: 1.2.19 -creation_time: '2024-07-08T07:50:16.964511+00:00' +creation_time: '2024-07-12T13:31:51.241453+00:00' labels: + model_name: meta-llama/Llama-2-70b-chat-hf openllm_alias: 70b,70b-chat - openllm_hf_model_id: meta-llama/Llama-2-70b-chat-hf - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/env/docker/Dockerfile b/bentoml/bentos/llama2/70b-chat-fp16-258c/env/docker/Dockerfile similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/env/docker/Dockerfile rename to bentoml/bentos/llama2/70b-chat-fp16-258c/env/docker/Dockerfile diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/env/docker/entrypoint.sh b/bentoml/bentos/llama2/70b-chat-fp16-258c/env/docker/entrypoint.sh similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/env/docker/entrypoint.sh rename to bentoml/bentos/llama2/70b-chat-fp16-258c/env/docker/entrypoint.sh diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/env/python/install.sh b/bentoml/bentos/llama2/70b-chat-fp16-258c/env/python/install.sh similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/env/python/install.sh rename to bentoml/bentos/llama2/70b-chat-fp16-258c/env/python/install.sh diff --git a/bentoml/bentos/llama2/70b-chat-fp16-258c/env/python/requirements.lock.txt b/bentoml/bentos/llama2/70b-chat-fp16-258c/env/python/requirements.lock.txt new file mode 100644 index 0000000..f6acdf5 --- /dev/null +++ b/bentoml/bentos/llama2/70b-chat-fp16-258c/env/python/requirements.lock.txt @@ -0,0 +1,147 @@ +aiohttp==3.9.5 +aiosignal==1.3.1 +annotated-types==0.7.0 +anyio==4.4.0 +appdirs==1.4.4 +asgiref==3.8.1 +async-timeout==4.0.3 +attrs==23.2.0 +bentoml==1.2.19 +build==1.2.1 +cattrs==23.1.2 +certifi==2024.7.4 +charset-normalizer==3.3.2 +circus==0.18.0 +click==8.1.7 +click-option-group==0.5.6 +cloudpickle==3.0.0 +cmake==3.30.0 +deepmerge==1.1.1 +deprecated==1.2.14 +diskcache==5.6.3 +distro==1.9.0 +dnspython==2.6.1 +email-validator==2.2.0 +exceptiongroup==1.2.1 +fastapi==0.111.0 +fastapi-cli==0.0.4 +filelock==3.15.4 +frozenlist==1.4.1 +fs==2.4.16 +fsspec==2024.6.1 +h11==0.14.0 +httpcore==1.0.5 +httptools==0.6.1 +httpx==0.27.0 +httpx-ws==0.6.0 +huggingface-hub==0.23.4 +idna==3.7 +importlib-metadata==6.11.0 +inflection==0.5.1 +interegular==0.3.3 +jinja2==3.1.4 +joblib==1.4.2 +jsonschema==4.23.0 +jsonschema-specifications==2023.12.1 +lark==1.1.9 +llvmlite==0.43.0 +lm-format-enforcer==0.10.1 +markdown-it-py==3.0.0 +markupsafe==2.1.5 +mdurl==0.1.2 +mpmath==1.3.0 +msgpack==1.0.8 +multidict==6.0.5 +nest-asyncio==1.6.0 +networkx==3.2.1 +ninja==1.11.1.1 +numba==0.60.0 +numpy==1.26.0 +nvidia-cublas-cu12==12.1.3.1 +nvidia-cuda-cupti-cu12==12.1.105 +nvidia-cuda-nvrtc-cu12==12.1.105 +nvidia-cuda-runtime-cu12==12.1.105 +nvidia-cudnn-cu12==8.9.2.26 +nvidia-cufft-cu12==11.0.2.54 +nvidia-curand-cu12==10.3.2.106 +nvidia-cusolver-cu12==11.4.5.107 +nvidia-cusparse-cu12==12.1.0.106 +nvidia-ml-py==11.525.150 +nvidia-nccl-cu12==2.20.5 +nvidia-nvjitlink-cu12==12.5.82 +nvidia-nvtx-cu12==12.1.105 +openai==1.35.13 +opentelemetry-api==1.20.0 +opentelemetry-instrumentation==0.41b0 +opentelemetry-instrumentation-aiohttp-client==0.41b0 +opentelemetry-instrumentation-asgi==0.41b0 +opentelemetry-sdk==1.20.0 +opentelemetry-semantic-conventions==0.41b0 +opentelemetry-util-http==0.41b0 +orjson==3.10.6 +outlines==0.0.34 +packaging==24.1 +pathspec==0.12.1 +pip-requirements-parser==32.0.1 +pip-tools==7.4.1 +prometheus-client==0.20.0 +prometheus-fastapi-instrumentator==7.0.0 +protobuf==5.27.2 +psutil==6.0.0 +py-cpuinfo==9.0.0 +pydantic==2.8.2 +pydantic-core==2.20.1 +pygments==2.18.0 +pyparsing==3.1.2 +pyproject-hooks==1.1.0 +python-dateutil==2.9.0.post0 +python-dotenv==1.0.1 +python-json-logger==2.0.7 +python-multipart==0.0.9 +pyyaml==6.0.1 +pyzmq==26.0.3 +ray==2.32.0 +referencing==0.35.1 +regex==2024.5.15 +requests==2.32.3 +rich==13.7.1 +rpds-py==0.19.0 +safetensors==0.4.3 +schema==0.7.7 +scipy==1.13.1 +sentencepiece==0.2.0 +shellingham==1.5.4 +simple-di==0.1.5 +six==1.16.0 +sniffio==1.3.1 +starlette==0.37.2 +sympy==1.13.0 +tiktoken==0.7.0 +tokenizers==0.19.1 +tomli==2.0.1 +tomli-w==1.0.0 +torch==2.3.0 +tornado==6.4.1 +tqdm==4.66.4 +transformers==4.41.0 +triton==2.3.0 +typer==0.12.3 +typing-extensions==4.12.2 +ujson==5.10.0 +urllib3==2.2.2 +uvicorn[standard]==0.30.1 +uvloop==0.19.0 +vllm==0.4.3 +vllm-flash-attn==2.5.8.post2 +watchfiles==0.22.0 +websockets==12.0 +wheel==0.43.0 +wrapt==1.16.0 +wsproto==1.2.0 +xformers==0.0.26.post1 +yarl==1.9.4 +zipp==3.19.2 + +# The following packages are considered to be unsafe in a requirements file: +pip==24.1.2 +setuptools==70.3.0 diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/env/python/requirements.txt b/bentoml/bentos/llama2/70b-chat-fp16-258c/env/python/requirements.txt similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/env/python/requirements.txt rename to bentoml/bentos/llama2/70b-chat-fp16-258c/env/python/requirements.txt diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/env/python/version.txt b/bentoml/bentos/llama2/70b-chat-fp16-258c/env/python/version.txt similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/env/python/version.txt rename to bentoml/bentos/llama2/70b-chat-fp16-258c/env/python/version.txt diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/bento_constants.py b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/bento_constants.py similarity index 85% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/bento_constants.py rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/bento_constants.py index ac7af97..4ce5168 100644 --- a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/bento_constants.py +++ b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/bento_constants.py @@ -6,8 +6,8 @@ max_model_len: 1024 model: meta-llama/Llama-2-70b-chat-hf extra_labels: + model_name: meta-llama/Llama-2-70b-chat-hf openllm_alias: 70b,70b-chat - openllm_hf_model_id: meta-llama/Llama-2-70b-chat-hf project: vllm-chat service_config: name: llama2 diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/bentofile.yaml b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/bentofile.yaml similarity index 92% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/bentofile.yaml rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/bentofile.yaml index c5a4796..4f30d0f 100644 --- a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/bentofile.yaml +++ b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/bentofile.yaml @@ -28,9 +28,8 @@ include: - chat_templates/chat_templates/*.jinja - chat_templates/generation_configs/*.json labels: + model_name: meta-llama/Llama-2-70b-chat-hf openllm_alias: 70b,70b-chat - openllm_hf_model_id: meta-llama/Llama-2-70b-chat-hf - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/chat_templates/alpaca.jinja b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/chat_templates/alpaca.jinja similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/chat_templates/alpaca.jinja rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/chat_templates/alpaca.jinja diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/chat_templates/amberchat.jinja b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/chat_templates/amberchat.jinja similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/chat_templates/amberchat.jinja rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/chat_templates/amberchat.jinja diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/chat_templates/chatml.jinja b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/chat_templates/chatml.jinja similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/chat_templates/chatml.jinja rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/chat_templates/chatml.jinja diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/chat_templates/chatqa.jinja b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/chat_templates/chatqa.jinja similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/chat_templates/chatqa.jinja rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/chat_templates/chatqa.jinja diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/chat_templates/falcon-instruct.jinja b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/chat_templates/falcon-instruct.jinja similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/chat_templates/falcon-instruct.jinja rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/chat_templates/falcon-instruct.jinja diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/chat_templates/gemma-it.jinja b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/chat_templates/gemma-it.jinja similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/chat_templates/gemma-it.jinja rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/chat_templates/gemma-it.jinja diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/chat_templates/llama-2-chat.jinja b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/chat_templates/llama-2-chat.jinja similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/chat_templates/llama-2-chat.jinja rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/chat_templates/llama-2-chat.jinja diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/chat_templates/llama-3-chat.jinja b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/chat_templates/llama-3-chat.jinja similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/chat_templates/llama-3-chat.jinja rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/chat_templates/llama-3-chat.jinja diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/chat_templates/mistral-instruct.jinja b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/chat_templates/mistral-instruct.jinja similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/chat_templates/mistral-instruct.jinja rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/chat_templates/mistral-instruct.jinja diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/chat_templates/openchat.jinja b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/chat_templates/openchat.jinja similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/chat_templates/openchat.jinja rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/chat_templates/openchat.jinja diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/chat_templates/phi-3.jinja b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/chat_templates/phi-3.jinja similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/chat_templates/phi-3.jinja rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/chat_templates/phi-3.jinja diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/chat_templates/saiga.jinja b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/chat_templates/saiga.jinja similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/chat_templates/saiga.jinja rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/chat_templates/saiga.jinja diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/chat_templates/solar-instruct.jinja b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/chat_templates/solar-instruct.jinja similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/chat_templates/solar-instruct.jinja rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/chat_templates/solar-instruct.jinja diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/chat_templates/vicuna.jinja b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/chat_templates/vicuna.jinja similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/chat_templates/vicuna.jinja rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/chat_templates/vicuna.jinja diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/chat_templates/zephyr.jinja b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/chat_templates/zephyr.jinja similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/chat_templates/zephyr.jinja rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/chat_templates/zephyr.jinja diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/generation_configs/alpaca.json b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/generation_configs/alpaca.json similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/generation_configs/alpaca.json rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/generation_configs/alpaca.json diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/generation_configs/amberchat.json b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/generation_configs/amberchat.json similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/generation_configs/amberchat.json rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/generation_configs/amberchat.json diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/generation_configs/chatqa.json b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/generation_configs/chatqa.json similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/generation_configs/chatqa.json rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/generation_configs/chatqa.json diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/generation_configs/gemma-it.json b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/generation_configs/gemma-it.json similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/generation_configs/gemma-it.json rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/generation_configs/gemma-it.json diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/generation_configs/llama-2-chat.json b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/generation_configs/llama-2-chat.json similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/generation_configs/llama-2-chat.json rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/generation_configs/llama-2-chat.json diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/generation_configs/llama-3-chat.json b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/generation_configs/llama-3-chat.json similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/generation_configs/llama-3-chat.json rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/generation_configs/llama-3-chat.json diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/generation_configs/mistral-instruct.json b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/generation_configs/mistral-instruct.json similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/generation_configs/mistral-instruct.json rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/generation_configs/mistral-instruct.json diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/generation_configs/openchat.json b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/generation_configs/openchat.json similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/generation_configs/openchat.json rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/generation_configs/openchat.json diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/generation_configs/orca-2.json b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/generation_configs/orca-2.json similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/generation_configs/orca-2.json rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/generation_configs/orca-2.json diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/generation_configs/phi-3.json b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/generation_configs/phi-3.json similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/generation_configs/phi-3.json rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/generation_configs/phi-3.json diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/generation_configs/qwen2-chat.json b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/generation_configs/qwen2-chat.json similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/generation_configs/qwen2-chat.json rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/generation_configs/qwen2-chat.json diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/generation_configs/saiga.json b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/generation_configs/saiga.json similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/generation_configs/saiga.json rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/generation_configs/saiga.json diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/generation_configs/solar-instruct.json b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/generation_configs/solar-instruct.json similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/generation_configs/solar-instruct.json rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/generation_configs/solar-instruct.json diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/generation_configs/vicuna.json b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/generation_configs/vicuna.json similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/generation_configs/vicuna.json rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/generation_configs/vicuna.json diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/generation_configs/yi-chat.json b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/generation_configs/yi-chat.json similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/generation_configs/yi-chat.json rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/generation_configs/yi-chat.json diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/generation_configs/zephyr.json b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/generation_configs/zephyr.json similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/chat_templates/generation_configs/zephyr.json rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/chat_templates/generation_configs/zephyr.json diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/service.py b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/service.py similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/service.py rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/service.py diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/404.html b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/404.html similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/404.html rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/404.html diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/700-532b1fe2415e5859.js b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/700-532b1fe2415e5859.js similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/700-532b1fe2415e5859.js rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/700-532b1fe2415e5859.js diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/995-34374f39bb210839.js b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/995-34374f39bb210839.js similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/995-34374f39bb210839.js rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/995-34374f39bb210839.js diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/css/429544bd3cd8ce3a.css b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/css/429544bd3cd8ce3a.css similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/css/429544bd3cd8ce3a.css rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/css/429544bd3cd8ce3a.css diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/css/5b67f082b31cfc7b.css b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/css/5b67f082b31cfc7b.css similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/css/5b67f082b31cfc7b.css rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/css/5b67f082b31cfc7b.css diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/css/9e63023b20ddb15e.css b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/css/9e63023b20ddb15e.css similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/_next/static/css/9e63023b20ddb15e.css rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/_next/static/css/9e63023b20ddb15e.css diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/apple-touch-icon.png b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/apple-touch-icon.png similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/apple-touch-icon.png rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/apple-touch-icon.png diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/chat.html b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/chat.html similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/chat.html rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/chat.html diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/chat.txt b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/chat.txt similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/chat.txt rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/chat.txt diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/favicon-16x16.png b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/favicon-16x16.png similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/favicon-16x16.png rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/favicon-16x16.png diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/favicon.ico b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/favicon.ico similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/favicon.ico rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/favicon.ico diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/index.html b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/index.html similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/index.html rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/index.html diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/index.txt b/bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/index.txt similarity index 100% rename from bentoml/bentos/llama2/70b-chat-fp16-b0de/src/ui/index.txt rename to bentoml/bentos/llama2/70b-chat-fp16-258c/src/ui/index.txt diff --git a/bentoml/bentos/llama2/70b-chat-fp16-b0de/env/python/requirements.lock.txt b/bentoml/bentos/llama2/70b-chat-fp16-b0de/env/python/requirements.lock.txt deleted file mode 100644 index 925ce19..0000000 --- a/bentoml/bentos/llama2/70b-chat-fp16-b0de/env/python/requirements.lock.txt +++ /dev/null @@ -1,147 +0,0 @@ -aiohttp==3.9.5 -aiosignal==1.3.1 -annotated-types==0.7.0 -anyio==4.4.0 -appdirs==1.4.4 -asgiref==3.8.1 -async-timeout==4.0.3 -attrs==23.2.0 -bentoml==1.2.19 -build==1.2.1 -cattrs==23.1.2 -certifi==2024.7.4 -charset-normalizer==3.3.2 -circus==0.18.0 -click==8.1.7 -click-option-group==0.5.6 -cloudpickle==3.0.0 -cmake==3.30.0 -deepmerge==1.1.1 -deprecated==1.2.14 -diskcache==5.6.3 -distro==1.9.0 -dnspython==2.6.1 -email-validator==2.2.0 -exceptiongroup==1.2.1 -fastapi==0.111.0 -fastapi-cli==0.0.4 -filelock==3.15.4 -frozenlist==1.4.1 -fs==2.4.16 -fsspec==2024.6.1 -h11==0.14.0 -httpcore==1.0.5 -httptools==0.6.1 -httpx==0.27.0 -httpx-ws==0.6.0 -huggingface-hub==0.23.4 -idna==3.7 -importlib-metadata==6.11.0 -inflection==0.5.1 -interegular==0.3.3 -jinja2==3.1.4 -joblib==1.4.2 -jsonschema==4.22.0 -jsonschema-specifications==2023.12.1 -lark==1.1.9 -llvmlite==0.43.0 -lm-format-enforcer==0.10.1 -markdown-it-py==3.0.0 -markupsafe==2.1.5 -mdurl==0.1.2 -mpmath==1.3.0 -msgpack==1.0.8 -multidict==6.0.5 -nest-asyncio==1.6.0 -networkx==3.2.1 -ninja==1.11.1.1 -numba==0.60.0 -numpy==1.26.0 -nvidia-cublas-cu12==12.1.3.1 -nvidia-cuda-cupti-cu12==12.1.105 -nvidia-cuda-nvrtc-cu12==12.1.105 -nvidia-cuda-runtime-cu12==12.1.105 -nvidia-cudnn-cu12==8.9.2.26 -nvidia-cufft-cu12==11.0.2.54 -nvidia-curand-cu12==10.3.2.106 -nvidia-cusolver-cu12==11.4.5.107 -nvidia-cusparse-cu12==12.1.0.106 -nvidia-ml-py==11.525.150 -nvidia-nccl-cu12==2.20.5 -nvidia-nvjitlink-cu12==12.5.82 -nvidia-nvtx-cu12==12.1.105 -openai==1.35.10 -opentelemetry-api==1.20.0 -opentelemetry-instrumentation==0.41b0 -opentelemetry-instrumentation-aiohttp-client==0.41b0 -opentelemetry-instrumentation-asgi==0.41b0 -opentelemetry-sdk==1.20.0 -opentelemetry-semantic-conventions==0.41b0 -opentelemetry-util-http==0.41b0 -orjson==3.10.6 -outlines==0.0.34 -packaging==24.1 -pathspec==0.12.1 -pip-requirements-parser==32.0.1 -pip-tools==7.4.1 -prometheus-client==0.20.0 -prometheus-fastapi-instrumentator==7.0.0 -protobuf==5.27.2 -psutil==6.0.0 -py-cpuinfo==9.0.0 -pydantic==2.8.2 -pydantic-core==2.20.1 -pygments==2.18.0 -pyparsing==3.1.2 -pyproject-hooks==1.1.0 -python-dateutil==2.9.0.post0 -python-dotenv==1.0.1 -python-json-logger==2.0.7 -python-multipart==0.0.9 -pyyaml==6.0.1 -pyzmq==26.0.3 -ray==2.31.0 -referencing==0.35.1 -regex==2024.5.15 -requests==2.32.3 -rich==13.7.1 -rpds-py==0.18.1 -safetensors==0.4.3 -schema==0.7.7 -scipy==1.13.1 -sentencepiece==0.2.0 -shellingham==1.5.4 -simple-di==0.1.5 -six==1.16.0 -sniffio==1.3.1 -starlette==0.37.2 -sympy==1.12.1 -tiktoken==0.7.0 -tokenizers==0.19.1 -tomli==2.0.1 -tomli-w==1.0.0 -torch==2.3.0 -tornado==6.4.1 -tqdm==4.66.4 -transformers==4.41.0 -triton==2.3.0 -typer==0.12.3 -typing-extensions==4.12.2 -ujson==5.10.0 -urllib3==2.2.2 -uvicorn[standard]==0.30.1 -uvloop==0.19.0 -vllm==0.4.3 -vllm-flash-attn==2.5.8.post2 -watchfiles==0.22.0 -websockets==12.0 -wheel==0.43.0 -wrapt==1.16.0 -wsproto==1.2.0 -xformers==0.0.26.post1 -yarl==1.9.4 -zipp==3.19.2 - -# The following packages are considered to be unsafe in a requirements file: -pip==24.1.2 -setuptools==70.2.0 diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/README.md b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/README.md new file mode 100644 index 0000000..7c53f79 --- /dev/null +++ b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/README.md @@ -0,0 +1,16 @@ +# llama2:7b-chat-awq-4bit-8df2 + +[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) +[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) +[![join_slack](https://badgen.net/badge/Join/BentoML%20Slack/cyan?icon=slack)](https://l.bentoml.com/join-slack-swagger) +[![BentoML GitHub Repo](https://img.shields.io/github/stars/bentoml/bentoml?style=social)](https://github.com/bentoml/BentoML) +[![Twitter Follow](https://img.shields.io/twitter/follow/bentomlai?label=Follow%20BentoML&style=social)](https://twitter.com/bentomlai) + +This is a Machine Learning Service created with BentoML. + +## Help + +* [📖 Documentation](https://docs.bentoml.com/en/latest/): Learn how to use BentoML. +* [💬 Community](https://l.bentoml.com/join-slack-swagger): Join the BentoML Slack community. +* [🐛 GitHub Issues](https://github.com/bentoml/BentoML/issues): Report bugs and feature requests. +* Tip: you can also [customize this README](https://docs.bentoml.com/en/latest/concepts/bento.html#description). diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/apis/openapi.yaml b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/apis/openapi.yaml similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/apis/openapi.yaml rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/apis/openapi.yaml diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/apis/schema.json b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/apis/schema.json similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/apis/schema.json rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/apis/schema.json diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/bento.yaml b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/bento.yaml similarity index 95% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/bento.yaml rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/bento.yaml index 3327654..2f895ec 100644 --- a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/bento.yaml +++ b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/bento.yaml @@ -1,12 +1,11 @@ service: service:VLLM name: llama2 -version: 7b-chat-awq-4bit-a35d +version: 7b-chat-awq-4bit-8df2 bentoml_version: 1.2.19 -creation_time: '2024-07-08T07:51:07.606369+00:00' +creation_time: '2024-07-12T13:32:54.939874+00:00' labels: + model_name: TheBloke/Llama-2-7B-Chat-AWQ openllm_alias: 7b-4bit,7b-chat-4bit - openllm_hf_model_id: TheBloke/Llama-2-7B-Chat-AWQ - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/env/docker/Dockerfile b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/env/docker/Dockerfile similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/env/docker/Dockerfile rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/env/docker/Dockerfile diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/env/docker/entrypoint.sh b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/env/docker/entrypoint.sh similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/env/docker/entrypoint.sh rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/env/docker/entrypoint.sh diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/env/python/install.sh b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/env/python/install.sh similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/env/python/install.sh rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/env/python/install.sh diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/env/python/requirements.lock.txt b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/env/python/requirements.lock.txt new file mode 100644 index 0000000..f6acdf5 --- /dev/null +++ b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/env/python/requirements.lock.txt @@ -0,0 +1,147 @@ +aiohttp==3.9.5 +aiosignal==1.3.1 +annotated-types==0.7.0 +anyio==4.4.0 +appdirs==1.4.4 +asgiref==3.8.1 +async-timeout==4.0.3 +attrs==23.2.0 +bentoml==1.2.19 +build==1.2.1 +cattrs==23.1.2 +certifi==2024.7.4 +charset-normalizer==3.3.2 +circus==0.18.0 +click==8.1.7 +click-option-group==0.5.6 +cloudpickle==3.0.0 +cmake==3.30.0 +deepmerge==1.1.1 +deprecated==1.2.14 +diskcache==5.6.3 +distro==1.9.0 +dnspython==2.6.1 +email-validator==2.2.0 +exceptiongroup==1.2.1 +fastapi==0.111.0 +fastapi-cli==0.0.4 +filelock==3.15.4 +frozenlist==1.4.1 +fs==2.4.16 +fsspec==2024.6.1 +h11==0.14.0 +httpcore==1.0.5 +httptools==0.6.1 +httpx==0.27.0 +httpx-ws==0.6.0 +huggingface-hub==0.23.4 +idna==3.7 +importlib-metadata==6.11.0 +inflection==0.5.1 +interegular==0.3.3 +jinja2==3.1.4 +joblib==1.4.2 +jsonschema==4.23.0 +jsonschema-specifications==2023.12.1 +lark==1.1.9 +llvmlite==0.43.0 +lm-format-enforcer==0.10.1 +markdown-it-py==3.0.0 +markupsafe==2.1.5 +mdurl==0.1.2 +mpmath==1.3.0 +msgpack==1.0.8 +multidict==6.0.5 +nest-asyncio==1.6.0 +networkx==3.2.1 +ninja==1.11.1.1 +numba==0.60.0 +numpy==1.26.0 +nvidia-cublas-cu12==12.1.3.1 +nvidia-cuda-cupti-cu12==12.1.105 +nvidia-cuda-nvrtc-cu12==12.1.105 +nvidia-cuda-runtime-cu12==12.1.105 +nvidia-cudnn-cu12==8.9.2.26 +nvidia-cufft-cu12==11.0.2.54 +nvidia-curand-cu12==10.3.2.106 +nvidia-cusolver-cu12==11.4.5.107 +nvidia-cusparse-cu12==12.1.0.106 +nvidia-ml-py==11.525.150 +nvidia-nccl-cu12==2.20.5 +nvidia-nvjitlink-cu12==12.5.82 +nvidia-nvtx-cu12==12.1.105 +openai==1.35.13 +opentelemetry-api==1.20.0 +opentelemetry-instrumentation==0.41b0 +opentelemetry-instrumentation-aiohttp-client==0.41b0 +opentelemetry-instrumentation-asgi==0.41b0 +opentelemetry-sdk==1.20.0 +opentelemetry-semantic-conventions==0.41b0 +opentelemetry-util-http==0.41b0 +orjson==3.10.6 +outlines==0.0.34 +packaging==24.1 +pathspec==0.12.1 +pip-requirements-parser==32.0.1 +pip-tools==7.4.1 +prometheus-client==0.20.0 +prometheus-fastapi-instrumentator==7.0.0 +protobuf==5.27.2 +psutil==6.0.0 +py-cpuinfo==9.0.0 +pydantic==2.8.2 +pydantic-core==2.20.1 +pygments==2.18.0 +pyparsing==3.1.2 +pyproject-hooks==1.1.0 +python-dateutil==2.9.0.post0 +python-dotenv==1.0.1 +python-json-logger==2.0.7 +python-multipart==0.0.9 +pyyaml==6.0.1 +pyzmq==26.0.3 +ray==2.32.0 +referencing==0.35.1 +regex==2024.5.15 +requests==2.32.3 +rich==13.7.1 +rpds-py==0.19.0 +safetensors==0.4.3 +schema==0.7.7 +scipy==1.13.1 +sentencepiece==0.2.0 +shellingham==1.5.4 +simple-di==0.1.5 +six==1.16.0 +sniffio==1.3.1 +starlette==0.37.2 +sympy==1.13.0 +tiktoken==0.7.0 +tokenizers==0.19.1 +tomli==2.0.1 +tomli-w==1.0.0 +torch==2.3.0 +tornado==6.4.1 +tqdm==4.66.4 +transformers==4.41.0 +triton==2.3.0 +typer==0.12.3 +typing-extensions==4.12.2 +ujson==5.10.0 +urllib3==2.2.2 +uvicorn[standard]==0.30.1 +uvloop==0.19.0 +vllm==0.4.3 +vllm-flash-attn==2.5.8.post2 +watchfiles==0.22.0 +websockets==12.0 +wheel==0.43.0 +wrapt==1.16.0 +wsproto==1.2.0 +xformers==0.0.26.post1 +yarl==1.9.4 +zipp==3.19.2 + +# The following packages are considered to be unsafe in a requirements file: +pip==24.1.2 +setuptools==70.3.0 diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/env/python/requirements.txt b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/env/python/requirements.txt similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/env/python/requirements.txt rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/env/python/requirements.txt diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/env/python/version.txt b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/env/python/version.txt similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/env/python/version.txt rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/env/python/version.txt diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/bento_constants.py b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/bento_constants.py similarity index 87% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/bento_constants.py rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/bento_constants.py index 5f5490d..ba4735c 100644 --- a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/bento_constants.py +++ b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/bento_constants.py @@ -7,8 +7,8 @@ model: TheBloke/Llama-2-7B-Chat-AWQ quantization: awq extra_labels: + model_name: TheBloke/Llama-2-7B-Chat-AWQ openllm_alias: 7b-4bit,7b-chat-4bit - openllm_hf_model_id: TheBloke/Llama-2-7B-Chat-AWQ project: vllm-chat service_config: name: llama2 diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/bentofile.yaml b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/bentofile.yaml similarity index 92% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/bentofile.yaml rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/bentofile.yaml index 8e79e7d..ad86550 100644 --- a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/bentofile.yaml +++ b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/bentofile.yaml @@ -28,9 +28,8 @@ include: - chat_templates/chat_templates/*.jinja - chat_templates/generation_configs/*.json labels: + model_name: TheBloke/Llama-2-7B-Chat-AWQ openllm_alias: 7b-4bit,7b-chat-4bit - openllm_hf_model_id: TheBloke/Llama-2-7B-Chat-AWQ - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/chat_templates/alpaca.jinja b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/chat_templates/alpaca.jinja similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/chat_templates/alpaca.jinja rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/chat_templates/alpaca.jinja diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/chat_templates/amberchat.jinja b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/chat_templates/amberchat.jinja similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/chat_templates/amberchat.jinja rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/chat_templates/amberchat.jinja diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/chat_templates/chatml.jinja b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/chat_templates/chatml.jinja similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/chat_templates/chatml.jinja rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/chat_templates/chatml.jinja diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/chat_templates/chatqa.jinja b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/chat_templates/chatqa.jinja similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/chat_templates/chatqa.jinja rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/chat_templates/chatqa.jinja diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/chat_templates/falcon-instruct.jinja b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/chat_templates/falcon-instruct.jinja similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/chat_templates/falcon-instruct.jinja rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/chat_templates/falcon-instruct.jinja diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/chat_templates/gemma-it.jinja b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/chat_templates/gemma-it.jinja similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/chat_templates/gemma-it.jinja rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/chat_templates/gemma-it.jinja diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/chat_templates/llama-2-chat.jinja b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/chat_templates/llama-2-chat.jinja similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/chat_templates/llama-2-chat.jinja rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/chat_templates/llama-2-chat.jinja diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/chat_templates/llama-3-chat.jinja b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/chat_templates/llama-3-chat.jinja similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/chat_templates/llama-3-chat.jinja rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/chat_templates/llama-3-chat.jinja diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/chat_templates/mistral-instruct.jinja b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/chat_templates/mistral-instruct.jinja similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/chat_templates/mistral-instruct.jinja rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/chat_templates/mistral-instruct.jinja diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/chat_templates/openchat.jinja b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/chat_templates/openchat.jinja similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/chat_templates/openchat.jinja rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/chat_templates/openchat.jinja diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/chat_templates/phi-3.jinja b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/chat_templates/phi-3.jinja similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/chat_templates/phi-3.jinja rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/chat_templates/phi-3.jinja diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/chat_templates/saiga.jinja b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/chat_templates/saiga.jinja similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/chat_templates/saiga.jinja rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/chat_templates/saiga.jinja diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/chat_templates/solar-instruct.jinja b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/chat_templates/solar-instruct.jinja similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/chat_templates/solar-instruct.jinja rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/chat_templates/solar-instruct.jinja diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/chat_templates/vicuna.jinja b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/chat_templates/vicuna.jinja similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/chat_templates/vicuna.jinja rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/chat_templates/vicuna.jinja diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/chat_templates/zephyr.jinja b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/chat_templates/zephyr.jinja similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/chat_templates/zephyr.jinja rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/chat_templates/zephyr.jinja diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/generation_configs/alpaca.json b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/generation_configs/alpaca.json similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/generation_configs/alpaca.json rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/generation_configs/alpaca.json diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/generation_configs/amberchat.json b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/generation_configs/amberchat.json similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/generation_configs/amberchat.json rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/generation_configs/amberchat.json diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/generation_configs/chatqa.json b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/generation_configs/chatqa.json similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/generation_configs/chatqa.json rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/generation_configs/chatqa.json diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/generation_configs/gemma-it.json b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/generation_configs/gemma-it.json similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/generation_configs/gemma-it.json rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/generation_configs/gemma-it.json diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/generation_configs/llama-2-chat.json b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/generation_configs/llama-2-chat.json similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/generation_configs/llama-2-chat.json rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/generation_configs/llama-2-chat.json diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/generation_configs/llama-3-chat.json b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/generation_configs/llama-3-chat.json similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/generation_configs/llama-3-chat.json rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/generation_configs/llama-3-chat.json diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/generation_configs/mistral-instruct.json b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/generation_configs/mistral-instruct.json similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/generation_configs/mistral-instruct.json rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/generation_configs/mistral-instruct.json diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/generation_configs/openchat.json b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/generation_configs/openchat.json similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/generation_configs/openchat.json rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/generation_configs/openchat.json diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/generation_configs/orca-2.json b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/generation_configs/orca-2.json similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/generation_configs/orca-2.json rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/generation_configs/orca-2.json diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/generation_configs/phi-3.json b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/generation_configs/phi-3.json similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/generation_configs/phi-3.json rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/generation_configs/phi-3.json diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/generation_configs/qwen2-chat.json b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/generation_configs/qwen2-chat.json similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/generation_configs/qwen2-chat.json rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/generation_configs/qwen2-chat.json diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/generation_configs/saiga.json b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/generation_configs/saiga.json similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/generation_configs/saiga.json rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/generation_configs/saiga.json diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/generation_configs/solar-instruct.json b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/generation_configs/solar-instruct.json similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/generation_configs/solar-instruct.json rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/generation_configs/solar-instruct.json diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/generation_configs/vicuna.json b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/generation_configs/vicuna.json similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/generation_configs/vicuna.json rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/generation_configs/vicuna.json diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/generation_configs/yi-chat.json b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/generation_configs/yi-chat.json similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/generation_configs/yi-chat.json rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/generation_configs/yi-chat.json diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/generation_configs/zephyr.json b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/generation_configs/zephyr.json similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/chat_templates/generation_configs/zephyr.json rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/chat_templates/generation_configs/zephyr.json diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/service.py b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/service.py similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/service.py rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/service.py diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/404.html b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/404.html similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/404.html rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/404.html diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/700-532b1fe2415e5859.js b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/700-532b1fe2415e5859.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/700-532b1fe2415e5859.js rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/700-532b1fe2415e5859.js diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/995-34374f39bb210839.js b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/995-34374f39bb210839.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/995-34374f39bb210839.js rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/995-34374f39bb210839.js diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/css/429544bd3cd8ce3a.css b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/css/429544bd3cd8ce3a.css similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/css/429544bd3cd8ce3a.css rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/css/429544bd3cd8ce3a.css diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/css/5b67f082b31cfc7b.css b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/css/5b67f082b31cfc7b.css similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/css/5b67f082b31cfc7b.css rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/css/5b67f082b31cfc7b.css diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/css/9e63023b20ddb15e.css b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/css/9e63023b20ddb15e.css similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/_next/static/css/9e63023b20ddb15e.css rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/_next/static/css/9e63023b20ddb15e.css diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/apple-touch-icon.png b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/apple-touch-icon.png similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/apple-touch-icon.png rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/apple-touch-icon.png diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/chat.html b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/chat.html similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/chat.html rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/chat.html diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/chat.txt b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/chat.txt similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/chat.txt rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/chat.txt diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/favicon-16x16.png b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/favicon-16x16.png similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/favicon-16x16.png rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/favicon-16x16.png diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/favicon.ico b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/favicon.ico similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/favicon.ico rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/favicon.ico diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/index.html b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/index.html similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/index.html rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/index.html diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/index.txt b/bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/index.txt similarity index 100% rename from bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/src/ui/index.txt rename to bentoml/bentos/llama2/7b-chat-awq-4bit-8df2/src/ui/index.txt diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/README.md b/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/README.md deleted file mode 100644 index 35641bf..0000000 --- a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/README.md +++ /dev/null @@ -1,16 +0,0 @@ -# llama2:7b-chat-awq-4bit-a35d - -[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) -[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) -[![join_slack](https://badgen.net/badge/Join/BentoML%20Slack/cyan?icon=slack)](https://l.bentoml.com/join-slack-swagger) -[![BentoML GitHub Repo](https://img.shields.io/github/stars/bentoml/bentoml?style=social)](https://github.com/bentoml/BentoML) -[![Twitter Follow](https://img.shields.io/twitter/follow/bentomlai?label=Follow%20BentoML&style=social)](https://twitter.com/bentomlai) - -This is a Machine Learning Service created with BentoML. - -## Help - -* [📖 Documentation](https://docs.bentoml.com/en/latest/): Learn how to use BentoML. -* [💬 Community](https://l.bentoml.com/join-slack-swagger): Join the BentoML Slack community. -* [🐛 GitHub Issues](https://github.com/bentoml/BentoML/issues): Report bugs and feature requests. -* Tip: you can also [customize this README](https://docs.bentoml.com/en/latest/concepts/bento.html#description). diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/env/python/requirements.lock.txt b/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/env/python/requirements.lock.txt deleted file mode 100644 index 925ce19..0000000 --- a/bentoml/bentos/llama2/7b-chat-awq-4bit-a35d/env/python/requirements.lock.txt +++ /dev/null @@ -1,147 +0,0 @@ -aiohttp==3.9.5 -aiosignal==1.3.1 -annotated-types==0.7.0 -anyio==4.4.0 -appdirs==1.4.4 -asgiref==3.8.1 -async-timeout==4.0.3 -attrs==23.2.0 -bentoml==1.2.19 -build==1.2.1 -cattrs==23.1.2 -certifi==2024.7.4 -charset-normalizer==3.3.2 -circus==0.18.0 -click==8.1.7 -click-option-group==0.5.6 -cloudpickle==3.0.0 -cmake==3.30.0 -deepmerge==1.1.1 -deprecated==1.2.14 -diskcache==5.6.3 -distro==1.9.0 -dnspython==2.6.1 -email-validator==2.2.0 -exceptiongroup==1.2.1 -fastapi==0.111.0 -fastapi-cli==0.0.4 -filelock==3.15.4 -frozenlist==1.4.1 -fs==2.4.16 -fsspec==2024.6.1 -h11==0.14.0 -httpcore==1.0.5 -httptools==0.6.1 -httpx==0.27.0 -httpx-ws==0.6.0 -huggingface-hub==0.23.4 -idna==3.7 -importlib-metadata==6.11.0 -inflection==0.5.1 -interegular==0.3.3 -jinja2==3.1.4 -joblib==1.4.2 -jsonschema==4.22.0 -jsonschema-specifications==2023.12.1 -lark==1.1.9 -llvmlite==0.43.0 -lm-format-enforcer==0.10.1 -markdown-it-py==3.0.0 -markupsafe==2.1.5 -mdurl==0.1.2 -mpmath==1.3.0 -msgpack==1.0.8 -multidict==6.0.5 -nest-asyncio==1.6.0 -networkx==3.2.1 -ninja==1.11.1.1 -numba==0.60.0 -numpy==1.26.0 -nvidia-cublas-cu12==12.1.3.1 -nvidia-cuda-cupti-cu12==12.1.105 -nvidia-cuda-nvrtc-cu12==12.1.105 -nvidia-cuda-runtime-cu12==12.1.105 -nvidia-cudnn-cu12==8.9.2.26 -nvidia-cufft-cu12==11.0.2.54 -nvidia-curand-cu12==10.3.2.106 -nvidia-cusolver-cu12==11.4.5.107 -nvidia-cusparse-cu12==12.1.0.106 -nvidia-ml-py==11.525.150 -nvidia-nccl-cu12==2.20.5 -nvidia-nvjitlink-cu12==12.5.82 -nvidia-nvtx-cu12==12.1.105 -openai==1.35.10 -opentelemetry-api==1.20.0 -opentelemetry-instrumentation==0.41b0 -opentelemetry-instrumentation-aiohttp-client==0.41b0 -opentelemetry-instrumentation-asgi==0.41b0 -opentelemetry-sdk==1.20.0 -opentelemetry-semantic-conventions==0.41b0 -opentelemetry-util-http==0.41b0 -orjson==3.10.6 -outlines==0.0.34 -packaging==24.1 -pathspec==0.12.1 -pip-requirements-parser==32.0.1 -pip-tools==7.4.1 -prometheus-client==0.20.0 -prometheus-fastapi-instrumentator==7.0.0 -protobuf==5.27.2 -psutil==6.0.0 -py-cpuinfo==9.0.0 -pydantic==2.8.2 -pydantic-core==2.20.1 -pygments==2.18.0 -pyparsing==3.1.2 -pyproject-hooks==1.1.0 -python-dateutil==2.9.0.post0 -python-dotenv==1.0.1 -python-json-logger==2.0.7 -python-multipart==0.0.9 -pyyaml==6.0.1 -pyzmq==26.0.3 -ray==2.31.0 -referencing==0.35.1 -regex==2024.5.15 -requests==2.32.3 -rich==13.7.1 -rpds-py==0.18.1 -safetensors==0.4.3 -schema==0.7.7 -scipy==1.13.1 -sentencepiece==0.2.0 -shellingham==1.5.4 -simple-di==0.1.5 -six==1.16.0 -sniffio==1.3.1 -starlette==0.37.2 -sympy==1.12.1 -tiktoken==0.7.0 -tokenizers==0.19.1 -tomli==2.0.1 -tomli-w==1.0.0 -torch==2.3.0 -tornado==6.4.1 -tqdm==4.66.4 -transformers==4.41.0 -triton==2.3.0 -typer==0.12.3 -typing-extensions==4.12.2 -ujson==5.10.0 -urllib3==2.2.2 -uvicorn[standard]==0.30.1 -uvloop==0.19.0 -vllm==0.4.3 -vllm-flash-attn==2.5.8.post2 -watchfiles==0.22.0 -websockets==12.0 -wheel==0.43.0 -wrapt==1.16.0 -wsproto==1.2.0 -xformers==0.0.26.post1 -yarl==1.9.4 -zipp==3.19.2 - -# The following packages are considered to be unsafe in a requirements file: -pip==24.1.2 -setuptools==70.2.0 diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/README.md b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/README.md similarity index 97% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/README.md rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/README.md index 80f71b9..3a5fffa 100644 --- a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/README.md +++ b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/README.md @@ -1,4 +1,4 @@ -# llama2:7b-chat-fp16-f9ef +# llama2:7b-chat-fp16-2e3a [![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) [![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/apis/openapi.yaml b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/apis/openapi.yaml similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/apis/openapi.yaml rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/apis/openapi.yaml diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/apis/schema.json b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/apis/schema.json similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/apis/schema.json rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/apis/schema.json diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/bento.yaml b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/bento.yaml similarity index 95% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/bento.yaml rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/bento.yaml index e65c062..e2689cb 100644 --- a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/bento.yaml +++ b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/bento.yaml @@ -1,12 +1,11 @@ service: service:VLLM name: llama2 -version: 7b-chat-fp16-f9ef +version: 7b-chat-fp16-2e3a bentoml_version: 1.2.19 -creation_time: '2024-07-08T07:48:39.737970+00:00' +creation_time: '2024-07-12T13:29:39.928558+00:00' labels: + model_name: meta-llama/Llama-2-7b-chat-hf openllm_alias: 7b,7b-chat - openllm_hf_model_id: meta-llama/Llama-2-7b-chat-hf - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/env/docker/Dockerfile b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/env/docker/Dockerfile similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/env/docker/Dockerfile rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/env/docker/Dockerfile diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/env/docker/entrypoint.sh b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/env/docker/entrypoint.sh similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/env/docker/entrypoint.sh rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/env/docker/entrypoint.sh diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/env/python/install.sh b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/env/python/install.sh similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/env/python/install.sh rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/env/python/install.sh diff --git a/bentoml/bentos/llama2/7b-chat-fp16-2e3a/env/python/requirements.lock.txt b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/env/python/requirements.lock.txt new file mode 100644 index 0000000..f6acdf5 --- /dev/null +++ b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/env/python/requirements.lock.txt @@ -0,0 +1,147 @@ +aiohttp==3.9.5 +aiosignal==1.3.1 +annotated-types==0.7.0 +anyio==4.4.0 +appdirs==1.4.4 +asgiref==3.8.1 +async-timeout==4.0.3 +attrs==23.2.0 +bentoml==1.2.19 +build==1.2.1 +cattrs==23.1.2 +certifi==2024.7.4 +charset-normalizer==3.3.2 +circus==0.18.0 +click==8.1.7 +click-option-group==0.5.6 +cloudpickle==3.0.0 +cmake==3.30.0 +deepmerge==1.1.1 +deprecated==1.2.14 +diskcache==5.6.3 +distro==1.9.0 +dnspython==2.6.1 +email-validator==2.2.0 +exceptiongroup==1.2.1 +fastapi==0.111.0 +fastapi-cli==0.0.4 +filelock==3.15.4 +frozenlist==1.4.1 +fs==2.4.16 +fsspec==2024.6.1 +h11==0.14.0 +httpcore==1.0.5 +httptools==0.6.1 +httpx==0.27.0 +httpx-ws==0.6.0 +huggingface-hub==0.23.4 +idna==3.7 +importlib-metadata==6.11.0 +inflection==0.5.1 +interegular==0.3.3 +jinja2==3.1.4 +joblib==1.4.2 +jsonschema==4.23.0 +jsonschema-specifications==2023.12.1 +lark==1.1.9 +llvmlite==0.43.0 +lm-format-enforcer==0.10.1 +markdown-it-py==3.0.0 +markupsafe==2.1.5 +mdurl==0.1.2 +mpmath==1.3.0 +msgpack==1.0.8 +multidict==6.0.5 +nest-asyncio==1.6.0 +networkx==3.2.1 +ninja==1.11.1.1 +numba==0.60.0 +numpy==1.26.0 +nvidia-cublas-cu12==12.1.3.1 +nvidia-cuda-cupti-cu12==12.1.105 +nvidia-cuda-nvrtc-cu12==12.1.105 +nvidia-cuda-runtime-cu12==12.1.105 +nvidia-cudnn-cu12==8.9.2.26 +nvidia-cufft-cu12==11.0.2.54 +nvidia-curand-cu12==10.3.2.106 +nvidia-cusolver-cu12==11.4.5.107 +nvidia-cusparse-cu12==12.1.0.106 +nvidia-ml-py==11.525.150 +nvidia-nccl-cu12==2.20.5 +nvidia-nvjitlink-cu12==12.5.82 +nvidia-nvtx-cu12==12.1.105 +openai==1.35.13 +opentelemetry-api==1.20.0 +opentelemetry-instrumentation==0.41b0 +opentelemetry-instrumentation-aiohttp-client==0.41b0 +opentelemetry-instrumentation-asgi==0.41b0 +opentelemetry-sdk==1.20.0 +opentelemetry-semantic-conventions==0.41b0 +opentelemetry-util-http==0.41b0 +orjson==3.10.6 +outlines==0.0.34 +packaging==24.1 +pathspec==0.12.1 +pip-requirements-parser==32.0.1 +pip-tools==7.4.1 +prometheus-client==0.20.0 +prometheus-fastapi-instrumentator==7.0.0 +protobuf==5.27.2 +psutil==6.0.0 +py-cpuinfo==9.0.0 +pydantic==2.8.2 +pydantic-core==2.20.1 +pygments==2.18.0 +pyparsing==3.1.2 +pyproject-hooks==1.1.0 +python-dateutil==2.9.0.post0 +python-dotenv==1.0.1 +python-json-logger==2.0.7 +python-multipart==0.0.9 +pyyaml==6.0.1 +pyzmq==26.0.3 +ray==2.32.0 +referencing==0.35.1 +regex==2024.5.15 +requests==2.32.3 +rich==13.7.1 +rpds-py==0.19.0 +safetensors==0.4.3 +schema==0.7.7 +scipy==1.13.1 +sentencepiece==0.2.0 +shellingham==1.5.4 +simple-di==0.1.5 +six==1.16.0 +sniffio==1.3.1 +starlette==0.37.2 +sympy==1.13.0 +tiktoken==0.7.0 +tokenizers==0.19.1 +tomli==2.0.1 +tomli-w==1.0.0 +torch==2.3.0 +tornado==6.4.1 +tqdm==4.66.4 +transformers==4.41.0 +triton==2.3.0 +typer==0.12.3 +typing-extensions==4.12.2 +ujson==5.10.0 +urllib3==2.2.2 +uvicorn[standard]==0.30.1 +uvloop==0.19.0 +vllm==0.4.3 +vllm-flash-attn==2.5.8.post2 +watchfiles==0.22.0 +websockets==12.0 +wheel==0.43.0 +wrapt==1.16.0 +wsproto==1.2.0 +xformers==0.0.26.post1 +yarl==1.9.4 +zipp==3.19.2 + +# The following packages are considered to be unsafe in a requirements file: +pip==24.1.2 +setuptools==70.3.0 diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/env/python/requirements.txt b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/env/python/requirements.txt similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/env/python/requirements.txt rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/env/python/requirements.txt diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/env/python/version.txt b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/env/python/version.txt similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/env/python/version.txt rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/env/python/version.txt diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/bento_constants.py b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/bento_constants.py similarity index 85% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/bento_constants.py rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/bento_constants.py index 158da9b..f1ea8ac 100644 --- a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/bento_constants.py +++ b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/bento_constants.py @@ -6,8 +6,8 @@ max_model_len: 1024 model: meta-llama/Llama-2-7b-chat-hf extra_labels: + model_name: meta-llama/Llama-2-7b-chat-hf openllm_alias: 7b,7b-chat - openllm_hf_model_id: meta-llama/Llama-2-7b-chat-hf project: vllm-chat service_config: name: llama2 diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/bentofile.yaml b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/bentofile.yaml similarity index 92% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/bentofile.yaml rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/bentofile.yaml index ea3c215..9674c91 100644 --- a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/bentofile.yaml +++ b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/bentofile.yaml @@ -28,9 +28,8 @@ include: - chat_templates/chat_templates/*.jinja - chat_templates/generation_configs/*.json labels: + model_name: meta-llama/Llama-2-7b-chat-hf openllm_alias: 7b,7b-chat - openllm_hf_model_id: meta-llama/Llama-2-7b-chat-hf - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/chat_templates/alpaca.jinja b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/chat_templates/alpaca.jinja similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/chat_templates/alpaca.jinja rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/chat_templates/alpaca.jinja diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/chat_templates/amberchat.jinja b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/chat_templates/amberchat.jinja similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/chat_templates/amberchat.jinja rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/chat_templates/amberchat.jinja diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/chat_templates/chatml.jinja b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/chat_templates/chatml.jinja similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/chat_templates/chatml.jinja rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/chat_templates/chatml.jinja diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/chat_templates/chatqa.jinja b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/chat_templates/chatqa.jinja similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/chat_templates/chatqa.jinja rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/chat_templates/chatqa.jinja diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/chat_templates/falcon-instruct.jinja b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/chat_templates/falcon-instruct.jinja similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/chat_templates/falcon-instruct.jinja rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/chat_templates/falcon-instruct.jinja diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/chat_templates/gemma-it.jinja b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/chat_templates/gemma-it.jinja similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/chat_templates/gemma-it.jinja rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/chat_templates/gemma-it.jinja diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/chat_templates/llama-2-chat.jinja b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/chat_templates/llama-2-chat.jinja similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/chat_templates/llama-2-chat.jinja rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/chat_templates/llama-2-chat.jinja diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/chat_templates/llama-3-chat.jinja b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/chat_templates/llama-3-chat.jinja similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/chat_templates/llama-3-chat.jinja rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/chat_templates/llama-3-chat.jinja diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/chat_templates/mistral-instruct.jinja b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/chat_templates/mistral-instruct.jinja similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/chat_templates/mistral-instruct.jinja rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/chat_templates/mistral-instruct.jinja diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/chat_templates/openchat.jinja b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/chat_templates/openchat.jinja similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/chat_templates/openchat.jinja rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/chat_templates/openchat.jinja diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/chat_templates/phi-3.jinja b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/chat_templates/phi-3.jinja similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/chat_templates/phi-3.jinja rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/chat_templates/phi-3.jinja diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/chat_templates/saiga.jinja b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/chat_templates/saiga.jinja similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/chat_templates/saiga.jinja rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/chat_templates/saiga.jinja diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/chat_templates/solar-instruct.jinja b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/chat_templates/solar-instruct.jinja similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/chat_templates/solar-instruct.jinja rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/chat_templates/solar-instruct.jinja diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/chat_templates/vicuna.jinja b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/chat_templates/vicuna.jinja similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/chat_templates/vicuna.jinja rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/chat_templates/vicuna.jinja diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/chat_templates/zephyr.jinja b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/chat_templates/zephyr.jinja similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/chat_templates/zephyr.jinja rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/chat_templates/zephyr.jinja diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/generation_configs/alpaca.json b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/generation_configs/alpaca.json similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/generation_configs/alpaca.json rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/generation_configs/alpaca.json diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/generation_configs/amberchat.json b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/generation_configs/amberchat.json similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/generation_configs/amberchat.json rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/generation_configs/amberchat.json diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/generation_configs/chatqa.json b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/generation_configs/chatqa.json similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/generation_configs/chatqa.json rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/generation_configs/chatqa.json diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/generation_configs/gemma-it.json b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/generation_configs/gemma-it.json similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/generation_configs/gemma-it.json rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/generation_configs/gemma-it.json diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/generation_configs/llama-2-chat.json b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/generation_configs/llama-2-chat.json similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/generation_configs/llama-2-chat.json rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/generation_configs/llama-2-chat.json diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/generation_configs/llama-3-chat.json b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/generation_configs/llama-3-chat.json similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/generation_configs/llama-3-chat.json rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/generation_configs/llama-3-chat.json diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/generation_configs/mistral-instruct.json b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/generation_configs/mistral-instruct.json similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/generation_configs/mistral-instruct.json rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/generation_configs/mistral-instruct.json diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/generation_configs/openchat.json b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/generation_configs/openchat.json similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/generation_configs/openchat.json rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/generation_configs/openchat.json diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/generation_configs/orca-2.json b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/generation_configs/orca-2.json similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/generation_configs/orca-2.json rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/generation_configs/orca-2.json diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/generation_configs/phi-3.json b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/generation_configs/phi-3.json similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/generation_configs/phi-3.json rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/generation_configs/phi-3.json diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/generation_configs/qwen2-chat.json b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/generation_configs/qwen2-chat.json similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/generation_configs/qwen2-chat.json rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/generation_configs/qwen2-chat.json diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/generation_configs/saiga.json b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/generation_configs/saiga.json similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/generation_configs/saiga.json rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/generation_configs/saiga.json diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/generation_configs/solar-instruct.json b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/generation_configs/solar-instruct.json similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/generation_configs/solar-instruct.json rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/generation_configs/solar-instruct.json diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/generation_configs/vicuna.json b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/generation_configs/vicuna.json similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/generation_configs/vicuna.json rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/generation_configs/vicuna.json diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/generation_configs/yi-chat.json b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/generation_configs/yi-chat.json similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/generation_configs/yi-chat.json rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/generation_configs/yi-chat.json diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/generation_configs/zephyr.json b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/generation_configs/zephyr.json similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/chat_templates/generation_configs/zephyr.json rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/chat_templates/generation_configs/zephyr.json diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/service.py b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/service.py similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/service.py rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/service.py diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/404.html b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/404.html similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/404.html rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/404.html diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/700-532b1fe2415e5859.js b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/700-532b1fe2415e5859.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/700-532b1fe2415e5859.js rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/700-532b1fe2415e5859.js diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/995-34374f39bb210839.js b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/995-34374f39bb210839.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/995-34374f39bb210839.js rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/995-34374f39bb210839.js diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/css/429544bd3cd8ce3a.css b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/css/429544bd3cd8ce3a.css similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/css/429544bd3cd8ce3a.css rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/css/429544bd3cd8ce3a.css diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/css/5b67f082b31cfc7b.css b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/css/5b67f082b31cfc7b.css similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/css/5b67f082b31cfc7b.css rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/css/5b67f082b31cfc7b.css diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/css/9e63023b20ddb15e.css b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/css/9e63023b20ddb15e.css similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/_next/static/css/9e63023b20ddb15e.css rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/_next/static/css/9e63023b20ddb15e.css diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/apple-touch-icon.png b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/apple-touch-icon.png similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/apple-touch-icon.png rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/apple-touch-icon.png diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/chat.html b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/chat.html similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/chat.html rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/chat.html diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/chat.txt b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/chat.txt similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/chat.txt rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/chat.txt diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/favicon-16x16.png b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/favicon-16x16.png similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/favicon-16x16.png rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/favicon-16x16.png diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/favicon.ico b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/favicon.ico similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/favicon.ico rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/favicon.ico diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/index.html b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/index.html similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/index.html rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/index.html diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/index.txt b/bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/index.txt similarity index 100% rename from bentoml/bentos/llama2/7b-chat-fp16-f9ef/src/ui/index.txt rename to bentoml/bentos/llama2/7b-chat-fp16-2e3a/src/ui/index.txt diff --git a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/env/python/requirements.lock.txt b/bentoml/bentos/llama2/7b-chat-fp16-f9ef/env/python/requirements.lock.txt deleted file mode 100644 index 925ce19..0000000 --- a/bentoml/bentos/llama2/7b-chat-fp16-f9ef/env/python/requirements.lock.txt +++ /dev/null @@ -1,147 +0,0 @@ -aiohttp==3.9.5 -aiosignal==1.3.1 -annotated-types==0.7.0 -anyio==4.4.0 -appdirs==1.4.4 -asgiref==3.8.1 -async-timeout==4.0.3 -attrs==23.2.0 -bentoml==1.2.19 -build==1.2.1 -cattrs==23.1.2 -certifi==2024.7.4 -charset-normalizer==3.3.2 -circus==0.18.0 -click==8.1.7 -click-option-group==0.5.6 -cloudpickle==3.0.0 -cmake==3.30.0 -deepmerge==1.1.1 -deprecated==1.2.14 -diskcache==5.6.3 -distro==1.9.0 -dnspython==2.6.1 -email-validator==2.2.0 -exceptiongroup==1.2.1 -fastapi==0.111.0 -fastapi-cli==0.0.4 -filelock==3.15.4 -frozenlist==1.4.1 -fs==2.4.16 -fsspec==2024.6.1 -h11==0.14.0 -httpcore==1.0.5 -httptools==0.6.1 -httpx==0.27.0 -httpx-ws==0.6.0 -huggingface-hub==0.23.4 -idna==3.7 -importlib-metadata==6.11.0 -inflection==0.5.1 -interegular==0.3.3 -jinja2==3.1.4 -joblib==1.4.2 -jsonschema==4.22.0 -jsonschema-specifications==2023.12.1 -lark==1.1.9 -llvmlite==0.43.0 -lm-format-enforcer==0.10.1 -markdown-it-py==3.0.0 -markupsafe==2.1.5 -mdurl==0.1.2 -mpmath==1.3.0 -msgpack==1.0.8 -multidict==6.0.5 -nest-asyncio==1.6.0 -networkx==3.2.1 -ninja==1.11.1.1 -numba==0.60.0 -numpy==1.26.0 -nvidia-cublas-cu12==12.1.3.1 -nvidia-cuda-cupti-cu12==12.1.105 -nvidia-cuda-nvrtc-cu12==12.1.105 -nvidia-cuda-runtime-cu12==12.1.105 -nvidia-cudnn-cu12==8.9.2.26 -nvidia-cufft-cu12==11.0.2.54 -nvidia-curand-cu12==10.3.2.106 -nvidia-cusolver-cu12==11.4.5.107 -nvidia-cusparse-cu12==12.1.0.106 -nvidia-ml-py==11.525.150 -nvidia-nccl-cu12==2.20.5 -nvidia-nvjitlink-cu12==12.5.82 -nvidia-nvtx-cu12==12.1.105 -openai==1.35.10 -opentelemetry-api==1.20.0 -opentelemetry-instrumentation==0.41b0 -opentelemetry-instrumentation-aiohttp-client==0.41b0 -opentelemetry-instrumentation-asgi==0.41b0 -opentelemetry-sdk==1.20.0 -opentelemetry-semantic-conventions==0.41b0 -opentelemetry-util-http==0.41b0 -orjson==3.10.6 -outlines==0.0.34 -packaging==24.1 -pathspec==0.12.1 -pip-requirements-parser==32.0.1 -pip-tools==7.4.1 -prometheus-client==0.20.0 -prometheus-fastapi-instrumentator==7.0.0 -protobuf==5.27.2 -psutil==6.0.0 -py-cpuinfo==9.0.0 -pydantic==2.8.2 -pydantic-core==2.20.1 -pygments==2.18.0 -pyparsing==3.1.2 -pyproject-hooks==1.1.0 -python-dateutil==2.9.0.post0 -python-dotenv==1.0.1 -python-json-logger==2.0.7 -python-multipart==0.0.9 -pyyaml==6.0.1 -pyzmq==26.0.3 -ray==2.31.0 -referencing==0.35.1 -regex==2024.5.15 -requests==2.32.3 -rich==13.7.1 -rpds-py==0.18.1 -safetensors==0.4.3 -schema==0.7.7 -scipy==1.13.1 -sentencepiece==0.2.0 -shellingham==1.5.4 -simple-di==0.1.5 -six==1.16.0 -sniffio==1.3.1 -starlette==0.37.2 -sympy==1.12.1 -tiktoken==0.7.0 -tokenizers==0.19.1 -tomli==2.0.1 -tomli-w==1.0.0 -torch==2.3.0 -tornado==6.4.1 -tqdm==4.66.4 -transformers==4.41.0 -triton==2.3.0 -typer==0.12.3 -typing-extensions==4.12.2 -ujson==5.10.0 -urllib3==2.2.2 -uvicorn[standard]==0.30.1 -uvloop==0.19.0 -vllm==0.4.3 -vllm-flash-attn==2.5.8.post2 -watchfiles==0.22.0 -websockets==12.0 -wheel==0.43.0 -wrapt==1.16.0 -wsproto==1.2.0 -xformers==0.0.26.post1 -yarl==1.9.4 -zipp==3.19.2 - -# The following packages are considered to be unsafe in a requirements file: -pip==24.1.2 -setuptools==70.2.0 diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/README.md b/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/README.md deleted file mode 100644 index 41865b5..0000000 --- a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/README.md +++ /dev/null @@ -1,16 +0,0 @@ -# llama3:70b-instruct-awq-4bit-a5d5 - -[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) -[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) -[![join_slack](https://badgen.net/badge/Join/BentoML%20Slack/cyan?icon=slack)](https://l.bentoml.com/join-slack-swagger) -[![BentoML GitHub Repo](https://img.shields.io/github/stars/bentoml/bentoml?style=social)](https://github.com/bentoml/BentoML) -[![Twitter Follow](https://img.shields.io/twitter/follow/bentomlai?label=Follow%20BentoML&style=social)](https://twitter.com/bentomlai) - -This is a Machine Learning Service created with BentoML. - -## Help - -* [📖 Documentation](https://docs.bentoml.com/en/latest/): Learn how to use BentoML. -* [💬 Community](https://l.bentoml.com/join-slack-swagger): Join the BentoML Slack community. -* [🐛 GitHub Issues](https://github.com/bentoml/BentoML/issues): Report bugs and feature requests. -* Tip: you can also [customize this README](https://docs.bentoml.com/en/latest/concepts/bento.html#description). diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/env/python/requirements.lock.txt b/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/env/python/requirements.lock.txt deleted file mode 100644 index 925ce19..0000000 --- a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/env/python/requirements.lock.txt +++ /dev/null @@ -1,147 +0,0 @@ -aiohttp==3.9.5 -aiosignal==1.3.1 -annotated-types==0.7.0 -anyio==4.4.0 -appdirs==1.4.4 -asgiref==3.8.1 -async-timeout==4.0.3 -attrs==23.2.0 -bentoml==1.2.19 -build==1.2.1 -cattrs==23.1.2 -certifi==2024.7.4 -charset-normalizer==3.3.2 -circus==0.18.0 -click==8.1.7 -click-option-group==0.5.6 -cloudpickle==3.0.0 -cmake==3.30.0 -deepmerge==1.1.1 -deprecated==1.2.14 -diskcache==5.6.3 -distro==1.9.0 -dnspython==2.6.1 -email-validator==2.2.0 -exceptiongroup==1.2.1 -fastapi==0.111.0 -fastapi-cli==0.0.4 -filelock==3.15.4 -frozenlist==1.4.1 -fs==2.4.16 -fsspec==2024.6.1 -h11==0.14.0 -httpcore==1.0.5 -httptools==0.6.1 -httpx==0.27.0 -httpx-ws==0.6.0 -huggingface-hub==0.23.4 -idna==3.7 -importlib-metadata==6.11.0 -inflection==0.5.1 -interegular==0.3.3 -jinja2==3.1.4 -joblib==1.4.2 -jsonschema==4.22.0 -jsonschema-specifications==2023.12.1 -lark==1.1.9 -llvmlite==0.43.0 -lm-format-enforcer==0.10.1 -markdown-it-py==3.0.0 -markupsafe==2.1.5 -mdurl==0.1.2 -mpmath==1.3.0 -msgpack==1.0.8 -multidict==6.0.5 -nest-asyncio==1.6.0 -networkx==3.2.1 -ninja==1.11.1.1 -numba==0.60.0 -numpy==1.26.0 -nvidia-cublas-cu12==12.1.3.1 -nvidia-cuda-cupti-cu12==12.1.105 -nvidia-cuda-nvrtc-cu12==12.1.105 -nvidia-cuda-runtime-cu12==12.1.105 -nvidia-cudnn-cu12==8.9.2.26 -nvidia-cufft-cu12==11.0.2.54 -nvidia-curand-cu12==10.3.2.106 -nvidia-cusolver-cu12==11.4.5.107 -nvidia-cusparse-cu12==12.1.0.106 -nvidia-ml-py==11.525.150 -nvidia-nccl-cu12==2.20.5 -nvidia-nvjitlink-cu12==12.5.82 -nvidia-nvtx-cu12==12.1.105 -openai==1.35.10 -opentelemetry-api==1.20.0 -opentelemetry-instrumentation==0.41b0 -opentelemetry-instrumentation-aiohttp-client==0.41b0 -opentelemetry-instrumentation-asgi==0.41b0 -opentelemetry-sdk==1.20.0 -opentelemetry-semantic-conventions==0.41b0 -opentelemetry-util-http==0.41b0 -orjson==3.10.6 -outlines==0.0.34 -packaging==24.1 -pathspec==0.12.1 -pip-requirements-parser==32.0.1 -pip-tools==7.4.1 -prometheus-client==0.20.0 -prometheus-fastapi-instrumentator==7.0.0 -protobuf==5.27.2 -psutil==6.0.0 -py-cpuinfo==9.0.0 -pydantic==2.8.2 -pydantic-core==2.20.1 -pygments==2.18.0 -pyparsing==3.1.2 -pyproject-hooks==1.1.0 -python-dateutil==2.9.0.post0 -python-dotenv==1.0.1 -python-json-logger==2.0.7 -python-multipart==0.0.9 -pyyaml==6.0.1 -pyzmq==26.0.3 -ray==2.31.0 -referencing==0.35.1 -regex==2024.5.15 -requests==2.32.3 -rich==13.7.1 -rpds-py==0.18.1 -safetensors==0.4.3 -schema==0.7.7 -scipy==1.13.1 -sentencepiece==0.2.0 -shellingham==1.5.4 -simple-di==0.1.5 -six==1.16.0 -sniffio==1.3.1 -starlette==0.37.2 -sympy==1.12.1 -tiktoken==0.7.0 -tokenizers==0.19.1 -tomli==2.0.1 -tomli-w==1.0.0 -torch==2.3.0 -tornado==6.4.1 -tqdm==4.66.4 -transformers==4.41.0 -triton==2.3.0 -typer==0.12.3 -typing-extensions==4.12.2 -ujson==5.10.0 -urllib3==2.2.2 -uvicorn[standard]==0.30.1 -uvloop==0.19.0 -vllm==0.4.3 -vllm-flash-attn==2.5.8.post2 -watchfiles==0.22.0 -websockets==12.0 -wheel==0.43.0 -wrapt==1.16.0 -wsproto==1.2.0 -xformers==0.0.26.post1 -yarl==1.9.4 -zipp==3.19.2 - -# The following packages are considered to be unsafe in a requirements file: -pip==24.1.2 -setuptools==70.2.0 diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/README.md b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/README.md new file mode 100644 index 0000000..a9ca138 --- /dev/null +++ b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/README.md @@ -0,0 +1,16 @@ +# llama3:70b-instruct-awq-4bit-e968 + +[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) +[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) +[![join_slack](https://badgen.net/badge/Join/BentoML%20Slack/cyan?icon=slack)](https://l.bentoml.com/join-slack-swagger) +[![BentoML GitHub Repo](https://img.shields.io/github/stars/bentoml/bentoml?style=social)](https://github.com/bentoml/BentoML) +[![Twitter Follow](https://img.shields.io/twitter/follow/bentomlai?label=Follow%20BentoML&style=social)](https://twitter.com/bentomlai) + +This is a Machine Learning Service created with BentoML. + +## Help + +* [📖 Documentation](https://docs.bentoml.com/en/latest/): Learn how to use BentoML. +* [💬 Community](https://l.bentoml.com/join-slack-swagger): Join the BentoML Slack community. +* [🐛 GitHub Issues](https://github.com/bentoml/BentoML/issues): Report bugs and feature requests. +* Tip: you can also [customize this README](https://docs.bentoml.com/en/latest/concepts/bento.html#description). diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/apis/openapi.yaml b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/apis/openapi.yaml similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/apis/openapi.yaml rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/apis/openapi.yaml diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/apis/schema.json b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/apis/schema.json similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/apis/schema.json rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/apis/schema.json diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/bento.yaml b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/bento.yaml similarity index 94% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/bento.yaml rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/bento.yaml index e8220dd..232d264 100644 --- a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/bento.yaml +++ b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/bento.yaml @@ -1,12 +1,11 @@ service: service:VLLM name: llama3 -version: 70b-instruct-awq-4bit-a5d5 +version: 70b-instruct-awq-4bit-e968 bentoml_version: 1.2.19 -creation_time: '2024-07-08T07:54:39.183603+00:00' +creation_time: '2024-07-12T13:37:06.457762+00:00' labels: + model_name: casperhansen/llama-3-70b-instruct-awq openllm_alias: 70b-4bit,70b-instruct-4bit - openllm_hf_model_id: casperhansen/llama-3-70b-instruct-awq - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/env/docker/Dockerfile b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/env/docker/Dockerfile similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/env/docker/Dockerfile rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/env/docker/Dockerfile diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/env/docker/entrypoint.sh b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/env/docker/entrypoint.sh similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/env/docker/entrypoint.sh rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/env/docker/entrypoint.sh diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/env/python/install.sh b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/env/python/install.sh similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/env/python/install.sh rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/env/python/install.sh diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/env/python/requirements.lock.txt b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/env/python/requirements.lock.txt new file mode 100644 index 0000000..f6acdf5 --- /dev/null +++ b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/env/python/requirements.lock.txt @@ -0,0 +1,147 @@ +aiohttp==3.9.5 +aiosignal==1.3.1 +annotated-types==0.7.0 +anyio==4.4.0 +appdirs==1.4.4 +asgiref==3.8.1 +async-timeout==4.0.3 +attrs==23.2.0 +bentoml==1.2.19 +build==1.2.1 +cattrs==23.1.2 +certifi==2024.7.4 +charset-normalizer==3.3.2 +circus==0.18.0 +click==8.1.7 +click-option-group==0.5.6 +cloudpickle==3.0.0 +cmake==3.30.0 +deepmerge==1.1.1 +deprecated==1.2.14 +diskcache==5.6.3 +distro==1.9.0 +dnspython==2.6.1 +email-validator==2.2.0 +exceptiongroup==1.2.1 +fastapi==0.111.0 +fastapi-cli==0.0.4 +filelock==3.15.4 +frozenlist==1.4.1 +fs==2.4.16 +fsspec==2024.6.1 +h11==0.14.0 +httpcore==1.0.5 +httptools==0.6.1 +httpx==0.27.0 +httpx-ws==0.6.0 +huggingface-hub==0.23.4 +idna==3.7 +importlib-metadata==6.11.0 +inflection==0.5.1 +interegular==0.3.3 +jinja2==3.1.4 +joblib==1.4.2 +jsonschema==4.23.0 +jsonschema-specifications==2023.12.1 +lark==1.1.9 +llvmlite==0.43.0 +lm-format-enforcer==0.10.1 +markdown-it-py==3.0.0 +markupsafe==2.1.5 +mdurl==0.1.2 +mpmath==1.3.0 +msgpack==1.0.8 +multidict==6.0.5 +nest-asyncio==1.6.0 +networkx==3.2.1 +ninja==1.11.1.1 +numba==0.60.0 +numpy==1.26.0 +nvidia-cublas-cu12==12.1.3.1 +nvidia-cuda-cupti-cu12==12.1.105 +nvidia-cuda-nvrtc-cu12==12.1.105 +nvidia-cuda-runtime-cu12==12.1.105 +nvidia-cudnn-cu12==8.9.2.26 +nvidia-cufft-cu12==11.0.2.54 +nvidia-curand-cu12==10.3.2.106 +nvidia-cusolver-cu12==11.4.5.107 +nvidia-cusparse-cu12==12.1.0.106 +nvidia-ml-py==11.525.150 +nvidia-nccl-cu12==2.20.5 +nvidia-nvjitlink-cu12==12.5.82 +nvidia-nvtx-cu12==12.1.105 +openai==1.35.13 +opentelemetry-api==1.20.0 +opentelemetry-instrumentation==0.41b0 +opentelemetry-instrumentation-aiohttp-client==0.41b0 +opentelemetry-instrumentation-asgi==0.41b0 +opentelemetry-sdk==1.20.0 +opentelemetry-semantic-conventions==0.41b0 +opentelemetry-util-http==0.41b0 +orjson==3.10.6 +outlines==0.0.34 +packaging==24.1 +pathspec==0.12.1 +pip-requirements-parser==32.0.1 +pip-tools==7.4.1 +prometheus-client==0.20.0 +prometheus-fastapi-instrumentator==7.0.0 +protobuf==5.27.2 +psutil==6.0.0 +py-cpuinfo==9.0.0 +pydantic==2.8.2 +pydantic-core==2.20.1 +pygments==2.18.0 +pyparsing==3.1.2 +pyproject-hooks==1.1.0 +python-dateutil==2.9.0.post0 +python-dotenv==1.0.1 +python-json-logger==2.0.7 +python-multipart==0.0.9 +pyyaml==6.0.1 +pyzmq==26.0.3 +ray==2.32.0 +referencing==0.35.1 +regex==2024.5.15 +requests==2.32.3 +rich==13.7.1 +rpds-py==0.19.0 +safetensors==0.4.3 +schema==0.7.7 +scipy==1.13.1 +sentencepiece==0.2.0 +shellingham==1.5.4 +simple-di==0.1.5 +six==1.16.0 +sniffio==1.3.1 +starlette==0.37.2 +sympy==1.13.0 +tiktoken==0.7.0 +tokenizers==0.19.1 +tomli==2.0.1 +tomli-w==1.0.0 +torch==2.3.0 +tornado==6.4.1 +tqdm==4.66.4 +transformers==4.41.0 +triton==2.3.0 +typer==0.12.3 +typing-extensions==4.12.2 +ujson==5.10.0 +urllib3==2.2.2 +uvicorn[standard]==0.30.1 +uvloop==0.19.0 +vllm==0.4.3 +vllm-flash-attn==2.5.8.post2 +watchfiles==0.22.0 +websockets==12.0 +wheel==0.43.0 +wrapt==1.16.0 +wsproto==1.2.0 +xformers==0.0.26.post1 +yarl==1.9.4 +zipp==3.19.2 + +# The following packages are considered to be unsafe in a requirements file: +pip==24.1.2 +setuptools==70.3.0 diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/env/python/requirements.txt b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/env/python/requirements.txt similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/env/python/requirements.txt rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/env/python/requirements.txt diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/env/python/version.txt b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/env/python/version.txt similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/env/python/version.txt rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/env/python/version.txt diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/bento_constants.py b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/bento_constants.py similarity index 83% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/bento_constants.py rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/bento_constants.py index 788a01a..de96562 100644 --- a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/bento_constants.py +++ b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/bento_constants.py @@ -5,8 +5,8 @@ model: casperhansen/llama-3-70b-instruct-awq quantization: awq extra_labels: + model_name: casperhansen/llama-3-70b-instruct-awq openllm_alias: 70b-4bit,70b-instruct-4bit - openllm_hf_model_id: casperhansen/llama-3-70b-instruct-awq project: vllm-chat service_config: name: llama3 diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/bentofile.yaml b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/bentofile.yaml similarity index 91% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/bentofile.yaml rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/bentofile.yaml index a8b9021..2c8838b 100644 --- a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/bentofile.yaml +++ b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/bentofile.yaml @@ -28,9 +28,8 @@ include: - chat_templates/chat_templates/*.jinja - chat_templates/generation_configs/*.json labels: + model_name: casperhansen/llama-3-70b-instruct-awq openllm_alias: 70b-4bit,70b-instruct-4bit - openllm_hf_model_id: casperhansen/llama-3-70b-instruct-awq - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/chat_templates/alpaca.jinja b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/chat_templates/alpaca.jinja similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/chat_templates/alpaca.jinja rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/chat_templates/alpaca.jinja diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/chat_templates/amberchat.jinja b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/chat_templates/amberchat.jinja similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/chat_templates/amberchat.jinja rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/chat_templates/amberchat.jinja diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/chat_templates/chatml.jinja b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/chat_templates/chatml.jinja similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/chat_templates/chatml.jinja rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/chat_templates/chatml.jinja diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/chat_templates/chatqa.jinja b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/chat_templates/chatqa.jinja similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/chat_templates/chatqa.jinja rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/chat_templates/chatqa.jinja diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/chat_templates/falcon-instruct.jinja b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/chat_templates/falcon-instruct.jinja similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/chat_templates/falcon-instruct.jinja rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/chat_templates/falcon-instruct.jinja diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/chat_templates/gemma-it.jinja b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/chat_templates/gemma-it.jinja similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/chat_templates/gemma-it.jinja rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/chat_templates/gemma-it.jinja diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/chat_templates/llama-2-chat.jinja b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/chat_templates/llama-2-chat.jinja similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/chat_templates/llama-2-chat.jinja rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/chat_templates/llama-2-chat.jinja diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/chat_templates/llama-3-chat.jinja b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/chat_templates/llama-3-chat.jinja similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/chat_templates/llama-3-chat.jinja rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/chat_templates/llama-3-chat.jinja diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/chat_templates/mistral-instruct.jinja b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/chat_templates/mistral-instruct.jinja similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/chat_templates/mistral-instruct.jinja rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/chat_templates/mistral-instruct.jinja diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/chat_templates/openchat.jinja b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/chat_templates/openchat.jinja similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/chat_templates/openchat.jinja rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/chat_templates/openchat.jinja diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/chat_templates/phi-3.jinja b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/chat_templates/phi-3.jinja similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/chat_templates/phi-3.jinja rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/chat_templates/phi-3.jinja diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/chat_templates/saiga.jinja b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/chat_templates/saiga.jinja similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/chat_templates/saiga.jinja rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/chat_templates/saiga.jinja diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/chat_templates/solar-instruct.jinja b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/chat_templates/solar-instruct.jinja similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/chat_templates/solar-instruct.jinja rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/chat_templates/solar-instruct.jinja diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/chat_templates/vicuna.jinja b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/chat_templates/vicuna.jinja similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/chat_templates/vicuna.jinja rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/chat_templates/vicuna.jinja diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/chat_templates/zephyr.jinja b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/chat_templates/zephyr.jinja similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/chat_templates/zephyr.jinja rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/chat_templates/zephyr.jinja diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/generation_configs/alpaca.json b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/generation_configs/alpaca.json similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/generation_configs/alpaca.json rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/generation_configs/alpaca.json diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/generation_configs/amberchat.json b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/generation_configs/amberchat.json similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/generation_configs/amberchat.json rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/generation_configs/amberchat.json diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/generation_configs/chatqa.json b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/generation_configs/chatqa.json similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/generation_configs/chatqa.json rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/generation_configs/chatqa.json diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/generation_configs/gemma-it.json b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/generation_configs/gemma-it.json similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/generation_configs/gemma-it.json rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/generation_configs/gemma-it.json diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/generation_configs/llama-2-chat.json b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/generation_configs/llama-2-chat.json similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/generation_configs/llama-2-chat.json rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/generation_configs/llama-2-chat.json diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/generation_configs/llama-3-chat.json b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/generation_configs/llama-3-chat.json similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/generation_configs/llama-3-chat.json rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/generation_configs/llama-3-chat.json diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/generation_configs/mistral-instruct.json b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/generation_configs/mistral-instruct.json similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/generation_configs/mistral-instruct.json rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/generation_configs/mistral-instruct.json diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/generation_configs/openchat.json b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/generation_configs/openchat.json similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/generation_configs/openchat.json rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/generation_configs/openchat.json diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/generation_configs/orca-2.json b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/generation_configs/orca-2.json similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/generation_configs/orca-2.json rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/generation_configs/orca-2.json diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/generation_configs/phi-3.json b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/generation_configs/phi-3.json similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/generation_configs/phi-3.json rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/generation_configs/phi-3.json diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/generation_configs/qwen2-chat.json b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/generation_configs/qwen2-chat.json similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/generation_configs/qwen2-chat.json rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/generation_configs/qwen2-chat.json diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/generation_configs/saiga.json b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/generation_configs/saiga.json similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/generation_configs/saiga.json rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/generation_configs/saiga.json diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/generation_configs/solar-instruct.json b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/generation_configs/solar-instruct.json similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/generation_configs/solar-instruct.json rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/generation_configs/solar-instruct.json diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/generation_configs/vicuna.json b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/generation_configs/vicuna.json similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/generation_configs/vicuna.json rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/generation_configs/vicuna.json diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/generation_configs/yi-chat.json b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/generation_configs/yi-chat.json similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/generation_configs/yi-chat.json rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/generation_configs/yi-chat.json diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/generation_configs/zephyr.json b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/generation_configs/zephyr.json similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/chat_templates/generation_configs/zephyr.json rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/chat_templates/generation_configs/zephyr.json diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/service.py b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/service.py similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/service.py rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/service.py diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/404.html b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/404.html similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/404.html rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/404.html diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/700-532b1fe2415e5859.js b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/700-532b1fe2415e5859.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/700-532b1fe2415e5859.js rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/700-532b1fe2415e5859.js diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/995-34374f39bb210839.js b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/995-34374f39bb210839.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/995-34374f39bb210839.js rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/995-34374f39bb210839.js diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/css/429544bd3cd8ce3a.css b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/css/429544bd3cd8ce3a.css similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/css/429544bd3cd8ce3a.css rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/css/429544bd3cd8ce3a.css diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/css/5b67f082b31cfc7b.css b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/css/5b67f082b31cfc7b.css similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/css/5b67f082b31cfc7b.css rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/css/5b67f082b31cfc7b.css diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/css/9e63023b20ddb15e.css b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/css/9e63023b20ddb15e.css similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/_next/static/css/9e63023b20ddb15e.css rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/_next/static/css/9e63023b20ddb15e.css diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/apple-touch-icon.png b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/apple-touch-icon.png similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/apple-touch-icon.png rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/apple-touch-icon.png diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/chat.html b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/chat.html similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/chat.html rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/chat.html diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/chat.txt b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/chat.txt similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/chat.txt rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/chat.txt diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/favicon-16x16.png b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/favicon-16x16.png similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/favicon-16x16.png rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/favicon-16x16.png diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/favicon.ico b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/favicon.ico similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/favicon.ico rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/favicon.ico diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/index.html b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/index.html similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/index.html rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/index.html diff --git a/bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/index.txt b/bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/index.txt similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-awq-4bit-a5d5/src/ui/index.txt rename to bentoml/bentos/llama3/70b-instruct-awq-4bit-e968/src/ui/index.txt diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-6aed/README.md b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/README.md new file mode 100644 index 0000000..db08203 --- /dev/null +++ b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/README.md @@ -0,0 +1,16 @@ +# llama3:70b-instruct-fp16-6aed + +[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) +[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) +[![join_slack](https://badgen.net/badge/Join/BentoML%20Slack/cyan?icon=slack)](https://l.bentoml.com/join-slack-swagger) +[![BentoML GitHub Repo](https://img.shields.io/github/stars/bentoml/bentoml?style=social)](https://github.com/bentoml/BentoML) +[![Twitter Follow](https://img.shields.io/twitter/follow/bentomlai?label=Follow%20BentoML&style=social)](https://twitter.com/bentomlai) + +This is a Machine Learning Service created with BentoML. + +## Help + +* [📖 Documentation](https://docs.bentoml.com/en/latest/): Learn how to use BentoML. +* [💬 Community](https://l.bentoml.com/join-slack-swagger): Join the BentoML Slack community. +* [🐛 GitHub Issues](https://github.com/bentoml/BentoML/issues): Report bugs and feature requests. +* Tip: you can also [customize this README](https://docs.bentoml.com/en/latest/concepts/bento.html#description). diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/apis/openapi.yaml b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/apis/openapi.yaml similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/apis/openapi.yaml rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/apis/openapi.yaml diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/apis/schema.json b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/apis/schema.json similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/apis/schema.json rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/apis/schema.json diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/bento.yaml b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/bento.yaml similarity index 94% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/bento.yaml rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/bento.yaml index e6e8e81..b6db24a 100644 --- a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/bento.yaml +++ b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/bento.yaml @@ -1,12 +1,11 @@ service: service:VLLM name: llama3 -version: 70b-instruct-fp16-d0d4 +version: 70b-instruct-fp16-6aed bentoml_version: 1.2.19 -creation_time: '2024-07-08T07:56:30.483132+00:00' +creation_time: '2024-07-12T13:39:08.321781+00:00' labels: + model_name: meta-llama/Meta-Llama-3-70B-Instruct openllm_alias: 70b,70b-instruct - openllm_hf_model_id: meta-llama/Meta-Llama-3-70B-Instruct - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/env/docker/Dockerfile b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/env/docker/Dockerfile similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/env/docker/Dockerfile rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/env/docker/Dockerfile diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/env/docker/entrypoint.sh b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/env/docker/entrypoint.sh similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/env/docker/entrypoint.sh rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/env/docker/entrypoint.sh diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/env/python/install.sh b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/env/python/install.sh similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/env/python/install.sh rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/env/python/install.sh diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-6aed/env/python/requirements.lock.txt b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/env/python/requirements.lock.txt new file mode 100644 index 0000000..f6acdf5 --- /dev/null +++ b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/env/python/requirements.lock.txt @@ -0,0 +1,147 @@ +aiohttp==3.9.5 +aiosignal==1.3.1 +annotated-types==0.7.0 +anyio==4.4.0 +appdirs==1.4.4 +asgiref==3.8.1 +async-timeout==4.0.3 +attrs==23.2.0 +bentoml==1.2.19 +build==1.2.1 +cattrs==23.1.2 +certifi==2024.7.4 +charset-normalizer==3.3.2 +circus==0.18.0 +click==8.1.7 +click-option-group==0.5.6 +cloudpickle==3.0.0 +cmake==3.30.0 +deepmerge==1.1.1 +deprecated==1.2.14 +diskcache==5.6.3 +distro==1.9.0 +dnspython==2.6.1 +email-validator==2.2.0 +exceptiongroup==1.2.1 +fastapi==0.111.0 +fastapi-cli==0.0.4 +filelock==3.15.4 +frozenlist==1.4.1 +fs==2.4.16 +fsspec==2024.6.1 +h11==0.14.0 +httpcore==1.0.5 +httptools==0.6.1 +httpx==0.27.0 +httpx-ws==0.6.0 +huggingface-hub==0.23.4 +idna==3.7 +importlib-metadata==6.11.0 +inflection==0.5.1 +interegular==0.3.3 +jinja2==3.1.4 +joblib==1.4.2 +jsonschema==4.23.0 +jsonschema-specifications==2023.12.1 +lark==1.1.9 +llvmlite==0.43.0 +lm-format-enforcer==0.10.1 +markdown-it-py==3.0.0 +markupsafe==2.1.5 +mdurl==0.1.2 +mpmath==1.3.0 +msgpack==1.0.8 +multidict==6.0.5 +nest-asyncio==1.6.0 +networkx==3.2.1 +ninja==1.11.1.1 +numba==0.60.0 +numpy==1.26.0 +nvidia-cublas-cu12==12.1.3.1 +nvidia-cuda-cupti-cu12==12.1.105 +nvidia-cuda-nvrtc-cu12==12.1.105 +nvidia-cuda-runtime-cu12==12.1.105 +nvidia-cudnn-cu12==8.9.2.26 +nvidia-cufft-cu12==11.0.2.54 +nvidia-curand-cu12==10.3.2.106 +nvidia-cusolver-cu12==11.4.5.107 +nvidia-cusparse-cu12==12.1.0.106 +nvidia-ml-py==11.525.150 +nvidia-nccl-cu12==2.20.5 +nvidia-nvjitlink-cu12==12.5.82 +nvidia-nvtx-cu12==12.1.105 +openai==1.35.13 +opentelemetry-api==1.20.0 +opentelemetry-instrumentation==0.41b0 +opentelemetry-instrumentation-aiohttp-client==0.41b0 +opentelemetry-instrumentation-asgi==0.41b0 +opentelemetry-sdk==1.20.0 +opentelemetry-semantic-conventions==0.41b0 +opentelemetry-util-http==0.41b0 +orjson==3.10.6 +outlines==0.0.34 +packaging==24.1 +pathspec==0.12.1 +pip-requirements-parser==32.0.1 +pip-tools==7.4.1 +prometheus-client==0.20.0 +prometheus-fastapi-instrumentator==7.0.0 +protobuf==5.27.2 +psutil==6.0.0 +py-cpuinfo==9.0.0 +pydantic==2.8.2 +pydantic-core==2.20.1 +pygments==2.18.0 +pyparsing==3.1.2 +pyproject-hooks==1.1.0 +python-dateutil==2.9.0.post0 +python-dotenv==1.0.1 +python-json-logger==2.0.7 +python-multipart==0.0.9 +pyyaml==6.0.1 +pyzmq==26.0.3 +ray==2.32.0 +referencing==0.35.1 +regex==2024.5.15 +requests==2.32.3 +rich==13.7.1 +rpds-py==0.19.0 +safetensors==0.4.3 +schema==0.7.7 +scipy==1.13.1 +sentencepiece==0.2.0 +shellingham==1.5.4 +simple-di==0.1.5 +six==1.16.0 +sniffio==1.3.1 +starlette==0.37.2 +sympy==1.13.0 +tiktoken==0.7.0 +tokenizers==0.19.1 +tomli==2.0.1 +tomli-w==1.0.0 +torch==2.3.0 +tornado==6.4.1 +tqdm==4.66.4 +transformers==4.41.0 +triton==2.3.0 +typer==0.12.3 +typing-extensions==4.12.2 +ujson==5.10.0 +urllib3==2.2.2 +uvicorn[standard]==0.30.1 +uvloop==0.19.0 +vllm==0.4.3 +vllm-flash-attn==2.5.8.post2 +watchfiles==0.22.0 +websockets==12.0 +wheel==0.43.0 +wrapt==1.16.0 +wsproto==1.2.0 +xformers==0.0.26.post1 +yarl==1.9.4 +zipp==3.19.2 + +# The following packages are considered to be unsafe in a requirements file: +pip==24.1.2 +setuptools==70.3.0 diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/env/python/requirements.txt b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/env/python/requirements.txt similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/env/python/requirements.txt rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/env/python/requirements.txt diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/env/python/version.txt b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/env/python/version.txt similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/env/python/version.txt rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/env/python/version.txt diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/bento_constants.py b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/bento_constants.py similarity index 82% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/bento_constants.py rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/bento_constants.py index ccdf575..f536876 100644 --- a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/bento_constants.py +++ b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/bento_constants.py @@ -4,8 +4,8 @@ max_model_len: 2048 model: meta-llama/Meta-Llama-3-70B-Instruct extra_labels: + model_name: meta-llama/Meta-Llama-3-70B-Instruct openllm_alias: 70b,70b-instruct - openllm_hf_model_id: meta-llama/Meta-Llama-3-70B-Instruct project: vllm-chat service_config: name: llama3 diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/bentofile.yaml b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/bentofile.yaml similarity index 91% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/bentofile.yaml rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/bentofile.yaml index a1f038a..6bc3ab5 100644 --- a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/bentofile.yaml +++ b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/bentofile.yaml @@ -28,9 +28,8 @@ include: - chat_templates/chat_templates/*.jinja - chat_templates/generation_configs/*.json labels: + model_name: meta-llama/Meta-Llama-3-70B-Instruct openllm_alias: 70b,70b-instruct - openllm_hf_model_id: meta-llama/Meta-Llama-3-70B-Instruct - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/chat_templates/alpaca.jinja b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/chat_templates/alpaca.jinja similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/chat_templates/alpaca.jinja rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/chat_templates/alpaca.jinja diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/chat_templates/amberchat.jinja b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/chat_templates/amberchat.jinja similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/chat_templates/amberchat.jinja rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/chat_templates/amberchat.jinja diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/chat_templates/chatml.jinja b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/chat_templates/chatml.jinja similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/chat_templates/chatml.jinja rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/chat_templates/chatml.jinja diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/chat_templates/chatqa.jinja b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/chat_templates/chatqa.jinja similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/chat_templates/chatqa.jinja rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/chat_templates/chatqa.jinja diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/chat_templates/falcon-instruct.jinja b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/chat_templates/falcon-instruct.jinja similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/chat_templates/falcon-instruct.jinja rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/chat_templates/falcon-instruct.jinja diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/chat_templates/gemma-it.jinja b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/chat_templates/gemma-it.jinja similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/chat_templates/gemma-it.jinja rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/chat_templates/gemma-it.jinja diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/chat_templates/llama-2-chat.jinja b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/chat_templates/llama-2-chat.jinja similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/chat_templates/llama-2-chat.jinja rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/chat_templates/llama-2-chat.jinja diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/chat_templates/llama-3-chat.jinja b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/chat_templates/llama-3-chat.jinja similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/chat_templates/llama-3-chat.jinja rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/chat_templates/llama-3-chat.jinja diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/chat_templates/mistral-instruct.jinja b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/chat_templates/mistral-instruct.jinja similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/chat_templates/mistral-instruct.jinja rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/chat_templates/mistral-instruct.jinja diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/chat_templates/openchat.jinja b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/chat_templates/openchat.jinja similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/chat_templates/openchat.jinja rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/chat_templates/openchat.jinja diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/chat_templates/phi-3.jinja b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/chat_templates/phi-3.jinja similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/chat_templates/phi-3.jinja rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/chat_templates/phi-3.jinja diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/chat_templates/saiga.jinja b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/chat_templates/saiga.jinja similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/chat_templates/saiga.jinja rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/chat_templates/saiga.jinja diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/chat_templates/solar-instruct.jinja b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/chat_templates/solar-instruct.jinja similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/chat_templates/solar-instruct.jinja rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/chat_templates/solar-instruct.jinja diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/chat_templates/vicuna.jinja b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/chat_templates/vicuna.jinja similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/chat_templates/vicuna.jinja rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/chat_templates/vicuna.jinja diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/chat_templates/zephyr.jinja b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/chat_templates/zephyr.jinja similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/chat_templates/zephyr.jinja rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/chat_templates/zephyr.jinja diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/generation_configs/alpaca.json b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/generation_configs/alpaca.json similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/generation_configs/alpaca.json rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/generation_configs/alpaca.json diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/generation_configs/amberchat.json b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/generation_configs/amberchat.json similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/generation_configs/amberchat.json rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/generation_configs/amberchat.json diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/generation_configs/chatqa.json b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/generation_configs/chatqa.json similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/generation_configs/chatqa.json rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/generation_configs/chatqa.json diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/generation_configs/gemma-it.json b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/generation_configs/gemma-it.json similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/generation_configs/gemma-it.json rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/generation_configs/gemma-it.json diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/generation_configs/llama-2-chat.json b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/generation_configs/llama-2-chat.json similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/generation_configs/llama-2-chat.json rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/generation_configs/llama-2-chat.json diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/generation_configs/llama-3-chat.json b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/generation_configs/llama-3-chat.json similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/generation_configs/llama-3-chat.json rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/generation_configs/llama-3-chat.json diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/generation_configs/mistral-instruct.json b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/generation_configs/mistral-instruct.json similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/generation_configs/mistral-instruct.json rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/generation_configs/mistral-instruct.json diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/generation_configs/openchat.json b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/generation_configs/openchat.json similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/generation_configs/openchat.json rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/generation_configs/openchat.json diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/generation_configs/orca-2.json b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/generation_configs/orca-2.json similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/generation_configs/orca-2.json rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/generation_configs/orca-2.json diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/generation_configs/phi-3.json b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/generation_configs/phi-3.json similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/generation_configs/phi-3.json rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/generation_configs/phi-3.json diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/generation_configs/qwen2-chat.json b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/generation_configs/qwen2-chat.json similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/generation_configs/qwen2-chat.json rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/generation_configs/qwen2-chat.json diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/generation_configs/saiga.json b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/generation_configs/saiga.json similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/generation_configs/saiga.json rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/generation_configs/saiga.json diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/generation_configs/solar-instruct.json b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/generation_configs/solar-instruct.json similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/generation_configs/solar-instruct.json rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/generation_configs/solar-instruct.json diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/generation_configs/vicuna.json b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/generation_configs/vicuna.json similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/generation_configs/vicuna.json rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/generation_configs/vicuna.json diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/generation_configs/yi-chat.json b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/generation_configs/yi-chat.json similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/generation_configs/yi-chat.json rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/generation_configs/yi-chat.json diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/generation_configs/zephyr.json b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/generation_configs/zephyr.json similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/chat_templates/generation_configs/zephyr.json rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/chat_templates/generation_configs/zephyr.json diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/service.py b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/service.py similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/service.py rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/service.py diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/404.html b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/404.html similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/404.html rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/404.html diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/700-532b1fe2415e5859.js b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/700-532b1fe2415e5859.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/700-532b1fe2415e5859.js rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/700-532b1fe2415e5859.js diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/995-34374f39bb210839.js b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/995-34374f39bb210839.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/995-34374f39bb210839.js rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/995-34374f39bb210839.js diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/css/429544bd3cd8ce3a.css b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/css/429544bd3cd8ce3a.css similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/css/429544bd3cd8ce3a.css rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/css/429544bd3cd8ce3a.css diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/css/5b67f082b31cfc7b.css b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/css/5b67f082b31cfc7b.css similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/css/5b67f082b31cfc7b.css rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/css/5b67f082b31cfc7b.css diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/css/9e63023b20ddb15e.css b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/css/9e63023b20ddb15e.css similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/_next/static/css/9e63023b20ddb15e.css rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/_next/static/css/9e63023b20ddb15e.css diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/apple-touch-icon.png b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/apple-touch-icon.png similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/apple-touch-icon.png rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/apple-touch-icon.png diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/chat.html b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/chat.html similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/chat.html rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/chat.html diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/chat.txt b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/chat.txt similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/chat.txt rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/chat.txt diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/favicon-16x16.png b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/favicon-16x16.png similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/favicon-16x16.png rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/favicon-16x16.png diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/favicon.ico b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/favicon.ico similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/favicon.ico rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/favicon.ico diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/index.html b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/index.html similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/index.html rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/index.html diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/index.txt b/bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/index.txt similarity index 100% rename from bentoml/bentos/llama3/70b-instruct-fp16-d0d4/src/ui/index.txt rename to bentoml/bentos/llama3/70b-instruct-fp16-6aed/src/ui/index.txt diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/README.md b/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/README.md deleted file mode 100644 index 91bc230..0000000 --- a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/README.md +++ /dev/null @@ -1,16 +0,0 @@ -# llama3:70b-instruct-fp16-d0d4 - -[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) -[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) -[![join_slack](https://badgen.net/badge/Join/BentoML%20Slack/cyan?icon=slack)](https://l.bentoml.com/join-slack-swagger) -[![BentoML GitHub Repo](https://img.shields.io/github/stars/bentoml/bentoml?style=social)](https://github.com/bentoml/BentoML) -[![Twitter Follow](https://img.shields.io/twitter/follow/bentomlai?label=Follow%20BentoML&style=social)](https://twitter.com/bentomlai) - -This is a Machine Learning Service created with BentoML. - -## Help - -* [📖 Documentation](https://docs.bentoml.com/en/latest/): Learn how to use BentoML. -* [💬 Community](https://l.bentoml.com/join-slack-swagger): Join the BentoML Slack community. -* [🐛 GitHub Issues](https://github.com/bentoml/BentoML/issues): Report bugs and feature requests. -* Tip: you can also [customize this README](https://docs.bentoml.com/en/latest/concepts/bento.html#description). diff --git a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/env/python/requirements.lock.txt b/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/env/python/requirements.lock.txt deleted file mode 100644 index 925ce19..0000000 --- a/bentoml/bentos/llama3/70b-instruct-fp16-d0d4/env/python/requirements.lock.txt +++ /dev/null @@ -1,147 +0,0 @@ -aiohttp==3.9.5 -aiosignal==1.3.1 -annotated-types==0.7.0 -anyio==4.4.0 -appdirs==1.4.4 -asgiref==3.8.1 -async-timeout==4.0.3 -attrs==23.2.0 -bentoml==1.2.19 -build==1.2.1 -cattrs==23.1.2 -certifi==2024.7.4 -charset-normalizer==3.3.2 -circus==0.18.0 -click==8.1.7 -click-option-group==0.5.6 -cloudpickle==3.0.0 -cmake==3.30.0 -deepmerge==1.1.1 -deprecated==1.2.14 -diskcache==5.6.3 -distro==1.9.0 -dnspython==2.6.1 -email-validator==2.2.0 -exceptiongroup==1.2.1 -fastapi==0.111.0 -fastapi-cli==0.0.4 -filelock==3.15.4 -frozenlist==1.4.1 -fs==2.4.16 -fsspec==2024.6.1 -h11==0.14.0 -httpcore==1.0.5 -httptools==0.6.1 -httpx==0.27.0 -httpx-ws==0.6.0 -huggingface-hub==0.23.4 -idna==3.7 -importlib-metadata==6.11.0 -inflection==0.5.1 -interegular==0.3.3 -jinja2==3.1.4 -joblib==1.4.2 -jsonschema==4.22.0 -jsonschema-specifications==2023.12.1 -lark==1.1.9 -llvmlite==0.43.0 -lm-format-enforcer==0.10.1 -markdown-it-py==3.0.0 -markupsafe==2.1.5 -mdurl==0.1.2 -mpmath==1.3.0 -msgpack==1.0.8 -multidict==6.0.5 -nest-asyncio==1.6.0 -networkx==3.2.1 -ninja==1.11.1.1 -numba==0.60.0 -numpy==1.26.0 -nvidia-cublas-cu12==12.1.3.1 -nvidia-cuda-cupti-cu12==12.1.105 -nvidia-cuda-nvrtc-cu12==12.1.105 -nvidia-cuda-runtime-cu12==12.1.105 -nvidia-cudnn-cu12==8.9.2.26 -nvidia-cufft-cu12==11.0.2.54 -nvidia-curand-cu12==10.3.2.106 -nvidia-cusolver-cu12==11.4.5.107 -nvidia-cusparse-cu12==12.1.0.106 -nvidia-ml-py==11.525.150 -nvidia-nccl-cu12==2.20.5 -nvidia-nvjitlink-cu12==12.5.82 -nvidia-nvtx-cu12==12.1.105 -openai==1.35.10 -opentelemetry-api==1.20.0 -opentelemetry-instrumentation==0.41b0 -opentelemetry-instrumentation-aiohttp-client==0.41b0 -opentelemetry-instrumentation-asgi==0.41b0 -opentelemetry-sdk==1.20.0 -opentelemetry-semantic-conventions==0.41b0 -opentelemetry-util-http==0.41b0 -orjson==3.10.6 -outlines==0.0.34 -packaging==24.1 -pathspec==0.12.1 -pip-requirements-parser==32.0.1 -pip-tools==7.4.1 -prometheus-client==0.20.0 -prometheus-fastapi-instrumentator==7.0.0 -protobuf==5.27.2 -psutil==6.0.0 -py-cpuinfo==9.0.0 -pydantic==2.8.2 -pydantic-core==2.20.1 -pygments==2.18.0 -pyparsing==3.1.2 -pyproject-hooks==1.1.0 -python-dateutil==2.9.0.post0 -python-dotenv==1.0.1 -python-json-logger==2.0.7 -python-multipart==0.0.9 -pyyaml==6.0.1 -pyzmq==26.0.3 -ray==2.31.0 -referencing==0.35.1 -regex==2024.5.15 -requests==2.32.3 -rich==13.7.1 -rpds-py==0.18.1 -safetensors==0.4.3 -schema==0.7.7 -scipy==1.13.1 -sentencepiece==0.2.0 -shellingham==1.5.4 -simple-di==0.1.5 -six==1.16.0 -sniffio==1.3.1 -starlette==0.37.2 -sympy==1.12.1 -tiktoken==0.7.0 -tokenizers==0.19.1 -tomli==2.0.1 -tomli-w==1.0.0 -torch==2.3.0 -tornado==6.4.1 -tqdm==4.66.4 -transformers==4.41.0 -triton==2.3.0 -typer==0.12.3 -typing-extensions==4.12.2 -ujson==5.10.0 -urllib3==2.2.2 -uvicorn[standard]==0.30.1 -uvloop==0.19.0 -vllm==0.4.3 -vllm-flash-attn==2.5.8.post2 -watchfiles==0.22.0 -websockets==12.0 -wheel==0.43.0 -wrapt==1.16.0 -wsproto==1.2.0 -xformers==0.0.26.post1 -yarl==1.9.4 -zipp==3.19.2 - -# The following packages are considered to be unsafe in a requirements file: -pip==24.1.2 -setuptools==70.2.0 diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/README.md b/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/README.md deleted file mode 100644 index 33d89ae..0000000 --- a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/README.md +++ /dev/null @@ -1,16 +0,0 @@ -# llama3:8b-instruct-awq-4bit-e780 - -[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) -[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) -[![join_slack](https://badgen.net/badge/Join/BentoML%20Slack/cyan?icon=slack)](https://l.bentoml.com/join-slack-swagger) -[![BentoML GitHub Repo](https://img.shields.io/github/stars/bentoml/bentoml?style=social)](https://github.com/bentoml/BentoML) -[![Twitter Follow](https://img.shields.io/twitter/follow/bentomlai?label=Follow%20BentoML&style=social)](https://twitter.com/bentomlai) - -This is a Machine Learning Service created with BentoML. - -## Help - -* [📖 Documentation](https://docs.bentoml.com/en/latest/): Learn how to use BentoML. -* [💬 Community](https://l.bentoml.com/join-slack-swagger): Join the BentoML Slack community. -* [🐛 GitHub Issues](https://github.com/bentoml/BentoML/issues): Report bugs and feature requests. -* Tip: you can also [customize this README](https://docs.bentoml.com/en/latest/concepts/bento.html#description). diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/env/python/requirements.lock.txt b/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/env/python/requirements.lock.txt deleted file mode 100644 index 925ce19..0000000 --- a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/env/python/requirements.lock.txt +++ /dev/null @@ -1,147 +0,0 @@ -aiohttp==3.9.5 -aiosignal==1.3.1 -annotated-types==0.7.0 -anyio==4.4.0 -appdirs==1.4.4 -asgiref==3.8.1 -async-timeout==4.0.3 -attrs==23.2.0 -bentoml==1.2.19 -build==1.2.1 -cattrs==23.1.2 -certifi==2024.7.4 -charset-normalizer==3.3.2 -circus==0.18.0 -click==8.1.7 -click-option-group==0.5.6 -cloudpickle==3.0.0 -cmake==3.30.0 -deepmerge==1.1.1 -deprecated==1.2.14 -diskcache==5.6.3 -distro==1.9.0 -dnspython==2.6.1 -email-validator==2.2.0 -exceptiongroup==1.2.1 -fastapi==0.111.0 -fastapi-cli==0.0.4 -filelock==3.15.4 -frozenlist==1.4.1 -fs==2.4.16 -fsspec==2024.6.1 -h11==0.14.0 -httpcore==1.0.5 -httptools==0.6.1 -httpx==0.27.0 -httpx-ws==0.6.0 -huggingface-hub==0.23.4 -idna==3.7 -importlib-metadata==6.11.0 -inflection==0.5.1 -interegular==0.3.3 -jinja2==3.1.4 -joblib==1.4.2 -jsonschema==4.22.0 -jsonschema-specifications==2023.12.1 -lark==1.1.9 -llvmlite==0.43.0 -lm-format-enforcer==0.10.1 -markdown-it-py==3.0.0 -markupsafe==2.1.5 -mdurl==0.1.2 -mpmath==1.3.0 -msgpack==1.0.8 -multidict==6.0.5 -nest-asyncio==1.6.0 -networkx==3.2.1 -ninja==1.11.1.1 -numba==0.60.0 -numpy==1.26.0 -nvidia-cublas-cu12==12.1.3.1 -nvidia-cuda-cupti-cu12==12.1.105 -nvidia-cuda-nvrtc-cu12==12.1.105 -nvidia-cuda-runtime-cu12==12.1.105 -nvidia-cudnn-cu12==8.9.2.26 -nvidia-cufft-cu12==11.0.2.54 -nvidia-curand-cu12==10.3.2.106 -nvidia-cusolver-cu12==11.4.5.107 -nvidia-cusparse-cu12==12.1.0.106 -nvidia-ml-py==11.525.150 -nvidia-nccl-cu12==2.20.5 -nvidia-nvjitlink-cu12==12.5.82 -nvidia-nvtx-cu12==12.1.105 -openai==1.35.10 -opentelemetry-api==1.20.0 -opentelemetry-instrumentation==0.41b0 -opentelemetry-instrumentation-aiohttp-client==0.41b0 -opentelemetry-instrumentation-asgi==0.41b0 -opentelemetry-sdk==1.20.0 -opentelemetry-semantic-conventions==0.41b0 -opentelemetry-util-http==0.41b0 -orjson==3.10.6 -outlines==0.0.34 -packaging==24.1 -pathspec==0.12.1 -pip-requirements-parser==32.0.1 -pip-tools==7.4.1 -prometheus-client==0.20.0 -prometheus-fastapi-instrumentator==7.0.0 -protobuf==5.27.2 -psutil==6.0.0 -py-cpuinfo==9.0.0 -pydantic==2.8.2 -pydantic-core==2.20.1 -pygments==2.18.0 -pyparsing==3.1.2 -pyproject-hooks==1.1.0 -python-dateutil==2.9.0.post0 -python-dotenv==1.0.1 -python-json-logger==2.0.7 -python-multipart==0.0.9 -pyyaml==6.0.1 -pyzmq==26.0.3 -ray==2.31.0 -referencing==0.35.1 -regex==2024.5.15 -requests==2.32.3 -rich==13.7.1 -rpds-py==0.18.1 -safetensors==0.4.3 -schema==0.7.7 -scipy==1.13.1 -sentencepiece==0.2.0 -shellingham==1.5.4 -simple-di==0.1.5 -six==1.16.0 -sniffio==1.3.1 -starlette==0.37.2 -sympy==1.12.1 -tiktoken==0.7.0 -tokenizers==0.19.1 -tomli==2.0.1 -tomli-w==1.0.0 -torch==2.3.0 -tornado==6.4.1 -tqdm==4.66.4 -transformers==4.41.0 -triton==2.3.0 -typer==0.12.3 -typing-extensions==4.12.2 -ujson==5.10.0 -urllib3==2.2.2 -uvicorn[standard]==0.30.1 -uvloop==0.19.0 -vllm==0.4.3 -vllm-flash-attn==2.5.8.post2 -watchfiles==0.22.0 -websockets==12.0 -wheel==0.43.0 -wrapt==1.16.0 -wsproto==1.2.0 -xformers==0.0.26.post1 -yarl==1.9.4 -zipp==3.19.2 - -# The following packages are considered to be unsafe in a requirements file: -pip==24.1.2 -setuptools==70.2.0 diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/README.md b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/README.md new file mode 100644 index 0000000..883c1bd --- /dev/null +++ b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/README.md @@ -0,0 +1,16 @@ +# llama3:8b-instruct-awq-4bit-f9de + +[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) +[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) +[![join_slack](https://badgen.net/badge/Join/BentoML%20Slack/cyan?icon=slack)](https://l.bentoml.com/join-slack-swagger) +[![BentoML GitHub Repo](https://img.shields.io/github/stars/bentoml/bentoml?style=social)](https://github.com/bentoml/BentoML) +[![Twitter Follow](https://img.shields.io/twitter/follow/bentomlai?label=Follow%20BentoML&style=social)](https://twitter.com/bentomlai) + +This is a Machine Learning Service created with BentoML. + +## Help + +* [📖 Documentation](https://docs.bentoml.com/en/latest/): Learn how to use BentoML. +* [💬 Community](https://l.bentoml.com/join-slack-swagger): Join the BentoML Slack community. +* [🐛 GitHub Issues](https://github.com/bentoml/BentoML/issues): Report bugs and feature requests. +* Tip: you can also [customize this README](https://docs.bentoml.com/en/latest/concepts/bento.html#description). diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/apis/openapi.yaml b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/apis/openapi.yaml similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/apis/openapi.yaml rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/apis/openapi.yaml diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/apis/schema.json b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/apis/schema.json similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/apis/schema.json rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/apis/schema.json diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/bento.yaml b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/bento.yaml similarity index 94% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/bento.yaml rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/bento.yaml index bb8fdbf..3453e51 100644 --- a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/bento.yaml +++ b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/bento.yaml @@ -1,12 +1,11 @@ service: service:VLLM name: llama3 -version: 8b-instruct-awq-4bit-e780 +version: 8b-instruct-awq-4bit-f9de bentoml_version: 1.2.19 -creation_time: '2024-07-08T07:53:44.539551+00:00' +creation_time: '2024-07-12T13:36:07.192628+00:00' labels: + model_name: casperhansen/llama-3-8b-instruct-awq openllm_alias: 8b-4bit,8b-instruct-4bit - openllm_hf_model_id: casperhansen/llama-3-8b-instruct-awq - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/env/docker/Dockerfile b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/env/docker/Dockerfile similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/env/docker/Dockerfile rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/env/docker/Dockerfile diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/env/docker/entrypoint.sh b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/env/docker/entrypoint.sh similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/env/docker/entrypoint.sh rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/env/docker/entrypoint.sh diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/env/python/install.sh b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/env/python/install.sh similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/env/python/install.sh rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/env/python/install.sh diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/env/python/requirements.lock.txt b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/env/python/requirements.lock.txt new file mode 100644 index 0000000..f6acdf5 --- /dev/null +++ b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/env/python/requirements.lock.txt @@ -0,0 +1,147 @@ +aiohttp==3.9.5 +aiosignal==1.3.1 +annotated-types==0.7.0 +anyio==4.4.0 +appdirs==1.4.4 +asgiref==3.8.1 +async-timeout==4.0.3 +attrs==23.2.0 +bentoml==1.2.19 +build==1.2.1 +cattrs==23.1.2 +certifi==2024.7.4 +charset-normalizer==3.3.2 +circus==0.18.0 +click==8.1.7 +click-option-group==0.5.6 +cloudpickle==3.0.0 +cmake==3.30.0 +deepmerge==1.1.1 +deprecated==1.2.14 +diskcache==5.6.3 +distro==1.9.0 +dnspython==2.6.1 +email-validator==2.2.0 +exceptiongroup==1.2.1 +fastapi==0.111.0 +fastapi-cli==0.0.4 +filelock==3.15.4 +frozenlist==1.4.1 +fs==2.4.16 +fsspec==2024.6.1 +h11==0.14.0 +httpcore==1.0.5 +httptools==0.6.1 +httpx==0.27.0 +httpx-ws==0.6.0 +huggingface-hub==0.23.4 +idna==3.7 +importlib-metadata==6.11.0 +inflection==0.5.1 +interegular==0.3.3 +jinja2==3.1.4 +joblib==1.4.2 +jsonschema==4.23.0 +jsonschema-specifications==2023.12.1 +lark==1.1.9 +llvmlite==0.43.0 +lm-format-enforcer==0.10.1 +markdown-it-py==3.0.0 +markupsafe==2.1.5 +mdurl==0.1.2 +mpmath==1.3.0 +msgpack==1.0.8 +multidict==6.0.5 +nest-asyncio==1.6.0 +networkx==3.2.1 +ninja==1.11.1.1 +numba==0.60.0 +numpy==1.26.0 +nvidia-cublas-cu12==12.1.3.1 +nvidia-cuda-cupti-cu12==12.1.105 +nvidia-cuda-nvrtc-cu12==12.1.105 +nvidia-cuda-runtime-cu12==12.1.105 +nvidia-cudnn-cu12==8.9.2.26 +nvidia-cufft-cu12==11.0.2.54 +nvidia-curand-cu12==10.3.2.106 +nvidia-cusolver-cu12==11.4.5.107 +nvidia-cusparse-cu12==12.1.0.106 +nvidia-ml-py==11.525.150 +nvidia-nccl-cu12==2.20.5 +nvidia-nvjitlink-cu12==12.5.82 +nvidia-nvtx-cu12==12.1.105 +openai==1.35.13 +opentelemetry-api==1.20.0 +opentelemetry-instrumentation==0.41b0 +opentelemetry-instrumentation-aiohttp-client==0.41b0 +opentelemetry-instrumentation-asgi==0.41b0 +opentelemetry-sdk==1.20.0 +opentelemetry-semantic-conventions==0.41b0 +opentelemetry-util-http==0.41b0 +orjson==3.10.6 +outlines==0.0.34 +packaging==24.1 +pathspec==0.12.1 +pip-requirements-parser==32.0.1 +pip-tools==7.4.1 +prometheus-client==0.20.0 +prometheus-fastapi-instrumentator==7.0.0 +protobuf==5.27.2 +psutil==6.0.0 +py-cpuinfo==9.0.0 +pydantic==2.8.2 +pydantic-core==2.20.1 +pygments==2.18.0 +pyparsing==3.1.2 +pyproject-hooks==1.1.0 +python-dateutil==2.9.0.post0 +python-dotenv==1.0.1 +python-json-logger==2.0.7 +python-multipart==0.0.9 +pyyaml==6.0.1 +pyzmq==26.0.3 +ray==2.32.0 +referencing==0.35.1 +regex==2024.5.15 +requests==2.32.3 +rich==13.7.1 +rpds-py==0.19.0 +safetensors==0.4.3 +schema==0.7.7 +scipy==1.13.1 +sentencepiece==0.2.0 +shellingham==1.5.4 +simple-di==0.1.5 +six==1.16.0 +sniffio==1.3.1 +starlette==0.37.2 +sympy==1.13.0 +tiktoken==0.7.0 +tokenizers==0.19.1 +tomli==2.0.1 +tomli-w==1.0.0 +torch==2.3.0 +tornado==6.4.1 +tqdm==4.66.4 +transformers==4.41.0 +triton==2.3.0 +typer==0.12.3 +typing-extensions==4.12.2 +ujson==5.10.0 +urllib3==2.2.2 +uvicorn[standard]==0.30.1 +uvloop==0.19.0 +vllm==0.4.3 +vllm-flash-attn==2.5.8.post2 +watchfiles==0.22.0 +websockets==12.0 +wheel==0.43.0 +wrapt==1.16.0 +wsproto==1.2.0 +xformers==0.0.26.post1 +yarl==1.9.4 +zipp==3.19.2 + +# The following packages are considered to be unsafe in a requirements file: +pip==24.1.2 +setuptools==70.3.0 diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/env/python/requirements.txt b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/env/python/requirements.txt similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/env/python/requirements.txt rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/env/python/requirements.txt diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/env/python/version.txt b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/env/python/version.txt similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/env/python/version.txt rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/env/python/version.txt diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/bento_constants.py b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/bento_constants.py similarity index 84% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/bento_constants.py rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/bento_constants.py index aba1d7b..a34462d 100644 --- a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/bento_constants.py +++ b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/bento_constants.py @@ -5,8 +5,8 @@ model: casperhansen/llama-3-8b-instruct-awq quantization: awq extra_labels: + model_name: casperhansen/llama-3-8b-instruct-awq openllm_alias: 8b-4bit,8b-instruct-4bit - openllm_hf_model_id: casperhansen/llama-3-8b-instruct-awq project: vllm-chat service_config: name: llama3 diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/bentofile.yaml b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/bentofile.yaml similarity index 92% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/bentofile.yaml rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/bentofile.yaml index 7548a6c..b1968a8 100644 --- a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/bentofile.yaml +++ b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/bentofile.yaml @@ -28,9 +28,8 @@ include: - chat_templates/chat_templates/*.jinja - chat_templates/generation_configs/*.json labels: + model_name: casperhansen/llama-3-8b-instruct-awq openllm_alias: 8b-4bit,8b-instruct-4bit - openllm_hf_model_id: casperhansen/llama-3-8b-instruct-awq - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/chat_templates/alpaca.jinja b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/chat_templates/alpaca.jinja similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/chat_templates/alpaca.jinja rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/chat_templates/alpaca.jinja diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/chat_templates/amberchat.jinja b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/chat_templates/amberchat.jinja similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/chat_templates/amberchat.jinja rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/chat_templates/amberchat.jinja diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/chat_templates/chatml.jinja b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/chat_templates/chatml.jinja similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/chat_templates/chatml.jinja rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/chat_templates/chatml.jinja diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/chat_templates/chatqa.jinja b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/chat_templates/chatqa.jinja similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/chat_templates/chatqa.jinja rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/chat_templates/chatqa.jinja diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/chat_templates/falcon-instruct.jinja b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/chat_templates/falcon-instruct.jinja similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/chat_templates/falcon-instruct.jinja rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/chat_templates/falcon-instruct.jinja diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/chat_templates/gemma-it.jinja b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/chat_templates/gemma-it.jinja similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/chat_templates/gemma-it.jinja rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/chat_templates/gemma-it.jinja diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/chat_templates/llama-2-chat.jinja b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/chat_templates/llama-2-chat.jinja similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/chat_templates/llama-2-chat.jinja rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/chat_templates/llama-2-chat.jinja diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/chat_templates/llama-3-chat.jinja b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/chat_templates/llama-3-chat.jinja similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/chat_templates/llama-3-chat.jinja rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/chat_templates/llama-3-chat.jinja diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/chat_templates/mistral-instruct.jinja b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/chat_templates/mistral-instruct.jinja similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/chat_templates/mistral-instruct.jinja rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/chat_templates/mistral-instruct.jinja diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/chat_templates/openchat.jinja b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/chat_templates/openchat.jinja similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/chat_templates/openchat.jinja rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/chat_templates/openchat.jinja diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/chat_templates/phi-3.jinja b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/chat_templates/phi-3.jinja similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/chat_templates/phi-3.jinja rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/chat_templates/phi-3.jinja diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/chat_templates/saiga.jinja b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/chat_templates/saiga.jinja similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/chat_templates/saiga.jinja rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/chat_templates/saiga.jinja diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/chat_templates/solar-instruct.jinja b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/chat_templates/solar-instruct.jinja similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/chat_templates/solar-instruct.jinja rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/chat_templates/solar-instruct.jinja diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/chat_templates/vicuna.jinja b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/chat_templates/vicuna.jinja similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/chat_templates/vicuna.jinja rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/chat_templates/vicuna.jinja diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/chat_templates/zephyr.jinja b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/chat_templates/zephyr.jinja similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/chat_templates/zephyr.jinja rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/chat_templates/zephyr.jinja diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/generation_configs/alpaca.json b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/generation_configs/alpaca.json similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/generation_configs/alpaca.json rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/generation_configs/alpaca.json diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/generation_configs/amberchat.json b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/generation_configs/amberchat.json similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/generation_configs/amberchat.json rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/generation_configs/amberchat.json diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/generation_configs/chatqa.json b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/generation_configs/chatqa.json similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/generation_configs/chatqa.json rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/generation_configs/chatqa.json diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/generation_configs/gemma-it.json b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/generation_configs/gemma-it.json similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/generation_configs/gemma-it.json rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/generation_configs/gemma-it.json diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/generation_configs/llama-2-chat.json b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/generation_configs/llama-2-chat.json similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/generation_configs/llama-2-chat.json rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/generation_configs/llama-2-chat.json diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/generation_configs/llama-3-chat.json b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/generation_configs/llama-3-chat.json similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/generation_configs/llama-3-chat.json rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/generation_configs/llama-3-chat.json diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/generation_configs/mistral-instruct.json b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/generation_configs/mistral-instruct.json similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/generation_configs/mistral-instruct.json rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/generation_configs/mistral-instruct.json diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/generation_configs/openchat.json b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/generation_configs/openchat.json similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/generation_configs/openchat.json rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/generation_configs/openchat.json diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/generation_configs/orca-2.json b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/generation_configs/orca-2.json similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/generation_configs/orca-2.json rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/generation_configs/orca-2.json diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/generation_configs/phi-3.json b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/generation_configs/phi-3.json similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/generation_configs/phi-3.json rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/generation_configs/phi-3.json diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/generation_configs/qwen2-chat.json b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/generation_configs/qwen2-chat.json similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/generation_configs/qwen2-chat.json rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/generation_configs/qwen2-chat.json diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/generation_configs/saiga.json b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/generation_configs/saiga.json similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/generation_configs/saiga.json rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/generation_configs/saiga.json diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/generation_configs/solar-instruct.json b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/generation_configs/solar-instruct.json similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/generation_configs/solar-instruct.json rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/generation_configs/solar-instruct.json diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/generation_configs/vicuna.json b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/generation_configs/vicuna.json similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/generation_configs/vicuna.json rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/generation_configs/vicuna.json diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/generation_configs/yi-chat.json b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/generation_configs/yi-chat.json similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/generation_configs/yi-chat.json rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/generation_configs/yi-chat.json diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/generation_configs/zephyr.json b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/generation_configs/zephyr.json similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/chat_templates/generation_configs/zephyr.json rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/chat_templates/generation_configs/zephyr.json diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/service.py b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/service.py similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/service.py rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/service.py diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/404.html b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/404.html similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/404.html rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/404.html diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/700-532b1fe2415e5859.js b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/700-532b1fe2415e5859.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/700-532b1fe2415e5859.js rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/700-532b1fe2415e5859.js diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/995-34374f39bb210839.js b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/995-34374f39bb210839.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/995-34374f39bb210839.js rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/995-34374f39bb210839.js diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/css/429544bd3cd8ce3a.css b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/css/429544bd3cd8ce3a.css similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/css/429544bd3cd8ce3a.css rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/css/429544bd3cd8ce3a.css diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/css/5b67f082b31cfc7b.css b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/css/5b67f082b31cfc7b.css similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/css/5b67f082b31cfc7b.css rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/css/5b67f082b31cfc7b.css diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/css/9e63023b20ddb15e.css b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/css/9e63023b20ddb15e.css similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/_next/static/css/9e63023b20ddb15e.css rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/_next/static/css/9e63023b20ddb15e.css diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/apple-touch-icon.png b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/apple-touch-icon.png similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/apple-touch-icon.png rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/apple-touch-icon.png diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/chat.html b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/chat.html similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/chat.html rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/chat.html diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/chat.txt b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/chat.txt similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/chat.txt rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/chat.txt diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/favicon-16x16.png b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/favicon-16x16.png similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/favicon-16x16.png rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/favicon-16x16.png diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/favicon.ico b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/favicon.ico similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/favicon.ico rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/favicon.ico diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/index.html b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/index.html similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/index.html rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/index.html diff --git a/bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/index.txt b/bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/index.txt similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-awq-4bit-e780/src/ui/index.txt rename to bentoml/bentos/llama3/8b-instruct-awq-4bit-f9de/src/ui/index.txt diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/README.md b/bentoml/bentos/llama3/8b-instruct-fp16-0083/README.md deleted file mode 100644 index 2ca7abd..0000000 --- a/bentoml/bentos/llama3/8b-instruct-fp16-0083/README.md +++ /dev/null @@ -1,16 +0,0 @@ -# llama3:8b-instruct-fp16-0083 - -[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) -[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) -[![join_slack](https://badgen.net/badge/Join/BentoML%20Slack/cyan?icon=slack)](https://l.bentoml.com/join-slack-swagger) -[![BentoML GitHub Repo](https://img.shields.io/github/stars/bentoml/bentoml?style=social)](https://github.com/bentoml/BentoML) -[![Twitter Follow](https://img.shields.io/twitter/follow/bentomlai?label=Follow%20BentoML&style=social)](https://twitter.com/bentomlai) - -This is a Machine Learning Service created with BentoML. - -## Help - -* [📖 Documentation](https://docs.bentoml.com/en/latest/): Learn how to use BentoML. -* [💬 Community](https://l.bentoml.com/join-slack-swagger): Join the BentoML Slack community. -* [🐛 GitHub Issues](https://github.com/bentoml/BentoML/issues): Report bugs and feature requests. -* Tip: you can also [customize this README](https://docs.bentoml.com/en/latest/concepts/bento.html#description). diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/env/python/requirements.lock.txt b/bentoml/bentos/llama3/8b-instruct-fp16-0083/env/python/requirements.lock.txt deleted file mode 100644 index 925ce19..0000000 --- a/bentoml/bentos/llama3/8b-instruct-fp16-0083/env/python/requirements.lock.txt +++ /dev/null @@ -1,147 +0,0 @@ -aiohttp==3.9.5 -aiosignal==1.3.1 -annotated-types==0.7.0 -anyio==4.4.0 -appdirs==1.4.4 -asgiref==3.8.1 -async-timeout==4.0.3 -attrs==23.2.0 -bentoml==1.2.19 -build==1.2.1 -cattrs==23.1.2 -certifi==2024.7.4 -charset-normalizer==3.3.2 -circus==0.18.0 -click==8.1.7 -click-option-group==0.5.6 -cloudpickle==3.0.0 -cmake==3.30.0 -deepmerge==1.1.1 -deprecated==1.2.14 -diskcache==5.6.3 -distro==1.9.0 -dnspython==2.6.1 -email-validator==2.2.0 -exceptiongroup==1.2.1 -fastapi==0.111.0 -fastapi-cli==0.0.4 -filelock==3.15.4 -frozenlist==1.4.1 -fs==2.4.16 -fsspec==2024.6.1 -h11==0.14.0 -httpcore==1.0.5 -httptools==0.6.1 -httpx==0.27.0 -httpx-ws==0.6.0 -huggingface-hub==0.23.4 -idna==3.7 -importlib-metadata==6.11.0 -inflection==0.5.1 -interegular==0.3.3 -jinja2==3.1.4 -joblib==1.4.2 -jsonschema==4.22.0 -jsonschema-specifications==2023.12.1 -lark==1.1.9 -llvmlite==0.43.0 -lm-format-enforcer==0.10.1 -markdown-it-py==3.0.0 -markupsafe==2.1.5 -mdurl==0.1.2 -mpmath==1.3.0 -msgpack==1.0.8 -multidict==6.0.5 -nest-asyncio==1.6.0 -networkx==3.2.1 -ninja==1.11.1.1 -numba==0.60.0 -numpy==1.26.0 -nvidia-cublas-cu12==12.1.3.1 -nvidia-cuda-cupti-cu12==12.1.105 -nvidia-cuda-nvrtc-cu12==12.1.105 -nvidia-cuda-runtime-cu12==12.1.105 -nvidia-cudnn-cu12==8.9.2.26 -nvidia-cufft-cu12==11.0.2.54 -nvidia-curand-cu12==10.3.2.106 -nvidia-cusolver-cu12==11.4.5.107 -nvidia-cusparse-cu12==12.1.0.106 -nvidia-ml-py==11.525.150 -nvidia-nccl-cu12==2.20.5 -nvidia-nvjitlink-cu12==12.5.82 -nvidia-nvtx-cu12==12.1.105 -openai==1.35.10 -opentelemetry-api==1.20.0 -opentelemetry-instrumentation==0.41b0 -opentelemetry-instrumentation-aiohttp-client==0.41b0 -opentelemetry-instrumentation-asgi==0.41b0 -opentelemetry-sdk==1.20.0 -opentelemetry-semantic-conventions==0.41b0 -opentelemetry-util-http==0.41b0 -orjson==3.10.6 -outlines==0.0.34 -packaging==24.1 -pathspec==0.12.1 -pip-requirements-parser==32.0.1 -pip-tools==7.4.1 -prometheus-client==0.20.0 -prometheus-fastapi-instrumentator==7.0.0 -protobuf==5.27.2 -psutil==6.0.0 -py-cpuinfo==9.0.0 -pydantic==2.8.2 -pydantic-core==2.20.1 -pygments==2.18.0 -pyparsing==3.1.2 -pyproject-hooks==1.1.0 -python-dateutil==2.9.0.post0 -python-dotenv==1.0.1 -python-json-logger==2.0.7 -python-multipart==0.0.9 -pyyaml==6.0.1 -pyzmq==26.0.3 -ray==2.31.0 -referencing==0.35.1 -regex==2024.5.15 -requests==2.32.3 -rich==13.7.1 -rpds-py==0.18.1 -safetensors==0.4.3 -schema==0.7.7 -scipy==1.13.1 -sentencepiece==0.2.0 -shellingham==1.5.4 -simple-di==0.1.5 -six==1.16.0 -sniffio==1.3.1 -starlette==0.37.2 -sympy==1.12.1 -tiktoken==0.7.0 -tokenizers==0.19.1 -tomli==2.0.1 -tomli-w==1.0.0 -torch==2.3.0 -tornado==6.4.1 -tqdm==4.66.4 -transformers==4.41.0 -triton==2.3.0 -typer==0.12.3 -typing-extensions==4.12.2 -ujson==5.10.0 -urllib3==2.2.2 -uvicorn[standard]==0.30.1 -uvloop==0.19.0 -vllm==0.4.3 -vllm-flash-attn==2.5.8.post2 -watchfiles==0.22.0 -websockets==12.0 -wheel==0.43.0 -wrapt==1.16.0 -wsproto==1.2.0 -xformers==0.0.26.post1 -yarl==1.9.4 -zipp==3.19.2 - -# The following packages are considered to be unsafe in a requirements file: -pip==24.1.2 -setuptools==70.2.0 diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-f703/README.md b/bentoml/bentos/llama3/8b-instruct-fp16-f703/README.md new file mode 100644 index 0000000..ab2b441 --- /dev/null +++ b/bentoml/bentos/llama3/8b-instruct-fp16-f703/README.md @@ -0,0 +1,16 @@ +# llama3:8b-instruct-fp16-f703 + +[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) +[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) +[![join_slack](https://badgen.net/badge/Join/BentoML%20Slack/cyan?icon=slack)](https://l.bentoml.com/join-slack-swagger) +[![BentoML GitHub Repo](https://img.shields.io/github/stars/bentoml/bentoml?style=social)](https://github.com/bentoml/BentoML) +[![Twitter Follow](https://img.shields.io/twitter/follow/bentomlai?label=Follow%20BentoML&style=social)](https://twitter.com/bentomlai) + +This is a Machine Learning Service created with BentoML. + +## Help + +* [📖 Documentation](https://docs.bentoml.com/en/latest/): Learn how to use BentoML. +* [💬 Community](https://l.bentoml.com/join-slack-swagger): Join the BentoML Slack community. +* [🐛 GitHub Issues](https://github.com/bentoml/BentoML/issues): Report bugs and feature requests. +* Tip: you can also [customize this README](https://docs.bentoml.com/en/latest/concepts/bento.html#description). diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/apis/openapi.yaml b/bentoml/bentos/llama3/8b-instruct-fp16-f703/apis/openapi.yaml similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/apis/openapi.yaml rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/apis/openapi.yaml diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/apis/schema.json b/bentoml/bentos/llama3/8b-instruct-fp16-f703/apis/schema.json similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/apis/schema.json rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/apis/schema.json diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/bento.yaml b/bentoml/bentos/llama3/8b-instruct-fp16-f703/bento.yaml similarity index 94% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/bento.yaml rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/bento.yaml index d53bfee..4aa68f5 100644 --- a/bentoml/bentos/llama3/8b-instruct-fp16-0083/bento.yaml +++ b/bentoml/bentos/llama3/8b-instruct-fp16-f703/bento.yaml @@ -1,12 +1,11 @@ service: service:VLLM name: llama3 -version: 8b-instruct-fp16-0083 +version: 8b-instruct-fp16-f703 bentoml_version: 1.2.19 -creation_time: '2024-07-08T07:55:34.916627+00:00' +creation_time: '2024-07-12T13:38:06.662635+00:00' labels: + model_name: meta-llama/Meta-Llama-3-8B-Instruct openllm_alias: 8b,8b-instruct - openllm_hf_model_id: meta-llama/Meta-Llama-3-8B-Instruct - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/env/docker/Dockerfile b/bentoml/bentos/llama3/8b-instruct-fp16-f703/env/docker/Dockerfile similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/env/docker/Dockerfile rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/env/docker/Dockerfile diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/env/docker/entrypoint.sh b/bentoml/bentos/llama3/8b-instruct-fp16-f703/env/docker/entrypoint.sh similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/env/docker/entrypoint.sh rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/env/docker/entrypoint.sh diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/env/python/install.sh b/bentoml/bentos/llama3/8b-instruct-fp16-f703/env/python/install.sh similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/env/python/install.sh rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/env/python/install.sh diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-f703/env/python/requirements.lock.txt b/bentoml/bentos/llama3/8b-instruct-fp16-f703/env/python/requirements.lock.txt new file mode 100644 index 0000000..f6acdf5 --- /dev/null +++ b/bentoml/bentos/llama3/8b-instruct-fp16-f703/env/python/requirements.lock.txt @@ -0,0 +1,147 @@ +aiohttp==3.9.5 +aiosignal==1.3.1 +annotated-types==0.7.0 +anyio==4.4.0 +appdirs==1.4.4 +asgiref==3.8.1 +async-timeout==4.0.3 +attrs==23.2.0 +bentoml==1.2.19 +build==1.2.1 +cattrs==23.1.2 +certifi==2024.7.4 +charset-normalizer==3.3.2 +circus==0.18.0 +click==8.1.7 +click-option-group==0.5.6 +cloudpickle==3.0.0 +cmake==3.30.0 +deepmerge==1.1.1 +deprecated==1.2.14 +diskcache==5.6.3 +distro==1.9.0 +dnspython==2.6.1 +email-validator==2.2.0 +exceptiongroup==1.2.1 +fastapi==0.111.0 +fastapi-cli==0.0.4 +filelock==3.15.4 +frozenlist==1.4.1 +fs==2.4.16 +fsspec==2024.6.1 +h11==0.14.0 +httpcore==1.0.5 +httptools==0.6.1 +httpx==0.27.0 +httpx-ws==0.6.0 +huggingface-hub==0.23.4 +idna==3.7 +importlib-metadata==6.11.0 +inflection==0.5.1 +interegular==0.3.3 +jinja2==3.1.4 +joblib==1.4.2 +jsonschema==4.23.0 +jsonschema-specifications==2023.12.1 +lark==1.1.9 +llvmlite==0.43.0 +lm-format-enforcer==0.10.1 +markdown-it-py==3.0.0 +markupsafe==2.1.5 +mdurl==0.1.2 +mpmath==1.3.0 +msgpack==1.0.8 +multidict==6.0.5 +nest-asyncio==1.6.0 +networkx==3.2.1 +ninja==1.11.1.1 +numba==0.60.0 +numpy==1.26.0 +nvidia-cublas-cu12==12.1.3.1 +nvidia-cuda-cupti-cu12==12.1.105 +nvidia-cuda-nvrtc-cu12==12.1.105 +nvidia-cuda-runtime-cu12==12.1.105 +nvidia-cudnn-cu12==8.9.2.26 +nvidia-cufft-cu12==11.0.2.54 +nvidia-curand-cu12==10.3.2.106 +nvidia-cusolver-cu12==11.4.5.107 +nvidia-cusparse-cu12==12.1.0.106 +nvidia-ml-py==11.525.150 +nvidia-nccl-cu12==2.20.5 +nvidia-nvjitlink-cu12==12.5.82 +nvidia-nvtx-cu12==12.1.105 +openai==1.35.13 +opentelemetry-api==1.20.0 +opentelemetry-instrumentation==0.41b0 +opentelemetry-instrumentation-aiohttp-client==0.41b0 +opentelemetry-instrumentation-asgi==0.41b0 +opentelemetry-sdk==1.20.0 +opentelemetry-semantic-conventions==0.41b0 +opentelemetry-util-http==0.41b0 +orjson==3.10.6 +outlines==0.0.34 +packaging==24.1 +pathspec==0.12.1 +pip-requirements-parser==32.0.1 +pip-tools==7.4.1 +prometheus-client==0.20.0 +prometheus-fastapi-instrumentator==7.0.0 +protobuf==5.27.2 +psutil==6.0.0 +py-cpuinfo==9.0.0 +pydantic==2.8.2 +pydantic-core==2.20.1 +pygments==2.18.0 +pyparsing==3.1.2 +pyproject-hooks==1.1.0 +python-dateutil==2.9.0.post0 +python-dotenv==1.0.1 +python-json-logger==2.0.7 +python-multipart==0.0.9 +pyyaml==6.0.1 +pyzmq==26.0.3 +ray==2.32.0 +referencing==0.35.1 +regex==2024.5.15 +requests==2.32.3 +rich==13.7.1 +rpds-py==0.19.0 +safetensors==0.4.3 +schema==0.7.7 +scipy==1.13.1 +sentencepiece==0.2.0 +shellingham==1.5.4 +simple-di==0.1.5 +six==1.16.0 +sniffio==1.3.1 +starlette==0.37.2 +sympy==1.13.0 +tiktoken==0.7.0 +tokenizers==0.19.1 +tomli==2.0.1 +tomli-w==1.0.0 +torch==2.3.0 +tornado==6.4.1 +tqdm==4.66.4 +transformers==4.41.0 +triton==2.3.0 +typer==0.12.3 +typing-extensions==4.12.2 +ujson==5.10.0 +urllib3==2.2.2 +uvicorn[standard]==0.30.1 +uvloop==0.19.0 +vllm==0.4.3 +vllm-flash-attn==2.5.8.post2 +watchfiles==0.22.0 +websockets==12.0 +wheel==0.43.0 +wrapt==1.16.0 +wsproto==1.2.0 +xformers==0.0.26.post1 +yarl==1.9.4 +zipp==3.19.2 + +# The following packages are considered to be unsafe in a requirements file: +pip==24.1.2 +setuptools==70.3.0 diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/env/python/requirements.txt b/bentoml/bentos/llama3/8b-instruct-fp16-f703/env/python/requirements.txt similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/env/python/requirements.txt rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/env/python/requirements.txt diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/env/python/version.txt b/bentoml/bentos/llama3/8b-instruct-fp16-f703/env/python/version.txt similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/env/python/version.txt rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/env/python/version.txt diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/bento_constants.py b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/bento_constants.py similarity index 83% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/bento_constants.py rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/bento_constants.py index c2733b1..172f4be 100644 --- a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/bento_constants.py +++ b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/bento_constants.py @@ -5,8 +5,8 @@ max_model_len: 2048 model: meta-llama/Meta-Llama-3-8B-Instruct extra_labels: + model_name: meta-llama/Meta-Llama-3-8B-Instruct openllm_alias: 8b,8b-instruct - openllm_hf_model_id: meta-llama/Meta-Llama-3-8B-Instruct project: vllm-chat service_config: name: llama3 diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/bentofile.yaml b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/bentofile.yaml similarity index 92% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/bentofile.yaml rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/bentofile.yaml index 34eec25..d924922 100644 --- a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/bentofile.yaml +++ b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/bentofile.yaml @@ -28,9 +28,8 @@ include: - chat_templates/chat_templates/*.jinja - chat_templates/generation_configs/*.json labels: + model_name: meta-llama/Meta-Llama-3-8B-Instruct openllm_alias: 8b,8b-instruct - openllm_hf_model_id: meta-llama/Meta-Llama-3-8B-Instruct - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/chat_templates/alpaca.jinja b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/chat_templates/alpaca.jinja similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/chat_templates/alpaca.jinja rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/chat_templates/alpaca.jinja diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/chat_templates/amberchat.jinja b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/chat_templates/amberchat.jinja similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/chat_templates/amberchat.jinja rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/chat_templates/amberchat.jinja diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/chat_templates/chatml.jinja b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/chat_templates/chatml.jinja similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/chat_templates/chatml.jinja rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/chat_templates/chatml.jinja diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/chat_templates/chatqa.jinja b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/chat_templates/chatqa.jinja similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/chat_templates/chatqa.jinja rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/chat_templates/chatqa.jinja diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/chat_templates/falcon-instruct.jinja b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/chat_templates/falcon-instruct.jinja similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/chat_templates/falcon-instruct.jinja rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/chat_templates/falcon-instruct.jinja diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/chat_templates/gemma-it.jinja b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/chat_templates/gemma-it.jinja similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/chat_templates/gemma-it.jinja rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/chat_templates/gemma-it.jinja diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/chat_templates/llama-2-chat.jinja b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/chat_templates/llama-2-chat.jinja similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/chat_templates/llama-2-chat.jinja rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/chat_templates/llama-2-chat.jinja diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/chat_templates/llama-3-chat.jinja b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/chat_templates/llama-3-chat.jinja similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/chat_templates/llama-3-chat.jinja rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/chat_templates/llama-3-chat.jinja diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/chat_templates/mistral-instruct.jinja b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/chat_templates/mistral-instruct.jinja similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/chat_templates/mistral-instruct.jinja rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/chat_templates/mistral-instruct.jinja diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/chat_templates/openchat.jinja b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/chat_templates/openchat.jinja similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/chat_templates/openchat.jinja rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/chat_templates/openchat.jinja diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/chat_templates/phi-3.jinja b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/chat_templates/phi-3.jinja similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/chat_templates/phi-3.jinja rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/chat_templates/phi-3.jinja diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/chat_templates/saiga.jinja b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/chat_templates/saiga.jinja similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/chat_templates/saiga.jinja rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/chat_templates/saiga.jinja diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/chat_templates/solar-instruct.jinja b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/chat_templates/solar-instruct.jinja similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/chat_templates/solar-instruct.jinja rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/chat_templates/solar-instruct.jinja diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/chat_templates/vicuna.jinja b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/chat_templates/vicuna.jinja similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/chat_templates/vicuna.jinja rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/chat_templates/vicuna.jinja diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/chat_templates/zephyr.jinja b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/chat_templates/zephyr.jinja similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/chat_templates/zephyr.jinja rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/chat_templates/zephyr.jinja diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/generation_configs/alpaca.json b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/generation_configs/alpaca.json similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/generation_configs/alpaca.json rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/generation_configs/alpaca.json diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/generation_configs/amberchat.json b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/generation_configs/amberchat.json similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/generation_configs/amberchat.json rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/generation_configs/amberchat.json diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/generation_configs/chatqa.json b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/generation_configs/chatqa.json similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/generation_configs/chatqa.json rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/generation_configs/chatqa.json diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/generation_configs/gemma-it.json b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/generation_configs/gemma-it.json similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/generation_configs/gemma-it.json rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/generation_configs/gemma-it.json diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/generation_configs/llama-2-chat.json b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/generation_configs/llama-2-chat.json similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/generation_configs/llama-2-chat.json rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/generation_configs/llama-2-chat.json diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/generation_configs/llama-3-chat.json b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/generation_configs/llama-3-chat.json similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/generation_configs/llama-3-chat.json rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/generation_configs/llama-3-chat.json diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/generation_configs/mistral-instruct.json b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/generation_configs/mistral-instruct.json similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/generation_configs/mistral-instruct.json rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/generation_configs/mistral-instruct.json diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/generation_configs/openchat.json b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/generation_configs/openchat.json similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/generation_configs/openchat.json rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/generation_configs/openchat.json diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/generation_configs/orca-2.json b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/generation_configs/orca-2.json similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/generation_configs/orca-2.json rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/generation_configs/orca-2.json diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/generation_configs/phi-3.json b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/generation_configs/phi-3.json similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/generation_configs/phi-3.json rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/generation_configs/phi-3.json diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/generation_configs/qwen2-chat.json b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/generation_configs/qwen2-chat.json similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/generation_configs/qwen2-chat.json rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/generation_configs/qwen2-chat.json diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/generation_configs/saiga.json b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/generation_configs/saiga.json similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/generation_configs/saiga.json rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/generation_configs/saiga.json diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/generation_configs/solar-instruct.json b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/generation_configs/solar-instruct.json similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/generation_configs/solar-instruct.json rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/generation_configs/solar-instruct.json diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/generation_configs/vicuna.json b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/generation_configs/vicuna.json similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/generation_configs/vicuna.json rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/generation_configs/vicuna.json diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/generation_configs/yi-chat.json b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/generation_configs/yi-chat.json similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/generation_configs/yi-chat.json rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/generation_configs/yi-chat.json diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/generation_configs/zephyr.json b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/generation_configs/zephyr.json similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/chat_templates/generation_configs/zephyr.json rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/chat_templates/generation_configs/zephyr.json diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/service.py b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/service.py similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/service.py rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/service.py diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/404.html b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/404.html similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/404.html rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/404.html diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/700-532b1fe2415e5859.js b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/700-532b1fe2415e5859.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/700-532b1fe2415e5859.js rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/700-532b1fe2415e5859.js diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/995-34374f39bb210839.js b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/995-34374f39bb210839.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/995-34374f39bb210839.js rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/995-34374f39bb210839.js diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/css/429544bd3cd8ce3a.css b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/css/429544bd3cd8ce3a.css similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/css/429544bd3cd8ce3a.css rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/css/429544bd3cd8ce3a.css diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/css/5b67f082b31cfc7b.css b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/css/5b67f082b31cfc7b.css similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/css/5b67f082b31cfc7b.css rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/css/5b67f082b31cfc7b.css diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/css/9e63023b20ddb15e.css b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/css/9e63023b20ddb15e.css similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/_next/static/css/9e63023b20ddb15e.css rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/_next/static/css/9e63023b20ddb15e.css diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/apple-touch-icon.png b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/apple-touch-icon.png similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/apple-touch-icon.png rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/apple-touch-icon.png diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/chat.html b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/chat.html similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/chat.html rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/chat.html diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/chat.txt b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/chat.txt similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/chat.txt rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/chat.txt diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/favicon-16x16.png b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/favicon-16x16.png similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/favicon-16x16.png rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/favicon-16x16.png diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/favicon.ico b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/favicon.ico similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/favicon.ico rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/favicon.ico diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/index.html b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/index.html similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/index.html rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/index.html diff --git a/bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/index.txt b/bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/index.txt similarity index 100% rename from bentoml/bentos/llama3/8b-instruct-fp16-0083/src/ui/index.txt rename to bentoml/bentos/llama3/8b-instruct-fp16-f703/src/ui/index.txt diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/README.md b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/README.md new file mode 100644 index 0000000..13c2fec --- /dev/null +++ b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/README.md @@ -0,0 +1,16 @@ +# mistral:7b-instruct-awq-4bit-0850 + +[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) +[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) +[![join_slack](https://badgen.net/badge/Join/BentoML%20Slack/cyan?icon=slack)](https://l.bentoml.com/join-slack-swagger) +[![BentoML GitHub Repo](https://img.shields.io/github/stars/bentoml/bentoml?style=social)](https://github.com/bentoml/BentoML) +[![Twitter Follow](https://img.shields.io/twitter/follow/bentomlai?label=Follow%20BentoML&style=social)](https://twitter.com/bentomlai) + +This is a Machine Learning Service created with BentoML. + +## Help + +* [📖 Documentation](https://docs.bentoml.com/en/latest/): Learn how to use BentoML. +* [💬 Community](https://l.bentoml.com/join-slack-swagger): Join the BentoML Slack community. +* [🐛 GitHub Issues](https://github.com/bentoml/BentoML/issues): Report bugs and feature requests. +* Tip: you can also [customize this README](https://docs.bentoml.com/en/latest/concepts/bento.html#description). diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/apis/openapi.yaml b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/apis/openapi.yaml similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/apis/openapi.yaml rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/apis/openapi.yaml diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/apis/schema.json b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/apis/schema.json similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/apis/schema.json rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/apis/schema.json diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/bento.yaml b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/bento.yaml similarity index 94% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/bento.yaml rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/bento.yaml index e078bf6..2969df6 100644 --- a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/bento.yaml +++ b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/bento.yaml @@ -1,12 +1,11 @@ service: service:VLLM name: mistral -version: 7b-instruct-awq-4bit-33ce +version: 7b-instruct-awq-4bit-0850 bentoml_version: 1.2.19 -creation_time: '2024-07-08T07:52:01.835826+00:00' +creation_time: '2024-07-12T13:33:54.010245+00:00' labels: + model_name: TheBloke/Mistral-7B-Instruct-v0.1-AWQ openllm_alias: 7b-4bit,7b-instruct-4bit - openllm_hf_model_id: TheBloke/Mistral-7B-Instruct-v0.1-AWQ - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/env/docker/Dockerfile b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/env/docker/Dockerfile similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/env/docker/Dockerfile rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/env/docker/Dockerfile diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/env/docker/entrypoint.sh b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/env/docker/entrypoint.sh similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/env/docker/entrypoint.sh rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/env/docker/entrypoint.sh diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/env/python/install.sh b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/env/python/install.sh similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/env/python/install.sh rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/env/python/install.sh diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/env/python/requirements.lock.txt b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/env/python/requirements.lock.txt new file mode 100644 index 0000000..f6acdf5 --- /dev/null +++ b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/env/python/requirements.lock.txt @@ -0,0 +1,147 @@ +aiohttp==3.9.5 +aiosignal==1.3.1 +annotated-types==0.7.0 +anyio==4.4.0 +appdirs==1.4.4 +asgiref==3.8.1 +async-timeout==4.0.3 +attrs==23.2.0 +bentoml==1.2.19 +build==1.2.1 +cattrs==23.1.2 +certifi==2024.7.4 +charset-normalizer==3.3.2 +circus==0.18.0 +click==8.1.7 +click-option-group==0.5.6 +cloudpickle==3.0.0 +cmake==3.30.0 +deepmerge==1.1.1 +deprecated==1.2.14 +diskcache==5.6.3 +distro==1.9.0 +dnspython==2.6.1 +email-validator==2.2.0 +exceptiongroup==1.2.1 +fastapi==0.111.0 +fastapi-cli==0.0.4 +filelock==3.15.4 +frozenlist==1.4.1 +fs==2.4.16 +fsspec==2024.6.1 +h11==0.14.0 +httpcore==1.0.5 +httptools==0.6.1 +httpx==0.27.0 +httpx-ws==0.6.0 +huggingface-hub==0.23.4 +idna==3.7 +importlib-metadata==6.11.0 +inflection==0.5.1 +interegular==0.3.3 +jinja2==3.1.4 +joblib==1.4.2 +jsonschema==4.23.0 +jsonschema-specifications==2023.12.1 +lark==1.1.9 +llvmlite==0.43.0 +lm-format-enforcer==0.10.1 +markdown-it-py==3.0.0 +markupsafe==2.1.5 +mdurl==0.1.2 +mpmath==1.3.0 +msgpack==1.0.8 +multidict==6.0.5 +nest-asyncio==1.6.0 +networkx==3.2.1 +ninja==1.11.1.1 +numba==0.60.0 +numpy==1.26.0 +nvidia-cublas-cu12==12.1.3.1 +nvidia-cuda-cupti-cu12==12.1.105 +nvidia-cuda-nvrtc-cu12==12.1.105 +nvidia-cuda-runtime-cu12==12.1.105 +nvidia-cudnn-cu12==8.9.2.26 +nvidia-cufft-cu12==11.0.2.54 +nvidia-curand-cu12==10.3.2.106 +nvidia-cusolver-cu12==11.4.5.107 +nvidia-cusparse-cu12==12.1.0.106 +nvidia-ml-py==11.525.150 +nvidia-nccl-cu12==2.20.5 +nvidia-nvjitlink-cu12==12.5.82 +nvidia-nvtx-cu12==12.1.105 +openai==1.35.13 +opentelemetry-api==1.20.0 +opentelemetry-instrumentation==0.41b0 +opentelemetry-instrumentation-aiohttp-client==0.41b0 +opentelemetry-instrumentation-asgi==0.41b0 +opentelemetry-sdk==1.20.0 +opentelemetry-semantic-conventions==0.41b0 +opentelemetry-util-http==0.41b0 +orjson==3.10.6 +outlines==0.0.34 +packaging==24.1 +pathspec==0.12.1 +pip-requirements-parser==32.0.1 +pip-tools==7.4.1 +prometheus-client==0.20.0 +prometheus-fastapi-instrumentator==7.0.0 +protobuf==5.27.2 +psutil==6.0.0 +py-cpuinfo==9.0.0 +pydantic==2.8.2 +pydantic-core==2.20.1 +pygments==2.18.0 +pyparsing==3.1.2 +pyproject-hooks==1.1.0 +python-dateutil==2.9.0.post0 +python-dotenv==1.0.1 +python-json-logger==2.0.7 +python-multipart==0.0.9 +pyyaml==6.0.1 +pyzmq==26.0.3 +ray==2.32.0 +referencing==0.35.1 +regex==2024.5.15 +requests==2.32.3 +rich==13.7.1 +rpds-py==0.19.0 +safetensors==0.4.3 +schema==0.7.7 +scipy==1.13.1 +sentencepiece==0.2.0 +shellingham==1.5.4 +simple-di==0.1.5 +six==1.16.0 +sniffio==1.3.1 +starlette==0.37.2 +sympy==1.13.0 +tiktoken==0.7.0 +tokenizers==0.19.1 +tomli==2.0.1 +tomli-w==1.0.0 +torch==2.3.0 +tornado==6.4.1 +tqdm==4.66.4 +transformers==4.41.0 +triton==2.3.0 +typer==0.12.3 +typing-extensions==4.12.2 +ujson==5.10.0 +urllib3==2.2.2 +uvicorn[standard]==0.30.1 +uvloop==0.19.0 +vllm==0.4.3 +vllm-flash-attn==2.5.8.post2 +watchfiles==0.22.0 +websockets==12.0 +wheel==0.43.0 +wrapt==1.16.0 +wsproto==1.2.0 +xformers==0.0.26.post1 +yarl==1.9.4 +zipp==3.19.2 + +# The following packages are considered to be unsafe in a requirements file: +pip==24.1.2 +setuptools==70.3.0 diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/env/python/requirements.txt b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/env/python/requirements.txt similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/env/python/requirements.txt rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/env/python/requirements.txt diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/env/python/version.txt b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/env/python/version.txt similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/env/python/version.txt rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/env/python/version.txt diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/bento_constants.py b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/bento_constants.py similarity index 86% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/bento_constants.py rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/bento_constants.py index 26adfa8..134f905 100644 --- a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/bento_constants.py +++ b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/bento_constants.py @@ -8,8 +8,8 @@ model: TheBloke/Mistral-7B-Instruct-v0.1-AWQ quantization: awq extra_labels: + model_name: TheBloke/Mistral-7B-Instruct-v0.1-AWQ openllm_alias: 7b-4bit,7b-instruct-4bit - openllm_hf_model_id: TheBloke/Mistral-7B-Instruct-v0.1-AWQ project: vllm-chat service_config: name: mistral diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/bentofile.yaml b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/bentofile.yaml similarity index 92% rename from bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/bentofile.yaml rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/bentofile.yaml index 78707e6..6ec08f0 100644 --- a/bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/bentofile.yaml +++ b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/bentofile.yaml @@ -28,9 +28,8 @@ include: - chat_templates/chat_templates/*.jinja - chat_templates/generation_configs/*.json labels: + model_name: TheBloke/Mistral-7B-Instruct-v0.1-AWQ openllm_alias: 7b-4bit,7b-instruct-4bit - openllm_hf_model_id: casperhansen/gemma-7b-it-awq - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/chat_templates/alpaca.jinja b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/chat_templates/alpaca.jinja similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/chat_templates/alpaca.jinja rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/chat_templates/alpaca.jinja diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/chat_templates/amberchat.jinja b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/chat_templates/amberchat.jinja similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/chat_templates/amberchat.jinja rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/chat_templates/amberchat.jinja diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/chat_templates/chatml.jinja b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/chat_templates/chatml.jinja similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/chat_templates/chatml.jinja rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/chat_templates/chatml.jinja diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/chat_templates/chatqa.jinja b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/chat_templates/chatqa.jinja similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/chat_templates/chatqa.jinja rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/chat_templates/chatqa.jinja diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/chat_templates/falcon-instruct.jinja b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/chat_templates/falcon-instruct.jinja similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/chat_templates/falcon-instruct.jinja rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/chat_templates/falcon-instruct.jinja diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/chat_templates/gemma-it.jinja b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/chat_templates/gemma-it.jinja similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/chat_templates/gemma-it.jinja rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/chat_templates/gemma-it.jinja diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/chat_templates/llama-2-chat.jinja b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/chat_templates/llama-2-chat.jinja similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/chat_templates/llama-2-chat.jinja rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/chat_templates/llama-2-chat.jinja diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/chat_templates/llama-3-chat.jinja b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/chat_templates/llama-3-chat.jinja similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/chat_templates/llama-3-chat.jinja rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/chat_templates/llama-3-chat.jinja diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/chat_templates/mistral-instruct.jinja b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/chat_templates/mistral-instruct.jinja similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/chat_templates/mistral-instruct.jinja rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/chat_templates/mistral-instruct.jinja diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/chat_templates/openchat.jinja b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/chat_templates/openchat.jinja similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/chat_templates/openchat.jinja rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/chat_templates/openchat.jinja diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/chat_templates/phi-3.jinja b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/chat_templates/phi-3.jinja similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/chat_templates/phi-3.jinja rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/chat_templates/phi-3.jinja diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/chat_templates/saiga.jinja b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/chat_templates/saiga.jinja similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/chat_templates/saiga.jinja rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/chat_templates/saiga.jinja diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/chat_templates/solar-instruct.jinja b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/chat_templates/solar-instruct.jinja similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/chat_templates/solar-instruct.jinja rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/chat_templates/solar-instruct.jinja diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/chat_templates/vicuna.jinja b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/chat_templates/vicuna.jinja similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/chat_templates/vicuna.jinja rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/chat_templates/vicuna.jinja diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/chat_templates/zephyr.jinja b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/chat_templates/zephyr.jinja similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/chat_templates/zephyr.jinja rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/chat_templates/zephyr.jinja diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/generation_configs/alpaca.json b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/generation_configs/alpaca.json similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/generation_configs/alpaca.json rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/generation_configs/alpaca.json diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/generation_configs/amberchat.json b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/generation_configs/amberchat.json similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/generation_configs/amberchat.json rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/generation_configs/amberchat.json diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/generation_configs/chatqa.json b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/generation_configs/chatqa.json similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/generation_configs/chatqa.json rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/generation_configs/chatqa.json diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/generation_configs/gemma-it.json b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/generation_configs/gemma-it.json similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/generation_configs/gemma-it.json rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/generation_configs/gemma-it.json diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/generation_configs/llama-2-chat.json b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/generation_configs/llama-2-chat.json similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/generation_configs/llama-2-chat.json rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/generation_configs/llama-2-chat.json diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/generation_configs/llama-3-chat.json b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/generation_configs/llama-3-chat.json similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/generation_configs/llama-3-chat.json rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/generation_configs/llama-3-chat.json diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/generation_configs/mistral-instruct.json b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/generation_configs/mistral-instruct.json similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/generation_configs/mistral-instruct.json rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/generation_configs/mistral-instruct.json diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/generation_configs/openchat.json b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/generation_configs/openchat.json similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/generation_configs/openchat.json rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/generation_configs/openchat.json diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/generation_configs/orca-2.json b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/generation_configs/orca-2.json similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/generation_configs/orca-2.json rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/generation_configs/orca-2.json diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/generation_configs/phi-3.json b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/generation_configs/phi-3.json similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/generation_configs/phi-3.json rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/generation_configs/phi-3.json diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/generation_configs/qwen2-chat.json b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/generation_configs/qwen2-chat.json similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/generation_configs/qwen2-chat.json rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/generation_configs/qwen2-chat.json diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/generation_configs/saiga.json b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/generation_configs/saiga.json similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/generation_configs/saiga.json rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/generation_configs/saiga.json diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/generation_configs/solar-instruct.json b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/generation_configs/solar-instruct.json similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/generation_configs/solar-instruct.json rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/generation_configs/solar-instruct.json diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/generation_configs/vicuna.json b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/generation_configs/vicuna.json similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/generation_configs/vicuna.json rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/generation_configs/vicuna.json diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/generation_configs/yi-chat.json b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/generation_configs/yi-chat.json similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/generation_configs/yi-chat.json rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/generation_configs/yi-chat.json diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/generation_configs/zephyr.json b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/generation_configs/zephyr.json similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/chat_templates/generation_configs/zephyr.json rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/chat_templates/generation_configs/zephyr.json diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/service.py b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/service.py similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/service.py rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/service.py diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/404.html b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/404.html similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/404.html rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/404.html diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/700-532b1fe2415e5859.js b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/700-532b1fe2415e5859.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/700-532b1fe2415e5859.js rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/700-532b1fe2415e5859.js diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/995-34374f39bb210839.js b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/995-34374f39bb210839.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/995-34374f39bb210839.js rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/995-34374f39bb210839.js diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/css/429544bd3cd8ce3a.css b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/css/429544bd3cd8ce3a.css similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/css/429544bd3cd8ce3a.css rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/css/429544bd3cd8ce3a.css diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/css/5b67f082b31cfc7b.css b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/css/5b67f082b31cfc7b.css similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/css/5b67f082b31cfc7b.css rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/css/5b67f082b31cfc7b.css diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/css/9e63023b20ddb15e.css b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/css/9e63023b20ddb15e.css similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/_next/static/css/9e63023b20ddb15e.css rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/_next/static/css/9e63023b20ddb15e.css diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/apple-touch-icon.png b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/apple-touch-icon.png similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/apple-touch-icon.png rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/apple-touch-icon.png diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/chat.html b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/chat.html similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/chat.html rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/chat.html diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/chat.txt b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/chat.txt similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/chat.txt rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/chat.txt diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/favicon-16x16.png b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/favicon-16x16.png similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/favicon-16x16.png rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/favicon-16x16.png diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/favicon.ico b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/favicon.ico similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/favicon.ico rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/favicon.ico diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/index.html b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/index.html similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/index.html rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/index.html diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/index.txt b/bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/index.txt similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/ui/index.txt rename to bentoml/bentos/mistral/7b-instruct-awq-4bit-0850/src/ui/index.txt diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/README.md b/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/README.md deleted file mode 100644 index d0d777b..0000000 --- a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/README.md +++ /dev/null @@ -1,16 +0,0 @@ -# mistral:7b-instruct-awq-4bit-33ce - -[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) -[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) -[![join_slack](https://badgen.net/badge/Join/BentoML%20Slack/cyan?icon=slack)](https://l.bentoml.com/join-slack-swagger) -[![BentoML GitHub Repo](https://img.shields.io/github/stars/bentoml/bentoml?style=social)](https://github.com/bentoml/BentoML) -[![Twitter Follow](https://img.shields.io/twitter/follow/bentomlai?label=Follow%20BentoML&style=social)](https://twitter.com/bentomlai) - -This is a Machine Learning Service created with BentoML. - -## Help - -* [📖 Documentation](https://docs.bentoml.com/en/latest/): Learn how to use BentoML. -* [💬 Community](https://l.bentoml.com/join-slack-swagger): Join the BentoML Slack community. -* [🐛 GitHub Issues](https://github.com/bentoml/BentoML/issues): Report bugs and feature requests. -* Tip: you can also [customize this README](https://docs.bentoml.com/en/latest/concepts/bento.html#description). diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/env/python/requirements.lock.txt b/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/env/python/requirements.lock.txt deleted file mode 100644 index 925ce19..0000000 --- a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/env/python/requirements.lock.txt +++ /dev/null @@ -1,147 +0,0 @@ -aiohttp==3.9.5 -aiosignal==1.3.1 -annotated-types==0.7.0 -anyio==4.4.0 -appdirs==1.4.4 -asgiref==3.8.1 -async-timeout==4.0.3 -attrs==23.2.0 -bentoml==1.2.19 -build==1.2.1 -cattrs==23.1.2 -certifi==2024.7.4 -charset-normalizer==3.3.2 -circus==0.18.0 -click==8.1.7 -click-option-group==0.5.6 -cloudpickle==3.0.0 -cmake==3.30.0 -deepmerge==1.1.1 -deprecated==1.2.14 -diskcache==5.6.3 -distro==1.9.0 -dnspython==2.6.1 -email-validator==2.2.0 -exceptiongroup==1.2.1 -fastapi==0.111.0 -fastapi-cli==0.0.4 -filelock==3.15.4 -frozenlist==1.4.1 -fs==2.4.16 -fsspec==2024.6.1 -h11==0.14.0 -httpcore==1.0.5 -httptools==0.6.1 -httpx==0.27.0 -httpx-ws==0.6.0 -huggingface-hub==0.23.4 -idna==3.7 -importlib-metadata==6.11.0 -inflection==0.5.1 -interegular==0.3.3 -jinja2==3.1.4 -joblib==1.4.2 -jsonschema==4.22.0 -jsonschema-specifications==2023.12.1 -lark==1.1.9 -llvmlite==0.43.0 -lm-format-enforcer==0.10.1 -markdown-it-py==3.0.0 -markupsafe==2.1.5 -mdurl==0.1.2 -mpmath==1.3.0 -msgpack==1.0.8 -multidict==6.0.5 -nest-asyncio==1.6.0 -networkx==3.2.1 -ninja==1.11.1.1 -numba==0.60.0 -numpy==1.26.0 -nvidia-cublas-cu12==12.1.3.1 -nvidia-cuda-cupti-cu12==12.1.105 -nvidia-cuda-nvrtc-cu12==12.1.105 -nvidia-cuda-runtime-cu12==12.1.105 -nvidia-cudnn-cu12==8.9.2.26 -nvidia-cufft-cu12==11.0.2.54 -nvidia-curand-cu12==10.3.2.106 -nvidia-cusolver-cu12==11.4.5.107 -nvidia-cusparse-cu12==12.1.0.106 -nvidia-ml-py==11.525.150 -nvidia-nccl-cu12==2.20.5 -nvidia-nvjitlink-cu12==12.5.82 -nvidia-nvtx-cu12==12.1.105 -openai==1.35.10 -opentelemetry-api==1.20.0 -opentelemetry-instrumentation==0.41b0 -opentelemetry-instrumentation-aiohttp-client==0.41b0 -opentelemetry-instrumentation-asgi==0.41b0 -opentelemetry-sdk==1.20.0 -opentelemetry-semantic-conventions==0.41b0 -opentelemetry-util-http==0.41b0 -orjson==3.10.6 -outlines==0.0.34 -packaging==24.1 -pathspec==0.12.1 -pip-requirements-parser==32.0.1 -pip-tools==7.4.1 -prometheus-client==0.20.0 -prometheus-fastapi-instrumentator==7.0.0 -protobuf==5.27.2 -psutil==6.0.0 -py-cpuinfo==9.0.0 -pydantic==2.8.2 -pydantic-core==2.20.1 -pygments==2.18.0 -pyparsing==3.1.2 -pyproject-hooks==1.1.0 -python-dateutil==2.9.0.post0 -python-dotenv==1.0.1 -python-json-logger==2.0.7 -python-multipart==0.0.9 -pyyaml==6.0.1 -pyzmq==26.0.3 -ray==2.31.0 -referencing==0.35.1 -regex==2024.5.15 -requests==2.32.3 -rich==13.7.1 -rpds-py==0.18.1 -safetensors==0.4.3 -schema==0.7.7 -scipy==1.13.1 -sentencepiece==0.2.0 -shellingham==1.5.4 -simple-di==0.1.5 -six==1.16.0 -sniffio==1.3.1 -starlette==0.37.2 -sympy==1.12.1 -tiktoken==0.7.0 -tokenizers==0.19.1 -tomli==2.0.1 -tomli-w==1.0.0 -torch==2.3.0 -tornado==6.4.1 -tqdm==4.66.4 -transformers==4.41.0 -triton==2.3.0 -typer==0.12.3 -typing-extensions==4.12.2 -ujson==5.10.0 -urllib3==2.2.2 -uvicorn[standard]==0.30.1 -uvloop==0.19.0 -vllm==0.4.3 -vllm-flash-attn==2.5.8.post2 -watchfiles==0.22.0 -websockets==12.0 -wheel==0.43.0 -wrapt==1.16.0 -wsproto==1.2.0 -xformers==0.0.26.post1 -yarl==1.9.4 -zipp==3.19.2 - -# The following packages are considered to be unsafe in a requirements file: -pip==24.1.2 -setuptools==70.2.0 diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/README.md b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/README.md new file mode 100644 index 0000000..a6ff96a --- /dev/null +++ b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/README.md @@ -0,0 +1,16 @@ +# mistral:7b-instruct-fp16-ac2b + +[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) +[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) +[![join_slack](https://badgen.net/badge/Join/BentoML%20Slack/cyan?icon=slack)](https://l.bentoml.com/join-slack-swagger) +[![BentoML GitHub Repo](https://img.shields.io/github/stars/bentoml/bentoml?style=social)](https://github.com/bentoml/BentoML) +[![Twitter Follow](https://img.shields.io/twitter/follow/bentomlai?label=Follow%20BentoML&style=social)](https://twitter.com/bentomlai) + +This is a Machine Learning Service created with BentoML. + +## Help + +* [📖 Documentation](https://docs.bentoml.com/en/latest/): Learn how to use BentoML. +* [💬 Community](https://l.bentoml.com/join-slack-swagger): Join the BentoML Slack community. +* [🐛 GitHub Issues](https://github.com/bentoml/BentoML/issues): Report bugs and feature requests. +* Tip: you can also [customize this README](https://docs.bentoml.com/en/latest/concepts/bento.html#description). diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/apis/openapi.yaml b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/apis/openapi.yaml similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/apis/openapi.yaml rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/apis/openapi.yaml diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/apis/schema.json b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/apis/schema.json similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/apis/schema.json rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/apis/schema.json diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/bento.yaml b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/bento.yaml similarity index 94% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/bento.yaml rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/bento.yaml index e34f4c8..8facfa8 100644 --- a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/bento.yaml +++ b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/bento.yaml @@ -1,12 +1,11 @@ service: service:VLLM name: mistral -version: 7b-instruct-fp16-fe78 +version: 7b-instruct-fp16-ac2b bentoml_version: 1.2.19 -creation_time: '2024-07-08T07:52:53.052699+00:00' +creation_time: '2024-07-12T13:34:54.036739+00:00' labels: + model_name: mistralai/Mistral-7B-Instruct-v0.1 openllm_alias: 7b,7b-instruct - openllm_hf_model_id: mistralai/Mistral-7B-Instruct-v0.1 - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/env/docker/Dockerfile b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/env/docker/Dockerfile similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/env/docker/Dockerfile rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/env/docker/Dockerfile diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/env/docker/entrypoint.sh b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/env/docker/entrypoint.sh similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/env/docker/entrypoint.sh rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/env/docker/entrypoint.sh diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/env/python/install.sh b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/env/python/install.sh similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/env/python/install.sh rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/env/python/install.sh diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/env/python/requirements.lock.txt b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/env/python/requirements.lock.txt new file mode 100644 index 0000000..f6acdf5 --- /dev/null +++ b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/env/python/requirements.lock.txt @@ -0,0 +1,147 @@ +aiohttp==3.9.5 +aiosignal==1.3.1 +annotated-types==0.7.0 +anyio==4.4.0 +appdirs==1.4.4 +asgiref==3.8.1 +async-timeout==4.0.3 +attrs==23.2.0 +bentoml==1.2.19 +build==1.2.1 +cattrs==23.1.2 +certifi==2024.7.4 +charset-normalizer==3.3.2 +circus==0.18.0 +click==8.1.7 +click-option-group==0.5.6 +cloudpickle==3.0.0 +cmake==3.30.0 +deepmerge==1.1.1 +deprecated==1.2.14 +diskcache==5.6.3 +distro==1.9.0 +dnspython==2.6.1 +email-validator==2.2.0 +exceptiongroup==1.2.1 +fastapi==0.111.0 +fastapi-cli==0.0.4 +filelock==3.15.4 +frozenlist==1.4.1 +fs==2.4.16 +fsspec==2024.6.1 +h11==0.14.0 +httpcore==1.0.5 +httptools==0.6.1 +httpx==0.27.0 +httpx-ws==0.6.0 +huggingface-hub==0.23.4 +idna==3.7 +importlib-metadata==6.11.0 +inflection==0.5.1 +interegular==0.3.3 +jinja2==3.1.4 +joblib==1.4.2 +jsonschema==4.23.0 +jsonschema-specifications==2023.12.1 +lark==1.1.9 +llvmlite==0.43.0 +lm-format-enforcer==0.10.1 +markdown-it-py==3.0.0 +markupsafe==2.1.5 +mdurl==0.1.2 +mpmath==1.3.0 +msgpack==1.0.8 +multidict==6.0.5 +nest-asyncio==1.6.0 +networkx==3.2.1 +ninja==1.11.1.1 +numba==0.60.0 +numpy==1.26.0 +nvidia-cublas-cu12==12.1.3.1 +nvidia-cuda-cupti-cu12==12.1.105 +nvidia-cuda-nvrtc-cu12==12.1.105 +nvidia-cuda-runtime-cu12==12.1.105 +nvidia-cudnn-cu12==8.9.2.26 +nvidia-cufft-cu12==11.0.2.54 +nvidia-curand-cu12==10.3.2.106 +nvidia-cusolver-cu12==11.4.5.107 +nvidia-cusparse-cu12==12.1.0.106 +nvidia-ml-py==11.525.150 +nvidia-nccl-cu12==2.20.5 +nvidia-nvjitlink-cu12==12.5.82 +nvidia-nvtx-cu12==12.1.105 +openai==1.35.13 +opentelemetry-api==1.20.0 +opentelemetry-instrumentation==0.41b0 +opentelemetry-instrumentation-aiohttp-client==0.41b0 +opentelemetry-instrumentation-asgi==0.41b0 +opentelemetry-sdk==1.20.0 +opentelemetry-semantic-conventions==0.41b0 +opentelemetry-util-http==0.41b0 +orjson==3.10.6 +outlines==0.0.34 +packaging==24.1 +pathspec==0.12.1 +pip-requirements-parser==32.0.1 +pip-tools==7.4.1 +prometheus-client==0.20.0 +prometheus-fastapi-instrumentator==7.0.0 +protobuf==5.27.2 +psutil==6.0.0 +py-cpuinfo==9.0.0 +pydantic==2.8.2 +pydantic-core==2.20.1 +pygments==2.18.0 +pyparsing==3.1.2 +pyproject-hooks==1.1.0 +python-dateutil==2.9.0.post0 +python-dotenv==1.0.1 +python-json-logger==2.0.7 +python-multipart==0.0.9 +pyyaml==6.0.1 +pyzmq==26.0.3 +ray==2.32.0 +referencing==0.35.1 +regex==2024.5.15 +requests==2.32.3 +rich==13.7.1 +rpds-py==0.19.0 +safetensors==0.4.3 +schema==0.7.7 +scipy==1.13.1 +sentencepiece==0.2.0 +shellingham==1.5.4 +simple-di==0.1.5 +six==1.16.0 +sniffio==1.3.1 +starlette==0.37.2 +sympy==1.13.0 +tiktoken==0.7.0 +tokenizers==0.19.1 +tomli==2.0.1 +tomli-w==1.0.0 +torch==2.3.0 +tornado==6.4.1 +tqdm==4.66.4 +transformers==4.41.0 +triton==2.3.0 +typer==0.12.3 +typing-extensions==4.12.2 +ujson==5.10.0 +urllib3==2.2.2 +uvicorn[standard]==0.30.1 +uvloop==0.19.0 +vllm==0.4.3 +vllm-flash-attn==2.5.8.post2 +watchfiles==0.22.0 +websockets==12.0 +wheel==0.43.0 +wrapt==1.16.0 +wsproto==1.2.0 +xformers==0.0.26.post1 +yarl==1.9.4 +zipp==3.19.2 + +# The following packages are considered to be unsafe in a requirements file: +pip==24.1.2 +setuptools==70.3.0 diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/env/python/requirements.txt b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/env/python/requirements.txt similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/env/python/requirements.txt rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/env/python/requirements.txt diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/env/python/version.txt b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/env/python/version.txt similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/env/python/version.txt rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/env/python/version.txt diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/bento_constants.py b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/bento_constants.py similarity index 85% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/bento_constants.py rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/bento_constants.py index 9c2d85b..08f18c6 100644 --- a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/bento_constants.py +++ b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/bento_constants.py @@ -7,8 +7,8 @@ max_model_len: 1024 model: mistralai/Mistral-7B-Instruct-v0.1 extra_labels: + model_name: mistralai/Mistral-7B-Instruct-v0.1 openllm_alias: 7b,7b-instruct - openllm_hf_model_id: mistralai/Mistral-7B-Instruct-v0.1 project: vllm-chat service_config: name: mistral diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/bentofile.yaml b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/bentofile.yaml similarity index 93% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/bentofile.yaml rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/bentofile.yaml index 6a53abf..db1a5d4 100644 --- a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/bentofile.yaml +++ b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/bentofile.yaml @@ -28,9 +28,8 @@ include: - chat_templates/chat_templates/*.jinja - chat_templates/generation_configs/*.json labels: + model_name: mistralai/Mistral-7B-Instruct-v0.1 openllm_alias: 7b,7b-instruct - openllm_hf_model_id: Qwen/Qwen2-7B-Instruct - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/chat_templates/alpaca.jinja b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/chat_templates/alpaca.jinja similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/chat_templates/alpaca.jinja rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/chat_templates/alpaca.jinja diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/chat_templates/amberchat.jinja b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/chat_templates/amberchat.jinja similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/chat_templates/amberchat.jinja rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/chat_templates/amberchat.jinja diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/chat_templates/chatml.jinja b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/chat_templates/chatml.jinja similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/chat_templates/chatml.jinja rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/chat_templates/chatml.jinja diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/chat_templates/chatqa.jinja b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/chat_templates/chatqa.jinja similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/chat_templates/chatqa.jinja rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/chat_templates/chatqa.jinja diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/chat_templates/falcon-instruct.jinja b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/chat_templates/falcon-instruct.jinja similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/chat_templates/falcon-instruct.jinja rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/chat_templates/falcon-instruct.jinja diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/chat_templates/gemma-it.jinja b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/chat_templates/gemma-it.jinja similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/chat_templates/gemma-it.jinja rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/chat_templates/gemma-it.jinja diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/chat_templates/llama-2-chat.jinja b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/chat_templates/llama-2-chat.jinja similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/chat_templates/llama-2-chat.jinja rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/chat_templates/llama-2-chat.jinja diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/chat_templates/llama-3-chat.jinja b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/chat_templates/llama-3-chat.jinja similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/chat_templates/llama-3-chat.jinja rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/chat_templates/llama-3-chat.jinja diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/chat_templates/mistral-instruct.jinja b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/chat_templates/mistral-instruct.jinja similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/chat_templates/mistral-instruct.jinja rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/chat_templates/mistral-instruct.jinja diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/chat_templates/openchat.jinja b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/chat_templates/openchat.jinja similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/chat_templates/openchat.jinja rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/chat_templates/openchat.jinja diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/chat_templates/phi-3.jinja b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/chat_templates/phi-3.jinja similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/chat_templates/phi-3.jinja rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/chat_templates/phi-3.jinja diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/chat_templates/saiga.jinja b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/chat_templates/saiga.jinja similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/chat_templates/saiga.jinja rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/chat_templates/saiga.jinja diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/chat_templates/solar-instruct.jinja b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/chat_templates/solar-instruct.jinja similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/chat_templates/solar-instruct.jinja rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/chat_templates/solar-instruct.jinja diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/chat_templates/vicuna.jinja b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/chat_templates/vicuna.jinja similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/chat_templates/vicuna.jinja rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/chat_templates/vicuna.jinja diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/chat_templates/zephyr.jinja b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/chat_templates/zephyr.jinja similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/chat_templates/zephyr.jinja rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/chat_templates/zephyr.jinja diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/generation_configs/alpaca.json b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/generation_configs/alpaca.json similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/generation_configs/alpaca.json rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/generation_configs/alpaca.json diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/generation_configs/amberchat.json b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/generation_configs/amberchat.json similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/generation_configs/amberchat.json rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/generation_configs/amberchat.json diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/generation_configs/chatqa.json b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/generation_configs/chatqa.json similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/generation_configs/chatqa.json rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/generation_configs/chatqa.json diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/generation_configs/gemma-it.json b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/generation_configs/gemma-it.json similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/generation_configs/gemma-it.json rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/generation_configs/gemma-it.json diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/generation_configs/llama-2-chat.json b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/generation_configs/llama-2-chat.json similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/generation_configs/llama-2-chat.json rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/generation_configs/llama-2-chat.json diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/generation_configs/llama-3-chat.json b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/generation_configs/llama-3-chat.json similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/generation_configs/llama-3-chat.json rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/generation_configs/llama-3-chat.json diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/generation_configs/mistral-instruct.json b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/generation_configs/mistral-instruct.json similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/generation_configs/mistral-instruct.json rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/generation_configs/mistral-instruct.json diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/generation_configs/openchat.json b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/generation_configs/openchat.json similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/generation_configs/openchat.json rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/generation_configs/openchat.json diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/generation_configs/orca-2.json b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/generation_configs/orca-2.json similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/generation_configs/orca-2.json rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/generation_configs/orca-2.json diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/generation_configs/phi-3.json b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/generation_configs/phi-3.json similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/generation_configs/phi-3.json rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/generation_configs/phi-3.json diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/generation_configs/qwen2-chat.json b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/generation_configs/qwen2-chat.json similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/generation_configs/qwen2-chat.json rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/generation_configs/qwen2-chat.json diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/generation_configs/saiga.json b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/generation_configs/saiga.json similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/generation_configs/saiga.json rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/generation_configs/saiga.json diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/generation_configs/solar-instruct.json b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/generation_configs/solar-instruct.json similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/generation_configs/solar-instruct.json rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/generation_configs/solar-instruct.json diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/generation_configs/vicuna.json b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/generation_configs/vicuna.json similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/generation_configs/vicuna.json rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/generation_configs/vicuna.json diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/generation_configs/yi-chat.json b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/generation_configs/yi-chat.json similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/generation_configs/yi-chat.json rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/generation_configs/yi-chat.json diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/generation_configs/zephyr.json b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/generation_configs/zephyr.json similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/chat_templates/generation_configs/zephyr.json rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/chat_templates/generation_configs/zephyr.json diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/service.py b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/service.py similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/service.py rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/service.py diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/404.html b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/404.html similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/404.html rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/404.html diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/700-532b1fe2415e5859.js b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/700-532b1fe2415e5859.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/700-532b1fe2415e5859.js rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/700-532b1fe2415e5859.js diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/995-34374f39bb210839.js b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/995-34374f39bb210839.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/995-34374f39bb210839.js rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/995-34374f39bb210839.js diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/css/429544bd3cd8ce3a.css b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/css/429544bd3cd8ce3a.css similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/css/429544bd3cd8ce3a.css rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/css/429544bd3cd8ce3a.css diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/css/5b67f082b31cfc7b.css b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/css/5b67f082b31cfc7b.css similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/css/5b67f082b31cfc7b.css rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/css/5b67f082b31cfc7b.css diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/css/9e63023b20ddb15e.css b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/css/9e63023b20ddb15e.css similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/_next/static/css/9e63023b20ddb15e.css rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/_next/static/css/9e63023b20ddb15e.css diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/apple-touch-icon.png b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/apple-touch-icon.png similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/apple-touch-icon.png rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/apple-touch-icon.png diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/chat.html b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/chat.html similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/chat.html rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/chat.html diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/chat.txt b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/chat.txt similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/chat.txt rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/chat.txt diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/favicon-16x16.png b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/favicon-16x16.png similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/favicon-16x16.png rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/favicon-16x16.png diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/favicon.ico b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/favicon.ico similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/favicon.ico rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/favicon.ico diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/index.html b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/index.html similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/index.html rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/index.html diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/index.txt b/bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/index.txt similarity index 100% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/ui/index.txt rename to bentoml/bentos/mistral/7b-instruct-fp16-ac2b/src/ui/index.txt diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/README.md b/bentoml/bentos/mistral/7b-instruct-fp16-fe78/README.md deleted file mode 100644 index 932624b..0000000 --- a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/README.md +++ /dev/null @@ -1,16 +0,0 @@ -# mistral:7b-instruct-fp16-fe78 - -[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) -[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) -[![join_slack](https://badgen.net/badge/Join/BentoML%20Slack/cyan?icon=slack)](https://l.bentoml.com/join-slack-swagger) -[![BentoML GitHub Repo](https://img.shields.io/github/stars/bentoml/bentoml?style=social)](https://github.com/bentoml/BentoML) -[![Twitter Follow](https://img.shields.io/twitter/follow/bentomlai?label=Follow%20BentoML&style=social)](https://twitter.com/bentomlai) - -This is a Machine Learning Service created with BentoML. - -## Help - -* [📖 Documentation](https://docs.bentoml.com/en/latest/): Learn how to use BentoML. -* [💬 Community](https://l.bentoml.com/join-slack-swagger): Join the BentoML Slack community. -* [🐛 GitHub Issues](https://github.com/bentoml/BentoML/issues): Report bugs and feature requests. -* Tip: you can also [customize this README](https://docs.bentoml.com/en/latest/concepts/bento.html#description). diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/env/python/requirements.lock.txt b/bentoml/bentos/mistral/7b-instruct-fp16-fe78/env/python/requirements.lock.txt deleted file mode 100644 index 925ce19..0000000 --- a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/env/python/requirements.lock.txt +++ /dev/null @@ -1,147 +0,0 @@ -aiohttp==3.9.5 -aiosignal==1.3.1 -annotated-types==0.7.0 -anyio==4.4.0 -appdirs==1.4.4 -asgiref==3.8.1 -async-timeout==4.0.3 -attrs==23.2.0 -bentoml==1.2.19 -build==1.2.1 -cattrs==23.1.2 -certifi==2024.7.4 -charset-normalizer==3.3.2 -circus==0.18.0 -click==8.1.7 -click-option-group==0.5.6 -cloudpickle==3.0.0 -cmake==3.30.0 -deepmerge==1.1.1 -deprecated==1.2.14 -diskcache==5.6.3 -distro==1.9.0 -dnspython==2.6.1 -email-validator==2.2.0 -exceptiongroup==1.2.1 -fastapi==0.111.0 -fastapi-cli==0.0.4 -filelock==3.15.4 -frozenlist==1.4.1 -fs==2.4.16 -fsspec==2024.6.1 -h11==0.14.0 -httpcore==1.0.5 -httptools==0.6.1 -httpx==0.27.0 -httpx-ws==0.6.0 -huggingface-hub==0.23.4 -idna==3.7 -importlib-metadata==6.11.0 -inflection==0.5.1 -interegular==0.3.3 -jinja2==3.1.4 -joblib==1.4.2 -jsonschema==4.22.0 -jsonschema-specifications==2023.12.1 -lark==1.1.9 -llvmlite==0.43.0 -lm-format-enforcer==0.10.1 -markdown-it-py==3.0.0 -markupsafe==2.1.5 -mdurl==0.1.2 -mpmath==1.3.0 -msgpack==1.0.8 -multidict==6.0.5 -nest-asyncio==1.6.0 -networkx==3.2.1 -ninja==1.11.1.1 -numba==0.60.0 -numpy==1.26.0 -nvidia-cublas-cu12==12.1.3.1 -nvidia-cuda-cupti-cu12==12.1.105 -nvidia-cuda-nvrtc-cu12==12.1.105 -nvidia-cuda-runtime-cu12==12.1.105 -nvidia-cudnn-cu12==8.9.2.26 -nvidia-cufft-cu12==11.0.2.54 -nvidia-curand-cu12==10.3.2.106 -nvidia-cusolver-cu12==11.4.5.107 -nvidia-cusparse-cu12==12.1.0.106 -nvidia-ml-py==11.525.150 -nvidia-nccl-cu12==2.20.5 -nvidia-nvjitlink-cu12==12.5.82 -nvidia-nvtx-cu12==12.1.105 -openai==1.35.10 -opentelemetry-api==1.20.0 -opentelemetry-instrumentation==0.41b0 -opentelemetry-instrumentation-aiohttp-client==0.41b0 -opentelemetry-instrumentation-asgi==0.41b0 -opentelemetry-sdk==1.20.0 -opentelemetry-semantic-conventions==0.41b0 -opentelemetry-util-http==0.41b0 -orjson==3.10.6 -outlines==0.0.34 -packaging==24.1 -pathspec==0.12.1 -pip-requirements-parser==32.0.1 -pip-tools==7.4.1 -prometheus-client==0.20.0 -prometheus-fastapi-instrumentator==7.0.0 -protobuf==5.27.2 -psutil==6.0.0 -py-cpuinfo==9.0.0 -pydantic==2.8.2 -pydantic-core==2.20.1 -pygments==2.18.0 -pyparsing==3.1.2 -pyproject-hooks==1.1.0 -python-dateutil==2.9.0.post0 -python-dotenv==1.0.1 -python-json-logger==2.0.7 -python-multipart==0.0.9 -pyyaml==6.0.1 -pyzmq==26.0.3 -ray==2.31.0 -referencing==0.35.1 -regex==2024.5.15 -requests==2.32.3 -rich==13.7.1 -rpds-py==0.18.1 -safetensors==0.4.3 -schema==0.7.7 -scipy==1.13.1 -sentencepiece==0.2.0 -shellingham==1.5.4 -simple-di==0.1.5 -six==1.16.0 -sniffio==1.3.1 -starlette==0.37.2 -sympy==1.12.1 -tiktoken==0.7.0 -tokenizers==0.19.1 -tomli==2.0.1 -tomli-w==1.0.0 -torch==2.3.0 -tornado==6.4.1 -tqdm==4.66.4 -transformers==4.41.0 -triton==2.3.0 -typer==0.12.3 -typing-extensions==4.12.2 -ujson==5.10.0 -urllib3==2.2.2 -uvicorn[standard]==0.30.1 -uvloop==0.19.0 -vllm==0.4.3 -vllm-flash-attn==2.5.8.post2 -watchfiles==0.22.0 -websockets==12.0 -wheel==0.43.0 -wrapt==1.16.0 -wsproto==1.2.0 -xformers==0.0.26.post1 -yarl==1.9.4 -zipp==3.19.2 - -# The following packages are considered to be unsafe in a requirements file: -pip==24.1.2 -setuptools==70.2.0 diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/README.md b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/README.md deleted file mode 100644 index fac5419..0000000 --- a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/README.md +++ /dev/null @@ -1,16 +0,0 @@ -# mixtral:8x7b-instruct-v0.1-awq-4bit-0016 - -[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) -[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) -[![join_slack](https://badgen.net/badge/Join/BentoML%20Slack/cyan?icon=slack)](https://l.bentoml.com/join-slack-swagger) -[![BentoML GitHub Repo](https://img.shields.io/github/stars/bentoml/bentoml?style=social)](https://github.com/bentoml/BentoML) -[![Twitter Follow](https://img.shields.io/twitter/follow/bentomlai?label=Follow%20BentoML&style=social)](https://twitter.com/bentomlai) - -This is a Machine Learning Service created with BentoML. - -## Help - -* [📖 Documentation](https://docs.bentoml.com/en/latest/): Learn how to use BentoML. -* [💬 Community](https://l.bentoml.com/join-slack-swagger): Join the BentoML Slack community. -* [🐛 GitHub Issues](https://github.com/bentoml/BentoML/issues): Report bugs and feature requests. -* Tip: you can also [customize this README](https://docs.bentoml.com/en/latest/concepts/bento.html#description). diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/env/python/requirements.lock.txt b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/env/python/requirements.lock.txt deleted file mode 100644 index 925ce19..0000000 --- a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/env/python/requirements.lock.txt +++ /dev/null @@ -1,147 +0,0 @@ -aiohttp==3.9.5 -aiosignal==1.3.1 -annotated-types==0.7.0 -anyio==4.4.0 -appdirs==1.4.4 -asgiref==3.8.1 -async-timeout==4.0.3 -attrs==23.2.0 -bentoml==1.2.19 -build==1.2.1 -cattrs==23.1.2 -certifi==2024.7.4 -charset-normalizer==3.3.2 -circus==0.18.0 -click==8.1.7 -click-option-group==0.5.6 -cloudpickle==3.0.0 -cmake==3.30.0 -deepmerge==1.1.1 -deprecated==1.2.14 -diskcache==5.6.3 -distro==1.9.0 -dnspython==2.6.1 -email-validator==2.2.0 -exceptiongroup==1.2.1 -fastapi==0.111.0 -fastapi-cli==0.0.4 -filelock==3.15.4 -frozenlist==1.4.1 -fs==2.4.16 -fsspec==2024.6.1 -h11==0.14.0 -httpcore==1.0.5 -httptools==0.6.1 -httpx==0.27.0 -httpx-ws==0.6.0 -huggingface-hub==0.23.4 -idna==3.7 -importlib-metadata==6.11.0 -inflection==0.5.1 -interegular==0.3.3 -jinja2==3.1.4 -joblib==1.4.2 -jsonschema==4.22.0 -jsonschema-specifications==2023.12.1 -lark==1.1.9 -llvmlite==0.43.0 -lm-format-enforcer==0.10.1 -markdown-it-py==3.0.0 -markupsafe==2.1.5 -mdurl==0.1.2 -mpmath==1.3.0 -msgpack==1.0.8 -multidict==6.0.5 -nest-asyncio==1.6.0 -networkx==3.2.1 -ninja==1.11.1.1 -numba==0.60.0 -numpy==1.26.0 -nvidia-cublas-cu12==12.1.3.1 -nvidia-cuda-cupti-cu12==12.1.105 -nvidia-cuda-nvrtc-cu12==12.1.105 -nvidia-cuda-runtime-cu12==12.1.105 -nvidia-cudnn-cu12==8.9.2.26 -nvidia-cufft-cu12==11.0.2.54 -nvidia-curand-cu12==10.3.2.106 -nvidia-cusolver-cu12==11.4.5.107 -nvidia-cusparse-cu12==12.1.0.106 -nvidia-ml-py==11.525.150 -nvidia-nccl-cu12==2.20.5 -nvidia-nvjitlink-cu12==12.5.82 -nvidia-nvtx-cu12==12.1.105 -openai==1.35.10 -opentelemetry-api==1.20.0 -opentelemetry-instrumentation==0.41b0 -opentelemetry-instrumentation-aiohttp-client==0.41b0 -opentelemetry-instrumentation-asgi==0.41b0 -opentelemetry-sdk==1.20.0 -opentelemetry-semantic-conventions==0.41b0 -opentelemetry-util-http==0.41b0 -orjson==3.10.6 -outlines==0.0.34 -packaging==24.1 -pathspec==0.12.1 -pip-requirements-parser==32.0.1 -pip-tools==7.4.1 -prometheus-client==0.20.0 -prometheus-fastapi-instrumentator==7.0.0 -protobuf==5.27.2 -psutil==6.0.0 -py-cpuinfo==9.0.0 -pydantic==2.8.2 -pydantic-core==2.20.1 -pygments==2.18.0 -pyparsing==3.1.2 -pyproject-hooks==1.1.0 -python-dateutil==2.9.0.post0 -python-dotenv==1.0.1 -python-json-logger==2.0.7 -python-multipart==0.0.9 -pyyaml==6.0.1 -pyzmq==26.0.3 -ray==2.31.0 -referencing==0.35.1 -regex==2024.5.15 -requests==2.32.3 -rich==13.7.1 -rpds-py==0.18.1 -safetensors==0.4.3 -schema==0.7.7 -scipy==1.13.1 -sentencepiece==0.2.0 -shellingham==1.5.4 -simple-di==0.1.5 -six==1.16.0 -sniffio==1.3.1 -starlette==0.37.2 -sympy==1.12.1 -tiktoken==0.7.0 -tokenizers==0.19.1 -tomli==2.0.1 -tomli-w==1.0.0 -torch==2.3.0 -tornado==6.4.1 -tqdm==4.66.4 -transformers==4.41.0 -triton==2.3.0 -typer==0.12.3 -typing-extensions==4.12.2 -ujson==5.10.0 -urllib3==2.2.2 -uvicorn[standard]==0.30.1 -uvloop==0.19.0 -vllm==0.4.3 -vllm-flash-attn==2.5.8.post2 -watchfiles==0.22.0 -websockets==12.0 -wheel==0.43.0 -wrapt==1.16.0 -wsproto==1.2.0 -xformers==0.0.26.post1 -yarl==1.9.4 -zipp==3.19.2 - -# The following packages are considered to be unsafe in a requirements file: -pip==24.1.2 -setuptools==70.2.0 diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/README.md b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/README.md new file mode 100644 index 0000000..64c74d5 --- /dev/null +++ b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/README.md @@ -0,0 +1,16 @@ +# mixtral:8x7b-instruct-v0.1-awq-4bit-2953 + +[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) +[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) +[![join_slack](https://badgen.net/badge/Join/BentoML%20Slack/cyan?icon=slack)](https://l.bentoml.com/join-slack-swagger) +[![BentoML GitHub Repo](https://img.shields.io/github/stars/bentoml/bentoml?style=social)](https://github.com/bentoml/BentoML) +[![Twitter Follow](https://img.shields.io/twitter/follow/bentomlai?label=Follow%20BentoML&style=social)](https://twitter.com/bentomlai) + +This is a Machine Learning Service created with BentoML. + +## Help + +* [📖 Documentation](https://docs.bentoml.com/en/latest/): Learn how to use BentoML. +* [💬 Community](https://l.bentoml.com/join-slack-swagger): Join the BentoML Slack community. +* [🐛 GitHub Issues](https://github.com/bentoml/BentoML/issues): Report bugs and feature requests. +* Tip: you can also [customize this README](https://docs.bentoml.com/en/latest/concepts/bento.html#description). diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/apis/openapi.yaml b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/apis/openapi.yaml similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/apis/openapi.yaml rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/apis/openapi.yaml diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/apis/schema.json b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/apis/schema.json similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/apis/schema.json rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/apis/schema.json diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/bento.yaml b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/bento.yaml similarity index 94% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/bento.yaml rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/bento.yaml index 26e05d4..1f2f27e 100644 --- a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/bento.yaml +++ b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/bento.yaml @@ -1,12 +1,11 @@ service: service:VLLM name: mixtral -version: 8x7b-instruct-v0.1-awq-4bit-0016 +version: 8x7b-instruct-v0.1-awq-4bit-2953 bentoml_version: 1.2.19 -creation_time: '2024-07-08T08:01:04.838303+00:00' +creation_time: '2024-07-12T13:44:29.497980+00:00' labels: + model_name: casperhansen/mixtral-instruct-awq openllm_alias: 8x7b-4bit - openllm_hf_model_id: casperhansen/mixtral-instruct-awq - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/env/docker/Dockerfile b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/env/docker/Dockerfile similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/env/docker/Dockerfile rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/env/docker/Dockerfile diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/env/docker/entrypoint.sh b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/env/docker/entrypoint.sh similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/env/docker/entrypoint.sh rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/env/docker/entrypoint.sh diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/env/python/install.sh b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/env/python/install.sh similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/env/python/install.sh rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/env/python/install.sh diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/env/python/requirements.lock.txt b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/env/python/requirements.lock.txt new file mode 100644 index 0000000..f6acdf5 --- /dev/null +++ b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/env/python/requirements.lock.txt @@ -0,0 +1,147 @@ +aiohttp==3.9.5 +aiosignal==1.3.1 +annotated-types==0.7.0 +anyio==4.4.0 +appdirs==1.4.4 +asgiref==3.8.1 +async-timeout==4.0.3 +attrs==23.2.0 +bentoml==1.2.19 +build==1.2.1 +cattrs==23.1.2 +certifi==2024.7.4 +charset-normalizer==3.3.2 +circus==0.18.0 +click==8.1.7 +click-option-group==0.5.6 +cloudpickle==3.0.0 +cmake==3.30.0 +deepmerge==1.1.1 +deprecated==1.2.14 +diskcache==5.6.3 +distro==1.9.0 +dnspython==2.6.1 +email-validator==2.2.0 +exceptiongroup==1.2.1 +fastapi==0.111.0 +fastapi-cli==0.0.4 +filelock==3.15.4 +frozenlist==1.4.1 +fs==2.4.16 +fsspec==2024.6.1 +h11==0.14.0 +httpcore==1.0.5 +httptools==0.6.1 +httpx==0.27.0 +httpx-ws==0.6.0 +huggingface-hub==0.23.4 +idna==3.7 +importlib-metadata==6.11.0 +inflection==0.5.1 +interegular==0.3.3 +jinja2==3.1.4 +joblib==1.4.2 +jsonschema==4.23.0 +jsonschema-specifications==2023.12.1 +lark==1.1.9 +llvmlite==0.43.0 +lm-format-enforcer==0.10.1 +markdown-it-py==3.0.0 +markupsafe==2.1.5 +mdurl==0.1.2 +mpmath==1.3.0 +msgpack==1.0.8 +multidict==6.0.5 +nest-asyncio==1.6.0 +networkx==3.2.1 +ninja==1.11.1.1 +numba==0.60.0 +numpy==1.26.0 +nvidia-cublas-cu12==12.1.3.1 +nvidia-cuda-cupti-cu12==12.1.105 +nvidia-cuda-nvrtc-cu12==12.1.105 +nvidia-cuda-runtime-cu12==12.1.105 +nvidia-cudnn-cu12==8.9.2.26 +nvidia-cufft-cu12==11.0.2.54 +nvidia-curand-cu12==10.3.2.106 +nvidia-cusolver-cu12==11.4.5.107 +nvidia-cusparse-cu12==12.1.0.106 +nvidia-ml-py==11.525.150 +nvidia-nccl-cu12==2.20.5 +nvidia-nvjitlink-cu12==12.5.82 +nvidia-nvtx-cu12==12.1.105 +openai==1.35.13 +opentelemetry-api==1.20.0 +opentelemetry-instrumentation==0.41b0 +opentelemetry-instrumentation-aiohttp-client==0.41b0 +opentelemetry-instrumentation-asgi==0.41b0 +opentelemetry-sdk==1.20.0 +opentelemetry-semantic-conventions==0.41b0 +opentelemetry-util-http==0.41b0 +orjson==3.10.6 +outlines==0.0.34 +packaging==24.1 +pathspec==0.12.1 +pip-requirements-parser==32.0.1 +pip-tools==7.4.1 +prometheus-client==0.20.0 +prometheus-fastapi-instrumentator==7.0.0 +protobuf==5.27.2 +psutil==6.0.0 +py-cpuinfo==9.0.0 +pydantic==2.8.2 +pydantic-core==2.20.1 +pygments==2.18.0 +pyparsing==3.1.2 +pyproject-hooks==1.1.0 +python-dateutil==2.9.0.post0 +python-dotenv==1.0.1 +python-json-logger==2.0.7 +python-multipart==0.0.9 +pyyaml==6.0.1 +pyzmq==26.0.3 +ray==2.32.0 +referencing==0.35.1 +regex==2024.5.15 +requests==2.32.3 +rich==13.7.1 +rpds-py==0.19.0 +safetensors==0.4.3 +schema==0.7.7 +scipy==1.13.1 +sentencepiece==0.2.0 +shellingham==1.5.4 +simple-di==0.1.5 +six==1.16.0 +sniffio==1.3.1 +starlette==0.37.2 +sympy==1.13.0 +tiktoken==0.7.0 +tokenizers==0.19.1 +tomli==2.0.1 +tomli-w==1.0.0 +torch==2.3.0 +tornado==6.4.1 +tqdm==4.66.4 +transformers==4.41.0 +triton==2.3.0 +typer==0.12.3 +typing-extensions==4.12.2 +ujson==5.10.0 +urllib3==2.2.2 +uvicorn[standard]==0.30.1 +uvloop==0.19.0 +vllm==0.4.3 +vllm-flash-attn==2.5.8.post2 +watchfiles==0.22.0 +websockets==12.0 +wheel==0.43.0 +wrapt==1.16.0 +wsproto==1.2.0 +xformers==0.0.26.post1 +yarl==1.9.4 +zipp==3.19.2 + +# The following packages are considered to be unsafe in a requirements file: +pip==24.1.2 +setuptools==70.3.0 diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/env/python/requirements.txt b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/env/python/requirements.txt similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/env/python/requirements.txt rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/env/python/requirements.txt diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/env/python/version.txt b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/env/python/version.txt similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/env/python/version.txt rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/env/python/version.txt diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/bento_constants.py b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/bento_constants.py similarity index 86% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/bento_constants.py rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/bento_constants.py index ebed24c..eb42ae8 100644 --- a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/bento_constants.py +++ b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/bento_constants.py @@ -7,8 +7,8 @@ model: casperhansen/mixtral-instruct-awq quantization: awq extra_labels: + model_name: casperhansen/mixtral-instruct-awq openllm_alias: 8x7b-4bit - openllm_hf_model_id: casperhansen/mixtral-instruct-awq project: vllm-chat service_config: name: mixtral diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/bentofile.yaml b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/bentofile.yaml similarity index 92% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/bentofile.yaml rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/bentofile.yaml index 08ff52f..7fd1c10 100644 --- a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/bentofile.yaml +++ b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/bentofile.yaml @@ -28,9 +28,8 @@ include: - chat_templates/chat_templates/*.jinja - chat_templates/generation_configs/*.json labels: + model_name: casperhansen/mixtral-instruct-awq openllm_alias: 8x7b-4bit - openllm_hf_model_id: casperhansen/mixtral-instruct-awq - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/chat_templates/alpaca.jinja b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/chat_templates/alpaca.jinja similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/chat_templates/alpaca.jinja rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/chat_templates/alpaca.jinja diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/chat_templates/amberchat.jinja b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/chat_templates/amberchat.jinja similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/chat_templates/amberchat.jinja rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/chat_templates/amberchat.jinja diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/chat_templates/chatml.jinja b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/chat_templates/chatml.jinja similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/chat_templates/chatml.jinja rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/chat_templates/chatml.jinja diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/chat_templates/chatqa.jinja b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/chat_templates/chatqa.jinja similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/chat_templates/chatqa.jinja rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/chat_templates/chatqa.jinja diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/chat_templates/falcon-instruct.jinja b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/chat_templates/falcon-instruct.jinja similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/chat_templates/falcon-instruct.jinja rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/chat_templates/falcon-instruct.jinja diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/chat_templates/gemma-it.jinja b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/chat_templates/gemma-it.jinja similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/chat_templates/gemma-it.jinja rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/chat_templates/gemma-it.jinja diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/chat_templates/llama-2-chat.jinja b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/chat_templates/llama-2-chat.jinja similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/chat_templates/llama-2-chat.jinja rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/chat_templates/llama-2-chat.jinja diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/chat_templates/llama-3-chat.jinja b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/chat_templates/llama-3-chat.jinja similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/chat_templates/llama-3-chat.jinja rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/chat_templates/llama-3-chat.jinja diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/chat_templates/mistral-instruct.jinja b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/chat_templates/mistral-instruct.jinja similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/chat_templates/mistral-instruct.jinja rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/chat_templates/mistral-instruct.jinja diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/chat_templates/openchat.jinja b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/chat_templates/openchat.jinja similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/chat_templates/openchat.jinja rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/chat_templates/openchat.jinja diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/chat_templates/phi-3.jinja b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/chat_templates/phi-3.jinja similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/chat_templates/phi-3.jinja rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/chat_templates/phi-3.jinja diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/chat_templates/saiga.jinja b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/chat_templates/saiga.jinja similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/chat_templates/saiga.jinja rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/chat_templates/saiga.jinja diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/chat_templates/solar-instruct.jinja b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/chat_templates/solar-instruct.jinja similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/chat_templates/solar-instruct.jinja rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/chat_templates/solar-instruct.jinja diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/chat_templates/vicuna.jinja b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/chat_templates/vicuna.jinja similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/chat_templates/vicuna.jinja rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/chat_templates/vicuna.jinja diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/chat_templates/zephyr.jinja b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/chat_templates/zephyr.jinja similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/chat_templates/zephyr.jinja rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/chat_templates/zephyr.jinja diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/generation_configs/alpaca.json b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/generation_configs/alpaca.json similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/generation_configs/alpaca.json rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/generation_configs/alpaca.json diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/generation_configs/amberchat.json b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/generation_configs/amberchat.json similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/generation_configs/amberchat.json rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/generation_configs/amberchat.json diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/generation_configs/chatqa.json b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/generation_configs/chatqa.json similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/generation_configs/chatqa.json rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/generation_configs/chatqa.json diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/generation_configs/gemma-it.json b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/generation_configs/gemma-it.json similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/generation_configs/gemma-it.json rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/generation_configs/gemma-it.json diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/generation_configs/llama-2-chat.json b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/generation_configs/llama-2-chat.json similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/generation_configs/llama-2-chat.json rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/generation_configs/llama-2-chat.json diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/generation_configs/llama-3-chat.json b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/generation_configs/llama-3-chat.json similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/generation_configs/llama-3-chat.json rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/generation_configs/llama-3-chat.json diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/generation_configs/mistral-instruct.json b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/generation_configs/mistral-instruct.json similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/generation_configs/mistral-instruct.json rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/generation_configs/mistral-instruct.json diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/generation_configs/openchat.json b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/generation_configs/openchat.json similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/generation_configs/openchat.json rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/generation_configs/openchat.json diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/generation_configs/orca-2.json b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/generation_configs/orca-2.json similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/generation_configs/orca-2.json rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/generation_configs/orca-2.json diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/generation_configs/phi-3.json b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/generation_configs/phi-3.json similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/generation_configs/phi-3.json rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/generation_configs/phi-3.json diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/generation_configs/qwen2-chat.json b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/generation_configs/qwen2-chat.json similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/generation_configs/qwen2-chat.json rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/generation_configs/qwen2-chat.json diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/generation_configs/saiga.json b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/generation_configs/saiga.json similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/generation_configs/saiga.json rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/generation_configs/saiga.json diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/generation_configs/solar-instruct.json b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/generation_configs/solar-instruct.json similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/generation_configs/solar-instruct.json rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/generation_configs/solar-instruct.json diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/generation_configs/vicuna.json b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/generation_configs/vicuna.json similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/generation_configs/vicuna.json rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/generation_configs/vicuna.json diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/generation_configs/yi-chat.json b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/generation_configs/yi-chat.json similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/generation_configs/yi-chat.json rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/generation_configs/yi-chat.json diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/generation_configs/zephyr.json b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/generation_configs/zephyr.json similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/chat_templates/generation_configs/zephyr.json rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/chat_templates/generation_configs/zephyr.json diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/service.py b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/service.py similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/service.py rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/service.py diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/404.html b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/404.html similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/404.html rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/404.html diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/700-532b1fe2415e5859.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/700-532b1fe2415e5859.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/700-532b1fe2415e5859.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/700-532b1fe2415e5859.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/995-34374f39bb210839.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/995-34374f39bb210839.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/995-34374f39bb210839.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/995-34374f39bb210839.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/css/429544bd3cd8ce3a.css b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/css/429544bd3cd8ce3a.css similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/css/429544bd3cd8ce3a.css rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/css/429544bd3cd8ce3a.css diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/css/5b67f082b31cfc7b.css b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/css/5b67f082b31cfc7b.css similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/css/5b67f082b31cfc7b.css rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/css/5b67f082b31cfc7b.css diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/css/9e63023b20ddb15e.css b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/css/9e63023b20ddb15e.css similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/_next/static/css/9e63023b20ddb15e.css rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/_next/static/css/9e63023b20ddb15e.css diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/apple-touch-icon.png b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/apple-touch-icon.png similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/apple-touch-icon.png rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/apple-touch-icon.png diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/chat.html b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/chat.html similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/chat.html rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/chat.html diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/chat.txt b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/chat.txt similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/chat.txt rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/chat.txt diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/favicon-16x16.png b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/favicon-16x16.png similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/favicon-16x16.png rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/favicon-16x16.png diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/favicon.ico b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/favicon.ico similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/favicon.ico rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/favicon.ico diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/index.html b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/index.html similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/index.html rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/index.html diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/index.txt b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/index.txt similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-0016/src/ui/index.txt rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-awq-4bit-2953/src/ui/index.txt diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/README.md b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/README.md new file mode 100644 index 0000000..ead7c51 --- /dev/null +++ b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/README.md @@ -0,0 +1,16 @@ +# mixtral:8x7b-instruct-v0.1-fp16-71c6 + +[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) +[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) +[![join_slack](https://badgen.net/badge/Join/BentoML%20Slack/cyan?icon=slack)](https://l.bentoml.com/join-slack-swagger) +[![BentoML GitHub Repo](https://img.shields.io/github/stars/bentoml/bentoml?style=social)](https://github.com/bentoml/BentoML) +[![Twitter Follow](https://img.shields.io/twitter/follow/bentomlai?label=Follow%20BentoML&style=social)](https://twitter.com/bentomlai) + +This is a Machine Learning Service created with BentoML. + +## Help + +* [📖 Documentation](https://docs.bentoml.com/en/latest/): Learn how to use BentoML. +* [💬 Community](https://l.bentoml.com/join-slack-swagger): Join the BentoML Slack community. +* [🐛 GitHub Issues](https://github.com/bentoml/BentoML/issues): Report bugs and feature requests. +* Tip: you can also [customize this README](https://docs.bentoml.com/en/latest/concepts/bento.html#description). diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/apis/openapi.yaml b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/apis/openapi.yaml similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/apis/openapi.yaml rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/apis/openapi.yaml diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/apis/schema.json b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/apis/schema.json similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/apis/schema.json rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/apis/schema.json diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/bento.yaml b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/bento.yaml similarity index 94% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/bento.yaml rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/bento.yaml index 62c773e..40fa791 100644 --- a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/bento.yaml +++ b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/bento.yaml @@ -1,12 +1,11 @@ service: service:VLLM name: mixtral -version: 8x7b-instruct-v0.1-fp16-b90a +version: 8x7b-instruct-v0.1-fp16-71c6 bentoml_version: 1.2.19 -creation_time: '2024-07-08T08:00:09.830997+00:00' +creation_time: '2024-07-12T13:43:22.893115+00:00' labels: + model_name: mistralai/Mixtral-8x7B-Instruct-v0.1 openllm_alias: 8x7b,8x7b-instruct - openllm_hf_model_id: mistralai/Mixtral-8x7B-Instruct-v0.1 - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/env/docker/Dockerfile b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/env/docker/Dockerfile similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/env/docker/Dockerfile rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/env/docker/Dockerfile diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/env/docker/entrypoint.sh b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/env/docker/entrypoint.sh similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/env/docker/entrypoint.sh rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/env/docker/entrypoint.sh diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/env/python/install.sh b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/env/python/install.sh similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/env/python/install.sh rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/env/python/install.sh diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/env/python/requirements.lock.txt b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/env/python/requirements.lock.txt new file mode 100644 index 0000000..f6acdf5 --- /dev/null +++ b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/env/python/requirements.lock.txt @@ -0,0 +1,147 @@ +aiohttp==3.9.5 +aiosignal==1.3.1 +annotated-types==0.7.0 +anyio==4.4.0 +appdirs==1.4.4 +asgiref==3.8.1 +async-timeout==4.0.3 +attrs==23.2.0 +bentoml==1.2.19 +build==1.2.1 +cattrs==23.1.2 +certifi==2024.7.4 +charset-normalizer==3.3.2 +circus==0.18.0 +click==8.1.7 +click-option-group==0.5.6 +cloudpickle==3.0.0 +cmake==3.30.0 +deepmerge==1.1.1 +deprecated==1.2.14 +diskcache==5.6.3 +distro==1.9.0 +dnspython==2.6.1 +email-validator==2.2.0 +exceptiongroup==1.2.1 +fastapi==0.111.0 +fastapi-cli==0.0.4 +filelock==3.15.4 +frozenlist==1.4.1 +fs==2.4.16 +fsspec==2024.6.1 +h11==0.14.0 +httpcore==1.0.5 +httptools==0.6.1 +httpx==0.27.0 +httpx-ws==0.6.0 +huggingface-hub==0.23.4 +idna==3.7 +importlib-metadata==6.11.0 +inflection==0.5.1 +interegular==0.3.3 +jinja2==3.1.4 +joblib==1.4.2 +jsonschema==4.23.0 +jsonschema-specifications==2023.12.1 +lark==1.1.9 +llvmlite==0.43.0 +lm-format-enforcer==0.10.1 +markdown-it-py==3.0.0 +markupsafe==2.1.5 +mdurl==0.1.2 +mpmath==1.3.0 +msgpack==1.0.8 +multidict==6.0.5 +nest-asyncio==1.6.0 +networkx==3.2.1 +ninja==1.11.1.1 +numba==0.60.0 +numpy==1.26.0 +nvidia-cublas-cu12==12.1.3.1 +nvidia-cuda-cupti-cu12==12.1.105 +nvidia-cuda-nvrtc-cu12==12.1.105 +nvidia-cuda-runtime-cu12==12.1.105 +nvidia-cudnn-cu12==8.9.2.26 +nvidia-cufft-cu12==11.0.2.54 +nvidia-curand-cu12==10.3.2.106 +nvidia-cusolver-cu12==11.4.5.107 +nvidia-cusparse-cu12==12.1.0.106 +nvidia-ml-py==11.525.150 +nvidia-nccl-cu12==2.20.5 +nvidia-nvjitlink-cu12==12.5.82 +nvidia-nvtx-cu12==12.1.105 +openai==1.35.13 +opentelemetry-api==1.20.0 +opentelemetry-instrumentation==0.41b0 +opentelemetry-instrumentation-aiohttp-client==0.41b0 +opentelemetry-instrumentation-asgi==0.41b0 +opentelemetry-sdk==1.20.0 +opentelemetry-semantic-conventions==0.41b0 +opentelemetry-util-http==0.41b0 +orjson==3.10.6 +outlines==0.0.34 +packaging==24.1 +pathspec==0.12.1 +pip-requirements-parser==32.0.1 +pip-tools==7.4.1 +prometheus-client==0.20.0 +prometheus-fastapi-instrumentator==7.0.0 +protobuf==5.27.2 +psutil==6.0.0 +py-cpuinfo==9.0.0 +pydantic==2.8.2 +pydantic-core==2.20.1 +pygments==2.18.0 +pyparsing==3.1.2 +pyproject-hooks==1.1.0 +python-dateutil==2.9.0.post0 +python-dotenv==1.0.1 +python-json-logger==2.0.7 +python-multipart==0.0.9 +pyyaml==6.0.1 +pyzmq==26.0.3 +ray==2.32.0 +referencing==0.35.1 +regex==2024.5.15 +requests==2.32.3 +rich==13.7.1 +rpds-py==0.19.0 +safetensors==0.4.3 +schema==0.7.7 +scipy==1.13.1 +sentencepiece==0.2.0 +shellingham==1.5.4 +simple-di==0.1.5 +six==1.16.0 +sniffio==1.3.1 +starlette==0.37.2 +sympy==1.13.0 +tiktoken==0.7.0 +tokenizers==0.19.1 +tomli==2.0.1 +tomli-w==1.0.0 +torch==2.3.0 +tornado==6.4.1 +tqdm==4.66.4 +transformers==4.41.0 +triton==2.3.0 +typer==0.12.3 +typing-extensions==4.12.2 +ujson==5.10.0 +urllib3==2.2.2 +uvicorn[standard]==0.30.1 +uvloop==0.19.0 +vllm==0.4.3 +vllm-flash-attn==2.5.8.post2 +watchfiles==0.22.0 +websockets==12.0 +wheel==0.43.0 +wrapt==1.16.0 +wsproto==1.2.0 +xformers==0.0.26.post1 +yarl==1.9.4 +zipp==3.19.2 + +# The following packages are considered to be unsafe in a requirements file: +pip==24.1.2 +setuptools==70.3.0 diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/env/python/requirements.txt b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/env/python/requirements.txt similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/env/python/requirements.txt rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/env/python/requirements.txt diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/env/python/version.txt b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/env/python/version.txt similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/env/python/version.txt rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/env/python/version.txt diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/bento_constants.py b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/bento_constants.py similarity index 84% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/bento_constants.py rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/bento_constants.py index 7cd5502..93cf732 100644 --- a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/bento_constants.py +++ b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/bento_constants.py @@ -5,8 +5,8 @@ max_model_len: 2048 model: mistralai/Mixtral-8x7B-Instruct-v0.1 extra_labels: + model_name: mistralai/Mixtral-8x7B-Instruct-v0.1 openllm_alias: 8x7b,8x7b-instruct - openllm_hf_model_id: mistralai/Mixtral-8x7B-Instruct-v0.1 project: vllm-chat service_config: name: mixtral diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/bentofile.yaml b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/bentofile.yaml similarity index 92% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/bentofile.yaml rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/bentofile.yaml index d7c8007..510ad48 100644 --- a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/bentofile.yaml +++ b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/bentofile.yaml @@ -28,9 +28,8 @@ include: - chat_templates/chat_templates/*.jinja - chat_templates/generation_configs/*.json labels: + model_name: mistralai/Mixtral-8x7B-Instruct-v0.1 openllm_alias: 8x7b,8x7b-instruct - openllm_hf_model_id: mistralai/Mixtral-8x7B-Instruct-v0.1 - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/chat_templates/alpaca.jinja b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/chat_templates/alpaca.jinja similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/chat_templates/alpaca.jinja rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/chat_templates/alpaca.jinja diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/chat_templates/amberchat.jinja b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/chat_templates/amberchat.jinja similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/chat_templates/amberchat.jinja rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/chat_templates/amberchat.jinja diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/chat_templates/chatml.jinja b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/chat_templates/chatml.jinja similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/chat_templates/chatml.jinja rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/chat_templates/chatml.jinja diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/chat_templates/chatqa.jinja b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/chat_templates/chatqa.jinja similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/chat_templates/chatqa.jinja rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/chat_templates/chatqa.jinja diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/chat_templates/falcon-instruct.jinja b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/chat_templates/falcon-instruct.jinja similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/chat_templates/falcon-instruct.jinja rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/chat_templates/falcon-instruct.jinja diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/chat_templates/gemma-it.jinja b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/chat_templates/gemma-it.jinja similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/chat_templates/gemma-it.jinja rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/chat_templates/gemma-it.jinja diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/chat_templates/llama-2-chat.jinja b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/chat_templates/llama-2-chat.jinja similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/chat_templates/llama-2-chat.jinja rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/chat_templates/llama-2-chat.jinja diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/chat_templates/llama-3-chat.jinja b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/chat_templates/llama-3-chat.jinja similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/chat_templates/llama-3-chat.jinja rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/chat_templates/llama-3-chat.jinja diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/chat_templates/mistral-instruct.jinja b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/chat_templates/mistral-instruct.jinja similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/chat_templates/mistral-instruct.jinja rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/chat_templates/mistral-instruct.jinja diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/chat_templates/openchat.jinja b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/chat_templates/openchat.jinja similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/chat_templates/openchat.jinja rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/chat_templates/openchat.jinja diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/chat_templates/phi-3.jinja b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/chat_templates/phi-3.jinja similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/chat_templates/phi-3.jinja rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/chat_templates/phi-3.jinja diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/chat_templates/saiga.jinja b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/chat_templates/saiga.jinja similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/chat_templates/saiga.jinja rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/chat_templates/saiga.jinja diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/chat_templates/solar-instruct.jinja b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/chat_templates/solar-instruct.jinja similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/chat_templates/solar-instruct.jinja rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/chat_templates/solar-instruct.jinja diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/chat_templates/vicuna.jinja b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/chat_templates/vicuna.jinja similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/chat_templates/vicuna.jinja rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/chat_templates/vicuna.jinja diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/chat_templates/zephyr.jinja b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/chat_templates/zephyr.jinja similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/chat_templates/zephyr.jinja rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/chat_templates/zephyr.jinja diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/generation_configs/alpaca.json b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/generation_configs/alpaca.json similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/generation_configs/alpaca.json rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/generation_configs/alpaca.json diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/generation_configs/amberchat.json b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/generation_configs/amberchat.json similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/generation_configs/amberchat.json rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/generation_configs/amberchat.json diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/generation_configs/chatqa.json b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/generation_configs/chatqa.json similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/generation_configs/chatqa.json rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/generation_configs/chatqa.json diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/generation_configs/gemma-it.json b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/generation_configs/gemma-it.json similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/generation_configs/gemma-it.json rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/generation_configs/gemma-it.json diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/generation_configs/llama-2-chat.json b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/generation_configs/llama-2-chat.json similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/generation_configs/llama-2-chat.json rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/generation_configs/llama-2-chat.json diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/generation_configs/llama-3-chat.json b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/generation_configs/llama-3-chat.json similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/generation_configs/llama-3-chat.json rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/generation_configs/llama-3-chat.json diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/generation_configs/mistral-instruct.json b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/generation_configs/mistral-instruct.json similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/generation_configs/mistral-instruct.json rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/generation_configs/mistral-instruct.json diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/generation_configs/openchat.json b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/generation_configs/openchat.json similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/generation_configs/openchat.json rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/generation_configs/openchat.json diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/generation_configs/orca-2.json b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/generation_configs/orca-2.json similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/generation_configs/orca-2.json rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/generation_configs/orca-2.json diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/generation_configs/phi-3.json b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/generation_configs/phi-3.json similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/generation_configs/phi-3.json rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/generation_configs/phi-3.json diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/generation_configs/qwen2-chat.json b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/generation_configs/qwen2-chat.json similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/generation_configs/qwen2-chat.json rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/generation_configs/qwen2-chat.json diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/generation_configs/saiga.json b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/generation_configs/saiga.json similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/generation_configs/saiga.json rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/generation_configs/saiga.json diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/generation_configs/solar-instruct.json b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/generation_configs/solar-instruct.json similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/generation_configs/solar-instruct.json rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/generation_configs/solar-instruct.json diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/generation_configs/vicuna.json b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/generation_configs/vicuna.json similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/generation_configs/vicuna.json rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/generation_configs/vicuna.json diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/generation_configs/yi-chat.json b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/generation_configs/yi-chat.json similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/generation_configs/yi-chat.json rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/generation_configs/yi-chat.json diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/generation_configs/zephyr.json b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/generation_configs/zephyr.json similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/chat_templates/generation_configs/zephyr.json rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/chat_templates/generation_configs/zephyr.json diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/service.py b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/service.py similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/service.py rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/service.py diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/404.html b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/404.html similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/404.html rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/404.html diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/700-532b1fe2415e5859.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/700-532b1fe2415e5859.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/700-532b1fe2415e5859.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/700-532b1fe2415e5859.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/995-34374f39bb210839.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/995-34374f39bb210839.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/995-34374f39bb210839.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/995-34374f39bb210839.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/css/429544bd3cd8ce3a.css b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/css/429544bd3cd8ce3a.css similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/css/429544bd3cd8ce3a.css rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/css/429544bd3cd8ce3a.css diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/css/5b67f082b31cfc7b.css b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/css/5b67f082b31cfc7b.css similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/css/5b67f082b31cfc7b.css rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/css/5b67f082b31cfc7b.css diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/css/9e63023b20ddb15e.css b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/css/9e63023b20ddb15e.css similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/_next/static/css/9e63023b20ddb15e.css rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/_next/static/css/9e63023b20ddb15e.css diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/apple-touch-icon.png b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/apple-touch-icon.png similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/apple-touch-icon.png rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/apple-touch-icon.png diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/chat.html b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/chat.html similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/chat.html rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/chat.html diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/chat.txt b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/chat.txt similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/chat.txt rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/chat.txt diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/favicon-16x16.png b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/favicon-16x16.png similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/favicon-16x16.png rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/favicon-16x16.png diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/favicon.ico b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/favicon.ico similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/favicon.ico rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/favicon.ico diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/index.html b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/index.html similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/index.html rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/index.html diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/index.txt b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/index.txt similarity index 100% rename from bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/src/ui/index.txt rename to bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-71c6/src/ui/index.txt diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/README.md b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/README.md deleted file mode 100644 index f24b3f8..0000000 --- a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/README.md +++ /dev/null @@ -1,16 +0,0 @@ -# mixtral:8x7b-instruct-v0.1-fp16-b90a - -[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) -[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) -[![join_slack](https://badgen.net/badge/Join/BentoML%20Slack/cyan?icon=slack)](https://l.bentoml.com/join-slack-swagger) -[![BentoML GitHub Repo](https://img.shields.io/github/stars/bentoml/bentoml?style=social)](https://github.com/bentoml/BentoML) -[![Twitter Follow](https://img.shields.io/twitter/follow/bentomlai?label=Follow%20BentoML&style=social)](https://twitter.com/bentomlai) - -This is a Machine Learning Service created with BentoML. - -## Help - -* [📖 Documentation](https://docs.bentoml.com/en/latest/): Learn how to use BentoML. -* [💬 Community](https://l.bentoml.com/join-slack-swagger): Join the BentoML Slack community. -* [🐛 GitHub Issues](https://github.com/bentoml/BentoML/issues): Report bugs and feature requests. -* Tip: you can also [customize this README](https://docs.bentoml.com/en/latest/concepts/bento.html#description). diff --git a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/env/python/requirements.lock.txt b/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/env/python/requirements.lock.txt deleted file mode 100644 index 925ce19..0000000 --- a/bentoml/bentos/mixtral/8x7b-instruct-v0.1-fp16-b90a/env/python/requirements.lock.txt +++ /dev/null @@ -1,147 +0,0 @@ -aiohttp==3.9.5 -aiosignal==1.3.1 -annotated-types==0.7.0 -anyio==4.4.0 -appdirs==1.4.4 -asgiref==3.8.1 -async-timeout==4.0.3 -attrs==23.2.0 -bentoml==1.2.19 -build==1.2.1 -cattrs==23.1.2 -certifi==2024.7.4 -charset-normalizer==3.3.2 -circus==0.18.0 -click==8.1.7 -click-option-group==0.5.6 -cloudpickle==3.0.0 -cmake==3.30.0 -deepmerge==1.1.1 -deprecated==1.2.14 -diskcache==5.6.3 -distro==1.9.0 -dnspython==2.6.1 -email-validator==2.2.0 -exceptiongroup==1.2.1 -fastapi==0.111.0 -fastapi-cli==0.0.4 -filelock==3.15.4 -frozenlist==1.4.1 -fs==2.4.16 -fsspec==2024.6.1 -h11==0.14.0 -httpcore==1.0.5 -httptools==0.6.1 -httpx==0.27.0 -httpx-ws==0.6.0 -huggingface-hub==0.23.4 -idna==3.7 -importlib-metadata==6.11.0 -inflection==0.5.1 -interegular==0.3.3 -jinja2==3.1.4 -joblib==1.4.2 -jsonschema==4.22.0 -jsonschema-specifications==2023.12.1 -lark==1.1.9 -llvmlite==0.43.0 -lm-format-enforcer==0.10.1 -markdown-it-py==3.0.0 -markupsafe==2.1.5 -mdurl==0.1.2 -mpmath==1.3.0 -msgpack==1.0.8 -multidict==6.0.5 -nest-asyncio==1.6.0 -networkx==3.2.1 -ninja==1.11.1.1 -numba==0.60.0 -numpy==1.26.0 -nvidia-cublas-cu12==12.1.3.1 -nvidia-cuda-cupti-cu12==12.1.105 -nvidia-cuda-nvrtc-cu12==12.1.105 -nvidia-cuda-runtime-cu12==12.1.105 -nvidia-cudnn-cu12==8.9.2.26 -nvidia-cufft-cu12==11.0.2.54 -nvidia-curand-cu12==10.3.2.106 -nvidia-cusolver-cu12==11.4.5.107 -nvidia-cusparse-cu12==12.1.0.106 -nvidia-ml-py==11.525.150 -nvidia-nccl-cu12==2.20.5 -nvidia-nvjitlink-cu12==12.5.82 -nvidia-nvtx-cu12==12.1.105 -openai==1.35.10 -opentelemetry-api==1.20.0 -opentelemetry-instrumentation==0.41b0 -opentelemetry-instrumentation-aiohttp-client==0.41b0 -opentelemetry-instrumentation-asgi==0.41b0 -opentelemetry-sdk==1.20.0 -opentelemetry-semantic-conventions==0.41b0 -opentelemetry-util-http==0.41b0 -orjson==3.10.6 -outlines==0.0.34 -packaging==24.1 -pathspec==0.12.1 -pip-requirements-parser==32.0.1 -pip-tools==7.4.1 -prometheus-client==0.20.0 -prometheus-fastapi-instrumentator==7.0.0 -protobuf==5.27.2 -psutil==6.0.0 -py-cpuinfo==9.0.0 -pydantic==2.8.2 -pydantic-core==2.20.1 -pygments==2.18.0 -pyparsing==3.1.2 -pyproject-hooks==1.1.0 -python-dateutil==2.9.0.post0 -python-dotenv==1.0.1 -python-json-logger==2.0.7 -python-multipart==0.0.9 -pyyaml==6.0.1 -pyzmq==26.0.3 -ray==2.31.0 -referencing==0.35.1 -regex==2024.5.15 -requests==2.32.3 -rich==13.7.1 -rpds-py==0.18.1 -safetensors==0.4.3 -schema==0.7.7 -scipy==1.13.1 -sentencepiece==0.2.0 -shellingham==1.5.4 -simple-di==0.1.5 -six==1.16.0 -sniffio==1.3.1 -starlette==0.37.2 -sympy==1.12.1 -tiktoken==0.7.0 -tokenizers==0.19.1 -tomli==2.0.1 -tomli-w==1.0.0 -torch==2.3.0 -tornado==6.4.1 -tqdm==4.66.4 -transformers==4.41.0 -triton==2.3.0 -typer==0.12.3 -typing-extensions==4.12.2 -ujson==5.10.0 -urllib3==2.2.2 -uvicorn[standard]==0.30.1 -uvloop==0.19.0 -vllm==0.4.3 -vllm-flash-attn==2.5.8.post2 -watchfiles==0.22.0 -websockets==12.0 -wheel==0.43.0 -wrapt==1.16.0 -wsproto==1.2.0 -xformers==0.0.26.post1 -yarl==1.9.4 -zipp==3.19.2 - -# The following packages are considered to be unsafe in a requirements file: -pip==24.1.2 -setuptools==70.2.0 diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/README.md b/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/README.md deleted file mode 100644 index 297cc7b..0000000 --- a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/README.md +++ /dev/null @@ -1,16 +0,0 @@ -# phi3:3.8b-instruct-fp16-07bf - -[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) -[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) -[![join_slack](https://badgen.net/badge/Join/BentoML%20Slack/cyan?icon=slack)](https://l.bentoml.com/join-slack-swagger) -[![BentoML GitHub Repo](https://img.shields.io/github/stars/bentoml/bentoml?style=social)](https://github.com/bentoml/BentoML) -[![Twitter Follow](https://img.shields.io/twitter/follow/bentomlai?label=Follow%20BentoML&style=social)](https://twitter.com/bentomlai) - -This is a Machine Learning Service created with BentoML. - -## Help - -* [📖 Documentation](https://docs.bentoml.com/en/latest/): Learn how to use BentoML. -* [💬 Community](https://l.bentoml.com/join-slack-swagger): Join the BentoML Slack community. -* [🐛 GitHub Issues](https://github.com/bentoml/BentoML/issues): Report bugs and feature requests. -* Tip: you can also [customize this README](https://docs.bentoml.com/en/latest/concepts/bento.html#description). diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/env/python/requirements.lock.txt b/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/env/python/requirements.lock.txt deleted file mode 100644 index 925ce19..0000000 --- a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/env/python/requirements.lock.txt +++ /dev/null @@ -1,147 +0,0 @@ -aiohttp==3.9.5 -aiosignal==1.3.1 -annotated-types==0.7.0 -anyio==4.4.0 -appdirs==1.4.4 -asgiref==3.8.1 -async-timeout==4.0.3 -attrs==23.2.0 -bentoml==1.2.19 -build==1.2.1 -cattrs==23.1.2 -certifi==2024.7.4 -charset-normalizer==3.3.2 -circus==0.18.0 -click==8.1.7 -click-option-group==0.5.6 -cloudpickle==3.0.0 -cmake==3.30.0 -deepmerge==1.1.1 -deprecated==1.2.14 -diskcache==5.6.3 -distro==1.9.0 -dnspython==2.6.1 -email-validator==2.2.0 -exceptiongroup==1.2.1 -fastapi==0.111.0 -fastapi-cli==0.0.4 -filelock==3.15.4 -frozenlist==1.4.1 -fs==2.4.16 -fsspec==2024.6.1 -h11==0.14.0 -httpcore==1.0.5 -httptools==0.6.1 -httpx==0.27.0 -httpx-ws==0.6.0 -huggingface-hub==0.23.4 -idna==3.7 -importlib-metadata==6.11.0 -inflection==0.5.1 -interegular==0.3.3 -jinja2==3.1.4 -joblib==1.4.2 -jsonschema==4.22.0 -jsonschema-specifications==2023.12.1 -lark==1.1.9 -llvmlite==0.43.0 -lm-format-enforcer==0.10.1 -markdown-it-py==3.0.0 -markupsafe==2.1.5 -mdurl==0.1.2 -mpmath==1.3.0 -msgpack==1.0.8 -multidict==6.0.5 -nest-asyncio==1.6.0 -networkx==3.2.1 -ninja==1.11.1.1 -numba==0.60.0 -numpy==1.26.0 -nvidia-cublas-cu12==12.1.3.1 -nvidia-cuda-cupti-cu12==12.1.105 -nvidia-cuda-nvrtc-cu12==12.1.105 -nvidia-cuda-runtime-cu12==12.1.105 -nvidia-cudnn-cu12==8.9.2.26 -nvidia-cufft-cu12==11.0.2.54 -nvidia-curand-cu12==10.3.2.106 -nvidia-cusolver-cu12==11.4.5.107 -nvidia-cusparse-cu12==12.1.0.106 -nvidia-ml-py==11.525.150 -nvidia-nccl-cu12==2.20.5 -nvidia-nvjitlink-cu12==12.5.82 -nvidia-nvtx-cu12==12.1.105 -openai==1.35.10 -opentelemetry-api==1.20.0 -opentelemetry-instrumentation==0.41b0 -opentelemetry-instrumentation-aiohttp-client==0.41b0 -opentelemetry-instrumentation-asgi==0.41b0 -opentelemetry-sdk==1.20.0 -opentelemetry-semantic-conventions==0.41b0 -opentelemetry-util-http==0.41b0 -orjson==3.10.6 -outlines==0.0.34 -packaging==24.1 -pathspec==0.12.1 -pip-requirements-parser==32.0.1 -pip-tools==7.4.1 -prometheus-client==0.20.0 -prometheus-fastapi-instrumentator==7.0.0 -protobuf==5.27.2 -psutil==6.0.0 -py-cpuinfo==9.0.0 -pydantic==2.8.2 -pydantic-core==2.20.1 -pygments==2.18.0 -pyparsing==3.1.2 -pyproject-hooks==1.1.0 -python-dateutil==2.9.0.post0 -python-dotenv==1.0.1 -python-json-logger==2.0.7 -python-multipart==0.0.9 -pyyaml==6.0.1 -pyzmq==26.0.3 -ray==2.31.0 -referencing==0.35.1 -regex==2024.5.15 -requests==2.32.3 -rich==13.7.1 -rpds-py==0.18.1 -safetensors==0.4.3 -schema==0.7.7 -scipy==1.13.1 -sentencepiece==0.2.0 -shellingham==1.5.4 -simple-di==0.1.5 -six==1.16.0 -sniffio==1.3.1 -starlette==0.37.2 -sympy==1.12.1 -tiktoken==0.7.0 -tokenizers==0.19.1 -tomli==2.0.1 -tomli-w==1.0.0 -torch==2.3.0 -tornado==6.4.1 -tqdm==4.66.4 -transformers==4.41.0 -triton==2.3.0 -typer==0.12.3 -typing-extensions==4.12.2 -ujson==5.10.0 -urllib3==2.2.2 -uvicorn[standard]==0.30.1 -uvloop==0.19.0 -vllm==0.4.3 -vllm-flash-attn==2.5.8.post2 -watchfiles==0.22.0 -websockets==12.0 -wheel==0.43.0 -wrapt==1.16.0 -wsproto==1.2.0 -xformers==0.0.26.post1 -yarl==1.9.4 -zipp==3.19.2 - -# The following packages are considered to be unsafe in a requirements file: -pip==24.1.2 -setuptools==70.2.0 diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/README.md b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/README.md new file mode 100644 index 0000000..8c9dd12 --- /dev/null +++ b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/README.md @@ -0,0 +1,16 @@ +# phi3:3.8b-instruct-fp16-30b8 + +[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) +[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) +[![join_slack](https://badgen.net/badge/Join/BentoML%20Slack/cyan?icon=slack)](https://l.bentoml.com/join-slack-swagger) +[![BentoML GitHub Repo](https://img.shields.io/github/stars/bentoml/bentoml?style=social)](https://github.com/bentoml/BentoML) +[![Twitter Follow](https://img.shields.io/twitter/follow/bentomlai?label=Follow%20BentoML&style=social)](https://twitter.com/bentomlai) + +This is a Machine Learning Service created with BentoML. + +## Help + +* [📖 Documentation](https://docs.bentoml.com/en/latest/): Learn how to use BentoML. +* [💬 Community](https://l.bentoml.com/join-slack-swagger): Join the BentoML Slack community. +* [🐛 GitHub Issues](https://github.com/bentoml/BentoML/issues): Report bugs and feature requests. +* Tip: you can also [customize this README](https://docs.bentoml.com/en/latest/concepts/bento.html#description). diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/apis/openapi.yaml b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/apis/openapi.yaml similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/apis/openapi.yaml rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/apis/openapi.yaml diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/apis/schema.json b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/apis/schema.json similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/apis/schema.json rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/apis/schema.json diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/bento.yaml b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/bento.yaml similarity index 94% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/bento.yaml rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/bento.yaml index 7c133e5..8ccab76 100644 --- a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/bento.yaml +++ b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/bento.yaml @@ -1,12 +1,11 @@ service: service:VLLM name: phi3 -version: 3.8b-instruct-fp16-07bf +version: 3.8b-instruct-fp16-30b8 bentoml_version: 1.2.19 -creation_time: '2024-07-08T07:47:49.195324+00:00' +creation_time: '2024-07-12T13:28:39.030528+00:00' labels: + model_name: microsoft/Phi-3-mini-4k-instruct openllm_alias: 3.8b,3.8b-mini,3.8b-mini-instruct-4k-fp16 - openllm_hf_model_id: microsoft/Phi-3-mini-4k-instruct - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/env/docker/Dockerfile b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/env/docker/Dockerfile similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/env/docker/Dockerfile rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/env/docker/Dockerfile diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/env/docker/entrypoint.sh b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/env/docker/entrypoint.sh similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/env/docker/entrypoint.sh rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/env/docker/entrypoint.sh diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/env/python/install.sh b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/env/python/install.sh similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/env/python/install.sh rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/env/python/install.sh diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/env/python/requirements.lock.txt b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/env/python/requirements.lock.txt new file mode 100644 index 0000000..f6acdf5 --- /dev/null +++ b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/env/python/requirements.lock.txt @@ -0,0 +1,147 @@ +aiohttp==3.9.5 +aiosignal==1.3.1 +annotated-types==0.7.0 +anyio==4.4.0 +appdirs==1.4.4 +asgiref==3.8.1 +async-timeout==4.0.3 +attrs==23.2.0 +bentoml==1.2.19 +build==1.2.1 +cattrs==23.1.2 +certifi==2024.7.4 +charset-normalizer==3.3.2 +circus==0.18.0 +click==8.1.7 +click-option-group==0.5.6 +cloudpickle==3.0.0 +cmake==3.30.0 +deepmerge==1.1.1 +deprecated==1.2.14 +diskcache==5.6.3 +distro==1.9.0 +dnspython==2.6.1 +email-validator==2.2.0 +exceptiongroup==1.2.1 +fastapi==0.111.0 +fastapi-cli==0.0.4 +filelock==3.15.4 +frozenlist==1.4.1 +fs==2.4.16 +fsspec==2024.6.1 +h11==0.14.0 +httpcore==1.0.5 +httptools==0.6.1 +httpx==0.27.0 +httpx-ws==0.6.0 +huggingface-hub==0.23.4 +idna==3.7 +importlib-metadata==6.11.0 +inflection==0.5.1 +interegular==0.3.3 +jinja2==3.1.4 +joblib==1.4.2 +jsonschema==4.23.0 +jsonschema-specifications==2023.12.1 +lark==1.1.9 +llvmlite==0.43.0 +lm-format-enforcer==0.10.1 +markdown-it-py==3.0.0 +markupsafe==2.1.5 +mdurl==0.1.2 +mpmath==1.3.0 +msgpack==1.0.8 +multidict==6.0.5 +nest-asyncio==1.6.0 +networkx==3.2.1 +ninja==1.11.1.1 +numba==0.60.0 +numpy==1.26.0 +nvidia-cublas-cu12==12.1.3.1 +nvidia-cuda-cupti-cu12==12.1.105 +nvidia-cuda-nvrtc-cu12==12.1.105 +nvidia-cuda-runtime-cu12==12.1.105 +nvidia-cudnn-cu12==8.9.2.26 +nvidia-cufft-cu12==11.0.2.54 +nvidia-curand-cu12==10.3.2.106 +nvidia-cusolver-cu12==11.4.5.107 +nvidia-cusparse-cu12==12.1.0.106 +nvidia-ml-py==11.525.150 +nvidia-nccl-cu12==2.20.5 +nvidia-nvjitlink-cu12==12.5.82 +nvidia-nvtx-cu12==12.1.105 +openai==1.35.13 +opentelemetry-api==1.20.0 +opentelemetry-instrumentation==0.41b0 +opentelemetry-instrumentation-aiohttp-client==0.41b0 +opentelemetry-instrumentation-asgi==0.41b0 +opentelemetry-sdk==1.20.0 +opentelemetry-semantic-conventions==0.41b0 +opentelemetry-util-http==0.41b0 +orjson==3.10.6 +outlines==0.0.34 +packaging==24.1 +pathspec==0.12.1 +pip-requirements-parser==32.0.1 +pip-tools==7.4.1 +prometheus-client==0.20.0 +prometheus-fastapi-instrumentator==7.0.0 +protobuf==5.27.2 +psutil==6.0.0 +py-cpuinfo==9.0.0 +pydantic==2.8.2 +pydantic-core==2.20.1 +pygments==2.18.0 +pyparsing==3.1.2 +pyproject-hooks==1.1.0 +python-dateutil==2.9.0.post0 +python-dotenv==1.0.1 +python-json-logger==2.0.7 +python-multipart==0.0.9 +pyyaml==6.0.1 +pyzmq==26.0.3 +ray==2.32.0 +referencing==0.35.1 +regex==2024.5.15 +requests==2.32.3 +rich==13.7.1 +rpds-py==0.19.0 +safetensors==0.4.3 +schema==0.7.7 +scipy==1.13.1 +sentencepiece==0.2.0 +shellingham==1.5.4 +simple-di==0.1.5 +six==1.16.0 +sniffio==1.3.1 +starlette==0.37.2 +sympy==1.13.0 +tiktoken==0.7.0 +tokenizers==0.19.1 +tomli==2.0.1 +tomli-w==1.0.0 +torch==2.3.0 +tornado==6.4.1 +tqdm==4.66.4 +transformers==4.41.0 +triton==2.3.0 +typer==0.12.3 +typing-extensions==4.12.2 +ujson==5.10.0 +urllib3==2.2.2 +uvicorn[standard]==0.30.1 +uvloop==0.19.0 +vllm==0.4.3 +vllm-flash-attn==2.5.8.post2 +watchfiles==0.22.0 +websockets==12.0 +wheel==0.43.0 +wrapt==1.16.0 +wsproto==1.2.0 +xformers==0.0.26.post1 +yarl==1.9.4 +zipp==3.19.2 + +# The following packages are considered to be unsafe in a requirements file: +pip==24.1.2 +setuptools==70.3.0 diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/env/python/requirements.txt b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/env/python/requirements.txt similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/env/python/requirements.txt rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/env/python/requirements.txt diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/env/python/version.txt b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/env/python/version.txt similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/env/python/version.txt rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/env/python/version.txt diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/bento_constants.py b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/bento_constants.py similarity index 85% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/bento_constants.py rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/bento_constants.py index 0181e32..4a5496e 100644 --- a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/bento_constants.py +++ b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/bento_constants.py @@ -6,8 +6,8 @@ max_model_len: 4096 model: microsoft/Phi-3-mini-4k-instruct extra_labels: + model_name: microsoft/Phi-3-mini-4k-instruct openllm_alias: 3.8b,3.8b-mini,3.8b-mini-instruct-4k-fp16 - openllm_hf_model_id: microsoft/Phi-3-mini-4k-instruct project: vllm-chat service_config: name: phi3 diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/bentofile.yaml b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/bentofile.yaml similarity index 92% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/bentofile.yaml rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/bentofile.yaml index 4d1d51f..5848da8 100644 --- a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/bentofile.yaml +++ b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/bentofile.yaml @@ -28,9 +28,8 @@ include: - chat_templates/chat_templates/*.jinja - chat_templates/generation_configs/*.json labels: + model_name: microsoft/Phi-3-mini-4k-instruct openllm_alias: 3.8b,3.8b-mini,3.8b-mini-instruct-4k-fp16 - openllm_hf_model_id: microsoft/Phi-3-mini-4k-instruct - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/chat_templates/alpaca.jinja b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/chat_templates/alpaca.jinja similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/chat_templates/alpaca.jinja rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/chat_templates/alpaca.jinja diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/chat_templates/amberchat.jinja b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/chat_templates/amberchat.jinja similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/chat_templates/amberchat.jinja rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/chat_templates/amberchat.jinja diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/chat_templates/chatml.jinja b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/chat_templates/chatml.jinja similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/chat_templates/chatml.jinja rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/chat_templates/chatml.jinja diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/chat_templates/chatqa.jinja b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/chat_templates/chatqa.jinja similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/chat_templates/chatqa.jinja rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/chat_templates/chatqa.jinja diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/chat_templates/falcon-instruct.jinja b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/chat_templates/falcon-instruct.jinja similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/chat_templates/falcon-instruct.jinja rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/chat_templates/falcon-instruct.jinja diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/chat_templates/gemma-it.jinja b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/chat_templates/gemma-it.jinja similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/chat_templates/gemma-it.jinja rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/chat_templates/gemma-it.jinja diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/chat_templates/llama-2-chat.jinja b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/chat_templates/llama-2-chat.jinja similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/chat_templates/llama-2-chat.jinja rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/chat_templates/llama-2-chat.jinja diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/chat_templates/llama-3-chat.jinja b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/chat_templates/llama-3-chat.jinja similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/chat_templates/llama-3-chat.jinja rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/chat_templates/llama-3-chat.jinja diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/chat_templates/mistral-instruct.jinja b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/chat_templates/mistral-instruct.jinja similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/chat_templates/mistral-instruct.jinja rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/chat_templates/mistral-instruct.jinja diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/chat_templates/openchat.jinja b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/chat_templates/openchat.jinja similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/chat_templates/openchat.jinja rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/chat_templates/openchat.jinja diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/chat_templates/phi-3.jinja b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/chat_templates/phi-3.jinja similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/chat_templates/phi-3.jinja rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/chat_templates/phi-3.jinja diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/chat_templates/saiga.jinja b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/chat_templates/saiga.jinja similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/chat_templates/saiga.jinja rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/chat_templates/saiga.jinja diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/chat_templates/solar-instruct.jinja b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/chat_templates/solar-instruct.jinja similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/chat_templates/solar-instruct.jinja rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/chat_templates/solar-instruct.jinja diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/chat_templates/vicuna.jinja b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/chat_templates/vicuna.jinja similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/chat_templates/vicuna.jinja rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/chat_templates/vicuna.jinja diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/chat_templates/zephyr.jinja b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/chat_templates/zephyr.jinja similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/chat_templates/zephyr.jinja rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/chat_templates/zephyr.jinja diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/generation_configs/alpaca.json b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/generation_configs/alpaca.json similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/generation_configs/alpaca.json rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/generation_configs/alpaca.json diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/generation_configs/amberchat.json b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/generation_configs/amberchat.json similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/generation_configs/amberchat.json rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/generation_configs/amberchat.json diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/generation_configs/chatqa.json b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/generation_configs/chatqa.json similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/generation_configs/chatqa.json rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/generation_configs/chatqa.json diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/generation_configs/gemma-it.json b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/generation_configs/gemma-it.json similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/generation_configs/gemma-it.json rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/generation_configs/gemma-it.json diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/generation_configs/llama-2-chat.json b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/generation_configs/llama-2-chat.json similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/generation_configs/llama-2-chat.json rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/generation_configs/llama-2-chat.json diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/generation_configs/llama-3-chat.json b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/generation_configs/llama-3-chat.json similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/generation_configs/llama-3-chat.json rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/generation_configs/llama-3-chat.json diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/generation_configs/mistral-instruct.json b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/generation_configs/mistral-instruct.json similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/generation_configs/mistral-instruct.json rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/generation_configs/mistral-instruct.json diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/generation_configs/openchat.json b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/generation_configs/openchat.json similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/generation_configs/openchat.json rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/generation_configs/openchat.json diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/generation_configs/orca-2.json b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/generation_configs/orca-2.json similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/generation_configs/orca-2.json rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/generation_configs/orca-2.json diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/generation_configs/phi-3.json b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/generation_configs/phi-3.json similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/generation_configs/phi-3.json rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/generation_configs/phi-3.json diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/generation_configs/qwen2-chat.json b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/generation_configs/qwen2-chat.json similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/generation_configs/qwen2-chat.json rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/generation_configs/qwen2-chat.json diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/generation_configs/saiga.json b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/generation_configs/saiga.json similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/generation_configs/saiga.json rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/generation_configs/saiga.json diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/generation_configs/solar-instruct.json b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/generation_configs/solar-instruct.json similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/generation_configs/solar-instruct.json rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/generation_configs/solar-instruct.json diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/generation_configs/vicuna.json b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/generation_configs/vicuna.json similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/generation_configs/vicuna.json rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/generation_configs/vicuna.json diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/generation_configs/yi-chat.json b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/generation_configs/yi-chat.json similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/generation_configs/yi-chat.json rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/generation_configs/yi-chat.json diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/generation_configs/zephyr.json b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/generation_configs/zephyr.json similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/chat_templates/generation_configs/zephyr.json rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/chat_templates/generation_configs/zephyr.json diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/service.py b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/service.py similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/service.py rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/service.py diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/404.html b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/404.html similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/404.html rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/404.html diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/700-532b1fe2415e5859.js b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/700-532b1fe2415e5859.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/700-532b1fe2415e5859.js rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/700-532b1fe2415e5859.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/995-34374f39bb210839.js b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/995-34374f39bb210839.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/995-34374f39bb210839.js rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/995-34374f39bb210839.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/css/429544bd3cd8ce3a.css b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/css/429544bd3cd8ce3a.css similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/css/429544bd3cd8ce3a.css rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/css/429544bd3cd8ce3a.css diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/css/5b67f082b31cfc7b.css b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/css/5b67f082b31cfc7b.css similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/css/5b67f082b31cfc7b.css rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/css/5b67f082b31cfc7b.css diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/css/9e63023b20ddb15e.css b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/css/9e63023b20ddb15e.css similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/_next/static/css/9e63023b20ddb15e.css rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/_next/static/css/9e63023b20ddb15e.css diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/apple-touch-icon.png b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/apple-touch-icon.png similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/apple-touch-icon.png rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/apple-touch-icon.png diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/chat.html b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/chat.html similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/chat.html rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/chat.html diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/chat.txt b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/chat.txt similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/chat.txt rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/chat.txt diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/favicon-16x16.png b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/favicon-16x16.png similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/favicon-16x16.png rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/favicon-16x16.png diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/favicon.ico b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/favicon.ico similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/favicon.ico rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/favicon.ico diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/index.html b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/index.html similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/index.html rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/index.html diff --git a/bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/index.txt b/bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/index.txt similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-fp16-07bf/src/ui/index.txt rename to bentoml/bentos/phi3/3.8b-instruct-fp16-30b8/src/ui/index.txt diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/README.md b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/README.md deleted file mode 100644 index 730e2b4..0000000 --- a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/README.md +++ /dev/null @@ -1,16 +0,0 @@ -# phi3:3.8b-instruct-ggml-q4-584f - -[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) -[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) -[![join_slack](https://badgen.net/badge/Join/BentoML%20Slack/cyan?icon=slack)](https://l.bentoml.com/join-slack-swagger) -[![BentoML GitHub Repo](https://img.shields.io/github/stars/bentoml/bentoml?style=social)](https://github.com/bentoml/BentoML) -[![Twitter Follow](https://img.shields.io/twitter/follow/bentomlai?label=Follow%20BentoML&style=social)](https://twitter.com/bentomlai) - -This is a Machine Learning Service created with BentoML. - -## Help - -* [📖 Documentation](https://docs.bentoml.com/en/latest/): Learn how to use BentoML. -* [💬 Community](https://l.bentoml.com/join-slack-swagger): Join the BentoML Slack community. -* [🐛 GitHub Issues](https://github.com/bentoml/BentoML/issues): Report bugs and feature requests. -* Tip: you can also [customize this README](https://docs.bentoml.com/en/latest/concepts/bento.html#description). diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/README.md b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/README.md new file mode 100644 index 0000000..3cbe28f --- /dev/null +++ b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/README.md @@ -0,0 +1,16 @@ +# phi3:3.8b-instruct-ggml-q4-e31e + +[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) +[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) +[![join_slack](https://badgen.net/badge/Join/BentoML%20Slack/cyan?icon=slack)](https://l.bentoml.com/join-slack-swagger) +[![BentoML GitHub Repo](https://img.shields.io/github/stars/bentoml/bentoml?style=social)](https://github.com/bentoml/BentoML) +[![Twitter Follow](https://img.shields.io/twitter/follow/bentomlai?label=Follow%20BentoML&style=social)](https://twitter.com/bentomlai) + +This is a Machine Learning Service created with BentoML. + +## Help + +* [📖 Documentation](https://docs.bentoml.com/en/latest/): Learn how to use BentoML. +* [💬 Community](https://l.bentoml.com/join-slack-swagger): Join the BentoML Slack community. +* [🐛 GitHub Issues](https://github.com/bentoml/BentoML/issues): Report bugs and feature requests. +* Tip: you can also [customize this README](https://docs.bentoml.com/en/latest/concepts/bento.html#description). diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/apis/openapi.yaml b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/apis/openapi.yaml similarity index 99% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/apis/openapi.yaml rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/apis/openapi.yaml index 54d43aa..31d8b84 100644 --- a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/apis/openapi.yaml +++ b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/apis/openapi.yaml @@ -127,7 +127,7 @@ components: anyOf: - type: boolean - type: 'null' - default: false + default: true title: Stream temperature: anyOf: @@ -273,7 +273,7 @@ paths: title: Stop type: array stream: - default: false + default: true title: Stream type: boolean temperature: diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/apis/schema.json b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/apis/schema.json similarity index 98% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/apis/schema.json rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/apis/schema.json index 17fe798..c53823f 100644 --- a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/apis/schema.json +++ b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/apis/schema.json @@ -62,7 +62,7 @@ "type": "array" }, "stream": { - "default": false, + "default": true, "title": "Stream", "type": "boolean" }, diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/bento.yaml b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/bento.yaml similarity index 93% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/bento.yaml rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/bento.yaml index 955d0af..a222bbc 100644 --- a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/bento.yaml +++ b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/bento.yaml @@ -1,12 +1,11 @@ service: service:LlamaCppChat name: phi3 -version: 3.8b-instruct-ggml-q4-584f +version: 3.8b-instruct-ggml-q4-e31e bentoml_version: 1.2.19 -creation_time: '2024-07-08T08:07:54.266242+00:00' +creation_time: '2024-07-12T13:52:53.455637+00:00' labels: + model_name: microsoft/Phi-3-mini-4k-instruct-gguf openllm_alias: 3.8b-q4,3.8b-mini-q4,3.8b-mini-instruct-4k-ggml-q4 - openllm_hf_model_id: microsoft/Phi-3-mini-4k-instruct-gguf - owner: bentoml-team platforms: macos source: https://github.com/bentoml/openllm-models-feed/tree/main/source/llamacpp-chat models: [] @@ -75,7 +74,7 @@ schema: type: string type: array stream: - default: false + default: true title: Stream type: boolean temperature: diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/env/docker/Dockerfile b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/env/docker/Dockerfile similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/env/docker/Dockerfile rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/env/docker/Dockerfile diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/env/docker/entrypoint.sh b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/env/docker/entrypoint.sh similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/env/docker/entrypoint.sh rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/env/docker/entrypoint.sh diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/env/python/install.sh b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/env/python/install.sh similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/env/python/install.sh rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/env/python/install.sh diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/env/python/requirements.lock.txt b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/env/python/requirements.lock.txt similarity index 99% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/env/python/requirements.lock.txt rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/env/python/requirements.lock.txt index 35a2baa..0df0625 100644 --- a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/env/python/requirements.lock.txt +++ b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/env/python/requirements.lock.txt @@ -97,4 +97,4 @@ zipp==3.19.2 # The following packages are considered to be unsafe in a requirements file: pip==24.1.2 -setuptools==70.2.0 +setuptools==70.3.0 diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/env/python/requirements.txt b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/env/python/requirements.txt similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/env/python/requirements.txt rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/env/python/requirements.txt diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/env/python/version.txt b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/env/python/version.txt similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/env/python/version.txt rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/env/python/version.txt diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/bento_constants.py b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/bento_constants.py similarity index 84% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/bento_constants.py rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/bento_constants.py index 16585ed..f802573 100644 --- a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/bento_constants.py +++ b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/bento_constants.py @@ -5,8 +5,8 @@ max_model_len: 2048 model: microsoft/Phi-3-mini-4k-instruct-gguf extra_labels: + model_name: microsoft/Phi-3-mini-4k-instruct-gguf openllm_alias: 3.8b-q4,3.8b-mini-q4,3.8b-mini-instruct-4k-ggml-q4 - openllm_hf_model_id: microsoft/Phi-3-mini-4k-instruct-gguf project: llamacpp-chat service_config: name: phi3 diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/bentofile.yaml b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/bentofile.yaml similarity index 91% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/bentofile.yaml rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/bentofile.yaml index 2004a12..d032987 100644 --- a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/bentofile.yaml +++ b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/bentofile.yaml @@ -22,9 +22,8 @@ include: - '*.py' - ui/* labels: + model_name: microsoft/Phi-3-mini-4k-instruct-gguf openllm_alias: 3.8b-q4,3.8b-mini-q4,3.8b-mini-instruct-4k-ggml-q4 - openllm_hf_model_id: microsoft/Phi-3-mini-4k-instruct-gguf - owner: bentoml-team platforms: macos source: https://github.com/bentoml/openllm-models-feed/tree/main/source/llamacpp-chat models: [] diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/service.py b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/service.py similarity index 97% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/service.py rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/service.py index 3cfd766..146a84c 100644 --- a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/service.py +++ b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/service.py @@ -9,7 +9,7 @@ import fastapi.staticfiles import os from fastapi.responses import FileResponse -from typing_extensions import Annotated, Literal +from typing_extensions import Literal import sys import pydantic from bentoml.io import SSE @@ -76,7 +76,7 @@ async def catch_all(full_path: str): @bentoml.mount_asgi_app(openai_api_app, path="/v1") @bentoml.service(**SERVICE_CONFIG) class LlamaCppChat: - + def __init__(self) -> None: self.llm = Llama.from_pretrained( repo_id=ENGINE_CONFIG["model"], @@ -97,7 +97,7 @@ async def chat_completions( Le(ENGINE_CONFIG["max_model_len"]), ] = ENGINE_CONFIG["max_model_len"], stop: Optional[list[str]] = None, - stream: Optional[bool] = False, + stream: Optional[bool] = True, temperature: Optional[float] = 0, top_p: Optional[float] = 1.0, frequency_penalty: Optional[float] = 0.0, @@ -107,6 +107,7 @@ async def chat_completions( """ try: response = self.llm.create_chat_completion( + model=model, messages=messages, max_tokens=max_tokens, stream=stream, @@ -125,7 +126,7 @@ async def chat_completions( except Exception as e: print(e) yield SSE(data=str(e)).marshal() - + yield SSE(data="[DONE]").marshal() except Exception as e: yield SSE(data=str(e)).marshal() diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/404.html b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/404.html similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/404.html rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/404.html diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/700-532b1fe2415e5859.js b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/700-532b1fe2415e5859.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/700-532b1fe2415e5859.js rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/700-532b1fe2415e5859.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/995-34374f39bb210839.js b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/995-34374f39bb210839.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/995-34374f39bb210839.js rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/995-34374f39bb210839.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/css/429544bd3cd8ce3a.css b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/css/429544bd3cd8ce3a.css similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/css/429544bd3cd8ce3a.css rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/css/429544bd3cd8ce3a.css diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/css/5b67f082b31cfc7b.css b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/css/5b67f082b31cfc7b.css similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/css/5b67f082b31cfc7b.css rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/css/5b67f082b31cfc7b.css diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/css/9e63023b20ddb15e.css b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/css/9e63023b20ddb15e.css similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/_next/static/css/9e63023b20ddb15e.css rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/_next/static/css/9e63023b20ddb15e.css diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/apple-touch-icon.png b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/apple-touch-icon.png similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/apple-touch-icon.png rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/apple-touch-icon.png diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/chat.html b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/chat.html similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/chat.html rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/chat.html diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/chat.txt b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/chat.txt similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/chat.txt rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/chat.txt diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/favicon-16x16.png b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/favicon-16x16.png similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/favicon-16x16.png rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/favicon-16x16.png diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/favicon.ico b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/favicon.ico similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/favicon.ico rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/favicon.ico diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/index.html b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/index.html similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/index.html rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/index.html diff --git a/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/index.txt b/bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/index.txt similarity index 100% rename from bentoml/bentos/phi3/3.8b-instruct-ggml-q4-584f/src/ui/index.txt rename to bentoml/bentos/phi3/3.8b-instruct-ggml-q4-e31e/src/ui/index.txt diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/README.md b/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/README.md deleted file mode 100644 index 044b517..0000000 --- a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/README.md +++ /dev/null @@ -1,16 +0,0 @@ -# qwen2:0.5b-instruct-fp16-96bb - -[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) -[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) -[![join_slack](https://badgen.net/badge/Join/BentoML%20Slack/cyan?icon=slack)](https://l.bentoml.com/join-slack-swagger) -[![BentoML GitHub Repo](https://img.shields.io/github/stars/bentoml/bentoml?style=social)](https://github.com/bentoml/BentoML) -[![Twitter Follow](https://img.shields.io/twitter/follow/bentomlai?label=Follow%20BentoML&style=social)](https://twitter.com/bentomlai) - -This is a Machine Learning Service created with BentoML. - -## Help - -* [📖 Documentation](https://docs.bentoml.com/en/latest/): Learn how to use BentoML. -* [💬 Community](https://l.bentoml.com/join-slack-swagger): Join the BentoML Slack community. -* [🐛 GitHub Issues](https://github.com/bentoml/BentoML/issues): Report bugs and feature requests. -* Tip: you can also [customize this README](https://docs.bentoml.com/en/latest/concepts/bento.html#description). diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/env/python/requirements.lock.txt b/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/env/python/requirements.lock.txt deleted file mode 100644 index 925ce19..0000000 --- a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/env/python/requirements.lock.txt +++ /dev/null @@ -1,147 +0,0 @@ -aiohttp==3.9.5 -aiosignal==1.3.1 -annotated-types==0.7.0 -anyio==4.4.0 -appdirs==1.4.4 -asgiref==3.8.1 -async-timeout==4.0.3 -attrs==23.2.0 -bentoml==1.2.19 -build==1.2.1 -cattrs==23.1.2 -certifi==2024.7.4 -charset-normalizer==3.3.2 -circus==0.18.0 -click==8.1.7 -click-option-group==0.5.6 -cloudpickle==3.0.0 -cmake==3.30.0 -deepmerge==1.1.1 -deprecated==1.2.14 -diskcache==5.6.3 -distro==1.9.0 -dnspython==2.6.1 -email-validator==2.2.0 -exceptiongroup==1.2.1 -fastapi==0.111.0 -fastapi-cli==0.0.4 -filelock==3.15.4 -frozenlist==1.4.1 -fs==2.4.16 -fsspec==2024.6.1 -h11==0.14.0 -httpcore==1.0.5 -httptools==0.6.1 -httpx==0.27.0 -httpx-ws==0.6.0 -huggingface-hub==0.23.4 -idna==3.7 -importlib-metadata==6.11.0 -inflection==0.5.1 -interegular==0.3.3 -jinja2==3.1.4 -joblib==1.4.2 -jsonschema==4.22.0 -jsonschema-specifications==2023.12.1 -lark==1.1.9 -llvmlite==0.43.0 -lm-format-enforcer==0.10.1 -markdown-it-py==3.0.0 -markupsafe==2.1.5 -mdurl==0.1.2 -mpmath==1.3.0 -msgpack==1.0.8 -multidict==6.0.5 -nest-asyncio==1.6.0 -networkx==3.2.1 -ninja==1.11.1.1 -numba==0.60.0 -numpy==1.26.0 -nvidia-cublas-cu12==12.1.3.1 -nvidia-cuda-cupti-cu12==12.1.105 -nvidia-cuda-nvrtc-cu12==12.1.105 -nvidia-cuda-runtime-cu12==12.1.105 -nvidia-cudnn-cu12==8.9.2.26 -nvidia-cufft-cu12==11.0.2.54 -nvidia-curand-cu12==10.3.2.106 -nvidia-cusolver-cu12==11.4.5.107 -nvidia-cusparse-cu12==12.1.0.106 -nvidia-ml-py==11.525.150 -nvidia-nccl-cu12==2.20.5 -nvidia-nvjitlink-cu12==12.5.82 -nvidia-nvtx-cu12==12.1.105 -openai==1.35.10 -opentelemetry-api==1.20.0 -opentelemetry-instrumentation==0.41b0 -opentelemetry-instrumentation-aiohttp-client==0.41b0 -opentelemetry-instrumentation-asgi==0.41b0 -opentelemetry-sdk==1.20.0 -opentelemetry-semantic-conventions==0.41b0 -opentelemetry-util-http==0.41b0 -orjson==3.10.6 -outlines==0.0.34 -packaging==24.1 -pathspec==0.12.1 -pip-requirements-parser==32.0.1 -pip-tools==7.4.1 -prometheus-client==0.20.0 -prometheus-fastapi-instrumentator==7.0.0 -protobuf==5.27.2 -psutil==6.0.0 -py-cpuinfo==9.0.0 -pydantic==2.8.2 -pydantic-core==2.20.1 -pygments==2.18.0 -pyparsing==3.1.2 -pyproject-hooks==1.1.0 -python-dateutil==2.9.0.post0 -python-dotenv==1.0.1 -python-json-logger==2.0.7 -python-multipart==0.0.9 -pyyaml==6.0.1 -pyzmq==26.0.3 -ray==2.31.0 -referencing==0.35.1 -regex==2024.5.15 -requests==2.32.3 -rich==13.7.1 -rpds-py==0.18.1 -safetensors==0.4.3 -schema==0.7.7 -scipy==1.13.1 -sentencepiece==0.2.0 -shellingham==1.5.4 -simple-di==0.1.5 -six==1.16.0 -sniffio==1.3.1 -starlette==0.37.2 -sympy==1.12.1 -tiktoken==0.7.0 -tokenizers==0.19.1 -tomli==2.0.1 -tomli-w==1.0.0 -torch==2.3.0 -tornado==6.4.1 -tqdm==4.66.4 -transformers==4.41.0 -triton==2.3.0 -typer==0.12.3 -typing-extensions==4.12.2 -ujson==5.10.0 -urllib3==2.2.2 -uvicorn[standard]==0.30.1 -uvloop==0.19.0 -vllm==0.4.3 -vllm-flash-attn==2.5.8.post2 -watchfiles==0.22.0 -websockets==12.0 -wheel==0.43.0 -wrapt==1.16.0 -wsproto==1.2.0 -xformers==0.0.26.post1 -yarl==1.9.4 -zipp==3.19.2 - -# The following packages are considered to be unsafe in a requirements file: -pip==24.1.2 -setuptools==70.2.0 diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/README.md b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/README.md new file mode 100644 index 0000000..3680fbe --- /dev/null +++ b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/README.md @@ -0,0 +1,16 @@ +# qwen2:0.5b-instruct-fp16-fcc6 + +[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) +[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) +[![join_slack](https://badgen.net/badge/Join/BentoML%20Slack/cyan?icon=slack)](https://l.bentoml.com/join-slack-swagger) +[![BentoML GitHub Repo](https://img.shields.io/github/stars/bentoml/bentoml?style=social)](https://github.com/bentoml/BentoML) +[![Twitter Follow](https://img.shields.io/twitter/follow/bentomlai?label=Follow%20BentoML&style=social)](https://twitter.com/bentomlai) + +This is a Machine Learning Service created with BentoML. + +## Help + +* [📖 Documentation](https://docs.bentoml.com/en/latest/): Learn how to use BentoML. +* [💬 Community](https://l.bentoml.com/join-slack-swagger): Join the BentoML Slack community. +* [🐛 GitHub Issues](https://github.com/bentoml/BentoML/issues): Report bugs and feature requests. +* Tip: you can also [customize this README](https://docs.bentoml.com/en/latest/concepts/bento.html#description). diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/apis/openapi.yaml b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/apis/openapi.yaml similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/apis/openapi.yaml rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/apis/openapi.yaml diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/apis/schema.json b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/apis/schema.json similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/apis/schema.json rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/apis/schema.json diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/bento.yaml b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/bento.yaml similarity index 95% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/bento.yaml rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/bento.yaml index 70e7ad5..8cd0e70 100644 --- a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/bento.yaml +++ b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/bento.yaml @@ -1,12 +1,11 @@ service: service:VLLM name: qwen2 -version: 0.5b-instruct-fp16-96bb +version: 0.5b-instruct-fp16-fcc6 bentoml_version: 1.2.19 -creation_time: '2024-07-08T08:01:59.846091+00:00' +creation_time: '2024-07-12T13:45:29.217202+00:00' labels: + model_name: Qwen/Qwen2-0.5B-Instruct openllm_alias: 0.5b,0.5b-instruct - openllm_hf_model_id: Qwen/Qwen2-0.5B-Instruct - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/env/docker/Dockerfile b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/env/docker/Dockerfile similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/env/docker/Dockerfile rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/env/docker/Dockerfile diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/env/docker/entrypoint.sh b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/env/docker/entrypoint.sh similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/env/docker/entrypoint.sh rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/env/docker/entrypoint.sh diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/env/python/install.sh b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/env/python/install.sh similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/env/python/install.sh rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/env/python/install.sh diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/env/python/requirements.lock.txt b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/env/python/requirements.lock.txt new file mode 100644 index 0000000..f6acdf5 --- /dev/null +++ b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/env/python/requirements.lock.txt @@ -0,0 +1,147 @@ +aiohttp==3.9.5 +aiosignal==1.3.1 +annotated-types==0.7.0 +anyio==4.4.0 +appdirs==1.4.4 +asgiref==3.8.1 +async-timeout==4.0.3 +attrs==23.2.0 +bentoml==1.2.19 +build==1.2.1 +cattrs==23.1.2 +certifi==2024.7.4 +charset-normalizer==3.3.2 +circus==0.18.0 +click==8.1.7 +click-option-group==0.5.6 +cloudpickle==3.0.0 +cmake==3.30.0 +deepmerge==1.1.1 +deprecated==1.2.14 +diskcache==5.6.3 +distro==1.9.0 +dnspython==2.6.1 +email-validator==2.2.0 +exceptiongroup==1.2.1 +fastapi==0.111.0 +fastapi-cli==0.0.4 +filelock==3.15.4 +frozenlist==1.4.1 +fs==2.4.16 +fsspec==2024.6.1 +h11==0.14.0 +httpcore==1.0.5 +httptools==0.6.1 +httpx==0.27.0 +httpx-ws==0.6.0 +huggingface-hub==0.23.4 +idna==3.7 +importlib-metadata==6.11.0 +inflection==0.5.1 +interegular==0.3.3 +jinja2==3.1.4 +joblib==1.4.2 +jsonschema==4.23.0 +jsonschema-specifications==2023.12.1 +lark==1.1.9 +llvmlite==0.43.0 +lm-format-enforcer==0.10.1 +markdown-it-py==3.0.0 +markupsafe==2.1.5 +mdurl==0.1.2 +mpmath==1.3.0 +msgpack==1.0.8 +multidict==6.0.5 +nest-asyncio==1.6.0 +networkx==3.2.1 +ninja==1.11.1.1 +numba==0.60.0 +numpy==1.26.0 +nvidia-cublas-cu12==12.1.3.1 +nvidia-cuda-cupti-cu12==12.1.105 +nvidia-cuda-nvrtc-cu12==12.1.105 +nvidia-cuda-runtime-cu12==12.1.105 +nvidia-cudnn-cu12==8.9.2.26 +nvidia-cufft-cu12==11.0.2.54 +nvidia-curand-cu12==10.3.2.106 +nvidia-cusolver-cu12==11.4.5.107 +nvidia-cusparse-cu12==12.1.0.106 +nvidia-ml-py==11.525.150 +nvidia-nccl-cu12==2.20.5 +nvidia-nvjitlink-cu12==12.5.82 +nvidia-nvtx-cu12==12.1.105 +openai==1.35.13 +opentelemetry-api==1.20.0 +opentelemetry-instrumentation==0.41b0 +opentelemetry-instrumentation-aiohttp-client==0.41b0 +opentelemetry-instrumentation-asgi==0.41b0 +opentelemetry-sdk==1.20.0 +opentelemetry-semantic-conventions==0.41b0 +opentelemetry-util-http==0.41b0 +orjson==3.10.6 +outlines==0.0.34 +packaging==24.1 +pathspec==0.12.1 +pip-requirements-parser==32.0.1 +pip-tools==7.4.1 +prometheus-client==0.20.0 +prometheus-fastapi-instrumentator==7.0.0 +protobuf==5.27.2 +psutil==6.0.0 +py-cpuinfo==9.0.0 +pydantic==2.8.2 +pydantic-core==2.20.1 +pygments==2.18.0 +pyparsing==3.1.2 +pyproject-hooks==1.1.0 +python-dateutil==2.9.0.post0 +python-dotenv==1.0.1 +python-json-logger==2.0.7 +python-multipart==0.0.9 +pyyaml==6.0.1 +pyzmq==26.0.3 +ray==2.32.0 +referencing==0.35.1 +regex==2024.5.15 +requests==2.32.3 +rich==13.7.1 +rpds-py==0.19.0 +safetensors==0.4.3 +schema==0.7.7 +scipy==1.13.1 +sentencepiece==0.2.0 +shellingham==1.5.4 +simple-di==0.1.5 +six==1.16.0 +sniffio==1.3.1 +starlette==0.37.2 +sympy==1.13.0 +tiktoken==0.7.0 +tokenizers==0.19.1 +tomli==2.0.1 +tomli-w==1.0.0 +torch==2.3.0 +tornado==6.4.1 +tqdm==4.66.4 +transformers==4.41.0 +triton==2.3.0 +typer==0.12.3 +typing-extensions==4.12.2 +ujson==5.10.0 +urllib3==2.2.2 +uvicorn[standard]==0.30.1 +uvloop==0.19.0 +vllm==0.4.3 +vllm-flash-attn==2.5.8.post2 +watchfiles==0.22.0 +websockets==12.0 +wheel==0.43.0 +wrapt==1.16.0 +wsproto==1.2.0 +xformers==0.0.26.post1 +yarl==1.9.4 +zipp==3.19.2 + +# The following packages are considered to be unsafe in a requirements file: +pip==24.1.2 +setuptools==70.3.0 diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/env/python/requirements.txt b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/env/python/requirements.txt similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/env/python/requirements.txt rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/env/python/requirements.txt diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/env/python/version.txt b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/env/python/version.txt similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/env/python/version.txt rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/env/python/version.txt diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/bento_constants.py b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/bento_constants.py similarity index 85% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/bento_constants.py rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/bento_constants.py index cdd2cc3..95732c2 100644 --- a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/bento_constants.py +++ b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/bento_constants.py @@ -5,8 +5,8 @@ max_model_len: 2048 model: Qwen/Qwen2-0.5B-Instruct extra_labels: + model_name: Qwen/Qwen2-0.5B-Instruct openllm_alias: 0.5b,0.5b-instruct - openllm_hf_model_id: Qwen/Qwen2-0.5B-Instruct project: vllm-chat service_config: name: qwen2 diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/bentofile.yaml b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/bentofile.yaml similarity index 93% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/bentofile.yaml rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/bentofile.yaml index aac3406..12b35db 100644 --- a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/bentofile.yaml +++ b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/bentofile.yaml @@ -28,9 +28,8 @@ include: - chat_templates/chat_templates/*.jinja - chat_templates/generation_configs/*.json labels: + model_name: Qwen/Qwen2-0.5B-Instruct openllm_alias: 0.5b,0.5b-instruct - openllm_hf_model_id: Qwen/Qwen2-0.5B-Instruct - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/chat_templates/alpaca.jinja b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/chat_templates/alpaca.jinja similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/chat_templates/alpaca.jinja rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/chat_templates/alpaca.jinja diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/chat_templates/amberchat.jinja b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/chat_templates/amberchat.jinja similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/chat_templates/amberchat.jinja rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/chat_templates/amberchat.jinja diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/chat_templates/chatml.jinja b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/chat_templates/chatml.jinja similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/chat_templates/chatml.jinja rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/chat_templates/chatml.jinja diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/chat_templates/chatqa.jinja b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/chat_templates/chatqa.jinja similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/chat_templates/chatqa.jinja rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/chat_templates/chatqa.jinja diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/chat_templates/falcon-instruct.jinja b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/chat_templates/falcon-instruct.jinja similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/chat_templates/falcon-instruct.jinja rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/chat_templates/falcon-instruct.jinja diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/chat_templates/gemma-it.jinja b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/chat_templates/gemma-it.jinja similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/chat_templates/gemma-it.jinja rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/chat_templates/gemma-it.jinja diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/chat_templates/llama-2-chat.jinja b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/chat_templates/llama-2-chat.jinja similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/chat_templates/llama-2-chat.jinja rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/chat_templates/llama-2-chat.jinja diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/chat_templates/llama-3-chat.jinja b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/chat_templates/llama-3-chat.jinja similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/chat_templates/llama-3-chat.jinja rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/chat_templates/llama-3-chat.jinja diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/chat_templates/mistral-instruct.jinja b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/chat_templates/mistral-instruct.jinja similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/chat_templates/mistral-instruct.jinja rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/chat_templates/mistral-instruct.jinja diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/chat_templates/openchat.jinja b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/chat_templates/openchat.jinja similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/chat_templates/openchat.jinja rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/chat_templates/openchat.jinja diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/chat_templates/phi-3.jinja b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/chat_templates/phi-3.jinja similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/chat_templates/phi-3.jinja rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/chat_templates/phi-3.jinja diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/chat_templates/saiga.jinja b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/chat_templates/saiga.jinja similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/chat_templates/saiga.jinja rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/chat_templates/saiga.jinja diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/chat_templates/solar-instruct.jinja b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/chat_templates/solar-instruct.jinja similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/chat_templates/solar-instruct.jinja rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/chat_templates/solar-instruct.jinja diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/chat_templates/vicuna.jinja b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/chat_templates/vicuna.jinja similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/chat_templates/vicuna.jinja rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/chat_templates/vicuna.jinja diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/chat_templates/zephyr.jinja b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/chat_templates/zephyr.jinja similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/chat_templates/zephyr.jinja rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/chat_templates/zephyr.jinja diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/generation_configs/alpaca.json b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/generation_configs/alpaca.json similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/generation_configs/alpaca.json rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/generation_configs/alpaca.json diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/generation_configs/amberchat.json b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/generation_configs/amberchat.json similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/generation_configs/amberchat.json rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/generation_configs/amberchat.json diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/generation_configs/chatqa.json b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/generation_configs/chatqa.json similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/generation_configs/chatqa.json rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/generation_configs/chatqa.json diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/generation_configs/gemma-it.json b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/generation_configs/gemma-it.json similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/generation_configs/gemma-it.json rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/generation_configs/gemma-it.json diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/generation_configs/llama-2-chat.json b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/generation_configs/llama-2-chat.json similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/generation_configs/llama-2-chat.json rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/generation_configs/llama-2-chat.json diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/generation_configs/llama-3-chat.json b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/generation_configs/llama-3-chat.json similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/generation_configs/llama-3-chat.json rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/generation_configs/llama-3-chat.json diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/generation_configs/mistral-instruct.json b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/generation_configs/mistral-instruct.json similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/generation_configs/mistral-instruct.json rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/generation_configs/mistral-instruct.json diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/generation_configs/openchat.json b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/generation_configs/openchat.json similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/generation_configs/openchat.json rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/generation_configs/openchat.json diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/generation_configs/orca-2.json b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/generation_configs/orca-2.json similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/generation_configs/orca-2.json rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/generation_configs/orca-2.json diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/generation_configs/phi-3.json b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/generation_configs/phi-3.json similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/generation_configs/phi-3.json rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/generation_configs/phi-3.json diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/generation_configs/qwen2-chat.json b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/generation_configs/qwen2-chat.json similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/generation_configs/qwen2-chat.json rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/generation_configs/qwen2-chat.json diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/generation_configs/saiga.json b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/generation_configs/saiga.json similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/generation_configs/saiga.json rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/generation_configs/saiga.json diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/generation_configs/solar-instruct.json b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/generation_configs/solar-instruct.json similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/generation_configs/solar-instruct.json rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/generation_configs/solar-instruct.json diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/generation_configs/vicuna.json b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/generation_configs/vicuna.json similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/generation_configs/vicuna.json rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/generation_configs/vicuna.json diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/generation_configs/yi-chat.json b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/generation_configs/yi-chat.json similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/generation_configs/yi-chat.json rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/generation_configs/yi-chat.json diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/generation_configs/zephyr.json b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/generation_configs/zephyr.json similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/chat_templates/generation_configs/zephyr.json rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/chat_templates/generation_configs/zephyr.json diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/service.py b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/service.py similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/service.py rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/service.py diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/404.html b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/404.html similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/404.html rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/404.html diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/700-532b1fe2415e5859.js b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/700-532b1fe2415e5859.js similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/700-532b1fe2415e5859.js rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/700-532b1fe2415e5859.js diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/995-34374f39bb210839.js b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/995-34374f39bb210839.js similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/995-34374f39bb210839.js rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/995-34374f39bb210839.js diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/css/429544bd3cd8ce3a.css b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/css/429544bd3cd8ce3a.css similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/css/429544bd3cd8ce3a.css rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/css/429544bd3cd8ce3a.css diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/css/5b67f082b31cfc7b.css b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/css/5b67f082b31cfc7b.css similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/css/5b67f082b31cfc7b.css rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/css/5b67f082b31cfc7b.css diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/css/9e63023b20ddb15e.css b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/css/9e63023b20ddb15e.css similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/_next/static/css/9e63023b20ddb15e.css rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/_next/static/css/9e63023b20ddb15e.css diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/apple-touch-icon.png b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/apple-touch-icon.png similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/apple-touch-icon.png rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/apple-touch-icon.png diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/chat.html b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/chat.html similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/chat.html rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/chat.html diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/chat.txt b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/chat.txt similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/chat.txt rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/chat.txt diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/favicon-16x16.png b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/favicon-16x16.png similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/favicon-16x16.png rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/favicon-16x16.png diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/favicon.ico b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/favicon.ico similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/favicon.ico rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/favicon.ico diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/index.html b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/index.html similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/index.html rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/index.html diff --git a/bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/index.txt b/bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/index.txt similarity index 100% rename from bentoml/bentos/qwen2/0.5b-instruct-fp16-96bb/src/ui/index.txt rename to bentoml/bentos/qwen2/0.5b-instruct-fp16-fcc6/src/ui/index.txt diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/README.md b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/README.md new file mode 100644 index 0000000..e79d287 --- /dev/null +++ b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/README.md @@ -0,0 +1,16 @@ +# qwen2:1.5b-instruct-fp16-50d8 + +[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) +[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) +[![join_slack](https://badgen.net/badge/Join/BentoML%20Slack/cyan?icon=slack)](https://l.bentoml.com/join-slack-swagger) +[![BentoML GitHub Repo](https://img.shields.io/github/stars/bentoml/bentoml?style=social)](https://github.com/bentoml/BentoML) +[![Twitter Follow](https://img.shields.io/twitter/follow/bentomlai?label=Follow%20BentoML&style=social)](https://twitter.com/bentomlai) + +This is a Machine Learning Service created with BentoML. + +## Help + +* [📖 Documentation](https://docs.bentoml.com/en/latest/): Learn how to use BentoML. +* [💬 Community](https://l.bentoml.com/join-slack-swagger): Join the BentoML Slack community. +* [🐛 GitHub Issues](https://github.com/bentoml/BentoML/issues): Report bugs and feature requests. +* Tip: you can also [customize this README](https://docs.bentoml.com/en/latest/concepts/bento.html#description). diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/apis/openapi.yaml b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/apis/openapi.yaml similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/apis/openapi.yaml rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/apis/openapi.yaml diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/apis/schema.json b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/apis/schema.json similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/apis/schema.json rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/apis/schema.json diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/bento.yaml b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/bento.yaml similarity index 95% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/bento.yaml rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/bento.yaml index 7d3c565..c4c3532 100644 --- a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/bento.yaml +++ b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/bento.yaml @@ -1,12 +1,11 @@ service: service:VLLM name: qwen2 -version: 1.5b-instruct-fp16-ec69 +version: 1.5b-instruct-fp16-50d8 bentoml_version: 1.2.19 -creation_time: '2024-07-08T08:02:52.426817+00:00' +creation_time: '2024-07-12T13:46:35.790743+00:00' labels: + model_name: Qwen/Qwen2-1.5B-Instruct openllm_alias: 1.5b,1.5b-instruct - openllm_hf_model_id: Qwen/Qwen2-1.5B-Instruct - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/env/docker/Dockerfile b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/env/docker/Dockerfile similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/env/docker/Dockerfile rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/env/docker/Dockerfile diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/env/docker/entrypoint.sh b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/env/docker/entrypoint.sh similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/env/docker/entrypoint.sh rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/env/docker/entrypoint.sh diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/env/python/install.sh b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/env/python/install.sh similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/env/python/install.sh rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/env/python/install.sh diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/env/python/requirements.lock.txt b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/env/python/requirements.lock.txt new file mode 100644 index 0000000..f6acdf5 --- /dev/null +++ b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/env/python/requirements.lock.txt @@ -0,0 +1,147 @@ +aiohttp==3.9.5 +aiosignal==1.3.1 +annotated-types==0.7.0 +anyio==4.4.0 +appdirs==1.4.4 +asgiref==3.8.1 +async-timeout==4.0.3 +attrs==23.2.0 +bentoml==1.2.19 +build==1.2.1 +cattrs==23.1.2 +certifi==2024.7.4 +charset-normalizer==3.3.2 +circus==0.18.0 +click==8.1.7 +click-option-group==0.5.6 +cloudpickle==3.0.0 +cmake==3.30.0 +deepmerge==1.1.1 +deprecated==1.2.14 +diskcache==5.6.3 +distro==1.9.0 +dnspython==2.6.1 +email-validator==2.2.0 +exceptiongroup==1.2.1 +fastapi==0.111.0 +fastapi-cli==0.0.4 +filelock==3.15.4 +frozenlist==1.4.1 +fs==2.4.16 +fsspec==2024.6.1 +h11==0.14.0 +httpcore==1.0.5 +httptools==0.6.1 +httpx==0.27.0 +httpx-ws==0.6.0 +huggingface-hub==0.23.4 +idna==3.7 +importlib-metadata==6.11.0 +inflection==0.5.1 +interegular==0.3.3 +jinja2==3.1.4 +joblib==1.4.2 +jsonschema==4.23.0 +jsonschema-specifications==2023.12.1 +lark==1.1.9 +llvmlite==0.43.0 +lm-format-enforcer==0.10.1 +markdown-it-py==3.0.0 +markupsafe==2.1.5 +mdurl==0.1.2 +mpmath==1.3.0 +msgpack==1.0.8 +multidict==6.0.5 +nest-asyncio==1.6.0 +networkx==3.2.1 +ninja==1.11.1.1 +numba==0.60.0 +numpy==1.26.0 +nvidia-cublas-cu12==12.1.3.1 +nvidia-cuda-cupti-cu12==12.1.105 +nvidia-cuda-nvrtc-cu12==12.1.105 +nvidia-cuda-runtime-cu12==12.1.105 +nvidia-cudnn-cu12==8.9.2.26 +nvidia-cufft-cu12==11.0.2.54 +nvidia-curand-cu12==10.3.2.106 +nvidia-cusolver-cu12==11.4.5.107 +nvidia-cusparse-cu12==12.1.0.106 +nvidia-ml-py==11.525.150 +nvidia-nccl-cu12==2.20.5 +nvidia-nvjitlink-cu12==12.5.82 +nvidia-nvtx-cu12==12.1.105 +openai==1.35.13 +opentelemetry-api==1.20.0 +opentelemetry-instrumentation==0.41b0 +opentelemetry-instrumentation-aiohttp-client==0.41b0 +opentelemetry-instrumentation-asgi==0.41b0 +opentelemetry-sdk==1.20.0 +opentelemetry-semantic-conventions==0.41b0 +opentelemetry-util-http==0.41b0 +orjson==3.10.6 +outlines==0.0.34 +packaging==24.1 +pathspec==0.12.1 +pip-requirements-parser==32.0.1 +pip-tools==7.4.1 +prometheus-client==0.20.0 +prometheus-fastapi-instrumentator==7.0.0 +protobuf==5.27.2 +psutil==6.0.0 +py-cpuinfo==9.0.0 +pydantic==2.8.2 +pydantic-core==2.20.1 +pygments==2.18.0 +pyparsing==3.1.2 +pyproject-hooks==1.1.0 +python-dateutil==2.9.0.post0 +python-dotenv==1.0.1 +python-json-logger==2.0.7 +python-multipart==0.0.9 +pyyaml==6.0.1 +pyzmq==26.0.3 +ray==2.32.0 +referencing==0.35.1 +regex==2024.5.15 +requests==2.32.3 +rich==13.7.1 +rpds-py==0.19.0 +safetensors==0.4.3 +schema==0.7.7 +scipy==1.13.1 +sentencepiece==0.2.0 +shellingham==1.5.4 +simple-di==0.1.5 +six==1.16.0 +sniffio==1.3.1 +starlette==0.37.2 +sympy==1.13.0 +tiktoken==0.7.0 +tokenizers==0.19.1 +tomli==2.0.1 +tomli-w==1.0.0 +torch==2.3.0 +tornado==6.4.1 +tqdm==4.66.4 +transformers==4.41.0 +triton==2.3.0 +typer==0.12.3 +typing-extensions==4.12.2 +ujson==5.10.0 +urllib3==2.2.2 +uvicorn[standard]==0.30.1 +uvloop==0.19.0 +vllm==0.4.3 +vllm-flash-attn==2.5.8.post2 +watchfiles==0.22.0 +websockets==12.0 +wheel==0.43.0 +wrapt==1.16.0 +wsproto==1.2.0 +xformers==0.0.26.post1 +yarl==1.9.4 +zipp==3.19.2 + +# The following packages are considered to be unsafe in a requirements file: +pip==24.1.2 +setuptools==70.3.0 diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/env/python/requirements.txt b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/env/python/requirements.txt similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/env/python/requirements.txt rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/env/python/requirements.txt diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/env/python/version.txt b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/env/python/version.txt similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/env/python/version.txt rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/env/python/version.txt diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/bento_constants.py b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/bento_constants.py similarity index 85% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/bento_constants.py rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/bento_constants.py index fc6159f..b171f52 100644 --- a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/bento_constants.py +++ b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/bento_constants.py @@ -5,8 +5,8 @@ max_model_len: 2048 model: Qwen/Qwen2-1.5B-Instruct extra_labels: + model_name: Qwen/Qwen2-1.5B-Instruct openllm_alias: 1.5b,1.5b-instruct - openllm_hf_model_id: Qwen/Qwen2-1.5B-Instruct project: vllm-chat service_config: name: qwen2 diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/bentofile.yaml b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/bentofile.yaml similarity index 93% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/bentofile.yaml rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/bentofile.yaml index 9ef28fd..f9147b8 100644 --- a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/bentofile.yaml +++ b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/bentofile.yaml @@ -28,9 +28,8 @@ include: - chat_templates/chat_templates/*.jinja - chat_templates/generation_configs/*.json labels: + model_name: Qwen/Qwen2-1.5B-Instruct openllm_alias: 1.5b,1.5b-instruct - openllm_hf_model_id: Qwen/Qwen2-1.5B-Instruct - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/chat_templates/alpaca.jinja b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/chat_templates/alpaca.jinja similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/chat_templates/alpaca.jinja rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/chat_templates/alpaca.jinja diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/chat_templates/amberchat.jinja b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/chat_templates/amberchat.jinja similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/chat_templates/amberchat.jinja rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/chat_templates/amberchat.jinja diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/chat_templates/chatml.jinja b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/chat_templates/chatml.jinja similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/chat_templates/chatml.jinja rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/chat_templates/chatml.jinja diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/chat_templates/chatqa.jinja b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/chat_templates/chatqa.jinja similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/chat_templates/chatqa.jinja rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/chat_templates/chatqa.jinja diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/chat_templates/falcon-instruct.jinja b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/chat_templates/falcon-instruct.jinja similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/chat_templates/falcon-instruct.jinja rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/chat_templates/falcon-instruct.jinja diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/chat_templates/gemma-it.jinja b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/chat_templates/gemma-it.jinja similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/chat_templates/gemma-it.jinja rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/chat_templates/gemma-it.jinja diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/chat_templates/llama-2-chat.jinja b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/chat_templates/llama-2-chat.jinja similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/chat_templates/llama-2-chat.jinja rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/chat_templates/llama-2-chat.jinja diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/chat_templates/llama-3-chat.jinja b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/chat_templates/llama-3-chat.jinja similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/chat_templates/llama-3-chat.jinja rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/chat_templates/llama-3-chat.jinja diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/chat_templates/mistral-instruct.jinja b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/chat_templates/mistral-instruct.jinja similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/chat_templates/mistral-instruct.jinja rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/chat_templates/mistral-instruct.jinja diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/chat_templates/openchat.jinja b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/chat_templates/openchat.jinja similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/chat_templates/openchat.jinja rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/chat_templates/openchat.jinja diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/chat_templates/phi-3.jinja b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/chat_templates/phi-3.jinja similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/chat_templates/phi-3.jinja rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/chat_templates/phi-3.jinja diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/chat_templates/saiga.jinja b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/chat_templates/saiga.jinja similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/chat_templates/saiga.jinja rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/chat_templates/saiga.jinja diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/chat_templates/solar-instruct.jinja b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/chat_templates/solar-instruct.jinja similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/chat_templates/solar-instruct.jinja rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/chat_templates/solar-instruct.jinja diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/chat_templates/vicuna.jinja b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/chat_templates/vicuna.jinja similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/chat_templates/vicuna.jinja rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/chat_templates/vicuna.jinja diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/chat_templates/zephyr.jinja b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/chat_templates/zephyr.jinja similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/chat_templates/zephyr.jinja rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/chat_templates/zephyr.jinja diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/generation_configs/alpaca.json b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/generation_configs/alpaca.json similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/generation_configs/alpaca.json rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/generation_configs/alpaca.json diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/generation_configs/amberchat.json b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/generation_configs/amberchat.json similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/generation_configs/amberchat.json rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/generation_configs/amberchat.json diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/generation_configs/chatqa.json b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/generation_configs/chatqa.json similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/generation_configs/chatqa.json rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/generation_configs/chatqa.json diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/generation_configs/gemma-it.json b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/generation_configs/gemma-it.json similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/generation_configs/gemma-it.json rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/generation_configs/gemma-it.json diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/generation_configs/llama-2-chat.json b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/generation_configs/llama-2-chat.json similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/generation_configs/llama-2-chat.json rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/generation_configs/llama-2-chat.json diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/generation_configs/llama-3-chat.json b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/generation_configs/llama-3-chat.json similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/generation_configs/llama-3-chat.json rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/generation_configs/llama-3-chat.json diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/generation_configs/mistral-instruct.json b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/generation_configs/mistral-instruct.json similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/generation_configs/mistral-instruct.json rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/generation_configs/mistral-instruct.json diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/generation_configs/openchat.json b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/generation_configs/openchat.json similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/generation_configs/openchat.json rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/generation_configs/openchat.json diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/generation_configs/orca-2.json b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/generation_configs/orca-2.json similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/generation_configs/orca-2.json rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/generation_configs/orca-2.json diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/generation_configs/phi-3.json b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/generation_configs/phi-3.json similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/generation_configs/phi-3.json rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/generation_configs/phi-3.json diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/generation_configs/qwen2-chat.json b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/generation_configs/qwen2-chat.json similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/generation_configs/qwen2-chat.json rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/generation_configs/qwen2-chat.json diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/generation_configs/saiga.json b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/generation_configs/saiga.json similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/generation_configs/saiga.json rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/generation_configs/saiga.json diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/generation_configs/solar-instruct.json b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/generation_configs/solar-instruct.json similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/generation_configs/solar-instruct.json rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/generation_configs/solar-instruct.json diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/generation_configs/vicuna.json b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/generation_configs/vicuna.json similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/generation_configs/vicuna.json rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/generation_configs/vicuna.json diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/generation_configs/yi-chat.json b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/generation_configs/yi-chat.json similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/generation_configs/yi-chat.json rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/generation_configs/yi-chat.json diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/generation_configs/zephyr.json b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/generation_configs/zephyr.json similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/chat_templates/generation_configs/zephyr.json rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/chat_templates/generation_configs/zephyr.json diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/service.py b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/service.py similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/service.py rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/service.py diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/404.html b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/404.html similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/404.html rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/404.html diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/700-532b1fe2415e5859.js b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/700-532b1fe2415e5859.js similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/700-532b1fe2415e5859.js rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/700-532b1fe2415e5859.js diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/995-34374f39bb210839.js b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/995-34374f39bb210839.js similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/995-34374f39bb210839.js rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/995-34374f39bb210839.js diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/css/429544bd3cd8ce3a.css b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/css/429544bd3cd8ce3a.css similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/css/429544bd3cd8ce3a.css rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/css/429544bd3cd8ce3a.css diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/css/5b67f082b31cfc7b.css b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/css/5b67f082b31cfc7b.css similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/css/5b67f082b31cfc7b.css rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/css/5b67f082b31cfc7b.css diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/css/9e63023b20ddb15e.css b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/css/9e63023b20ddb15e.css similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/_next/static/css/9e63023b20ddb15e.css rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/_next/static/css/9e63023b20ddb15e.css diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/apple-touch-icon.png b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/apple-touch-icon.png similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/apple-touch-icon.png rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/apple-touch-icon.png diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/chat.html b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/chat.html similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/chat.html rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/chat.html diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/chat.txt b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/chat.txt similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/chat.txt rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/chat.txt diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/favicon-16x16.png b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/favicon-16x16.png similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/favicon-16x16.png rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/favicon-16x16.png diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/favicon.ico b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/favicon.ico similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/favicon.ico rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/favicon.ico diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/index.html b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/index.html similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/index.html rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/index.html diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/index.txt b/bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/index.txt similarity index 100% rename from bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/src/ui/index.txt rename to bentoml/bentos/qwen2/1.5b-instruct-fp16-50d8/src/ui/index.txt diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/README.md b/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/README.md deleted file mode 100644 index ea4c69c..0000000 --- a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/README.md +++ /dev/null @@ -1,16 +0,0 @@ -# qwen2:1.5b-instruct-fp16-ec69 - -[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) -[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) -[![join_slack](https://badgen.net/badge/Join/BentoML%20Slack/cyan?icon=slack)](https://l.bentoml.com/join-slack-swagger) -[![BentoML GitHub Repo](https://img.shields.io/github/stars/bentoml/bentoml?style=social)](https://github.com/bentoml/BentoML) -[![Twitter Follow](https://img.shields.io/twitter/follow/bentomlai?label=Follow%20BentoML&style=social)](https://twitter.com/bentomlai) - -This is a Machine Learning Service created with BentoML. - -## Help - -* [📖 Documentation](https://docs.bentoml.com/en/latest/): Learn how to use BentoML. -* [💬 Community](https://l.bentoml.com/join-slack-swagger): Join the BentoML Slack community. -* [🐛 GitHub Issues](https://github.com/bentoml/BentoML/issues): Report bugs and feature requests. -* Tip: you can also [customize this README](https://docs.bentoml.com/en/latest/concepts/bento.html#description). diff --git a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/env/python/requirements.lock.txt b/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/env/python/requirements.lock.txt deleted file mode 100644 index 925ce19..0000000 --- a/bentoml/bentos/qwen2/1.5b-instruct-fp16-ec69/env/python/requirements.lock.txt +++ /dev/null @@ -1,147 +0,0 @@ -aiohttp==3.9.5 -aiosignal==1.3.1 -annotated-types==0.7.0 -anyio==4.4.0 -appdirs==1.4.4 -asgiref==3.8.1 -async-timeout==4.0.3 -attrs==23.2.0 -bentoml==1.2.19 -build==1.2.1 -cattrs==23.1.2 -certifi==2024.7.4 -charset-normalizer==3.3.2 -circus==0.18.0 -click==8.1.7 -click-option-group==0.5.6 -cloudpickle==3.0.0 -cmake==3.30.0 -deepmerge==1.1.1 -deprecated==1.2.14 -diskcache==5.6.3 -distro==1.9.0 -dnspython==2.6.1 -email-validator==2.2.0 -exceptiongroup==1.2.1 -fastapi==0.111.0 -fastapi-cli==0.0.4 -filelock==3.15.4 -frozenlist==1.4.1 -fs==2.4.16 -fsspec==2024.6.1 -h11==0.14.0 -httpcore==1.0.5 -httptools==0.6.1 -httpx==0.27.0 -httpx-ws==0.6.0 -huggingface-hub==0.23.4 -idna==3.7 -importlib-metadata==6.11.0 -inflection==0.5.1 -interegular==0.3.3 -jinja2==3.1.4 -joblib==1.4.2 -jsonschema==4.22.0 -jsonschema-specifications==2023.12.1 -lark==1.1.9 -llvmlite==0.43.0 -lm-format-enforcer==0.10.1 -markdown-it-py==3.0.0 -markupsafe==2.1.5 -mdurl==0.1.2 -mpmath==1.3.0 -msgpack==1.0.8 -multidict==6.0.5 -nest-asyncio==1.6.0 -networkx==3.2.1 -ninja==1.11.1.1 -numba==0.60.0 -numpy==1.26.0 -nvidia-cublas-cu12==12.1.3.1 -nvidia-cuda-cupti-cu12==12.1.105 -nvidia-cuda-nvrtc-cu12==12.1.105 -nvidia-cuda-runtime-cu12==12.1.105 -nvidia-cudnn-cu12==8.9.2.26 -nvidia-cufft-cu12==11.0.2.54 -nvidia-curand-cu12==10.3.2.106 -nvidia-cusolver-cu12==11.4.5.107 -nvidia-cusparse-cu12==12.1.0.106 -nvidia-ml-py==11.525.150 -nvidia-nccl-cu12==2.20.5 -nvidia-nvjitlink-cu12==12.5.82 -nvidia-nvtx-cu12==12.1.105 -openai==1.35.10 -opentelemetry-api==1.20.0 -opentelemetry-instrumentation==0.41b0 -opentelemetry-instrumentation-aiohttp-client==0.41b0 -opentelemetry-instrumentation-asgi==0.41b0 -opentelemetry-sdk==1.20.0 -opentelemetry-semantic-conventions==0.41b0 -opentelemetry-util-http==0.41b0 -orjson==3.10.6 -outlines==0.0.34 -packaging==24.1 -pathspec==0.12.1 -pip-requirements-parser==32.0.1 -pip-tools==7.4.1 -prometheus-client==0.20.0 -prometheus-fastapi-instrumentator==7.0.0 -protobuf==5.27.2 -psutil==6.0.0 -py-cpuinfo==9.0.0 -pydantic==2.8.2 -pydantic-core==2.20.1 -pygments==2.18.0 -pyparsing==3.1.2 -pyproject-hooks==1.1.0 -python-dateutil==2.9.0.post0 -python-dotenv==1.0.1 -python-json-logger==2.0.7 -python-multipart==0.0.9 -pyyaml==6.0.1 -pyzmq==26.0.3 -ray==2.31.0 -referencing==0.35.1 -regex==2024.5.15 -requests==2.32.3 -rich==13.7.1 -rpds-py==0.18.1 -safetensors==0.4.3 -schema==0.7.7 -scipy==1.13.1 -sentencepiece==0.2.0 -shellingham==1.5.4 -simple-di==0.1.5 -six==1.16.0 -sniffio==1.3.1 -starlette==0.37.2 -sympy==1.12.1 -tiktoken==0.7.0 -tokenizers==0.19.1 -tomli==2.0.1 -tomli-w==1.0.0 -torch==2.3.0 -tornado==6.4.1 -tqdm==4.66.4 -transformers==4.41.0 -triton==2.3.0 -typer==0.12.3 -typing-extensions==4.12.2 -ujson==5.10.0 -urllib3==2.2.2 -uvicorn[standard]==0.30.1 -uvloop==0.19.0 -vllm==0.4.3 -vllm-flash-attn==2.5.8.post2 -watchfiles==0.22.0 -websockets==12.0 -wheel==0.43.0 -wrapt==1.16.0 -wsproto==1.2.0 -xformers==0.0.26.post1 -yarl==1.9.4 -zipp==3.19.2 - -# The following packages are considered to be unsafe in a requirements file: -pip==24.1.2 -setuptools==70.2.0 diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/README.md b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/README.md new file mode 100644 index 0000000..09a217d --- /dev/null +++ b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/README.md @@ -0,0 +1,16 @@ +# qwen2:57b-a14b-instruct-fp16-3f06 + +[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) +[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) +[![join_slack](https://badgen.net/badge/Join/BentoML%20Slack/cyan?icon=slack)](https://l.bentoml.com/join-slack-swagger) +[![BentoML GitHub Repo](https://img.shields.io/github/stars/bentoml/bentoml?style=social)](https://github.com/bentoml/BentoML) +[![Twitter Follow](https://img.shields.io/twitter/follow/bentomlai?label=Follow%20BentoML&style=social)](https://twitter.com/bentomlai) + +This is a Machine Learning Service created with BentoML. + +## Help + +* [📖 Documentation](https://docs.bentoml.com/en/latest/): Learn how to use BentoML. +* [💬 Community](https://l.bentoml.com/join-slack-swagger): Join the BentoML Slack community. +* [🐛 GitHub Issues](https://github.com/bentoml/BentoML/issues): Report bugs and feature requests. +* Tip: you can also [customize this README](https://docs.bentoml.com/en/latest/concepts/bento.html#description). diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/apis/openapi.yaml b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/apis/openapi.yaml similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/apis/openapi.yaml rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/apis/openapi.yaml diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/apis/schema.json b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/apis/schema.json similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/apis/schema.json rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/apis/schema.json diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/bento.yaml b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/bento.yaml similarity index 94% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/bento.yaml rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/bento.yaml index 0ed3366..cc5eeb1 100644 --- a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/bento.yaml +++ b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/bento.yaml @@ -1,12 +1,11 @@ service: service:VLLM name: qwen2 -version: 57b-a14b-instruct-fp16-f63b +version: 57b-a14b-instruct-fp16-3f06 bentoml_version: 1.2.19 -creation_time: '2024-07-08T08:06:13.245817+00:00' +creation_time: '2024-07-12T13:51:06.623893+00:00' labels: + model_name: Qwen/Qwen2-57B-A14B-Instruct openllm_alias: 57b-a14b,57b-a14b-instruct - openllm_hf_model_id: Qwen/Qwen2-57B-A14B-Instruct - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/env/docker/Dockerfile b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/env/docker/Dockerfile similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/env/docker/Dockerfile rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/env/docker/Dockerfile diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/env/docker/entrypoint.sh b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/env/docker/entrypoint.sh similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/env/docker/entrypoint.sh rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/env/docker/entrypoint.sh diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/env/python/install.sh b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/env/python/install.sh similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/env/python/install.sh rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/env/python/install.sh diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/env/python/requirements.lock.txt b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/env/python/requirements.lock.txt new file mode 100644 index 0000000..f6acdf5 --- /dev/null +++ b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/env/python/requirements.lock.txt @@ -0,0 +1,147 @@ +aiohttp==3.9.5 +aiosignal==1.3.1 +annotated-types==0.7.0 +anyio==4.4.0 +appdirs==1.4.4 +asgiref==3.8.1 +async-timeout==4.0.3 +attrs==23.2.0 +bentoml==1.2.19 +build==1.2.1 +cattrs==23.1.2 +certifi==2024.7.4 +charset-normalizer==3.3.2 +circus==0.18.0 +click==8.1.7 +click-option-group==0.5.6 +cloudpickle==3.0.0 +cmake==3.30.0 +deepmerge==1.1.1 +deprecated==1.2.14 +diskcache==5.6.3 +distro==1.9.0 +dnspython==2.6.1 +email-validator==2.2.0 +exceptiongroup==1.2.1 +fastapi==0.111.0 +fastapi-cli==0.0.4 +filelock==3.15.4 +frozenlist==1.4.1 +fs==2.4.16 +fsspec==2024.6.1 +h11==0.14.0 +httpcore==1.0.5 +httptools==0.6.1 +httpx==0.27.0 +httpx-ws==0.6.0 +huggingface-hub==0.23.4 +idna==3.7 +importlib-metadata==6.11.0 +inflection==0.5.1 +interegular==0.3.3 +jinja2==3.1.4 +joblib==1.4.2 +jsonschema==4.23.0 +jsonschema-specifications==2023.12.1 +lark==1.1.9 +llvmlite==0.43.0 +lm-format-enforcer==0.10.1 +markdown-it-py==3.0.0 +markupsafe==2.1.5 +mdurl==0.1.2 +mpmath==1.3.0 +msgpack==1.0.8 +multidict==6.0.5 +nest-asyncio==1.6.0 +networkx==3.2.1 +ninja==1.11.1.1 +numba==0.60.0 +numpy==1.26.0 +nvidia-cublas-cu12==12.1.3.1 +nvidia-cuda-cupti-cu12==12.1.105 +nvidia-cuda-nvrtc-cu12==12.1.105 +nvidia-cuda-runtime-cu12==12.1.105 +nvidia-cudnn-cu12==8.9.2.26 +nvidia-cufft-cu12==11.0.2.54 +nvidia-curand-cu12==10.3.2.106 +nvidia-cusolver-cu12==11.4.5.107 +nvidia-cusparse-cu12==12.1.0.106 +nvidia-ml-py==11.525.150 +nvidia-nccl-cu12==2.20.5 +nvidia-nvjitlink-cu12==12.5.82 +nvidia-nvtx-cu12==12.1.105 +openai==1.35.13 +opentelemetry-api==1.20.0 +opentelemetry-instrumentation==0.41b0 +opentelemetry-instrumentation-aiohttp-client==0.41b0 +opentelemetry-instrumentation-asgi==0.41b0 +opentelemetry-sdk==1.20.0 +opentelemetry-semantic-conventions==0.41b0 +opentelemetry-util-http==0.41b0 +orjson==3.10.6 +outlines==0.0.34 +packaging==24.1 +pathspec==0.12.1 +pip-requirements-parser==32.0.1 +pip-tools==7.4.1 +prometheus-client==0.20.0 +prometheus-fastapi-instrumentator==7.0.0 +protobuf==5.27.2 +psutil==6.0.0 +py-cpuinfo==9.0.0 +pydantic==2.8.2 +pydantic-core==2.20.1 +pygments==2.18.0 +pyparsing==3.1.2 +pyproject-hooks==1.1.0 +python-dateutil==2.9.0.post0 +python-dotenv==1.0.1 +python-json-logger==2.0.7 +python-multipart==0.0.9 +pyyaml==6.0.1 +pyzmq==26.0.3 +ray==2.32.0 +referencing==0.35.1 +regex==2024.5.15 +requests==2.32.3 +rich==13.7.1 +rpds-py==0.19.0 +safetensors==0.4.3 +schema==0.7.7 +scipy==1.13.1 +sentencepiece==0.2.0 +shellingham==1.5.4 +simple-di==0.1.5 +six==1.16.0 +sniffio==1.3.1 +starlette==0.37.2 +sympy==1.13.0 +tiktoken==0.7.0 +tokenizers==0.19.1 +tomli==2.0.1 +tomli-w==1.0.0 +torch==2.3.0 +tornado==6.4.1 +tqdm==4.66.4 +transformers==4.41.0 +triton==2.3.0 +typer==0.12.3 +typing-extensions==4.12.2 +ujson==5.10.0 +urllib3==2.2.2 +uvicorn[standard]==0.30.1 +uvloop==0.19.0 +vllm==0.4.3 +vllm-flash-attn==2.5.8.post2 +watchfiles==0.22.0 +websockets==12.0 +wheel==0.43.0 +wrapt==1.16.0 +wsproto==1.2.0 +xformers==0.0.26.post1 +yarl==1.9.4 +zipp==3.19.2 + +# The following packages are considered to be unsafe in a requirements file: +pip==24.1.2 +setuptools==70.3.0 diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/env/python/requirements.txt b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/env/python/requirements.txt similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/env/python/requirements.txt rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/env/python/requirements.txt diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/env/python/version.txt b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/env/python/version.txt similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/env/python/version.txt rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/env/python/version.txt diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/bento_constants.py b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/bento_constants.py similarity index 85% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/bento_constants.py rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/bento_constants.py index ef757e6..19dbd91 100644 --- a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/bento_constants.py +++ b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/bento_constants.py @@ -5,8 +5,8 @@ max_model_len: 2048 model: Qwen/Qwen2-57B-A14B-Instruct extra_labels: + model_name: Qwen/Qwen2-57B-A14B-Instruct openllm_alias: 57b-a14b,57b-a14b-instruct - openllm_hf_model_id: Qwen/Qwen2-57B-A14B-Instruct project: vllm-chat service_config: name: qwen2 diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/bentofile.yaml b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/bentofile.yaml similarity index 92% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/bentofile.yaml rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/bentofile.yaml index 7e90155..7d6145f 100644 --- a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/bentofile.yaml +++ b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/bentofile.yaml @@ -28,9 +28,8 @@ include: - chat_templates/chat_templates/*.jinja - chat_templates/generation_configs/*.json labels: + model_name: Qwen/Qwen2-57B-A14B-Instruct openllm_alias: 57b-a14b,57b-a14b-instruct - openllm_hf_model_id: Qwen/Qwen2-57B-A14B-Instruct - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/chat_templates/alpaca.jinja b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/chat_templates/alpaca.jinja similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/chat_templates/alpaca.jinja rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/chat_templates/alpaca.jinja diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/chat_templates/amberchat.jinja b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/chat_templates/amberchat.jinja similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/chat_templates/amberchat.jinja rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/chat_templates/amberchat.jinja diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/chat_templates/chatml.jinja b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/chat_templates/chatml.jinja similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/chat_templates/chatml.jinja rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/chat_templates/chatml.jinja diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/chat_templates/chatqa.jinja b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/chat_templates/chatqa.jinja similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/chat_templates/chatqa.jinja rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/chat_templates/chatqa.jinja diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/chat_templates/falcon-instruct.jinja b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/chat_templates/falcon-instruct.jinja similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/chat_templates/falcon-instruct.jinja rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/chat_templates/falcon-instruct.jinja diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/chat_templates/gemma-it.jinja b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/chat_templates/gemma-it.jinja similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/chat_templates/gemma-it.jinja rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/chat_templates/gemma-it.jinja diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/chat_templates/llama-2-chat.jinja b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/chat_templates/llama-2-chat.jinja similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/chat_templates/llama-2-chat.jinja rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/chat_templates/llama-2-chat.jinja diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/chat_templates/llama-3-chat.jinja b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/chat_templates/llama-3-chat.jinja similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/chat_templates/llama-3-chat.jinja rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/chat_templates/llama-3-chat.jinja diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/chat_templates/mistral-instruct.jinja b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/chat_templates/mistral-instruct.jinja similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/chat_templates/mistral-instruct.jinja rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/chat_templates/mistral-instruct.jinja diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/chat_templates/openchat.jinja b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/chat_templates/openchat.jinja similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/chat_templates/openchat.jinja rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/chat_templates/openchat.jinja diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/chat_templates/phi-3.jinja b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/chat_templates/phi-3.jinja similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/chat_templates/phi-3.jinja rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/chat_templates/phi-3.jinja diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/chat_templates/saiga.jinja b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/chat_templates/saiga.jinja similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/chat_templates/saiga.jinja rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/chat_templates/saiga.jinja diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/chat_templates/solar-instruct.jinja b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/chat_templates/solar-instruct.jinja similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/chat_templates/solar-instruct.jinja rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/chat_templates/solar-instruct.jinja diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/chat_templates/vicuna.jinja b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/chat_templates/vicuna.jinja similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/chat_templates/vicuna.jinja rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/chat_templates/vicuna.jinja diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/chat_templates/zephyr.jinja b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/chat_templates/zephyr.jinja similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/chat_templates/zephyr.jinja rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/chat_templates/zephyr.jinja diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/generation_configs/alpaca.json b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/generation_configs/alpaca.json similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/generation_configs/alpaca.json rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/generation_configs/alpaca.json diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/generation_configs/amberchat.json b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/generation_configs/amberchat.json similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/generation_configs/amberchat.json rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/generation_configs/amberchat.json diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/generation_configs/chatqa.json b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/generation_configs/chatqa.json similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/generation_configs/chatqa.json rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/generation_configs/chatqa.json diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/generation_configs/gemma-it.json b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/generation_configs/gemma-it.json similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/generation_configs/gemma-it.json rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/generation_configs/gemma-it.json diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/generation_configs/llama-2-chat.json b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/generation_configs/llama-2-chat.json similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/generation_configs/llama-2-chat.json rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/generation_configs/llama-2-chat.json diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/generation_configs/llama-3-chat.json b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/generation_configs/llama-3-chat.json similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/generation_configs/llama-3-chat.json rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/generation_configs/llama-3-chat.json diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/generation_configs/mistral-instruct.json b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/generation_configs/mistral-instruct.json similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/generation_configs/mistral-instruct.json rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/generation_configs/mistral-instruct.json diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/generation_configs/openchat.json b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/generation_configs/openchat.json similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/generation_configs/openchat.json rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/generation_configs/openchat.json diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/generation_configs/orca-2.json b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/generation_configs/orca-2.json similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/generation_configs/orca-2.json rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/generation_configs/orca-2.json diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/generation_configs/phi-3.json b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/generation_configs/phi-3.json similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/generation_configs/phi-3.json rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/generation_configs/phi-3.json diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/generation_configs/qwen2-chat.json b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/generation_configs/qwen2-chat.json similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/generation_configs/qwen2-chat.json rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/generation_configs/qwen2-chat.json diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/generation_configs/saiga.json b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/generation_configs/saiga.json similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/generation_configs/saiga.json rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/generation_configs/saiga.json diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/generation_configs/solar-instruct.json b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/generation_configs/solar-instruct.json similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/generation_configs/solar-instruct.json rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/generation_configs/solar-instruct.json diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/generation_configs/vicuna.json b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/generation_configs/vicuna.json similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/generation_configs/vicuna.json rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/generation_configs/vicuna.json diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/generation_configs/yi-chat.json b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/generation_configs/yi-chat.json similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/generation_configs/yi-chat.json rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/generation_configs/yi-chat.json diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/generation_configs/zephyr.json b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/generation_configs/zephyr.json similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/chat_templates/generation_configs/zephyr.json rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/chat_templates/generation_configs/zephyr.json diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/service.py b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/service.py similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/service.py rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/service.py diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/404.html b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/404.html similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/404.html rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/404.html diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/700-532b1fe2415e5859.js b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/700-532b1fe2415e5859.js similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/700-532b1fe2415e5859.js rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/700-532b1fe2415e5859.js diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/995-34374f39bb210839.js b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/995-34374f39bb210839.js similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/995-34374f39bb210839.js rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/995-34374f39bb210839.js diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/css/429544bd3cd8ce3a.css b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/css/429544bd3cd8ce3a.css similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/css/429544bd3cd8ce3a.css rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/css/429544bd3cd8ce3a.css diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/css/5b67f082b31cfc7b.css b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/css/5b67f082b31cfc7b.css similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/css/5b67f082b31cfc7b.css rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/css/5b67f082b31cfc7b.css diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/css/9e63023b20ddb15e.css b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/css/9e63023b20ddb15e.css similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/_next/static/css/9e63023b20ddb15e.css rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/_next/static/css/9e63023b20ddb15e.css diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/apple-touch-icon.png b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/apple-touch-icon.png similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/apple-touch-icon.png rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/apple-touch-icon.png diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/chat.html b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/chat.html similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/chat.html rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/chat.html diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/chat.txt b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/chat.txt similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/chat.txt rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/chat.txt diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/favicon-16x16.png b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/favicon-16x16.png similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/favicon-16x16.png rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/favicon-16x16.png diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/favicon.ico b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/favicon.ico similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/favicon.ico rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/favicon.ico diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/index.html b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/index.html similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/index.html rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/index.html diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/index.txt b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/index.txt similarity index 100% rename from bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/src/ui/index.txt rename to bentoml/bentos/qwen2/57b-a14b-instruct-fp16-3f06/src/ui/index.txt diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/README.md b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/README.md deleted file mode 100644 index 486b076..0000000 --- a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/README.md +++ /dev/null @@ -1,16 +0,0 @@ -# qwen2:57b-a14b-instruct-fp16-f63b - -[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) -[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) -[![join_slack](https://badgen.net/badge/Join/BentoML%20Slack/cyan?icon=slack)](https://l.bentoml.com/join-slack-swagger) -[![BentoML GitHub Repo](https://img.shields.io/github/stars/bentoml/bentoml?style=social)](https://github.com/bentoml/BentoML) -[![Twitter Follow](https://img.shields.io/twitter/follow/bentomlai?label=Follow%20BentoML&style=social)](https://twitter.com/bentomlai) - -This is a Machine Learning Service created with BentoML. - -## Help - -* [📖 Documentation](https://docs.bentoml.com/en/latest/): Learn how to use BentoML. -* [💬 Community](https://l.bentoml.com/join-slack-swagger): Join the BentoML Slack community. -* [🐛 GitHub Issues](https://github.com/bentoml/BentoML/issues): Report bugs and feature requests. -* Tip: you can also [customize this README](https://docs.bentoml.com/en/latest/concepts/bento.html#description). diff --git a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/env/python/requirements.lock.txt b/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/env/python/requirements.lock.txt deleted file mode 100644 index 925ce19..0000000 --- a/bentoml/bentos/qwen2/57b-a14b-instruct-fp16-f63b/env/python/requirements.lock.txt +++ /dev/null @@ -1,147 +0,0 @@ -aiohttp==3.9.5 -aiosignal==1.3.1 -annotated-types==0.7.0 -anyio==4.4.0 -appdirs==1.4.4 -asgiref==3.8.1 -async-timeout==4.0.3 -attrs==23.2.0 -bentoml==1.2.19 -build==1.2.1 -cattrs==23.1.2 -certifi==2024.7.4 -charset-normalizer==3.3.2 -circus==0.18.0 -click==8.1.7 -click-option-group==0.5.6 -cloudpickle==3.0.0 -cmake==3.30.0 -deepmerge==1.1.1 -deprecated==1.2.14 -diskcache==5.6.3 -distro==1.9.0 -dnspython==2.6.1 -email-validator==2.2.0 -exceptiongroup==1.2.1 -fastapi==0.111.0 -fastapi-cli==0.0.4 -filelock==3.15.4 -frozenlist==1.4.1 -fs==2.4.16 -fsspec==2024.6.1 -h11==0.14.0 -httpcore==1.0.5 -httptools==0.6.1 -httpx==0.27.0 -httpx-ws==0.6.0 -huggingface-hub==0.23.4 -idna==3.7 -importlib-metadata==6.11.0 -inflection==0.5.1 -interegular==0.3.3 -jinja2==3.1.4 -joblib==1.4.2 -jsonschema==4.22.0 -jsonschema-specifications==2023.12.1 -lark==1.1.9 -llvmlite==0.43.0 -lm-format-enforcer==0.10.1 -markdown-it-py==3.0.0 -markupsafe==2.1.5 -mdurl==0.1.2 -mpmath==1.3.0 -msgpack==1.0.8 -multidict==6.0.5 -nest-asyncio==1.6.0 -networkx==3.2.1 -ninja==1.11.1.1 -numba==0.60.0 -numpy==1.26.0 -nvidia-cublas-cu12==12.1.3.1 -nvidia-cuda-cupti-cu12==12.1.105 -nvidia-cuda-nvrtc-cu12==12.1.105 -nvidia-cuda-runtime-cu12==12.1.105 -nvidia-cudnn-cu12==8.9.2.26 -nvidia-cufft-cu12==11.0.2.54 -nvidia-curand-cu12==10.3.2.106 -nvidia-cusolver-cu12==11.4.5.107 -nvidia-cusparse-cu12==12.1.0.106 -nvidia-ml-py==11.525.150 -nvidia-nccl-cu12==2.20.5 -nvidia-nvjitlink-cu12==12.5.82 -nvidia-nvtx-cu12==12.1.105 -openai==1.35.10 -opentelemetry-api==1.20.0 -opentelemetry-instrumentation==0.41b0 -opentelemetry-instrumentation-aiohttp-client==0.41b0 -opentelemetry-instrumentation-asgi==0.41b0 -opentelemetry-sdk==1.20.0 -opentelemetry-semantic-conventions==0.41b0 -opentelemetry-util-http==0.41b0 -orjson==3.10.6 -outlines==0.0.34 -packaging==24.1 -pathspec==0.12.1 -pip-requirements-parser==32.0.1 -pip-tools==7.4.1 -prometheus-client==0.20.0 -prometheus-fastapi-instrumentator==7.0.0 -protobuf==5.27.2 -psutil==6.0.0 -py-cpuinfo==9.0.0 -pydantic==2.8.2 -pydantic-core==2.20.1 -pygments==2.18.0 -pyparsing==3.1.2 -pyproject-hooks==1.1.0 -python-dateutil==2.9.0.post0 -python-dotenv==1.0.1 -python-json-logger==2.0.7 -python-multipart==0.0.9 -pyyaml==6.0.1 -pyzmq==26.0.3 -ray==2.31.0 -referencing==0.35.1 -regex==2024.5.15 -requests==2.32.3 -rich==13.7.1 -rpds-py==0.18.1 -safetensors==0.4.3 -schema==0.7.7 -scipy==1.13.1 -sentencepiece==0.2.0 -shellingham==1.5.4 -simple-di==0.1.5 -six==1.16.0 -sniffio==1.3.1 -starlette==0.37.2 -sympy==1.12.1 -tiktoken==0.7.0 -tokenizers==0.19.1 -tomli==2.0.1 -tomli-w==1.0.0 -torch==2.3.0 -tornado==6.4.1 -tqdm==4.66.4 -transformers==4.41.0 -triton==2.3.0 -typer==0.12.3 -typing-extensions==4.12.2 -ujson==5.10.0 -urllib3==2.2.2 -uvicorn[standard]==0.30.1 -uvloop==0.19.0 -vllm==0.4.3 -vllm-flash-attn==2.5.8.post2 -watchfiles==0.22.0 -websockets==12.0 -wheel==0.43.0 -wrapt==1.16.0 -wsproto==1.2.0 -xformers==0.0.26.post1 -yarl==1.9.4 -zipp==3.19.2 - -# The following packages are considered to be unsafe in a requirements file: -pip==24.1.2 -setuptools==70.2.0 diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/README.md b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/README.md new file mode 100644 index 0000000..b16f69f --- /dev/null +++ b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/README.md @@ -0,0 +1,16 @@ +# qwen2:72b-instruct-awq-4bit-15fd + +[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) +[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) +[![join_slack](https://badgen.net/badge/Join/BentoML%20Slack/cyan?icon=slack)](https://l.bentoml.com/join-slack-swagger) +[![BentoML GitHub Repo](https://img.shields.io/github/stars/bentoml/bentoml?style=social)](https://github.com/bentoml/BentoML) +[![Twitter Follow](https://img.shields.io/twitter/follow/bentomlai?label=Follow%20BentoML&style=social)](https://twitter.com/bentomlai) + +This is a Machine Learning Service created with BentoML. + +## Help + +* [📖 Documentation](https://docs.bentoml.com/en/latest/): Learn how to use BentoML. +* [💬 Community](https://l.bentoml.com/join-slack-swagger): Join the BentoML Slack community. +* [🐛 GitHub Issues](https://github.com/bentoml/BentoML/issues): Report bugs and feature requests. +* Tip: you can also [customize this README](https://docs.bentoml.com/en/latest/concepts/bento.html#description). diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/apis/openapi.yaml b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/apis/openapi.yaml similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/apis/openapi.yaml rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/apis/openapi.yaml diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/apis/schema.json b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/apis/schema.json similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/apis/schema.json rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/apis/schema.json diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/bento.yaml b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/bento.yaml similarity index 94% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/bento.yaml rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/bento.yaml index dad942e..d7f793d 100644 --- a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/bento.yaml +++ b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/bento.yaml @@ -1,12 +1,11 @@ service: service:VLLM name: qwen2 -version: 72b-instruct-awq-4bit-f44a +version: 72b-instruct-awq-4bit-15fd bentoml_version: 1.2.19 -creation_time: '2024-07-08T08:05:19.616286+00:00' +creation_time: '2024-07-12T13:49:55.548892+00:00' labels: + model_name: Qwen/Qwen2-72B-Instruct-AWQ openllm_alias: 72b-4bit,72b-instruct-4bit - openllm_hf_model_id: Qwen/Qwen2-72B-Instruct-AWQ - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/env/docker/Dockerfile b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/env/docker/Dockerfile similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/env/docker/Dockerfile rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/env/docker/Dockerfile diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/env/docker/entrypoint.sh b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/env/docker/entrypoint.sh similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/env/docker/entrypoint.sh rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/env/docker/entrypoint.sh diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/env/python/install.sh b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/env/python/install.sh similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/env/python/install.sh rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/env/python/install.sh diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/env/python/requirements.lock.txt b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/env/python/requirements.lock.txt new file mode 100644 index 0000000..f6acdf5 --- /dev/null +++ b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/env/python/requirements.lock.txt @@ -0,0 +1,147 @@ +aiohttp==3.9.5 +aiosignal==1.3.1 +annotated-types==0.7.0 +anyio==4.4.0 +appdirs==1.4.4 +asgiref==3.8.1 +async-timeout==4.0.3 +attrs==23.2.0 +bentoml==1.2.19 +build==1.2.1 +cattrs==23.1.2 +certifi==2024.7.4 +charset-normalizer==3.3.2 +circus==0.18.0 +click==8.1.7 +click-option-group==0.5.6 +cloudpickle==3.0.0 +cmake==3.30.0 +deepmerge==1.1.1 +deprecated==1.2.14 +diskcache==5.6.3 +distro==1.9.0 +dnspython==2.6.1 +email-validator==2.2.0 +exceptiongroup==1.2.1 +fastapi==0.111.0 +fastapi-cli==0.0.4 +filelock==3.15.4 +frozenlist==1.4.1 +fs==2.4.16 +fsspec==2024.6.1 +h11==0.14.0 +httpcore==1.0.5 +httptools==0.6.1 +httpx==0.27.0 +httpx-ws==0.6.0 +huggingface-hub==0.23.4 +idna==3.7 +importlib-metadata==6.11.0 +inflection==0.5.1 +interegular==0.3.3 +jinja2==3.1.4 +joblib==1.4.2 +jsonschema==4.23.0 +jsonschema-specifications==2023.12.1 +lark==1.1.9 +llvmlite==0.43.0 +lm-format-enforcer==0.10.1 +markdown-it-py==3.0.0 +markupsafe==2.1.5 +mdurl==0.1.2 +mpmath==1.3.0 +msgpack==1.0.8 +multidict==6.0.5 +nest-asyncio==1.6.0 +networkx==3.2.1 +ninja==1.11.1.1 +numba==0.60.0 +numpy==1.26.0 +nvidia-cublas-cu12==12.1.3.1 +nvidia-cuda-cupti-cu12==12.1.105 +nvidia-cuda-nvrtc-cu12==12.1.105 +nvidia-cuda-runtime-cu12==12.1.105 +nvidia-cudnn-cu12==8.9.2.26 +nvidia-cufft-cu12==11.0.2.54 +nvidia-curand-cu12==10.3.2.106 +nvidia-cusolver-cu12==11.4.5.107 +nvidia-cusparse-cu12==12.1.0.106 +nvidia-ml-py==11.525.150 +nvidia-nccl-cu12==2.20.5 +nvidia-nvjitlink-cu12==12.5.82 +nvidia-nvtx-cu12==12.1.105 +openai==1.35.13 +opentelemetry-api==1.20.0 +opentelemetry-instrumentation==0.41b0 +opentelemetry-instrumentation-aiohttp-client==0.41b0 +opentelemetry-instrumentation-asgi==0.41b0 +opentelemetry-sdk==1.20.0 +opentelemetry-semantic-conventions==0.41b0 +opentelemetry-util-http==0.41b0 +orjson==3.10.6 +outlines==0.0.34 +packaging==24.1 +pathspec==0.12.1 +pip-requirements-parser==32.0.1 +pip-tools==7.4.1 +prometheus-client==0.20.0 +prometheus-fastapi-instrumentator==7.0.0 +protobuf==5.27.2 +psutil==6.0.0 +py-cpuinfo==9.0.0 +pydantic==2.8.2 +pydantic-core==2.20.1 +pygments==2.18.0 +pyparsing==3.1.2 +pyproject-hooks==1.1.0 +python-dateutil==2.9.0.post0 +python-dotenv==1.0.1 +python-json-logger==2.0.7 +python-multipart==0.0.9 +pyyaml==6.0.1 +pyzmq==26.0.3 +ray==2.32.0 +referencing==0.35.1 +regex==2024.5.15 +requests==2.32.3 +rich==13.7.1 +rpds-py==0.19.0 +safetensors==0.4.3 +schema==0.7.7 +scipy==1.13.1 +sentencepiece==0.2.0 +shellingham==1.5.4 +simple-di==0.1.5 +six==1.16.0 +sniffio==1.3.1 +starlette==0.37.2 +sympy==1.13.0 +tiktoken==0.7.0 +tokenizers==0.19.1 +tomli==2.0.1 +tomli-w==1.0.0 +torch==2.3.0 +tornado==6.4.1 +tqdm==4.66.4 +transformers==4.41.0 +triton==2.3.0 +typer==0.12.3 +typing-extensions==4.12.2 +ujson==5.10.0 +urllib3==2.2.2 +uvicorn[standard]==0.30.1 +uvloop==0.19.0 +vllm==0.4.3 +vllm-flash-attn==2.5.8.post2 +watchfiles==0.22.0 +websockets==12.0 +wheel==0.43.0 +wrapt==1.16.0 +wsproto==1.2.0 +xformers==0.0.26.post1 +yarl==1.9.4 +zipp==3.19.2 + +# The following packages are considered to be unsafe in a requirements file: +pip==24.1.2 +setuptools==70.3.0 diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/env/python/requirements.txt b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/env/python/requirements.txt similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/env/python/requirements.txt rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/env/python/requirements.txt diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/env/python/version.txt b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/env/python/version.txt similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/env/python/version.txt rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/env/python/version.txt diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/bento_constants.py b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/bento_constants.py similarity index 85% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/bento_constants.py rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/bento_constants.py index 2714868..b5f6e00 100644 --- a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/bento_constants.py +++ b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/bento_constants.py @@ -5,8 +5,8 @@ model: Qwen/Qwen2-72B-Instruct-AWQ quantization: awq extra_labels: + model_name: Qwen/Qwen2-72B-Instruct-AWQ openllm_alias: 72b-4bit,72b-instruct-4bit - openllm_hf_model_id: Qwen/Qwen2-72B-Instruct-AWQ project: vllm-chat service_config: name: qwen2 diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/bentofile.yaml b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/bentofile.yaml similarity index 92% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/bentofile.yaml rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/bentofile.yaml index bc8a195..96877ff 100644 --- a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/bentofile.yaml +++ b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/bentofile.yaml @@ -28,9 +28,8 @@ include: - chat_templates/chat_templates/*.jinja - chat_templates/generation_configs/*.json labels: + model_name: Qwen/Qwen2-72B-Instruct-AWQ openllm_alias: 72b-4bit,72b-instruct-4bit - openllm_hf_model_id: Qwen/Qwen2-72B-Instruct-AWQ - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/chat_templates/alpaca.jinja b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/chat_templates/alpaca.jinja similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/chat_templates/alpaca.jinja rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/chat_templates/alpaca.jinja diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/chat_templates/amberchat.jinja b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/chat_templates/amberchat.jinja similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/chat_templates/amberchat.jinja rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/chat_templates/amberchat.jinja diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/chat_templates/chatml.jinja b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/chat_templates/chatml.jinja similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/chat_templates/chatml.jinja rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/chat_templates/chatml.jinja diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/chat_templates/chatqa.jinja b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/chat_templates/chatqa.jinja similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/chat_templates/chatqa.jinja rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/chat_templates/chatqa.jinja diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/chat_templates/falcon-instruct.jinja b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/chat_templates/falcon-instruct.jinja similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/chat_templates/falcon-instruct.jinja rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/chat_templates/falcon-instruct.jinja diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/chat_templates/gemma-it.jinja b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/chat_templates/gemma-it.jinja similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/chat_templates/gemma-it.jinja rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/chat_templates/gemma-it.jinja diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/chat_templates/llama-2-chat.jinja b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/chat_templates/llama-2-chat.jinja similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/chat_templates/llama-2-chat.jinja rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/chat_templates/llama-2-chat.jinja diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/chat_templates/llama-3-chat.jinja b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/chat_templates/llama-3-chat.jinja similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/chat_templates/llama-3-chat.jinja rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/chat_templates/llama-3-chat.jinja diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/chat_templates/mistral-instruct.jinja b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/chat_templates/mistral-instruct.jinja similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/chat_templates/mistral-instruct.jinja rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/chat_templates/mistral-instruct.jinja diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/chat_templates/openchat.jinja b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/chat_templates/openchat.jinja similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/chat_templates/openchat.jinja rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/chat_templates/openchat.jinja diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/chat_templates/phi-3.jinja b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/chat_templates/phi-3.jinja similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/chat_templates/phi-3.jinja rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/chat_templates/phi-3.jinja diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/chat_templates/saiga.jinja b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/chat_templates/saiga.jinja similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/chat_templates/saiga.jinja rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/chat_templates/saiga.jinja diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/chat_templates/solar-instruct.jinja b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/chat_templates/solar-instruct.jinja similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/chat_templates/solar-instruct.jinja rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/chat_templates/solar-instruct.jinja diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/chat_templates/vicuna.jinja b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/chat_templates/vicuna.jinja similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/chat_templates/vicuna.jinja rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/chat_templates/vicuna.jinja diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/chat_templates/zephyr.jinja b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/chat_templates/zephyr.jinja similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/chat_templates/zephyr.jinja rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/chat_templates/zephyr.jinja diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/generation_configs/alpaca.json b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/generation_configs/alpaca.json similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/generation_configs/alpaca.json rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/generation_configs/alpaca.json diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/generation_configs/amberchat.json b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/generation_configs/amberchat.json similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/generation_configs/amberchat.json rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/generation_configs/amberchat.json diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/generation_configs/chatqa.json b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/generation_configs/chatqa.json similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/generation_configs/chatqa.json rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/generation_configs/chatqa.json diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/generation_configs/gemma-it.json b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/generation_configs/gemma-it.json similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/generation_configs/gemma-it.json rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/generation_configs/gemma-it.json diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/generation_configs/llama-2-chat.json b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/generation_configs/llama-2-chat.json similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/generation_configs/llama-2-chat.json rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/generation_configs/llama-2-chat.json diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/generation_configs/llama-3-chat.json b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/generation_configs/llama-3-chat.json similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/generation_configs/llama-3-chat.json rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/generation_configs/llama-3-chat.json diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/generation_configs/mistral-instruct.json b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/generation_configs/mistral-instruct.json similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/generation_configs/mistral-instruct.json rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/generation_configs/mistral-instruct.json diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/generation_configs/openchat.json b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/generation_configs/openchat.json similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/generation_configs/openchat.json rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/generation_configs/openchat.json diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/generation_configs/orca-2.json b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/generation_configs/orca-2.json similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/generation_configs/orca-2.json rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/generation_configs/orca-2.json diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/generation_configs/phi-3.json b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/generation_configs/phi-3.json similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/generation_configs/phi-3.json rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/generation_configs/phi-3.json diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/generation_configs/qwen2-chat.json b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/generation_configs/qwen2-chat.json similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/generation_configs/qwen2-chat.json rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/generation_configs/qwen2-chat.json diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/generation_configs/saiga.json b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/generation_configs/saiga.json similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/generation_configs/saiga.json rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/generation_configs/saiga.json diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/generation_configs/solar-instruct.json b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/generation_configs/solar-instruct.json similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/generation_configs/solar-instruct.json rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/generation_configs/solar-instruct.json diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/generation_configs/vicuna.json b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/generation_configs/vicuna.json similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/generation_configs/vicuna.json rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/generation_configs/vicuna.json diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/generation_configs/yi-chat.json b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/generation_configs/yi-chat.json similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/generation_configs/yi-chat.json rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/generation_configs/yi-chat.json diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/generation_configs/zephyr.json b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/generation_configs/zephyr.json similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/chat_templates/generation_configs/zephyr.json rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/chat_templates/generation_configs/zephyr.json diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/service.py b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/service.py similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/service.py rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/service.py diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/404.html b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/404.html similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/404.html rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/404.html diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/700-532b1fe2415e5859.js b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/700-532b1fe2415e5859.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/700-532b1fe2415e5859.js rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/700-532b1fe2415e5859.js diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/995-34374f39bb210839.js b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/995-34374f39bb210839.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/995-34374f39bb210839.js rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/995-34374f39bb210839.js diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/css/429544bd3cd8ce3a.css b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/css/429544bd3cd8ce3a.css similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/css/429544bd3cd8ce3a.css rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/css/429544bd3cd8ce3a.css diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/css/5b67f082b31cfc7b.css b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/css/5b67f082b31cfc7b.css similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/css/5b67f082b31cfc7b.css rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/css/5b67f082b31cfc7b.css diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/css/9e63023b20ddb15e.css b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/css/9e63023b20ddb15e.css similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/_next/static/css/9e63023b20ddb15e.css rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/_next/static/css/9e63023b20ddb15e.css diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/apple-touch-icon.png b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/apple-touch-icon.png similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/apple-touch-icon.png rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/apple-touch-icon.png diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/chat.html b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/chat.html similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/chat.html rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/chat.html diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/chat.txt b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/chat.txt similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/chat.txt rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/chat.txt diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/favicon-16x16.png b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/favicon-16x16.png similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/favicon-16x16.png rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/favicon-16x16.png diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/favicon.ico b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/favicon.ico similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/favicon.ico rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/favicon.ico diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/index.html b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/index.html similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/index.html rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/index.html diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/index.txt b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/index.txt similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/src/ui/index.txt rename to bentoml/bentos/qwen2/72b-instruct-awq-4bit-15fd/src/ui/index.txt diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/README.md b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/README.md deleted file mode 100644 index fd5a6a8..0000000 --- a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/README.md +++ /dev/null @@ -1,16 +0,0 @@ -# qwen2:72b-instruct-awq-4bit-f44a - -[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) -[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) -[![join_slack](https://badgen.net/badge/Join/BentoML%20Slack/cyan?icon=slack)](https://l.bentoml.com/join-slack-swagger) -[![BentoML GitHub Repo](https://img.shields.io/github/stars/bentoml/bentoml?style=social)](https://github.com/bentoml/BentoML) -[![Twitter Follow](https://img.shields.io/twitter/follow/bentomlai?label=Follow%20BentoML&style=social)](https://twitter.com/bentomlai) - -This is a Machine Learning Service created with BentoML. - -## Help - -* [📖 Documentation](https://docs.bentoml.com/en/latest/): Learn how to use BentoML. -* [💬 Community](https://l.bentoml.com/join-slack-swagger): Join the BentoML Slack community. -* [🐛 GitHub Issues](https://github.com/bentoml/BentoML/issues): Report bugs and feature requests. -* Tip: you can also [customize this README](https://docs.bentoml.com/en/latest/concepts/bento.html#description). diff --git a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/env/python/requirements.lock.txt b/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/env/python/requirements.lock.txt deleted file mode 100644 index 925ce19..0000000 --- a/bentoml/bentos/qwen2/72b-instruct-awq-4bit-f44a/env/python/requirements.lock.txt +++ /dev/null @@ -1,147 +0,0 @@ -aiohttp==3.9.5 -aiosignal==1.3.1 -annotated-types==0.7.0 -anyio==4.4.0 -appdirs==1.4.4 -asgiref==3.8.1 -async-timeout==4.0.3 -attrs==23.2.0 -bentoml==1.2.19 -build==1.2.1 -cattrs==23.1.2 -certifi==2024.7.4 -charset-normalizer==3.3.2 -circus==0.18.0 -click==8.1.7 -click-option-group==0.5.6 -cloudpickle==3.0.0 -cmake==3.30.0 -deepmerge==1.1.1 -deprecated==1.2.14 -diskcache==5.6.3 -distro==1.9.0 -dnspython==2.6.1 -email-validator==2.2.0 -exceptiongroup==1.2.1 -fastapi==0.111.0 -fastapi-cli==0.0.4 -filelock==3.15.4 -frozenlist==1.4.1 -fs==2.4.16 -fsspec==2024.6.1 -h11==0.14.0 -httpcore==1.0.5 -httptools==0.6.1 -httpx==0.27.0 -httpx-ws==0.6.0 -huggingface-hub==0.23.4 -idna==3.7 -importlib-metadata==6.11.0 -inflection==0.5.1 -interegular==0.3.3 -jinja2==3.1.4 -joblib==1.4.2 -jsonschema==4.22.0 -jsonschema-specifications==2023.12.1 -lark==1.1.9 -llvmlite==0.43.0 -lm-format-enforcer==0.10.1 -markdown-it-py==3.0.0 -markupsafe==2.1.5 -mdurl==0.1.2 -mpmath==1.3.0 -msgpack==1.0.8 -multidict==6.0.5 -nest-asyncio==1.6.0 -networkx==3.2.1 -ninja==1.11.1.1 -numba==0.60.0 -numpy==1.26.0 -nvidia-cublas-cu12==12.1.3.1 -nvidia-cuda-cupti-cu12==12.1.105 -nvidia-cuda-nvrtc-cu12==12.1.105 -nvidia-cuda-runtime-cu12==12.1.105 -nvidia-cudnn-cu12==8.9.2.26 -nvidia-cufft-cu12==11.0.2.54 -nvidia-curand-cu12==10.3.2.106 -nvidia-cusolver-cu12==11.4.5.107 -nvidia-cusparse-cu12==12.1.0.106 -nvidia-ml-py==11.525.150 -nvidia-nccl-cu12==2.20.5 -nvidia-nvjitlink-cu12==12.5.82 -nvidia-nvtx-cu12==12.1.105 -openai==1.35.10 -opentelemetry-api==1.20.0 -opentelemetry-instrumentation==0.41b0 -opentelemetry-instrumentation-aiohttp-client==0.41b0 -opentelemetry-instrumentation-asgi==0.41b0 -opentelemetry-sdk==1.20.0 -opentelemetry-semantic-conventions==0.41b0 -opentelemetry-util-http==0.41b0 -orjson==3.10.6 -outlines==0.0.34 -packaging==24.1 -pathspec==0.12.1 -pip-requirements-parser==32.0.1 -pip-tools==7.4.1 -prometheus-client==0.20.0 -prometheus-fastapi-instrumentator==7.0.0 -protobuf==5.27.2 -psutil==6.0.0 -py-cpuinfo==9.0.0 -pydantic==2.8.2 -pydantic-core==2.20.1 -pygments==2.18.0 -pyparsing==3.1.2 -pyproject-hooks==1.1.0 -python-dateutil==2.9.0.post0 -python-dotenv==1.0.1 -python-json-logger==2.0.7 -python-multipart==0.0.9 -pyyaml==6.0.1 -pyzmq==26.0.3 -ray==2.31.0 -referencing==0.35.1 -regex==2024.5.15 -requests==2.32.3 -rich==13.7.1 -rpds-py==0.18.1 -safetensors==0.4.3 -schema==0.7.7 -scipy==1.13.1 -sentencepiece==0.2.0 -shellingham==1.5.4 -simple-di==0.1.5 -six==1.16.0 -sniffio==1.3.1 -starlette==0.37.2 -sympy==1.12.1 -tiktoken==0.7.0 -tokenizers==0.19.1 -tomli==2.0.1 -tomli-w==1.0.0 -torch==2.3.0 -tornado==6.4.1 -tqdm==4.66.4 -transformers==4.41.0 -triton==2.3.0 -typer==0.12.3 -typing-extensions==4.12.2 -ujson==5.10.0 -urllib3==2.2.2 -uvicorn[standard]==0.30.1 -uvloop==0.19.0 -vllm==0.4.3 -vllm-flash-attn==2.5.8.post2 -watchfiles==0.22.0 -websockets==12.0 -wheel==0.43.0 -wrapt==1.16.0 -wsproto==1.2.0 -xformers==0.0.26.post1 -yarl==1.9.4 -zipp==3.19.2 - -# The following packages are considered to be unsafe in a requirements file: -pip==24.1.2 -setuptools==70.2.0 diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/README.md b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/README.md new file mode 100644 index 0000000..4d581f2 --- /dev/null +++ b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/README.md @@ -0,0 +1,16 @@ +# qwen2:72b-instruct-fp16-7b44 + +[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) +[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) +[![join_slack](https://badgen.net/badge/Join/BentoML%20Slack/cyan?icon=slack)](https://l.bentoml.com/join-slack-swagger) +[![BentoML GitHub Repo](https://img.shields.io/github/stars/bentoml/bentoml?style=social)](https://github.com/bentoml/BentoML) +[![Twitter Follow](https://img.shields.io/twitter/follow/bentomlai?label=Follow%20BentoML&style=social)](https://twitter.com/bentomlai) + +This is a Machine Learning Service created with BentoML. + +## Help + +* [📖 Documentation](https://docs.bentoml.com/en/latest/): Learn how to use BentoML. +* [💬 Community](https://l.bentoml.com/join-slack-swagger): Join the BentoML Slack community. +* [🐛 GitHub Issues](https://github.com/bentoml/BentoML/issues): Report bugs and feature requests. +* Tip: you can also [customize this README](https://docs.bentoml.com/en/latest/concepts/bento.html#description). diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/apis/openapi.yaml b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/apis/openapi.yaml similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/apis/openapi.yaml rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/apis/openapi.yaml diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/apis/schema.json b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/apis/schema.json similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/apis/schema.json rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/apis/schema.json diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/bento.yaml b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/bento.yaml similarity index 95% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/bento.yaml rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/bento.yaml index bdbe2a8..a5e255d 100644 --- a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/bento.yaml +++ b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/bento.yaml @@ -1,12 +1,11 @@ service: service:VLLM name: qwen2 -version: 72b-instruct-fp16-8d53 +version: 72b-instruct-fp16-7b44 bentoml_version: 1.2.19 -creation_time: '2024-07-08T08:07:07.352770+00:00' +creation_time: '2024-07-12T13:52:06.649672+00:00' labels: + model_name: Qwen/Qwen2-72B-Instruct openllm_alias: 72b,72b-instruct - openllm_hf_model_id: Qwen/Qwen2-72B-Instruct - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/env/docker/Dockerfile b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/env/docker/Dockerfile similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/env/docker/Dockerfile rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/env/docker/Dockerfile diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/env/docker/entrypoint.sh b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/env/docker/entrypoint.sh similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/env/docker/entrypoint.sh rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/env/docker/entrypoint.sh diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/env/python/install.sh b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/env/python/install.sh similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/env/python/install.sh rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/env/python/install.sh diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/env/python/requirements.lock.txt b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/env/python/requirements.lock.txt new file mode 100644 index 0000000..f6acdf5 --- /dev/null +++ b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/env/python/requirements.lock.txt @@ -0,0 +1,147 @@ +aiohttp==3.9.5 +aiosignal==1.3.1 +annotated-types==0.7.0 +anyio==4.4.0 +appdirs==1.4.4 +asgiref==3.8.1 +async-timeout==4.0.3 +attrs==23.2.0 +bentoml==1.2.19 +build==1.2.1 +cattrs==23.1.2 +certifi==2024.7.4 +charset-normalizer==3.3.2 +circus==0.18.0 +click==8.1.7 +click-option-group==0.5.6 +cloudpickle==3.0.0 +cmake==3.30.0 +deepmerge==1.1.1 +deprecated==1.2.14 +diskcache==5.6.3 +distro==1.9.0 +dnspython==2.6.1 +email-validator==2.2.0 +exceptiongroup==1.2.1 +fastapi==0.111.0 +fastapi-cli==0.0.4 +filelock==3.15.4 +frozenlist==1.4.1 +fs==2.4.16 +fsspec==2024.6.1 +h11==0.14.0 +httpcore==1.0.5 +httptools==0.6.1 +httpx==0.27.0 +httpx-ws==0.6.0 +huggingface-hub==0.23.4 +idna==3.7 +importlib-metadata==6.11.0 +inflection==0.5.1 +interegular==0.3.3 +jinja2==3.1.4 +joblib==1.4.2 +jsonschema==4.23.0 +jsonschema-specifications==2023.12.1 +lark==1.1.9 +llvmlite==0.43.0 +lm-format-enforcer==0.10.1 +markdown-it-py==3.0.0 +markupsafe==2.1.5 +mdurl==0.1.2 +mpmath==1.3.0 +msgpack==1.0.8 +multidict==6.0.5 +nest-asyncio==1.6.0 +networkx==3.2.1 +ninja==1.11.1.1 +numba==0.60.0 +numpy==1.26.0 +nvidia-cublas-cu12==12.1.3.1 +nvidia-cuda-cupti-cu12==12.1.105 +nvidia-cuda-nvrtc-cu12==12.1.105 +nvidia-cuda-runtime-cu12==12.1.105 +nvidia-cudnn-cu12==8.9.2.26 +nvidia-cufft-cu12==11.0.2.54 +nvidia-curand-cu12==10.3.2.106 +nvidia-cusolver-cu12==11.4.5.107 +nvidia-cusparse-cu12==12.1.0.106 +nvidia-ml-py==11.525.150 +nvidia-nccl-cu12==2.20.5 +nvidia-nvjitlink-cu12==12.5.82 +nvidia-nvtx-cu12==12.1.105 +openai==1.35.13 +opentelemetry-api==1.20.0 +opentelemetry-instrumentation==0.41b0 +opentelemetry-instrumentation-aiohttp-client==0.41b0 +opentelemetry-instrumentation-asgi==0.41b0 +opentelemetry-sdk==1.20.0 +opentelemetry-semantic-conventions==0.41b0 +opentelemetry-util-http==0.41b0 +orjson==3.10.6 +outlines==0.0.34 +packaging==24.1 +pathspec==0.12.1 +pip-requirements-parser==32.0.1 +pip-tools==7.4.1 +prometheus-client==0.20.0 +prometheus-fastapi-instrumentator==7.0.0 +protobuf==5.27.2 +psutil==6.0.0 +py-cpuinfo==9.0.0 +pydantic==2.8.2 +pydantic-core==2.20.1 +pygments==2.18.0 +pyparsing==3.1.2 +pyproject-hooks==1.1.0 +python-dateutil==2.9.0.post0 +python-dotenv==1.0.1 +python-json-logger==2.0.7 +python-multipart==0.0.9 +pyyaml==6.0.1 +pyzmq==26.0.3 +ray==2.32.0 +referencing==0.35.1 +regex==2024.5.15 +requests==2.32.3 +rich==13.7.1 +rpds-py==0.19.0 +safetensors==0.4.3 +schema==0.7.7 +scipy==1.13.1 +sentencepiece==0.2.0 +shellingham==1.5.4 +simple-di==0.1.5 +six==1.16.0 +sniffio==1.3.1 +starlette==0.37.2 +sympy==1.13.0 +tiktoken==0.7.0 +tokenizers==0.19.1 +tomli==2.0.1 +tomli-w==1.0.0 +torch==2.3.0 +tornado==6.4.1 +tqdm==4.66.4 +transformers==4.41.0 +triton==2.3.0 +typer==0.12.3 +typing-extensions==4.12.2 +ujson==5.10.0 +urllib3==2.2.2 +uvicorn[standard]==0.30.1 +uvloop==0.19.0 +vllm==0.4.3 +vllm-flash-attn==2.5.8.post2 +watchfiles==0.22.0 +websockets==12.0 +wheel==0.43.0 +wrapt==1.16.0 +wsproto==1.2.0 +xformers==0.0.26.post1 +yarl==1.9.4 +zipp==3.19.2 + +# The following packages are considered to be unsafe in a requirements file: +pip==24.1.2 +setuptools==70.3.0 diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/env/python/requirements.txt b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/env/python/requirements.txt similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/env/python/requirements.txt rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/env/python/requirements.txt diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/env/python/version.txt b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/env/python/version.txt similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/env/python/version.txt rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/env/python/version.txt diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/bento_constants.py b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/bento_constants.py similarity index 86% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/bento_constants.py rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/bento_constants.py index df7065c..00671df 100644 --- a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/bento_constants.py +++ b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/bento_constants.py @@ -5,8 +5,8 @@ max_model_len: 2048 model: Qwen/Qwen2-72B-Instruct extra_labels: + model_name: Qwen/Qwen2-72B-Instruct openllm_alias: 72b,72b-instruct - openllm_hf_model_id: Qwen/Qwen2-72B-Instruct project: vllm-chat service_config: name: qwen2 diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/bentofile.yaml b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/bentofile.yaml similarity index 93% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/bentofile.yaml rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/bentofile.yaml index 441f618..de8f2cb 100644 --- a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/bentofile.yaml +++ b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/bentofile.yaml @@ -28,9 +28,8 @@ include: - chat_templates/chat_templates/*.jinja - chat_templates/generation_configs/*.json labels: + model_name: Qwen/Qwen2-72B-Instruct openllm_alias: 72b,72b-instruct - openllm_hf_model_id: Qwen/Qwen2-72B-Instruct - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/chat_templates/alpaca.jinja b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/chat_templates/alpaca.jinja similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/chat_templates/alpaca.jinja rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/chat_templates/alpaca.jinja diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/chat_templates/amberchat.jinja b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/chat_templates/amberchat.jinja similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/chat_templates/amberchat.jinja rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/chat_templates/amberchat.jinja diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/chat_templates/chatml.jinja b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/chat_templates/chatml.jinja similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/chat_templates/chatml.jinja rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/chat_templates/chatml.jinja diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/chat_templates/chatqa.jinja b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/chat_templates/chatqa.jinja similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/chat_templates/chatqa.jinja rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/chat_templates/chatqa.jinja diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/chat_templates/falcon-instruct.jinja b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/chat_templates/falcon-instruct.jinja similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/chat_templates/falcon-instruct.jinja rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/chat_templates/falcon-instruct.jinja diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/chat_templates/gemma-it.jinja b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/chat_templates/gemma-it.jinja similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/chat_templates/gemma-it.jinja rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/chat_templates/gemma-it.jinja diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/chat_templates/llama-2-chat.jinja b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/chat_templates/llama-2-chat.jinja similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/chat_templates/llama-2-chat.jinja rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/chat_templates/llama-2-chat.jinja diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/chat_templates/llama-3-chat.jinja b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/chat_templates/llama-3-chat.jinja similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/chat_templates/llama-3-chat.jinja rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/chat_templates/llama-3-chat.jinja diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/chat_templates/mistral-instruct.jinja b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/chat_templates/mistral-instruct.jinja similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/chat_templates/mistral-instruct.jinja rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/chat_templates/mistral-instruct.jinja diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/chat_templates/openchat.jinja b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/chat_templates/openchat.jinja similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/chat_templates/openchat.jinja rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/chat_templates/openchat.jinja diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/chat_templates/phi-3.jinja b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/chat_templates/phi-3.jinja similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/chat_templates/phi-3.jinja rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/chat_templates/phi-3.jinja diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/chat_templates/saiga.jinja b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/chat_templates/saiga.jinja similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/chat_templates/saiga.jinja rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/chat_templates/saiga.jinja diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/chat_templates/solar-instruct.jinja b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/chat_templates/solar-instruct.jinja similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/chat_templates/solar-instruct.jinja rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/chat_templates/solar-instruct.jinja diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/chat_templates/vicuna.jinja b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/chat_templates/vicuna.jinja similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/chat_templates/vicuna.jinja rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/chat_templates/vicuna.jinja diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/chat_templates/zephyr.jinja b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/chat_templates/zephyr.jinja similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/chat_templates/zephyr.jinja rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/chat_templates/zephyr.jinja diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/generation_configs/alpaca.json b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/generation_configs/alpaca.json similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/generation_configs/alpaca.json rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/generation_configs/alpaca.json diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/generation_configs/amberchat.json b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/generation_configs/amberchat.json similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/generation_configs/amberchat.json rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/generation_configs/amberchat.json diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/generation_configs/chatqa.json b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/generation_configs/chatqa.json similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/generation_configs/chatqa.json rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/generation_configs/chatqa.json diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/generation_configs/gemma-it.json b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/generation_configs/gemma-it.json similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/generation_configs/gemma-it.json rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/generation_configs/gemma-it.json diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/generation_configs/llama-2-chat.json b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/generation_configs/llama-2-chat.json similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/generation_configs/llama-2-chat.json rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/generation_configs/llama-2-chat.json diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/generation_configs/llama-3-chat.json b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/generation_configs/llama-3-chat.json similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/generation_configs/llama-3-chat.json rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/generation_configs/llama-3-chat.json diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/generation_configs/mistral-instruct.json b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/generation_configs/mistral-instruct.json similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/generation_configs/mistral-instruct.json rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/generation_configs/mistral-instruct.json diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/generation_configs/openchat.json b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/generation_configs/openchat.json similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/generation_configs/openchat.json rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/generation_configs/openchat.json diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/generation_configs/orca-2.json b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/generation_configs/orca-2.json similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/generation_configs/orca-2.json rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/generation_configs/orca-2.json diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/generation_configs/phi-3.json b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/generation_configs/phi-3.json similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/generation_configs/phi-3.json rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/generation_configs/phi-3.json diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/generation_configs/qwen2-chat.json b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/generation_configs/qwen2-chat.json similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/generation_configs/qwen2-chat.json rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/generation_configs/qwen2-chat.json diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/generation_configs/saiga.json b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/generation_configs/saiga.json similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/generation_configs/saiga.json rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/generation_configs/saiga.json diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/generation_configs/solar-instruct.json b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/generation_configs/solar-instruct.json similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/generation_configs/solar-instruct.json rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/generation_configs/solar-instruct.json diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/generation_configs/vicuna.json b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/generation_configs/vicuna.json similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/generation_configs/vicuna.json rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/generation_configs/vicuna.json diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/generation_configs/yi-chat.json b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/generation_configs/yi-chat.json similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/generation_configs/yi-chat.json rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/generation_configs/yi-chat.json diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/generation_configs/zephyr.json b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/generation_configs/zephyr.json similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/chat_templates/generation_configs/zephyr.json rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/chat_templates/generation_configs/zephyr.json diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/service.py b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/service.py similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/service.py rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/service.py diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/404.html b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/404.html similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/404.html rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/404.html diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/700-532b1fe2415e5859.js b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/700-532b1fe2415e5859.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/700-532b1fe2415e5859.js rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/700-532b1fe2415e5859.js diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/995-34374f39bb210839.js b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/995-34374f39bb210839.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/995-34374f39bb210839.js rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/995-34374f39bb210839.js diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/css/429544bd3cd8ce3a.css b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/css/429544bd3cd8ce3a.css similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/css/429544bd3cd8ce3a.css rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/css/429544bd3cd8ce3a.css diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/css/5b67f082b31cfc7b.css b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/css/5b67f082b31cfc7b.css similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/css/5b67f082b31cfc7b.css rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/css/5b67f082b31cfc7b.css diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/css/9e63023b20ddb15e.css b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/css/9e63023b20ddb15e.css similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/_next/static/css/9e63023b20ddb15e.css rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/_next/static/css/9e63023b20ddb15e.css diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/apple-touch-icon.png b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/apple-touch-icon.png similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/apple-touch-icon.png rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/apple-touch-icon.png diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/chat.html b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/chat.html similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/chat.html rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/chat.html diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/chat.txt b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/chat.txt similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/chat.txt rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/chat.txt diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/favicon-16x16.png b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/favicon-16x16.png similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/favicon-16x16.png rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/favicon-16x16.png diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/favicon.ico b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/favicon.ico similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/favicon.ico rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/favicon.ico diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/index.html b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/index.html similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/index.html rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/index.html diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/index.txt b/bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/index.txt similarity index 100% rename from bentoml/bentos/qwen2/72b-instruct-fp16-8d53/src/ui/index.txt rename to bentoml/bentos/qwen2/72b-instruct-fp16-7b44/src/ui/index.txt diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/README.md b/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/README.md deleted file mode 100644 index 15efac1..0000000 --- a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/README.md +++ /dev/null @@ -1,16 +0,0 @@ -# qwen2:72b-instruct-fp16-8d53 - -[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) -[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) -[![join_slack](https://badgen.net/badge/Join/BentoML%20Slack/cyan?icon=slack)](https://l.bentoml.com/join-slack-swagger) -[![BentoML GitHub Repo](https://img.shields.io/github/stars/bentoml/bentoml?style=social)](https://github.com/bentoml/BentoML) -[![Twitter Follow](https://img.shields.io/twitter/follow/bentomlai?label=Follow%20BentoML&style=social)](https://twitter.com/bentomlai) - -This is a Machine Learning Service created with BentoML. - -## Help - -* [📖 Documentation](https://docs.bentoml.com/en/latest/): Learn how to use BentoML. -* [💬 Community](https://l.bentoml.com/join-slack-swagger): Join the BentoML Slack community. -* [🐛 GitHub Issues](https://github.com/bentoml/BentoML/issues): Report bugs and feature requests. -* Tip: you can also [customize this README](https://docs.bentoml.com/en/latest/concepts/bento.html#description). diff --git a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/env/python/requirements.lock.txt b/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/env/python/requirements.lock.txt deleted file mode 100644 index 925ce19..0000000 --- a/bentoml/bentos/qwen2/72b-instruct-fp16-8d53/env/python/requirements.lock.txt +++ /dev/null @@ -1,147 +0,0 @@ -aiohttp==3.9.5 -aiosignal==1.3.1 -annotated-types==0.7.0 -anyio==4.4.0 -appdirs==1.4.4 -asgiref==3.8.1 -async-timeout==4.0.3 -attrs==23.2.0 -bentoml==1.2.19 -build==1.2.1 -cattrs==23.1.2 -certifi==2024.7.4 -charset-normalizer==3.3.2 -circus==0.18.0 -click==8.1.7 -click-option-group==0.5.6 -cloudpickle==3.0.0 -cmake==3.30.0 -deepmerge==1.1.1 -deprecated==1.2.14 -diskcache==5.6.3 -distro==1.9.0 -dnspython==2.6.1 -email-validator==2.2.0 -exceptiongroup==1.2.1 -fastapi==0.111.0 -fastapi-cli==0.0.4 -filelock==3.15.4 -frozenlist==1.4.1 -fs==2.4.16 -fsspec==2024.6.1 -h11==0.14.0 -httpcore==1.0.5 -httptools==0.6.1 -httpx==0.27.0 -httpx-ws==0.6.0 -huggingface-hub==0.23.4 -idna==3.7 -importlib-metadata==6.11.0 -inflection==0.5.1 -interegular==0.3.3 -jinja2==3.1.4 -joblib==1.4.2 -jsonschema==4.22.0 -jsonschema-specifications==2023.12.1 -lark==1.1.9 -llvmlite==0.43.0 -lm-format-enforcer==0.10.1 -markdown-it-py==3.0.0 -markupsafe==2.1.5 -mdurl==0.1.2 -mpmath==1.3.0 -msgpack==1.0.8 -multidict==6.0.5 -nest-asyncio==1.6.0 -networkx==3.2.1 -ninja==1.11.1.1 -numba==0.60.0 -numpy==1.26.0 -nvidia-cublas-cu12==12.1.3.1 -nvidia-cuda-cupti-cu12==12.1.105 -nvidia-cuda-nvrtc-cu12==12.1.105 -nvidia-cuda-runtime-cu12==12.1.105 -nvidia-cudnn-cu12==8.9.2.26 -nvidia-cufft-cu12==11.0.2.54 -nvidia-curand-cu12==10.3.2.106 -nvidia-cusolver-cu12==11.4.5.107 -nvidia-cusparse-cu12==12.1.0.106 -nvidia-ml-py==11.525.150 -nvidia-nccl-cu12==2.20.5 -nvidia-nvjitlink-cu12==12.5.82 -nvidia-nvtx-cu12==12.1.105 -openai==1.35.10 -opentelemetry-api==1.20.0 -opentelemetry-instrumentation==0.41b0 -opentelemetry-instrumentation-aiohttp-client==0.41b0 -opentelemetry-instrumentation-asgi==0.41b0 -opentelemetry-sdk==1.20.0 -opentelemetry-semantic-conventions==0.41b0 -opentelemetry-util-http==0.41b0 -orjson==3.10.6 -outlines==0.0.34 -packaging==24.1 -pathspec==0.12.1 -pip-requirements-parser==32.0.1 -pip-tools==7.4.1 -prometheus-client==0.20.0 -prometheus-fastapi-instrumentator==7.0.0 -protobuf==5.27.2 -psutil==6.0.0 -py-cpuinfo==9.0.0 -pydantic==2.8.2 -pydantic-core==2.20.1 -pygments==2.18.0 -pyparsing==3.1.2 -pyproject-hooks==1.1.0 -python-dateutil==2.9.0.post0 -python-dotenv==1.0.1 -python-json-logger==2.0.7 -python-multipart==0.0.9 -pyyaml==6.0.1 -pyzmq==26.0.3 -ray==2.31.0 -referencing==0.35.1 -regex==2024.5.15 -requests==2.32.3 -rich==13.7.1 -rpds-py==0.18.1 -safetensors==0.4.3 -schema==0.7.7 -scipy==1.13.1 -sentencepiece==0.2.0 -shellingham==1.5.4 -simple-di==0.1.5 -six==1.16.0 -sniffio==1.3.1 -starlette==0.37.2 -sympy==1.12.1 -tiktoken==0.7.0 -tokenizers==0.19.1 -tomli==2.0.1 -tomli-w==1.0.0 -torch==2.3.0 -tornado==6.4.1 -tqdm==4.66.4 -transformers==4.41.0 -triton==2.3.0 -typer==0.12.3 -typing-extensions==4.12.2 -ujson==5.10.0 -urllib3==2.2.2 -uvicorn[standard]==0.30.1 -uvloop==0.19.0 -vllm==0.4.3 -vllm-flash-attn==2.5.8.post2 -watchfiles==0.22.0 -websockets==12.0 -wheel==0.43.0 -wrapt==1.16.0 -wsproto==1.2.0 -xformers==0.0.26.post1 -yarl==1.9.4 -zipp==3.19.2 - -# The following packages are considered to be unsafe in a requirements file: -pip==24.1.2 -setuptools==70.2.0 diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/README.md b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/README.md deleted file mode 100644 index 1c54b21..0000000 --- a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/README.md +++ /dev/null @@ -1,16 +0,0 @@ -# qwen2:7b-instruct-awq-4bit-6b70 - -[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) -[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) -[![join_slack](https://badgen.net/badge/Join/BentoML%20Slack/cyan?icon=slack)](https://l.bentoml.com/join-slack-swagger) -[![BentoML GitHub Repo](https://img.shields.io/github/stars/bentoml/bentoml?style=social)](https://github.com/bentoml/BentoML) -[![Twitter Follow](https://img.shields.io/twitter/follow/bentomlai?label=Follow%20BentoML&style=social)](https://twitter.com/bentomlai) - -This is a Machine Learning Service created with BentoML. - -## Help - -* [📖 Documentation](https://docs.bentoml.com/en/latest/): Learn how to use BentoML. -* [💬 Community](https://l.bentoml.com/join-slack-swagger): Join the BentoML Slack community. -* [🐛 GitHub Issues](https://github.com/bentoml/BentoML/issues): Report bugs and feature requests. -* Tip: you can also [customize this README](https://docs.bentoml.com/en/latest/concepts/bento.html#description). diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/env/python/requirements.lock.txt b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/env/python/requirements.lock.txt deleted file mode 100644 index 925ce19..0000000 --- a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/env/python/requirements.lock.txt +++ /dev/null @@ -1,147 +0,0 @@ -aiohttp==3.9.5 -aiosignal==1.3.1 -annotated-types==0.7.0 -anyio==4.4.0 -appdirs==1.4.4 -asgiref==3.8.1 -async-timeout==4.0.3 -attrs==23.2.0 -bentoml==1.2.19 -build==1.2.1 -cattrs==23.1.2 -certifi==2024.7.4 -charset-normalizer==3.3.2 -circus==0.18.0 -click==8.1.7 -click-option-group==0.5.6 -cloudpickle==3.0.0 -cmake==3.30.0 -deepmerge==1.1.1 -deprecated==1.2.14 -diskcache==5.6.3 -distro==1.9.0 -dnspython==2.6.1 -email-validator==2.2.0 -exceptiongroup==1.2.1 -fastapi==0.111.0 -fastapi-cli==0.0.4 -filelock==3.15.4 -frozenlist==1.4.1 -fs==2.4.16 -fsspec==2024.6.1 -h11==0.14.0 -httpcore==1.0.5 -httptools==0.6.1 -httpx==0.27.0 -httpx-ws==0.6.0 -huggingface-hub==0.23.4 -idna==3.7 -importlib-metadata==6.11.0 -inflection==0.5.1 -interegular==0.3.3 -jinja2==3.1.4 -joblib==1.4.2 -jsonschema==4.22.0 -jsonschema-specifications==2023.12.1 -lark==1.1.9 -llvmlite==0.43.0 -lm-format-enforcer==0.10.1 -markdown-it-py==3.0.0 -markupsafe==2.1.5 -mdurl==0.1.2 -mpmath==1.3.0 -msgpack==1.0.8 -multidict==6.0.5 -nest-asyncio==1.6.0 -networkx==3.2.1 -ninja==1.11.1.1 -numba==0.60.0 -numpy==1.26.0 -nvidia-cublas-cu12==12.1.3.1 -nvidia-cuda-cupti-cu12==12.1.105 -nvidia-cuda-nvrtc-cu12==12.1.105 -nvidia-cuda-runtime-cu12==12.1.105 -nvidia-cudnn-cu12==8.9.2.26 -nvidia-cufft-cu12==11.0.2.54 -nvidia-curand-cu12==10.3.2.106 -nvidia-cusolver-cu12==11.4.5.107 -nvidia-cusparse-cu12==12.1.0.106 -nvidia-ml-py==11.525.150 -nvidia-nccl-cu12==2.20.5 -nvidia-nvjitlink-cu12==12.5.82 -nvidia-nvtx-cu12==12.1.105 -openai==1.35.10 -opentelemetry-api==1.20.0 -opentelemetry-instrumentation==0.41b0 -opentelemetry-instrumentation-aiohttp-client==0.41b0 -opentelemetry-instrumentation-asgi==0.41b0 -opentelemetry-sdk==1.20.0 -opentelemetry-semantic-conventions==0.41b0 -opentelemetry-util-http==0.41b0 -orjson==3.10.6 -outlines==0.0.34 -packaging==24.1 -pathspec==0.12.1 -pip-requirements-parser==32.0.1 -pip-tools==7.4.1 -prometheus-client==0.20.0 -prometheus-fastapi-instrumentator==7.0.0 -protobuf==5.27.2 -psutil==6.0.0 -py-cpuinfo==9.0.0 -pydantic==2.8.2 -pydantic-core==2.20.1 -pygments==2.18.0 -pyparsing==3.1.2 -pyproject-hooks==1.1.0 -python-dateutil==2.9.0.post0 -python-dotenv==1.0.1 -python-json-logger==2.0.7 -python-multipart==0.0.9 -pyyaml==6.0.1 -pyzmq==26.0.3 -ray==2.31.0 -referencing==0.35.1 -regex==2024.5.15 -requests==2.32.3 -rich==13.7.1 -rpds-py==0.18.1 -safetensors==0.4.3 -schema==0.7.7 -scipy==1.13.1 -sentencepiece==0.2.0 -shellingham==1.5.4 -simple-di==0.1.5 -six==1.16.0 -sniffio==1.3.1 -starlette==0.37.2 -sympy==1.12.1 -tiktoken==0.7.0 -tokenizers==0.19.1 -tomli==2.0.1 -tomli-w==1.0.0 -torch==2.3.0 -tornado==6.4.1 -tqdm==4.66.4 -transformers==4.41.0 -triton==2.3.0 -typer==0.12.3 -typing-extensions==4.12.2 -ujson==5.10.0 -urllib3==2.2.2 -uvicorn[standard]==0.30.1 -uvloop==0.19.0 -vllm==0.4.3 -vllm-flash-attn==2.5.8.post2 -watchfiles==0.22.0 -websockets==12.0 -wheel==0.43.0 -wrapt==1.16.0 -wsproto==1.2.0 -xformers==0.0.26.post1 -yarl==1.9.4 -zipp==3.19.2 - -# The following packages are considered to be unsafe in a requirements file: -pip==24.1.2 -setuptools==70.2.0 diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/README.md b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/README.md new file mode 100644 index 0000000..8e51a4d --- /dev/null +++ b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/README.md @@ -0,0 +1,16 @@ +# qwen2:7b-instruct-awq-4bit-ce1b + +[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) +[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) +[![join_slack](https://badgen.net/badge/Join/BentoML%20Slack/cyan?icon=slack)](https://l.bentoml.com/join-slack-swagger) +[![BentoML GitHub Repo](https://img.shields.io/github/stars/bentoml/bentoml?style=social)](https://github.com/bentoml/BentoML) +[![Twitter Follow](https://img.shields.io/twitter/follow/bentomlai?label=Follow%20BentoML&style=social)](https://twitter.com/bentomlai) + +This is a Machine Learning Service created with BentoML. + +## Help + +* [📖 Documentation](https://docs.bentoml.com/en/latest/): Learn how to use BentoML. +* [💬 Community](https://l.bentoml.com/join-slack-swagger): Join the BentoML Slack community. +* [🐛 GitHub Issues](https://github.com/bentoml/BentoML/issues): Report bugs and feature requests. +* Tip: you can also [customize this README](https://docs.bentoml.com/en/latest/concepts/bento.html#description). diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/apis/openapi.yaml b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/apis/openapi.yaml similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/apis/openapi.yaml rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/apis/openapi.yaml diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/apis/schema.json b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/apis/schema.json similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/apis/schema.json rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/apis/schema.json diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/bento.yaml b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/bento.yaml similarity index 94% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/bento.yaml rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/bento.yaml index 80a1dd6..1aa9001 100644 --- a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/bento.yaml +++ b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/bento.yaml @@ -1,12 +1,11 @@ service: service:VLLM name: qwen2 -version: 7b-instruct-awq-4bit-6b70 +version: 7b-instruct-awq-4bit-ce1b bentoml_version: 1.2.19 -creation_time: '2024-07-08T08:03:39.433813+00:00' +creation_time: '2024-07-12T13:47:44.941425+00:00' labels: + model_name: Qwen/Qwen2-7B-Instruct-AWQ openllm_alias: 7b-4bit,7b-instruct-4bit - openllm_hf_model_id: Qwen/Qwen2-7B-Instruct-AWQ - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/env/docker/Dockerfile b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/env/docker/Dockerfile similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/env/docker/Dockerfile rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/env/docker/Dockerfile diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/env/docker/entrypoint.sh b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/env/docker/entrypoint.sh similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/env/docker/entrypoint.sh rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/env/docker/entrypoint.sh diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/env/python/install.sh b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/env/python/install.sh similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/env/python/install.sh rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/env/python/install.sh diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/env/python/requirements.lock.txt b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/env/python/requirements.lock.txt new file mode 100644 index 0000000..f6acdf5 --- /dev/null +++ b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/env/python/requirements.lock.txt @@ -0,0 +1,147 @@ +aiohttp==3.9.5 +aiosignal==1.3.1 +annotated-types==0.7.0 +anyio==4.4.0 +appdirs==1.4.4 +asgiref==3.8.1 +async-timeout==4.0.3 +attrs==23.2.0 +bentoml==1.2.19 +build==1.2.1 +cattrs==23.1.2 +certifi==2024.7.4 +charset-normalizer==3.3.2 +circus==0.18.0 +click==8.1.7 +click-option-group==0.5.6 +cloudpickle==3.0.0 +cmake==3.30.0 +deepmerge==1.1.1 +deprecated==1.2.14 +diskcache==5.6.3 +distro==1.9.0 +dnspython==2.6.1 +email-validator==2.2.0 +exceptiongroup==1.2.1 +fastapi==0.111.0 +fastapi-cli==0.0.4 +filelock==3.15.4 +frozenlist==1.4.1 +fs==2.4.16 +fsspec==2024.6.1 +h11==0.14.0 +httpcore==1.0.5 +httptools==0.6.1 +httpx==0.27.0 +httpx-ws==0.6.0 +huggingface-hub==0.23.4 +idna==3.7 +importlib-metadata==6.11.0 +inflection==0.5.1 +interegular==0.3.3 +jinja2==3.1.4 +joblib==1.4.2 +jsonschema==4.23.0 +jsonschema-specifications==2023.12.1 +lark==1.1.9 +llvmlite==0.43.0 +lm-format-enforcer==0.10.1 +markdown-it-py==3.0.0 +markupsafe==2.1.5 +mdurl==0.1.2 +mpmath==1.3.0 +msgpack==1.0.8 +multidict==6.0.5 +nest-asyncio==1.6.0 +networkx==3.2.1 +ninja==1.11.1.1 +numba==0.60.0 +numpy==1.26.0 +nvidia-cublas-cu12==12.1.3.1 +nvidia-cuda-cupti-cu12==12.1.105 +nvidia-cuda-nvrtc-cu12==12.1.105 +nvidia-cuda-runtime-cu12==12.1.105 +nvidia-cudnn-cu12==8.9.2.26 +nvidia-cufft-cu12==11.0.2.54 +nvidia-curand-cu12==10.3.2.106 +nvidia-cusolver-cu12==11.4.5.107 +nvidia-cusparse-cu12==12.1.0.106 +nvidia-ml-py==11.525.150 +nvidia-nccl-cu12==2.20.5 +nvidia-nvjitlink-cu12==12.5.82 +nvidia-nvtx-cu12==12.1.105 +openai==1.35.13 +opentelemetry-api==1.20.0 +opentelemetry-instrumentation==0.41b0 +opentelemetry-instrumentation-aiohttp-client==0.41b0 +opentelemetry-instrumentation-asgi==0.41b0 +opentelemetry-sdk==1.20.0 +opentelemetry-semantic-conventions==0.41b0 +opentelemetry-util-http==0.41b0 +orjson==3.10.6 +outlines==0.0.34 +packaging==24.1 +pathspec==0.12.1 +pip-requirements-parser==32.0.1 +pip-tools==7.4.1 +prometheus-client==0.20.0 +prometheus-fastapi-instrumentator==7.0.0 +protobuf==5.27.2 +psutil==6.0.0 +py-cpuinfo==9.0.0 +pydantic==2.8.2 +pydantic-core==2.20.1 +pygments==2.18.0 +pyparsing==3.1.2 +pyproject-hooks==1.1.0 +python-dateutil==2.9.0.post0 +python-dotenv==1.0.1 +python-json-logger==2.0.7 +python-multipart==0.0.9 +pyyaml==6.0.1 +pyzmq==26.0.3 +ray==2.32.0 +referencing==0.35.1 +regex==2024.5.15 +requests==2.32.3 +rich==13.7.1 +rpds-py==0.19.0 +safetensors==0.4.3 +schema==0.7.7 +scipy==1.13.1 +sentencepiece==0.2.0 +shellingham==1.5.4 +simple-di==0.1.5 +six==1.16.0 +sniffio==1.3.1 +starlette==0.37.2 +sympy==1.13.0 +tiktoken==0.7.0 +tokenizers==0.19.1 +tomli==2.0.1 +tomli-w==1.0.0 +torch==2.3.0 +tornado==6.4.1 +tqdm==4.66.4 +transformers==4.41.0 +triton==2.3.0 +typer==0.12.3 +typing-extensions==4.12.2 +ujson==5.10.0 +urllib3==2.2.2 +uvicorn[standard]==0.30.1 +uvloop==0.19.0 +vllm==0.4.3 +vllm-flash-attn==2.5.8.post2 +watchfiles==0.22.0 +websockets==12.0 +wheel==0.43.0 +wrapt==1.16.0 +wsproto==1.2.0 +xformers==0.0.26.post1 +yarl==1.9.4 +zipp==3.19.2 + +# The following packages are considered to be unsafe in a requirements file: +pip==24.1.2 +setuptools==70.3.0 diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/env/python/requirements.txt b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/env/python/requirements.txt similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/env/python/requirements.txt rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/env/python/requirements.txt diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/env/python/version.txt b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/env/python/version.txt similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/env/python/version.txt rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/env/python/version.txt diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/bento_constants.py b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/bento_constants.py similarity index 85% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/bento_constants.py rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/bento_constants.py index adcb6b4..5f9317b 100644 --- a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/bento_constants.py +++ b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/bento_constants.py @@ -5,8 +5,8 @@ model: Qwen/Qwen2-7B-Instruct-AWQ quantization: awq extra_labels: + model_name: Qwen/Qwen2-7B-Instruct-AWQ openllm_alias: 7b-4bit,7b-instruct-4bit - openllm_hf_model_id: Qwen/Qwen2-7B-Instruct-AWQ project: vllm-chat service_config: name: qwen2 diff --git a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/bentofile.yaml b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/bentofile.yaml similarity index 91% rename from bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/bentofile.yaml rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/bentofile.yaml index 475dcd1..2b23ad7 100644 --- a/bentoml/bentos/mistral/7b-instruct-awq-4bit-33ce/src/bentofile.yaml +++ b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/bentofile.yaml @@ -28,9 +28,8 @@ include: - chat_templates/chat_templates/*.jinja - chat_templates/generation_configs/*.json labels: + model_name: Qwen/Qwen2-7B-Instruct-AWQ openllm_alias: 7b-4bit,7b-instruct-4bit - openllm_hf_model_id: TheBloke/Mistral-7B-Instruct-v0.1-AWQ - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/chat_templates/alpaca.jinja b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/chat_templates/alpaca.jinja similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/chat_templates/alpaca.jinja rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/chat_templates/alpaca.jinja diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/chat_templates/amberchat.jinja b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/chat_templates/amberchat.jinja similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/chat_templates/amberchat.jinja rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/chat_templates/amberchat.jinja diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/chat_templates/chatml.jinja b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/chat_templates/chatml.jinja similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/chat_templates/chatml.jinja rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/chat_templates/chatml.jinja diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/chat_templates/chatqa.jinja b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/chat_templates/chatqa.jinja similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/chat_templates/chatqa.jinja rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/chat_templates/chatqa.jinja diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/chat_templates/falcon-instruct.jinja b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/chat_templates/falcon-instruct.jinja similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/chat_templates/falcon-instruct.jinja rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/chat_templates/falcon-instruct.jinja diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/chat_templates/gemma-it.jinja b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/chat_templates/gemma-it.jinja similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/chat_templates/gemma-it.jinja rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/chat_templates/gemma-it.jinja diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/chat_templates/llama-2-chat.jinja b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/chat_templates/llama-2-chat.jinja similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/chat_templates/llama-2-chat.jinja rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/chat_templates/llama-2-chat.jinja diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/chat_templates/llama-3-chat.jinja b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/chat_templates/llama-3-chat.jinja similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/chat_templates/llama-3-chat.jinja rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/chat_templates/llama-3-chat.jinja diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/chat_templates/mistral-instruct.jinja b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/chat_templates/mistral-instruct.jinja similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/chat_templates/mistral-instruct.jinja rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/chat_templates/mistral-instruct.jinja diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/chat_templates/openchat.jinja b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/chat_templates/openchat.jinja similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/chat_templates/openchat.jinja rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/chat_templates/openchat.jinja diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/chat_templates/phi-3.jinja b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/chat_templates/phi-3.jinja similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/chat_templates/phi-3.jinja rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/chat_templates/phi-3.jinja diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/chat_templates/saiga.jinja b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/chat_templates/saiga.jinja similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/chat_templates/saiga.jinja rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/chat_templates/saiga.jinja diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/chat_templates/solar-instruct.jinja b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/chat_templates/solar-instruct.jinja similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/chat_templates/solar-instruct.jinja rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/chat_templates/solar-instruct.jinja diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/chat_templates/vicuna.jinja b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/chat_templates/vicuna.jinja similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/chat_templates/vicuna.jinja rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/chat_templates/vicuna.jinja diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/chat_templates/zephyr.jinja b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/chat_templates/zephyr.jinja similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/chat_templates/zephyr.jinja rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/chat_templates/zephyr.jinja diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/generation_configs/alpaca.json b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/generation_configs/alpaca.json similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/generation_configs/alpaca.json rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/generation_configs/alpaca.json diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/generation_configs/amberchat.json b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/generation_configs/amberchat.json similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/generation_configs/amberchat.json rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/generation_configs/amberchat.json diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/generation_configs/chatqa.json b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/generation_configs/chatqa.json similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/generation_configs/chatqa.json rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/generation_configs/chatqa.json diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/generation_configs/gemma-it.json b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/generation_configs/gemma-it.json similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/generation_configs/gemma-it.json rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/generation_configs/gemma-it.json diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/generation_configs/llama-2-chat.json b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/generation_configs/llama-2-chat.json similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/generation_configs/llama-2-chat.json rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/generation_configs/llama-2-chat.json diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/generation_configs/llama-3-chat.json b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/generation_configs/llama-3-chat.json similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/generation_configs/llama-3-chat.json rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/generation_configs/llama-3-chat.json diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/generation_configs/mistral-instruct.json b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/generation_configs/mistral-instruct.json similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/generation_configs/mistral-instruct.json rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/generation_configs/mistral-instruct.json diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/generation_configs/openchat.json b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/generation_configs/openchat.json similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/generation_configs/openchat.json rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/generation_configs/openchat.json diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/generation_configs/orca-2.json b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/generation_configs/orca-2.json similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/generation_configs/orca-2.json rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/generation_configs/orca-2.json diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/generation_configs/phi-3.json b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/generation_configs/phi-3.json similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/generation_configs/phi-3.json rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/generation_configs/phi-3.json diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/generation_configs/qwen2-chat.json b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/generation_configs/qwen2-chat.json similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/generation_configs/qwen2-chat.json rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/generation_configs/qwen2-chat.json diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/generation_configs/saiga.json b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/generation_configs/saiga.json similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/generation_configs/saiga.json rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/generation_configs/saiga.json diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/generation_configs/solar-instruct.json b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/generation_configs/solar-instruct.json similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/generation_configs/solar-instruct.json rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/generation_configs/solar-instruct.json diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/generation_configs/vicuna.json b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/generation_configs/vicuna.json similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/generation_configs/vicuna.json rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/generation_configs/vicuna.json diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/generation_configs/yi-chat.json b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/generation_configs/yi-chat.json similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/generation_configs/yi-chat.json rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/generation_configs/yi-chat.json diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/generation_configs/zephyr.json b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/generation_configs/zephyr.json similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/chat_templates/generation_configs/zephyr.json rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/chat_templates/generation_configs/zephyr.json diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/service.py b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/service.py similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/service.py rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/service.py diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/404.html b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/404.html similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/404.html rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/404.html diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/700-532b1fe2415e5859.js b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/700-532b1fe2415e5859.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/700-532b1fe2415e5859.js rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/700-532b1fe2415e5859.js diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/995-34374f39bb210839.js b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/995-34374f39bb210839.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/995-34374f39bb210839.js rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/995-34374f39bb210839.js diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/css/429544bd3cd8ce3a.css b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/css/429544bd3cd8ce3a.css similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/css/429544bd3cd8ce3a.css rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/css/429544bd3cd8ce3a.css diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/css/5b67f082b31cfc7b.css b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/css/5b67f082b31cfc7b.css similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/css/5b67f082b31cfc7b.css rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/css/5b67f082b31cfc7b.css diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/css/9e63023b20ddb15e.css b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/css/9e63023b20ddb15e.css similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/_next/static/css/9e63023b20ddb15e.css rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/_next/static/css/9e63023b20ddb15e.css diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/apple-touch-icon.png b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/apple-touch-icon.png similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/apple-touch-icon.png rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/apple-touch-icon.png diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/chat.html b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/chat.html similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/chat.html rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/chat.html diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/chat.txt b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/chat.txt similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/chat.txt rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/chat.txt diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/favicon-16x16.png b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/favicon-16x16.png similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/favicon-16x16.png rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/favicon-16x16.png diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/favicon.ico b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/favicon.ico similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/favicon.ico rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/favicon.ico diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/index.html b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/index.html similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/index.html rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/index.html diff --git a/bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/index.txt b/bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/index.txt similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-awq-4bit-6b70/src/ui/index.txt rename to bentoml/bentos/qwen2/7b-instruct-awq-4bit-ce1b/src/ui/index.txt diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/README.md b/bentoml/bentos/qwen2/7b-instruct-fp16-805b/README.md deleted file mode 100644 index e10ffbd..0000000 --- a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/README.md +++ /dev/null @@ -1,16 +0,0 @@ -# qwen2:7b-instruct-fp16-805b - -[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) -[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) -[![join_slack](https://badgen.net/badge/Join/BentoML%20Slack/cyan?icon=slack)](https://l.bentoml.com/join-slack-swagger) -[![BentoML GitHub Repo](https://img.shields.io/github/stars/bentoml/bentoml?style=social)](https://github.com/bentoml/BentoML) -[![Twitter Follow](https://img.shields.io/twitter/follow/bentomlai?label=Follow%20BentoML&style=social)](https://twitter.com/bentomlai) - -This is a Machine Learning Service created with BentoML. - -## Help - -* [📖 Documentation](https://docs.bentoml.com/en/latest/): Learn how to use BentoML. -* [💬 Community](https://l.bentoml.com/join-slack-swagger): Join the BentoML Slack community. -* [🐛 GitHub Issues](https://github.com/bentoml/BentoML/issues): Report bugs and feature requests. -* Tip: you can also [customize this README](https://docs.bentoml.com/en/latest/concepts/bento.html#description). diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/env/python/requirements.lock.txt b/bentoml/bentos/qwen2/7b-instruct-fp16-805b/env/python/requirements.lock.txt deleted file mode 100644 index 925ce19..0000000 --- a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/env/python/requirements.lock.txt +++ /dev/null @@ -1,147 +0,0 @@ -aiohttp==3.9.5 -aiosignal==1.3.1 -annotated-types==0.7.0 -anyio==4.4.0 -appdirs==1.4.4 -asgiref==3.8.1 -async-timeout==4.0.3 -attrs==23.2.0 -bentoml==1.2.19 -build==1.2.1 -cattrs==23.1.2 -certifi==2024.7.4 -charset-normalizer==3.3.2 -circus==0.18.0 -click==8.1.7 -click-option-group==0.5.6 -cloudpickle==3.0.0 -cmake==3.30.0 -deepmerge==1.1.1 -deprecated==1.2.14 -diskcache==5.6.3 -distro==1.9.0 -dnspython==2.6.1 -email-validator==2.2.0 -exceptiongroup==1.2.1 -fastapi==0.111.0 -fastapi-cli==0.0.4 -filelock==3.15.4 -frozenlist==1.4.1 -fs==2.4.16 -fsspec==2024.6.1 -h11==0.14.0 -httpcore==1.0.5 -httptools==0.6.1 -httpx==0.27.0 -httpx-ws==0.6.0 -huggingface-hub==0.23.4 -idna==3.7 -importlib-metadata==6.11.0 -inflection==0.5.1 -interegular==0.3.3 -jinja2==3.1.4 -joblib==1.4.2 -jsonschema==4.22.0 -jsonschema-specifications==2023.12.1 -lark==1.1.9 -llvmlite==0.43.0 -lm-format-enforcer==0.10.1 -markdown-it-py==3.0.0 -markupsafe==2.1.5 -mdurl==0.1.2 -mpmath==1.3.0 -msgpack==1.0.8 -multidict==6.0.5 -nest-asyncio==1.6.0 -networkx==3.2.1 -ninja==1.11.1.1 -numba==0.60.0 -numpy==1.26.0 -nvidia-cublas-cu12==12.1.3.1 -nvidia-cuda-cupti-cu12==12.1.105 -nvidia-cuda-nvrtc-cu12==12.1.105 -nvidia-cuda-runtime-cu12==12.1.105 -nvidia-cudnn-cu12==8.9.2.26 -nvidia-cufft-cu12==11.0.2.54 -nvidia-curand-cu12==10.3.2.106 -nvidia-cusolver-cu12==11.4.5.107 -nvidia-cusparse-cu12==12.1.0.106 -nvidia-ml-py==11.525.150 -nvidia-nccl-cu12==2.20.5 -nvidia-nvjitlink-cu12==12.5.82 -nvidia-nvtx-cu12==12.1.105 -openai==1.35.10 -opentelemetry-api==1.20.0 -opentelemetry-instrumentation==0.41b0 -opentelemetry-instrumentation-aiohttp-client==0.41b0 -opentelemetry-instrumentation-asgi==0.41b0 -opentelemetry-sdk==1.20.0 -opentelemetry-semantic-conventions==0.41b0 -opentelemetry-util-http==0.41b0 -orjson==3.10.6 -outlines==0.0.34 -packaging==24.1 -pathspec==0.12.1 -pip-requirements-parser==32.0.1 -pip-tools==7.4.1 -prometheus-client==0.20.0 -prometheus-fastapi-instrumentator==7.0.0 -protobuf==5.27.2 -psutil==6.0.0 -py-cpuinfo==9.0.0 -pydantic==2.8.2 -pydantic-core==2.20.1 -pygments==2.18.0 -pyparsing==3.1.2 -pyproject-hooks==1.1.0 -python-dateutil==2.9.0.post0 -python-dotenv==1.0.1 -python-json-logger==2.0.7 -python-multipart==0.0.9 -pyyaml==6.0.1 -pyzmq==26.0.3 -ray==2.31.0 -referencing==0.35.1 -regex==2024.5.15 -requests==2.32.3 -rich==13.7.1 -rpds-py==0.18.1 -safetensors==0.4.3 -schema==0.7.7 -scipy==1.13.1 -sentencepiece==0.2.0 -shellingham==1.5.4 -simple-di==0.1.5 -six==1.16.0 -sniffio==1.3.1 -starlette==0.37.2 -sympy==1.12.1 -tiktoken==0.7.0 -tokenizers==0.19.1 -tomli==2.0.1 -tomli-w==1.0.0 -torch==2.3.0 -tornado==6.4.1 -tqdm==4.66.4 -transformers==4.41.0 -triton==2.3.0 -typer==0.12.3 -typing-extensions==4.12.2 -ujson==5.10.0 -urllib3==2.2.2 -uvicorn[standard]==0.30.1 -uvloop==0.19.0 -vllm==0.4.3 -vllm-flash-attn==2.5.8.post2 -watchfiles==0.22.0 -websockets==12.0 -wheel==0.43.0 -wrapt==1.16.0 -wsproto==1.2.0 -xformers==0.0.26.post1 -yarl==1.9.4 -zipp==3.19.2 - -# The following packages are considered to be unsafe in a requirements file: -pip==24.1.2 -setuptools==70.2.0 diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-844c/README.md b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/README.md new file mode 100644 index 0000000..9ffa9c4 --- /dev/null +++ b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/README.md @@ -0,0 +1,16 @@ +# qwen2:7b-instruct-fp16-844c + +[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML) +[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/) +[![join_slack](https://badgen.net/badge/Join/BentoML%20Slack/cyan?icon=slack)](https://l.bentoml.com/join-slack-swagger) +[![BentoML GitHub Repo](https://img.shields.io/github/stars/bentoml/bentoml?style=social)](https://github.com/bentoml/BentoML) +[![Twitter Follow](https://img.shields.io/twitter/follow/bentomlai?label=Follow%20BentoML&style=social)](https://twitter.com/bentomlai) + +This is a Machine Learning Service created with BentoML. + +## Help + +* [📖 Documentation](https://docs.bentoml.com/en/latest/): Learn how to use BentoML. +* [💬 Community](https://l.bentoml.com/join-slack-swagger): Join the BentoML Slack community. +* [🐛 GitHub Issues](https://github.com/bentoml/BentoML/issues): Report bugs and feature requests. +* Tip: you can also [customize this README](https://docs.bentoml.com/en/latest/concepts/bento.html#description). diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/apis/openapi.yaml b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/apis/openapi.yaml similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/apis/openapi.yaml rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/apis/openapi.yaml diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/apis/schema.json b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/apis/schema.json similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/apis/schema.json rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/apis/schema.json diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/bento.yaml b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/bento.yaml similarity index 95% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/bento.yaml rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/bento.yaml index 936e46a..97b506c 100644 --- a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/bento.yaml +++ b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/bento.yaml @@ -1,12 +1,11 @@ service: service:VLLM name: qwen2 -version: 7b-instruct-fp16-805b +version: 7b-instruct-fp16-844c bentoml_version: 1.2.19 -creation_time: '2024-07-08T08:04:26.795593+00:00' +creation_time: '2024-07-12T13:48:44.992066+00:00' labels: + model_name: Qwen/Qwen2-7B-Instruct openllm_alias: 7b,7b-instruct - openllm_hf_model_id: Qwen/Qwen2-7B-Instruct - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/env/docker/Dockerfile b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/env/docker/Dockerfile similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/env/docker/Dockerfile rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/env/docker/Dockerfile diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/env/docker/entrypoint.sh b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/env/docker/entrypoint.sh similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/env/docker/entrypoint.sh rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/env/docker/entrypoint.sh diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/env/python/install.sh b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/env/python/install.sh similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/env/python/install.sh rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/env/python/install.sh diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-844c/env/python/requirements.lock.txt b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/env/python/requirements.lock.txt new file mode 100644 index 0000000..f6acdf5 --- /dev/null +++ b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/env/python/requirements.lock.txt @@ -0,0 +1,147 @@ +aiohttp==3.9.5 +aiosignal==1.3.1 +annotated-types==0.7.0 +anyio==4.4.0 +appdirs==1.4.4 +asgiref==3.8.1 +async-timeout==4.0.3 +attrs==23.2.0 +bentoml==1.2.19 +build==1.2.1 +cattrs==23.1.2 +certifi==2024.7.4 +charset-normalizer==3.3.2 +circus==0.18.0 +click==8.1.7 +click-option-group==0.5.6 +cloudpickle==3.0.0 +cmake==3.30.0 +deepmerge==1.1.1 +deprecated==1.2.14 +diskcache==5.6.3 +distro==1.9.0 +dnspython==2.6.1 +email-validator==2.2.0 +exceptiongroup==1.2.1 +fastapi==0.111.0 +fastapi-cli==0.0.4 +filelock==3.15.4 +frozenlist==1.4.1 +fs==2.4.16 +fsspec==2024.6.1 +h11==0.14.0 +httpcore==1.0.5 +httptools==0.6.1 +httpx==0.27.0 +httpx-ws==0.6.0 +huggingface-hub==0.23.4 +idna==3.7 +importlib-metadata==6.11.0 +inflection==0.5.1 +interegular==0.3.3 +jinja2==3.1.4 +joblib==1.4.2 +jsonschema==4.23.0 +jsonschema-specifications==2023.12.1 +lark==1.1.9 +llvmlite==0.43.0 +lm-format-enforcer==0.10.1 +markdown-it-py==3.0.0 +markupsafe==2.1.5 +mdurl==0.1.2 +mpmath==1.3.0 +msgpack==1.0.8 +multidict==6.0.5 +nest-asyncio==1.6.0 +networkx==3.2.1 +ninja==1.11.1.1 +numba==0.60.0 +numpy==1.26.0 +nvidia-cublas-cu12==12.1.3.1 +nvidia-cuda-cupti-cu12==12.1.105 +nvidia-cuda-nvrtc-cu12==12.1.105 +nvidia-cuda-runtime-cu12==12.1.105 +nvidia-cudnn-cu12==8.9.2.26 +nvidia-cufft-cu12==11.0.2.54 +nvidia-curand-cu12==10.3.2.106 +nvidia-cusolver-cu12==11.4.5.107 +nvidia-cusparse-cu12==12.1.0.106 +nvidia-ml-py==11.525.150 +nvidia-nccl-cu12==2.20.5 +nvidia-nvjitlink-cu12==12.5.82 +nvidia-nvtx-cu12==12.1.105 +openai==1.35.13 +opentelemetry-api==1.20.0 +opentelemetry-instrumentation==0.41b0 +opentelemetry-instrumentation-aiohttp-client==0.41b0 +opentelemetry-instrumentation-asgi==0.41b0 +opentelemetry-sdk==1.20.0 +opentelemetry-semantic-conventions==0.41b0 +opentelemetry-util-http==0.41b0 +orjson==3.10.6 +outlines==0.0.34 +packaging==24.1 +pathspec==0.12.1 +pip-requirements-parser==32.0.1 +pip-tools==7.4.1 +prometheus-client==0.20.0 +prometheus-fastapi-instrumentator==7.0.0 +protobuf==5.27.2 +psutil==6.0.0 +py-cpuinfo==9.0.0 +pydantic==2.8.2 +pydantic-core==2.20.1 +pygments==2.18.0 +pyparsing==3.1.2 +pyproject-hooks==1.1.0 +python-dateutil==2.9.0.post0 +python-dotenv==1.0.1 +python-json-logger==2.0.7 +python-multipart==0.0.9 +pyyaml==6.0.1 +pyzmq==26.0.3 +ray==2.32.0 +referencing==0.35.1 +regex==2024.5.15 +requests==2.32.3 +rich==13.7.1 +rpds-py==0.19.0 +safetensors==0.4.3 +schema==0.7.7 +scipy==1.13.1 +sentencepiece==0.2.0 +shellingham==1.5.4 +simple-di==0.1.5 +six==1.16.0 +sniffio==1.3.1 +starlette==0.37.2 +sympy==1.13.0 +tiktoken==0.7.0 +tokenizers==0.19.1 +tomli==2.0.1 +tomli-w==1.0.0 +torch==2.3.0 +tornado==6.4.1 +tqdm==4.66.4 +transformers==4.41.0 +triton==2.3.0 +typer==0.12.3 +typing-extensions==4.12.2 +ujson==5.10.0 +urllib3==2.2.2 +uvicorn[standard]==0.30.1 +uvloop==0.19.0 +vllm==0.4.3 +vllm-flash-attn==2.5.8.post2 +watchfiles==0.22.0 +websockets==12.0 +wheel==0.43.0 +wrapt==1.16.0 +wsproto==1.2.0 +xformers==0.0.26.post1 +yarl==1.9.4 +zipp==3.19.2 + +# The following packages are considered to be unsafe in a requirements file: +pip==24.1.2 +setuptools==70.3.0 diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/env/python/requirements.txt b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/env/python/requirements.txt similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/env/python/requirements.txt rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/env/python/requirements.txt diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/env/python/version.txt b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/env/python/version.txt similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/env/python/version.txt rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/env/python/version.txt diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/bento_constants.py b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/bento_constants.py similarity index 86% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/bento_constants.py rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/bento_constants.py index dfff13a..1ed0f12 100644 --- a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/bento_constants.py +++ b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/bento_constants.py @@ -5,8 +5,8 @@ max_model_len: 2048 model: Qwen/Qwen2-7B-Instruct extra_labels: + model_name: Qwen/Qwen2-7B-Instruct openllm_alias: 7b,7b-instruct - openllm_hf_model_id: Qwen/Qwen2-7B-Instruct project: vllm-chat service_config: name: qwen2 diff --git a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/bentofile.yaml b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/bentofile.yaml similarity index 92% rename from bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/bentofile.yaml rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/bentofile.yaml index 8347bf5..1343d81 100644 --- a/bentoml/bentos/mistral/7b-instruct-fp16-fe78/src/bentofile.yaml +++ b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/bentofile.yaml @@ -28,9 +28,8 @@ include: - chat_templates/chat_templates/*.jinja - chat_templates/generation_configs/*.json labels: + model_name: Qwen/Qwen2-7B-Instruct openllm_alias: 7b,7b-instruct - openllm_hf_model_id: mistralai/Mistral-7B-Instruct-v0.1 - owner: bentoml-team platforms: linux source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat models: [] diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/chat_templates/alpaca.jinja b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/chat_templates/alpaca.jinja similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/chat_templates/alpaca.jinja rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/chat_templates/alpaca.jinja diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/chat_templates/amberchat.jinja b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/chat_templates/amberchat.jinja similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/chat_templates/amberchat.jinja rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/chat_templates/amberchat.jinja diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/chat_templates/chatml.jinja b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/chat_templates/chatml.jinja similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/chat_templates/chatml.jinja rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/chat_templates/chatml.jinja diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/chat_templates/chatqa.jinja b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/chat_templates/chatqa.jinja similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/chat_templates/chatqa.jinja rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/chat_templates/chatqa.jinja diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/chat_templates/falcon-instruct.jinja b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/chat_templates/falcon-instruct.jinja similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/chat_templates/falcon-instruct.jinja rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/chat_templates/falcon-instruct.jinja diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/chat_templates/gemma-it.jinja b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/chat_templates/gemma-it.jinja similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/chat_templates/gemma-it.jinja rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/chat_templates/gemma-it.jinja diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/chat_templates/llama-2-chat.jinja b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/chat_templates/llama-2-chat.jinja similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/chat_templates/llama-2-chat.jinja rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/chat_templates/llama-2-chat.jinja diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/chat_templates/llama-3-chat.jinja b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/chat_templates/llama-3-chat.jinja similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/chat_templates/llama-3-chat.jinja rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/chat_templates/llama-3-chat.jinja diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/chat_templates/mistral-instruct.jinja b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/chat_templates/mistral-instruct.jinja similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/chat_templates/mistral-instruct.jinja rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/chat_templates/mistral-instruct.jinja diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/chat_templates/openchat.jinja b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/chat_templates/openchat.jinja similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/chat_templates/openchat.jinja rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/chat_templates/openchat.jinja diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/chat_templates/phi-3.jinja b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/chat_templates/phi-3.jinja similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/chat_templates/phi-3.jinja rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/chat_templates/phi-3.jinja diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/chat_templates/saiga.jinja b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/chat_templates/saiga.jinja similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/chat_templates/saiga.jinja rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/chat_templates/saiga.jinja diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/chat_templates/solar-instruct.jinja b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/chat_templates/solar-instruct.jinja similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/chat_templates/solar-instruct.jinja rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/chat_templates/solar-instruct.jinja diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/chat_templates/vicuna.jinja b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/chat_templates/vicuna.jinja similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/chat_templates/vicuna.jinja rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/chat_templates/vicuna.jinja diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/chat_templates/zephyr.jinja b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/chat_templates/zephyr.jinja similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/chat_templates/zephyr.jinja rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/chat_templates/zephyr.jinja diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/generation_configs/alpaca.json b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/generation_configs/alpaca.json similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/generation_configs/alpaca.json rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/generation_configs/alpaca.json diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/generation_configs/amberchat.json b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/generation_configs/amberchat.json similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/generation_configs/amberchat.json rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/generation_configs/amberchat.json diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/generation_configs/chatqa.json b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/generation_configs/chatqa.json similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/generation_configs/chatqa.json rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/generation_configs/chatqa.json diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/generation_configs/gemma-it.json b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/generation_configs/gemma-it.json similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/generation_configs/gemma-it.json rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/generation_configs/gemma-it.json diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/generation_configs/llama-2-chat.json b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/generation_configs/llama-2-chat.json similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/generation_configs/llama-2-chat.json rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/generation_configs/llama-2-chat.json diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/generation_configs/llama-3-chat.json b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/generation_configs/llama-3-chat.json similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/generation_configs/llama-3-chat.json rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/generation_configs/llama-3-chat.json diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/generation_configs/mistral-instruct.json b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/generation_configs/mistral-instruct.json similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/generation_configs/mistral-instruct.json rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/generation_configs/mistral-instruct.json diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/generation_configs/openchat.json b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/generation_configs/openchat.json similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/generation_configs/openchat.json rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/generation_configs/openchat.json diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/generation_configs/orca-2.json b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/generation_configs/orca-2.json similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/generation_configs/orca-2.json rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/generation_configs/orca-2.json diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/generation_configs/phi-3.json b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/generation_configs/phi-3.json similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/generation_configs/phi-3.json rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/generation_configs/phi-3.json diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/generation_configs/qwen2-chat.json b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/generation_configs/qwen2-chat.json similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/generation_configs/qwen2-chat.json rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/generation_configs/qwen2-chat.json diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/generation_configs/saiga.json b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/generation_configs/saiga.json similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/generation_configs/saiga.json rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/generation_configs/saiga.json diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/generation_configs/solar-instruct.json b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/generation_configs/solar-instruct.json similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/generation_configs/solar-instruct.json rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/generation_configs/solar-instruct.json diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/generation_configs/vicuna.json b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/generation_configs/vicuna.json similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/generation_configs/vicuna.json rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/generation_configs/vicuna.json diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/generation_configs/yi-chat.json b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/generation_configs/yi-chat.json similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/generation_configs/yi-chat.json rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/generation_configs/yi-chat.json diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/generation_configs/zephyr.json b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/generation_configs/zephyr.json similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/chat_templates/generation_configs/zephyr.json rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/chat_templates/generation_configs/zephyr.json diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/service.py b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/service.py similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/service.py rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/service.py diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/404.html b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/404.html similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/404.html rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/404.html diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/0e5ce63c-f5957df8d97fa48f.js diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/370b0802-87e84e603248538e.js diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/3d47b92a-f8bda4b39f1e2d9d.js diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/479ba886-0c92f49cb8e74e58.js diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/59650de3-87b10f0662b51900.js diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/66ec4792-34336521b476aa45.js diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/674-a1fcdac3696c5ed0.js diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/69-bf2efb63b1299e3b.js diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/700-532b1fe2415e5859.js b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/700-532b1fe2415e5859.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/700-532b1fe2415e5859.js rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/700-532b1fe2415e5859.js diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/899-fa939dd99dc7a1df.js diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/8e1d74a4-a6b9a2554f9153c0.js diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/94730671-0f73873f7f5896de.js diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/995-34374f39bb210839.js b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/995-34374f39bb210839.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/995-34374f39bb210839.js rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/995-34374f39bb210839.js diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/app/(site)/page-5b6e14439f55739b.js diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/app/chat/page-9c8e223f40771eb6.js diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/app/layout-df2dea9dba0ceb06.js diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/app/not-found-c76dccfb8b88da53.js diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/d3ac728e-0c798b3b8aa3bf53.js diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/fd9d1056-32c33f3919735051.js diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/framework-00a8ba1a63cfdc9e.js diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/main-app-e95f89b5006af8a8.js diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/main-bf1416cb53f2b4c0.js diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/pages/_app-d21e88acd55d90f1.js diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/pages/_error-d6107f1aac0c574c.js diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/polyfills-c67a75d1b6f99dc8.js diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/chunks/webpack-ee8b17d5a5297ccd.js diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/css/429544bd3cd8ce3a.css b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/css/429544bd3cd8ce3a.css similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/css/429544bd3cd8ce3a.css rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/css/429544bd3cd8ce3a.css diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/css/5b67f082b31cfc7b.css b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/css/5b67f082b31cfc7b.css similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/css/5b67f082b31cfc7b.css rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/css/5b67f082b31cfc7b.css diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/css/9e63023b20ddb15e.css b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/css/9e63023b20ddb15e.css similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/_next/static/css/9e63023b20ddb15e.css rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/_next/static/css/9e63023b20ddb15e.css diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/apple-touch-icon.png b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/apple-touch-icon.png similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/apple-touch-icon.png rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/apple-touch-icon.png diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/chat.html b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/chat.html similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/chat.html rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/chat.html diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/chat.txt b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/chat.txt similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/chat.txt rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/chat.txt diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/favicon-16x16.png b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/favicon-16x16.png similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/favicon-16x16.png rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/favicon-16x16.png diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/favicon.ico b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/favicon.ico similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/favicon.ico rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/favicon.ico diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/index.html b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/index.html similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/index.html rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/index.html diff --git a/bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/index.txt b/bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/index.txt similarity index 100% rename from bentoml/bentos/qwen2/7b-instruct-fp16-805b/src/ui/index.txt rename to bentoml/bentos/qwen2/7b-instruct-fp16-844c/src/ui/index.txt