From 19ef67a4c461880e7d3a214173be21962d2e98b6 Mon Sep 17 00:00:00 2001 From: Tom Stesco Date: Mon, 4 Nov 2024 20:18:19 +0000 Subject: [PATCH] adding updated commit shas --- evals/README.md | 9 +++++++-- vllm-tt-metal-llama3-70b/docs/development.md | 2 +- 2 files changed, 8 insertions(+), 3 deletions(-) diff --git a/evals/README.md b/evals/README.md index a428eff..b06e2ae 100644 --- a/evals/README.md +++ b/evals/README.md @@ -9,8 +9,13 @@ Source code: Docker images are published to: https://ghcr.io/tenstorrent/tt-inference-server/tt-metal-llama3-70b-src-base-vllm ```bash +# commit SHAs +export TT_METAL_COMMIT_SHA_OR_TAG=685ef1303b5abdfda63183fdd4fd6ed51b496833 +export TT_METAL_COMMIT_DOCKER_TAG=${TT_METAL_COMMIT_SHA_OR_TAG:0:12} +export TT_VLLM_COMMIT_SHA_OR_TAG=54b9157d852b0fa219613c00abbaa5a35f221049 +export TT_VLLM_COMMIT_DOCKER_TAG=${TT_VLLM_COMMIT_SHA_OR_TAG:0:12} # pull image -docker pull ghcr.io/tenstorrent/tt-inference-server/tt-metal-llama3-70b-src-base-vllm:v0.0.1-tt-metal-v0.53.0-rc16-ebdffa93d911 +docker pull ghcr.io/tenstorrent/tt-inference-server/tt-metal-llama3-70b-src-base-vllm:v0.0.1-tt-metal-${TT_METAL_COMMIT_DOCKER_TAG}-${TT_VLLM_COMMIT_DOCKER_TAG} ``` For instructions on building the Docker image see: [Development](../vllm-tt-metal-llama3-70b/docs/development.md) @@ -31,7 +36,7 @@ docker run \ --volume /dev/hugepages-1G:/dev/hugepages-1G:rw \ --volume ${PERSISTENT_VOLUME?ERROR env var PERSISTENT_VOLUME must be set}:/home/user/cache_root:rw \ --shm-size 32G \ - ghcr.io/tenstorrent/tt-inference-server/tt-metal-llama3-70b-src-base-vllm:v0.0.1-tt-metal-v0.53.0-rc16-ebdffa93d911 bash + ghcr.io/tenstorrent/tt-inference-server/tt-metal-llama3-70b-src-base-vllm:v0.0.1-tt-metal-${TT_METAL_COMMIT_DOCKER_TAG}-${TT_VLLM_COMMIT_DOCKER_TAG} bash ``` ## Step 3: Inside container setup and run vLLM diff --git a/vllm-tt-metal-llama3-70b/docs/development.md b/vllm-tt-metal-llama3-70b/docs/development.md index 082379f..379ebb5 100644 --- a/vllm-tt-metal-llama3-70b/docs/development.md +++ b/vllm-tt-metal-llama3-70b/docs/development.md @@ -43,7 +43,7 @@ docker run \ --volume /dev/hugepages-1G:/dev/hugepages-1G:rw \ --volume ${PERSISTENT_VOLUME?ERROR env var PERSISTENT_VOLUME must be set}:/home/user/cache_root:rw \ --shm-size 32G \ - ghcr.io/tenstorrent/tt-inference-server/tt-metal-llama3-70b-src-base-vllm:v0.0.1-tt-metal-v0.53.0-rc16-ebdffa93d911 bash + ghcr.io/tenstorrent/tt-inference-server/tt-metal-llama3-70b-src-base-vllm:v0.0.1-tt-metal-${TT_METAL_COMMIT_DOCKER_TAG}-${TT_VLLM_COMMIT_DOCKER_TAG} bash ``` additionally for development you can mount the volumes: