diff --git a/tutorials/08-benchmark-multi-round-qa-multi-gpu.md b/tutorials/08-benchmark-multi-round-qa-multi-gpu.md index 463c85a..2cd89ce 100644 --- a/tutorials/08-benchmark-multi-round-qa-multi-gpu.md +++ b/tutorials/08-benchmark-multi-round-qa-multi-gpu.md @@ -104,7 +104,7 @@ servingEngineSpec: runtimeClassName: "" modelSpec: - name: "llama3" - repository: "lmcache/vllm-openai" + repository: "vllm/vllm-openai" tag: "latest" modelURL: "meta-llama/Llama-3.1-8B-Instruct" replicaCount: 1