diff --git a/serving/docker/tensorrt-llm.Dockerfile b/serving/docker/tensorrt-llm.Dockerfile
index 2cdf49267..462d8aaa7 100644
--- a/serving/docker/tensorrt-llm.Dockerfile
+++ b/serving/docker/tensorrt-llm.Dockerfile
@@ -18,7 +18,7 @@ ARG djl_version=0.27.0
 ARG transformers_version=4.38.1
 ARG accelerate_version=0.27.0
 ARG tensorrtlibs_version=9.2.0.post12.dev5
-ARG trtllm_toolkit_version=nightly
+ARG trtllm_toolkit_version=0.8.0
 ARG trtllm_version=v0.8.0
 ARG cuda_python_version=12.2.0
 ARG peft_wheel="https://publish.djl.ai/peft/peft-0.5.0alpha-py3-none-any.whl"