From cd75f2bee3e5473bf8bf07ab78bb8c070b48332e Mon Sep 17 00:00:00 2001 From: ShivamB25 <104637569+ShivamB25@users.noreply.github.com> Date: Sun, 31 Aug 2025 09:08:02 +0530 Subject: [PATCH] Update trtllm_deepseek.py (#1349) * Update trtllm_deepseek.py * bring back revision, comma * ruff --------- Co-authored-by: Charles Frye Co-authored-by: Charles Frye --- misc/trtllm_deepseek.py | 8 +++----- 1 file changed, 3 insertions(+), 5 deletions(-) diff --git a/misc/trtllm_deepseek.py b/misc/trtllm_deepseek.py index 86080b8c..51046f32 100644 --- a/misc/trtllm_deepseek.py +++ b/misc/trtllm_deepseek.py @@ -91,8 +91,8 @@ hf_cache_vol = modal.Volume.from_name(f"{app_name}-hf-cache", create_if_missing= HF_CACHE_PATH = Path("/hf_cache") volumes = {HF_CACHE_PATH: hf_cache_vol} -MODEL_NAME = "nvidia/DeepSeek-R1-0528-FP4" -MODEL_REVISION = "91cfc7c35acd8ecfc769205989310208b8b81c9c" # in case repo updates! +MODEL_NAME = "nvidia/DeepSeek-R1-0528-FP4-v2" +MODEL_REVISION = "d12ff8db9876124d533b26bc24523c27907ce386" # in case repo updates! MODELS_PATH = HF_CACHE_PATH / "models" MODEL_PATH = MODELS_PATH / MODEL_NAME @@ -118,9 +118,7 @@ def download_model(): MINUTES = 60 # seconds tensorrt_image = ( - tensorrt_image.run_commands( - "uv pip install --system --compile-bytecode hf-transfer==0.1.9 huggingface_hub==0.33.0" - ) + tensorrt_image.uv_pip_install("hf-transfer==0.1.9", "huggingface_hub==0.33.0") .env( { "HF_HUB_ENABLE_HF_TRANSFER": "1",