Update trtllm_deepseek.py (#1349)
* Update trtllm_deepseek.py
* bring back revision, comma
* ruff

---------

Co-authored-by: Charles Frye <cfrye59@gmail.com>
Co-authored-by: Charles Frye <charles@modal.com>
This commit is contained in:
@@ -91,8 +91,8 @@ hf_cache_vol = modal.Volume.from_name(f"{app_name}-hf-cache", create_if_missing=
|
||||
HF_CACHE_PATH = Path("/hf_cache")
|
||||
volumes = {HF_CACHE_PATH: hf_cache_vol}
|
||||
|
||||
MODEL_NAME = "nvidia/DeepSeek-R1-0528-FP4"
|
||||
MODEL_REVISION = "91cfc7c35acd8ecfc769205989310208b8b81c9c" # in case repo updates!
|
||||
MODEL_NAME = "nvidia/DeepSeek-R1-0528-FP4-v2"
|
||||
MODEL_REVISION = "d12ff8db9876124d533b26bc24523c27907ce386" # in case repo updates!
|
||||
MODELS_PATH = HF_CACHE_PATH / "models"
|
||||
MODEL_PATH = MODELS_PATH / MODEL_NAME
|
||||
|
||||
@@ -118,9 +118,7 @@ def download_model():
|
||||
|
||||
MINUTES = 60 # seconds
|
||||
tensorrt_image = (
|
||||
tensorrt_image.run_commands(
|
||||
"uv pip install --system --compile-bytecode hf-transfer==0.1.9 huggingface_hub==0.33.0"
|
||||
)
|
||||
tensorrt_image.uv_pip_install("hf-transfer==0.1.9", "huggingface_hub==0.33.0")
|
||||
.env(
|
||||
{
|
||||
"HF_HUB_ENABLE_HF_TRANSFER": "1",
|
||||
|
||||
Reference in New Issue
Block a user