Sync from GitHub 1e79046
- Dockerfile +2 -1
- main.py +10 -2
Dockerfile
CHANGED
@@ -23,6 +23,7 @@ ARG BACKEND=cpu
 # - CUDA cu124 index publishes up to 2.6.0 (auto-resolves to +cu124)
 # - ROCm 6.2 index publishes up to 2.5.1+rocm6.2 (must include local tag)
 ARG TORCH_VER_CPU=2.9.0
+ARG TORCHVISION_VER_CPU=0.24.0
 ARG TORCH_VER_NVIDIA=2.6.0
 ARG TORCH_VER_AMD=2.5.1+rocm6.2

@@ -35,7 +36,7 @@ ENV PIP_NO_CACHE_DIR=1

 # Install appropriate PyTorch for the selected backend, then the rest
 RUN if [ "$BACKEND" = "cpu" ]; then \
-        pip install --no-cache-dir --index-url https://download.pytorch.org/whl/cpu torch==${TORCH_VER_CPU}; \
+        pip install --no-cache-dir --index-url https://download.pytorch.org/whl/cpu torch==${TORCH_VER_CPU} torchvision==${TORCHVISION_VER_CPU}; \
     elif [ "$BACKEND" = "nvidia" ]; then \
         pip install --no-cache-dir --index-url https://download.pytorch.org/whl/cu124 torch==${TORCH_VER_NVIDIA}; \
     elif [ "$BACKEND" = "amd" ]; then \
main.py
CHANGED
@@ -105,8 +105,16 @@ def prefetch_model_assets(repo_id: str, token: Optional[str]) -> Optional[str]:
     - If CLI is unavailable, falls back to verbose API prefetch.
     """
     try:
-        # Enable accelerated transfer
-        os.environ.setdefault("HF_HUB_ENABLE_HF_TRANSFER", "1")
+        # Enable accelerated transfer only if hf_transfer is installed; otherwise disable to avoid runtime errors on Spaces
+        try:
+            import importlib.util as _imputil
+            if _imputil.find_spec("hf_transfer") is not None:
+                os.environ.setdefault("HF_HUB_ENABLE_HF_TRANSFER", "1")
+            else:
+                os.environ["HF_HUB_ENABLE_HF_TRANSFER"] = "0"
+        except Exception:
+            os.environ["HF_HUB_ENABLE_HF_TRANSFER"] = "0"
+        # XET acceleration if available; harmless if missing
         os.environ.setdefault("HF_HUB_ENABLE_XET", "1")

         cache_dir = os.getenv("HF_HOME") or os.getenv("TRANSFORMERS_CACHE") or ""