Spaces:
Paused
Paused
# GPU-ready base image: PyTorch 2.2.2 with CUDA 11.8 and cuDNN 8 (runtime variant).
FROM pytorch/pytorch:2.2.2-cuda11.8-cudnn8-runtime

# System tools (keep this list short). --no-install-recommends stops apt from
# pulling in optional packages; git and ca-certificates are listed explicitly
# so they do not silently disappear together with the recommended packages.
RUN apt-get update && \
    apt-get install -y --no-install-recommends \
        build-essential \
        ca-certificates \
        git \
        git-lfs && \
    rm -rf /var/lib/apt/lists/*

# Non-root user with UID 1000, the setup Hugging Face Spaces recommends.
# /app is created and handed to that user while still root, so the working
# directory (and the cache placed inside it below) is writable regardless of
# how the builder assigns ownership to directories created by WORKDIR.
RUN useradd -m -u 1000 user && \
    mkdir -p /app && \
    chown user /app
USER user
WORKDIR /app

# Put scripts from user-level pip installs on PATH and keep the Hugging Face
# cache inside the writable app directory.
# Dockerfile comments must sit on their own line: a trailing "# ..." after an
# instruction is parsed as part of that instruction's arguments.
ENV PATH="/home/user/.local/bin:$PATH" \
    HF_HOME=/app/.cache

# Python dependencies. Only requirements.txt is copied at this point so this
# layer stays cached until the requirements themselves change.
COPY --chown=user requirements.txt .
RUN pip install --no-cache-dir --upgrade pip && \
    pip install --no-cache-dir -r requirements.txt

# Optional: flash-attn. --no-build-isolation lets its build see the packages
# that are already installed instead of a fresh, isolated build environment.
# NOTE(review): the original author states that Ampere (compute capability
# 8.6) is detected and a prebuilt wheel is available - confirm for this exact
# torch/CUDA/Python combination.
RUN pip install --no-cache-dir flash-attn==2.5.2 --no-build-isolation

# To make the secret HF token available during the build:
# Settings → Secrets → Name: HF_TOKEN (scope: "read")
# NOTE(review): before enabling the lines below, confirm two things:
#   - writing the token to ~/.netrc stores it in an image layer;
#   - this RUN executes as "user", so the secret mount probably needs
#     uid=1000 (or a readable mode) for `cat` to succeed.
#ARG HF_TOKEN
#RUN --mount=type=secret,id=HF_TOKEN \
#    echo "machine huggingface.co login __token__ password $(cat /run/secrets/HF_TOKEN)" > ~/.netrc

# Application code
COPY --chown=user . /app

# Documentation only: the port uvicorn binds to in CMD below.
EXPOSE 7860
CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]