Update Dockerfile
Browse files- Dockerfile +19 -5
Dockerfile
CHANGED
|
@@ -25,10 +25,24 @@ COPY --chown=user . /app
|
|
| 25 |
RUN pip install --no-cache-dir \
|
| 26 |
torch==2.3.1+cu121 torchaudio==2.3.1 \
|
| 27 |
--index-url https://download.pytorch.org/whl/cu121
|
| 28 |
-
|
| 29 |
-
RUN pip install text-generation==0.6.1
|
| 30 |
-
ENV ORPHEUS_API_URL=http://127.0.0.1:1234/v1/completions
|
| 31 |
EXPOSE 7860
|
| 32 |
-
|
| 33 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 34 |
|
|
|
|
| 25 |
RUN pip install --no-cache-dir \
|
| 26 |
torch==2.3.1+cu121 torchaudio==2.3.1 \
|
| 27 |
--index-url https://download.pytorch.org/whl/cu121
|
| 28 |
+
|
|
|
|
|
|
|
| 29 |
EXPOSE 7860
|
| 30 |
+
|
| 31 |
+
# Install the pinned `text-generation` package without keeping pip's download cache.
# NOTE(review): the `text-generation` PyPI package appears to be the Python client only;
# confirm that the `text-generation-launcher` binary started by CMD is installed elsewhere.
RUN pip install --no-cache-dir text-generation==0.6.1
|
| 32 |
+
|
| 33 |
+
ENV HF_HOME=/app/.cache
|
| 34 |
+
ENV MODEL_ID="SebastianBodza/Kartoffel_Orpheus-3B_german_natural-v0.1"
|
| 35 |
+
ENV ORPHEUS_API_URL=http://127.0.0.1:1234/v1/completions
|
| 36 |
+
# Model name that ends up in the JSON payload built by OrpheusEngine (per the original note).
# The comment sits on its own line because Dockerfile comments are only recognized at the
# start of a line; a trailing `# ...` would be parsed as extra ENV arguments and fail the build.
ENV ORPHEUS_MODEL=$MODEL_ID
|
| 37 |
+
|
| 38 |
+
# Start the text-generation backend on port 1234 in the background, then run the
# web app on port 7860 in the foreground.
# Exec (JSON) form avoids the extra `/bin/sh -c` wrapper that shell-form CMD adds, and
# `exec` lets uvicorn replace bash so it receives SIGTERM from `docker stop` directly.
# $MODEL_ID is expanded by bash at container start from the image's ENV.
# NOTE(review): --quantization, --enable-chunked-prefill and --gpu-memory-utilization
# look like vLLM options rather than text-generation-launcher options; confirm
# against the launcher's `--help` before relying on them.
CMD ["bash", "-c", "\
    text-generation-launcher \
      --model-id \"$MODEL_ID\" \
      --port 1234 \
      --max-input-length 4096 \
      --dtype auto \
      --quantization fp8 \
      --enable-chunked-prefill \
      --gpu-memory-utilization 0.7 & \
    exec uvicorn app:app --host 0.0.0.0 --port 7860"]
|
| 48 |
|