Update Dockerfile
Browse files- Dockerfile +7 -8
Dockerfile
CHANGED
|
@@ -50,12 +50,11 @@ ENV ORPHEUS_API_URL=http://127.0.0.1:1234/v1/completions
|
|
| 50 |
|
| 51 |
# ───── Entrypoint ────────────────────────────────────────
|
| 52 |
CMD bash -c "\
|
| 53 |
-
|
| 54 |
-
|
| 55 |
-
|
| 56 |
-
|
| 57 |
-
|
| 58 |
-
|
| 59 |
-
|
| 60 |
-
|
| 61 |
|
|
|
|
| 50 |
|
| 51 |
# ───── Entrypoint ────────────────────────────────────────
|
| 52 |
# Container start command: runs two processes from a single bash invocation.
#   1. The vLLM OpenAI-compatible API server is started in the background
#      (trailing `&`) on port 1234, the port that ORPHEUS_API_URL targets.
#   2. `exec` then replaces the shell with uvicorn serving app:app on
#      0.0.0.0:7860, making uvicorn the container's foreground process.
# Every line inside the quoted string must end with a backslash and must not
# carry an inline `#` comment: a missing backslash ends the CMD instruction
# early, and a `#` inside the string comments out the rest of the command.
CMD bash -c "\
    python -m vllm.entrypoints.openai.api_server \
        --model ${MODEL_ID} \
        --port 1234 \
        --dtype bfloat16 \
        --gpu-memory-utilization 0.9 \
        --max-model-len 8192 & \
    exec uvicorn app:app --host 0.0.0.0 --port 7860"
|
|
|
|
| 60 |
|