Spaces:

dmartincy
/

document-translation

Sleeping

App Files Files Community

dmartincy committed on Jan 19

Commit

da9dd3b

1 Parent(s): 5341e74

Add DocAuthoring and Nginx

Browse files

Files changed (3) hide show

Dockerfile +21 -1
nginx.conf +1 -1
start-services.sh +18 -3

Dockerfile CHANGED Viewed

@@ -14,14 +14,26 @@ RUN apt-get update && apt-get install -y \
     unzip \
     clang \
     cuda-toolkit \
     && rm -rf /var/lib/apt/lists/*
 # Create directories and set permissions
 RUN mkdir -p /tmp/llamafile && \
     mkdir -p $HOME/models && \
     mkdir -p $HOME/app && \
     mkdir -p $HOME/.llamafile && \
-    chown -R user:user $HOME
 # Install llamafiler
 RUN cd /tmp/llamafile && \
@@ -31,6 +43,9 @@ RUN cd /tmp/llamafile && \
     chmod +x /usr/local/bin/llamafiler && \
     rm -rf /tmp/llamafile
 # Switch to non-root user
 USER user
 WORKDIR $HOME/app
@@ -39,6 +54,11 @@ WORKDIR $HOME/app
 RUN wget -q https://huggingface.co/bartowski/gemma-2-2b-it-GGUF/resolve/main/gemma-2-2b-it-Q8_0.gguf -O $HOME/models/gemma-2b.gguf && \
     wget -q https://huggingface.co/leliuga/all-MiniLM-L6-v2-GGUF/resolve/main/all-MiniLM-L6-v2.F16.gguf -O $HOME/models/embeddings.gguf
 # Copy start script
 COPY --chown=user:user start-services.sh $HOME/app/
 RUN chmod +x $HOME/app/start-services.sh

     unzip \
     clang \
     cuda-toolkit \
+    nginx \
     && rm -rf /var/lib/apt/lists/*
 # Create directories and set permissions
 RUN mkdir -p /tmp/llamafile && \
     mkdir -p $HOME/models && \
     mkdir -p $HOME/app && \
+    mkdir -p $HOME/app/docauth && \
     mkdir -p $HOME/.llamafile && \
+    mkdir -p /var/cache/nginx && \
+    mkdir -p /var/log/nginx && \
+    mkdir -p /var/lib/nginx && \
+    mkdir -p /run/nginx && \
+    touch /var/run/nginx.pid && \
+    chown -R user:user $HOME && \
+    chown -R user:user /var/cache/nginx && \
+    chown -R user:user /var/log/nginx && \
+    chown -R user:user /var/lib/nginx && \
+    chown -R user:user /var/run/nginx.pid && \
+    chown -R user:user /run/nginx
 # Install llamafiler
 RUN cd /tmp/llamafile && \
     chmod +x /usr/local/bin/llamafiler && \
     rm -rf /tmp/llamafile
+# Copy nginx configuration
+COPY nginx.conf /etc/nginx/nginx.conf
 # Switch to non-root user
 USER user
 WORKDIR $HOME/app
 RUN wget -q https://huggingface.co/bartowski/gemma-2-2b-it-GGUF/resolve/main/gemma-2-2b-it-Q8_0.gguf -O $HOME/models/gemma-2b.gguf && \
     wget -q https://huggingface.co/leliuga/all-MiniLM-L6-v2-GGUF/resolve/main/all-MiniLM-L6-v2.F16.gguf -O $HOME/models/embeddings.gguf
+# Copy web files
+COPY --chown=user:user index.html $HOME/app/docauth/
+COPY --chown=user:user document-authoring.js $HOME/app/docauth/
+COPY --chown=user:user Sample.docx $HOME/app/docauth/
 # Copy start script
 COPY --chown=user:user start-services.sh $HOME/app/
 RUN chmod +x $HOME/app/start-services.sh

nginx.conf CHANGED Viewed

@@ -8,7 +8,7 @@ http {
         listen 7861;
         location / {
-            root /docauth;
         }
         location /healthcheck {

         listen 7861;
         location / {
+            root /home/user/app/docauth;
         }
         location /healthcheck {

start-services.sh CHANGED Viewed

@@ -10,9 +10,24 @@ nvidia-smi --query-gpu=compute_cap --format=csv,noheader || echo "Warning: Could
 # Create temporary directory for llamafiler
 mkdir -p /tmp/llamafiler
-# Start the model in server mode
 echo "Starting chat model..."
-TMPDIR=/tmp/llamafiler /usr/local/bin/llamafiler --model $HOME/models/gemma-2b.gguf -ngl 2 --listen 0.0.0.0:7860 --verbose &
 GEMMA_PID=$!
 # Wait for the model to be ready with a timeout
@@ -21,7 +36,7 @@ TIMEOUT=600  # 10 minutes timeout
 START_TIME=$SECONDS
 wait_for_services() {
-    curl -s --fail -X POST http://127.0.0.1:7860/v1/chat/completions \
         -H "Content-Type: application/json" \
         -d '{"model": "gemma-2b", "messages":[{"role":"user","content":"hi"}]}' >/dev/null 2>&1
 }

 # Create temporary directory for llamafiler
 mkdir -p /tmp/llamafiler
+# Start nginx
+echo "Starting nginx..."
+/usr/sbin/nginx -c /etc/nginx/nginx.conf
+if [ $? -ne 0 ]; then
+    echo "Failed to start nginx"
+    exit 1
+fi
+# Verify nginx is running
+if ! ps aux | grep nginx | grep -v grep > /dev/null; then
+    echo "Nginx failed to start"
+    exit 1
+fi
+echo "Nginx started successfully"
+# Start the model in server mode (now on port 8081)
 echo "Starting chat model..."
+TMPDIR=/tmp/llamafiler /usr/local/bin/llamafiler --model $HOME/models/gemma-2b.gguf -ngl 2 --listen 0.0.0.0:8081 --verbose &
 GEMMA_PID=$!
 # Wait for the model to be ready with a timeout
 START_TIME=$SECONDS
 wait_for_services() {
+    curl -s --fail -X POST http://127.0.0.1:8081/v1/chat/completions \
         -H "Content-Type: application/json" \
         -d '{"model": "gemma-2b", "messages":[{"role":"user","content":"hi"}]}' >/dev/null 2>&1
 }