no server kill

d527efc6 · nanahira · 72e49d5f · d527efc6 · d527efc6 · d527efc6
Commit d527efc6 authored Oct 15, 2022 by nanahira
Hide whitespace changes
Inline Side-by-side

Showing 4 changed files with 14 additions and 5 deletions

.dockerignore +1 -0

Dockerfile +1 -1

docker-compose.yml +8 -0

main.py +4 -4

No files found.
--- a/.dockerignore
+++ b/.dockerignore
@@ -6,3 +6,4 @@ Dockerfile
 /*.sh
 /models
 /static
+/docker-compose.yml
--- a/Dockerfile
+++ b/Dockerfile
@@ -6,7 +6,7 @@ RUN apt update && apt -y install python3-pip python-is-python3 && \

 WORKDIR /app
 COPY ./requirements.txt ./
-RUN pip install -r requirements.txt
+RUN pip install --no-cache -r requirements.txt

 COPY . ./


--- /dev/null
+++ b/docker-compose.yml
@@ -0,0 +1,8 @@
+version: '2.4'
+services:
+  naifu:
+    build: '.'
+    network_mode: host
+    runtime: nvidia
+    volumes:
+      - ./models:/app/models
--- a/main.py
+++ b/main.py
@@ -216,7 +216,7 @@ def generate(request: GenerationRequest, authorized: bool = Depends(verify_token
        if "CUDA out of memory" in e_s or \
                "an illegal memory access" in e_s or "CUDA" in e_s:
            logger.error("GPU error, committing seppuku.")
-            os.kill(mainpid, signal.SIGTERM)
+            # os.kill(mainpid, signal.SIGTERM)
        return {"error": str(e)}

 @app.post('/generate', response_model=Union[GenerationOutput, ErrorOutput])
@@ -267,7 +267,7 @@ def generate(request: GenerationRequest, authorized: bool = Depends(verify_token
        if "CUDA out of memory" in e_s or \
                "an illegal memory access" in e_s or "CUDA" in e_s:
            logger.error("GPU error, committing seppuku.")
-            os.kill(mainpid, signal.SIGTERM)
+            # os.kill(mainpid, signal.SIGTERM)
        return {"error": str(e)}

 @app.post('/generate-text', response_model=Union[TextOutput, ErrorOutput])
@@ -294,7 +294,7 @@ def generate_text(request: TextRequest, authorized: bool = Depends(verify_token)
        if "CUDA out of memory" in e_s or \
                "an illegal memory access" in e_s or "CUDA" in e_s:
            logger.error("GPU error, committing seppuku.")
-            os.kill(mainpid, signal.SIGTERM)
+            # os.kill(mainpid, signal.SIGTERM)
        return ErrorOutput(error=str(e))

 @app.get('/predict-tags', response_model=Union[TagOutput, ErrorOutput])
@@ -321,7 +321,7 @@ async def predict_tags(prompt="", authorized: bool = Depends(verify_token)):
        if "CUDA out of memory" in e_s or \
                "an illegal memory access" in e_s or "CUDA" in e_s:
            logger.error("GPU error, committing seppuku.")
-            os.kill(mainpid, signal.SIGTERM)
+            # os.kill(mainpid, signal.SIGTERM)
        return ErrorOutput(error=str(e))

 #@app.get('/')