oobabooga · WolframRavenwolf · Feb 9, 2024 · Feb 9, 2024 · Feb 9, 2024 · Feb 9, 2024
diff --git a/.gitignore b/.gitignore
@@ -47,4 +47,5 @@ wandb
 /docker-compose.yaml
 /docker-compose.yml
 /Dockerfile
+.dockerignore
 .env
diff --git a/docker/.env.example b/docker/.env.example
@@ -14,12 +14,14 @@ HOST_API_PORT=5000
 CONTAINER_API_PORT=5000
 # Comma separated extensions to build
 BUILD_EXTENSIONS=""
-# Set APP_RUNTIME_GID to an appropriate host system group to enable access to mounted volumes 
-# You can find your current host user group id with the command `id -g`
+# Set APP_RUNTIME_UID/APP_RUNTIME_GID to an appropriate host user/group to enable access to mounted volumes
+# You can find your current host user/group id with the command `id -u; id -g`
+APP_RUNTIME_UID=6972
 APP_RUNTIME_GID=6972
 # override default app build permissions (handy for deploying to cloud)
 #APP_GID=6972
 #APP_UID=6972
 # Set cache env
-TRANSFORMERS_CACHE=/home/app/text-generation-webui/cache/
-HF_HOME=/home/app/text-generation-webui/cache/
+TRANSFORMERS_CACHE=/home/app/text-generation-webui/cache
+HF_HOME=/home/app/text-generation-webui/cache
+PYTORCH_KERNEL_CACHE_PATH=/home/app/text-generation-webui/cache
diff --git a/docker/amd/Dockerfile → docker/Dockerfile b/docker/amd/Dockerfile → docker/Dockerfile
@@ -1,21 +1,22 @@
-# BUILDER
 FROM ubuntu:22.04
-WORKDIR /builder
+
+ARG GPU_CHOICE=${GPU_CHOICE:-A} # A: NVIDIA, B: AMD, C: APPLE, D: INTEL, N: NONE (CPU)
-ARG GPU_CHOICE=${GPU_CHOICE:-A} # A: NVIDIA, B: AMD, C: APPLE, D: INTEL, N: NONE (CPU)
+# A: NVIDIA, B: AMD, C: APPLE, D: INTEL, N: NONE (CPU)
+ARG GPU_CHOICE=A
-ARG GPU_CHOICE=${GPU_CHOICE:-A} # A: NVIDIA, B: AMD, C: APPLE, D: INTEL, N: NONE (CPU)
+# A: NVIDIA, B: AMD, C: APPLE, D: INTEL, N: NONE (CPU)
+ARG GPU_CHOICE=A
 ARG TORCH_CUDA_ARCH_LIST="${TORCH_CUDA_ARCH_LIST:-3.5;5.0;6.0;6.1;7.0;7.5;8.0;8.6+PTX}"
 ARG BUILD_EXTENSIONS="${BUILD_EXTENSIONS:-}"
 ARG APP_UID="${APP_UID:-6972}"
 ARG APP_GID="${APP_GID:-6972}"
 
+WORKDIR /builder
 RUN --mount=type=cache,target=/var/cache/apt,sharing=locked,rw \
     apt update && \
     apt install --no-install-recommends -y git vim build-essential python3-dev pip bash curl && \
     rm -rf /var/lib/apt/lists/*
 WORKDIR /home/app/
-RUN git clone https://github.com/oobabooga/text-generation-webui.git 
+RUN git clone https://github.com/oobabooga/text-generation-webui.git
-RUN git clone https://github.com/oobabooga/text-generation-webui.git
+WORKDIR /home/app/text-generation-webui
+RUN git clone https://github.com/oobabooga/text-generation-webui.git .
-RUN git clone https://github.com/oobabooga/text-generation-webui.git
+WORKDIR /home/app/text-generation-webui
+RUN git clone https://github.com/oobabooga/text-generation-webui.git .
 WORKDIR /home/app/text-generation-webui
-RUN GPU_CHOICE=B USE_CUDA118=FALSE LAUNCH_AFTER_INSTALL=FALSE INSTALL_EXTENSIONS=TRUE ./start_linux.sh --verbose
+RUN USE_CUDA118=FALSE LAUNCH_AFTER_INSTALL=FALSE INSTALL_EXTENSIONS=TRUE ./start_linux.sh --verbose
 COPY CMD_FLAGS.txt /home/app/text-generation-webui/
 EXPOSE ${CONTAINER_PORT:-7860} ${CONTAINER_API_PORT:-5000} ${CONTAINER_API_STREAM_PORT:-5005}
-WORKDIR /home/app/text-generation-webui
+ENV HOME=/home/app/text-generation-webui
 # set umask to ensure group read / write at runtime
-CMD umask 0002 && export HOME=/home/app/text-generation-webui && ./start_linux.sh
+CMD umask 0002 && ./start_linux.sh $CLI_ARGS
-CMD umask 0002 && ./start_linux.sh $CLI_ARGS
+ENTRYPOINT [ "/home/app/text-generation-webui/start_linux.sh" ]
-CMD umask 0002 && ./start_linux.sh $CLI_ARGS
+ENTRYPOINT [ "/home/app/text-generation-webui/start_linux.sh" ]
diff --git a/docker/amd/docker-compose.yml b/docker/amd/docker-compose.yml
@@ -4,42 +4,46 @@ services:
     build:
       context: .
       args:
-        # Requirements file to use: 
-        # | GPU | CPU | requirements file to use |
-        # |--------|---------|---------|
-        # | NVIDIA | has AVX2 | `requirements.txt` |
-        # | NVIDIA | no AVX2 | `requirements_noavx2.txt` |
-        # | AMD | has AVX2 | `requirements_amd.txt` |
-        # | AMD | no AVX2 | `requirements_amd_noavx2.txt` |
-        # | CPU only | has AVX2 | `requirements_cpu_only.txt` |
-        # | CPU only | no AVX2 | `requirements_cpu_only_noavx2.txt` |
-        # | Apple | Intel | `requirements_apple_intel.txt` |
-        # | Apple | Apple Silicon | `requirements_apple_silicon.txt` |
+        GPU_CHOICE: B # AMD
+
+        # Requirements file to use:
+        # | GPU      | CPU           | requirements file to use           |
+        # | -------- | ------------- | ---------------------------------- |
+        # | NVIDIA   | has AVX2      | `requirements.txt`                 |
+        # | NVIDIA   | no AVX2       | `requirements_noavx2.txt`          |
+        # | AMD      | has AVX2      | `requirements_amd.txt`             |
+        # | AMD      | no AVX2       | `requirements_amd_noavx2.txt`      |
+        # | CPU only | has AVX2      | `requirements_cpu_only.txt`        |
+        # | CPU only | no AVX2       | `requirements_cpu_only_noavx2.txt` |
+        # | Apple    | Intel         | `requirements_apple_intel.txt`     |
+        # | Apple    | Apple Silicon | `requirements_apple_silicon.txt`   |
         # Default: `requirements.txt`
         # BUILD_REQUIREMENTS: requirements.txt
-
-        # Extension requirements to build: 
-        # BUILD_EXTENSIONS: 
-
-        # specify which cuda version your card supports: https://developer.nvidia.com/cuda-gpus
-        TORCH_CUDA_ARCH_LIST: ${TORCH_CUDA_ARCH_LIST:-7.5} 
+
+        # Extension requirements to build:
         BUILD_EXTENSIONS: ${BUILD_EXTENSIONS:-}
-        APP_GID: ${APP_GID:-6972} 
-        APP_UID: ${APP_UID-6972} 
+
+        # specify which cuda version your card supports: https://developer.nvidia.com/cuda-gpus
+        TORCH_CUDA_ARCH_LIST: ${TORCH_CUDA_ARCH_LIST:-7.5}
+        APP_GID: ${APP_GID:-6972}
+        APP_UID: ${APP_UID:-6972}
+    container_name: text-generation-webui
     env_file: .env
+    hostname: text-generation-webui
     user: "${APP_RUNTIME_UID:-6972}:${APP_RUNTIME_GID:-6972}"
     ports:
       - "${HOST_PORT:-7860}:${CONTAINER_PORT:-7860}"
       - "${HOST_API_PORT:-5000}:${CONTAINER_API_PORT:-5000}"
+    restart: unless-stopped
     stdin_open: true
     group_add:
       - video
     tty: true
     ipc: host
     devices:
       - /dev/kfd
-      - /dev/dri 
-    cap_add: 
+      - /dev/dri
+    cap_add:
       - SYS_PTRACE
     security_opt:
       - seccomp=unconfined

diff --git a/docker/cpu/Dockerfile b/docker/cpu/Dockerfile
diff --git a/docker/cpu/docker-compose.yml b/docker/cpu/docker-compose.yml
@@ -4,33 +4,37 @@ services:
     build:
       context: .
       args:
-        # Requirements file to use: 
-        # | GPU | CPU | requirements file to use |
-        # |--------|---------|---------|
-        # | NVIDIA | has AVX2 | `requirements.txt` |
-        # | NVIDIA | no AVX2 | `requirements_noavx2.txt` |
-        # | AMD | has AVX2 | `requirements_amd.txt` |
-        # | AMD | no AVX2 | `requirements_amd_noavx2.txt` |
-        # | CPU only | has AVX2 | `requirements_cpu_only.txt` |
-        # | CPU only | no AVX2 | `requirements_cpu_only_noavx2.txt` |
-        # | Apple | Intel | `requirements_apple_intel.txt` |
-        # | Apple | Apple Silicon | `requirements_apple_silicon.txt` |
+        GPU_CHOICE: N # NONE (CPU)
+
+        # Requirements file to use:
+        # | GPU      | CPU           | requirements file to use           |
+        # | -------- | ------------- | ---------------------------------- |
+        # | NVIDIA   | has AVX2      | `requirements.txt`                 |
+        # | NVIDIA   | no AVX2       | `requirements_noavx2.txt`          |
+        # | AMD      | has AVX2      | `requirements_amd.txt`             |
+        # | AMD      | no AVX2       | `requirements_amd_noavx2.txt`      |
+        # | CPU only | has AVX2      | `requirements_cpu_only.txt`        |
+        # | CPU only | no AVX2       | `requirements_cpu_only_noavx2.txt` |
+        # | Apple    | Intel         | `requirements_apple_intel.txt`     |
+        # | Apple    | Apple Silicon | `requirements_apple_silicon.txt`   |
         # Default: `requirements.txt`
         # BUILD_REQUIREMENTS: requirements.txt
-
-        # Extension requirements to build: 
-        # BUILD_EXTENSIONS: 
-
-        # specify which cuda version your card supports: https://developer.nvidia.com/cuda-gpus
-        TORCH_CUDA_ARCH_LIST: ${TORCH_CUDA_ARCH_LIST:-7.5} 
+
+        # Extension requirements to build:
         BUILD_EXTENSIONS: ${BUILD_EXTENSIONS:-}
-        APP_GID: ${APP_GID:-6972} 
-        APP_UID: ${APP_UID-6972} 
+
+        # specify which cuda version your card supports: https://developer.nvidia.com/cuda-gpus
+        TORCH_CUDA_ARCH_LIST: ${TORCH_CUDA_ARCH_LIST:-7.5}
+        APP_GID: ${APP_GID:-6972}
+        APP_UID: ${APP_UID:-6972}
+    container_name: text-generation-webui
     env_file: .env
+    hostname: text-generation-webui
     user: "${APP_RUNTIME_UID:-6972}:${APP_RUNTIME_GID:-6972}"
     ports:
       - "${HOST_PORT:-7860}:${CONTAINER_PORT:-7860}"
       - "${HOST_API_PORT:-5000}:${CONTAINER_API_PORT:-5000}"
+    restart: unless-stopped
     stdin_open: true
     tty: true
     volumes:

diff --git a/docker/intel/Dockerfile b/docker/intel/Dockerfile
diff --git a/docker/intel/docker-compose.yml b/docker/intel/docker-compose.yml
@@ -4,49 +4,55 @@ services:
     build:
       context: .
       args:
-        # Requirements file to use: 
-        # | GPU | CPU | requirements file to use |
-        # |--------|---------|---------|
-        # | NVIDIA | has AVX2 | `requirements.txt` |
-        # | NVIDIA | no AVX2 | `requirements_noavx2.txt` |
-        # | AMD | has AVX2 | `requirements_amd.txt` |
-        # | AMD | no AVX2 | `requirements_amd_noavx2.txt` |
-        # | CPU only | has AVX2 | `requirements_cpu_only.txt` |
-        # | CPU only | no AVX2 | `requirements_cpu_only_noavx2.txt` |
-        # | Apple | Intel | `requirements_apple_intel.txt` |
-        # | Apple | Apple Silicon | `requirements_apple_silicon.txt` |
+        GPU_CHOICE: D # INTEL
+
+        # Requirements file to use:
+        # | GPU      | CPU           | requirements file to use           |
+        # | -------- | ------------- | ---------------------------------- |
+        # | NVIDIA   | has AVX2      | `requirements.txt`                 |
+        # | NVIDIA   | no AVX2       | `requirements_noavx2.txt`          |
+        # | AMD      | has AVX2      | `requirements_amd.txt`             |
+        # | AMD      | no AVX2       | `requirements_amd_noavx2.txt`      |
+        # | CPU only | has AVX2      | `requirements_cpu_only.txt`        |
+        # | CPU only | no AVX2       | `requirements_cpu_only_noavx2.txt` |
+        # | Apple    | Intel         | `requirements_apple_intel.txt`     |
+        # | Apple    | Apple Silicon | `requirements_apple_silicon.txt`   |
         # Default: `requirements.txt`
         # BUILD_REQUIREMENTS: requirements.txt
-
-        # Extension requirements to build: 
-        # BUILD_EXTENSIONS: 
-
-        # specify which cuda version your card supports: https://developer.nvidia.com/cuda-gpus
-        TORCH_CUDA_ARCH_LIST: ${TORCH_CUDA_ARCH_LIST:-7.5} 
+
+        # Extension requirements to build:
         BUILD_EXTENSIONS: ${BUILD_EXTENSIONS:-}
-        APP_GID: ${APP_GID:-6972} 
-        APP_UID: ${APP_UID-6972} 
+
+        # specify which cuda version your card supports: https://developer.nvidia.com/cuda-gpus
+        TORCH_CUDA_ARCH_LIST: ${TORCH_CUDA_ARCH_LIST:-7.5}
+        APP_GID: ${APP_GID:-6972}
+        APP_UID: ${APP_UID:-6972}
+    container_name: text-generation-webui
     env_file: .env
+    hostname: text-generation-webui
     user: "${APP_RUNTIME_UID:-6972}:${APP_RUNTIME_GID:-6972}"
     ports:
       - "${HOST_PORT:-7860}:${CONTAINER_PORT:-7860}"
       - "${HOST_API_PORT:-5000}:${CONTAINER_API_PORT:-5000}"
+    restart: unless-stopped
     stdin_open: true
     group_add:
       - video
     tty: true
     ipc: host
     devices:
       - /dev/kfd
-      - /dev/dri 
-    cap_add: 
+      - /dev/dri
+    cap_add:
       - SYS_PTRACE
     security_opt:
       - seccomp=unconfined
     volumes:
+      - ./cache:/home/app/text-generation-webui/cache
       - ./characters:/home/app/text-generation-webui/characters
       - ./extensions:/home/app/text-generation-webui/extensions
       - ./loras:/home/app/text-generation-webui/loras
+      - ./logs:/home/app/text-generation-webui/logs
       - ./models:/home/app/text-generation-webui/models
       - ./presets:/home/app/text-generation-webui/presets
       - ./prompts:/home/app/text-generation-webui/prompts

diff --git a/docker/nvidia/Dockerfile b/docker/nvidia/Dockerfile
diff --git a/docker/nvidia/docker-compose.yml b/docker/nvidia/docker-compose.yml
@@ -4,33 +4,37 @@ services:
     build:
       context: .
       args:
-        # Requirements file to use: 
-        # | GPU | CPU | requirements file to use |
-        # |--------|---------|---------|
-        # | NVIDIA | has AVX2 | `requirements.txt` |
-        # | NVIDIA | no AVX2 | `requirements_noavx2.txt` |
-        # | AMD | has AVX2 | `requirements_amd.txt` |
-        # | AMD | no AVX2 | `requirements_amd_noavx2.txt` |
-        # | CPU only | has AVX2 | `requirements_cpu_only.txt` |
-        # | CPU only | no AVX2 | `requirements_cpu_only_noavx2.txt` |
-        # | Apple | Intel | `requirements_apple_intel.txt` |
-        # | Apple | Apple Silicon | `requirements_apple_silicon.txt` |
+        # GPU_CHOICE: A # NVIDIA (default)
+
+        # Requirements file to use:
+        # | GPU      | CPU           | requirements file to use           |
+        # | -------- | ------------- | ---------------------------------- |
+        # | NVIDIA   | has AVX2      | `requirements.txt`                 |
+        # | NVIDIA   | no AVX2       | `requirements_noavx2.txt`          |
+        # | AMD      | has AVX2      | `requirements_amd.txt`             |
+        # | AMD      | no AVX2       | `requirements_amd_noavx2.txt`      |
+        # | CPU only | has AVX2      | `requirements_cpu_only.txt`        |
+        # | CPU only | no AVX2       | `requirements_cpu_only_noavx2.txt` |
+        # | Apple    | Intel         | `requirements_apple_intel.txt`     |
+        # | Apple    | Apple Silicon | `requirements_apple_silicon.txt`   |
         # Default: `requirements.txt`
         # BUILD_REQUIREMENTS: requirements.txt
-
-        # Extension requirements to build: 
-        # BUILD_EXTENSIONS: 
-
-        # specify which cuda version your card supports: https://developer.nvidia.com/cuda-gpus
-        TORCH_CUDA_ARCH_LIST: ${TORCH_CUDA_ARCH_LIST:-7.5} 
+
+        # Extension requirements to build:
         BUILD_EXTENSIONS: ${BUILD_EXTENSIONS:-}
-        APP_GID: ${APP_GID:-6972} 
-        APP_UID: ${APP_UID-6972} 
+
+        # specify which cuda version your card supports: https://developer.nvidia.com/cuda-gpus
+        TORCH_CUDA_ARCH_LIST: ${TORCH_CUDA_ARCH_LIST:-7.5}
+        APP_GID: ${APP_GID:-6972}
+        APP_UID: ${APP_UID:-6972}
+    container_name: text-generation-webui
     env_file: .env
+    hostname: text-generation-webui
     user: "${APP_RUNTIME_UID:-6972}:${APP_RUNTIME_GID:-6972}"
     ports:
       - "${HOST_PORT:-7860}:${CONTAINER_PORT:-7860}"
       - "${HOST_API_PORT:-5000}:${CONTAINER_API_PORT:-5000}"
+    restart: unless-stopped
     stdin_open: true
     tty: true
     volumes:

diff --git a/docs/09 - Docker.md b/docs/09 - Docker.md
@@ -19,9 +19,13 @@ Use these commands to launch the image:
 
 ```
 cd text-generation-webui
-ln -s docker/{nvidia/Dockerfile,docker-compose.yml,.dockerignore} .
+ln -s docker/{nvidia/docker-compose.yml,.dockerignore,Dockerfile} .
 cp docker/.env.example .env
 # Edit .env and set TORCH_CUDA_ARCH_LIST based on your GPU model
+
+# Ensure all mounted dirs exist or they'll be created by Docker as root
+mkdir -p cache cloudflared logs softprompts
+
 docker compose up --build
 ```