From 7eec56c6a7badfb3678e10cb9823f481795b57f9 Mon Sep 17 00:00:00 2001
From: Fabian Wolf
Date: Mon, 26 Aug 2024 15:05:45 +0200
Subject: [PATCH] Fix docker setup

---
Notes (not part of the commit message):

  What this patch changes:
    * Dockerfile: the llama.cpp build step is invoked with
      CUDA_DOCKER_ARCH=compute_86 instead of compute_89.
      NOTE(review): presumably this retargets the CUDA build to GPUs with
      compute capability 8.6 rather than 8.9 -- confirm against the
      hardware this image is meant to run on.
    * docker-compose.yml: the N_GPU_LAYERS, ENABLE_PARALLEL and
      PARALLEL_SLOTS entries are removed from the list of
      VAR=${VAR:-default} items; the remaining entries are untouched.

  NOTE(review): the leading whitespace of the context lines below was
  reconstructed; run `git apply --check` against the target tree before
  applying.

 Dockerfile         | 2 +-
 docker-compose.yml | 3 ---
 2 files changed, 1 insertion(+), 4 deletions(-)

diff --git a/Dockerfile b/Dockerfile
index 66cac04..e44f8ad 100644
--- a/Dockerfile
+++ b/Dockerfile
@@ -23,7 +23,7 @@ WORKDIR /build
 # Clone and build llama.cpp
 RUN git clone https://github.com/ggerganov/llama.cpp && \
     cd llama.cpp && \
-    CUDA_DOCKER_ARCH=compute_89 make GGML_CUDA=1 -j 8
+    CUDA_DOCKER_ARCH=compute_86 make GGML_CUDA=1 -j 8
 
 
 # Set the working directory
diff --git a/docker-compose.yml b/docker-compose.yml
index d9fdb66..3da4981 100644
--- a/docker-compose.yml
+++ b/docker-compose.yml
@@ -12,13 +12,10 @@ services:
       - PORT=${PORT:-5000}
       - HOST=${HOST:-0.0.0.0}
       - CONFIG_FILE=${CONFIG_FILE:-/models/config.yml}
-      - N_GPU_LAYERS=${N_GPU_LAYERS:-80}
       - GPU=${GPU:-ALL}
       - LLAMACPP_PORT=${LLAMACPP_PORT:-2929}
       - DEBUG=${DEBUG:-true}
       - MODE=${MODE:-choice}
-      - ENABLE_PARALLEL=${ENABLE_PARALLEL:-false}
-      - PARALLEL_SLOTS=${PARALLEL_SLOTS:-1}
       - NO_PARALLEL_PREPROCESSING=${NO_PARALLEL_PREPROCESSING:-false}
       - CONTEXT_SIZE=${CONTEXT_SIZE:- -1}
       - VERBOSE_LLAMA=${VERBOSE_LLAMA:-false}