From 0e2c422b1174578d925acb9724e79d1663428633 Mon Sep 17 00:00:00 2001 From: Robert Washbourne Date: Thu, 23 Nov 2023 23:58:40 -0500 Subject: [PATCH] remove flags --- .devops/main-cuda.Dockerfile | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/.devops/main-cuda.Dockerfile b/.devops/main-cuda.Dockerfile index 44747f000..1e7e1c4f9 100644 --- a/.devops/main-cuda.Dockerfile +++ b/.devops/main-cuda.Dockerfile @@ -23,9 +23,9 @@ COPY . . ENV CUDA_DOCKER_ARCH=${CUDA_DOCKER_ARCH} # Enable cuBLAS ENV LLAMA_CUBLAS=1 -ENV LLAMA_CUDA_MMV_Y=2 -ENV LLAMA_CUDA_DMMV_X=64 -ENV LLAMA_CUDA_F16=true +# ENV LLAMA_CUDA_MMV_Y=2 +# ENV LLAMA_CUDA_DMMV_X=64 +# ENV LLAMA_CUDA_F16=true RUN make @@ -41,7 +41,7 @@ RUN apt-get install python3 python3-pip RUN pip install --install-option="--prefix=/install" runpod FROM ${BASE_CUDA_RUN_CONTAINER} as runtime -COPY --from=build /install /usr/local + COPY --from=build /app/server /server COPY --from=build /model.gguf model.gguf COPY --from=build /app/models models