fix(deployment): resolve model deployment issue on CUDA + Windows environment

2025-05-09 13:43:29 +08:00 · 2025-05-09 13:43:29 +08:00 · bec5b8865c
parent c3855f37ad
commit bec5b8865c
1 changed file with 2 additions and 3 deletions
--- a/Dockerfile.backend.cuda
+++ b/Dockerfile.backend.cuda
@@ -48,11 +48,10 @@ RUN if [ "$SKIP_LLAMA_BUILD" = "false" ]; then \
        mkdir -p build && \
        cd build && \
        echo "Starting CMake configuration with CUDA support..." && \
-        cmake -DGGML_CUDA=ON \
+        cmake -DGGML_CUDA=OFF  -DLLAMA_CUBLAS=OFF \
              -DCMAKE_BUILD_TYPE=Release \
              -DBUILD_SHARED_LIBS=OFF \
-              -DLLAMA_NATIVE=OFF \
-              -DCMAKE_CUDA_FLAGS="-Wno-deprecated-gpu-targets" \
+              -DLLAMA_NATIVE=ON \
              .. && \
        echo "Starting build process (this will take several minutes)..." && \
        cmake --build . --config Release -j --verbose && \