File tree Expand file tree Collapse file tree 2 files changed +9
-2
lines changed Expand file tree Collapse file tree 2 files changed +9
-2
lines changed Original file line number Diff line number Diff line change @@ -286,7 +286,14 @@ COPY --from=grpc /opt/grpc /usr/local
286
286
WORKDIR /build
287
287
288
288
## Build the binary
289
- RUN make build
289
+ ## If it's CUDA, we want to skip some of the llama-compat backends to save space
290
+ ## We only leave the most CPU-optimized variant and the fallback for the cublas build
291
+ ## (both will use CUDA for the actual computation)
292
+ RUN if [ "${BUILD_TYPE}" = "cublas" ]; then \
293
+ SKIP_GRPC_BACKEND="backend-assets/grpc/llama-cpp-avx backend-assets/grpc/llama-cpp-avx2" make build; \
294
+ else \
295
+ make build; \
296
+ fi
290
297
291
298
RUN if [ ! -d "/build/sources/go-piper/piper-phonemize/pi/lib/" ]; then \
292
299
mkdir -p /build/sources/go-piper/piper-phonemize/pi/lib/ \
Original file line number Diff line number Diff line change @@ -8,7 +8,7 @@ DETECT_LIBS?=true
8
8
# llama.cpp versions
9
9
GOLLAMA_REPO?=https://github.com/go-skynet/go-llama.cpp
10
10
GOLLAMA_VERSION?=2b57a8ae43e4699d3dc5d1496a1ccd42922993be
11
- CPPLLAMA_VERSION?=3ba780e2a8f0ffe13f571b27f0bbf2ca5a199efc
11
+ CPPLLAMA_VERSION?=e11bd856d538e44d24d8cad4b0381fba0984d162
12
12
13
13
# go-rwkv version
14
14
RWKV_REPO?=https://github.com/donomii/go-rwkv.cpp
You can’t perform that action at this time.
0 commit comments