|
# Go toolchain entry points; the Go invocations in this file go through GOCMD.
GOCMD = go
GOTEST = $(GOCMD) test
GOVET = $(GOCMD) vet

# Name of the main binary produced by `build` and removed by `clean`.
BINARY_NAME = local-ai

# When "true", `dist` runs scripts/prepare-libs.sh on selected backends.
DETECT_LIBS ?= true
|
|
|
|
|
# Upstream repositories and pinned commits for the vendored backends.
# Each *_REPO / *_VERSION pair is consumed by the matching sources/<name>
# checkout rule; CPPLLAMA_VERSION is passed to backend/cpp/llama as
# LLAMA_VERSION. All of them may be overridden by the caller.

# go-llama.cpp and llama.cpp
GOLLAMA_REPO     ?= https://github.com/go-skynet/go-llama.cpp
GOLLAMA_VERSION  ?= 2b57a8ae43e4699d3dc5d1496a1ccd42922993be
CPPLLAMA_VERSION ?= 1e6f6554aa11fa10160a5fda689e736c3c34169f

# gpt4all
GPT4ALL_REPO    ?= https://github.com/nomic-ai/gpt4all
GPT4ALL_VERSION ?= 27a8b020c36b0df8f8b82a252d261cda47cf44b8

# go-rwkv.cpp
RWKV_REPO    ?= https://github.com/donomii/go-rwkv.cpp
RWKV_VERSION ?= 661e7ae26d442f5cfebd2a0881b44e8c55949ec6

# whisper.cpp
WHISPER_REPO        ?= https://github.com/ggerganov/whisper.cpp
WHISPER_CPP_VERSION ?= fe36c909715e6751277ddb020e7892c7670b61d4

# go-bert.cpp
BERT_REPO    ?= https://github.com/go-skynet/go-bert.cpp
BERT_VERSION ?= 710044b124545415f555e4260d16b146c725a6e4

# go-piper
PIPER_REPO    ?= https://github.com/mudler/go-piper
PIPER_VERSION ?= 9d0100873a7dbb0824dfea40e8cec70a1b110759

# go-stable-diffusion
STABLEDIFFUSION_REPO    ?= https://github.com/mudler/go-stable-diffusion
STABLEDIFFUSION_VERSION ?= 4a3cd6aeae6f66ee57eae9a0075f8c58c3a6a38f

# go-tiny-dream
TINYDREAM_REPO    ?= https://github.com/M0Rf30/go-tiny-dream
TINYDREAM_VERSION ?= c04fa463ace9d9a6464313aa5f9cd0f953b6c057
|
|
|
# Caller-tunable build settings. The exported ones are placed in the
# environment of recipe commands (and therefore of sub-makes).
export BUILD_TYPE ?=
# Deferred reference: follows BUILD_TYPE unless it is set separately.
export STABLE_BUILD_TYPE ?= $(BUILD_TYPE)
export CMAKE_ARGS ?=
export BACKEND_LIBS ?=

# Linker flags handed to cgo; the BUILD_TYPE conditionals further down append to them.
CGO_LDFLAGS ?=
CGO_LDFLAGS_WHISPER ?=
CGO_LDFLAGS_WHISPER += -lggml
CUDA_LIBPATH ?= /usr/local/cuda/lib64/
GO_TAGS ?=
BUILD_ID ?=

# Directory used by the e2e targets for the model file and fixtures.
TEST_DIR = /tmp/test

# Value passed to ginkgo --flake-attempts by the `test` target.
TEST_FLAKES ?= 5
|
|
|
# Random suffix, evaluated once, used in the name of the e2e test container.
RANDOM := $(shell bash -c 'echo $$RANDOM')

# Version string embedded in the binaries; "dev" when git describe fails.
VERSION ?= $(shell git describe --always --tags || echo "dev" )
# Freeze the value so that git is not re-run on every expansion of LD_FLAGS
# (a command-line VERSION keeps precedence over this assignment).
VERSION := $(VERSION)
# Current commit, resolved once at parse time.
git_commit := $(shell git rev-parse HEAD)

# Go linker flags. The version and commit stamps are appended with `override`
# so that they are present even when the caller supplies LD_FLAGS.
LD_FLAGS ?= -s -w
override LD_FLAGS += -X "github.com/mudler/LocalAI/internal.Version=$(VERSION)"
override LD_FLAGS += -X "github.com/mudler/LocalAI/internal.Commit=$(git_commit)"
|
|
|
# Extra prerequisites of `prepare`; empty unless the caller provides some.
OPTIONAL_TARGETS ?=

# Host identification, resolved once at parse time. OS is exported to recipes.
export OS := $(shell uname -s)
ARCH      := $(shell uname -m)

# Terminal colour escape sequences for the build-info and help output.
GREEN  := $(shell tput -Txterm setaf 2)
YELLOW := $(shell tput -Txterm setaf 3)
WHITE  := $(shell tput -Txterm setaf 7)
CYAN   := $(shell tput -Txterm setaf 6)
RESET  := $(shell tput -Txterm sgr0)
|
|
|
# Path of the upx packer, or empty when `which` finds none. Rules that pack
# binaries are guarded by `ifneq ($(UPX),)`.
# As before, a value inherited from the environment is deliberately replaced
# by the detected path; only a command-line UPX=... takes precedence.
# The lookup now runs exactly once instead of twice at parse time plus once
# per expansion.
UPX := $(shell which upx 2>/dev/null)
|
|
|
|
|
# Host address that `test-e2e` uses to build the LOCALAI_API URL.
E2E_BRIDGE_IP ?= 172.17.0.1

# Kernel name, detected only when the caller has not supplied a non-empty value.
ifndef UNAME_S
  UNAME_S := $(shell uname -s)
endif
|
|
|
# Platform defaults: macOS selects signing identity and Metal settings,
# every other OS links whisper against libgomp.
ifeq ($(OS),Darwin)

  # Without an explicit identity, take the first code-signing identity that
  # `security find-identity` prints (the text between double quotes).
  ifeq ($(OSX_SIGNING_IDENTITY),)
    OSX_SIGNING_IDENTITY := $(shell security find-identity -v -p codesigning | grep '"' | head -n 1 | sed -E 's/.*"(.*)"/\1/')
  endif

  # on OSX, if BUILD_TYPE is blank, we should default to use Metal
  ifeq ($(BUILD_TYPE),)
    BUILD_TYPE = metal
  # disable metal if on Darwin and any other value is explicitly passed.
  else ifneq ($(BUILD_TYPE),metal)
    CMAKE_ARGS += -DGGML_METAL=OFF
    export GGML_NO_ACCELERATE = 1
    export GGML_NO_METAL = 1
  endif

  ifeq ($(BUILD_TYPE),metal)
    # -lcblas removed: it seems to always be listed as a duplicate flag.
    CGO_LDFLAGS += -framework Accelerate
  endif

else
  CGO_LDFLAGS_WHISPER += -lgomp
endif
|
|
|
# Per-accelerator settings selected by BUILD_TYPE. Each branch appends linker
# flags and/or exports the GGML_* switch that the backend builds read.

# OpenBLAS
ifeq ($(BUILD_TYPE),openblas)
  CGO_LDFLAGS += -lopenblas
  export GGML_OPENBLAS = 1
endif

# NVIDIA cuBLAS; whisper additionally links against the CUDA stub libraries.
ifeq ($(BUILD_TYPE),cublas)
  CGO_LDFLAGS += -lcublas -lcudart -L$(CUDA_LIBPATH)
  export GGML_CUDA = 1
  CGO_LDFLAGS_WHISPER += -L$(CUDA_LIBPATH)/stubs/ -lcuda -lcufft
endif

# Vulkan is enabled through CMake only.
ifeq ($(BUILD_TYPE),vulkan)
  CMAKE_ARGS += -DGGML_VULKAN=1
endif

# Any BUILD_TYPE containing "sycl" enables SYCL ...
ifneq (,$(findstring sycl,$(BUILD_TYPE)))
  export GGML_SYCL = 1
endif

# ... and sycl_f16 additionally enables the F16 variant.
ifeq ($(BUILD_TYPE),sycl_f16)
  export GGML_SYCL_F16 = 1
endif
|
|
|
# AMD ROCm / hipBLAS: build with ROCm's clang and pass the GPU target list
# to CMake.
ifeq ($(BUILD_TYPE),hipblas)
  ROCM_HOME ?= /opt/rocm
  ROCM_PATH ?= /opt/rocm
  # NOTE(review): this is a plain make variable unless LD_LIBRARY_PATH already
  # exists in the environment, and it does not follow ROCM_HOME - confirm intent.
  LD_LIBRARY_PATH ?= /opt/rocm/lib:/opt/rocm/llvm/lib
  export CXX = $(ROCM_HOME)/llvm/bin/clang++
  export CC = $(ROCM_HOME)/llvm/bin/clang
  # llama-ggml has no hipblas support, so override it here.
  export STABLE_BUILD_TYPE =
  export GGML_HIPBLAS = 1
  GPU_TARGETS ?= gfx900,gfx906,gfx908,gfx940,gfx941,gfx942,gfx90a,gfx1030,gfx1031,gfx1100,gfx1101
  AMDGPU_TARGETS ?= "$(GPU_TARGETS)"
  CMAKE_ARGS += -DGGML_HIPBLAS=ON -DAMDGPU_TARGETS="$(AMDGPU_TARGETS)" -DGPU_TARGETS="$(GPU_TARGETS)"
  CGO_LDFLAGS += -O3 --rtlib=compiler-rt -unwindlib=libgcc -lhipblas -lrocblas --hip-link -L$(ROCM_HOME)/lib/llvm/lib
endif
|
|
|
# Apple Metal: link the Metal frameworks and enable the ggml Metal backend.
ifeq ($(BUILD_TYPE),metal)
  CGO_LDFLAGS += -framework Foundation -framework Metal -framework MetalKit -framework MetalPerformanceShaders
  export GGML_METAL = 1
endif

# CLBlast / OpenCL.
# NOTE(review): this branch exports GGML_OPENBLAS rather than a CLBlast-specific
# switch - confirm that is intended.
ifeq ($(BUILD_TYPE),clblas)
  CGO_LDFLAGS += -lOpenCL -lclblast
  export GGML_OPENBLAS = 1
endif
|
|
|
# Static linking of the Go binaries when STATIC=true.
# glibc-static or glibc-devel-static required
#
# LD_FLAGS was previously appended to with `override`; GNU make ignores any
# later assignment or append to such a variable unless it is also marked
# `override`, so a plain `+=` here never took effect.
ifeq ($(STATIC),true)
  override LD_FLAGS += -linkmode external -extldflags -static
endif
|
|
|
# Optional gRPC backends, enabled when the matching word occurs in GO_TAGS.
# The corresponding OPTIONAL_TARGETS additions (static libraries,
# espeak-ng data) are currently disabled and kept only as comments.

ifneq (,$(findstring stablediffusion,$(GO_TAGS)))
  # OPTIONAL_TARGETS+=go-stable-diffusion/libstablediffusion.a
  OPTIONAL_GRPC += backend-assets/grpc/stablediffusion
endif

ifneq (,$(findstring tinydream,$(GO_TAGS)))
  # OPTIONAL_TARGETS+=go-tiny-dream/libtinydream.a
  OPTIONAL_GRPC += backend-assets/grpc/tinydream
endif

# The tts tag also sets the include and library search paths used to build piper.
ifneq (,$(findstring tts,$(GO_TAGS)))
  # OPTIONAL_TARGETS+=go-piper/libpiper_binding.a
  # OPTIONAL_TARGETS+=backend-assets/espeak-ng-data
  PIPER_CGO_CXXFLAGS += -I$(CURDIR)/sources/go-piper/piper/src/cpp -I$(CURDIR)/sources/go-piper/piper/build/fi/include -I$(CURDIR)/sources/go-piper/piper/build/pi/include -I$(CURDIR)/sources/go-piper/piper/build/si/include
  PIPER_CGO_LDFLAGS += -L$(CURDIR)/sources/go-piper/piper/build/fi/lib -L$(CURDIR)/sources/go-piper/piper/build/pi/lib -L$(CURDIR)/sources/go-piper/piper/build/si/lib -lfmt -lspdlog -lucd
  OPTIONAL_GRPC += backend-assets/grpc/piper
endif
|
|
|
# Every gRPC backend that can be built, followed by the optional ones
# selected through GO_TAGS.
ALL_GRPC_BACKENDS  = backend-assets/grpc/huggingface
ALL_GRPC_BACKENDS += backend-assets/grpc/bert-embeddings
ALL_GRPC_BACKENDS += backend-assets/grpc/llama-cpp-avx
ALL_GRPC_BACKENDS += backend-assets/grpc/llama-cpp-avx2
ALL_GRPC_BACKENDS += backend-assets/grpc/llama-cpp-fallback
ALL_GRPC_BACKENDS += backend-assets/grpc/llama-ggml
ALL_GRPC_BACKENDS += backend-assets/grpc/llama-cpp-grpc
ALL_GRPC_BACKENDS += backend-assets/util/llama-cpp-rpc-server
ALL_GRPC_BACKENDS += backend-assets/grpc/gpt4all
ALL_GRPC_BACKENDS += backend-assets/grpc/rwkv
ALL_GRPC_BACKENDS += backend-assets/grpc/whisper
ALL_GRPC_BACKENDS += backend-assets/grpc/local-store
ALL_GRPC_BACKENDS += $(OPTIONAL_GRPC)
# Use filter-out to remove the specified backends
ALL_GRPC_BACKENDS := $(filter-out $(SKIP_GRPC_BACKEND),$(ALL_GRPC_BACKENDS))

# Backends actually built. ALL_GRPC_BACKENDS already contains OPTIONAL_GRPC;
# appending it a second time duplicated the entries and re-added optional
# backends that SKIP_GRPC_BACKEND had just filtered out.
GRPC_BACKENDS ?= $(ALL_GRPC_BACKENDS)

# Package patterns handed to ginkgo by the test targets.
TEST_PATHS ?= ./api/... ./pkg/... ./core/...

# If empty, then we build all
ifeq ($(GRPC_BACKENDS),)
  GRPC_BACKENDS = $(ALL_GRPC_BACKENDS)
endif

# An API-only build ships no backends at all.
ifeq ($(BUILD_API_ONLY),true)
  GRPC_BACKENDS =
endif
|
|
|
# Command targets that do not produce a file of the same name. Declaring them
# phony keeps a stray file or directory called e.g. `clean` or `dist` from
# silently disabling the target.
.PHONY: all test build vendor get-sources prepare-sources prepare
.PHONY: replace dropreplace rebuild clean clean-tests
.PHONY: build-minimal build-api dist dist-cross-linux-arm64 osx-signed run
.PHONY: prepare-test prepare-e2e run-e2e-image run-e2e-aio test-e2e teardown-e2e
.PHONY: test-gpt4all test-llama test-llama-gguf test-tts test-stablediffusion
.PHONY: test-stores test-container test-extra prepare-test-extra
.PHONY: prepare-extra-conda-environments help

# Default goal: print the help text.
all: help
|
|
|
## BERT embeddings |
|
# Create an empty repository, fetch BERT_REPO and check out the pinned
# BERT_VERSION together with its submodules.
sources/go-bert.cpp:
	mkdir -p $@
	cd $@ && \
	git init && \
	git remote add origin $(BERT_REPO) && \
	git fetch origin && \
	git checkout $(BERT_VERSION) && \
	git submodule update --init --recursive --depth 1 --single-branch

# Build the static library with the checkout's own Makefile.
sources/go-bert.cpp/libgobert.a: sources/go-bert.cpp
	$(MAKE) -C $< $(@F)
|
|
|
## go-llama.cpp |
|
# Create an empty repository, fetch GOLLAMA_REPO and check out the pinned
# GOLLAMA_VERSION together with its submodules.
sources/go-llama.cpp:
	mkdir -p $@
	cd $@ && \
	git init && \
	git remote add origin $(GOLLAMA_REPO) && \
	git fetch origin && \
	git checkout $(GOLLAMA_VERSION) && \
	git submodule update --init --recursive --depth 1 --single-branch

# Build the binding; the sub-make receives STABLE_BUILD_TYPE as its BUILD_TYPE.
sources/go-llama.cpp/libbinding.a: sources/go-llama.cpp
	$(MAKE) -C $< BUILD_TYPE=$(STABLE_BUILD_TYPE) $(@F)
|
|
|
## go-piper |
|
# Create an empty repository, fetch PIPER_REPO and check out the pinned
# PIPER_VERSION together with its submodules.
sources/go-piper:
	mkdir -p $@
	cd $@ && \
	git init && \
	git remote add origin $(PIPER_REPO) && \
	git fetch origin && \
	git checkout $(PIPER_VERSION) && \
	git submodule update --init --recursive --depth 1 --single-branch

# Build the binding library plus the example/main and piper.o goals of the
# checkout's Makefile.
sources/go-piper/libpiper_binding.a: sources/go-piper
	$(MAKE) -C $< $(@F) example/main piper.o
|
|
|
## GPT4ALL |
|
# Create an empty repository, fetch GPT4ALL_REPO and check out the pinned
# GPT4ALL_VERSION together with its submodules.
sources/gpt4all:
	mkdir -p $@
	cd $@ && \
	git init && \
	git remote add origin $(GPT4ALL_REPO) && \
	git fetch origin && \
	git checkout $(GPT4ALL_VERSION) && \
	git submodule update --init --recursive --depth 1 --single-branch

# Build the Go binding library inside gpt4all-bindings/golang.
sources/gpt4all/gpt4all-bindings/golang/libgpt4all.a: sources/gpt4all
	$(MAKE) -C $(@D)/ $(@F)
|
|
|
## RWKV |
|
# Create an empty repository, fetch RWKV_REPO and check out the pinned
# RWKV_VERSION together with its submodules.
sources/go-rwkv.cpp:
	mkdir -p $@
	cd $@ && \
	git init && \
	git remote add origin $(RWKV_REPO) && \
	git fetch origin && \
	git checkout $(RWKV_VERSION) && \
	git submodule update --init --recursive --depth 1 --single-branch

# Configure and build rwkv.cpp as a static library with CMake, then copy the
# archive one level up into the checkout root.
sources/go-rwkv.cpp/librwkv.a: sources/go-rwkv.cpp
	cd $</rwkv.cpp && \
	cmake . -DRWKV_BUILD_SHARED_LIBRARY=OFF && \
	cmake --build . && \
	cp $(@F) ..
|
|
|
## stable diffusion |
|
# Create an empty repository, fetch STABLEDIFFUSION_REPO and check out the
# pinned STABLEDIFFUSION_VERSION together with its submodules.
sources/go-stable-diffusion:
	mkdir -p $@
	cd $@ && \
	git init && \
	git remote add origin $(STABLEDIFFUSION_REPO) && \
	git fetch origin && \
	git checkout $(STABLEDIFFUSION_VERSION) && \
	git submodule update --init --recursive --depth 1 --single-branch

# Build the static library; the OpenCV 4 include directory is appended to CPATH.
sources/go-stable-diffusion/libstablediffusion.a: sources/go-stable-diffusion
	CPATH="$(CPATH):/usr/include/opencv4" $(MAKE) -C $< $(@F)
|
|
|
## tiny-dream |
|
# Create an empty repository, fetch TINYDREAM_REPO and check out the pinned
# TINYDREAM_VERSION together with its submodules.
sources/go-tiny-dream:
	mkdir -p $@
	cd $@ && \
	git init && \
	git remote add origin $(TINYDREAM_REPO) && \
	git fetch origin && \
	git checkout $(TINYDREAM_VERSION) && \
	git submodule update --init --recursive --depth 1 --single-branch

# Build the static library with the checkout's own Makefile.
sources/go-tiny-dream/libtinydream.a: sources/go-tiny-dream
	$(MAKE) -C $< $(@F)
|
|
|
## whisper |
|
# Create an empty repository, fetch WHISPER_REPO and check out the pinned
# WHISPER_CPP_VERSION together with its submodules.
sources/whisper.cpp:
	mkdir -p $@
	cd $@ && \
	git init && \
	git remote add origin $(WHISPER_REPO) && \
	git fetch origin && \
	git checkout $(WHISPER_CPP_VERSION) && \
	git submodule update --init --recursive --depth 1 --single-branch

# Build libwhisper.a and libggml.a from inside the checkout.
sources/whisper.cpp/libwhisper.a: sources/whisper.cpp
	cd $< && $(MAKE) $(@F) libggml.a
|
|
|
# Check out every vendored backend source tree and the llama.cpp sources.
get-sources: \
  sources/go-llama.cpp \
  sources/gpt4all \
  sources/go-piper \
  sources/go-rwkv.cpp \
  sources/whisper.cpp \
  sources/go-bert.cpp \
  sources/go-stable-diffusion \
  sources/go-tiny-dream \
  backend/cpp/llama/llama.cpp
|
|
|
# Add go.mod replace directives that point each backend module at its local
# checkout under sources/.
replace:
	$(GOCMD) mod edit -replace github.com/donomii/go-rwkv.cpp=$(CURDIR)/sources/go-rwkv.cpp
	$(GOCMD) mod edit -replace github.com/ggerganov/whisper.cpp=$(CURDIR)/sources/whisper.cpp
	$(GOCMD) mod edit -replace github.com/ggerganov/whisper.cpp/bindings/go=$(CURDIR)/sources/whisper.cpp/bindings/go
	$(GOCMD) mod edit -replace github.com/go-skynet/go-bert.cpp=$(CURDIR)/sources/go-bert.cpp
	$(GOCMD) mod edit -replace github.com/M0Rf30/go-tiny-dream=$(CURDIR)/sources/go-tiny-dream
	$(GOCMD) mod edit -replace github.com/mudler/go-piper=$(CURDIR)/sources/go-piper
	$(GOCMD) mod edit -replace github.com/mudler/go-stable-diffusion=$(CURDIR)/sources/go-stable-diffusion
	$(GOCMD) mod edit -replace github.com/nomic-ai/gpt4all/gpt4all-bindings/golang=$(CURDIR)/sources/gpt4all/gpt4all-bindings/golang
	$(GOCMD) mod edit -replace github.com/go-skynet/go-llama.cpp=$(CURDIR)/sources/go-llama.cpp
|
|
|
# Remove the go.mod replace directives added by `replace`.
dropreplace:
	$(GOCMD) mod edit -dropreplace github.com/donomii/go-rwkv.cpp
	$(GOCMD) mod edit -dropreplace github.com/ggerganov/whisper.cpp
	$(GOCMD) mod edit -dropreplace github.com/ggerganov/whisper.cpp/bindings/go
	$(GOCMD) mod edit -dropreplace github.com/go-skynet/go-bert.cpp
	$(GOCMD) mod edit -dropreplace github.com/M0Rf30/go-tiny-dream
	$(GOCMD) mod edit -dropreplace github.com/mudler/go-piper
	$(GOCMD) mod edit -dropreplace github.com/mudler/go-stable-diffusion
	$(GOCMD) mod edit -dropreplace github.com/nomic-ai/gpt4all/gpt4all-bindings/golang
	$(GOCMD) mod edit -dropreplace github.com/go-skynet/go-llama.cpp
|
|
|
# Fetch all sources, point go.mod at them, then download the Go module
# dependencies.
prepare-sources: get-sources replace
	$(GOCMD) mod download
|
|
|
## GENERIC |
|
# Drop the Go build cache, run `clean` in every vendored source tree and
# build again.
rebuild: ## Rebuilds the project
	$(GOCMD) clean -cache
	$(MAKE) -C sources/go-llama.cpp clean
	$(MAKE) -C sources/gpt4all/gpt4all-bindings/golang/ clean
	$(MAKE) -C sources/go-rwkv.cpp clean
	$(MAKE) -C sources/whisper.cpp clean
	$(MAKE) -C sources/go-stable-diffusion clean
	$(MAKE) -C sources/go-bert.cpp clean
	$(MAKE) -C sources/go-piper clean
	$(MAKE) -C sources/go-tiny-dream clean
	$(MAKE) build
|
|
|
# Everything that must exist before compiling: the prepared sources plus any
# caller-supplied OPTIONAL_TARGETS.
prepare: prepare-sources $(OPTIONAL_TARGETS)
|
|
|
# Remove build products, fetched sources and generated protobuf code, and
# drop the go.mod replace directives.
clean: ## Remove build related file
	$(GOCMD) clean -cache
	rm -f prepare
	rm -rf ./sources
	rm -rf $(BINARY_NAME)
	rm -rf release/
	rm -rf backend-assets/*
	$(MAKE) -C backend/cpp/grpc clean
	$(MAKE) -C backend/cpp/llama clean
	rm -rf backend/cpp/llama-* || true
	$(MAKE) dropreplace
	$(MAKE) protogen-clean
	rmdir pkg/grpc/proto || true
|
|
|
# Remove the downloaded test models, the test scratch directory and the
# backend assets copied next to the HTTP tests.
clean-tests:
	rm -rf test-models
	rm -rf test-dir
	rm -rf core/http/backend-assets
|
|
|
## Build: |
|
# Print the effective build settings, optionally copy BACKEND_LIBS into
# backend-assets/lib, then compile the main binary.
build: prepare backend-assets grpcs ## Build the project
	$(info ${GREEN}I local-ai build info:${RESET})
	$(info ${GREEN}I BUILD_TYPE: ${YELLOW}$(BUILD_TYPE)${RESET})
	$(info ${GREEN}I GO_TAGS: ${YELLOW}$(GO_TAGS)${RESET})
	$(info ${GREEN}I LD_FLAGS: ${YELLOW}$(LD_FLAGS)${RESET})
	$(info ${GREEN}I UPX: ${YELLOW}$(UPX)${RESET})
ifneq ($(BACKEND_LIBS),)
	$(MAKE) backend-assets/lib
	cp -f $(BACKEND_LIBS) backend-assets/lib/
endif
	CGO_LDFLAGS="$(CGO_LDFLAGS)" \
	$(GOCMD) build -ldflags "$(LD_FLAGS)" -tags "$(GO_TAGS)" -o $(BINARY_NAME) ./
|
|
|
# Build with only the llama-cpp-avx2 backend and the p2p tag.
build-minimal:
	BUILD_GRPC_FOR_BACKEND_LLAMA=true \
	GRPC_BACKENDS="backend-assets/grpc/llama-cpp-avx2" \
	GO_TAGS=p2p \
	$(MAKE) build

# Build the API binary without any gRPC backend.
build-api:
	BUILD_GRPC_FOR_BACKEND_LLAMA=true \
	BUILD_API_ONLY=true \
	GO_TAGS=none \
	$(MAKE) build
|
|
|
# Directory that receives the libraries listed in BACKEND_LIBS.
backend-assets/lib:
	mkdir -p $@
|
|
|
# Release build: build the llama-cpp variants, build the main binary (the
# second pass with STATIC=true), then copy it with a sha256 file into release/.
dist:
	$(MAKE) backend-assets/grpc/llama-cpp-avx2
ifeq ($(DETECT_LIBS),true)
	scripts/prepare-libs.sh backend-assets/grpc/llama-cpp-avx2
endif
ifeq ($(OS),Darwin)
	$(info ${GREEN}I Skip CUDA/hipblas build on MacOS${RESET})
else
	$(MAKE) backend-assets/grpc/llama-cpp-cuda
	$(MAKE) backend-assets/grpc/llama-cpp-hipblas
	$(MAKE) backend-assets/grpc/llama-cpp-sycl_f16
	$(MAKE) backend-assets/grpc/llama-cpp-sycl_f32
endif
	GO_TAGS="tts p2p" $(MAKE) build
ifeq ($(DETECT_LIBS),true)
	scripts/prepare-libs.sh backend-assets/grpc/piper
endif
	GO_TAGS="tts p2p" STATIC=true $(MAKE) build
	mkdir -p release
	# if BUILD_ID is empty, then we don't append it to the binary name
ifeq ($(BUILD_ID),)
	cp $(BINARY_NAME) release/$(BINARY_NAME)-$(OS)-$(ARCH)
	shasum -a 256 release/$(BINARY_NAME)-$(OS)-$(ARCH) > release/$(BINARY_NAME)-$(OS)-$(ARCH).sha256
else
	cp $(BINARY_NAME) release/$(BINARY_NAME)-$(BUILD_ID)-$(OS)-$(ARCH)
	shasum -a 256 release/$(BINARY_NAME)-$(BUILD_ID)-$(OS)-$(ARCH) > release/$(BINARY_NAME)-$(BUILD_ID)-$(OS)-$(ARCH).sha256
endif
|
|
|
# Release build for arm64: a reduced backend set with -DGGML_NATIVE=off added
# to CMAKE_ARGS; the artifact name carries a fixed "arm64" suffix.
dist-cross-linux-arm64:
	CMAKE_ARGS="$(CMAKE_ARGS) -DGGML_NATIVE=off" \
	GRPC_BACKENDS="backend-assets/grpc/llama-cpp-fallback backend-assets/grpc/llama-cpp-grpc backend-assets/util/llama-cpp-rpc-server" \
	GO_TAGS="p2p" \
	STATIC=true $(MAKE) build
	mkdir -p release
	# if BUILD_ID is empty, then we don't append it to the binary name
ifeq ($(BUILD_ID),)
	cp $(BINARY_NAME) release/$(BINARY_NAME)-$(OS)-arm64
	shasum -a 256 release/$(BINARY_NAME)-$(OS)-arm64 > release/$(BINARY_NAME)-$(OS)-arm64.sha256
else
	cp $(BINARY_NAME) release/$(BINARY_NAME)-$(BUILD_ID)-$(OS)-arm64
	shasum -a 256 release/$(BINARY_NAME)-$(BUILD_ID)-$(OS)-arm64 > release/$(BINARY_NAME)-$(BUILD_ID)-$(OS)-arm64.sha256
endif
|
|
|
# Build, then sign the binary with OSX_SIGNING_IDENTITY and the entitlements
# in ./Entitlements.plist.
osx-signed: build
	codesign --deep --force \
	--sign "$(OSX_SIGNING_IDENTITY)" \
	--entitlements "./Entitlements.plist" \
	"./$(BINARY_NAME)"
|
|
|
## Run |
|
# Run the main package with `go run`, passing the same CGO_LDFLAGS as `build`.
run: prepare ## run local-ai
	CGO_LDFLAGS="$(CGO_LDFLAGS)" \
	$(GOCMD) run ./
|
|
|
# Download the models and the audio sample used by the test suite and copy
# the fixture configs next to them.
# `mkdir -p` lets the rule be re-run after an interrupted download: plain
# `mkdir` failed on the already existing directories.
test-models/testmodel.ggml:
	mkdir -p test-models
	mkdir -p test-dir
	wget -q https://huggingface.co/TheBloke/orca_mini_3B-GGML/resolve/main/orca-mini-3b.ggmlv3.q4_0.bin -O $@
	wget -q https://huggingface.co/ggerganov/whisper.cpp/resolve/main/ggml-base.en.bin -O test-models/whisper-en
	wget -q https://huggingface.co/mudler/all-MiniLM-L6-v2/resolve/main/ggml-model-q4_0.bin -O test-models/bert
	wget -q https://cdn.openai.com/whisper/draft-20220913a/micro-machines.wav -O test-dir/audio.wav
	wget -q https://huggingface.co/mudler/rwkv-4-raven-1.5B-ggml/resolve/main/RWKV-4-Raven-1B5-v11-Eng99%2525-Other1%2525-20230425-ctx4096_Q4_0.bin -O test-models/rwkv
	wget -q https://raw.githubusercontent.com/saharNooby/rwkv.cpp/5eb8f09c146ea8124633ab041d9ea0b1f1db4459/rwkv/20B_tokenizer.json -O test-models/rwkv.tokenizer.json
	cp tests/models_fixtures/* test-models
|
|
|
# Make the built backends visible to the HTTP tests and refresh the model
# fixtures.
prepare-test: grpcs
	cp -rf backend-assets core/http
	cp tests/models_fixtures/* test-models
|
|
|
# Run the unlabelled test suite first, then each label-specific suite.
#
# The former `export GO_TAGS="tts stablediffusion debug"` recipe line was
# removed: every recipe line runs in its own shell, so that export never
# reached the commands below. Build tags for the tests must come from the
# caller (command line or environment), exactly as before.
test: prepare test-models/testmodel.ggml grpcs
	@echo 'Running tests'
	$(MAKE) prepare-test
	HUGGINGFACE_GRPC=$(abspath ./)/backend/python/sentencetransformers/run.sh TEST_DIR=$(abspath ./)/test-dir/ FIXTURES=$(abspath ./)/tests/fixtures CONFIG_FILE=$(abspath ./)/test-models/config.yaml MODELS_PATH=$(abspath ./)/test-models \
	$(GOCMD) run github.com/onsi/ginkgo/v2/ginkgo --label-filter="!gpt4all && !llama && !llama-gguf" --flake-attempts $(TEST_FLAKES) --fail-fast -v -r $(TEST_PATHS)
	$(MAKE) test-gpt4all
	$(MAKE) test-llama
	$(MAKE) test-llama-gguf
	$(MAKE) test-tts
	$(MAKE) test-stablediffusion
|
|
|
# Stage the e2e fixtures in TEST_DIR, download the test model unless it is
# already there, and build the localai-tests image.
prepare-e2e:
	mkdir -p $(TEST_DIR)
	cp -rfv $(abspath ./tests/e2e-fixtures)/gpu.yaml $(TEST_DIR)/gpu.yaml
	test -e $(TEST_DIR)/ggllm-test-model.bin || \
	wget -q https://huggingface.co/TheBloke/CodeLlama-7B-Instruct-GGUF/resolve/main/codellama-7b-instruct.Q2_K.gguf -O $(TEST_DIR)/ggllm-test-model.bin
	docker build \
	--build-arg GRPC_BACKENDS="$(GRPC_BACKENDS)" \
	--build-arg IMAGE_TYPE=core \
	--build-arg BUILD_TYPE=$(BUILD_TYPE) \
	--build-arg CUDA_MAJOR_VERSION=12 \
	--build-arg CUDA_MINOR_VERSION=0 \
	--build-arg FFMPEG=true \
	-t localai-tests .
|
|
|
# Start the localai-tests image detached, with TEST_DIR mounted as /models
# and the API published on host port 5390.
run-e2e-image:
	ls -liah $(abspath ./tests/e2e-fixtures)
	docker run -p 5390:8080 \
	-e MODELS_PATH=/models -e THREADS=1 -e DEBUG=true \
	-d --rm -v $(TEST_DIR):/models --gpus all \
	--name e2e-tests-$(RANDOM) localai-tests
|
|
|
# Run the ginkgo suite under ./tests/e2e-aio.
run-e2e-aio:
	@echo 'Running e2e AIO tests'
	$(GOCMD) run github.com/onsi/ginkgo/v2/ginkgo \
	--flake-attempts 5 -v -r ./tests/e2e-aio
|
|
|
# Run the ginkgo suite under ./tests/e2e against the API reachable at
# E2E_BRIDGE_IP on port 5390.
test-e2e:
	@echo 'Running e2e tests'
	BUILD_TYPE=$(BUILD_TYPE) \
	LOCALAI_API=http://$(E2E_BRIDGE_IP):5390/v1 \
	$(GOCMD) run github.com/onsi/ginkgo/v2/ginkgo \
	--flake-attempts 5 -v -r ./tests/e2e
|
|
|
# Remove the e2e scratch directory and stop every running container created
# from the localai-tests image.
# `docker stop` rejects an empty argument list, so it is only called when
# `docker ps` reported at least one container; a failing `docker ps` still
# fails the target.
teardown-e2e:
	rm -rf $(TEST_DIR) || true
	ids=$$(docker ps -q --filter ancestor=localai-tests) && \
	if [ -n "$$ids" ]; then docker stop $$ids; fi
|
|
|
# Label-specific ginkgo runs. They all use the same environment (test
# directory, fixtures, config file, models path) and differ only in the label
# filter and the number of flake attempts.

test-gpt4all: prepare-test
	TEST_DIR=$(abspath ./)/test-dir/ \
	FIXTURES=$(abspath ./)/tests/fixtures \
	CONFIG_FILE=$(abspath ./)/test-models/config.yaml \
	MODELS_PATH=$(abspath ./)/test-models \
	$(GOCMD) run github.com/onsi/ginkgo/v2/ginkgo --label-filter="gpt4all" --flake-attempts 5 -v -r $(TEST_PATHS)

test-llama: prepare-test
	TEST_DIR=$(abspath ./)/test-dir/ \
	FIXTURES=$(abspath ./)/tests/fixtures \
	CONFIG_FILE=$(abspath ./)/test-models/config.yaml \
	MODELS_PATH=$(abspath ./)/test-models \
	$(GOCMD) run github.com/onsi/ginkgo/v2/ginkgo --label-filter="llama" --flake-attempts 5 -v -r $(TEST_PATHS)

test-llama-gguf: prepare-test
	TEST_DIR=$(abspath ./)/test-dir/ \
	FIXTURES=$(abspath ./)/tests/fixtures \
	CONFIG_FILE=$(abspath ./)/test-models/config.yaml \
	MODELS_PATH=$(abspath ./)/test-models \
	$(GOCMD) run github.com/onsi/ginkgo/v2/ginkgo --label-filter="llama-gguf" --flake-attempts 5 -v -r $(TEST_PATHS)

test-tts: prepare-test
	TEST_DIR=$(abspath ./)/test-dir/ \
	FIXTURES=$(abspath ./)/tests/fixtures \
	CONFIG_FILE=$(abspath ./)/test-models/config.yaml \
	MODELS_PATH=$(abspath ./)/test-models \
	$(GOCMD) run github.com/onsi/ginkgo/v2/ginkgo --label-filter="tts" --flake-attempts 1 -v -r $(TEST_PATHS)

test-stablediffusion: prepare-test
	TEST_DIR=$(abspath ./)/test-dir/ \
	FIXTURES=$(abspath ./)/tests/fixtures \
	CONFIG_FILE=$(abspath ./)/test-models/config.yaml \
	MODELS_PATH=$(abspath ./)/test-models \
	$(GOCMD) run github.com/onsi/ginkgo/v2/ginkgo --label-filter="stablediffusion" --flake-attempts 1 -v -r $(TEST_PATHS)
|
|
|
# Copy the local-store backend next to the integration tests and run the
# suites labelled "stores".
test-stores: backend-assets/grpc/local-store
	mkdir -p tests/integration/backend-assets/grpc
	cp -f $< tests/integration/backend-assets/grpc/
	$(GOCMD) run github.com/onsi/ginkgo/v2/ginkgo --label-filter="stores" --flake-attempts 1 -v -r tests/integration
|
|
|
# Build the `requirements` stage of the Dockerfile and open an interactive
# bash shell in it with the working tree mounted at /build.
# (-ti was given twice on the original command line; once is equivalent.)
test-container:
	docker build --target requirements -t local-ai-test-container .
	docker run -ti --rm --entrypoint /bin/bash -v $(abspath ./):/build local-ai-test-container
|
|
|
## Help: |
|
# Print usage plus a list generated from this file: every line starting with
# "## " becomes a section heading and every "target: ... ## text" line becomes
# a target entry.
# The awk program had been cut off at each "##" (unterminated quote and
# regular expressions); it is restored here. Inside a recipe "#" is passed to
# the shell and "$$" yields a literal "$" for awk.
help: ## Show this help.
	@echo ''
	@echo 'Usage:'
	@echo ' ${YELLOW}make${RESET} ${GREEN}<target>${RESET}'
	@echo ''
	@echo 'Targets:'
	@awk 'BEGIN {FS = ":.*?## "} { \
		if (/^[a-zA-Z_-]+:.*?##.*$$/) {printf "    ${YELLOW}%-20s${GREEN}%s${RESET}\n", $$1, $$2} \
		else if (/^## .*$$/) {printf "  ${CYAN}%s${RESET}\n", substr($$1,4)} \
		}' $(MAKEFILE_LIST)
|
|
|
# Aggregate protobuf code generation: Go stubs plus one target per Python backend.
.PHONY: protogen
protogen: protogen-go protogen-python

.PHONY: protogen-clean
protogen-clean: protogen-go-clean protogen-python-clean

# Generate the Go message and gRPC code for backend/backend.proto into
# pkg/grpc/proto.
.PHONY: protogen-go
protogen-go:
	mkdir -p pkg/grpc/proto
	protoc --experimental_allow_proto3_optional -Ibackend/ \
	--go_out=pkg/grpc/proto/ --go_opt=paths=source_relative \
	--go-grpc_out=pkg/grpc/proto/ --go-grpc_opt=paths=source_relative \
	backend/backend.proto

# Delete the generated Go files and everything under bin/.
.PHONY: protogen-go-clean
protogen-go-clean:
	$(RM) pkg/grpc/proto/backend.pb.go pkg/grpc/proto/backend_grpc.pb.go
	$(RM) bin/*

.PHONY: protogen-python
protogen-python: \
  autogptq-protogen \
  bark-protogen \
  coqui-protogen \
  diffusers-protogen \
  exllama-protogen \
  exllama2-protogen \
  mamba-protogen \
  petals-protogen \
  rerankers-protogen \
  sentencetransformers-protogen \
  transformers-protogen \
  parler-tts-protogen \
  transformers-musicgen-protogen \
  vall-e-x-protogen \
  vllm-protogen \
  openvoice-protogen

.PHONY: protogen-python-clean
protogen-python-clean: \
  autogptq-protogen-clean \
  bark-protogen-clean \
  coqui-protogen-clean \
  diffusers-protogen-clean \
  exllama-protogen-clean \
  exllama2-protogen-clean \
  mamba-protogen-clean \
  petals-protogen-clean \
  sentencetransformers-protogen-clean \
  rerankers-protogen-clean \
  transformers-protogen-clean \
  transformers-musicgen-protogen-clean \
  parler-tts-protogen-clean \
  vall-e-x-protogen-clean \
  vllm-protogen-clean \
  openvoice-protogen-clean
|
|
|
# Per-backend protobuf targets. For every Python backend <name> there is
#   <name>-protogen        -> $(MAKE) -C backend/python/<name> protogen
#   <name>-protogen-clean  -> $(MAKE) -C backend/python/<name> protogen-clean
# Two static pattern rules generate them; the stem ($*) is the backend
# directory name.
python_protogen_backends := \
  autogptq bark coqui diffusers exllama exllama2 mamba petals rerankers \
  sentencetransformers transformers parler-tts transformers-musicgen \
  vall-e-x openvoice vllm

python_protogen_targets := $(addsuffix -protogen,$(python_protogen_backends))
python_protogen_clean_targets := $(addsuffix -protogen-clean,$(python_protogen_backends))

.PHONY: $(python_protogen_targets) $(python_protogen_clean_targets)

$(python_protogen_targets): %-protogen:
	$(MAKE) -C backend/python/$* protogen

$(python_protogen_clean_targets): %-protogen-clean:
	$(MAKE) -C backend/python/$* protogen-clean
|
|
|
|
|
|
|
# After generating the Python protobuf code, run the default goal of every
# Python backend's Makefile, one backend at a time.
prepare-extra-conda-environments: protogen-python
	$(MAKE) -C backend/python/autogptq
	$(MAKE) -C backend/python/bark
	$(MAKE) -C backend/python/coqui
	$(MAKE) -C backend/python/diffusers
	$(MAKE) -C backend/python/vllm
	$(MAKE) -C backend/python/mamba
	$(MAKE) -C backend/python/sentencetransformers
	$(MAKE) -C backend/python/rerankers
	$(MAKE) -C backend/python/transformers
	$(MAKE) -C backend/python/transformers-musicgen
	$(MAKE) -C backend/python/parler-tts
	$(MAKE) -C backend/python/vall-e-x
	$(MAKE) -C backend/python/openvoice
	$(MAKE) -C backend/python/exllama
	$(MAKE) -C backend/python/petals
	$(MAKE) -C backend/python/exllama2
|
|
|
# Prepare the two Python backends covered by the extra tests ...
prepare-test-extra: protogen-python
	$(MAKE) -C backend/python/transformers
	$(MAKE) -C backend/python/diffusers

# ... and run their `test` goals.
test-extra: prepare-test-extra
	$(MAKE) -C backend/python/transformers test
	$(MAKE) -C backend/python/diffusers test
|
|
|
# Asset directory; an API-only build additionally gets a `keep` file in it.
backend-assets:
	mkdir -p $@
ifeq ($(BUILD_API_ONLY),true)
	touch $@/keep
endif
|
|
|
# Copy the espeak-ng data found in the go-piper checkout into the assets.
backend-assets/espeak-ng-data: sources/go-piper sources/go-piper/libpiper_binding.a
	mkdir -p $@
	@cp -rf sources/go-piper/piper-phonemize/pi/share/espeak-ng-data/. $@
|
|
|
# Collect the shared libraries from the gpt4all binding's buildllm directory.
# Each copy is best-effort (|| true): a missing extension is not an error.
backend-assets/gpt4all: sources/gpt4all sources/gpt4all/gpt4all-bindings/golang/libgpt4all.a
	mkdir -p $@
	@cp sources/gpt4all/gpt4all-bindings/golang/buildllm/*.so $@/ || true
	@cp sources/gpt4all/gpt4all-bindings/golang/buildllm/*.dylib $@/ || true
	@cp sources/gpt4all/gpt4all-bindings/golang/buildllm/*.dll $@/ || true
|
|
|
# Output directory for all gRPC backend binaries. The `protogen-go` and
# `replace` targets are brought up to date before it is created.
backend-assets/grpc: protogen-go replace
	mkdir -p $@
|
|
|
# Build the bert-embeddings gRPC backend against the go-bert.cpp sources.
# The binary is passed through $(UPX) only when UPX is non-empty.
backend-assets/grpc/bert-embeddings: sources/go-bert.cpp sources/go-bert.cpp/libgobert.a backend-assets/grpc
	CGO_LDFLAGS="$(CGO_LDFLAGS)" \
	C_INCLUDE_PATH=$(CURDIR)/sources/go-bert.cpp \
	LIBRARY_PATH=$(CURDIR)/sources/go-bert.cpp \
	$(GOCMD) build -ldflags "$(LD_FLAGS)" -tags "$(GO_TAGS)" -o $@ ./backend/go/llm/bert/
ifneq ($(UPX),)
	$(UPX) $@
endif
|
|
|
# Build the gpt4all gRPC backend against the gpt4all golang bindings.
# The binary is passed through $(UPX) only when UPX is non-empty.
backend-assets/grpc/gpt4all: sources/gpt4all sources/gpt4all/gpt4all-bindings/golang/libgpt4all.a backend-assets/gpt4all backend-assets/grpc
	CGO_LDFLAGS="$(CGO_LDFLAGS)" \
	C_INCLUDE_PATH=$(CURDIR)/sources/gpt4all/gpt4all-bindings/golang/ \
	LIBRARY_PATH=$(CURDIR)/sources/gpt4all/gpt4all-bindings/golang/ \
	$(GOCMD) build -ldflags "$(LD_FLAGS)" -tags "$(GO_TAGS)" -o $@ ./backend/go/llm/gpt4all/
ifneq ($(UPX),)
	$(UPX) $@
endif
|
|
|
# Build the huggingface gRPC backend from ./backend/go/llm/langchain/.
# The binary is passed through $(UPX) only when UPX is non-empty.
backend-assets/grpc/huggingface: backend-assets/grpc
	$(GOCMD) build -ldflags "$(LD_FLAGS)" -tags "$(GO_TAGS)" -o $@ ./backend/go/llm/langchain/
ifneq ($(UPX),)
	$(UPX) $@
endif
|
|
|
# Obtain the llama.cpp tree via the backend's own makefile, passing the
# pinned CPPLLAMA_VERSION to it as LLAMA_VERSION.
backend/cpp/llama/llama.cpp:
	LLAMA_VERSION=$(CPPLLAMA_VERSION) \
	$(MAKE) -C $(@D) $(@F)
|
|
|
# Prefix under backend/cpp/grpc that build-llama-cpp-grpc-server reads
# binaries, CMake package configs and headers from.
INSTALLED_PACKAGES=$(CURDIR)/backend/cpp/grpc/installed_packages
INSTALLED_LIB_CMAKE=$(INSTALLED_PACKAGES)/lib/cmake
# Extra CMake arguments pointing at the absl, protobuf, utf8_range and gRPC
# package configs, and at the headers, inside that prefix.
ADDED_CMAKE_ARGS=-Dabsl_DIR=$(INSTALLED_LIB_CMAKE)/absl \
				 -DProtobuf_DIR=$(INSTALLED_LIB_CMAKE)/protobuf \
				 -Dutf8_range_DIR=$(INSTALLED_LIB_CMAKE)/utf8_range \
				 -DgRPC_DIR=$(INSTALLED_LIB_CMAKE)/grpc \
				 -DCMAKE_CXX_STANDARD_INCLUDE_DIRECTORIES=$(INSTALLED_PACKAGES)/include
|
# Build the `grpc-server` target inside backend/cpp/$(VARIANT).
# VARIANT must be supplied by the caller (the llama-cpp-* rules pass it on
# the sub-make command line).
#
# When BUILD_GRPC_FOR_BACKEND_LLAMA is defined, backend/cpp/grpc is built
# first and the variant build is pointed at its installed_packages prefix
# (binaries on PATH, package configs through ADDED_CMAKE_ARGS). Otherwise
# the variant is built without those settings.
#
# Declared phony: this is a command, not a file.
.PHONY: build-llama-cpp-grpc-server
build-llama-cpp-grpc-server:
ifdef BUILD_GRPC_FOR_BACKEND_LLAMA
	$(MAKE) -C backend/cpp/grpc build
# The protobuf compiler binary is named `protoc`, so `bin/proto` pointed at
# a path that does not exist.
# NOTE(review): confirm how the variant's build consumes _PROTOBUF_PROTOC.
	_PROTOBUF_PROTOC=${INSTALLED_PACKAGES}/bin/protoc \
	_GRPC_CPP_PLUGIN_EXECUTABLE=${INSTALLED_PACKAGES}/bin/grpc_cpp_plugin \
	PATH="${INSTALLED_PACKAGES}/bin:${PATH}" \
	CMAKE_ARGS="${CMAKE_ARGS} ${ADDED_CMAKE_ARGS}" \
	LLAMA_VERSION=$(CPPLLAMA_VERSION) \
	$(MAKE) -C backend/cpp/${VARIANT} grpc-server
else
	echo "BUILD_GRPC_FOR_BACKEND_LLAMA is not defined."
	LLAMA_VERSION=$(CPPLLAMA_VERSION) $(MAKE) -C backend/cpp/${VARIANT} grpc-server
endif
|
|
|
|
|
# Default llama.cpp gRPC server: copy the llama backend to
# backend/cpp/llama-cpp, purge it, build it with the inherited CMAKE_ARGS
# (no extra flags are added here) and install the resulting grpc-server.
backend-assets/grpc/llama-cpp: backend-assets/grpc backend/cpp/llama/llama.cpp
	cp -rf backend/cpp/llama backend/cpp/llama-cpp
	$(MAKE) -C backend/cpp/llama-cpp purge
# The banner used to say "avx2" (copied from the avx2 rule); this rule
# builds the default variant, so label it accordingly.
	$(info ${GREEN}I llama-cpp build info:default${RESET})
	$(MAKE) VARIANT="llama-cpp" build-llama-cpp-grpc-server
	cp -rfv backend/cpp/llama-cpp/grpc-server $@
|
|
|
# AVX2 llama.cpp gRPC server: build a purged copy of the llama backend with
# AVX, AVX2, FMA and F16C on and AVX512 off, then install its grpc-server.
backend-assets/grpc/llama-cpp-avx2: backend-assets/grpc backend/cpp/llama/llama.cpp
	cp -rf backend/cpp/llama backend/cpp/llama-avx2
	$(MAKE) -C backend/cpp/llama-avx2 purge
	$(info ${GREEN}I llama-cpp build info:avx2${RESET})
	CMAKE_ARGS="$(CMAKE_ARGS) -DGGML_AVX=on -DGGML_AVX2=on -DGGML_AVX512=off -DGGML_FMA=on -DGGML_F16C=on" \
	$(MAKE) VARIANT="llama-avx2" build-llama-cpp-grpc-server
	cp -rfv backend/cpp/llama-avx2/grpc-server $@
|
|
|
# AVX-only llama.cpp gRPC server: build a purged copy of the llama backend
# with AVX on and AVX2, AVX512, FMA and F16C off, then install its
# grpc-server.
backend-assets/grpc/llama-cpp-avx: backend-assets/grpc backend/cpp/llama/llama.cpp
	cp -rf backend/cpp/llama backend/cpp/llama-avx
	$(MAKE) -C backend/cpp/llama-avx purge
	$(info ${GREEN}I llama-cpp build info:avx${RESET})
	CMAKE_ARGS="$(CMAKE_ARGS) -DGGML_AVX=on -DGGML_AVX2=off -DGGML_AVX512=off -DGGML_FMA=off -DGGML_F16C=off" \
	$(MAKE) VARIANT="llama-avx" build-llama-cpp-grpc-server
	cp -rfv backend/cpp/llama-avx/grpc-server $@
|
|
|
# Fallback llama.cpp gRPC server: build a purged copy of the llama backend
# with AVX, AVX2, AVX512, FMA and F16C all off, then install its
# grpc-server.
backend-assets/grpc/llama-cpp-fallback: backend-assets/grpc backend/cpp/llama/llama.cpp
	cp -rf backend/cpp/llama backend/cpp/llama-fallback
	$(MAKE) -C backend/cpp/llama-fallback purge
	$(info ${GREEN}I llama-cpp build info:fallback${RESET})
	CMAKE_ARGS="$(CMAKE_ARGS) -DGGML_AVX=off -DGGML_AVX2=off -DGGML_AVX512=off -DGGML_FMA=off -DGGML_F16C=off" \
	$(MAKE) VARIANT="llama-fallback" build-llama-cpp-grpc-server
	cp -rfv backend/cpp/llama-fallback/grpc-server $@
# For metal builds, the default.metallib produced by this variant is copied
# into the shared backend-assets/grpc/ directory next to the binaries.
ifeq ($(BUILD_TYPE),metal)
	cp backend/cpp/llama-fallback/llama.cpp/build/bin/default.metallib $(@D)/
endif
|
|
|
# CUDA llama.cpp gRPC server: build a purged copy of the llama backend with
# GGML_CUDA on, AVX on and AVX2, AVX512, FMA and F16C off, then install its
# grpc-server.
backend-assets/grpc/llama-cpp-cuda: backend-assets/grpc backend/cpp/llama/llama.cpp
	cp -rf backend/cpp/llama backend/cpp/llama-cuda
	$(MAKE) -C backend/cpp/llama-cuda purge
	$(info ${GREEN}I llama-cpp build info:cuda${RESET})
	CMAKE_ARGS="$(CMAKE_ARGS) -DGGML_AVX=on -DGGML_AVX2=off -DGGML_AVX512=off -DGGML_FMA=off -DGGML_F16C=off -DGGML_CUDA=ON" \
	$(MAKE) VARIANT="llama-cuda" build-llama-cpp-grpc-server
	cp -rfv backend/cpp/llama-cuda/grpc-server $@
|
|
|
# hipblas llama.cpp gRPC server: build a purged copy of the llama backend
# with BUILD_TYPE forced to "hipblas" in the sub-make's environment, then
# install its grpc-server.
backend-assets/grpc/llama-cpp-hipblas: backend-assets/grpc backend/cpp/llama/llama.cpp
	cp -rf backend/cpp/llama backend/cpp/llama-hipblas
	$(MAKE) -C backend/cpp/llama-hipblas purge
	$(info ${GREEN}I llama-cpp build info:hipblas${RESET})
	BUILD_TYPE="hipblas" \
	$(MAKE) VARIANT="llama-hipblas" build-llama-cpp-grpc-server
	cp -rfv backend/cpp/llama-hipblas/grpc-server $@
|
|
|
# sycl_f16 llama.cpp gRPC server: build a purged copy of the llama backend
# with BUILD_TYPE forced to "sycl_f16" in the sub-make's environment, then
# install its grpc-server.
backend-assets/grpc/llama-cpp-sycl_f16: backend-assets/grpc backend/cpp/llama/llama.cpp
	cp -rf backend/cpp/llama backend/cpp/llama-sycl_f16
	$(MAKE) -C backend/cpp/llama-sycl_f16 purge
	$(info ${GREEN}I llama-cpp build info:sycl_f16${RESET})
	BUILD_TYPE="sycl_f16" \
	$(MAKE) VARIANT="llama-sycl_f16" build-llama-cpp-grpc-server
	cp -rfv backend/cpp/llama-sycl_f16/grpc-server $@
|
|
|
# sycl_f32 llama.cpp gRPC server: build a purged copy of the llama backend
# with BUILD_TYPE forced to "sycl_f32" in the sub-make's environment, then
# install its grpc-server.
backend-assets/grpc/llama-cpp-sycl_f32: backend-assets/grpc backend/cpp/llama/llama.cpp
	cp -rf backend/cpp/llama backend/cpp/llama-sycl_f32
	$(MAKE) -C backend/cpp/llama-sycl_f32 purge
	$(info ${GREEN}I llama-cpp build info:sycl_f32${RESET})
	BUILD_TYPE="sycl_f32" \
	$(MAKE) VARIANT="llama-sycl_f32" build-llama-cpp-grpc-server
	cp -rfv backend/cpp/llama-sycl_f32/grpc-server $@
|
|
|
# RPC-enabled llama.cpp gRPC server: build a purged copy of the llama
# backend with GGML_RPC on and AVX, AVX2, AVX512, FMA and F16C off. TARGET
# asks for both the grpc-server and rpc-server targets; only grpc-server is
# installed by this rule.
backend-assets/grpc/llama-cpp-grpc: backend-assets/grpc backend/cpp/llama/llama.cpp
	cp -rf backend/cpp/llama backend/cpp/llama-grpc
	$(MAKE) -C backend/cpp/llama-grpc purge
	$(info ${GREEN}I llama-cpp build info:grpc${RESET})
	CMAKE_ARGS="$(CMAKE_ARGS) -DGGML_RPC=ON -DGGML_AVX=off -DGGML_AVX2=off -DGGML_AVX512=off -DGGML_FMA=off -DGGML_F16C=off" \
	TARGET="--target grpc-server --target rpc-server" \
	$(MAKE) VARIANT="llama-grpc" build-llama-cpp-grpc-server
	cp -rfv backend/cpp/llama-grpc/grpc-server $@
|
|
|
# Install the rpc-server binary left in the llama-grpc build tree by the
# llama-cpp-grpc rule into backend-assets/util/.
backend-assets/util/llama-cpp-rpc-server: backend-assets/grpc/llama-cpp-grpc
	mkdir -p $(@D)/
	cp -rf backend/cpp/llama-grpc/llama.cpp/build/bin/rpc-server $@
|
|
|
# Build the llama-ggml gRPC backend against the go-llama.cpp sources.
# The binary is passed through $(UPX) only when UPX is non-empty.
backend-assets/grpc/llama-ggml: sources/go-llama.cpp sources/go-llama.cpp/libbinding.a backend-assets/grpc
	CGO_LDFLAGS="$(CGO_LDFLAGS)" \
	C_INCLUDE_PATH=$(CURDIR)/sources/go-llama.cpp \
	LIBRARY_PATH=$(CURDIR)/sources/go-llama.cpp \
	$(GOCMD) build -ldflags "$(LD_FLAGS)" -tags "$(GO_TAGS)" -o $@ ./backend/go/llm/llama-ggml/
ifneq ($(UPX),)
	$(UPX) $@
endif
|
|
|
# Build the piper gRPC backend from ./backend/go/tts/ using the
# piper-specific CGO flags (PIPER_CGO_CXXFLAGS / PIPER_CGO_LDFLAGS).
# The binary is passed through $(UPX) only when UPX is non-empty.
backend-assets/grpc/piper: sources/go-piper sources/go-piper/libpiper_binding.a backend-assets/grpc backend-assets/espeak-ng-data
	CGO_CXXFLAGS="$(PIPER_CGO_CXXFLAGS)" \
	CGO_LDFLAGS="$(PIPER_CGO_LDFLAGS)" \
	LIBRARY_PATH=$(CURDIR)/sources/go-piper \
	$(GOCMD) build -ldflags "$(LD_FLAGS)" -tags "$(GO_TAGS)" -o $@ ./backend/go/tts/
ifneq ($(UPX),)
	$(UPX) $@
endif
|
|
|
# Build the rwkv gRPC backend against the go-rwkv.cpp sources.
# The binary is passed through $(UPX) only when UPX is non-empty.
backend-assets/grpc/rwkv: sources/go-rwkv.cpp sources/go-rwkv.cpp/librwkv.a backend-assets/grpc
	CGO_LDFLAGS="$(CGO_LDFLAGS)" \
	C_INCLUDE_PATH=$(CURDIR)/sources/go-rwkv.cpp \
	LIBRARY_PATH=$(CURDIR)/sources/go-rwkv.cpp \
	$(GOCMD) build -ldflags "$(LD_FLAGS)" -tags "$(GO_TAGS)" -o $@ ./backend/go/llm/rwkv
ifneq ($(UPX),)
	$(UPX) $@
endif
|
|
|
# Build the stablediffusion gRPC backend. CPATH is extended with the
# go-stable-diffusion sources and /usr/include/opencv4.
# The binary is passed through $(UPX) only when UPX is non-empty.
backend-assets/grpc/stablediffusion: sources/go-stable-diffusion sources/go-stable-diffusion/libstablediffusion.a backend-assets/grpc
	CGO_LDFLAGS="$(CGO_LDFLAGS)" \
	CPATH="$(CPATH):$(CURDIR)/sources/go-stable-diffusion/:/usr/include/opencv4" \
	LIBRARY_PATH=$(CURDIR)/sources/go-stable-diffusion/ \
	$(GOCMD) build -ldflags "$(LD_FLAGS)" -tags "$(GO_TAGS)" -o $@ ./backend/go/image/stablediffusion
ifneq ($(UPX),)
	$(UPX) $@
endif
|
|
|
# Build the tinydream gRPC backend against the go-tiny-dream sources.
# The binary is passed through $(UPX) only when UPX is non-empty.
backend-assets/grpc/tinydream: sources/go-tiny-dream sources/go-tiny-dream/libtinydream.a backend-assets/grpc
# LIBRARY_PATH must point at sources/go-tiny-dream, where the prerequisite
# libtinydream.a lives; it previously pointed at $(CURDIR)/go-tiny-dream,
# unlike this rule's own prerequisites and every sibling backend rule.
	CGO_LDFLAGS="$(CGO_LDFLAGS)" LIBRARY_PATH=$(CURDIR)/sources/go-tiny-dream \
	$(GOCMD) build -ldflags "$(LD_FLAGS)" -tags "$(GO_TAGS)" -o backend-assets/grpc/tinydream ./backend/go/image/tinydream
ifneq ($(UPX),)
	$(UPX) backend-assets/grpc/tinydream
endif
|
|
|
# Build the whisper gRPC backend from ./backend/go/transcribe/. The
# whisper-specific CGO_LDFLAGS_WHISPER are appended to the linker flags and
# both whisper.cpp include directories go on C_INCLUDE_PATH.
# The binary is passed through $(UPX) only when UPX is non-empty.
backend-assets/grpc/whisper: sources/whisper.cpp sources/whisper.cpp/libwhisper.a backend-assets/grpc
	CGO_LDFLAGS="$(CGO_LDFLAGS) $(CGO_LDFLAGS_WHISPER)" \
	C_INCLUDE_PATH="$(CURDIR)/sources/whisper.cpp/include:$(CURDIR)/sources/whisper.cpp/ggml/include" \
	LIBRARY_PATH=$(CURDIR)/sources/whisper.cpp \
	$(GOCMD) build -ldflags "$(LD_FLAGS)" -tags "$(GO_TAGS)" -o $@ ./backend/go/transcribe/
ifneq ($(UPX),)
	$(UPX) $@
endif
|
|
|
# Build the local-store gRPC backend from ./backend/go/stores/.
# The binary is passed through $(UPX) only when UPX is non-empty.
backend-assets/grpc/local-store: backend-assets/grpc
	$(GOCMD) build -ldflags "$(LD_FLAGS)" -tags "$(GO_TAGS)" -o $@ ./backend/go/stores/
ifneq ($(UPX),)
	$(UPX) $@
endif
|
|
|
# Aggregate target: run `prepare`, then build every backend listed in
# GRPC_BACKENDS. It has no recipe of its own and names no file, so it is
# declared phony.
.PHONY: grpcs
grpcs: prepare $(GRPC_BACKENDS)
|
|
|
# Defaults for the docker-* targets; each can be overridden from the
# environment or the command line.
# Tag used by the `docker`, `docker-cuda11` and `docker-image-intel*` targets.
DOCKER_IMAGE?=local-ai
# Tag used by the `docker-aio` target.
DOCKER_AIO_IMAGE?=local-ai-aio
# Forwarded to the image build as the IMAGE_TYPE build argument.
IMAGE_TYPE?=core
# Forwarded to the image build as the BASE_IMAGE build argument.
BASE_IMAGE?=ubuntu:22.04
|
|
|
# Build the container image tagged $(DOCKER_IMAGE) from the current
# directory, forwarding BASE_IMAGE, IMAGE_TYPE, GO_TAGS, BUILD_TYPE and
# DOCKER_MAKEFLAGS (as MAKEFLAGS) as build arguments.
# Declared phony: a file or directory named `docker` must not suppress it.
.PHONY: docker
docker:
	docker build \
		--build-arg BASE_IMAGE=$(BASE_IMAGE) \
		--build-arg IMAGE_TYPE=$(IMAGE_TYPE) \
		--build-arg GO_TAGS="$(GO_TAGS)" \
		--build-arg MAKEFLAGS="$(DOCKER_MAKEFLAGS)" \
		--build-arg BUILD_TYPE=$(BUILD_TYPE) \
		-t $(DOCKER_IMAGE) .
|
|
|
# Build the container image tagged $(DOCKER_IMAGE)-cuda11: the same build
# arguments as `docker`, plus CUDA_MAJOR_VERSION=11 and
# CUDA_MINOR_VERSION=8.
# Declared phony because it names a command, not a file.
.PHONY: docker-cuda11
docker-cuda11:
	docker build \
		--build-arg CUDA_MAJOR_VERSION=11 \
		--build-arg CUDA_MINOR_VERSION=8 \
		--build-arg BASE_IMAGE=$(BASE_IMAGE) \
		--build-arg IMAGE_TYPE=$(IMAGE_TYPE) \
		--build-arg GO_TAGS="$(GO_TAGS)" \
		--build-arg MAKEFLAGS="$(DOCKER_MAKEFLAGS)" \
		--build-arg BUILD_TYPE=$(BUILD_TYPE) \
		-t $(DOCKER_IMAGE)-cuda11 .
|
|
|
# Build the all-in-one image tagged $(DOCKER_AIO_IMAGE) from Dockerfile.aio,
# forwarding BASE_IMAGE and DOCKER_MAKEFLAGS (as MAKEFLAGS) as build
# arguments.
# Declared phony because it names a command, not a file.
.PHONY: docker-aio
docker-aio:
	@echo "Building AIO image with base $(BASE_IMAGE) as $(DOCKER_AIO_IMAGE)"
	docker build \
		--build-arg BASE_IMAGE=$(BASE_IMAGE) \
		--build-arg MAKEFLAGS="$(DOCKER_MAKEFLAGS)" \
		-t $(DOCKER_AIO_IMAGE) -f Dockerfile.aio .
|
|
|
# Build the AIO image through the `docker-aio` target.
# The recipe used to run the exact same command twice
# (`docker-aio DOCKER_AIO_SIZE=cpu`); the verbatim duplicate was dropped.
# NOTE(review): the second invocation was presumably meant for a different
# DOCKER_AIO_SIZE, and the visible `docker-aio` recipe does not read
# DOCKER_AIO_SIZE at all -- confirm the intended set of variants.
.PHONY: docker-aio-all
docker-aio-all:
	$(MAKE) docker-aio DOCKER_AIO_SIZE=cpu
|
|
|
# Build the image tagged $(DOCKER_IMAGE) on the Intel oneAPI basekit base
# image with BUILD_TYPE=sycl_f32 and GO_TAGS="none".
# Declared phony because it names a command, not a file.
.PHONY: docker-image-intel
docker-image-intel:
	docker build \
		--build-arg BASE_IMAGE=intel/oneapi-basekit:2024.2.0-devel-ubuntu22.04 \
		--build-arg IMAGE_TYPE=$(IMAGE_TYPE) \
		--build-arg GO_TAGS="none" \
		--build-arg MAKEFLAGS="$(DOCKER_MAKEFLAGS)" \
		--build-arg BUILD_TYPE=sycl_f32 -t $(DOCKER_IMAGE) .
|
|
|
# Build the image tagged $(DOCKER_IMAGE) on the Intel oneAPI basekit base
# image with BUILD_TYPE=sycl_f32 and GO_TAGS="none".
# NOTE(review): this recipe is identical to `docker-image-intel`, including
# the output tag -- confirm whether the xpu variant should differ.
# Declared phony because it names a command, not a file.
.PHONY: docker-image-intel-xpu
docker-image-intel-xpu:
	docker build \
		--build-arg BASE_IMAGE=intel/oneapi-basekit:2024.2.0-devel-ubuntu22.04 \
		--build-arg IMAGE_TYPE=$(IMAGE_TYPE) \
		--build-arg GO_TAGS="none" \
		--build-arg MAKEFLAGS="$(DOCKER_MAKEFLAGS)" \
		--build-arg BUILD_TYPE=sycl_f32 -t $(DOCKER_IMAGE) .
|
|
|
# Run `swag init` on core/http/app.go, writing its output into the
# `swagger` directory.
.PHONY: swagger
swagger:
	swag init -g core/http/app.go --output $@
|
|
|
# Run the dependencies manager program, passing it
# embedded/webui_static.yaml and core/http/static/assets as arguments.
.PHONY: gen-assets
gen-assets:
	$(GOCMD) run core/dependencies_manager/manager.go \
		embedded/webui_static.yaml \
		core/http/static/assets
|
|
|
|
|
# Create the docs/layouts/_default directory that the docs targets depend on.
docs/layouts/_default:
	mkdir -p $@
|
|
|
# Generate the gallery page by running .github/ci/modelslist.go on
# gallery/index.yaml and redirecting its stdout into the target file.
docs/static/gallery.html: docs/layouts/_default
	$(GOCMD) run ./.github/ci/modelslist.go ./gallery/index.yaml > $@
|
|
|
# Produce the minified site by running `hugo --minify` inside docs/, once
# the layouts directory and the generated gallery page exist.
docs/public: docs/layouts/_default docs/static/gallery.html
	cd docs && hugo --minify
|
|
|
# Remove the generated documentation artefacts: the docs/public directory
# and the generated gallery page.
# Declared phony so a file named `docs-clean` can never block the cleanup.
.PHONY: docs-clean
docs-clean:
	rm -rf docs/public
	rm -rf docs/static/gallery.html
|
|
|
# Run `hugo serve` inside docs/ after regenerating the gallery page. Phony,
# because `docs` is also the name of an existing directory.
.PHONY: docs
docs: docs/static/gallery.html
	cd $@ && hugo serve
|
|