|
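1 | 1 | # Disable parallel execution for backend builds. NOTE: listing targets as prerequisites of .NOTPARALLEL (serializing only the prerequisites of those targets) requires GNU Make >= 4.4; older versions ignore the list and run the whole makefile serially. |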
2 | | -.NOTPARALLEL: backends/diffusers backends/llama-cpp backends/turboquant backends/outetts backends/piper backends/stablediffusion-ggml backends/whisper backends/faster-whisper backends/silero-vad backends/local-store backends/huggingface backends/rfdetr backends/kitten-tts backends/kokoro backends/chatterbox backends/llama-cpp-darwin backends/neutts build-darwin-python-backend build-darwin-go-backend backends/mlx backends/diffuser-darwin backends/mlx-vlm backends/mlx-audio backends/mlx-distributed backends/stablediffusion-ggml-darwin backends/vllm backends/vllm-omni backends/moonshine backends/pocket-tts backends/qwen-tts backends/faster-qwen3-tts backends/qwen-asr backends/nemo backends/voxcpm backends/whisperx backends/ace-step backends/acestep-cpp backends/fish-speech backends/voxtral backends/opus backends/trl backends/llama-cpp-quantization backends/kokoros backends/sam3-cpp backends/qwen3-tts-cpp backends/tinygrad |
| 2 | +.NOTPARALLEL: backends/diffusers backends/llama-cpp backends/turboquant backends/outetts backends/piper backends/stablediffusion-ggml backends/whisper backends/faster-whisper backends/silero-vad backends/local-store backends/huggingface backends/rfdetr backends/kitten-tts backends/kokoro backends/chatterbox backends/llama-cpp-darwin backends/neutts build-darwin-python-backend build-darwin-go-backend backends/mlx backends/diffuser-darwin backends/mlx-vlm backends/mlx-audio backends/mlx-distributed backends/stablediffusion-ggml-darwin backends/vllm backends/vllm-omni backends/sglang backends/moonshine backends/pocket-tts backends/qwen-tts backends/faster-qwen3-tts backends/qwen-asr backends/nemo backends/voxcpm backends/whisperx backends/ace-step backends/acestep-cpp backends/fish-speech backends/voxtral backends/opus backends/trl backends/llama-cpp-quantization backends/kokoros backends/sam3-cpp backends/qwen3-tts-cpp backends/tinygrad |
3 | 3 |
|
4 | 4 | GOCMD=go |
5 | 5 | GOTEST=$(GOCMD) test |
@@ -419,6 +419,7 @@ prepare-test-extra: protogen-python |
419 | 419 | $(MAKE) -C backend/python/chatterbox |
420 | 420 | $(MAKE) -C backend/python/vllm |
421 | 421 | $(MAKE) -C backend/python/vllm-omni |
| 422 | + $(MAKE) -C backend/python/sglang |
422 | 423 | $(MAKE) -C backend/python/vibevoice |
423 | 424 | $(MAKE) -C backend/python/moonshine |
424 | 425 | $(MAKE) -C backend/python/pocket-tts |
@@ -602,6 +603,17 @@ test-extra-backend-tinygrad-all: \ |
602 | 603 | test-extra-backend-tinygrad-sd \ |
603 | 604 | test-extra-backend-tinygrad-whisper |
604 | 605 |
|
| 606 | +## test-extra-backend-sglang: depends on docker-build-sglang, then re-invokes $(MAKE) test-extra-backend with BACKEND_IMAGE=local-ai-backend:sglang. sglang mirrors the vllm setup: HuggingFace model id, same tiny Qwen (Qwen/Qwen2.5-0.5B-Instruct), |
| 607 | +## tool-call extraction via sglang's native qwen parser (passed as BACKEND_TEST_OPTIONS=tool_parser:qwen); BACKEND_TEST_CAPS presumably selects which checks the shared suite runs - confirm against test-extra-backend. CPU builds use |
| 608 | +## sglang's upstream pyproject_cpu.toml recipe (see backend/python/sglang/install.sh). |
| 609 | +test-extra-backend-sglang: docker-build-sglang |
| 610 | + BACKEND_IMAGE=local-ai-backend:sglang \ |
| 611 | + BACKEND_TEST_MODEL_NAME=Qwen/Qwen2.5-0.5B-Instruct \ |
| 612 | + BACKEND_TEST_CAPS=health,load,predict,stream,tools \ |
| 613 | + BACKEND_TEST_OPTIONS=tool_parser:qwen \ |
| 614 | + $(MAKE) test-extra-backend |
| 615 | + |
| 616 | + |
605 | 617 | ## mlx is Apple-Silicon-first — the MLX backend auto-detects the right tool |
606 | 618 | ## parser from the chat template, so no tool_parser: option is needed (it |
607 | 619 | ## would be ignored at runtime). Run this on macOS / arm64 with Metal; the |
@@ -741,6 +753,7 @@ BACKEND_NEUTTS = neutts|python|.|false|true |
741 | 753 | BACKEND_KOKORO = kokoro|python|.|false|true |
742 | 754 | BACKEND_VLLM = vllm|python|.|false|true |
743 | 755 | BACKEND_VLLM_OMNI = vllm-omni|python|.|false|true |
| 756 | +BACKEND_SGLANG = sglang|python|.|false|true |
744 | 757 | BACKEND_DIFFUSERS = diffusers|python|.|--progress=plain|true |
745 | 758 | BACKEND_CHATTERBOX = chatterbox|python|.|false|true |
746 | 759 | BACKEND_VIBEVOICE = vibevoice|python|.|--progress=plain|true |
@@ -811,6 +824,7 @@ $(eval $(call generate-docker-build-target,$(BACKEND_NEUTTS))) |
811 | 824 | $(eval $(call generate-docker-build-target,$(BACKEND_KOKORO))) |
812 | 825 | $(eval $(call generate-docker-build-target,$(BACKEND_VLLM))) |
813 | 826 | $(eval $(call generate-docker-build-target,$(BACKEND_VLLM_OMNI))) |
| 827 | +$(eval $(call generate-docker-build-target,$(BACKEND_SGLANG))) |
814 | 828 | $(eval $(call generate-docker-build-target,$(BACKEND_DIFFUSERS))) |
815 | 829 | $(eval $(call generate-docker-build-target,$(BACKEND_CHATTERBOX))) |
816 | 830 | $(eval $(call generate-docker-build-target,$(BACKEND_VIBEVOICE))) |
@@ -839,7 +853,7 @@ $(eval $(call generate-docker-build-target,$(BACKEND_SAM3_CPP))) |
839 | 853 | docker-save-%: backend-images |
840 | 854 | docker save local-ai-backend:$* -o backend-images/$*.tar |
841 | 855 |
|
842 | | -docker-build-backends: docker-build-llama-cpp docker-build-ik-llama-cpp docker-build-turboquant docker-build-rerankers docker-build-vllm docker-build-vllm-omni docker-build-transformers docker-build-outetts docker-build-diffusers docker-build-kokoro docker-build-faster-whisper docker-build-coqui docker-build-chatterbox docker-build-vibevoice docker-build-moonshine docker-build-pocket-tts docker-build-qwen-tts docker-build-fish-speech docker-build-faster-qwen3-tts docker-build-qwen-asr docker-build-nemo docker-build-voxcpm docker-build-whisperx docker-build-ace-step docker-build-acestep-cpp docker-build-voxtral docker-build-mlx-distributed docker-build-trl docker-build-llama-cpp-quantization docker-build-tinygrad docker-build-kokoros docker-build-sam3-cpp docker-build-qwen3-tts-cpp |
| 856 | +docker-build-backends: docker-build-llama-cpp docker-build-ik-llama-cpp docker-build-turboquant docker-build-rerankers docker-build-vllm docker-build-vllm-omni docker-build-sglang docker-build-transformers docker-build-outetts docker-build-diffusers docker-build-kokoro docker-build-faster-whisper docker-build-coqui docker-build-chatterbox docker-build-vibevoice docker-build-moonshine docker-build-pocket-tts docker-build-qwen-tts docker-build-fish-speech docker-build-faster-qwen3-tts docker-build-qwen-asr docker-build-nemo docker-build-voxcpm docker-build-whisperx docker-build-ace-step docker-build-acestep-cpp docker-build-voxtral docker-build-mlx-distributed docker-build-trl docker-build-llama-cpp-quantization docker-build-tinygrad docker-build-kokoros docker-build-sam3-cpp docker-build-qwen3-tts-cpp |
843 | 857 |
|
844 | 858 | ######################################################## |
845 | 859 | ### Mock Backend for E2E Tests |
|
0 commit comments