# Forked from wylab/llama-swap, commit bc01e6f539:
#   "Add sd-server from stable-diffusion.cpp docker image for vulkan and musa
#   containers. closes #450"
# Original file as committed: 33 lines, 809 B, YAML.
# Example llama-swap configuration: two llama-server text models and one
# sd-server image model.
#
# Global settings.
# NOTE(review): units and exact semantics of these three keys are not visible
# in this file — confirm against the llama-swap configuration reference.
healthCheckTimeout: 300
logRequests: true
metricsMaxInMemory: 1000

models:
  # Every entry below starts its server on port 9999 and is proxied at
  # 127.0.0.1:9999. Presumably only one of them runs at a time — confirm
  # before loading models concurrently, since they would collide on the port.
  "qwen2.5":
    proxy: "http://127.0.0.1:9999"
    cmd: >
      /app/llama-server
      -hf bartowski/Qwen2.5-0.5B-Instruct-GGUF:Q4_K_M
      --port 9999

  "smollm2":
    proxy: "http://127.0.0.1:9999"
    cmd: >
      /app/llama-server
      -hf bartowski/SmolLM2-135M-Instruct-GGUF:Q4_K_M
      --port 9999

  z-image:
    # sd-server is started with `--listen-port 9999` below, so route requests
    # to that same port explicitly, matching the other model entries.
    # NOTE(review): without this key the upstream URL comes from llama-swap's
    # default, which may not point at 9999 — confirm.
    proxy: "http://127.0.0.1:9999"
    checkEndpoint: /
    cmd: |
      /app/sd-server
      --listen-port 9999
      --diffusion-fa
      --diffusion-model /models/z_image_turbo-Q8_0.gguf
      --vae /models/ae.safetensors
      --llm /models/qwen3-4b-instruct-2507-q8_0.gguf
      --offload-to-cpu
      --cfg-scale 1.0
      --height 512 --width 512
      --steps 8
    # Additional model names that resolve to this entry.
    aliases:
      - gpt-image-1
      - dall-e-2
      - dall-e-3
      - gpt-image-1-mini
      - gpt-image-1.5