added qwable and ornith
This commit is contained in:
@@ -436,6 +436,7 @@ for svc in (
|
||||
"kimi-linear",
|
||||
"qwen3-235b",
|
||||
"qwable",
|
||||
"ornith",
|
||||
"litellm",
|
||||
"comfyui",
|
||||
"openwebui",
|
||||
@@ -726,6 +727,23 @@ for asset, mode in (
|
||||
_sudo=True,
|
||||
)
|
||||
|
||||
# Ornith operator assets. Same image as llama (kyuz0 rocm-7.2.2); MoE
|
||||
# 35B-A3B agentic-coding fine-tune of Qwen3.5. Weights live at
|
||||
# /models/qwen/Ornith-1.0-35B via manual `hf download` per the README.
|
||||
# swap-model `ornith` target.
|
||||
# Upload every Ornith operator asset into the ornith compose directory.
# Each entry maps the asset's filename to the permission mode it is
# installed with; insertion order is the upload order.
for asset, mode in {
    "smoke.sh": "0775",
    "README.md": "0664",
}.items():
    files.put(
        name=f"ornith: {asset}",
        dest=f"{COMPOSE_DIR}/ornith/{asset}",
        src=f"compose/ornith/{asset}",
        mode=mode,
        group="docker",
        _sudo=True,
    )
|
||||
|
||||
# LiteLLM router assets. config.yaml is the source-of-truth model
|
||||
# routing table — pyinfra syncs it on every run; edits on the box get
|
||||
# overwritten. The .env file holds LITELLM_MASTER_KEY + LITELLM_SALT_KEY
|
||||
|
||||
Reference in New Issue
Block a user