Compare commits

..

3 Commits

Author SHA1 Message Date
69da2b8c5b fix: fix bugs for initContainer in LWS 2025-12-02 16:37:57 +08:00
4e9a086547 Update values.schema.json to add numerous new model names for enhanced support
All checks were successful
Publish Helm Charts / helm-publish (push) Successful in 7s
2025-12-02 08:35:12 +00:00
5aebfc5cdf Update vllm-serve/templates/single.yaml
All checks were successful
Publish Helm Charts / helm-publish (push) Successful in 7s
2025-12-02 07:55:47 +00:00
3 changed files with 138 additions and 3 deletions

View File

@@ -50,7 +50,7 @@ spec:
exit 0
fi
echo "⬇️ Starting download..."
-apk add --no-cache bash aria2 wget ca-certificates
+apk add --no-cache bash aria2 wget ca-certificates curl
wget https://hf-mirror.com/hfd/hfd.sh -O hfd.sh && chmod +x hfd.sh
./hfd.sh {{ .Values.model.huggingfaceName }} --tool aria2c -x 8 --local-dir "$DEST_DIR"

View File

@@ -51,7 +51,7 @@ spec:
exit 0
fi
echo "⬇️ Starting download..."
-apk add --no-cache bash aria2 wget ca-certificates
+apk add --no-cache bash aria2 wget ca-certificates curl
wget https://hf-mirror.com/hfd/hfd.sh -O hfd.sh && chmod +x hfd.sh
./hfd.sh {{ .Values.model.huggingfaceName }} --tool aria2c -x 8 --local-dir "$DEST_DIR"

View File

@@ -440,7 +440,142 @@
"tencent/DRIVE-RL",
"tencent/DRIVE-SFT",
"Qwen/Qwen2.5-14B",
-"BAAI/bge-base-zh-v1.5"
+"BAAI/bge-base-zh-v1.5",
+"01-ai/Yi-1.5-34B",
+"01-ai/Yi-1.5-6B",
+"01-ai/Yi-1.5-9B",
+"01-ai/Yi-34B-Chat",
+"ByteDance/Dolphin-1.5",
+"ByteDance/Ouro-1.4B",
+"ByteDance/Ouro-1.4B-Thinking",
+"ByteDance/Ouro-2.6B",
+"ByteDance/Ouro-2.6B-Thinking",
+"OpenGVLab/InternVL3-38B",
+"OpenGVLab/InternVL3-78B",
+"OpenGVLab/InternVL3_5-1B",
+"OpenGVLab/InternVL3_5-30B-A3B-Instruct",
+"OpenGVLab/InternVL3_5-38B",
+"OpenGVLab/InternVL3_5-8B",
+"OpenGVLab/InternVL3_5-GPT-OSS-20B-A4B-Preview",
+"OpenGVLab/Mini-InternVL2-2B-DA-Medical",
+"OpenGVLab/SDLM-32B-D4",
+"Qwen/CodeQwen1.5-7B-Chat",
+"Qwen/Qwen1.5-1.8B",
+"Qwen/Qwen1.5-MoE-A2.7B-Chat-GPTQ-Int4",
+"Qwen/Qwen2-0.5B",
+"Qwen/Qwen2-Math-72B-Instruct",
+"Qwen/Qwen2.5-0.5B",
+"Qwen/Qwen2.5-1.5B",
+"Qwen/Qwen2.5-1.5B-Instruct",
+"Qwen/Qwen2.5-1.5B-Instruct-GGUF",
+"Qwen/Qwen2.5-14B-Instruct",
+"Qwen/Qwen2.5-14B-Instruct-1M",
+"Qwen/Qwen2.5-32B-Instruct",
+"Qwen/Qwen2.5-32B-Instruct-AWQ",
+"Qwen/Qwen2.5-32B-Instruct-GPTQ-Int4",
+"Qwen/Qwen2.5-3B-Instruct",
+"Qwen/Qwen2.5-3B-Instruct-GGUF",
+"Qwen/Qwen2.5-72B-Instruct",
+"Qwen/Qwen2.5-7B",
+"Qwen/Qwen2.5-7B-Instruct",
+"Qwen/Qwen2.5-7B-Instruct-1M",
+"Qwen/Qwen2.5-7B-Instruct-GGUF",
+"Qwen/Qwen2.5-Coder-0.5B",
+"Qwen/Qwen2.5-Coder-1.5B",
+"Qwen/Qwen2.5-Coder-1.5B-Instruct",
+"Qwen/Qwen2.5-Coder-14B-Instruct",
+"Qwen/Qwen2.5-Coder-32B-Instruct",
+"Qwen/Qwen2.5-Coder-3B-Instruct-GGUF",
+"Qwen/Qwen2.5-Coder-7B-Instruct",
+"Qwen/Qwen2.5-Coder-7B-Instruct-GGUF",
+"Qwen/Qwen2.5-Math-72B",
+"Qwen/Qwen2.5-Math-7B",
+"Qwen/Qwen2.5-VL-32B-Instruct",
+"Qwen/Qwen2.5-VL-72B-Instruct-AWQ",
+"Qwen/Qwen2.5-VL-7B-Instruct",
+"Qwen/Qwen3-0.6B",
+"Qwen/Qwen3-0.6B-Base",
+"Qwen/Qwen3-1.7B",
+"Qwen/Qwen3-1.7B-FP8",
+"Qwen/Qwen3-14B-FP8",
+"Qwen/Qwen3-14B-GGUF",
+"Qwen/Qwen3-30B-A3B-Base",
+"Qwen/Qwen3-30B-A3B-Thinking-2507-FP8",
+"Qwen/Qwen3-Next-80B-A3B-Thinking-FP8",
+"Qwen/Qwen3-VL-4B-Instruct-FP8",
+"baichuan-inc/Baichuan-M2-32B-GPTQ-Int4",
+"baidu/ERNIE-4.5-0.3B-Base-PT",
+"baidu/ERNIE-4.5-21B-A3B-Base-PT",
+"baidu/ERNIE-4.5-VL-28B-A3B-Base-PT",
+"baidu/ERNIE-4.5-VL-28B-A3B-Thinking",
+"baidu/ERNIE-4.5-VL-424B-A47B-Base-PT",
+"deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B",
+"deepseek-ai/DeepSeek-V3.1-Terminus",
+"deepseek-ai/DeepSeek-V3.2-Exp",
+"deepseek-ai/deepseek-coder-1.3b-base",
+"deepseek-ai/deepseek-coder-1.3b-instruct",
+"deepseek-ai/deepseek-coder-6.7b-instruct",
+"google/codegemma-1.1-2b-GGUF",
+"google/gemma-3-27b-pt",
+"google/paligemma2-28b-pt-896",
+"google/reformer-crime-and-punishment",
+"google/reformer-enwik8",
+"google/t5-11b-ssm-nq",
+"google/t5-3b-ssm-nq",
+"google/t5-large-ssm-nq",
+"google/t5-small-ssm-nq",
+"google/t5-xl-ssm-nq",
+"google/t5-xxl-ssm-nq",
+"google/t5gemma-ml-ml-ul2-it",
+"internlm/Spatial-SSRL-7B",
+"llava-hf/llava-1.5-13b-hf",
+"llava-hf/llava-v1.6-34b-hf",
+"meta-llama/Llama-3.1-405B",
+"meta-llama/Llama-3.1-405B-Instruct",
+"meta-llama/Llama-3.1-70B",
+"meta-llama/Llama-3.1-70B-Instruct",
+"meta-llama/Llama-3.1-8B",
+"meta-llama/Llama-3.1-8B-Instruct",
+"meta-llama/Llama-3.2-11B-Vision-Instruct",
+"meta-llama/Llama-3.2-1B",
+"meta-llama/Llama-3.2-1B-Instruct",
+"meta-llama/Llama-3.2-3B",
+"meta-llama/Llama-3.2-3B-Instruct",
+"meta-llama/Llama-3.2-90B-Vision",
+"meta-llama/Llama-3.2-90B-Vision-Instruct",
+"meta-llama/Llama-3.3-70B-Instruct",
+"microsoft/MediPhi-Instruct",
+"microsoft/Phi-3-medium-4k-instruct-onnx-cpu",
+"microsoft/Phi-3.5-mini-instruct",
+"microsoft/bitnet-b1.58-2B-4T",
+"microsoft/bitnet-b1.58-2B-4T-gguf",
+"microsoft/kosmos-2.5",
+"microsoft/kosmos-2.5-chat",
+"microsoft/llava-med-v1.5-mistral-7b",
+"mistralai/Mistral-7B-Instruct-v0.2",
+"moonshotai/Kimi-Dev-72B",
+"moonshotai/Kimi-K2-Base",
+"moonshotai/Kimi-K2-Instruct",
+"moonshotai/Kimi-K2-Instruct-0905",
+"moonshotai/Kimi-K2-Thinking",
+"moonshotai/Kimi-Linear-48B-A3B-Base",
+"moonshotai/Kimi-Linear-48B-A3B-Instruct",
+"moonshotai/Moonlight-16B-A3B",
+"openbmb/MiniCPM4.1-8B",
+"tencent/DeepSeek-V3.1-Terminus-W4AFP8",
+"tencent/Hunyuan-0.5B-Pretrain",
+"zai-org/GLM-4-9B-0414",
+"zai-org/GLM-4.1V-9B-Base",
+"zai-org/GLM-4.5-Air",
+"zai-org/GLM-4.5V-FP8",
+"zai-org/GLM-4.6",
+"zai-org/GLM-4.6-FP8",
+"zai-org/GLM-Z1-32B-0414",
+"zai-org/GLM-Z1-9B-0414",
+"zai-org/Glyph",
+"zai-org/UI2Code_N",
+"zai-org/WebVIA-Agent",
+"zai-org/codegeex4-all-9b"
]
}
},