diff --git a/vllm-serve/values.schema.json b/vllm-serve/values.schema.json index c9d337c..b553aa0 100644 --- a/vllm-serve/values.schema.json +++ b/vllm-serve/values.schema.json @@ -295,11 +295,158 @@ "omni-search/Tarsier-7b", "omni-search/Tarsier-34b", "omni-research/Tarsier2-Recap-7b", - "omni-research/Tarsier2-7b-0115" + "omni-research/Tarsier2-7b-0115", + "ByteDance/Dolphin", + "ByteDance/Sa2VA-1B", + "ByteDance/Sa2VA-4B", + "ByteDance/Sa2VA-InternVL3-8B", + "ByteDance/Sa2VA-Qwen3-VL-4B", + "HuggingFaceH4/zephyr-7b-alpha", + "HuggingFaceH4/zephyr-7b-beta", + "Qwen/QwQ-32B", + "Qwen/QwQ-32B-AWQ", + "Qwen/QwQ-32B-GGUF", + "Qwen/Qwen-1_8B-Chat", + "Qwen/Qwen-Audio", + "Qwen/Qwen-Audio-Chat", + "Qwen/Qwen2-VL-2B-Instruct", + "Qwen/Qwen2-VL-2B-Instruct-GPTQ-Int4", + "Qwen/Qwen2-VL-2B-Instruct-GPTQ-Int8", + "Qwen/Qwen3-14B", + "Qwen/Qwen3-14B-AWQ", + "Qwen/Qwen3-14B-Base", + "Qwen/Qwen3-235B-A22B", + "Qwen/Qwen3-235B-A22B-Instruct-2507", + "Qwen/Qwen3-235B-A22B-Instruct-2507-FP8", + "Qwen/Qwen3-235B-A22B-Thinking-2507", + "Qwen/Qwen3-30B-A3B-Instruct-2507", + "Qwen/Qwen3-30B-A3B-Thinking-2507", + "Qwen/Qwen3-32B", + "Qwen/Qwen3-32B-FP8", + "Qwen/Qwen3-32B-GGUF", + "Qwen/Qwen3-4B", + "Qwen/Qwen3-4B-Base", + "Qwen/Qwen3-4B-FP8", + "Qwen/Qwen3-4B-GGUF", + "Qwen/Qwen3-4B-Instruct-2507", + "Qwen/Qwen3-4B-Instruct-2507-FP8", + "Qwen/Qwen3-4B-SafeRL", + "Qwen/Qwen3-4B-Thinking-2507", + "Qwen/Qwen3-4B-Thinking-2507-FP8", + "Qwen/Qwen3-8B-AWQ", + "Qwen/Qwen3-8B-Base", + "Qwen/Qwen3-8B-FP8", + "Qwen/Qwen3-8B-GGUF", + "Qwen/Qwen3-Coder-30B-A3B-Instruct", + "Qwen/Qwen3-Coder-30B-A3B-Instruct-FP8", + "Qwen/Qwen3-Coder-480B-A35B-Instruct", + "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8", + "Qwen/Qwen3-Next-80B-A3B-Instruct-FP8", + "Qwen/Qwen3-Next-80B-A3B-Thinking", + "Qwen/Qwen3-VL-2B-Instruct", + "Qwen/Qwen3-VL-2B-Instruct-FP8", + "Qwen/Qwen3-VL-2B-Instruct-GGUF", + "Qwen/Qwen3-VL-2B-Thinking", + "Qwen/Qwen3-VL-2B-Thinking-GGUF", + "Qwen/Qwen3-VL-30B-A3B-Instruct-GGUF", + "Qwen/Qwen3-VL-32B-Instruct", + "Qwen/Qwen3-VL-32B-Instruct-FP8", + "Qwen/Qwen3-VL-32B-Instruct-GGUF", + "Qwen/Qwen3-VL-32B-Thinking", + "Qwen/Qwen3-VL-4B-Instruct-GGUF", + "Qwen/Qwen3-VL-4B-Thinking", + "Qwen/Qwen3-VL-8B-Instruct", + "Qwen/Qwen3-VL-8B-Instruct-GGUF", + "Qwen/Qwen3-VL-8B-Thinking-GGUF", + "Qwen/Qwen3Guard-Gen-4B", + "Qwen/Qwen3Guard-Gen-8B", + "Skywork/Skywork-SWE-32B", + "baichuan-inc/Baichuan-M2-32B", + "deepseek-ai/DeepSeek-Coder-V2-Instruct", + "deepseek-ai/DeepSeek-Coder-V2-Lite-Base", + "deepseek-ai/DeepSeek-Coder-V2-Lite-Instruct", + "deepseek-ai/DeepSeek-Prover-V2-671B", + "deepseek-ai/DeepSeek-R1-0528", + "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B", + "deepseek-ai/DeepSeek-R1-Distill-Llama-70B", + "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", + "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", + "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B", + "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B", + "deepseek-ai/DeepSeek-V2-Lite-Chat", + "deepseek-ai/DeepSeek-V3-0324", + "deepseek-ai/deepseek-llm-67b-chat", + "deepseek-ai/deepseek-llm-7b-base", + "deepseek-ai/deepseek-moe-16b-base", + "deepseek-ai/deepseek-vl-7b-chat", + "google/datagemma-rag-27b-it", + "google/gemma-2-27b-it", + "google/gemma-2-2b", + "google/gemma-2-2b-it", + "google/gemma-2-9b-it", + "google/gemma-2b-it", + "google/gemma-3-12b-it", + "google/gemma-3-12b-it-qat-q4_0-gguf", + "google/gemma-3-12b-pt", + "google/gemma-3-1b-it-qat-int4-unquantized", + "google/gemma-3-1b-it-qat-q4_0-gguf", + "google/gemma-3-1b-pt", + "google/gemma-3-270m", + "google/gemma-3-270m-it", + "google/gemma-3-4b-it-qat-q4_0-gguf", + "google/gemma-3-4b-pt", + "google/gemma-3n-E2B", + "google/gemma-3n-E4B", + "google/gemma-7b", + "google/gemma-7b-it", + "google/medgemma-27b-it", + "google/medgemma-27b-text-it", + "google/medgemma-4b-it", + "google/medgemma-4b-pt", + "google/paligemma2-3b-mix-224", + "google/paligemma2-3b-mix-448", + "google/shieldgemma-2-4b-it", + "google/shieldgemma-2b", + "google/txgemma-2b-predict", + "google/vaultgemma-1b", + "meta-llama/CodeLlama-70b-hf", + "meta-llama/Llama-2-13b-hf", + "meta-llama/Llama-2-70b-chat-hf", + "meta-llama/Llama-2-7b-chat-hf", + "meta-llama/Llama-2-7b-hf", + "meta-llama/Llama-4-Scout-17B-16E", + "meta-llama/Llama-Guard-3-8B", + "meta-llama/Llama-Guard-4-12B", + "meta-llama/Meta-Llama-3-8B", + "meta-llama/Meta-Llama-3-8B-Instruct", + "meta-llama/Meta-Llama-Guard-2-8B", + "microsoft/BioGPT-Large", + "microsoft/DialoGPT-medium", + "microsoft/DialoGPT-small", + "microsoft/Florence-2-base", + "microsoft/Florence-2-large", + "microsoft/Florence-2-large-ft", + "microsoft/GUI-Actor-7B-Qwen2-VL", + "microsoft/MAI-DS-R1", + "microsoft/MAI-DS-R1-FP8", + "microsoft/MediPhi-Clinical", + "microsoft/OmniParser", + "microsoft/Phi-3-mini-4k-instruct-gguf", + "microsoft/Phi-3-mini-4k-instruct-onnx", + "microsoft/Phi-4-mini-flash-reasoning", + "microsoft/llava-med-7b-delta", + "microsoft/phi-4", + "microsoft/phi-4-gguf", + "tencent/DRIVE-RL", + "tencent/DRIVE-SFT", + "Qwen/Qwen2.5-14B", + "BAAI/bge-base-zh-v1.5" ] } }, - "required": ["huggingfaceName"] + "required": [ + "huggingfaceName" + ] }, "resources": { "type": "object", @@ -343,4 +490,4 @@ "default": "" } } -} \ No newline at end of file +}