Spaces:

Unknown504
/

web-ui

Running

App Files Files Community

web-ui / src /utils /config.py

Unknown504

Upload folder using huggingface_hub

19ea30a verified 9 days ago

raw

history blame contribute delete

4.12 kB

	PROVIDER_DISPLAY_NAMES = {
	"openai": "OpenAI",
	"azure_openai": "Azure OpenAI",
	"anthropic": "Anthropic",
	"deepseek": "DeepSeek",
	"google": "Google",
	"alibaba": "Alibaba",
	"moonshot": "MoonShot",
	"unbound": "Unbound AI",
	"ibm": "IBM",
	"grok": "Grok",
	}

	# Predefined model names for common providers
	model_names = {
	"anthropic": ["claude-3-5-sonnet-20241022", "claude-3-5-sonnet-20240620", "claude-3-opus-20240229"],
	"openai": ["gpt-4o", "gpt-4", "gpt-3.5-turbo", "o3-mini"],
	"deepseek": ["deepseek-chat", "deepseek-reasoner"],
	"google": ["gemini-2.0-flash", "gemini-2.0-flash-thinking-exp", "gemini-1.5-flash-latest",
	"gemini-1.5-flash-8b-latest", "gemini-2.0-flash-thinking-exp-01-21", "gemini-2.0-pro-exp-02-05",
	"gemini-2.5-pro-preview-03-25", "gemini-2.5-flash-preview-04-17"],
	"ollama": ["qwen2.5:7b", "qwen2.5:14b", "qwen2.5:32b", "qwen2.5-coder:14b", "qwen2.5-coder:32b", "llama2:7b",
	"deepseek-r1:14b", "deepseek-r1:32b"],
	"azure_openai": ["gpt-4o", "gpt-4", "gpt-3.5-turbo"],
	"mistral": ["pixtral-large-latest", "mistral-large-latest", "mistral-small-latest", "ministral-8b-latest"],
	"alibaba": ["qwen-plus", "qwen-max", "qwen-vl-max", "qwen-vl-plus", "qwen-turbo", "qwen-long"],
	"moonshot": ["moonshot-v1-32k-vision-preview", "moonshot-v1-8k-vision-preview"],
	"unbound": ["gemini-2.0-flash", "gpt-4o-mini", "gpt-4o", "gpt-4.5-preview"],
	"grok": [
	"grok-3",
	"grok-3-fast",
	"grok-3-mini",
	"grok-3-mini-fast",
	"grok-2-vision",
	"grok-2-image",
	"grok-2",
	],
	"siliconflow": [
	"deepseek-ai/DeepSeek-R1",
	"deepseek-ai/DeepSeek-V3",
	"deepseek-ai/DeepSeek-R1-Distill-Qwen-32B",
	"deepseek-ai/DeepSeek-R1-Distill-Qwen-14B",
	"deepseek-ai/DeepSeek-R1-Distill-Qwen-7B",
	"deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B",
	"deepseek-ai/DeepSeek-V2.5",
	"deepseek-ai/deepseek-vl2",
	"Qwen/Qwen2.5-72B-Instruct-128K",
	"Qwen/Qwen2.5-72B-Instruct",
	"Qwen/Qwen2.5-32B-Instruct",
	"Qwen/Qwen2.5-14B-Instruct",
	"Qwen/Qwen2.5-7B-Instruct",
	"Qwen/Qwen2.5-Coder-32B-Instruct",
	"Qwen/Qwen2.5-Coder-7B-Instruct",
	"Qwen/Qwen2-7B-Instruct",
	"Qwen/Qwen2-1.5B-Instruct",
	"Qwen/QwQ-32B-Preview",
	"Qwen/Qwen2-VL-72B-Instruct",
	"Qwen/Qwen2.5-VL-32B-Instruct",
	"Qwen/Qwen2.5-VL-72B-Instruct",
	"TeleAI/TeleChat2",
	"THUDM/glm-4-9b-chat",
	"Vendor-A/Qwen/Qwen2.5-72B-Instruct",
	"internlm/internlm2_5-7b-chat",
	"internlm/internlm2_5-20b-chat",
	"Pro/Qwen/Qwen2.5-7B-Instruct",
	"Pro/Qwen/Qwen2-7B-Instruct",
	"Pro/Qwen/Qwen2-1.5B-Instruct",
	"Pro/THUDM/chatglm3-6b",
	"Pro/THUDM/glm-4-9b-chat",
	],
	"ibm": ["ibm/granite-vision-3.1-2b-preview", "meta-llama/llama-4-maverick-17b-128e-instruct-fp8",
	"meta-llama/llama-3-2-90b-vision-instruct"],
	"modelscope":[
	"Qwen/Qwen2.5-Coder-32B-Instruct",
	"Qwen/Qwen2.5-Coder-14B-Instruct",
	"Qwen/Qwen2.5-Coder-7B-Instruct",
	"Qwen/Qwen2.5-72B-Instruct",
	"Qwen/Qwen2.5-32B-Instruct",
	"Qwen/Qwen2.5-14B-Instruct",
	"Qwen/Qwen2.5-7B-Instruct",
	"Qwen/QwQ-32B-Preview",
	"Qwen/Qwen2.5-VL-3B-Instruct",
	"Qwen/Qwen2.5-VL-7B-Instruct",
	"Qwen/Qwen2.5-VL-32B-Instruct",
	"Qwen/Qwen2.5-VL-72B-Instruct",
	"deepseek-ai/DeepSeek-R1-Distill-Qwen-32B",
	"deepseek-ai/DeepSeek-R1-Distill-Qwen-14B",
	"deepseek-ai/DeepSeek-R1-Distill-Qwen-7B",
	"deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B",
	"deepseek-ai/DeepSeek-R1",
	"deepseek-ai/DeepSeek-V3",
	"Qwen/Qwen3-1.7B",
	"Qwen/Qwen3-4B",
	"Qwen/Qwen3-8B",
	"Qwen/Qwen3-14B",
	"Qwen/Qwen3-30B-A3B",
	"Qwen/Qwen3-32B",
	"Qwen/Qwen3-235B-A22B",
	],
	}