cmd: add qwen3.5 context length for launch (#14626)

This commit is contained in:
Parth Sareen
2026-03-04 14:10:52 -08:00
committed by GitHub
parent 122c68c151
commit 562c76d7cc

View File

@@ -90,6 +90,7 @@ var cloudModelLimits = map[string]cloudModelLimit{
"qwen3-coder:480b": {Context: 262_144, Output: 65_536},
"qwen3-coder-next": {Context: 262_144, Output: 32_768},
"qwen3-next:80b": {Context: 262_144, Output: 32_768},
"qwen3.5": {Context: 262_144, Output: 32_768},
}
// recommendedVRAM maps local recommended models to their approximate VRAM requirement.