router: raise the GPU_CONTEXT entry for "qwen3.6-27B-code" from 65536 to 98304 tokens.
The other GPU_CONTEXT entries shown in this hunk are unchanged context.

diff --git a/router/router.py b/router/router.py
index e06b8b3..80b9f69 100644
--- a/router/router.py
+++ b/router/router.py
@@ -27,7 +27,7 @@ GPU_MAX_CONCURRENT = {
 # Context window sizes (tokens) — used for compaction signals
 GPU_CONTEXT = {
     "qwen3.6-35B-A3B": 131072,
-    "qwen3.6-27B-code": 65536,
+    "qwen3.6-27B-code": 98304,
     "qwen3.5-9b-vlm": 131072,
 }
 