fix: Dense context 65K→98K, parallel restored to 2

This commit is contained in:
Abiba
2026-05-19 21:20:29 +00:00
parent 6c829abef5
commit 79965450bb
+1 -1
View File
@@ -27,7 +27,7 @@ GPU_MAX_CONCURRENT = {
# Context window sizes (tokens) — used for compaction signals.
# Maps each model name to the size of its context window, in tokens.
# Each model must appear exactly once: a repeated key in a dict literal is
# silently overridden by the last occurrence, which hides stale values.
GPU_CONTEXT = {
    "qwen3.6-35B-A3B": 131072,
    "qwen3.6-27B-code": 98304,
    "qwen3.5-9b-vlm": 131072,
}