From 9c31b5d62274bbcea1bc19bb3c100b23000ca547 Mon Sep 17 00:00:00 2001 From: Abiba Date: Tue, 19 May 2026 15:03:34 +0000 Subject: [PATCH] May 19, 2026: Full harness update MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit - Model migration: gemma-4-E4B → qwen3.5-9b-vlm - Dashboard reorder: Usage Over Time + GPU Metrics to top - Router counter leak fix (gpu_decr in except handler) - VLM slot upgrade 1→2 - Redis stale key cleanup - Automated maintenance cron job - LiteLLM config update - GPU router config update - README update --- .gitignore | 4 +--- README.md | 2 +- dashboard/dashboard.py | 34 +++++++++++++++++----------------- gpu-router-docker.conf | 4 ++-- gpu-router.conf | 4 ++-- litellm_config.yaml | 4 ++-- router/router.py | 37 ++++++++++++++++++------------------- 7 files changed, 43 insertions(+), 46 deletions(-) diff --git a/.gitignore b/.gitignore index 1edc785..eeb7737 100644 --- a/.gitignore +++ b/.gitignore @@ -1,5 +1,3 @@ +.git __pycache__/ *.pyc -.env -redis-data/ -ssl/ diff --git a/README.md b/README.md index 4381487..04e9659 100644 --- a/README.md +++ b/README.md @@ -8,7 +8,7 @@ CT 116 Docker stack for routing local GPU models through a unified OpenAI-compat nginx :80 → router :9000 → GPU backends ├─ qwen3.6-35B-A3B (MoE) @ 192.168.68.15:8080 ├─ qwen3.6-27B-code (Dense) @ 192.168.68.8:8080 - └─ gemma-4-E4B (Light) @ 192.168.68.110:8080 + └─ qwen3.5-9b-vlm (VLM) @ 192.168.68.110:8080 LiteLLM :8081 (fallback) | Dashboard :3000 | Redis :6379 (local) ``` diff --git a/dashboard/dashboard.py b/dashboard/dashboard.py index a1e5ee6..ecda580 100644 --- a/dashboard/dashboard.py +++ b/dashboard/dashboard.py @@ -80,17 +80,7 @@ body { background: #0b0f17; color: #bcc3cd; font-family: -apple-system, BlinkMac
- -
Loading...
-
Loading...
-
Loading...
- - -
Queue Status
-
Model Distribution
-
Agent Activity
- - +
Usage Over Time
@@ -101,6 +91,16 @@ body { background: #0b0f17; color: #bcc3cd; font-family: -apple-system, BlinkMac
GPU Metrics
+ +
Loading...
+
Loading...
+
Loading...
+ + +
Queue Status
+
Model Distribution
+
Agent Activity
+
Live Stream
@@ -111,9 +111,9 @@ body { background: #0b0f17; color: #bcc3cd; font-family: -apple-system, BlinkMac