Add gemma-4-26b model via OpenRouter - loop-benchmarking - Controlled experiments across agentic coding configurations. Same task, one variable, what actually works.

commit d7591e8b6cc707665f6117797ec33c25ee70a7e9
parent 4b307139a0f8e2e5d33d38f0536a463e3c7e4e6f
Author: Brian Graham <brian@buildingbetterteams.de>
Date:   Tue,  7 Apr 2026 21:39:53 +0200

Add gemma-4-26b model via OpenRouter

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

Diffstat:
M dashboard/src/lib/colors.ts  | 3 +++
M grid.yaml  | 5 ++++-
M harness/lib/compute_grid.py  | 1 +

3 files changed, 8 insertions(+), 1 deletion(-)
diff --git a/dashboard/src/lib/colors.ts b/dashboard/src/lib/colors.ts
@@ -25,6 +25,9 @@ export const MODEL_COLORS: Record<string, string> = {
   // Qwen (OpenRouter)
   "qwen-3.6-plus": "hsl(270 40% 68%)", // lavender
 
+  // Google
+  "gemma-4-26b":  "hsl(60 50% 62%)",   // olive
+
   // Future slots
   "slot-7":      "hsl(270 40% 68%)",  // lavender
   "slot-8":      "hsl(60 50% 62%)",   // olive
diff --git a/grid.yaml b/grid.yaml
@@ -9,7 +9,7 @@ defaults:
 
 axes:
   model:
-    values: ["haiku-4.5", "sonnet-4.6", "opus-4.6", "glm-4.5-air", "glm-4.7", "glm-5.1", "qwen-3.6-plus"]
+    values: ["haiku-4.5", "sonnet-4.6", "opus-4.6", "glm-4.5-air", "glm-4.7", "glm-5.1", "qwen-3.6-plus", "gemma-4-26b"]
   effort:
     values: [high, max]
   prompt_style:
@@ -71,6 +71,7 @@ providers:
     auth_token: "dummy"
     cli_model_map:
       "qwen-3.6-plus": "openrouter/qwen/qwen3.6-plus:free"
+      "gemma-4-26b": "openrouter/google/gemma-4-26b-a4b-it"
 
 exclusions:
   # Haiku does not support extended thinking
@@ -96,6 +97,8 @@ exclusions:
   - when: { provider: zai, model: "qwen-3.6-plus" }
   # OpenRouter models only with openrouter
   - when: { provider: anthropic, model: "qwen-3.6-plus" }
+  - when: { provider: anthropic, model: "gemma-4-26b" }
+  - when: { provider: zai, model: "gemma-4-26b" }
   - when: { provider: openrouter, model: "haiku-4.5" }
   - when: { provider: openrouter, model: "sonnet-4.6" }
   - when: { provider: openrouter, model: "opus-4.6" }
diff --git a/harness/lib/compute_grid.py b/harness/lib/compute_grid.py
@@ -73,6 +73,7 @@ VALUE_ABBREV = {
     "sonnet-4.6": "sonnet46",
     "opus-4.6": "opus46",
     "qwen-3.6-plus": "qwen36p",
+    "gemma-4-26b": "gemma426b",
     "anthropic": "anth",
     "openrouter": "or",
 }

	loop-benchmarking - Controlled experiments across agentic coding configurations. Same task, one variable, what actually works.
	git clone https://git.shiptheloop.com/loop-benchmarking.git
	Log | Files | Refs | README

M	dashboard/src/lib/colors.ts	|	3	+++
M	grid.yaml	|	5	++++-
M	harness/lib/compute_grid.py	|	1	+