loop-benchmarking

Controlled experiments across agentic coding configurations: same task, one variable changed at a time, to see what actually works.
git clone https://git.shiptheloop.com/loop-benchmarking.git
Log | Files | Refs | README

commit d7591e8b6cc707665f6117797ec33c25ee70a7e9
parent 4b307139a0f8e2e5d33d38f0536a463e3c7e4e6f
Author: Brian Graham <brian@buildingbetterteams.de>
Date:   Tue,  7 Apr 2026 21:39:53 +0200

Add gemma-4-26b model via OpenRouter

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

Diffstat:
M dashboard/src/lib/colors.ts | 3 +++
M grid.yaml                   | 5 ++++-
M harness/lib/compute_grid.py | 1 +
3 files changed, 8 insertions(+), 1 deletion(-)

diff --git a/dashboard/src/lib/colors.ts b/dashboard/src/lib/colors.ts
@@ -25,6 +25,9 @@ export const MODEL_COLORS: Record<string, string> = {
   // Qwen (OpenRouter)
   "qwen-3.6-plus": "hsl(270 40% 68%)", // lavender
 
+  // Google
+  "gemma-4-26b": "hsl(60 50% 62%)", // olive
+
   // Future slots
   "slot-7": "hsl(270 40% 68%)", // lavender
   "slot-8": "hsl(60 50% 62%)", // olive
diff --git a/grid.yaml b/grid.yaml
@@ -9,7 +9,7 @@ defaults:
 
 axes:
   model:
-    values: ["haiku-4.5", "sonnet-4.6", "opus-4.6", "glm-4.5-air", "glm-4.7", "glm-5.1", "qwen-3.6-plus"]
+    values: ["haiku-4.5", "sonnet-4.6", "opus-4.6", "glm-4.5-air", "glm-4.7", "glm-5.1", "qwen-3.6-plus", "gemma-4-26b"]
   effort:
     values: [high, max]
   prompt_style:
@@ -71,6 +71,7 @@ providers:
     auth_token: "dummy"
     cli_model_map:
       "qwen-3.6-plus": "openrouter/qwen/qwen3.6-plus:free"
+      "gemma-4-26b": "openrouter/google/gemma-4-26b-a4b-it"
 
 exclusions:
   # Haiku does not support extended thinking
@@ -96,6 +97,8 @@ exclusions:
   - when: { provider: zai, model: "qwen-3.6-plus" }
   # OpenRouter models only with openrouter
   - when: { provider: anthropic, model: "qwen-3.6-plus" }
+  - when: { provider: anthropic, model: "gemma-4-26b" }
+  - when: { provider: zai, model: "gemma-4-26b" }
   - when: { provider: openrouter, model: "haiku-4.5" }
   - when: { provider: openrouter, model: "sonnet-4.6" }
   - when: { provider: openrouter, model: "opus-4.6" }
diff --git a/harness/lib/compute_grid.py b/harness/lib/compute_grid.py
@@ -73,6 +73,7 @@ VALUE_ABBREV = {
     "sonnet-4.6": "sonnet46",
     "opus-4.6": "opus46",
     "qwen-3.6-plus": "qwen36p",
+    "gemma-4-26b": "gemma426b",
     "anthropic": "anth",
     "openrouter": "or",
 }

Impressum · Datenschutz