commit 0af972817d114910874b95bc4ec84298b7511e40
parent 46364ff78312c3c0d5d647e2f6d59c0c40345cec
Author: Brian Graham <brian@buildingbetterteams.de>
Date: Thu, 16 Apr 2026 15:53:49 +0200
Rebuild PCA from post-reeval 510-run dataset
Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
Diffstat:
1 file changed, 7825 insertions(+), 5657 deletions(-)
diff --git a/results/analysis/pca.json b/results/analysis/pca.json
@@ -1,59 +1,70 @@
{
- "n_runs": 393,
- "n_features": 62,
+ "n_runs": 510,
+ "n_features": 73,
"n_components": 10,
"variance_explained": [
- 10.36,
- 7.74,
- 4.36,
- 4.01,
- 3.75,
- 3.44,
- 3.33,
- 3.28,
- 3.26,
- 3.24
+ 9.41,
+ 6.06,
+ 3.78,
+ 3.31,
+ 3.09,
+ 2.88,
+ 2.87,
+ 2.82,
+ 2.77,
+ 2.73
],
"scree": [
- 10.36,
- 7.74,
- 4.36,
- 4.01,
- 3.75,
- 3.44,
- 3.33,
- 3.28,
- 3.26,
- 3.24,
- 3.04,
- 2.91,
- 2.68,
- 2.66,
+ 9.41,
+ 6.06,
+ 3.79,
+ 3.31,
+ 3.09,
+ 2.89,
+ 2.88,
+ 2.86,
+ 2.78,
+ 2.76,
+ 2.75,
+ 2.6,
2.42,
- 2.25,
- 2.18,
- 2.14,
- 2.06,
- 1.93,
- 1.88,
- 1.86,
+ 2.3,
+ 2.15,
+ 2.1,
+ 1.97,
+ 1.9,
1.85,
- 1.76,
- 1.72,
- 1.68,
- 1.64,
- 1.63,
- 1.63,
- 1.63,
- 1.63,
- 1.63,
- 1.63,
- 1.56,
- 1.5,
+ 1.83,
+ 1.67,
+ 1.65,
+ 1.53,
+ 1.51,
+ 1.49,
+ 1.43,
+ 1.42,
+ 1.42,
+ 1.39,
+ 1.39,
+ 1.39,
+ 1.39,
+ 1.39,
+ 1.39,
+ 1.38,
+ 1.38,
+ 1.38,
+ 1.38,
+ 1.38,
+ 1.38,
+ 1.38,
+ 1.37,
+ 1.34,
1.33,
- 1.09,
- 0.78,
- 0.53,
+ 1.22,
+ 1.05,
+ 0.85,
+ 0.55,
+ 0.46,
+ 0.0,
0.0,
0.0,
0.0,
@@ -80,6684 +91,8673 @@
],
"points": [
{
- "run_id": "tetris_arch=bp_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "626eca1d",
- "model": "gemma-4-26b",
- "score": 0.325,
- "pc1": -3.4972,
- "pc2": 0.5282,
- "pc3": 5.187,
- "pc4": -0.4356,
- "pc5": -0.9644,
- "pc6": -1.0677,
- "pc7": -0.5496,
- "pc8": -7.0631,
- "pc9": 3.1667,
- "pc10": -0.0884,
- "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
- },
- {
"run_id": "tetris_arch=bp_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm45air_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "42f30c6b",
"model": "glm-4.5-air",
- "score": 0.325,
- "pc1": -3.5341,
- "pc2": 0.8692,
- "pc3": 1.6114,
- "pc4": -0.0156,
- "pc5": -0.4642,
- "pc6": -0.8311,
- "pc7": -0.7712,
- "pc8": -7.0631,
- "pc9": 3.2335,
- "pc10": -0.8288,
- "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
- },
- {
- "run_id": "tetris_arch=bp_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "9d799edc",
- "model": "haiku-4.5",
- "score": 0.325,
- "pc1": -1.5901,
- "pc2": 0.0243,
- "pc3": 3.1206,
- "pc4": -0.2767,
- "pc5": -0.4836,
- "pc6": -0.8809,
- "pc7": -0.2981,
- "pc8": -7.0631,
- "pc9": 3.2124,
- "pc10": -0.2586,
- "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
- },
- {
- "run_id": "tetris_arch=bp_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=qwen36p_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "9f6a0368",
- "model": "qwen-3.6-plus",
- "score": 0.41,
- "pc1": -3.4591,
- "pc2": 0.5298,
- "pc3": 5.211,
- "pc4": -0.4593,
- "pc5": -1.0387,
- "pc6": -1.5732,
- "pc7": -1.103,
- "pc8": -7.0631,
- "pc9": 3.1709,
- "pc10": -0.563,
+ "score": 0.685,
+ "pc1": -2.9606,
+ "pc2": 0.6229,
+ "pc3": -0.6594,
+ "pc4": -0.153,
+ "pc5": -1.3272,
+ "pc6": -0.0408,
+ "pc7": -5.7701,
+ "pc8": 1.7324,
+ "pc9": -7.6308,
+ "pc10": -0.3101,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=bp_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "3a4446e0",
+ "model": "glm-5.1",
+ "score": 0.905,
+ "pc1": -3.1111,
+ "pc2": 0.6697,
+ "pc3": -0.9651,
+ "pc4": -0.0322,
+ "pc5": -0.9533,
+ "pc6": 0.6099,
+ "pc7": -5.3668,
+ "pc8": 1.7694,
+ "pc9": -7.56,
+ "pc10": -0.3013,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=bp_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "e9675236",
+ "model": "glm-5.1",
+ "score": 0.665,
+ "pc1": -3.1111,
+ "pc2": 0.6697,
+ "pc3": -0.9651,
+ "pc4": -0.0322,
+ "pc5": -0.9533,
+ "pc6": 0.6099,
+ "pc7": -5.3668,
+ "pc8": 1.7694,
+ "pc9": -7.56,
+ "pc10": -0.3013,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=bp_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "a6720fb3",
+ "model": "glm-5.1",
+ "score": 0.925,
+ "pc1": -3.1111,
+ "pc2": 0.6697,
+ "pc3": -0.9651,
+ "pc4": -0.0322,
+ "pc5": -0.9533,
+ "pc6": 0.6099,
+ "pc7": -5.3668,
+ "pc8": 1.7694,
+ "pc9": -7.56,
+ "pc10": -0.3013,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=js_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "ed36af6d",
"model": "gemma-4-26b",
- "score": 0.355,
- "pc1": -2.8092,
- "pc2": -0.4563,
- "pc3": 1.2217,
- "pc4": -0.7561,
- "pc5": 0.3374,
- "pc6": -2.7357,
- "pc7": 1.0456,
- "pc8": -0.0,
- "pc9": -0.0449,
- "pc10": 0.0534,
+ "score": 0.485,
+ "pc1": -1.6509,
+ "pc2": -1.0341,
+ "pc3": 4.29,
+ "pc4": -0.085,
+ "pc5": -0.7664,
+ "pc6": -1.9055,
+ "pc7": 2.3296,
+ "pc8": 1.2838,
+ "pc9": -0.5179,
+ "pc10": 0.0495,
+ "config_summary": "effort=high, prompt_style=simple, language=javascript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=js_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "df938a74",
+ "model": "gemma-4-26b",
+ "score": 0.475,
+ "pc1": -1.6509,
+ "pc2": -1.0341,
+ "pc3": 4.29,
+ "pc4": -0.085,
+ "pc5": -0.7664,
+ "pc6": -1.9055,
+ "pc7": 2.3296,
+ "pc8": 1.2838,
+ "pc9": -0.5179,
+ "pc10": 0.0495,
+ "config_summary": "effort=high, prompt_style=simple, language=javascript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=js_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "ee6e9adf",
+ "model": "gemma-4-26b",
+ "score": 0.5,
+ "pc1": -1.6509,
+ "pc2": -1.0341,
+ "pc3": 4.29,
+ "pc4": -0.085,
+ "pc5": -0.7664,
+ "pc6": -1.9055,
+ "pc7": 2.3296,
+ "pc8": 1.2838,
+ "pc9": -0.5179,
+ "pc10": 0.0495,
"config_summary": "effort=high, prompt_style=simple, language=javascript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=js_lint=on_budget=low_model=glm45air_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "35048b14",
"model": "glm-4.5-air",
- "score": 0.33,
- "pc1": -2.8461,
- "pc2": -0.1153,
- "pc3": -2.3539,
- "pc4": -0.3361,
- "pc5": 0.8376,
- "pc6": -2.4991,
- "pc7": 0.824,
- "pc8": -0.0,
- "pc9": 0.022,
- "pc10": -0.6871,
+ "score": 0.85,
+ "pc1": -2.1292,
+ "pc2": -0.671,
+ "pc3": 0.6484,
+ "pc4": 0.5102,
+ "pc5": -0.3214,
+ "pc6": -2.5397,
+ "pc7": 1.0637,
+ "pc8": 1.8506,
+ "pc9": -0.2808,
+ "pc10": 0.2247,
"config_summary": "effort=high, prompt_style=simple, language=javascript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=js_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "85cfb3b7",
"model": "glm-4.7",
- "score": 0.33,
- "pc1": -2.771,
- "pc2": -0.0895,
- "pc3": -2.6988,
- "pc4": -0.2758,
- "pc5": 0.8454,
- "pc6": -3.2514,
- "pc7": 0.4224,
- "pc8": -0.0,
- "pc9": -0.0022,
- "pc10": -0.4954,
+ "score": 0.755,
+ "pc1": -2.1472,
+ "pc2": -0.6237,
+ "pc3": 0.5871,
+ "pc4": 0.606,
+ "pc5": 0.0539,
+ "pc6": -2.3992,
+ "pc7": 2.01,
+ "pc8": 1.381,
+ "pc9": -0.2487,
+ "pc10": 0.1863,
+ "config_summary": "effort=high, prompt_style=simple, language=javascript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=js_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "6614890c",
+ "model": "glm-4.7",
+ "score": 0.875,
+ "pc1": -2.1472,
+ "pc2": -0.6237,
+ "pc3": 0.5871,
+ "pc4": 0.606,
+ "pc5": 0.0539,
+ "pc6": -2.3992,
+ "pc7": 2.01,
+ "pc8": 1.381,
+ "pc9": -0.2487,
+ "pc10": 0.1863,
"config_summary": "effort=high, prompt_style=simple, language=javascript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=js_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
"short_id": "c530817e",
"model": "glm-4.7",
- "score": 0.38,
- "pc1": -2.771,
- "pc2": -0.0895,
- "pc3": -2.6988,
- "pc4": -0.2758,
- "pc5": 0.8454,
- "pc6": -3.2514,
- "pc7": 0.4224,
- "pc8": -0.0,
- "pc9": -0.0022,
- "pc10": -0.4954,
+ "score": 0.9,
+ "pc1": -2.1472,
+ "pc2": -0.6237,
+ "pc3": 0.5871,
+ "pc4": 0.606,
+ "pc5": 0.0539,
+ "pc6": -2.3992,
+ "pc7": 2.01,
+ "pc8": 1.381,
+ "pc9": -0.2487,
+ "pc10": 0.1863,
"config_summary": "effort=high, prompt_style=simple, language=javascript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=js_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "5ea5d539",
"model": "glm-5.1",
- "score": 0.38,
- "pc1": -2.7963,
- "pc2": -0.0096,
- "pc3": -2.72,
- "pc4": -0.3454,
- "pc5": 0.9807,
- "pc6": -2.4343,
- "pc7": 0.6207,
- "pc8": -0.0,
- "pc9": 0.0129,
- "pc10": -0.694,
+ "score": 0.785,
+ "pc1": -2.2798,
+ "pc2": -0.6243,
+ "pc3": 0.3426,
+ "pc4": 0.6309,
+ "pc5": 0.0525,
+ "pc6": -1.889,
+ "pc7": 1.4671,
+ "pc8": 1.8877,
+ "pc9": -0.21,
+ "pc10": 0.2335,
"config_summary": "effort=high, prompt_style=simple, language=javascript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=js_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
"short_id": "f2ff7829",
"model": "glm-5.1",
- "score": 0.35,
- "pc1": -2.7963,
- "pc2": -0.0096,
- "pc3": -2.72,
- "pc4": -0.3454,
- "pc5": 0.9807,
- "pc6": -2.4343,
- "pc7": 0.6207,
- "pc8": -0.0,
- "pc9": 0.0129,
- "pc10": -0.694,
+ "score": 0.975,
+ "pc1": -2.2798,
+ "pc2": -0.6243,
+ "pc3": 0.3426,
+ "pc4": 0.6309,
+ "pc5": 0.0525,
+ "pc6": -1.889,
+ "pc7": 1.4671,
+ "pc8": 1.8877,
+ "pc9": -0.21,
+ "pc10": 0.2335,
"config_summary": "effort=high, prompt_style=simple, language=javascript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=js_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
"short_id": "6b848132",
"model": "glm-5.1",
- "score": 0.305,
- "pc1": -2.7963,
- "pc2": -0.0096,
- "pc3": -2.72,
- "pc4": -0.3454,
- "pc5": 0.9807,
- "pc6": -2.4343,
- "pc7": 0.6207,
- "pc8": -0.0,
- "pc9": 0.0129,
- "pc10": -0.694,
+ "score": 0.85,
+ "pc1": -2.2798,
+ "pc2": -0.6243,
+ "pc3": 0.3426,
+ "pc4": 0.6309,
+ "pc5": 0.0525,
+ "pc6": -1.889,
+ "pc7": 1.4671,
+ "pc8": 1.8877,
+ "pc9": -0.21,
+ "pc10": 0.2335,
"config_summary": "effort=high, prompt_style=simple, language=javascript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=js_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=js_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run4",
"short_id": "e047cf3a",
"model": "haiku-4.5",
"score": 0.885,
- "pc1": 1.2696,
- "pc2": -2.9777,
- "pc3": -0.9202,
- "pc4": -0.7276,
- "pc5": 0.6682,
- "pc6": -2.5198,
- "pc7": 1.283,
- "pc8": 0.0,
- "pc9": -0.0016,
- "pc10": 0.0565,
+ "pc1": 2.1757,
+ "pc2": -3.2824,
+ "pc3": 0.5594,
+ "pc4": 0.8544,
+ "pc5": 0.1628,
+ "pc6": -2.1294,
+ "pc7": 1.4366,
+ "pc8": 1.7254,
+ "pc9": -0.0775,
+ "pc10": 0.2594,
"config_summary": "effort=high, prompt_style=simple, language=javascript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=js_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=js_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run5",
"short_id": "5ae88633",
"model": "haiku-4.5",
- "score": 0.5,
- "pc1": 1.2696,
- "pc2": -2.9777,
- "pc3": -0.9202,
- "pc4": -0.7276,
- "pc5": 0.6682,
- "pc6": -2.5198,
- "pc7": 1.283,
- "pc8": -0.0,
- "pc9": -0.0016,
- "pc10": 0.0565,
+ "score": 0.845,
+ "pc1": 2.1757,
+ "pc2": -3.2824,
+ "pc3": 0.5594,
+ "pc4": 0.8544,
+ "pc5": 0.1628,
+ "pc6": -2.1294,
+ "pc7": 1.4366,
+ "pc8": 1.7254,
+ "pc9": -0.0775,
+ "pc10": 0.2594,
"config_summary": "effort=high, prompt_style=simple, language=javascript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=js_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=js_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run6",
"short_id": "1d08ee76",
"model": "haiku-4.5",
- "score": 0.5,
- "pc1": 1.2696,
- "pc2": -2.9777,
- "pc3": -0.9202,
- "pc4": -0.7276,
- "pc5": 0.6682,
- "pc6": -2.5198,
- "pc7": 1.283,
- "pc8": 0.0,
- "pc9": -0.0016,
- "pc10": 0.0565,
+ "score": 0.925,
+ "pc1": 2.1757,
+ "pc2": -3.2824,
+ "pc3": 0.5594,
+ "pc4": 0.8544,
+ "pc5": 0.1628,
+ "pc6": -2.1294,
+ "pc7": 1.4366,
+ "pc8": 1.7254,
+ "pc9": -0.0775,
+ "pc10": 0.2594,
"config_summary": "effort=high, prompt_style=simple, language=javascript, max_budget=low, strategy=use_subagents"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=js_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "cf4290a4",
"model": "haiku-4.5",
- "score": 0.3,
- "pc1": -0.9021,
- "pc2": -0.9601,
- "pc3": -0.8447,
- "pc4": -0.5972,
- "pc5": 0.8182,
- "pc6": -2.549,
- "pc7": 1.2971,
- "pc8": 0.0,
- "pc9": 0.0008,
- "pc10": -0.1169,
+ "score": 0.78,
+ "pc1": -0.0535,
+ "pc2": -1.3177,
+ "pc3": 1.2156,
+ "pc4": 0.5329,
+ "pc5": 0.006,
+ "pc6": -2.1885,
+ "pc7": 1.6343,
+ "pc8": 1.6643,
+ "pc9": -0.1521,
+ "pc10": 0.1257,
"config_summary": "effort=high, prompt_style=simple, language=javascript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=js_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=js_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run4",
"short_id": "fe66c902",
"model": "opus-4.6",
- "score": 0.355,
- "pc1": 1.1625,
- "pc2": -3.5988,
- "pc3": -1.1989,
- "pc4": -0.9669,
- "pc5": 0.6277,
- "pc6": -2.5977,
- "pc7": 1.0395,
- "pc8": -0.0,
- "pc9": -0.0035,
- "pc10": -0.0684,
+ "score": 0.67,
+ "pc1": 2.0015,
+ "pc2": -4.0196,
+ "pc3": 0.4888,
+ "pc4": 1.1612,
+ "pc5": 0.24,
+ "pc6": -2.0646,
+ "pc7": 1.2378,
+ "pc8": 1.7873,
+ "pc9": -0.1376,
+ "pc10": 0.3507,
"config_summary": "effort=high, prompt_style=simple, language=javascript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=js_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=js_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run5",
"short_id": "f437a754",
"model": "opus-4.6",
- "score": 0.47,
- "pc1": 1.1625,
- "pc2": -3.5988,
- "pc3": -1.1989,
- "pc4": -0.9669,
- "pc5": 0.6277,
- "pc6": -2.5977,
- "pc7": 1.0395,
- "pc8": -0.0,
- "pc9": -0.0035,
- "pc10": -0.0684,
+ "score": 0.945,
+ "pc1": 2.0015,
+ "pc2": -4.0196,
+ "pc3": 0.4888,
+ "pc4": 1.1612,
+ "pc5": 0.24,
+ "pc6": -2.0646,
+ "pc7": 1.2378,
+ "pc8": 1.7873,
+ "pc9": -0.1376,
+ "pc10": 0.3507,
"config_summary": "effort=high, prompt_style=simple, language=javascript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=js_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=js_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run6",
"short_id": "6f157de1",
"model": "opus-4.6",
- "score": 0.77,
- "pc1": 1.1625,
- "pc2": -3.5988,
- "pc3": -1.1989,
- "pc4": -0.9669,
- "pc5": 0.6277,
- "pc6": -2.5977,
- "pc7": 1.0395,
- "pc8": -0.0,
- "pc9": -0.0035,
- "pc10": -0.0684,
+ "score": 0.825,
+ "pc1": 2.0015,
+ "pc2": -4.0196,
+ "pc3": 0.4888,
+ "pc4": 1.1612,
+ "pc5": 0.24,
+ "pc6": -2.0646,
+ "pc7": 1.2378,
+ "pc8": 1.7873,
+ "pc9": -0.1376,
+ "pc10": 0.3507,
"config_summary": "effort=high, prompt_style=simple, language=javascript, max_budget=low, strategy=use_subagents"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=js_lint=on_budget=low_model=qwen36p_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "2763232d",
"model": "qwen-3.6-plus",
- "score": 0.38,
- "pc1": -2.7711,
- "pc2": -0.4547,
- "pc3": 1.2457,
- "pc4": -0.7798,
- "pc5": 0.263,
- "pc6": -3.2413,
- "pc7": 0.4922,
- "pc8": -0.0,
- "pc9": -0.0407,
- "pc10": -0.4213,
+ "score": 0.95,
+ "pc1": -1.6858,
+ "pc2": -1.0994,
+ "pc3": 4.2126,
+ "pc4": -0.273,
+ "pc5": -1.2304,
+ "pc6": -1.6169,
+ "pc7": 1.7492,
+ "pc8": 1.4139,
+ "pc9": -0.1266,
+ "pc10": 0.3547,
"config_summary": "effort=high, prompt_style=simple, language=javascript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=js_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=js_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run4",
"short_id": "aec24c80",
"model": "sonnet-4.6",
- "score": 0.425,
- "pc1": 1.153,
- "pc2": -3.593,
- "pc3": -1.1967,
- "pc4": -0.9667,
- "pc5": 0.6298,
- "pc6": -2.5959,
- "pc7": 1.0431,
- "pc8": -0.0,
- "pc9": -0.0035,
- "pc10": -0.067,
+ "score": 0.895,
+ "pc1": 1.9935,
+ "pc2": -4.0115,
+ "pc3": 0.4927,
+ "pc4": 1.1813,
+ "pc5": 0.2024,
+ "pc6": -2.0007,
+ "pc7": 1.3189,
+ "pc8": 1.6503,
+ "pc9": 0.0082,
+ "pc10": 0.3962,
"config_summary": "effort=high, prompt_style=simple, language=javascript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=js_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=js_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run5",
"short_id": "f451b3e8",
"model": "sonnet-4.6",
- "score": 0.43,
- "pc1": 1.153,
- "pc2": -3.593,
- "pc3": -1.1967,
- "pc4": -0.9667,
- "pc5": 0.6298,
- "pc6": -2.5959,
- "pc7": 1.0431,
- "pc8": -0.0,
- "pc9": -0.0035,
- "pc10": -0.067,
+ "score": 0.75,
+ "pc1": 1.9935,
+ "pc2": -4.0115,
+ "pc3": 0.4927,
+ "pc4": 1.1813,
+ "pc5": 0.2024,
+ "pc6": -2.0007,
+ "pc7": 1.3189,
+ "pc8": 1.6503,
+ "pc9": 0.0082,
+ "pc10": 0.3962,
"config_summary": "effort=high, prompt_style=simple, language=javascript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=js_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=js_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run6",
"short_id": "59fdb0fc",
"model": "sonnet-4.6",
- "score": 0.5,
- "pc1": 1.153,
- "pc2": -3.593,
- "pc3": -1.1967,
- "pc4": -0.9667,
- "pc5": 0.6298,
- "pc6": -2.5959,
- "pc7": 1.0431,
- "pc8": -0.0,
- "pc9": -0.0035,
- "pc10": -0.067,
+ "score": 0.95,
+ "pc1": 1.9935,
+ "pc2": -4.0115,
+ "pc3": 0.4927,
+ "pc4": 1.1813,
+ "pc5": 0.2024,
+ "pc6": -2.0007,
+ "pc7": 1.3189,
+ "pc8": 1.6503,
+ "pc9": 0.0082,
+ "pc10": 0.3962,
"config_summary": "effort=high, prompt_style=simple, language=javascript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=high_model=haiku45_pw=off_prompt=detailed_rndr=none_strat=usub_tst=none_tedit=off_tglob=on_tgrep=off_tread=off_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=high_model=haiku45_pw=off_prompt=detailed_prov=anth_rndr=none_strat=usub_tst=none_tedit=off_tglob=on_tgrep=off_tread=off_twrite=on_web=on_run2",
"short_id": "dcbf6400",
"model": "haiku-4.5",
- "score": 0.53,
- "pc1": 6.1226,
- "pc2": 5.3892,
- "pc3": 0.4006,
- "pc4": -0.4122,
- "pc5": -1.3519,
- "pc6": -0.5491,
- "pc7": -1.1715,
- "pc8": -0.0,
- "pc9": -0.1508,
- "pc10": 4.4656,
+ "score": 0.925,
+ "pc1": 7.0742,
+ "pc2": 5.9801,
+ "pc3": -0.2458,
+ "pc4": 0.4841,
+ "pc5": -0.8621,
+ "pc6": 0.7,
+ "pc7": 0.1324,
+ "pc8": 0.483,
+ "pc9": -0.5123,
+ "pc10": 2.1292,
"config_summary": "effort=high, prompt_style=detailed, language=typescript, max_budget=high, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=high_model=haiku45_pw=off_prompt=detailed_rndr=none_strat=usub_tst=none_tedit=off_tglob=on_tgrep=off_tread=off_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=high_model=haiku45_pw=off_prompt=detailed_prov=anth_rndr=none_strat=usub_tst=none_tedit=off_tglob=on_tgrep=off_tread=off_twrite=on_web=on_run4",
"short_id": "b13fad58",
"model": "haiku-4.5",
- "score": 0.425,
- "pc1": 6.1226,
- "pc2": 5.3892,
- "pc3": 0.4006,
- "pc4": -0.4122,
- "pc5": -1.3519,
- "pc6": -0.5491,
- "pc7": -1.1715,
- "pc8": -0.0,
- "pc9": -0.1508,
- "pc10": 4.4656,
+ "score": 0.785,
+ "pc1": 7.0742,
+ "pc2": 5.9801,
+ "pc3": -0.2458,
+ "pc4": 0.4841,
+ "pc5": -0.8621,
+ "pc6": 0.7,
+ "pc7": 0.1324,
+ "pc8": 0.483,
+ "pc9": -0.5123,
+ "pc10": 2.1292,
"config_summary": "effort=high, prompt_style=detailed, language=typescript, max_budget=high, strategy=use_subagents"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "c1013100",
"model": "gemma-4-26b",
- "score": 0.41,
- "pc1": -1.6755,
- "pc2": 1.8125,
- "pc3": 1.9691,
- "pc4": -1.128,
- "pc5": -0.0382,
- "pc6": -0.4646,
- "pc7": -1.3465,
- "pc8": -0.0,
- "pc9": -0.1068,
- "pc10": 2.1998,
+ "score": 0.475,
+ "pc1": -0.6696,
+ "pc2": 1.5827,
+ "pc3": 3.8132,
+ "pc4": 0.2171,
+ "pc5": -0.2671,
+ "pc6": 0.2054,
+ "pc7": 0.5241,
+ "pc8": -0.0614,
+ "pc9": -0.6054,
+ "pc10": 2.1539,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "975be3a7",
+ "model": "gemma-4-26b",
+ "score": 0.5,
+ "pc1": -0.6696,
+ "pc2": 1.5827,
+ "pc3": 3.8132,
+ "pc4": 0.2171,
+ "pc5": -0.2671,
+ "pc6": 0.2054,
+ "pc7": 0.5241,
+ "pc8": -0.0614,
+ "pc9": -0.6054,
+ "pc10": 2.1539,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "3b743736",
+ "model": "gemma-4-26b",
+ "score": 0.5,
+ "pc1": -0.6696,
+ "pc2": 1.5827,
+ "pc3": 3.8132,
+ "pc4": 0.2171,
+ "pc5": -0.2671,
+ "pc6": 0.2054,
+ "pc7": 0.5241,
+ "pc8": -0.0614,
+ "pc9": -0.6054,
+ "pc10": 2.1539,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=glm45air_pw=off_prompt=detailed_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=off_run1",
"short_id": "cbd2d1e2",
"model": "glm-4.5-air",
- "score": 0.35,
- "pc1": 0.136,
- "pc2": 4.8426,
- "pc3": -2.6187,
- "pc4": -2.4138,
- "pc5": -3.7869,
- "pc6": -0.3756,
- "pc7": -1.9287,
- "pc8": -0.0,
- "pc9": -0.0743,
- "pc10": 2.375,
+ "score": 0.835,
+ "pc1": 0.8468,
+ "pc2": 5.005,
+ "pc3": -0.9117,
+ "pc4": 4.0836,
+ "pc5": -3.6502,
+ "pc6": -0.4505,
+ "pc7": 0.3696,
+ "pc8": -0.0343,
+ "pc9": -0.803,
+ "pc10": 3.3049,
"config_summary": "effort=high, prompt_style=detailed, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=glm45air_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "e7dbe3e8",
"model": "glm-4.5-air",
- "score": 0.305,
- "pc1": -1.7124,
- "pc2": 2.1536,
- "pc3": -1.6065,
- "pc4": -0.708,
- "pc5": 0.462,
- "pc6": -0.228,
- "pc7": -1.5681,
- "pc8": -0.0,
- "pc9": -0.0399,
- "pc10": 1.4593,
+ "score": 0.875,
+ "pc1": -1.148,
+ "pc2": 1.9458,
+ "pc3": 0.1716,
+ "pc4": 0.8124,
+ "pc5": 0.1779,
+ "pc6": -0.4289,
+ "pc7": -0.7417,
+ "pc8": 0.5054,
+ "pc9": -0.3683,
+ "pc10": 2.3292,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=glm47_pw=off_prompt=detailed_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=off_run1",
"short_id": "f76992f1",
"model": "glm-4.7",
- "score": 0.305,
- "pc1": 0.2112,
- "pc2": 4.8684,
- "pc3": -2.9637,
- "pc4": -2.3535,
- "pc5": -3.7791,
- "pc6": -1.1279,
- "pc7": -2.3303,
- "pc8": -0.0,
- "pc9": -0.0984,
- "pc10": 2.5666,
+ "score": 0.92,
+ "pc1": 0.8288,
+ "pc2": 5.0523,
+ "pc3": -0.973,
+ "pc4": 4.1793,
+ "pc5": -3.2749,
+ "pc6": -0.3099,
+ "pc7": 1.3159,
+ "pc8": -0.5039,
+ "pc9": -0.7709,
+ "pc10": 3.2664,
"config_summary": "effort=high, prompt_style=detailed, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=off_run1",
"short_id": "413c1f93",
"model": "glm-4.7",
- "score": 0.795,
- "pc1": -0.6145,
- "pc2": 3.793,
- "pc3": -2.3309,
- "pc4": -1.0164,
- "pc5": -1.0136,
- "pc6": -1.0628,
- "pc7": -2.1043,
- "pc8": -0.0,
- "pc9": -0.0624,
- "pc10": 1.4353,
+ "score": 0.86,
+ "pc1": -0.126,
+ "pc2": 3.8086,
+ "pc3": -0.2181,
+ "pc4": 1.9331,
+ "pc5": -0.8543,
+ "pc6": -0.4059,
+ "pc7": 0.6815,
+ "pc8": -0.37,
+ "pc9": -0.5019,
+ "pc10": 2.6913,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "9a9774f0",
"model": "glm-4.7",
- "score": 0.37,
- "pc1": -1.6372,
- "pc2": 2.1793,
- "pc3": -1.9515,
- "pc4": -0.6477,
- "pc5": 0.4698,
- "pc6": -0.9803,
- "pc7": -1.9697,
- "pc8": -0.0,
- "pc9": -0.0641,
- "pc10": 1.651,
+ "score": 0.835,
+ "pc1": -1.166,
+ "pc2": 1.9932,
+ "pc3": 0.1103,
+ "pc4": 0.9082,
+ "pc5": 0.5532,
+ "pc6": -0.2883,
+ "pc7": 0.2046,
+ "pc8": 0.0358,
+ "pc9": -0.3362,
+ "pc10": 2.2907,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
"short_id": "4a154f54",
"model": "glm-4.7",
- "score": 0.155,
- "pc1": -1.6372,
- "pc2": 2.1793,
- "pc3": -1.9515,
- "pc4": -0.6477,
- "pc5": 0.4698,
- "pc6": -0.9803,
- "pc7": -1.9697,
- "pc8": -0.0,
- "pc9": -0.0641,
- "pc10": 1.651,
+ "score": 0.705,
+ "pc1": -1.166,
+ "pc2": 1.9932,
+ "pc3": 0.1103,
+ "pc4": 0.9082,
+ "pc5": 0.5532,
+ "pc6": -0.2883,
+ "pc7": 0.2046,
+ "pc8": 0.0358,
+ "pc9": -0.3362,
+ "pc10": 2.2907,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "d072c92b",
+ "model": "glm-4.7",
+ "score": 0.705,
+ "pc1": -1.166,
+ "pc2": 1.9932,
+ "pc3": 0.1103,
+ "pc4": 0.9082,
+ "pc5": 0.5532,
+ "pc6": -0.2883,
+ "pc7": 0.2046,
+ "pc8": 0.0358,
+ "pc9": -0.3362,
+ "pc10": 2.2907,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=glm51_pw=off_prompt=detailed_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=off_run1",
"short_id": "05601da1",
"model": "glm-5.1",
- "score": 0.305,
- "pc1": 0.1858,
- "pc2": 4.9483,
- "pc3": -2.9848,
- "pc4": -2.4231,
- "pc5": -3.6438,
- "pc6": -0.3109,
- "pc7": -2.132,
- "pc8": -0.0,
- "pc9": -0.0834,
- "pc10": 2.3681,
+ "score": 0.8,
+ "pc1": 0.6962,
+ "pc2": 5.0518,
+ "pc3": -1.2174,
+ "pc4": 4.2043,
+ "pc5": -3.2763,
+ "pc6": 0.2003,
+ "pc7": 0.773,
+ "pc8": 0.0027,
+ "pc9": -0.7322,
+ "pc10": 3.3136,
"config_summary": "effort=high, prompt_style=detailed, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=off_run1",
"short_id": "a6d9fb9c",
"model": "glm-5.1",
- "score": 0.355,
- "pc1": -0.6398,
- "pc2": 3.873,
- "pc3": -2.3521,
- "pc4": -1.086,
- "pc5": -0.8783,
- "pc6": -0.2458,
- "pc7": -1.906,
- "pc8": -0.0,
- "pc9": -0.0474,
- "pc10": 1.2367,
+ "score": 0.61,
+ "pc1": -0.2586,
+ "pc2": 3.808,
+ "pc3": -0.4626,
+ "pc4": 1.958,
+ "pc5": -0.8557,
+ "pc6": 0.1044,
+ "pc7": 0.1385,
+ "pc8": 0.1366,
+ "pc9": -0.4632,
+ "pc10": 2.7385,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "7c167ef9",
"model": "glm-5.1",
- "score": 0.255,
- "pc1": -1.6626,
- "pc2": 2.2593,
- "pc3": -1.9727,
- "pc4": -0.7173,
- "pc5": 0.6052,
- "pc6": -0.1632,
- "pc7": -1.7714,
- "pc8": -0.0,
- "pc9": -0.049,
- "pc10": 1.4524,
+ "score": 0.67,
+ "pc1": -1.2985,
+ "pc2": 1.9926,
+ "pc3": -0.1341,
+ "pc4": 0.9331,
+ "pc5": 0.5518,
+ "pc6": 0.2219,
+ "pc7": -0.3384,
+ "pc8": 0.5425,
+ "pc9": -0.2975,
+ "pc10": 2.3379,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
"short_id": "cce71fd1",
"model": "glm-5.1",
- "score": 0.33,
- "pc1": -1.6626,
- "pc2": 2.2593,
- "pc3": -1.9727,
- "pc4": -0.7173,
- "pc5": 0.6052,
- "pc6": -0.1632,
- "pc7": -1.7714,
- "pc8": -0.0,
- "pc9": -0.049,
- "pc10": 1.4524,
+ "score": 0.665,
+ "pc1": -1.2985,
+ "pc2": 1.9926,
+ "pc3": -0.1341,
+ "pc4": 0.9331,
+ "pc5": 0.5518,
+ "pc6": 0.2219,
+ "pc7": -0.3384,
+ "pc8": 0.5425,
+ "pc9": -0.2975,
+ "pc10": 2.3379,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
"short_id": "9b785a51",
"model": "glm-5.1",
- "score": 0.65,
- "pc1": -1.6626,
- "pc2": 2.2593,
- "pc3": -1.9727,
- "pc4": -0.7173,
- "pc5": 0.6052,
- "pc6": -0.1632,
- "pc7": -1.7714,
- "pc8": -0.0,
- "pc9": -0.049,
- "pc10": 1.4524,
+ "score": 0.805,
+ "pc1": -1.2985,
+ "pc2": 1.9926,
+ "pc3": -0.1341,
+ "pc4": 0.9331,
+ "pc5": 0.5518,
+ "pc6": 0.2219,
+ "pc7": -0.3384,
+ "pc8": 0.5425,
+ "pc9": -0.2975,
+ "pc10": 2.3379,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run4",
"short_id": "062f01a0",
"model": "haiku-4.5",
- "score": 0.19,
- "pc1": 2.4034,
- "pc2": -0.7088,
- "pc3": -0.1729,
- "pc4": -1.0995,
- "pc5": 0.2926,
- "pc6": -0.2487,
- "pc7": -1.1091,
- "pc8": -0.0,
- "pc9": -0.0635,
- "pc10": 2.2029,
+ "score": 0.275,
+ "pc1": 3.1569,
+ "pc2": -0.6656,
+ "pc3": 0.0826,
+ "pc4": 1.1565,
+ "pc5": 0.6621,
+ "pc6": -0.0186,
+ "pc7": -0.3688,
+ "pc8": 0.3803,
+ "pc9": -0.165,
+ "pc10": 2.3638,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run5",
"short_id": "586c6b0a",
"model": "haiku-4.5",
- "score": 0.405,
- "pc1": 2.4034,
- "pc2": -0.7088,
- "pc3": -0.1729,
- "pc4": -1.0995,
- "pc5": 0.2926,
- "pc6": -0.2487,
- "pc7": -1.1091,
- "pc8": -0.0,
- "pc9": -0.0635,
- "pc10": 2.2029,
+ "score": 0.545,
+ "pc1": 3.1569,
+ "pc2": -0.6656,
+ "pc3": 0.0826,
+ "pc4": 1.1565,
+ "pc5": 0.6621,
+ "pc6": -0.0186,
+ "pc7": -0.3688,
+ "pc8": 0.3803,
+ "pc9": -0.165,
+ "pc10": 2.3638,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run6",
"short_id": "71fa204f",
"model": "haiku-4.5",
- "score": 0.68,
- "pc1": 2.4034,
- "pc2": -0.7088,
- "pc3": -0.1729,
- "pc4": -1.0995,
- "pc5": 0.2926,
- "pc6": -0.2487,
- "pc7": -1.1091,
- "pc8": -0.0,
- "pc9": -0.0635,
- "pc10": 2.2029,
+ "score": 0.65,
+ "pc1": 3.1569,
+ "pc2": -0.6656,
+ "pc3": 0.0826,
+ "pc4": 1.1565,
+ "pc5": 0.6621,
+ "pc6": -0.0186,
+ "pc7": -0.3688,
+ "pc8": 0.3803,
+ "pc9": -0.165,
+ "pc10": 2.3638,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=haiku45_pw=off_prompt=detailed_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=off_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=haiku45_pw=off_prompt=detailed_prov=anth_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=off_run2",
"short_id": "c151a356",
"model": "haiku-4.5",
- "score": 0.5,
- "pc1": 2.0801,
- "pc2": 3.9977,
- "pc3": -1.1095,
- "pc4": -2.6749,
- "pc5": -3.8064,
- "pc6": -0.4255,
- "pc7": -1.4556,
- "pc8": -0.0,
- "pc9": -0.0954,
- "pc10": 2.9452,
+ "score": 0.95,
+ "pc1": 2.9225,
+ "pc2": 4.3583,
+ "pc3": -0.3445,
+ "pc4": 4.1062,
+ "pc5": -3.3228,
+ "pc6": -0.0992,
+ "pc7": 0.9403,
+ "pc8": -0.2206,
+ "pc9": -0.6743,
+ "pc10": 3.2058,
"config_summary": "effort=high, prompt_style=detailed, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "f89a8a70",
- "model": "haiku-4.5",
- "score": 0.745,
- "pc1": 0.2316,
- "pc2": 1.3087,
- "pc3": -0.0974,
- "pc4": -0.9691,
- "pc5": 0.4426,
- "pc6": -0.2779,
- "pc7": -1.095,
- "pc8": -0.0,
- "pc9": -0.0611,
- "pc10": 2.0295,
- "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
- },
- {
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=haiku45_pw=off_prompt=simple_rndr=none_strat=none_tst=none_tedit=off_tglob=off_tgrep=off_tread=off_twrite=off_web=off_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=none_strat=none_tst=none_tedit=off_tglob=off_tgrep=off_tread=off_twrite=off_web=off_run4",
"short_id": "b29d066e",
"model": "haiku-4.5",
- "score": 0.305,
- "pc1": 6.7116,
- "pc2": 9.3841,
- "pc3": 1.4325,
- "pc4": -3.25,
- "pc5": 4.5193,
- "pc6": -0.0799,
- "pc7": 0.2008,
- "pc8": 0.0,
- "pc9": 0.0164,
- "pc10": -0.6899,
+ "score": 0.705,
+ "pc1": 7.2012,
+ "pc2": 10.207,
+ "pc3": 2.8966,
+ "pc4": 1.7973,
+ "pc5": 4.8405,
+ "pc6": -0.1982,
+ "pc7": -1.123,
+ "pc8": 0.3862,
+ "pc9": 0.3571,
+ "pc10": -0.2443,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=haiku45_pw=off_prompt=simple_rndr=none_strat=none_tst=none_tedit=off_tglob=off_tgrep=off_tread=off_twrite=off_web=off_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=none_strat=none_tst=none_tedit=off_tglob=off_tgrep=off_tread=off_twrite=off_web=off_run5",
"short_id": "1e13c72f",
"model": "haiku-4.5",
- "score": 0.155,
- "pc1": 6.7116,
- "pc2": 9.3841,
- "pc3": 1.4325,
- "pc4": -3.25,
- "pc5": 4.5193,
- "pc6": -0.0799,
- "pc7": 0.2008,
- "pc8": 0.0,
- "pc9": 0.0164,
- "pc10": -0.6899,
+ "score": 0.61,
+ "pc1": 7.2012,
+ "pc2": 10.207,
+ "pc3": 2.8966,
+ "pc4": 1.7973,
+ "pc5": 4.8405,
+ "pc6": -0.1982,
+ "pc7": -1.123,
+ "pc8": 0.3862,
+ "pc9": 0.3571,
+ "pc10": -0.2443,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=haiku45_pw=off_prompt=simple_rndr=none_strat=none_tst=none_tedit=off_tglob=off_tgrep=off_tread=off_twrite=off_web=off_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=none_strat=none_tst=none_tedit=off_tglob=off_tgrep=off_tread=off_twrite=off_web=off_run6",
"short_id": "56088123",
"model": "haiku-4.5",
- "score": 0.305,
- "pc1": 6.7116,
- "pc2": 9.3841,
- "pc3": 1.4325,
- "pc4": -3.25,
- "pc5": 4.5193,
- "pc6": -0.0799,
- "pc7": 0.2008,
- "pc8": 0.0,
- "pc9": 0.0164,
- "pc10": -0.6899,
+ "score": 0.665,
+ "pc1": 7.2012,
+ "pc2": 10.207,
+ "pc3": 2.8966,
+ "pc4": 1.7973,
+ "pc5": 4.8405,
+ "pc6": -0.1982,
+ "pc7": -1.123,
+ "pc8": 0.3862,
+ "pc9": 0.3571,
+ "pc10": -0.2443,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=haiku45_pw=off_prompt=simple_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=off_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=off_run2",
"short_id": "1fdd595b",
"model": "haiku-4.5",
- "score": 0.355,
- "pc1": 1.2544,
- "pc2": 2.9224,
- "pc3": -0.4768,
- "pc4": -1.3378,
- "pc5": -1.0409,
- "pc6": -0.3604,
- "pc7": -1.2295,
- "pc8": -0.0,
- "pc9": -0.0594,
- "pc10": 1.8138,
+ "score": 0.835,
+ "pc1": 1.9678,
+ "pc2": 3.1146,
+ "pc3": 0.4104,
+ "pc4": 1.8599,
+ "pc5": -0.9022,
+ "pc6": -0.1951,
+ "pc7": 0.3058,
+ "pc8": -0.0867,
+ "pc9": -0.4053,
+ "pc10": 2.6306,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "f89a8a70",
+ "model": "haiku-4.5",
+ "score": 0.87,
+ "pc1": 0.9278,
+ "pc2": 1.2991,
+ "pc3": 0.7388,
+ "pc4": 0.835,
+ "pc5": 0.5053,
+ "pc6": -0.0776,
+ "pc7": -0.1711,
+ "pc8": 0.3191,
+ "pc9": -0.2396,
+ "pc10": 2.2301,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run4",
"short_id": "bd51c309",
"model": "opus-4.6",
- "score": 0.49,
- "pc1": 2.2962,
- "pc2": -1.33,
- "pc3": -0.4515,
- "pc4": -1.3388,
- "pc5": 0.2521,
- "pc6": -0.3265,
- "pc7": -1.3526,
- "pc8": -0.0,
- "pc9": -0.0654,
- "pc10": 2.078,
+ "score": 0.84,
+ "pc1": 2.9827,
+ "pc2": -1.4028,
+ "pc3": 0.0121,
+ "pc4": 1.4634,
+ "pc5": 0.7393,
+ "pc6": 0.0463,
+ "pc7": -0.5676,
+ "pc8": 0.4421,
+ "pc9": -0.2251,
+ "pc10": 2.4551,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run5",
"short_id": "d184704b",
"model": "opus-4.6",
- "score": 0.915,
- "pc1": 2.2962,
- "pc2": -1.33,
- "pc3": -0.4515,
- "pc4": -1.3388,
- "pc5": 0.2521,
- "pc6": -0.3265,
- "pc7": -1.3526,
- "pc8": -0.0,
- "pc9": -0.0654,
- "pc10": 2.078,
+ "score": 0.92,
+ "pc1": 2.9827,
+ "pc2": -1.4028,
+ "pc3": 0.0121,
+ "pc4": 1.4634,
+ "pc5": 0.7393,
+ "pc6": 0.0463,
+ "pc7": -0.5676,
+ "pc8": 0.4421,
+ "pc9": -0.2251,
+ "pc10": 2.4551,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run6",
"short_id": "135b43a3",
"model": "opus-4.6",
- "score": 0.315,
- "pc1": 2.2962,
- "pc2": -1.33,
- "pc3": -0.4515,
- "pc4": -1.3388,
- "pc5": 0.2521,
- "pc6": -0.3265,
- "pc7": -1.3526,
- "pc8": -0.0,
- "pc9": -0.0654,
- "pc10": 2.078,
+ "score": 0.625,
+ "pc1": 2.9827,
+ "pc2": -1.4028,
+ "pc3": 0.0121,
+ "pc4": 1.4634,
+ "pc5": 0.7393,
+ "pc6": 0.0463,
+ "pc7": -0.5676,
+ "pc8": 0.4421,
+ "pc9": -0.2251,
+ "pc10": 2.4551,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=qwen36p_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "e0c413bd",
"model": "qwen-3.6-plus",
- "score": 0.305,
- "pc1": -1.6374,
- "pc2": 1.8141,
- "pc3": 1.993,
- "pc4": -1.1517,
- "pc5": -0.1125,
- "pc6": -0.9702,
- "pc7": -1.8998,
- "pc8": -0.0,
- "pc9": -0.1025,
- "pc10": 1.7251,
+ "score": 0.44,
+ "pc1": -0.7046,
+ "pc2": 1.5175,
+ "pc3": 3.7359,
+ "pc4": 0.0292,
+ "pc5": -0.7311,
+ "pc6": 0.494,
+ "pc7": -0.0562,
+ "pc8": 0.0687,
+ "pc9": -0.2141,
+ "pc10": 2.4591,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run4",
"short_id": "05536f95",
"model": "sonnet-4.6",
- "score": 0.37,
- "pc1": 2.2867,
- "pc2": -1.3242,
- "pc3": -0.4493,
- "pc4": -1.3386,
- "pc5": 0.2542,
- "pc6": -0.3248,
- "pc7": -1.349,
- "pc8": -0.0,
- "pc9": -0.0654,
- "pc10": 2.0794,
+ "score": 0.835,
+ "pc1": 2.9748,
+ "pc2": -1.3947,
+ "pc3": 0.016,
+ "pc4": 1.4835,
+ "pc5": 0.7017,
+ "pc6": 0.1101,
+ "pc7": -0.4865,
+ "pc8": 0.3051,
+ "pc9": -0.0793,
+ "pc10": 2.5006,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run5",
"short_id": "f8a57948",
"model": "sonnet-4.6",
- "score": 0.28,
- "pc1": 2.2867,
- "pc2": -1.3242,
- "pc3": -0.4493,
- "pc4": -1.3386,
- "pc5": 0.2542,
- "pc6": -0.3248,
- "pc7": -1.349,
- "pc8": -0.0,
- "pc9": -0.0654,
- "pc10": 2.0794,
+ "score": 0.835,
+ "pc1": 2.9748,
+ "pc2": -1.3947,
+ "pc3": 0.016,
+ "pc4": 1.4835,
+ "pc5": 0.7017,
+ "pc6": 0.1101,
+ "pc7": -0.4865,
+ "pc8": 0.3051,
+ "pc9": -0.0793,
+ "pc10": 2.5006,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run6",
"short_id": "69bb8919",
"model": "sonnet-4.6",
- "score": 0.835,
- "pc1": 2.2867,
- "pc2": -1.3242,
- "pc3": -0.4493,
- "pc4": -1.3386,
- "pc5": 0.2542,
- "pc6": -0.3248,
- "pc7": -1.349,
- "pc8": -0.0,
- "pc9": -0.0654,
- "pc10": 2.0794,
+ "score": 0.915,
+ "pc1": 2.9748,
+ "pc2": -1.3947,
+ "pc3": 0.016,
+ "pc4": 1.4835,
+ "pc5": 0.7017,
+ "pc6": 0.1101,
+ "pc7": -0.4865,
+ "pc8": 0.3051,
+ "pc9": -0.0793,
+ "pc10": 2.5006,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=high_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "5a56e90e",
- "model": "gemma-4-26b",
- "score": 0.325,
- "pc1": -1.9115,
- "pc2": 0.3439,
- "pc3": 2.4833,
- "pc4": 3.2233,
- "pc5": -1.1141,
- "pc6": -0.216,
- "pc7": -0.1643,
- "pc8": -0.0,
- "pc9": -0.0827,
- "pc10": 1.4035,
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=high_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "1f33a77b",
+ "model": "glm-4.7",
+ "score": 0.555,
+ "pc1": -1.2354,
+ "pc2": 0.3704,
+ "pc3": -1.5769,
+ "pc4": -3.3946,
+ "pc5": -1.0821,
+ "pc6": -0.0277,
+ "pc7": 1.1105,
+ "pc8": -0.1709,
+ "pc9": -0.3879,
+ "pc10": 0.0056,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=high"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=high_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "1f33a77b",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=high_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "006df88f",
"model": "glm-4.7",
- "score": 0.155,
- "pc1": -1.8732,
- "pc2": 0.7107,
- "pc3": -1.4373,
- "pc4": 3.7036,
- "pc5": -0.6061,
- "pc6": -0.7316,
- "pc7": -0.7875,
- "pc8": -0.0,
- "pc9": -0.04,
- "pc10": 0.8547,
+ "score": 0.63,
+ "pc1": -1.2354,
+ "pc2": 0.3704,
+ "pc3": -1.5769,
+ "pc4": -3.3946,
+ "pc5": -1.0821,
+ "pc6": -0.0277,
+ "pc7": 1.1105,
+ "pc8": -0.1709,
+ "pc9": -0.3879,
+ "pc10": 0.0056,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=high"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=high_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
"short_id": "f2b6194f",
"model": "glm-4.7",
- "score": 0.595,
- "pc1": -1.8732,
- "pc2": 0.7107,
- "pc3": -1.4373,
- "pc4": 3.7036,
- "pc5": -0.6061,
- "pc6": -0.7316,
- "pc7": -0.7875,
- "pc8": -0.0,
- "pc9": -0.04,
- "pc10": 0.8547,
+ "score": 0.77,
+ "pc1": -1.2354,
+ "pc2": 0.3704,
+ "pc3": -1.5769,
+ "pc4": -3.3946,
+ "pc5": -1.0821,
+ "pc6": -0.0277,
+ "pc7": 1.1105,
+ "pc8": -0.1709,
+ "pc9": -0.3879,
+ "pc10": 0.0056,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=high"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=high_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "ec163e63",
"model": "glm-5.1",
- "score": 0.3,
- "pc1": -1.8986,
- "pc2": 0.7906,
- "pc3": -1.4585,
- "pc4": 3.634,
- "pc5": -0.4707,
- "pc6": 0.0854,
- "pc7": -0.5892,
- "pc8": -0.0,
- "pc9": -0.0249,
- "pc10": 0.6562,
+ "score": 0.825,
+ "pc1": -1.3679,
+ "pc2": 0.3698,
+ "pc3": -1.8214,
+ "pc4": -3.3696,
+ "pc5": -1.0835,
+ "pc6": 0.4825,
+ "pc7": 0.5676,
+ "pc8": 0.3357,
+ "pc9": -0.3492,
+ "pc10": 0.0528,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=high"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=high_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
"short_id": "38de2555",
"model": "glm-5.1",
- "score": 0.23,
- "pc1": -1.8986,
- "pc2": 0.7906,
- "pc3": -1.4585,
- "pc4": 3.634,
- "pc5": -0.4707,
- "pc6": 0.0854,
- "pc7": -0.5892,
- "pc8": -0.0,
- "pc9": -0.0249,
- "pc10": 0.6562,
+ "score": 0.785,
+ "pc1": -1.3679,
+ "pc2": 0.3698,
+ "pc3": -1.8214,
+ "pc4": -3.3696,
+ "pc5": -1.0835,
+ "pc6": 0.4825,
+ "pc7": 0.5676,
+ "pc8": 0.3357,
+ "pc9": -0.3492,
+ "pc10": 0.0528,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=high"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=high_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
"short_id": "11d06468",
"model": "glm-5.1",
- "score": 0.325,
- "pc1": -1.8986,
- "pc2": 0.7906,
- "pc3": -1.4585,
- "pc4": 3.634,
- "pc5": -0.4707,
- "pc6": 0.0854,
- "pc7": -0.5892,
- "pc8": -0.0,
- "pc9": -0.0249,
- "pc10": 0.6562,
+ "score": 0.855,
+ "pc1": -1.3679,
+ "pc2": 0.3698,
+ "pc3": -1.8214,
+ "pc4": -3.3696,
+ "pc5": -1.0835,
+ "pc6": 0.4825,
+ "pc7": 0.5676,
+ "pc8": 0.3357,
+ "pc9": -0.3492,
+ "pc10": 0.0528,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=high"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=high_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=high_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run4",
"short_id": "004dc1a5",
"model": "haiku-4.5",
- "score": 0.155,
- "pc1": 2.1674,
- "pc2": -2.1775,
- "pc3": 0.3413,
- "pc4": 3.2518,
- "pc5": -0.7833,
- "pc6": -0.0,
- "pc7": 0.0731,
- "pc8": 0.0,
- "pc9": -0.0394,
- "pc10": 1.4066,
+ "score": 0.625,
+ "pc1": 3.0875,
+ "pc2": -2.2884,
+ "pc3": -1.6046,
+ "pc4": -3.1462,
+ "pc5": -0.9732,
+ "pc6": 0.242,
+ "pc7": 0.5372,
+ "pc8": 0.1735,
+ "pc9": -0.2167,
+ "pc10": 0.0787,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=high, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=high_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=high_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run5",
"short_id": "95414e63",
"model": "haiku-4.5",
- "score": 0.34,
- "pc1": 2.1674,
- "pc2": -2.1775,
- "pc3": 0.3413,
- "pc4": 3.2518,
- "pc5": -0.7833,
- "pc6": -0.0,
- "pc7": 0.0731,
- "pc8": 0.0,
- "pc9": -0.0394,
- "pc10": 1.4066,
+ "score": 0.61,
+ "pc1": 3.0875,
+ "pc2": -2.2884,
+ "pc3": -1.6046,
+ "pc4": -3.1462,
+ "pc5": -0.9732,
+ "pc6": 0.242,
+ "pc7": 0.5372,
+ "pc8": 0.1735,
+ "pc9": -0.2167,
+ "pc10": 0.0787,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=high, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=high_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=high_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run6",
"short_id": "805f705d",
"model": "haiku-4.5",
- "score": 0.405,
- "pc1": 2.1674,
- "pc2": -2.1775,
- "pc3": 0.3413,
- "pc4": 3.2518,
- "pc5": -0.7833,
- "pc6": -0.0,
- "pc7": 0.0731,
- "pc8": 0.0,
- "pc9": -0.0394,
- "pc10": 1.4066,
+ "score": 0.665,
+ "pc1": 3.0875,
+ "pc2": -2.2884,
+ "pc3": -1.6046,
+ "pc4": -3.1462,
+ "pc5": -0.9732,
+ "pc6": 0.242,
+ "pc7": 0.5372,
+ "pc8": 0.1735,
+ "pc9": -0.2167,
+ "pc10": 0.0787,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=high, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=high_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=high_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run4",
"short_id": "b51daba4",
"model": "opus-4.6",
- "score": 0.835,
- "pc1": 2.0602,
- "pc2": -2.7987,
- "pc3": 0.0627,
- "pc4": 3.0125,
- "pc5": -0.8238,
- "pc6": -0.0779,
- "pc7": -0.1704,
- "pc8": 0.0,
- "pc9": -0.0413,
- "pc10": 1.2818,
+ "score": 0.87,
+ "pc1": 2.9133,
+ "pc2": -3.0256,
+ "pc3": -1.6751,
+ "pc4": -2.8393,
+ "pc5": -0.896,
+ "pc6": 0.3069,
+ "pc7": 0.3384,
+ "pc8": 0.2354,
+ "pc9": -0.2768,
+ "pc10": 0.1699,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=high, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=high_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=high_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run5",
"short_id": "c946c543",
"model": "opus-4.6",
- "score": 0.49,
- "pc1": 2.0602,
- "pc2": -2.7987,
- "pc3": 0.0627,
- "pc4": 3.0125,
- "pc5": -0.8238,
- "pc6": -0.0779,
- "pc7": -0.1704,
- "pc8": 0.0,
- "pc9": -0.0413,
- "pc10": 1.2818,
+ "score": 0.935,
+ "pc1": 2.9133,
+ "pc2": -3.0256,
+ "pc3": -1.6751,
+ "pc4": -2.8393,
+ "pc5": -0.896,
+ "pc6": 0.3069,
+ "pc7": 0.3384,
+ "pc8": 0.2354,
+ "pc9": -0.2768,
+ "pc10": 0.1699,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=high, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=high_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=high_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run6",
"short_id": "66d681fb",
"model": "opus-4.6",
- "score": 0.835,
- "pc1": 2.0602,
- "pc2": -2.7987,
- "pc3": 0.0627,
- "pc4": 3.0125,
- "pc5": -0.8238,
- "pc6": -0.0779,
- "pc7": -0.1704,
- "pc8": 0.0,
- "pc9": -0.0413,
- "pc10": 1.2818,
+ "score": 0.765,
+ "pc1": 2.9133,
+ "pc2": -3.0256,
+ "pc3": -1.6751,
+ "pc4": -2.8393,
+ "pc5": -0.896,
+ "pc6": 0.3069,
+ "pc7": 0.3384,
+ "pc8": 0.2354,
+ "pc9": -0.2768,
+ "pc10": 0.1699,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=high, strategy=use_subagents"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=high_model=qwen36p_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "2a96cb7b",
"model": "qwen-3.6-plus",
- "score": 0.255,
- "pc1": -1.8734,
- "pc2": 0.3455,
- "pc3": 2.5073,
- "pc4": 3.1996,
- "pc5": -1.1884,
- "pc6": -0.7215,
- "pc7": -0.7176,
- "pc8": -0.0,
- "pc9": -0.0785,
- "pc10": 0.9288,
+ "score": 0.7,
+ "pc1": -0.774,
+ "pc2": -0.1053,
+ "pc3": 2.0487,
+ "pc4": -4.2735,
+ "pc5": -2.3664,
+ "pc6": 0.7546,
+ "pc7": 0.8497,
+ "pc8": -0.138,
+ "pc9": -0.2658,
+ "pc10": 0.174,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=high"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=high_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=high_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run4",
"short_id": "671816fb",
"model": "sonnet-4.6",
- "score": 0.28,
- "pc1": 2.0507,
- "pc2": -2.7928,
- "pc3": 0.0649,
- "pc4": 3.0128,
- "pc5": -0.8217,
- "pc6": -0.0762,
- "pc7": -0.1668,
- "pc8": -0.0,
- "pc9": -0.0413,
- "pc10": 1.2831,
+ "score": 0.835,
+ "pc1": 2.9054,
+ "pc2": -3.0174,
+ "pc3": -1.6712,
+ "pc4": -2.8192,
+ "pc5": -0.9336,
+ "pc6": 0.3707,
+ "pc7": 0.4195,
+ "pc8": 0.0984,
+ "pc9": -0.131,
+ "pc10": 0.2155,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=high, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=high_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=high_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run5",
"short_id": "4ba3ba91",
"model": "sonnet-4.6",
- "score": 0.28,
- "pc1": 2.0507,
- "pc2": -2.7928,
- "pc3": 0.0649,
- "pc4": 3.0128,
- "pc5": -0.8217,
- "pc6": -0.0762,
- "pc7": -0.1668,
- "pc8": -0.0,
- "pc9": -0.0413,
- "pc10": 1.2831,
+ "score": 0.625,
+ "pc1": 2.9054,
+ "pc2": -3.0174,
+ "pc3": -1.6712,
+ "pc4": -2.8192,
+ "pc5": -0.9336,
+ "pc6": 0.3707,
+ "pc7": 0.4195,
+ "pc8": 0.0984,
+ "pc9": -0.131,
+ "pc10": 0.2155,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=high, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=high_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=high_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run6",
"short_id": "d7998414",
"model": "sonnet-4.6",
- "score": 0.19,
- "pc1": 2.0507,
- "pc2": -2.7928,
- "pc3": 0.0649,
- "pc4": 3.0128,
- "pc5": -0.8217,
- "pc6": -0.0762,
- "pc7": -0.1668,
- "pc8": -0.0,
- "pc9": -0.0413,
- "pc10": 1.2831,
+ "score": 0.715,
+ "pc1": 2.9054,
+ "pc2": -3.0174,
+ "pc3": -1.6712,
+ "pc4": -2.8192,
+ "pc5": -0.9336,
+ "pc6": 0.3707,
+ "pc7": 0.4195,
+ "pc8": 0.0984,
+ "pc9": -0.131,
+ "pc10": 0.2155,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=high, strategy=use_subagents"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=avail_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "0aebd636",
"model": "gemma-4-26b",
- "score": 0.325,
- "pc1": -1.4135,
- "pc2": -0.6547,
- "pc3": 2.2399,
- "pc4": -0.4133,
- "pc5": -0.2853,
- "pc6": 0.0183,
- "pc7": 0.1742,
- "pc8": -0.0,
- "pc9": -0.0373,
- "pc10": 0.3127,
+ "score": 0.5,
+ "pc1": -0.4063,
+ "pc2": -0.9935,
+ "pc3": 3.0475,
+ "pc4": -0.3883,
+ "pc5": -0.4689,
+ "pc6": 0.1777,
+ "pc7": 0.5913,
+ "pc8": -0.3174,
+ "pc9": -0.257,
+ "pc10": -0.22,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=avail_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "d4bac5c7",
+ "model": "gemma-4-26b",
+ "score": 0.3,
+ "pc1": -0.4063,
+ "pc2": -0.9935,
+ "pc3": 3.0475,
+ "pc4": -0.3883,
+ "pc5": -0.4689,
+ "pc6": 0.1777,
+ "pc7": 0.5913,
+ "pc8": -0.3174,
+ "pc9": -0.257,
+ "pc10": -0.22,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=inst_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "f8db33ba",
"model": "gemma-4-26b",
- "score": 0.325,
- "pc1": -2.3603,
- "pc2": -0.1459,
- "pc3": 2.2985,
- "pc4": -0.3352,
- "pc5": -0.2931,
- "pc6": -0.1057,
- "pc7": -0.0737,
- "pc8": -0.0,
- "pc9": -0.0457,
- "pc10": 0.1495,
+ "score": 0.5,
+ "pc1": -1.2546,
+ "pc2": -0.5868,
+ "pc3": 3.5851,
+ "pc4": -0.7229,
+ "pc5": -0.6786,
+ "pc6": 0.055,
+ "pc7": 1.0188,
+ "pc8": -0.1456,
+ "pc9": -0.5455,
+ "pc10": -0.3283,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=detailed_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "aafd88ff",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=inst_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "716e5464",
"model": "gemma-4-26b",
- "score": 0.325,
- "pc1": -1.7163,
- "pc2": 1.3971,
- "pc3": 1.7118,
- "pc4": -1.5302,
- "pc5": -3.0862,
- "pc6": -0.0977,
- "pc7": -0.1063,
- "pc8": -0.0,
- "pc9": -0.0785,
- "pc10": 1.4823,
- "config_summary": "effort=high, prompt_style=detailed, language=typescript, max_budget=low"
+ "score": 0.575,
+ "pc1": -1.2546,
+ "pc2": -0.5868,
+ "pc3": 3.5851,
+ "pc4": -0.7229,
+ "pc5": -0.6786,
+ "pc6": 0.055,
+ "pc7": 1.0188,
+ "pc8": -0.1456,
+ "pc9": -0.5455,
+ "pc10": -0.3283,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=inst_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "7eabfdf7",
+ "model": "gemma-4-26b",
+ "score": 0.485,
+ "pc1": -1.2546,
+ "pc2": -0.5868,
+ "pc3": 3.5851,
+ "pc4": -0.7229,
+ "pc5": -0.6786,
+ "pc6": 0.055,
+ "pc7": 1.0188,
+ "pc8": -0.1456,
+ "pc9": -0.5455,
+ "pc10": -0.3283,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=canvas_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "765055ed",
- "model": "gemma-4-26b",
- "score": 0.325,
- "pc1": -3.4855,
- "pc2": 0.5816,
- "pc3": 2.4865,
- "pc4": 0.027,
- "pc5": 0.2573,
- "pc6": 3.6594,
- "pc7": 4.0252,
- "pc8": 0.0,
- "pc9": -0.059,
- "pc10": 3.4459,
- "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
- },
- {
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=dom_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "fce1a2a3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=detailed_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "8ea242de",
"model": "gemma-4-26b",
- "score": 0.325,
- "pc1": -3.5469,
- "pc2": 0.6499,
- "pc3": 1.869,
- "pc4": 0.1033,
- "pc5": 0.3832,
- "pc6": 3.7586,
- "pc7": 3.8448,
- "pc8": 0.0,
- "pc9": -0.0489,
- "pc10": 3.244,
- "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
- },
- {
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=cv_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "54fda709",
+ "score": 0.5,
+ "pc1": -0.6295,
+ "pc2": 1.2069,
+ "pc3": 2.5848,
+ "pc4": 1.5711,
+ "pc5": -3.1289,
+ "pc6": 0.2735,
+ "pc7": 1.3928,
+ "pc8": -0.5251,
+ "pc9": -0.6096,
+ "pc10": 0.3385,
+ "config_summary": "effort=high, prompt_style=detailed, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=cv_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "d6aa17b0",
"model": "gemma-4-26b",
- "score": 0.325,
- "pc1": -2.4141,
- "pc2": -0.2109,
- "pc3": 2.3441,
- "pc4": -0.043,
- "pc5": -0.4864,
- "pc6": -0.3226,
- "pc7": -0.2019,
- "pc8": -0.0,
- "pc9": -0.0618,
- "pc10": 0.4976,
+ "score": 0.785,
+ "pc1": -1.3534,
+ "pc2": -0.6237,
+ "pc3": 3.3821,
+ "pc4": -0.9134,
+ "pc5": -1.1948,
+ "pc6": 0.2715,
+ "pc7": 0.9022,
+ "pc8": -0.5108,
+ "pc9": -0.3235,
+ "pc10": -0.5779,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=creative_validate"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=delegate_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "c19f52ca",
"model": "gemma-4-26b",
- "score": 0.325,
- "pc1": -2.3759,
- "pc2": -0.2572,
- "pc3": 2.9884,
- "pc4": -0.1445,
- "pc5": -0.5781,
- "pc6": -0.1282,
- "pc7": 0.0043,
- "pc8": -0.0,
- "pc9": -0.0674,
- "pc10": 0.5848,
+ "score": 0.5,
+ "pc1": -1.4128,
+ "pc2": -0.5892,
+ "pc3": 3.0218,
+ "pc4": -0.7738,
+ "pc5": -1.0241,
+ "pc6": 0.3239,
+ "pc7": 1.1914,
+ "pc8": -0.6302,
+ "pc9": -0.4691,
+ "pc10": -0.0027,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=delegate"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=iterate_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "bf3b4c1a",
"model": "gemma-4-26b",
- "score": 0.325,
- "pc1": -2.4061,
- "pc2": -0.2176,
- "pc3": 2.4864,
- "pc4": -0.0739,
- "pc5": -0.4894,
- "pc6": -0.155,
- "pc7": -0.1232,
- "pc8": -0.0,
- "pc9": -0.0605,
- "pc10": 0.4833,
+ "score": 0.785,
+ "pc1": -1.3705,
+ "pc2": -0.6117,
+ "pc3": 3.4813,
+ "pc4": -0.7167,
+ "pc5": -1.0782,
+ "pc6": -0.0654,
+ "pc7": 1.1098,
+ "pc8": -0.6266,
+ "pc9": -0.6948,
+ "pc10": -0.3319,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=iterate"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=iterate_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "57f6ae14",
+ "model": "gemma-4-26b",
+ "score": 0.485,
+ "pc1": -1.3705,
+ "pc2": -0.6117,
+ "pc3": 3.4813,
+ "pc4": -0.7167,
+ "pc5": -1.0782,
+ "pc6": -0.0654,
+ "pc7": 1.1098,
+ "pc8": -0.6266,
+ "pc9": -0.6948,
+ "pc10": -0.3319,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=iterate"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=off_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "c34e2662",
"model": "gemma-4-26b",
- "score": 0.365,
- "pc1": -1.4093,
- "pc2": 1.6852,
- "pc3": 2.8484,
- "pc4": 0.1538,
- "pc5": 0.6821,
- "pc6": 0.1197,
- "pc7": 0.9968,
- "pc8": 0.0,
- "pc9": -0.0028,
- "pc10": -0.9367,
+ "score": 0.485,
+ "pc1": -0.5008,
+ "pc2": 1.455,
+ "pc3": 3.7391,
+ "pc4": -1.4769,
+ "pc5": 0.0017,
+ "pc6": 0.2178,
+ "pc7": 0.5827,
+ "pc8": -0.8742,
+ "pc9": 0.0056,
+ "pc10": -2.1981,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=off_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "cdf78fbb",
+ "model": "gemma-4-26b",
+ "score": 0.485,
+ "pc1": -0.5008,
+ "pc2": 1.455,
+ "pc3": 3.7391,
+ "pc4": -1.4769,
+ "pc5": 0.0017,
+ "pc6": 0.2178,
+ "pc7": 0.5827,
+ "pc8": -0.8742,
+ "pc9": 0.0056,
+ "pc10": -2.1981,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=off_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "446f509a",
+ "model": "gemma-4-26b",
+ "score": 0.485,
+ "pc1": -0.5008,
+ "pc2": 1.455,
+ "pc3": 3.7391,
+ "pc4": -1.4769,
+ "pc5": 0.0017,
+ "pc6": 0.2178,
+ "pc7": 0.5827,
+ "pc8": -0.8742,
+ "pc9": 0.0056,
+ "pc10": -2.1981,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=off_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "e7f9904c",
"model": "gemma-4-26b",
- "score": 0.355,
- "pc1": -1.5859,
- "pc2": 1.4417,
- "pc3": 2.924,
- "pc4": -1.6221,
- "pc5": 1.7909,
- "pc6": 0.3955,
- "pc7": 1.4863,
- "pc8": 0.0,
- "pc9": 0.0299,
- "pc10": -1.7495,
+ "score": 0.5,
+ "pc1": -0.755,
+ "pc2": 1.1341,
+ "pc3": 4.4658,
+ "pc4": 0.0021,
+ "pc5": 1.6465,
+ "pc6": 0.1741,
+ "pc7": 0.1295,
+ "pc8": -0.1417,
+ "pc9": 0.3502,
+ "pc10": -2.7717,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=off_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "d4e67364",
+ "model": "gemma-4-26b",
+ "score": 0.485,
+ "pc1": -0.755,
+ "pc2": 1.1341,
+ "pc3": 4.4658,
+ "pc4": 0.0021,
+ "pc5": 1.6465,
+ "pc6": 0.1741,
+ "pc7": 0.1295,
+ "pc8": -0.1417,
+ "pc9": 0.3502,
+ "pc10": -2.7717,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=off_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "bbf13f79",
+ "model": "gemma-4-26b",
+ "score": 0.485,
+ "pc1": -0.755,
+ "pc2": 1.1341,
+ "pc3": 4.4658,
+ "pc4": 0.0021,
+ "pc5": 1.6465,
+ "pc6": 0.1741,
+ "pc7": 0.1295,
+ "pc8": -0.1417,
+ "pc9": 0.3502,
+ "pc10": -2.7717,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=off_tread=on_twrite=on_web=on_run1",
"short_id": "dd347ea0",
"model": "gemma-4-26b",
- "score": 0.425,
- "pc1": -1.4756,
- "pc2": 1.6331,
- "pc3": 2.6179,
- "pc4": -0.7046,
- "pc5": 1.4599,
- "pc6": -0.3509,
- "pc7": -0.9106,
- "pc8": -0.0,
- "pc9": -0.0915,
- "pc10": 1.7676,
+ "score": 0.575,
+ "pc1": -0.477,
+ "pc2": 1.4449,
+ "pc3": 3.9481,
+ "pc4": -0.6642,
+ "pc5": 1.2875,
+ "pc6": 0.0238,
+ "pc7": 0.0297,
+ "pc8": -0.0456,
+ "pc9": -0.4759,
+ "pc10": 1.4214,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=off_tread=on_twrite=on_web=on_run2",
+ "short_id": "152581f0",
+ "model": "gemma-4-26b",
+ "score": 0.59,
+ "pc1": -0.477,
+ "pc2": 1.4449,
+ "pc3": 3.9481,
+ "pc4": -0.6642,
+ "pc5": 1.2875,
+ "pc6": 0.0238,
+ "pc7": 0.0297,
+ "pc8": -0.0456,
+ "pc9": -0.4759,
+ "pc10": 1.4214,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=off_tread=on_twrite=on_web=on_run3",
+ "short_id": "67559863",
+ "model": "gemma-4-26b",
+ "score": 0.485,
+ "pc1": -0.477,
+ "pc2": 1.4449,
+ "pc3": 3.9481,
+ "pc4": -0.6642,
+ "pc5": 1.2875,
+ "pc6": 0.0238,
+ "pc7": 0.0297,
+ "pc8": -0.0456,
+ "pc9": -0.4759,
+ "pc10": 1.4214,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=off_twrite=on_web=on_run1",
"short_id": "05eb856a",
"model": "gemma-4-26b",
- "score": 0.425,
- "pc1": -1.3495,
- "pc2": 1.6713,
- "pc3": 2.5303,
- "pc4": -1.6407,
- "pc5": -1.1543,
- "pc6": 0.1323,
- "pc7": 0.775,
- "pc8": 0.0,
- "pc9": -0.0388,
- "pc10": 0.2623,
+ "score": 0.485,
+ "pc1": -0.4799,
+ "pc2": 1.4382,
+ "pc3": 3.6796,
+ "pc4": 0.8942,
+ "pc5": -1.0844,
+ "pc6": 0.6256,
+ "pc7": 0.6907,
+ "pc8": -0.0664,
+ "pc9": -0.2298,
+ "pc10": -0.832,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=off_twrite=on_web=on_run2",
+ "short_id": "6c6ed5be",
+ "model": "gemma-4-26b",
+ "score": 0.395,
+ "pc1": -0.4799,
+ "pc2": 1.4382,
+ "pc3": 3.6796,
+ "pc4": 0.8942,
+ "pc5": -1.0844,
+ "pc6": 0.6256,
+ "pc7": 0.6907,
+ "pc8": -0.0664,
+ "pc9": -0.2298,
+ "pc10": -0.832,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=off_web=on_run1",
"short_id": "e8bc86cf",
"model": "gemma-4-26b",
- "score": 0.44,
- "pc1": -1.4325,
- "pc2": 1.6395,
- "pc3": 2.7115,
- "pc4": 0.9358,
- "pc5": 1.178,
- "pc6": -0.1792,
- "pc7": -0.3187,
- "pc8": -0.0,
- "pc9": -0.0332,
- "pc10": -0.0928,
+ "score": 0.485,
+ "pc1": -0.4754,
+ "pc2": 1.4361,
+ "pc3": 3.352,
+ "pc4": -2.1938,
+ "pc5": 0.3497,
+ "pc6": -0.1565,
+ "pc7": 0.9305,
+ "pc8": -0.3552,
+ "pc9": -0.5908,
+ "pc10": 0.3219,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=off_web=on_run2",
+ "short_id": "c43a1165",
+ "model": "gemma-4-26b",
+ "score": 0.5,
+ "pc1": -0.4754,
+ "pc2": 1.4361,
+ "pc3": 3.352,
+ "pc4": -2.1938,
+ "pc5": 0.3497,
+ "pc6": -0.1565,
+ "pc7": 0.9305,
+ "pc8": -0.3552,
+ "pc9": -0.5908,
+ "pc10": 0.3219,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=off_web=on_run3",
+ "short_id": "ecb56903",
+ "model": "gemma-4-26b",
+ "score": 0.275,
+ "pc1": -0.4754,
+ "pc2": 1.4361,
+ "pc3": 3.352,
+ "pc4": -2.1938,
+ "pc5": 0.3497,
+ "pc6": -0.1565,
+ "pc7": 0.9305,
+ "pc8": -0.3552,
+ "pc9": -0.5908,
+ "pc10": 0.3219,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=off_run1",
- "short_id": "74535069",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=off_run3",
+ "short_id": "cbfdd709",
"model": "gemma-4-26b",
- "score": 0.325,
- "pc1": -1.5193,
- "pc2": 1.9355,
- "pc3": 1.9652,
- "pc4": -0.5618,
- "pc5": -1.8042,
- "pc6": -0.1152,
- "pc7": -0.0148,
- "pc8": -0.0,
- "pc9": -0.0408,
- "pc10": 0.1352,
+ "score": 0.5,
+ "pc1": -0.5443,
+ "pc2": 1.7786,
+ "pc3": 3.0112,
+ "pc4": 0.3497,
+ "pc5": -2.1159,
+ "pc6": 0.06,
+ "pc7": 1.2353,
+ "pc8": -0.797,
+ "pc9": -0.5063,
+ "pc10": 0.1638,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "40e5421b",
"model": "gemma-4-26b",
- "score": 0.425,
- "pc1": -2.542,
- "pc2": 0.3218,
- "pc3": 2.3446,
- "pc4": -0.1931,
- "pc5": -0.3208,
- "pc6": -0.0326,
- "pc7": 0.1197,
- "pc8": -0.0,
- "pc9": -0.0424,
- "pc10": 0.3509,
- "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
- },
- {
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=plan_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "bb2a4c1f",
+ "score": 0.475,
+ "pc1": -1.5843,
+ "pc2": -0.0368,
+ "pc3": 3.3397,
+ "pc4": -0.6752,
+ "pc5": -0.7084,
+ "pc6": 0.1776,
+ "pc7": 0.7584,
+ "pc8": -0.3912,
+ "pc9": -0.3406,
+ "pc10": -0.2367,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "bb129727",
"model": "gemma-4-26b",
- "score": 0.325,
- "pc1": -2.3942,
- "pc2": -0.2314,
- "pc3": 2.6867,
- "pc4": -0.1071,
- "pc5": -0.5146,
- "pc6": -0.0704,
- "pc7": -0.0526,
- "pc8": -0.0,
- "pc9": -0.0618,
- "pc10": 0.5039,
- "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=plan_first"
+ "score": 0.485,
+ "pc1": -1.5843,
+ "pc2": -0.0368,
+ "pc3": 3.3397,
+ "pc4": -0.6752,
+ "pc5": -0.7084,
+ "pc6": 0.1776,
+ "pc7": 0.7584,
+ "pc8": -0.3912,
+ "pc9": -0.3406,
+ "pc10": -0.2367,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=review_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "c1f41f91",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "c429af1c",
"model": "gemma-4-26b",
- "score": 0.325,
- "pc1": -2.3478,
- "pc2": -0.2607,
- "pc3": 2.7029,
- "pc4": -0.1076,
- "pc5": -0.5008,
- "pc6": 0.0166,
- "pc7": 0.1389,
- "pc8": -0.0,
- "pc9": -0.059,
- "pc10": 0.6272,
- "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=review"
+ "score": 0.485,
+ "pc1": -1.5843,
+ "pc2": -0.0368,
+ "pc3": 3.3397,
+ "pc4": -0.6752,
+ "pc5": -0.7084,
+ "pc6": 0.1776,
+ "pc7": 0.7584,
+ "pc8": -0.3912,
+ "pc9": -0.3406,
+ "pc10": -0.2367,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=split_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "fd6ec8c6",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=plan_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "b8bf00a6",
"model": "gemma-4-26b",
- "score": 0.325,
- "pc1": -2.3759,
- "pc2": -0.2572,
- "pc3": 2.9884,
- "pc4": -0.1445,
- "pc5": -0.5781,
- "pc6": -0.1282,
- "pc7": 0.0043,
- "pc8": 0.0,
- "pc9": -0.0674,
- "pc10": 0.5848,
- "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=split_work"
+ "score": 0.485,
+ "pc1": -1.3721,
+ "pc2": -0.6343,
+ "pc3": 3.3133,
+ "pc4": -0.7927,
+ "pc5": -1.1273,
+ "pc6": 0.417,
+ "pc7": 0.9125,
+ "pc8": -0.3667,
+ "pc9": -0.4357,
+ "pc10": -0.1679,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=plan_first"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=review_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "72b46432",
+ "model": "gemma-4-26b",
+ "score": 0.485,
+ "pc1": -1.4085,
+ "pc2": -0.6092,
+ "pc3": 3.2426,
+ "pc4": -0.8032,
+ "pc5": -0.9402,
+ "pc6": 0.5734,
+ "pc7": 0.6908,
+ "pc8": -0.1724,
+ "pc9": -0.3785,
+ "pc10": -0.6129,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=review"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "c870aa38",
"model": "gemma-4-26b",
- "score": 0.325,
- "pc1": -1.4988,
- "pc2": -0.7193,
- "pc3": 2.3737,
- "pc4": -0.1034,
- "pc5": -0.5062,
- "pc6": -0.0544,
- "pc7": 0.0512,
- "pc8": -0.0,
- "pc9": -0.05,
- "pc10": 0.5626,
+ "score": 0.485,
+ "pc1": -0.5333,
+ "pc2": -1.0449,
+ "pc3": 2.9756,
+ "pc4": -0.6406,
+ "pc5": -0.7911,
+ "pc6": 0.2364,
+ "pc7": 0.7278,
+ "pc8": -0.4039,
+ "pc9": -0.3495,
+ "pc10": -0.1197,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=svg_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "3f1a821a",
- "model": "gemma-4-26b",
- "score": 0.325,
- "pc1": -3.4855,
- "pc2": 0.5816,
- "pc3": 2.4865,
- "pc4": 0.027,
- "pc5": 0.2573,
- "pc6": 3.6594,
- "pc7": 4.0252,
- "pc8": 0.0,
- "pc9": -0.059,
- "pc10": 3.4459,
- "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
- },
- {
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=webgl_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "d1e64a6c",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "9331c142",
"model": "gemma-4-26b",
- "score": 0.325,
- "pc1": -3.5153,
- "pc2": 0.6153,
- "pc3": 2.1798,
- "pc4": 0.0646,
- "pc5": 0.3191,
- "pc6": 3.7041,
- "pc7": 3.9309,
- "pc8": 0.0,
- "pc9": -0.054,
- "pc10": 3.3419,
- "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ "score": 0.445,
+ "pc1": -0.5333,
+ "pc2": -1.0449,
+ "pc3": 2.9756,
+ "pc4": -0.6406,
+ "pc5": -0.7911,
+ "pc6": 0.2364,
+ "pc7": 0.7278,
+ "pc8": -0.4039,
+ "pc9": -0.3495,
+ "pc10": -0.1197,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm45air_pw=avail_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "50989696",
"model": "glm-4.5-air",
- "score": 0.305,
- "pc1": -1.4504,
- "pc2": -0.3136,
- "pc3": -1.3357,
- "pc4": 0.0067,
- "pc5": 0.215,
- "pc6": 0.255,
- "pc7": -0.0474,
- "pc8": 0.0,
- "pc9": 0.0296,
- "pc10": -0.4278,
+ "score": 0.73,
+ "pc1": -0.8846,
+ "pc2": -0.6304,
+ "pc3": -0.5941,
+ "pc4": 0.207,
+ "pc5": -0.0239,
+ "pc6": -0.4565,
+ "pc7": -0.6746,
+ "pc8": 0.2495,
+ "pc9": -0.0199,
+ "pc10": -0.0448,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm45air_pw=avail_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
"short_id": "1c26e1d8",
"model": "glm-4.5-air",
- "score": 0.305,
- "pc1": -1.4504,
- "pc2": -0.3136,
- "pc3": -1.3357,
- "pc4": 0.0067,
- "pc5": 0.215,
- "pc6": 0.255,
- "pc7": -0.0474,
- "pc8": 0.0,
- "pc9": 0.0296,
- "pc10": -0.4278,
+ "score": 0.73,
+ "pc1": -0.8846,
+ "pc2": -0.6304,
+ "pc3": -0.5941,
+ "pc4": 0.207,
+ "pc5": -0.0239,
+ "pc6": -0.4565,
+ "pc7": -0.6746,
+ "pc8": 0.2495,
+ "pc9": -0.0199,
+ "pc10": -0.0448,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm45air_pw=inst_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "bbbed1d6",
"model": "glm-4.5-air",
- "score": 0.33,
- "pc1": -2.3973,
- "pc2": 0.1951,
- "pc3": -1.2771,
- "pc4": 0.0847,
- "pc5": 0.2071,
- "pc6": 0.1309,
- "pc7": -0.2953,
- "pc8": 0.0,
- "pc9": 0.0211,
- "pc10": -0.591,
+ "score": 0.5,
+ "pc1": -1.733,
+ "pc2": -0.2237,
+ "pc3": -0.0566,
+ "pc4": -0.1276,
+ "pc5": -0.2336,
+ "pc6": -0.5793,
+ "pc7": -0.2471,
+ "pc8": 0.4213,
+ "pc9": -0.3084,
+ "pc10": -0.153,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm45air_pw=off_prompt=detailed_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "a5c5892c",
"model": "glm-4.5-air",
- "score": 0.355,
- "pc1": -1.7532,
- "pc2": 1.7382,
- "pc3": -1.8638,
- "pc4": -1.1103,
- "pc5": -2.586,
- "pc6": 0.1389,
- "pc7": -0.3279,
- "pc8": -0.0,
- "pc9": -0.0116,
- "pc10": 0.7418,
+ "score": 0.785,
+ "pc1": -1.1079,
+ "pc2": 1.57,
+ "pc3": -1.0568,
+ "pc4": 2.1663,
+ "pc5": -2.684,
+ "pc6": -0.3608,
+ "pc7": 0.127,
+ "pc8": 0.0418,
+ "pc9": -0.3725,
+ "pc10": 0.5137,
"config_summary": "effort=high, prompt_style=detailed, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm45air_pw=off_prompt=simple_prov=zai_rndr=canvas_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "9df04c44",
"model": "glm-4.5-air",
- "score": 0.155,
- "pc1": -3.5224,
- "pc2": 0.9226,
- "pc3": -1.0891,
- "pc4": 0.4469,
- "pc5": 0.7576,
- "pc6": 3.896,
- "pc7": 3.8036,
- "pc8": 0.0,
- "pc9": 0.0079,
- "pc10": 2.7054,
+ "score": 0.15,
+ "pc1": -2.9821,
+ "pc2": 0.6673,
+ "pc3": -1.5143,
+ "pc4": 0.2826,
+ "pc5": 0.4957,
+ "pc6": -4.7197,
+ "pc7": -1.707,
+ "pc8": -3.1224,
+ "pc9": 0.7763,
+ "pc10": -0.2362,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm45air_pw=off_prompt=simple_prov=zai_rndr=dom_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "f2b81da0",
"model": "glm-4.5-air",
- "score": 0.305,
- "pc1": -3.5838,
- "pc2": 0.9909,
- "pc3": -1.7066,
- "pc4": 0.5232,
- "pc5": 0.8835,
- "pc6": 3.9952,
- "pc7": 3.6232,
- "pc8": 0.0,
- "pc9": 0.0179,
- "pc10": 2.5035,
+ "score": 0.665,
+ "pc1": -2.9827,
+ "pc2": 0.6518,
+ "pc3": -1.5751,
+ "pc4": 0.057,
+ "pc5": 0.4306,
+ "pc6": -4.4937,
+ "pc7": -2.2412,
+ "pc8": -3.5033,
+ "pc9": 0.8145,
+ "pc10": -0.0592,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm45air_pw=off_prompt=simple_prov=zai_rndr=none_strat=cv_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "b06a6737",
"model": "glm-4.5-air",
- "score": 0.28,
- "pc1": -2.4511,
- "pc2": 0.1302,
- "pc3": -1.2315,
- "pc4": 0.377,
- "pc5": 0.0138,
- "pc6": -0.086,
- "pc7": -0.4235,
- "pc8": 0.0,
- "pc9": 0.0051,
- "pc10": -0.2429,
+ "score": 0.47,
+ "pc1": -1.8317,
+ "pc2": -0.2606,
+ "pc3": -0.2595,
+ "pc4": -0.3182,
+ "pc5": -0.7498,
+ "pc6": -0.3627,
+ "pc7": -0.3637,
+ "pc8": 0.0561,
+ "pc9": -0.0863,
+ "pc10": -0.4027,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=creative_validate"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm45air_pw=off_prompt=simple_prov=zai_rndr=none_strat=delegate_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "bf949cb8",
"model": "glm-4.5-air",
- "score": 0.355,
- "pc1": -2.4129,
- "pc2": 0.0838,
- "pc3": -0.5872,
- "pc4": 0.2755,
- "pc5": -0.0778,
- "pc6": 0.1085,
- "pc7": -0.2173,
- "pc8": -0.0,
- "pc9": -0.0005,
- "pc10": -0.1557,
+ "score": 0.81,
+ "pc1": -1.8911,
+ "pc2": -0.2261,
+ "pc3": -0.6199,
+ "pc4": -0.1786,
+ "pc5": -0.5791,
+ "pc6": -0.3104,
+ "pc7": -0.0744,
+ "pc8": -0.0633,
+ "pc9": -0.2319,
+ "pc10": 0.1726,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=delegate"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm45air_pw=off_prompt=simple_prov=zai_rndr=none_strat=iterate_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "fc29c0fe",
"model": "glm-4.5-air",
- "score": 0.155,
- "pc1": -2.443,
- "pc2": 0.1234,
- "pc3": -1.0892,
- "pc4": 0.346,
- "pc5": 0.0108,
- "pc6": 0.0816,
- "pc7": -0.3448,
- "pc8": -0.0,
- "pc9": 0.0064,
- "pc10": -0.2572,
+ "score": 0.66,
+ "pc1": -1.8488,
+ "pc2": -0.2486,
+ "pc3": -0.1603,
+ "pc4": -0.1214,
+ "pc5": -0.6333,
+ "pc6": -0.6997,
+ "pc7": -0.156,
+ "pc8": -0.0598,
+ "pc9": -0.4577,
+ "pc10": -0.1566,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=iterate"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm45air_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=off_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "aeff2667",
"model": "glm-4.5-air",
- "score": 0.255,
- "pc1": -1.4462,
- "pc2": 2.0262,
- "pc3": -0.7272,
- "pc4": 0.5737,
- "pc5": 1.1823,
- "pc6": 0.3563,
- "pc7": 0.7752,
- "pc8": 0.0,
- "pc9": 0.0641,
- "pc10": -1.6772,
+ "score": 0.835,
+ "pc1": -0.9791,
+ "pc2": 1.8181,
+ "pc3": 0.0975,
+ "pc4": -0.8817,
+ "pc5": 0.4467,
+ "pc6": -0.4165,
+ "pc7": -0.6831,
+ "pc8": -0.3073,
+ "pc9": 0.2428,
+ "pc10": -2.0229,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm45air_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=off_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "99c88e4d",
"model": "glm-4.5-air",
- "score": 0.305,
- "pc1": -1.6228,
- "pc2": 1.7828,
- "pc3": -0.6516,
- "pc4": -1.2022,
- "pc5": 2.2911,
- "pc6": 0.6321,
- "pc7": 1.2647,
- "pc8": 0.0,
- "pc9": 0.0968,
- "pc10": -2.49,
+ "score": 0.66,
+ "pc1": -1.2334,
+ "pc2": 1.4972,
+ "pc3": 0.8242,
+ "pc4": 0.5974,
+ "pc5": 2.0914,
+ "pc6": -0.4601,
+ "pc7": -1.1363,
+ "pc8": 0.4252,
+ "pc9": 0.5874,
+ "pc10": -2.5964,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm45air_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=off_tread=on_twrite=on_web=on_run1",
"short_id": "9f153cfc",
"model": "glm-4.5-air",
- "score": 0.305,
- "pc1": -1.5125,
- "pc2": 1.9741,
- "pc3": -0.9577,
- "pc4": -0.2847,
- "pc5": 1.9601,
- "pc6": -0.1143,
- "pc7": -1.1322,
- "pc8": -0.0,
- "pc9": -0.0246,
- "pc10": 1.0272,
+ "score": 0.65,
+ "pc1": -0.9553,
+ "pc2": 1.808,
+ "pc3": 0.3065,
+ "pc4": -0.069,
+ "pc5": 1.7324,
+ "pc6": -0.6105,
+ "pc7": -1.2362,
+ "pc8": 0.5213,
+ "pc9": -0.2387,
+ "pc10": 1.5967,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm45air_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=off_twrite=on_web=on_run1",
"short_id": "6edd480e",
"model": "glm-4.5-air",
- "score": 0.23,
- "pc1": -1.3864,
- "pc2": 2.0123,
- "pc3": -1.0453,
- "pc4": -1.2207,
- "pc5": -0.6541,
- "pc6": 0.3689,
- "pc7": 0.5534,
- "pc8": 0.0,
- "pc9": 0.0281,
- "pc10": -0.4781,
+ "score": 0.61,
+ "pc1": -0.9582,
+ "pc2": 1.8013,
+ "pc3": 0.038,
+ "pc4": 1.4895,
+ "pc5": -0.6395,
+ "pc6": -0.0087,
+ "pc7": -0.5751,
+ "pc8": 0.5005,
+ "pc9": 0.0074,
+ "pc10": -0.6567,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm45air_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=off_web=on_run1",
"short_id": "1b923d69",
"model": "glm-4.5-air",
- "score": 0.33,
- "pc1": -1.4695,
- "pc2": 1.9805,
- "pc3": -0.8641,
- "pc4": 1.3558,
- "pc5": 1.6782,
- "pc6": 0.0575,
- "pc7": -0.5403,
- "pc8": -0.0,
- "pc9": 0.0337,
- "pc10": -0.8333,
+ "score": 0.78,
+ "pc1": -0.9538,
+ "pc2": 1.7992,
+ "pc3": -0.2897,
+ "pc4": -1.5985,
+ "pc5": 0.7946,
+ "pc6": -0.7908,
+ "pc7": -0.3353,
+ "pc8": 0.2117,
+ "pc9": -0.3536,
+ "pc10": 0.4972,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm45air_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=off_web=on_run3",
"short_id": "5141dfbf",
"model": "glm-4.5-air",
- "score": 0.305,
- "pc1": -1.4695,
- "pc2": 1.9805,
- "pc3": -0.8641,
- "pc4": 1.3558,
- "pc5": 1.6782,
- "pc6": 0.0575,
- "pc7": -0.5403,
- "pc8": -0.0,
- "pc9": 0.0337,
- "pc10": -0.8333,
+ "score": 0.79,
+ "pc1": -0.9538,
+ "pc2": 1.7992,
+ "pc3": -0.2897,
+ "pc4": -1.5985,
+ "pc5": 0.7946,
+ "pc6": -0.7908,
+ "pc7": -0.3353,
+ "pc8": 0.2117,
+ "pc9": -0.3536,
+ "pc10": 0.4972,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm45air_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=off_run1",
"short_id": "c4e635d1",
"model": "glm-4.5-air",
- "score": 0.305,
- "pc1": -1.5562,
- "pc2": 2.2765,
- "pc3": -1.6104,
- "pc4": -0.1419,
- "pc5": -1.304,
- "pc6": 0.1214,
- "pc7": -0.2364,
- "pc8": -0.0,
- "pc9": 0.0261,
- "pc10": -0.6053,
+ "score": 0.66,
+ "pc1": -1.0227,
+ "pc2": 2.1417,
+ "pc3": -0.6304,
+ "pc4": 0.945,
+ "pc5": -1.6709,
+ "pc6": -0.5742,
+ "pc7": -0.0305,
+ "pc8": -0.2301,
+ "pc9": -0.2691,
+ "pc10": 0.3391,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm45air_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "3f7bdd4d",
"model": "glm-4.5-air",
- "score": 0.33,
- "pc1": -2.5789,
- "pc2": 0.6628,
- "pc3": -1.231,
- "pc4": 0.2268,
- "pc5": 0.1795,
- "pc6": 0.204,
- "pc7": -0.1019,
- "pc8": 0.0,
- "pc9": 0.0244,
- "pc10": -0.3895,
+ "score": 0.785,
+ "pc1": -2.0627,
+ "pc2": 0.3263,
+ "pc3": -0.3019,
+ "pc4": -0.0799,
+ "pc5": -0.2634,
+ "pc6": -0.4567,
+ "pc7": -0.5074,
+ "pc8": 0.1757,
+ "pc9": -0.1034,
+ "pc10": -0.0615,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm45air_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
"short_id": "456d514c",
"model": "glm-4.5-air",
- "score": 0.155,
- "pc1": -2.5789,
- "pc2": 0.6628,
- "pc3": -1.231,
- "pc4": 0.2268,
- "pc5": 0.1795,
- "pc6": 0.204,
- "pc7": -0.1019,
- "pc8": 0.0,
- "pc9": 0.0244,
- "pc10": -0.3895,
+ "score": 0.595,
+ "pc1": -2.0627,
+ "pc2": 0.3263,
+ "pc3": -0.3019,
+ "pc4": -0.0799,
+ "pc5": -0.2634,
+ "pc6": -0.4567,
+ "pc7": -0.5074,
+ "pc8": 0.1757,
+ "pc9": -0.1034,
+ "pc10": -0.0615,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm45air_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
"short_id": "9bdf645c",
"model": "glm-4.5-air",
- "score": 0.155,
- "pc1": -2.5789,
- "pc2": 0.6628,
- "pc3": -1.231,
- "pc4": 0.2268,
- "pc5": 0.1795,
- "pc6": 0.204,
- "pc7": -0.1019,
- "pc8": 0.0,
- "pc9": 0.0244,
- "pc10": -0.3895,
+ "score": 0.64,
+ "pc1": -2.0627,
+ "pc2": 0.3263,
+ "pc3": -0.3019,
+ "pc4": -0.0799,
+ "pc5": -0.2634,
+ "pc6": -0.4567,
+ "pc7": -0.5074,
+ "pc8": 0.1757,
+ "pc9": -0.1034,
+ "pc10": -0.0615,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm45air_pw=off_prompt=simple_prov=zai_rndr=none_strat=plan_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "bcf5c94f",
"model": "glm-4.5-air",
- "score": 0.25,
- "pc1": -2.4312,
- "pc2": 0.1096,
- "pc3": -0.8889,
- "pc4": 0.3129,
- "pc5": -0.0143,
- "pc6": 0.1662,
- "pc7": -0.2742,
- "pc8": -0.0,
- "pc9": 0.0051,
- "pc10": -0.2366,
+ "score": 0.585,
+ "pc1": -1.8505,
+ "pc2": -0.2712,
+ "pc3": -0.3283,
+ "pc4": -0.1974,
+ "pc5": -0.6823,
+ "pc6": -0.2173,
+ "pc7": -0.3533,
+ "pc8": 0.2002,
+ "pc9": -0.1986,
+ "pc10": 0.0074,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=plan_first"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm45air_pw=off_prompt=simple_prov=zai_rndr=none_strat=review_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "a735c6a6",
"model": "glm-4.5-air",
- "score": 0.28,
- "pc1": -2.3847,
- "pc2": 0.0803,
- "pc3": -0.8727,
- "pc4": 0.3124,
- "pc5": -0.0006,
- "pc6": 0.2533,
- "pc7": -0.0827,
- "pc8": 0.0,
- "pc9": 0.0078,
- "pc10": -0.1133,
+ "score": 0.785,
+ "pc1": -1.8869,
+ "pc2": -0.2461,
+ "pc3": -0.399,
+ "pc4": -0.208,
+ "pc5": -0.4952,
+ "pc6": -0.0609,
+ "pc7": -0.5751,
+ "pc8": 0.3945,
+ "pc9": -0.1413,
+ "pc10": -0.4377,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=review"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm45air_pw=off_prompt=simple_prov=zai_rndr=none_strat=split_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "cf58411d",
"model": "glm-4.5-air",
- "score": 0.305,
- "pc1": -2.4129,
- "pc2": 0.0838,
- "pc3": -0.5872,
- "pc4": 0.2755,
- "pc5": -0.0778,
- "pc6": 0.1085,
- "pc7": -0.2173,
- "pc8": 0.0,
- "pc9": -0.0005,
- "pc10": -0.1557,
+ "score": 0.705,
+ "pc1": -1.8922,
+ "pc2": -0.2308,
+ "pc3": -0.327,
+ "pc4": -0.1945,
+ "pc5": -0.5059,
+ "pc6": -0.2377,
+ "pc7": -0.4884,
+ "pc8": 0.2139,
+ "pc9": -0.3963,
+ "pc10": -0.0643,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=split_work"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm45air_pw=off_prompt=simple_prov=zai_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "22684291",
"model": "glm-4.5-air",
- "score": 0.255,
- "pc1": -1.5357,
- "pc2": -0.3783,
- "pc3": -1.2019,
- "pc4": 0.3165,
- "pc5": -0.006,
- "pc6": 0.1822,
- "pc7": -0.1704,
- "pc8": -0.0,
- "pc9": 0.0168,
- "pc10": -0.1779,
+ "score": 0.35,
+ "pc1": -1.0116,
+ "pc2": -0.6818,
+ "pc3": -0.666,
+ "pc4": -0.0454,
+ "pc5": -0.3461,
+ "pc6": -0.3978,
+ "pc7": -0.538,
+ "pc8": 0.163,
+ "pc9": -0.1124,
+ "pc10": 0.0556,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm45air_pw=off_prompt=simple_prov=zai_rndr=svg_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "971a1a50",
"model": "glm-4.5-air",
- "score": 0.305,
- "pc1": -3.5224,
- "pc2": 0.9226,
- "pc3": -1.0891,
- "pc4": 0.4469,
- "pc5": 0.7576,
- "pc6": 3.896,
- "pc7": 3.8036,
- "pc8": 0.0,
- "pc9": 0.0079,
- "pc10": 2.7054,
+ "score": 0.61,
+ "pc1": -2.9822,
+ "pc2": 0.6558,
+ "pc3": -1.7144,
+ "pc4": 0.1114,
+ "pc5": 0.2832,
+ "pc6": -4.3202,
+ "pc7": -1.6782,
+ "pc8": -2.9977,
+ "pc9": 0.745,
+ "pc10": 0.1517,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm45air_pw=off_prompt=simple_prov=zai_rndr=webgl_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "53ca551d",
"model": "glm-4.5-air",
- "score": 0.33,
- "pc1": -3.5522,
- "pc2": 0.9563,
- "pc3": -1.3958,
- "pc4": 0.4846,
- "pc5": 0.8194,
- "pc6": 3.9408,
- "pc7": 3.7093,
- "pc8": 0.0,
- "pc9": 0.0129,
- "pc10": 2.6015,
+ "score": 0.71,
+ "pc1": -2.9822,
+ "pc2": 0.6397,
+ "pc3": -1.8112,
+ "pc4": 0.1137,
+ "pc5": 0.4698,
+ "pc6": -4.3443,
+ "pc7": -1.5346,
+ "pc8": -2.7553,
+ "pc9": 0.8175,
+ "pc10": 0.2907,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=avail_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "fa2674ac",
"model": "glm-4.7",
- "score": 0.155,
- "pc1": -1.3752,
- "pc2": -0.2879,
- "pc3": -1.6807,
- "pc4": 0.067,
- "pc5": 0.2228,
- "pc6": -0.4973,
- "pc7": -0.449,
- "pc8": 0.0,
- "pc9": 0.0055,
- "pc10": -0.2361,
+ "score": 0.68,
+ "pc1": -0.9026,
+ "pc2": -0.583,
+ "pc3": -0.6554,
+ "pc4": 0.3028,
+ "pc5": 0.3514,
+ "pc6": -0.316,
+ "pc7": 0.2717,
+ "pc8": -0.2201,
+ "pc9": 0.0122,
+ "pc10": -0.0832,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=inst_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "c22109f8",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=avail_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "1a707fda",
"model": "glm-4.7",
- "score": 0.155,
- "pc1": -2.3221,
- "pc2": 0.2209,
- "pc3": -1.6221,
- "pc4": 0.1451,
- "pc5": 0.2149,
- "pc6": -0.6213,
- "pc7": -0.6969,
- "pc8": 0.0,
- "pc9": -0.003,
- "pc10": -0.3993,
+ "score": 0.68,
+ "pc1": -0.9026,
+ "pc2": -0.583,
+ "pc3": -0.6554,
+ "pc4": 0.3028,
+ "pc5": 0.3514,
+ "pc6": -0.316,
+ "pc7": 0.2717,
+ "pc8": -0.2201,
+ "pc9": 0.0122,
+ "pc10": -0.0832,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=detailed_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
- "short_id": "56afde62",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=avail_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "579bb01f",
"model": "glm-4.7",
- "score": 0.305,
- "pc1": -1.6781,
- "pc2": 1.7639,
- "pc3": -2.2088,
- "pc4": -1.0499,
- "pc5": -2.5782,
- "pc6": -0.6133,
- "pc7": -0.7295,
- "pc8": -0.0,
- "pc9": -0.0357,
- "pc10": 0.9335,
+ "score": 0.71,
+ "pc1": -0.9026,
+ "pc2": -0.583,
+ "pc3": -0.6554,
+ "pc4": 0.3028,
+ "pc5": 0.3514,
+ "pc6": -0.316,
+ "pc7": 0.2717,
+ "pc8": -0.2201,
+ "pc9": 0.0122,
+ "pc10": -0.0832,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=inst_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "c22109f8",
+ "model": "glm-4.7",
+ "score": 0.46,
+ "pc1": -1.751,
+ "pc2": -0.1764,
+ "pc3": -0.1178,
+ "pc4": -0.0319,
+ "pc5": 0.1417,
+ "pc6": -0.4388,
+ "pc7": 0.6992,
+ "pc8": -0.0483,
+ "pc9": -0.2763,
+ "pc10": -0.1914,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=inst_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "b29d8782",
+ "model": "glm-4.7",
+ "score": 0.51,
+ "pc1": -1.751,
+ "pc2": -0.1764,
+ "pc3": -0.1178,
+ "pc4": -0.0319,
+ "pc5": 0.1417,
+ "pc6": -0.4388,
+ "pc7": 0.6992,
+ "pc8": -0.0483,
+ "pc9": -0.2763,
+ "pc10": -0.1914,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=inst_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "0172e311",
+ "model": "glm-4.7",
+ "score": 0.68,
+ "pc1": -1.751,
+ "pc2": -0.1764,
+ "pc3": -0.1178,
+ "pc4": -0.0319,
+ "pc5": 0.1417,
+ "pc6": -0.4388,
+ "pc7": 0.6992,
+ "pc8": -0.0483,
+ "pc9": -0.2763,
+ "pc10": -0.1914,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=detailed_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "df766a22",
+ "model": "glm-4.7",
+ "score": 0.775,
+ "pc1": -1.1259,
+ "pc2": 1.6173,
+ "pc3": -1.1181,
+ "pc4": 2.2621,
+ "pc5": -2.3087,
+ "pc6": -0.2202,
+ "pc7": 1.0733,
+ "pc8": -0.4278,
+ "pc9": -0.3404,
+ "pc10": 0.4753,
+ "config_summary": "effort=high, prompt_style=detailed, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=detailed_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "56afde62",
+ "model": "glm-4.7",
+ "score": 0.865,
+ "pc1": -1.1259,
+ "pc2": 1.6173,
+ "pc3": -1.1181,
+ "pc4": 2.2621,
+ "pc5": -2.3087,
+ "pc6": -0.2202,
+ "pc7": 1.0733,
+ "pc8": -0.4278,
+ "pc9": -0.3404,
+ "pc10": 0.4753,
+ "config_summary": "effort=high, prompt_style=detailed, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=detailed_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "9539a678",
+ "model": "glm-4.7",
+ "score": 0.95,
+ "pc1": -1.1259,
+ "pc2": 1.6173,
+ "pc3": -1.1181,
+ "pc4": 2.2621,
+ "pc5": -2.3087,
+ "pc6": -0.2202,
+ "pc7": 1.0733,
+ "pc8": -0.4278,
+ "pc9": -0.3404,
+ "pc10": 0.4753,
"config_summary": "effort=high, prompt_style=detailed, language=typescript, max_budget=low"
},
{
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=canvas_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "08a7e577",
+ "model": "glm-4.7",
+ "score": 0.81,
+ "pc1": -3.0001,
+ "pc2": 0.7146,
+ "pc3": -1.5756,
+ "pc4": 0.3783,
+ "pc5": 0.871,
+ "pc6": -4.5792,
+ "pc7": -0.7607,
+ "pc8": -3.592,
+ "pc9": 0.8083,
+ "pc10": -0.2746,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=canvas_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "72e3256f",
+ "model": "glm-4.7",
+ "score": 0.725,
+ "pc1": -3.0001,
+ "pc2": 0.7146,
+ "pc3": -1.5756,
+ "pc4": 0.3783,
+ "pc5": 0.871,
+ "pc6": -4.5792,
+ "pc7": -0.7607,
+ "pc8": -3.592,
+ "pc9": 0.8083,
+ "pc10": -0.2746,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=canvas_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "8170834b",
+ "model": "glm-4.7",
+ "score": 0.715,
+ "pc1": -3.0001,
+ "pc2": 0.7146,
+ "pc3": -1.5756,
+ "pc4": 0.3783,
+ "pc5": 0.871,
+ "pc6": -4.5792,
+ "pc7": -0.7607,
+ "pc8": -3.592,
+ "pc9": 0.8083,
+ "pc10": -0.2746,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=dom_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "0048ecdc",
+ "model": "glm-4.7",
+ "score": 0.735,
+ "pc1": -3.0007,
+ "pc2": 0.6992,
+ "pc3": -1.6364,
+ "pc4": 0.1527,
+ "pc5": 0.8059,
+ "pc6": -4.3532,
+ "pc7": -1.2949,
+ "pc8": -3.9729,
+ "pc9": 0.8465,
+ "pc10": -0.0976,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=cv_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "6a743388",
"model": "glm-4.7",
- "score": 0.155,
- "pc1": -2.3759,
- "pc2": 0.1559,
- "pc3": -1.5765,
- "pc4": 0.4373,
- "pc5": 0.0216,
- "pc6": -0.8382,
- "pc7": -0.8251,
- "pc8": 0.0,
- "pc9": -0.0191,
- "pc10": -0.0512,
+ "score": 0.61,
+ "pc1": -1.8498,
+ "pc2": -0.2132,
+ "pc3": -0.3208,
+ "pc4": -0.2224,
+ "pc5": -0.3745,
+ "pc6": -0.2222,
+ "pc7": 0.5826,
+ "pc8": -0.4136,
+ "pc9": -0.0543,
+ "pc10": -0.4411,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=creative_validate"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=cv_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
"short_id": "af5e84fc",
"model": "glm-4.7",
- "score": 0.305,
- "pc1": -2.3759,
- "pc2": 0.1559,
- "pc3": -1.5765,
- "pc4": 0.4373,
- "pc5": 0.0216,
- "pc6": -0.8382,
- "pc7": -0.8251,
- "pc8": 0.0,
- "pc9": -0.0191,
- "pc10": -0.0512,
+ "score": 0.61,
+ "pc1": -1.8498,
+ "pc2": -0.2132,
+ "pc3": -0.3208,
+ "pc4": -0.2224,
+ "pc5": -0.3745,
+ "pc6": -0.2222,
+ "pc7": 0.5826,
+ "pc8": -0.4136,
+ "pc9": -0.0543,
+ "pc10": -0.4411,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=creative_validate"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=cv_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
"short_id": "2f761815",
"model": "glm-4.7",
- "score": 0.355,
- "pc1": -2.3759,
- "pc2": 0.1559,
- "pc3": -1.5765,
- "pc4": 0.4373,
- "pc5": 0.0216,
- "pc6": -0.8382,
- "pc7": -0.8251,
- "pc8": 0.0,
- "pc9": -0.0191,
- "pc10": -0.0512,
+ "score": 0.835,
+ "pc1": -1.8498,
+ "pc2": -0.2132,
+ "pc3": -0.3208,
+ "pc4": -0.2224,
+ "pc5": -0.3745,
+ "pc6": -0.2222,
+ "pc7": 0.5826,
+ "pc8": -0.4136,
+ "pc9": -0.0543,
+ "pc10": -0.4411,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=creative_validate"
},
{
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=delegate_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "7fc5c868",
+ "model": "glm-4.7",
+ "score": 0.785,
+ "pc1": -1.9092,
+ "pc2": -0.1788,
+ "pc3": -0.6811,
+ "pc4": -0.0828,
+ "pc5": -0.2038,
+ "pc6": -0.1698,
+ "pc7": 0.8719,
+ "pc8": -0.5329,
+ "pc9": -0.1998,
+ "pc10": 0.1342,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=delegate"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=delegate_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "725bc5af",
+ "model": "glm-4.7",
+ "score": 0.61,
+ "pc1": -1.9092,
+ "pc2": -0.1788,
+ "pc3": -0.6811,
+ "pc4": -0.0828,
+ "pc5": -0.2038,
+ "pc6": -0.1698,
+ "pc7": 0.8719,
+ "pc8": -0.5329,
+ "pc9": -0.1998,
+ "pc10": 0.1342,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=delegate"
+ },
+ {
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=iterate_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "e0237626",
"model": "glm-4.7",
- "score": 0.34,
- "pc1": -2.3678,
- "pc2": 0.1491,
- "pc3": -1.4342,
- "pc4": 0.4064,
- "pc5": 0.0186,
- "pc6": -0.6707,
- "pc7": -0.7463,
- "pc8": -0.0,
- "pc9": -0.0178,
- "pc10": -0.0655,
+ "score": 0.835,
+ "pc1": -1.8669,
+ "pc2": -0.2012,
+ "pc3": -0.2216,
+ "pc4": -0.0257,
+ "pc5": -0.258,
+ "pc6": -0.5592,
+ "pc7": 0.7902,
+ "pc8": -0.5294,
+ "pc9": -0.4256,
+ "pc10": -0.195,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=iterate"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=iterate_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "b02a62f0",
+ "model": "glm-4.7",
+ "score": 0.715,
+ "pc1": -1.8669,
+ "pc2": -0.2012,
+ "pc3": -0.2216,
+ "pc4": -0.0257,
+ "pc5": -0.258,
+ "pc6": -0.5592,
+ "pc7": 0.7902,
+ "pc8": -0.5294,
+ "pc9": -0.4256,
+ "pc10": -0.195,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=iterate"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=iterate_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "d46e8439",
+ "model": "glm-4.7",
+ "score": 0.92,
+ "pc1": -1.8669,
+ "pc2": -0.2012,
+ "pc3": -0.2216,
+ "pc4": -0.0257,
+ "pc5": -0.258,
+ "pc6": -0.5592,
+ "pc7": 0.7902,
+ "pc8": -0.5294,
+ "pc9": -0.4256,
+ "pc10": -0.195,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=iterate"
},
{
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=off_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "ae68d5c1",
+ "model": "glm-4.7",
+ "score": 0.835,
+ "pc1": -0.9972,
+ "pc2": 1.8654,
+ "pc3": 0.0362,
+ "pc4": -0.7859,
+ "pc5": 0.822,
+ "pc6": -0.276,
+ "pc7": 0.2631,
+ "pc8": -0.7769,
+ "pc9": 0.2748,
+ "pc10": -2.0613,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=off_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
"short_id": "31a529dc",
"model": "glm-4.7",
- "score": 0.155,
- "pc1": -1.371,
- "pc2": 2.052,
- "pc3": -1.0722,
- "pc4": 0.6341,
- "pc5": 1.1901,
- "pc6": -0.3959,
- "pc7": 0.3737,
- "pc8": 0.0,
- "pc9": 0.0399,
- "pc10": -1.4855,
+ "score": 0.8,
+ "pc1": -0.9972,
+ "pc2": 1.8654,
+ "pc3": 0.0362,
+ "pc4": -0.7859,
+ "pc5": 0.822,
+ "pc6": -0.276,
+ "pc7": 0.2631,
+ "pc8": -0.7769,
+ "pc9": 0.2748,
+ "pc10": -2.0613,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=off_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "1d046ee9",
+ "model": "glm-4.7",
+ "score": 0.835,
+ "pc1": -0.9972,
+ "pc2": 1.8654,
+ "pc3": 0.0362,
+ "pc4": -0.7859,
+ "pc5": 0.822,
+ "pc6": -0.276,
+ "pc7": 0.2631,
+ "pc8": -0.7769,
+ "pc9": 0.2748,
+ "pc10": -2.0613,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=off_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "97dcc55e",
+ "model": "glm-4.7",
+ "score": 0.68,
+ "pc1": -1.2514,
+ "pc2": 1.5445,
+ "pc3": 0.7629,
+ "pc4": 0.6932,
+ "pc5": 2.4667,
+ "pc6": -0.3196,
+ "pc7": -0.1901,
+ "pc8": -0.0444,
+ "pc9": 0.6195,
+ "pc10": -2.6348,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=off_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "fe0ccd52",
+ "model": "glm-4.7",
+ "score": 0.66,
+ "pc1": -1.2514,
+ "pc2": 1.5445,
+ "pc3": 0.7629,
+ "pc4": 0.6932,
+ "pc5": 2.4667,
+ "pc6": -0.3196,
+ "pc7": -0.1901,
+ "pc8": -0.0444,
+ "pc9": 0.6195,
+ "pc10": -2.6348,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=off_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "65b5c05a",
+ "model": "glm-4.7",
+ "score": 0.61,
+ "pc1": -1.2514,
+ "pc2": 1.5445,
+ "pc3": 0.7629,
+ "pc4": 0.6932,
+ "pc5": 2.4667,
+ "pc6": -0.3196,
+ "pc7": -0.1901,
+ "pc8": -0.0444,
+ "pc9": 0.6195,
+ "pc10": -2.6348,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=off_tread=on_twrite=on_web=on_run1",
"short_id": "6a018f5e",
"model": "glm-4.7",
- "score": 0.19,
- "pc1": -1.4373,
- "pc2": 1.9999,
- "pc3": -1.3027,
- "pc4": -0.2244,
- "pc5": 1.9679,
- "pc6": -0.8665,
- "pc7": -1.5337,
- "pc8": -0.0,
- "pc9": -0.0487,
- "pc10": 1.2188,
+ "score": 0.675,
+ "pc1": -0.9734,
+ "pc2": 1.8553,
+ "pc3": 0.2452,
+ "pc4": 0.0268,
+ "pc5": 2.1078,
+ "pc6": -0.4699,
+ "pc7": -0.2899,
+ "pc8": 0.0516,
+ "pc9": -0.2067,
+ "pc10": 1.5583,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=off_tread=on_twrite=on_web=on_run2",
+ "short_id": "03271a40",
+ "model": "glm-4.7",
+ "score": 0.655,
+ "pc1": -0.9734,
+ "pc2": 1.8553,
+ "pc3": 0.2452,
+ "pc4": 0.0268,
+ "pc5": 2.1078,
+ "pc6": -0.4699,
+ "pc7": -0.2899,
+ "pc8": 0.0516,
+ "pc9": -0.2067,
+ "pc10": 1.5583,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=off_tread=on_twrite=on_web=on_run3",
"short_id": "ed0b0147",
"model": "glm-4.7",
- "score": 0.255,
- "pc1": -1.4373,
- "pc2": 1.9999,
- "pc3": -1.3027,
- "pc4": -0.2244,
- "pc5": 1.9679,
- "pc6": -0.8665,
- "pc7": -1.5337,
- "pc8": -0.0,
- "pc9": -0.0487,
- "pc10": 1.2188,
+ "score": 0.69,
+ "pc1": -0.9734,
+ "pc2": 1.8553,
+ "pc3": 0.2452,
+ "pc4": 0.0268,
+ "pc5": 2.1078,
+ "pc6": -0.4699,
+ "pc7": -0.2899,
+ "pc8": 0.0516,
+ "pc9": -0.2067,
+ "pc10": 1.5583,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=off_twrite=on_web=on_run1",
+ "short_id": "43bf214b",
+ "model": "glm-4.7",
+ "score": 0.64,
+ "pc1": -0.9763,
+ "pc2": 1.8486,
+ "pc3": -0.0233,
+ "pc4": 1.5853,
+ "pc5": -0.2642,
+ "pc6": 0.1318,
+ "pc7": 0.3712,
+ "pc8": 0.0309,
+ "pc9": 0.0394,
+ "pc10": -0.6951,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=off_twrite=on_web=on_run2",
+ "short_id": "b1f67906",
+ "model": "glm-4.7",
+ "score": 0.78,
+ "pc1": -0.9763,
+ "pc2": 1.8486,
+ "pc3": -0.0233,
+ "pc4": 1.5853,
+ "pc5": -0.2642,
+ "pc6": 0.1318,
+ "pc7": 0.3712,
+ "pc8": 0.0309,
+ "pc9": 0.0394,
+ "pc10": -0.6951,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=off_twrite=on_web=on_run3",
+ "short_id": "34c22060",
+ "model": "glm-4.7",
+ "score": 0.645,
+ "pc1": -0.9763,
+ "pc2": 1.8486,
+ "pc3": -0.0233,
+ "pc4": 1.5853,
+ "pc5": -0.2642,
+ "pc6": 0.1318,
+ "pc7": 0.3712,
+ "pc8": 0.0309,
+ "pc9": 0.0394,
+ "pc10": -0.6951,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=off_web=on_run1",
+ "short_id": "f4d7e3a0",
+ "model": "glm-4.7",
+ "score": 0.275,
+ "pc1": -0.9718,
+ "pc2": 1.8465,
+ "pc3": -0.3509,
+ "pc4": -1.5028,
+ "pc5": 1.1699,
+ "pc6": -0.6502,
+ "pc7": 0.6109,
+ "pc8": -0.2579,
+ "pc9": -0.3216,
+ "pc10": 0.4588,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=off_web=on_run2",
"short_id": "e8d32946",
"model": "glm-4.7",
- "score": 0.29,
- "pc1": -1.3943,
- "pc2": 2.0063,
- "pc3": -1.209,
- "pc4": 1.4161,
- "pc5": 1.686,
- "pc6": -0.6948,
- "pc7": -0.9419,
- "pc8": -0.0,
- "pc9": 0.0096,
- "pc10": -0.6416,
+ "score": 0.835,
+ "pc1": -0.9718,
+ "pc2": 1.8465,
+ "pc3": -0.3509,
+ "pc4": -1.5028,
+ "pc5": 1.1699,
+ "pc6": -0.6502,
+ "pc7": 0.6109,
+ "pc8": -0.2579,
+ "pc9": -0.3216,
+ "pc10": 0.4588,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=off_web=on_run3",
+ "short_id": "184f81dd",
+ "model": "glm-4.7",
+ "score": 0.5,
+ "pc1": -0.9718,
+ "pc2": 1.8465,
+ "pc3": -0.3509,
+ "pc4": -1.5028,
+ "pc5": 1.1699,
+ "pc6": -0.6502,
+ "pc7": 0.6109,
+ "pc8": -0.2579,
+ "pc9": -0.3216,
+ "pc10": 0.4588,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=off_run1",
+ "short_id": "b025b603",
+ "model": "glm-4.7",
+ "score": 0.835,
+ "pc1": -1.0407,
+ "pc2": 2.1891,
+ "pc3": -0.6917,
+ "pc4": 1.0408,
+ "pc5": -1.2956,
+ "pc6": -0.4337,
+ "pc7": 0.9157,
+ "pc8": -0.6998,
+ "pc9": -0.2371,
+ "pc10": 0.3007,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=off_run2",
+ "short_id": "76f89680",
+ "model": "glm-4.7",
+ "score": 0.65,
+ "pc1": -1.0407,
+ "pc2": 2.1891,
+ "pc3": -0.6917,
+ "pc4": 1.0408,
+ "pc5": -1.2956,
+ "pc6": -0.4337,
+ "pc7": 0.9157,
+ "pc8": -0.6998,
+ "pc9": -0.2371,
+ "pc10": 0.3007,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=off_run3",
+ "short_id": "2e5ad7e5",
+ "model": "glm-4.7",
+ "score": 0.76,
+ "pc1": -1.0407,
+ "pc2": 2.1891,
+ "pc3": -0.6917,
+ "pc4": 1.0408,
+ "pc5": -1.2956,
+ "pc6": -0.4337,
+ "pc7": 0.9157,
+ "pc8": -0.6998,
+ "pc9": -0.2371,
+ "pc10": 0.3007,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "0a030357",
"model": "glm-4.7",
- "score": 0.155,
- "pc1": -2.5037,
- "pc2": 0.6886,
- "pc3": -1.576,
- "pc4": 0.2872,
- "pc5": 0.1873,
- "pc6": -0.5483,
- "pc7": -0.5035,
- "pc8": -0.0,
- "pc9": 0.0003,
- "pc10": -0.1979,
- "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
- },
- {
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
- "short_id": "fd037e18",
+ "score": 0.55,
+ "pc1": -2.0807,
+ "pc2": 0.3736,
+ "pc3": -0.3632,
+ "pc4": 0.0158,
+ "pc5": 0.1119,
+ "pc6": -0.3162,
+ "pc7": 0.4388,
+ "pc8": -0.2939,
+ "pc9": -0.0714,
+ "pc10": -0.0999,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=plan_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "101e6752",
+ "model": "glm-4.7",
+ "score": 0.835,
+ "pc1": -1.8685,
+ "pc2": -0.2238,
+ "pc3": -0.3896,
+ "pc4": -0.1017,
+ "pc5": -0.307,
+ "pc6": -0.0767,
+ "pc7": 0.5929,
+ "pc8": -0.2694,
+ "pc9": -0.1665,
+ "pc10": -0.031,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=plan_first"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=plan_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "626b3efd",
+ "model": "glm-4.7",
+ "score": 0.715,
+ "pc1": -1.8685,
+ "pc2": -0.2238,
+ "pc3": -0.3896,
+ "pc4": -0.1017,
+ "pc5": -0.307,
+ "pc6": -0.0767,
+ "pc7": 0.5929,
+ "pc8": -0.2694,
+ "pc9": -0.1665,
+ "pc10": -0.031,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=plan_first"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=plan_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "0d5536fc",
+ "model": "glm-4.7",
+ "score": 0.665,
+ "pc1": -1.8685,
+ "pc2": -0.2238,
+ "pc3": -0.3896,
+ "pc4": -0.1017,
+ "pc5": -0.307,
+ "pc6": -0.0767,
+ "pc7": 0.5929,
+ "pc8": -0.2694,
+ "pc9": -0.1665,
+ "pc10": -0.031,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=plan_first"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "60136e04",
+ "model": "glm-4.7",
+ "score": 0.47,
+ "pc1": -1.0297,
+ "pc2": -0.6345,
+ "pc3": -0.7273,
+ "pc4": 0.0504,
+ "pc5": 0.0292,
+ "pc6": -0.2573,
+ "pc7": 0.4083,
+ "pc8": -0.3066,
+ "pc9": -0.0803,
+ "pc10": 0.0172,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "2e6a64f1",
+ "model": "glm-4.7",
+ "score": 0.5,
+ "pc1": -1.0297,
+ "pc2": -0.6345,
+ "pc3": -0.7273,
+ "pc4": 0.0504,
+ "pc5": 0.0292,
+ "pc6": -0.2573,
+ "pc7": 0.4083,
+ "pc8": -0.3066,
+ "pc9": -0.0803,
+ "pc10": 0.0172,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "750d7f27",
+ "model": "glm-4.7",
+ "score": 0.705,
+ "pc1": -1.0297,
+ "pc2": -0.6345,
+ "pc3": -0.7273,
+ "pc4": 0.0504,
+ "pc5": 0.0292,
+ "pc6": -0.2573,
+ "pc7": 0.4083,
+ "pc8": -0.3066,
+ "pc9": -0.0803,
+ "pc10": 0.0172,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=svg_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "a41e7e52",
+ "model": "glm-4.7",
+ "score": 0.715,
+ "pc1": -3.0003,
+ "pc2": 0.7031,
+ "pc3": -1.7757,
+ "pc4": 0.2072,
+ "pc5": 0.6585,
+ "pc6": -4.1796,
+ "pc7": -0.7319,
+ "pc8": -3.4673,
+ "pc9": 0.7771,
+ "pc10": 0.1133,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=svg_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "a23cb59b",
"model": "glm-4.7",
- "score": 0.34,
- "pc1": -2.5037,
- "pc2": 0.6886,
- "pc3": -1.576,
- "pc4": 0.2872,
- "pc5": 0.1873,
- "pc6": -0.5483,
- "pc7": -0.5035,
- "pc8": -0.0,
- "pc9": 0.0003,
- "pc10": -0.1979,
- "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
- },
- {
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
- "short_id": "ad716871",
+ "score": 0.64,
+ "pc1": -3.0003,
+ "pc2": 0.7031,
+ "pc3": -1.7757,
+ "pc4": 0.2072,
+ "pc5": 0.6585,
+ "pc6": -4.1796,
+ "pc7": -0.7319,
+ "pc8": -3.4673,
+ "pc9": 0.7771,
+ "pc10": 0.1133,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=svg_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "9fed9f45",
"model": "glm-4.7",
- "score": 0.155,
- "pc1": -2.5037,
- "pc2": 0.6886,
- "pc3": -1.576,
- "pc4": 0.2872,
- "pc5": 0.1873,
- "pc6": -0.5483,
- "pc7": -0.5035,
- "pc8": -0.0,
- "pc9": 0.0003,
- "pc10": -0.1979,
+ "score": 0.765,
+ "pc1": -3.0003,
+ "pc2": 0.7031,
+ "pc3": -1.7757,
+ "pc4": 0.2072,
+ "pc5": 0.6585,
+ "pc6": -4.1796,
+ "pc7": -0.7319,
+ "pc8": -3.4673,
+ "pc9": 0.7771,
+ "pc10": 0.1133,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=avail_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "7c7dfa27",
"model": "glm-5.1",
- "score": 0.33,
- "pc1": -1.4005,
- "pc2": -0.2079,
- "pc3": -1.7018,
- "pc4": -0.0026,
- "pc5": 0.3581,
- "pc6": 0.3197,
- "pc7": -0.2507,
- "pc8": -0.0,
- "pc9": 0.0205,
- "pc10": -0.4347,
+ "score": 0.835,
+ "pc1": -1.0352,
+ "pc2": -0.5836,
+ "pc3": -0.8999,
+ "pc4": 0.3277,
+ "pc5": 0.35,
+ "pc6": 0.1942,
+ "pc7": -0.2713,
+ "pc8": 0.2865,
+ "pc9": 0.0509,
+ "pc10": -0.036,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=avail_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
"short_id": "5afe9b8e",
"model": "glm-5.1",
- "score": 0.305,
- "pc1": -1.4005,
- "pc2": -0.2079,
- "pc3": -1.7018,
- "pc4": -0.0026,
- "pc5": 0.3581,
- "pc6": 0.3197,
- "pc7": -0.2507,
- "pc8": -0.0,
- "pc9": 0.0205,
- "pc10": -0.4347,
+ "score": 0.945,
+ "pc1": -1.0352,
+ "pc2": -0.5836,
+ "pc3": -0.8999,
+ "pc4": 0.3277,
+ "pc5": 0.35,
+ "pc6": 0.1942,
+ "pc7": -0.2713,
+ "pc8": 0.2865,
+ "pc9": 0.0509,
+ "pc10": -0.036,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=avail_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
"short_id": "7e2cf342",
"model": "glm-5.1",
- "score": 0.355,
- "pc1": -1.4005,
- "pc2": -0.2079,
- "pc3": -1.7018,
- "pc4": -0.0026,
- "pc5": 0.3581,
- "pc6": 0.3197,
- "pc7": -0.2507,
- "pc8": -0.0,
- "pc9": 0.0205,
- "pc10": -0.4347,
+ "score": 0.85,
+ "pc1": -1.0352,
+ "pc2": -0.5836,
+ "pc3": -0.8999,
+ "pc4": 0.3277,
+ "pc5": 0.35,
+ "pc6": 0.1942,
+ "pc7": -0.2713,
+ "pc8": 0.2865,
+ "pc9": 0.0509,
+ "pc10": -0.036,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=inst_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "437b474b",
+ "model": "glm-5.1",
+ "score": 0.785,
+ "pc1": -1.8835,
+ "pc2": -0.177,
+ "pc3": -0.3623,
+ "pc4": -0.0069,
+ "pc5": 0.1403,
+ "pc6": 0.0714,
+ "pc7": 0.1563,
+ "pc8": 0.4583,
+ "pc9": -0.2376,
+ "pc10": -0.1442,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=inst_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "c5ae5908",
+ "model": "glm-5.1",
+ "score": 0.65,
+ "pc1": -1.8835,
+ "pc2": -0.177,
+ "pc3": -0.3623,
+ "pc4": -0.0069,
+ "pc5": 0.1403,
+ "pc6": 0.0714,
+ "pc7": 0.1563,
+ "pc8": 0.4583,
+ "pc9": -0.2376,
+ "pc10": -0.1442,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=inst_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
"short_id": "98dee8cd",
"model": "glm-5.1",
- "score": 0.155,
- "pc1": -2.3474,
- "pc2": 0.3008,
- "pc3": -1.6432,
- "pc4": 0.0754,
- "pc5": 0.3503,
- "pc6": 0.1957,
- "pc7": -0.4986,
- "pc8": 0.0,
- "pc9": 0.012,
- "pc10": -0.5978,
+ "score": 0.46,
+ "pc1": -1.8835,
+ "pc2": -0.177,
+ "pc3": -0.3623,
+ "pc4": -0.0069,
+ "pc5": 0.1403,
+ "pc6": 0.0714,
+ "pc7": 0.1563,
+ "pc8": 0.4583,
+ "pc9": -0.2376,
+ "pc10": -0.1442,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=detailed_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "6abf96c7",
"model": "glm-5.1",
- "score": 0.155,
- "pc1": -1.7034,
- "pc2": 1.8439,
- "pc3": -2.2299,
- "pc4": -1.1196,
- "pc5": -2.4429,
- "pc6": 0.2037,
- "pc7": -0.5312,
- "pc8": -0.0,
- "pc9": -0.0207,
- "pc10": 0.735,
+ "score": 0.575,
+ "pc1": -1.2584,
+ "pc2": 1.6168,
+ "pc3": -1.3625,
+ "pc4": 2.2871,
+ "pc5": -2.3101,
+ "pc6": 0.29,
+ "pc7": 0.5303,
+ "pc8": 0.0788,
+ "pc9": -0.3017,
+ "pc10": 0.5225,
"config_summary": "effort=high, prompt_style=detailed, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=detailed_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
"short_id": "8bcd3ae0",
"model": "glm-5.1",
- "score": 0.305,
- "pc1": -1.7034,
- "pc2": 1.8439,
- "pc3": -2.2299,
- "pc4": -1.1196,
- "pc5": -2.4429,
- "pc6": 0.2037,
- "pc7": -0.5312,
- "pc8": -0.0,
- "pc9": -0.0207,
- "pc10": 0.735,
+ "score": 0.77,
+ "pc1": -1.2584,
+ "pc2": 1.6168,
+ "pc3": -1.3625,
+ "pc4": 2.2871,
+ "pc5": -2.3101,
+ "pc6": 0.29,
+ "pc7": 0.5303,
+ "pc8": 0.0788,
+ "pc9": -0.3017,
+ "pc10": 0.5225,
"config_summary": "effort=high, prompt_style=detailed, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=detailed_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
"short_id": "496e0334",
"model": "glm-5.1",
- "score": 0.155,
- "pc1": -1.7034,
- "pc2": 1.8439,
- "pc3": -2.2299,
- "pc4": -1.1196,
- "pc5": -2.4429,
- "pc6": 0.2037,
- "pc7": -0.5312,
- "pc8": -0.0,
- "pc9": -0.0207,
- "pc10": 0.735,
+ "score": 0.925,
+ "pc1": -1.2584,
+ "pc2": 1.6168,
+ "pc3": -1.3625,
+ "pc4": 2.2871,
+ "pc5": -2.3101,
+ "pc6": 0.29,
+ "pc7": 0.5303,
+ "pc8": 0.0788,
+ "pc9": -0.3017,
+ "pc10": 0.5225,
"config_summary": "effort=high, prompt_style=detailed, language=typescript, max_budget=low"
},
{
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=canvas_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "30531578",
+ "model": "glm-5.1",
+ "score": 0.715,
+ "pc1": -3.1326,
+ "pc2": 0.714,
+ "pc3": -1.8201,
+ "pc4": 0.4033,
+ "pc5": 0.8696,
+ "pc6": -4.069,
+ "pc7": -1.3036,
+ "pc8": -3.0854,
+ "pc9": 0.8471,
+ "pc10": -0.2274,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=canvas_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "d8fc25ba",
+ "model": "glm-5.1",
+ "score": 0.84,
+ "pc1": -3.1326,
+ "pc2": 0.714,
+ "pc3": -1.8201,
+ "pc4": 0.4033,
+ "pc5": 0.8696,
+ "pc6": -4.069,
+ "pc7": -1.3036,
+ "pc8": -3.0854,
+ "pc9": 0.8471,
+ "pc10": -0.2274,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=canvas_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "aa3d18d8",
+ "model": "glm-5.1",
+ "score": 0.925,
+ "pc1": -3.1326,
+ "pc2": 0.714,
+ "pc3": -1.8201,
+ "pc4": 0.4033,
+ "pc5": 0.8696,
+ "pc6": -4.069,
+ "pc7": -1.3036,
+ "pc8": -3.0854,
+ "pc9": 0.8471,
+ "pc10": -0.2274,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=dom_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "11b37482",
"model": "glm-5.1",
- "score": 0.705,
- "pc1": -3.534,
- "pc2": 1.0966,
- "pc3": -2.0727,
- "pc4": 0.5139,
- "pc5": 1.0266,
- "pc6": 4.06,
- "pc7": 3.4199,
- "pc8": 0.0,
- "pc9": 0.0088,
- "pc10": 2.4967,
+ "score": 0.735,
+ "pc1": -3.1332,
+ "pc2": 0.6986,
+ "pc3": -1.8809,
+ "pc4": 0.1777,
+ "pc5": 0.8044,
+ "pc6": -3.843,
+ "pc7": -1.8379,
+ "pc8": -3.4663,
+ "pc9": 0.8853,
+ "pc10": -0.0504,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=dom_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
"short_id": "63c0c2ab",
"model": "glm-5.1",
- "score": 0.8,
- "pc1": -3.534,
- "pc2": 1.0966,
- "pc3": -2.0727,
- "pc4": 0.5139,
- "pc5": 1.0266,
- "pc6": 4.06,
- "pc7": 3.4199,
- "pc8": 0.0,
- "pc9": 0.0088,
- "pc10": 2.4967,
+ "score": 1.0,
+ "pc1": -3.1332,
+ "pc2": 0.6986,
+ "pc3": -1.8809,
+ "pc4": 0.1777,
+ "pc5": 0.8044,
+ "pc6": -3.843,
+ "pc7": -1.8379,
+ "pc8": -3.4663,
+ "pc9": 0.8853,
+ "pc10": -0.0504,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=dom_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
"short_id": "5da14018",
"model": "glm-5.1",
- "score": 0.305,
- "pc1": -3.534,
- "pc2": 1.0966,
- "pc3": -2.0727,
- "pc4": 0.5139,
- "pc5": 1.0266,
- "pc6": 4.06,
- "pc7": 3.4199,
- "pc8": 0.0,
- "pc9": 0.0088,
- "pc10": 2.4967,
- "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ "score": 0.61,
+ "pc1": -3.1332,
+ "pc2": 0.6986,
+ "pc3": -1.8809,
+ "pc4": 0.1777,
+ "pc5": 0.8044,
+ "pc6": -3.843,
+ "pc7": -1.8379,
+ "pc8": -3.4663,
+ "pc9": 0.8853,
+ "pc10": -0.0504,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=cv_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "c2652712",
+ "model": "glm-5.1",
+ "score": 0.44,
+ "pc1": -1.9823,
+ "pc2": -0.2138,
+ "pc3": -0.5652,
+ "pc4": -0.1974,
+ "pc5": -0.3759,
+ "pc6": 0.288,
+ "pc7": 0.0396,
+ "pc8": 0.0931,
+ "pc9": -0.0155,
+ "pc10": -0.3939,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=creative_validate"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=delegate_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "84fc4ae0",
+ "model": "glm-5.1",
+ "score": 0.615,
+ "pc1": -2.0417,
+ "pc2": -0.1793,
+ "pc3": -0.9256,
+ "pc4": -0.0578,
+ "pc5": -0.2053,
+ "pc6": 0.3404,
+ "pc7": 0.3289,
+ "pc8": -0.0263,
+ "pc9": -0.1611,
+ "pc10": 0.1814,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=delegate"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=delegate_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "d8fe95e5",
+ "model": "glm-5.1",
+ "score": 0.69,
+ "pc1": -2.0417,
+ "pc2": -0.1793,
+ "pc3": -0.9256,
+ "pc4": -0.0578,
+ "pc5": -0.2053,
+ "pc6": 0.3404,
+ "pc7": 0.3289,
+ "pc8": -0.0263,
+ "pc9": -0.1611,
+ "pc10": 0.1814,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=delegate"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=delegate_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "62f7453c",
+ "model": "glm-5.1",
+ "score": 0.95,
+ "pc1": -2.0417,
+ "pc2": -0.1793,
+ "pc3": -0.9256,
+ "pc4": -0.0578,
+ "pc5": -0.2053,
+ "pc6": 0.3404,
+ "pc7": 0.3289,
+ "pc8": -0.0263,
+ "pc9": -0.1611,
+ "pc10": 0.1814,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=delegate"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=iterate_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "b77a5e30",
"model": "glm-5.1",
- "score": 0.305,
- "pc1": -2.3931,
- "pc2": 0.2291,
- "pc3": -1.4554,
- "pc4": 0.3367,
- "pc5": 0.1539,
- "pc6": 0.1464,
- "pc7": -0.5481,
- "pc8": -0.0,
- "pc9": -0.0027,
- "pc10": -0.264,
+ "score": 0.785,
+ "pc1": -1.9994,
+ "pc2": -0.2018,
+ "pc3": -0.4661,
+ "pc4": -0.0007,
+ "pc5": -0.2594,
+ "pc6": -0.0489,
+ "pc7": 0.2473,
+ "pc8": -0.0227,
+ "pc9": -0.3869,
+ "pc10": -0.1478,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=iterate"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=iterate_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "03c54dda",
+ "model": "glm-5.1",
+ "score": 0.835,
+ "pc1": -1.9994,
+ "pc2": -0.2018,
+ "pc3": -0.4661,
+ "pc4": -0.0007,
+ "pc5": -0.2594,
+ "pc6": -0.0489,
+ "pc7": 0.2473,
+ "pc8": -0.0227,
+ "pc9": -0.3869,
+ "pc10": -0.1478,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=iterate"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=iterate_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "fa543cfc",
+ "model": "glm-5.1",
+ "score": 0.81,
+ "pc1": -1.9994,
+ "pc2": -0.2018,
+ "pc3": -0.4661,
+ "pc4": -0.0007,
+ "pc5": -0.2594,
+ "pc6": -0.0489,
+ "pc7": 0.2473,
+ "pc8": -0.0227,
+ "pc9": -0.3869,
+ "pc10": -0.1478,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=iterate"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=off_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "140cba7f",
"model": "glm-5.1",
- "score": 0.33,
- "pc1": -1.3964,
- "pc2": 2.1319,
- "pc3": -1.0933,
- "pc4": 0.5644,
- "pc5": 1.3255,
- "pc6": 0.4211,
- "pc7": 0.5719,
- "pc8": 0.0,
- "pc9": 0.055,
- "pc10": -1.684,
+ "score": 0.91,
+ "pc1": -1.1297,
+ "pc2": 1.8649,
+ "pc3": -0.2083,
+ "pc4": -0.7609,
+ "pc5": 0.8206,
+ "pc6": 0.2342,
+ "pc7": -0.2798,
+ "pc8": -0.2703,
+ "pc9": 0.3136,
+ "pc10": -2.0141,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=off_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
"short_id": "06c93bc4",
"model": "glm-5.1",
- "score": 0.33,
- "pc1": -1.3964,
- "pc2": 2.1319,
- "pc3": -1.0933,
- "pc4": 0.5644,
- "pc5": 1.3255,
- "pc6": 0.4211,
- "pc7": 0.5719,
- "pc8": 0.0,
- "pc9": 0.055,
- "pc10": -1.684,
+ "score": 0.945,
+ "pc1": -1.1297,
+ "pc2": 1.8649,
+ "pc3": -0.2083,
+ "pc4": -0.7609,
+ "pc5": 0.8206,
+ "pc6": 0.2342,
+ "pc7": -0.2798,
+ "pc8": -0.2703,
+ "pc9": 0.3136,
+ "pc10": -2.0141,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=off_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
"short_id": "6a89452c",
"model": "glm-5.1",
- "score": 0.255,
- "pc1": -1.3964,
- "pc2": 2.1319,
- "pc3": -1.0933,
- "pc4": 0.5644,
- "pc5": 1.3255,
- "pc6": 0.4211,
- "pc7": 0.5719,
- "pc8": 0.0,
- "pc9": 0.055,
- "pc10": -1.684,
+ "score": 0.73,
+ "pc1": -1.1297,
+ "pc2": 1.8649,
+ "pc3": -0.2083,
+ "pc4": -0.7609,
+ "pc5": 0.8206,
+ "pc6": 0.2342,
+ "pc7": -0.2798,
+ "pc8": -0.2703,
+ "pc9": 0.3136,
+ "pc10": -2.0141,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=off_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "5e2f9389",
"model": "glm-5.1",
- "score": 0.155,
- "pc1": -1.5729,
- "pc2": 1.8885,
- "pc3": -1.0177,
- "pc4": -1.2115,
- "pc5": 2.4342,
- "pc6": 0.6969,
- "pc7": 1.0614,
- "pc8": 0.0,
- "pc9": 0.0877,
- "pc10": -2.4969,
+ "score": 0.535,
+ "pc1": -1.3839,
+ "pc2": 1.544,
+ "pc3": 0.5184,
+ "pc4": 0.7181,
+ "pc5": 2.4653,
+ "pc6": 0.1906,
+ "pc7": -0.733,
+ "pc8": 0.4622,
+ "pc9": 0.6582,
+ "pc10": -2.5876,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=off_tgrep=on_tread=on_twrite=on_web=on_run2",
"short_id": "6cf8d774",
"model": "glm-5.1",
- "score": 0.73,
- "pc1": -1.5729,
- "pc2": 1.8885,
- "pc3": -1.0177,
- "pc4": -1.2115,
- "pc5": 2.4342,
- "pc6": 0.6969,
- "pc7": 1.0614,
- "pc8": 0.0,
- "pc9": 0.0877,
- "pc10": -2.4969,
+ "score": 0.87,
+ "pc1": -1.3839,
+ "pc2": 1.544,
+ "pc3": 0.5184,
+ "pc4": 0.7181,
+ "pc5": 2.4653,
+ "pc6": 0.1906,
+ "pc7": -0.733,
+ "pc8": 0.4622,
+ "pc9": 0.6582,
+ "pc10": -2.5876,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=off_tgrep=on_tread=on_twrite=on_web=on_run3",
"short_id": "61f8b45c",
"model": "glm-5.1",
- "score": 0.305,
- "pc1": -1.5729,
- "pc2": 1.8885,
- "pc3": -1.0177,
- "pc4": -1.2115,
- "pc5": 2.4342,
- "pc6": 0.6969,
- "pc7": 1.0614,
- "pc8": 0.0,
- "pc9": 0.0877,
- "pc10": -2.4969,
+ "score": 0.685,
+ "pc1": -1.3839,
+ "pc2": 1.544,
+ "pc3": 0.5184,
+ "pc4": 0.7181,
+ "pc5": 2.4653,
+ "pc6": 0.1906,
+ "pc7": -0.733,
+ "pc8": 0.4622,
+ "pc9": 0.6582,
+ "pc10": -2.5876,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=off_tread=on_twrite=on_web=on_run1",
"short_id": "b1e752d7",
"model": "glm-5.1",
- "score": 0.385,
- "pc1": -1.4627,
- "pc2": 2.0798,
- "pc3": -1.3239,
- "pc4": -0.294,
- "pc5": 2.1032,
- "pc6": -0.0495,
- "pc7": -1.3355,
- "pc8": -0.0,
- "pc9": -0.0337,
- "pc10": 1.0203,
+ "score": 0.925,
+ "pc1": -1.1059,
+ "pc2": 1.8548,
+ "pc3": 0.0007,
+ "pc4": 0.0517,
+ "pc5": 2.1063,
+ "pc6": 0.0403,
+ "pc7": -0.8328,
+ "pc8": 0.5583,
+ "pc9": -0.1679,
+ "pc10": 1.6055,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=off_tread=on_twrite=on_web=on_run2",
"short_id": "ad47b58e",
"model": "glm-5.1",
- "score": 0.37,
- "pc1": -1.4627,
- "pc2": 2.0798,
- "pc3": -1.3239,
- "pc4": -0.294,
- "pc5": 2.1032,
- "pc6": -0.0495,
- "pc7": -1.3355,
- "pc8": -0.0,
- "pc9": -0.0337,
- "pc10": 1.0203,
+ "score": 0.58,
+ "pc1": -1.1059,
+ "pc2": 1.8548,
+ "pc3": 0.0007,
+ "pc4": 0.0517,
+ "pc5": 2.1063,
+ "pc6": 0.0403,
+ "pc7": -0.8328,
+ "pc8": 0.5583,
+ "pc9": -0.1679,
+ "pc10": 1.6055,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=off_tread=on_twrite=on_web=on_run3",
"short_id": "689ef4b4",
"model": "glm-5.1",
- "score": 0.385,
- "pc1": -1.4627,
- "pc2": 2.0798,
- "pc3": -1.3239,
- "pc4": -0.294,
- "pc5": 2.1032,
- "pc6": -0.0495,
- "pc7": -1.3355,
- "pc8": -0.0,
- "pc9": -0.0337,
- "pc10": 1.0203,
+ "score": 0.92,
+ "pc1": -1.1059,
+ "pc2": 1.8548,
+ "pc3": 0.0007,
+ "pc4": 0.0517,
+ "pc5": 2.1063,
+ "pc6": 0.0403,
+ "pc7": -0.8328,
+ "pc8": 0.5583,
+ "pc9": -0.1679,
+ "pc10": 1.6055,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=off_twrite=on_web=on_run1",
"short_id": "5e839ecf",
"model": "glm-5.1",
- "score": 0.34,
- "pc1": -1.3366,
- "pc2": 2.118,
- "pc3": -1.4115,
- "pc4": -1.23,
- "pc5": -0.511,
- "pc6": 0.4337,
- "pc7": 0.3501,
- "pc8": 0.0,
- "pc9": 0.019,
- "pc10": -0.485,
+ "score": 0.97,
+ "pc1": -1.1088,
+ "pc2": 1.8481,
+ "pc3": -0.2678,
+ "pc4": 1.6102,
+ "pc5": -0.2656,
+ "pc6": 0.642,
+ "pc7": -0.1718,
+ "pc8": 0.5376,
+ "pc9": 0.0782,
+ "pc10": -0.6479,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=off_twrite=on_web=on_run2",
"short_id": "40e70ba8",
"model": "glm-5.1",
- "score": 0.355,
- "pc1": -1.3366,
- "pc2": 2.118,
- "pc3": -1.4115,
- "pc4": -1.23,
- "pc5": -0.511,
- "pc6": 0.4337,
- "pc7": 0.3501,
- "pc8": 0.0,
- "pc9": 0.019,
- "pc10": -0.485,
+ "score": 0.835,
+ "pc1": -1.1088,
+ "pc2": 1.8481,
+ "pc3": -0.2678,
+ "pc4": 1.6102,
+ "pc5": -0.2656,
+ "pc6": 0.642,
+ "pc7": -0.1718,
+ "pc8": 0.5376,
+ "pc9": 0.0782,
+ "pc10": -0.6479,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=off_twrite=on_web=on_run3",
"short_id": "2d900db2",
"model": "glm-5.1",
- "score": 0.225,
- "pc1": -1.3366,
- "pc2": 2.118,
- "pc3": -1.4115,
- "pc4": -1.23,
- "pc5": -0.511,
- "pc6": 0.4337,
- "pc7": 0.3501,
- "pc8": 0.0,
- "pc9": 0.019,
- "pc10": -0.485,
+ "score": 0.95,
+ "pc1": -1.1088,
+ "pc2": 1.8481,
+ "pc3": -0.2678,
+ "pc4": 1.6102,
+ "pc5": -0.2656,
+ "pc6": 0.642,
+ "pc7": -0.1718,
+ "pc8": 0.5376,
+ "pc9": 0.0782,
+ "pc10": -0.6479,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=off_web=on_run1",
"short_id": "dec1df41",
"model": "glm-5.1",
- "score": 0.29,
- "pc1": -1.4196,
- "pc2": 2.0862,
- "pc3": -1.2302,
- "pc4": 1.3464,
- "pc5": 1.8214,
- "pc6": 0.1223,
- "pc7": -0.7436,
- "pc8": -0.0,
- "pc9": 0.0246,
- "pc10": -0.8401,
+ "score": 0.835,
+ "pc1": -1.1043,
+ "pc2": 1.8459,
+ "pc3": -0.5954,
+ "pc4": -1.4778,
+ "pc5": 1.1685,
+ "pc6": -0.14,
+ "pc7": 0.068,
+ "pc8": 0.2487,
+ "pc9": -0.2828,
+ "pc10": 0.5059,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=off_web=on_run2",
"short_id": "7165dc1a",
"model": "glm-5.1",
- "score": 0.295,
- "pc1": -1.4196,
- "pc2": 2.0862,
- "pc3": -1.2302,
- "pc4": 1.3464,
- "pc5": 1.8214,
- "pc6": 0.1223,
- "pc7": -0.7436,
- "pc8": -0.0,
- "pc9": 0.0246,
- "pc10": -0.8401,
+ "score": 0.94,
+ "pc1": -1.1043,
+ "pc2": 1.8459,
+ "pc3": -0.5954,
+ "pc4": -1.4778,
+ "pc5": 1.1685,
+ "pc6": -0.14,
+ "pc7": 0.068,
+ "pc8": 0.2487,
+ "pc9": -0.2828,
+ "pc10": 0.5059,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=off_web=on_run3",
"short_id": "b656c546",
"model": "glm-5.1",
- "score": 0.255,
- "pc1": -1.4196,
- "pc2": 2.0862,
- "pc3": -1.2302,
- "pc4": 1.3464,
- "pc5": 1.8214,
- "pc6": 0.1223,
- "pc7": -0.7436,
- "pc8": -0.0,
- "pc9": 0.0246,
- "pc10": -0.8401,
+ "score": 0.78,
+ "pc1": -1.1043,
+ "pc2": 1.8459,
+ "pc3": -0.5954,
+ "pc4": -1.4778,
+ "pc5": 1.1685,
+ "pc6": -0.14,
+ "pc7": 0.068,
+ "pc8": 0.2487,
+ "pc9": -0.2828,
+ "pc10": 0.5059,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=off_run1",
"short_id": "05ad5c61",
"model": "glm-5.1",
- "score": 0.355,
- "pc1": -1.5063,
- "pc2": 2.3822,
- "pc3": -1.9766,
- "pc4": -0.1512,
- "pc5": -1.1608,
- "pc6": 0.1862,
- "pc7": -0.4397,
- "pc8": -0.0,
- "pc9": 0.017,
- "pc10": -0.6121,
+ "score": 0.835,
+ "pc1": -1.1732,
+ "pc2": 2.1885,
+ "pc3": -0.9362,
+ "pc4": 1.0657,
+ "pc5": -1.297,
+ "pc6": 0.0765,
+ "pc7": 0.3728,
+ "pc8": -0.1931,
+ "pc9": -0.1983,
+ "pc10": 0.3479,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=off_run2",
"short_id": "79bef8d0",
"model": "glm-5.1",
- "score": 0.155,
- "pc1": -1.5063,
- "pc2": 2.3822,
- "pc3": -1.9766,
- "pc4": -0.1512,
- "pc5": -1.1608,
- "pc6": 0.1862,
- "pc7": -0.4397,
- "pc8": -0.0,
- "pc9": 0.017,
- "pc10": -0.6121,
+ "score": 0.59,
+ "pc1": -1.1732,
+ "pc2": 2.1885,
+ "pc3": -0.9362,
+ "pc4": 1.0657,
+ "pc5": -1.297,
+ "pc6": 0.0765,
+ "pc7": 0.3728,
+ "pc8": -0.1931,
+ "pc9": -0.1983,
+ "pc10": 0.3479,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=off_run3",
"short_id": "bb3dc885",
"model": "glm-5.1",
- "score": 0.355,
- "pc1": -1.5063,
- "pc2": 2.3822,
- "pc3": -1.9766,
- "pc4": -0.1512,
- "pc5": -1.1608,
- "pc6": 0.1862,
- "pc7": -0.4397,
- "pc8": -0.0,
- "pc9": 0.017,
- "pc10": -0.6121,
+ "score": 0.95,
+ "pc1": -1.1732,
+ "pc2": 2.1885,
+ "pc3": -0.9362,
+ "pc4": 1.0657,
+ "pc5": -1.297,
+ "pc6": 0.0765,
+ "pc7": 0.3728,
+ "pc8": -0.1931,
+ "pc9": -0.1983,
+ "pc10": 0.3479,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "71d588fb",
"model": "glm-5.1",
- "score": 0.78,
- "pc1": -2.5291,
- "pc2": 0.7685,
- "pc3": -1.5972,
- "pc4": 0.2175,
- "pc5": 0.3226,
- "pc6": 0.2688,
- "pc7": -0.3052,
- "pc8": -0.0,
- "pc9": 0.0153,
- "pc10": -0.3964,
+ "score": 0.65,
+ "pc1": -2.2132,
+ "pc2": 0.373,
+ "pc3": -0.6077,
+ "pc4": 0.0408,
+ "pc5": 0.1105,
+ "pc6": 0.1941,
+ "pc7": -0.1041,
+ "pc8": 0.2127,
+ "pc9": -0.0326,
+ "pc10": -0.0527,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
"short_id": "781c564b",
"model": "glm-5.1",
- "score": 0.38,
- "pc1": -2.5291,
- "pc2": 0.7685,
- "pc3": -1.5972,
- "pc4": 0.2175,
- "pc5": 0.3226,
- "pc6": 0.2688,
- "pc7": -0.3052,
- "pc8": -0.0,
- "pc9": 0.0153,
- "pc10": -0.3964,
+ "score": 0.785,
+ "pc1": -2.2132,
+ "pc2": 0.373,
+ "pc3": -0.6077,
+ "pc4": 0.0408,
+ "pc5": 0.1105,
+ "pc6": 0.1941,
+ "pc7": -0.1041,
+ "pc8": 0.2127,
+ "pc9": -0.0326,
+ "pc10": -0.0527,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
"short_id": "3e9975cb",
"model": "glm-5.1",
- "score": 0.33,
- "pc1": -2.5291,
- "pc2": 0.7685,
- "pc3": -1.5972,
- "pc4": 0.2175,
- "pc5": 0.3226,
- "pc6": 0.2688,
- "pc7": -0.3052,
- "pc8": -0.0,
- "pc9": 0.0153,
- "pc10": -0.3964,
+ "score": 0.835,
+ "pc1": -2.2132,
+ "pc2": 0.373,
+ "pc3": -0.6077,
+ "pc4": 0.0408,
+ "pc5": 0.1105,
+ "pc6": 0.1941,
+ "pc7": -0.1041,
+ "pc8": 0.2127,
+ "pc9": -0.0326,
+ "pc10": -0.0527,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=plan_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "f8d9ace7",
+ "model": "glm-5.1",
+ "score": 0.795,
+ "pc1": -2.0011,
+ "pc2": -0.2244,
+ "pc3": -0.6341,
+ "pc4": -0.0767,
+ "pc5": -0.3085,
+ "pc6": 0.4335,
+ "pc7": 0.05,
+ "pc8": 0.2372,
+ "pc9": -0.1278,
+ "pc10": 0.0162,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=plan_first"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=plan_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "2620a1cf",
+ "model": "glm-5.1",
+ "score": 0.665,
+ "pc1": -2.0011,
+ "pc2": -0.2244,
+ "pc3": -0.6341,
+ "pc4": -0.0767,
+ "pc5": -0.3085,
+ "pc6": 0.4335,
+ "pc7": 0.05,
+ "pc8": 0.2372,
+ "pc9": -0.1278,
+ "pc10": 0.0162,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=plan_first"
+ },
+ {
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=plan_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
"short_id": "0503113f",
"model": "glm-5.1",
- "score": 0.23,
- "pc1": -2.3813,
- "pc2": 0.2153,
- "pc3": -1.2551,
- "pc4": 0.3035,
- "pc5": 0.1288,
- "pc6": 0.231,
- "pc7": -0.4775,
- "pc8": -0.0,
- "pc9": -0.004,
- "pc10": -0.2434,
+ "score": 0.785,
+ "pc1": -2.0011,
+ "pc2": -0.2244,
+ "pc3": -0.6341,
+ "pc4": -0.0767,
+ "pc5": -0.3085,
+ "pc6": 0.4335,
+ "pc7": 0.05,
+ "pc8": 0.2372,
+ "pc9": -0.1278,
+ "pc10": 0.0162,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=plan_first"
},
{
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=review_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "a4d1e302",
+ "model": "glm-5.1",
+ "score": 0.685,
+ "pc1": -2.0374,
+ "pc2": -0.1993,
+ "pc3": -0.7047,
+ "pc4": -0.0873,
+ "pc5": -0.1213,
+ "pc6": 0.5899,
+ "pc7": -0.1717,
+ "pc8": 0.4315,
+ "pc9": -0.0705,
+ "pc10": -0.4289,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=review"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=review_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "2267b9f4",
+ "model": "glm-5.1",
+ "score": 0.785,
+ "pc1": -2.0374,
+ "pc2": -0.1993,
+ "pc3": -0.7047,
+ "pc4": -0.0873,
+ "pc5": -0.1213,
+ "pc6": 0.5899,
+ "pc7": -0.1717,
+ "pc8": 0.4315,
+ "pc9": -0.0705,
+ "pc10": -0.4289,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=review"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=review_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "e3a6ea3c",
+ "model": "glm-5.1",
+ "score": 0.785,
+ "pc1": -2.0374,
+ "pc2": -0.1993,
+ "pc3": -0.7047,
+ "pc4": -0.0873,
+ "pc5": -0.1213,
+ "pc6": 0.5899,
+ "pc7": -0.1717,
+ "pc8": 0.4315,
+ "pc9": -0.0705,
+ "pc10": -0.4289,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=review"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=split_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "bb361eb9",
+ "model": "glm-5.1",
+ "score": 0.5,
+ "pc1": -2.0427,
+ "pc2": -0.184,
+ "pc3": -0.6327,
+ "pc4": -0.0738,
+ "pc5": -0.132,
+ "pc6": 0.4131,
+ "pc7": -0.0851,
+ "pc8": 0.2509,
+ "pc9": -0.3255,
+ "pc10": -0.0555,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=split_work"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=split_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "28bf03d9",
+ "model": "glm-5.1",
+ "score": 0.5,
+ "pc1": -2.0427,
+ "pc2": -0.184,
+ "pc3": -0.6327,
+ "pc4": -0.0738,
+ "pc5": -0.132,
+ "pc6": 0.4131,
+ "pc7": -0.0851,
+ "pc8": 0.2509,
+ "pc9": -0.3255,
+ "pc10": -0.0555,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=split_work"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=split_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "63a42bc7",
+ "model": "glm-5.1",
+ "score": 0.475,
+ "pc1": -2.0427,
+ "pc2": -0.184,
+ "pc3": -0.6327,
+ "pc4": -0.0738,
+ "pc5": -0.132,
+ "pc6": 0.4131,
+ "pc7": -0.0851,
+ "pc8": 0.2509,
+ "pc9": -0.3255,
+ "pc10": -0.0555,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=split_work"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "ede08543",
+ "model": "glm-5.1",
+ "score": 0.81,
+ "pc1": -1.1622,
+ "pc2": -0.635,
+ "pc3": -0.9717,
+ "pc4": 0.0754,
+ "pc5": 0.0278,
+ "pc6": 0.2529,
+ "pc7": -0.1347,
+ "pc8": 0.2,
+ "pc9": -0.0415,
+ "pc10": 0.0644,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "d65aa9f3",
+ "model": "glm-5.1",
+ "score": 0.785,
+ "pc1": -1.1622,
+ "pc2": -0.635,
+ "pc3": -0.9717,
+ "pc4": 0.0754,
+ "pc5": 0.0278,
+ "pc6": 0.2529,
+ "pc7": -0.1347,
+ "pc8": 0.2,
+ "pc9": -0.0415,
+ "pc10": 0.0644,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "5514ba1d",
+ "model": "glm-5.1",
+ "score": 0.545,
+ "pc1": -1.1622,
+ "pc2": -0.635,
+ "pc3": -0.9717,
+ "pc4": 0.0754,
+ "pc5": 0.0278,
+ "pc6": 0.2529,
+ "pc7": -0.1347,
+ "pc8": 0.2,
+ "pc9": -0.0415,
+ "pc10": 0.0644,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=svg_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "f3626e24",
+ "model": "glm-5.1",
+ "score": 0.835,
+ "pc1": -3.1328,
+ "pc2": 0.7025,
+ "pc3": -2.0202,
+ "pc4": 0.2322,
+ "pc5": 0.657,
+ "pc6": -3.6694,
+ "pc7": -1.2748,
+ "pc8": -2.9607,
+ "pc9": 0.8158,
+ "pc10": 0.1605,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=svg_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "5411d5ce",
+ "model": "glm-5.1",
+ "score": 0.39,
+ "pc1": -3.1328,
+ "pc2": 0.7025,
+ "pc3": -2.0202,
+ "pc4": 0.2322,
+ "pc5": 0.657,
+ "pc6": -3.6694,
+ "pc7": -1.2748,
+ "pc8": -2.9607,
+ "pc9": 0.8158,
+ "pc10": 0.1605,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=svg_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "8cf0fbde",
+ "model": "glm-5.1",
+ "score": 0.5,
+ "pc1": -3.1328,
+ "pc2": 0.7025,
+ "pc3": -2.0202,
+ "pc4": 0.2322,
+ "pc5": 0.657,
+ "pc6": -3.6694,
+ "pc7": -1.2748,
+ "pc8": -2.9607,
+ "pc9": 0.8158,
+ "pc10": 0.1605,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=webgl_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "16dab3d1",
+ "model": "glm-5.1",
+ "score": 0.785,
+ "pc1": -3.1327,
+ "pc2": 0.6865,
+ "pc3": -2.1169,
+ "pc4": 0.2344,
+ "pc5": 0.8437,
+ "pc6": -3.6935,
+ "pc7": -1.1313,
+ "pc8": -2.7182,
+ "pc9": 0.8883,
+ "pc10": 0.2994,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=webgl_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
"short_id": "14486646",
"model": "glm-5.1",
- "score": 0.365,
- "pc1": -3.5024,
- "pc2": 1.062,
- "pc3": -1.7619,
- "pc4": 0.4752,
- "pc5": 0.9625,
- "pc6": 4.0055,
- "pc7": 3.506,
- "pc8": 0.0,
- "pc9": 0.0038,
- "pc10": 2.5946,
+ "score": 0.575,
+ "pc1": -3.1327,
+ "pc2": 0.6865,
+ "pc3": -2.1169,
+ "pc4": 0.2344,
+ "pc5": 0.8437,
+ "pc6": -3.6935,
+ "pc7": -1.1313,
+ "pc8": -2.7182,
+ "pc9": 0.8883,
+ "pc10": 0.2994,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=webgl_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "31d60e5a",
+ "model": "glm-5.1",
+ "score": 0.785,
+ "pc1": -3.1327,
+ "pc2": 0.6865,
+ "pc3": -2.1169,
+ "pc4": 0.2344,
+ "pc5": 0.8437,
+ "pc6": -3.6935,
+ "pc7": -1.1313,
+ "pc8": -2.7182,
+ "pc9": 0.8883,
+ "pc10": 0.2994,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=detailed_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=detailed_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run4",
"short_id": "cbbff570",
"model": "haiku-4.5",
- "score": 0.515,
- "pc1": 2.3625,
- "pc2": -1.1242,
- "pc3": -0.4301,
- "pc4": -1.5018,
- "pc5": -2.7554,
- "pc6": 0.1183,
- "pc7": 0.1311,
- "pc8": -0.0,
- "pc9": -0.0352,
- "pc10": 1.4855,
+ "score": 0.925,
+ "pc1": 3.197,
+ "pc2": -1.0414,
+ "pc3": -1.1458,
+ "pc4": 2.5105,
+ "pc5": -2.1998,
+ "pc6": 0.0495,
+ "pc7": 0.4999,
+ "pc8": -0.0834,
+ "pc9": -0.1691,
+ "pc10": 0.5484,
"config_summary": "effort=high, prompt_style=detailed, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=detailed_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=detailed_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run5",
"short_id": "62c70152",
"model": "haiku-4.5",
- "score": 0.34,
- "pc1": 2.3625,
- "pc2": -1.1242,
- "pc3": -0.4301,
- "pc4": -1.5018,
- "pc5": -2.7554,
- "pc6": 0.1183,
- "pc7": 0.1311,
- "pc8": -0.0,
- "pc9": -0.0352,
- "pc10": 1.4855,
+ "score": 0.89,
+ "pc1": 3.197,
+ "pc2": -1.0414,
+ "pc3": -1.1458,
+ "pc4": 2.5105,
+ "pc5": -2.1998,
+ "pc6": 0.0495,
+ "pc7": 0.4999,
+ "pc8": -0.0834,
+ "pc9": -0.1691,
+ "pc10": 0.5484,
"config_summary": "effort=high, prompt_style=detailed, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=detailed_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=detailed_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run6",
"short_id": "80f1c3d5",
"model": "haiku-4.5",
- "score": 0.565,
- "pc1": 2.3625,
- "pc2": -1.1242,
- "pc3": -0.4301,
- "pc4": -1.5018,
- "pc5": -2.7554,
- "pc6": 0.1183,
- "pc7": 0.1311,
- "pc8": -0.0,
- "pc9": -0.0352,
- "pc10": 1.4855,
+ "score": 0.86,
+ "pc1": 3.197,
+ "pc2": -1.0414,
+ "pc3": -1.1458,
+ "pc4": 2.5105,
+ "pc5": -2.1998,
+ "pc6": 0.0495,
+ "pc7": 0.4999,
+ "pc8": -0.0834,
+ "pc9": -0.1691,
+ "pc10": 0.5484,
"config_summary": "effort=high, prompt_style=detailed, language=typescript, max_budget=low, strategy=use_subagents"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "3fc392c9",
"model": "haiku-4.5",
- "score": 0.275,
- "pc1": 0.4937,
- "pc2": -1.1585,
- "pc3": 0.1735,
- "pc4": -0.2544,
- "pc5": 0.1955,
- "pc6": 0.2051,
- "pc7": 0.4257,
- "pc8": 0.0,
- "pc9": 0.0084,
- "pc10": 0.1424,
+ "score": 0.66,
+ "pc1": 1.1911,
+ "pc2": -1.2771,
+ "pc3": -0.0269,
+ "pc4": 0.2296,
+ "pc5": 0.3035,
+ "pc6": -0.1053,
+ "pc7": -0.104,
+ "pc8": 0.0632,
+ "pc9": 0.1088,
+ "pc10": -0.1438,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run4",
"short_id": "a30100ff",
"model": "haiku-4.5",
- "score": 0.155,
- "pc1": 0.4937,
- "pc2": -1.1585,
- "pc3": 0.1735,
- "pc4": -0.2544,
- "pc5": 0.1955,
- "pc6": 0.2051,
- "pc7": 0.4257,
- "pc8": 0.0,
- "pc9": 0.0084,
- "pc10": 0.1424,
+ "score": 0.57,
+ "pc1": 1.1911,
+ "pc2": -1.2771,
+ "pc3": -0.0269,
+ "pc4": 0.2296,
+ "pc5": 0.3035,
+ "pc6": -0.1053,
+ "pc7": -0.104,
+ "pc8": 0.0632,
+ "pc9": 0.1088,
+ "pc10": -0.1438,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run5",
"short_id": "645e0c8f",
"model": "haiku-4.5",
- "score": 0.155,
- "pc1": 0.4937,
- "pc2": -1.1585,
- "pc3": 0.1735,
- "pc4": -0.2544,
- "pc5": 0.1955,
- "pc6": 0.2051,
- "pc7": 0.4257,
- "pc8": 0.0,
- "pc9": 0.0084,
- "pc10": 0.1424,
+ "score": 0.61,
+ "pc1": 1.1911,
+ "pc2": -1.2771,
+ "pc3": -0.0269,
+ "pc4": 0.2296,
+ "pc5": 0.3035,
+ "pc6": -0.1053,
+ "pc7": -0.104,
+ "pc8": 0.0632,
+ "pc9": 0.1088,
+ "pc10": -0.1438,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=off_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=off_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run4",
"short_id": "188635cc",
"model": "haiku-4.5",
- "score": 0.155,
- "pc1": 2.6696,
- "pc2": -0.8362,
- "pc3": 0.7065,
- "pc4": 0.1822,
- "pc5": 1.0129,
- "pc6": 0.3357,
- "pc7": 1.2343,
- "pc8": 0.0,
- "pc9": 0.0405,
- "pc10": -0.9335,
+ "score": 0.78,
+ "pc1": 3.3257,
+ "pc2": -0.7933,
+ "pc3": 0.0085,
+ "pc4": -0.5375,
+ "pc5": 0.9309,
+ "pc6": -0.0062,
+ "pc7": -0.3102,
+ "pc8": -0.4325,
+ "pc9": 0.4461,
+ "pc10": -1.9882,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=off_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=off_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run5",
"short_id": "9805c24a",
"model": "haiku-4.5",
- "score": 0.565,
- "pc1": 2.6696,
- "pc2": -0.8362,
- "pc3": 0.7065,
- "pc4": 0.1822,
- "pc5": 1.0129,
- "pc6": 0.3357,
- "pc7": 1.2343,
- "pc8": 0.0,
- "pc9": 0.0405,
- "pc10": -0.9335,
+ "score": 0.74,
+ "pc1": 3.3257,
+ "pc2": -0.7933,
+ "pc3": 0.0085,
+ "pc4": -0.5375,
+ "pc5": 0.9309,
+ "pc6": -0.0062,
+ "pc7": -0.3102,
+ "pc8": -0.4325,
+ "pc9": 0.4461,
+ "pc10": -1.9882,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=off_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=off_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run6",
"short_id": "5cdb89b6",
"model": "haiku-4.5",
- "score": 0.155,
- "pc1": 2.6696,
- "pc2": -0.8362,
- "pc3": 0.7065,
- "pc4": 0.1822,
- "pc5": 1.0129,
- "pc6": 0.3357,
- "pc7": 1.2343,
- "pc8": 0.0,
- "pc9": 0.0405,
- "pc10": -0.9335,
+ "score": 0.78,
+ "pc1": 3.3257,
+ "pc2": -0.7933,
+ "pc3": 0.0085,
+ "pc4": -0.5375,
+ "pc5": 0.9309,
+ "pc6": -0.0062,
+ "pc7": -0.3102,
+ "pc8": -0.4325,
+ "pc9": 0.4461,
+ "pc10": -1.9882,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=off_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=off_tgrep=on_tread=on_twrite=on_web=on_run4",
"short_id": "4949d521",
"model": "haiku-4.5",
- "score": 0.155,
- "pc1": 2.493,
- "pc2": -1.0796,
- "pc3": 0.7821,
- "pc4": -1.5937,
- "pc5": 2.1217,
- "pc6": 0.6115,
- "pc7": 1.7238,
- "pc8": 0.0,
- "pc9": 0.0732,
- "pc10": -1.7464,
+ "score": 0.5,
+ "pc1": 3.0715,
+ "pc2": -1.1142,
+ "pc3": 0.7352,
+ "pc4": 0.9416,
+ "pc5": 2.5757,
+ "pc6": -0.0498,
+ "pc7": -0.7634,
+ "pc8": 0.3,
+ "pc9": 0.7907,
+ "pc10": -2.5618,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=off_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=off_tgrep=on_tread=on_twrite=on_web=on_run5",
"short_id": "165fb66f",
"model": "haiku-4.5",
- "score": 0.305,
- "pc1": 2.493,
- "pc2": -1.0796,
- "pc3": 0.7821,
- "pc4": -1.5937,
- "pc5": 2.1217,
- "pc6": 0.6115,
- "pc7": 1.7238,
- "pc8": 0.0,
- "pc9": 0.0732,
- "pc10": -1.7464,
+ "score": 0.515,
+ "pc1": 3.0715,
+ "pc2": -1.1142,
+ "pc3": 0.7352,
+ "pc4": 0.9416,
+ "pc5": 2.5757,
+ "pc6": -0.0498,
+ "pc7": -0.7634,
+ "pc8": 0.3,
+ "pc9": 0.7907,
+ "pc10": -2.5618,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=off_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=off_tgrep=on_tread=on_twrite=on_web=on_run6",
"short_id": "af738eee",
"model": "haiku-4.5",
- "score": 0.28,
- "pc1": 2.493,
- "pc2": -1.0796,
- "pc3": 0.7821,
- "pc4": -1.5937,
- "pc5": 2.1217,
- "pc6": 0.6115,
- "pc7": 1.7238,
- "pc8": 0.0,
- "pc9": 0.0732,
- "pc10": -1.7464,
+ "score": 0.78,
+ "pc1": 3.0715,
+ "pc2": -1.1142,
+ "pc3": 0.7352,
+ "pc4": 0.9416,
+ "pc5": 2.5757,
+ "pc6": -0.0498,
+ "pc7": -0.7634,
+ "pc8": 0.3,
+ "pc9": 0.7907,
+ "pc10": -2.5618,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=off_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=off_tread=on_twrite=on_web=on_run4",
"short_id": "da87903f",
"model": "haiku-4.5",
- "score": 0.755,
- "pc1": 2.6033,
- "pc2": -0.8883,
- "pc3": 0.4759,
- "pc4": -0.6762,
- "pc5": 1.7907,
- "pc6": -0.1349,
- "pc7": -0.6731,
- "pc8": -0.0,
- "pc9": -0.0482,
- "pc10": 1.7708,
+ "score": 0.88,
+ "pc1": 3.3495,
+ "pc2": -0.8034,
+ "pc3": 0.2175,
+ "pc4": 0.2752,
+ "pc5": 2.2167,
+ "pc6": -0.2002,
+ "pc7": -0.8633,
+ "pc8": 0.3961,
+ "pc9": -0.0354,
+ "pc10": 1.6313,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=off_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=off_tread=on_twrite=on_web=on_run5",
"short_id": "49012037",
"model": "haiku-4.5",
- "score": 0.315,
- "pc1": 2.6033,
- "pc2": -0.8883,
- "pc3": 0.4759,
- "pc4": -0.6762,
- "pc5": 1.7907,
- "pc6": -0.1349,
- "pc7": -0.6731,
- "pc8": -0.0,
- "pc9": -0.0482,
- "pc10": 1.7708,
+ "score": 0.765,
+ "pc1": 3.3495,
+ "pc2": -0.8034,
+ "pc3": 0.2175,
+ "pc4": 0.2752,
+ "pc5": 2.2167,
+ "pc6": -0.2002,
+ "pc7": -0.8633,
+ "pc8": 0.3961,
+ "pc9": -0.0354,
+ "pc10": 1.6313,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=off_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=off_tread=on_twrite=on_web=on_run6",
"short_id": "4b5f4543",
"model": "haiku-4.5",
- "score": 0.305,
- "pc1": 2.6033,
- "pc2": -0.8883,
- "pc3": 0.4759,
- "pc4": -0.6762,
- "pc5": 1.7907,
- "pc6": -0.1349,
- "pc7": -0.6731,
- "pc8": -0.0,
- "pc9": -0.0482,
- "pc10": 1.7708,
+ "score": 0.71,
+ "pc1": 3.3495,
+ "pc2": -0.8034,
+ "pc3": 0.2175,
+ "pc4": 0.2752,
+ "pc5": 2.2167,
+ "pc6": -0.2002,
+ "pc7": -0.8633,
+ "pc8": 0.3961,
+ "pc9": -0.0354,
+ "pc10": 1.6313,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=off_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=off_twrite=on_web=on_run4",
"short_id": "37c69c60",
"model": "haiku-4.5",
- "score": 0.19,
- "pc1": 2.7293,
- "pc2": -0.8501,
- "pc3": 0.3883,
- "pc4": -1.6122,
- "pc5": -0.8235,
- "pc6": 0.3483,
- "pc7": 1.0124,
- "pc8": 0.0,
- "pc9": 0.0045,
- "pc10": 0.2655,
+ "score": 0.83,
+ "pc1": 3.3466,
+ "pc2": -0.8101,
+ "pc3": -0.051,
+ "pc4": 1.8336,
+ "pc5": -0.1553,
+ "pc6": 0.4016,
+ "pc7": -0.2022,
+ "pc8": 0.3753,
+ "pc9": 0.2107,
+ "pc10": -0.6221,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=off_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=off_twrite=on_web=on_run5",
"short_id": "77c2245c",
"model": "haiku-4.5",
- "score": 0.155,
- "pc1": 2.7293,
- "pc2": -0.8501,
- "pc3": 0.3883,
- "pc4": -1.6122,
- "pc5": -0.8235,
- "pc6": 0.3483,
- "pc7": 1.0124,
- "pc8": 0.0,
- "pc9": 0.0045,
- "pc10": 0.2655,
+ "score": 0.46,
+ "pc1": 3.3466,
+ "pc2": -0.8101,
+ "pc3": -0.051,
+ "pc4": 1.8336,
+ "pc5": -0.1553,
+ "pc6": 0.4016,
+ "pc7": -0.2022,
+ "pc8": 0.3753,
+ "pc9": 0.2107,
+ "pc10": -0.6221,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=off_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=off_twrite=on_web=on_run6",
"short_id": "fe986bd0",
"model": "haiku-4.5",
- "score": 0.405,
- "pc1": 2.7293,
- "pc2": -0.8501,
- "pc3": 0.3883,
- "pc4": -1.6122,
- "pc5": -0.8235,
- "pc6": 0.3483,
- "pc7": 1.0124,
- "pc8": 0.0,
- "pc9": 0.0045,
- "pc10": 0.2655,
+ "score": 0.715,
+ "pc1": 3.3466,
+ "pc2": -0.8101,
+ "pc3": -0.051,
+ "pc4": 1.8336,
+ "pc5": -0.1553,
+ "pc6": 0.4016,
+ "pc7": -0.2022,
+ "pc8": 0.3753,
+ "pc9": 0.2107,
+ "pc10": -0.6221,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=off_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=off_web=on_run4",
"short_id": "0d40c124",
"model": "haiku-4.5",
- "score": 0.87,
- "pc1": 2.6463,
- "pc2": -0.8819,
- "pc3": 0.5696,
- "pc4": 0.9642,
- "pc5": 1.5088,
- "pc6": 0.0368,
- "pc7": -0.0813,
- "pc8": -0.0,
- "pc9": 0.0101,
- "pc10": -0.0896,
+ "score": 0.94,
+ "pc1": 3.3511,
+ "pc2": -0.8123,
+ "pc3": -0.3786,
+ "pc4": -1.2544,
+ "pc5": 1.2788,
+ "pc6": -0.3805,
+ "pc7": 0.0376,
+ "pc8": 0.0865,
+ "pc9": -0.1503,
+ "pc10": 0.5318,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=off_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=off_web=on_run5",
"short_id": "4d6ff9c9",
"model": "haiku-4.5",
- "score": 0.34,
- "pc1": 2.6463,
- "pc2": -0.8819,
- "pc3": 0.5696,
- "pc4": 0.9642,
- "pc5": 1.5088,
- "pc6": 0.0368,
- "pc7": -0.0813,
- "pc8": -0.0,
- "pc9": 0.0101,
- "pc10": -0.0896,
+ "score": 0.85,
+ "pc1": 3.3511,
+ "pc2": -0.8123,
+ "pc3": -0.3786,
+ "pc4": -1.2544,
+ "pc5": 1.2788,
+ "pc6": -0.3805,
+ "pc7": 0.0376,
+ "pc8": 0.0865,
+ "pc9": -0.1503,
+ "pc10": 0.5318,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=off_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=off_web=on_run6",
"short_id": "1a5b849b",
"model": "haiku-4.5",
- "score": 0.405,
- "pc1": 2.6463,
- "pc2": -0.8819,
- "pc3": 0.5696,
- "pc4": 0.9642,
- "pc5": 1.5088,
- "pc6": 0.0368,
- "pc7": -0.0813,
- "pc8": -0.0,
- "pc9": 0.0101,
- "pc10": -0.0896,
+ "score": 0.725,
+ "pc1": 3.3511,
+ "pc2": -0.8123,
+ "pc3": -0.3786,
+ "pc4": -1.2544,
+ "pc5": 1.2788,
+ "pc6": -0.3805,
+ "pc7": 0.0376,
+ "pc8": 0.0865,
+ "pc9": -0.1503,
+ "pc10": 0.5318,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=off_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=off_run3",
"short_id": "e01fbfa7",
"model": "haiku-4.5",
- "score": 0.33,
- "pc1": 2.5596,
- "pc2": -0.5859,
- "pc3": -0.1768,
- "pc4": -0.5334,
- "pc5": -1.4734,
- "pc6": 0.1008,
- "pc7": 0.2226,
- "pc8": 0.0,
- "pc9": 0.0025,
- "pc10": 0.1384,
+ "score": 0.785,
+ "pc1": 3.2822,
+ "pc2": -0.4697,
+ "pc3": -0.7194,
+ "pc4": 1.2891,
+ "pc5": -1.1867,
+ "pc6": -0.1639,
+ "pc7": 0.3424,
+ "pc8": -0.3553,
+ "pc9": -0.0658,
+ "pc10": 0.3737,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=off_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=off_run4",
"short_id": "bf5c394f",
"model": "haiku-4.5",
- "score": 0.875,
- "pc1": 2.5596,
- "pc2": -0.5859,
- "pc3": -0.1768,
- "pc4": -0.5334,
- "pc5": -1.4734,
- "pc6": 0.1008,
- "pc7": 0.2226,
- "pc8": 0.0,
- "pc9": 0.0025,
- "pc10": 0.1384,
+ "score": 0.925,
+ "pc1": 3.2822,
+ "pc2": -0.4697,
+ "pc3": -0.7194,
+ "pc4": 1.2891,
+ "pc5": -1.1867,
+ "pc6": -0.1639,
+ "pc7": 0.3424,
+ "pc8": -0.3553,
+ "pc9": -0.0658,
+ "pc10": 0.3737,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run4",
"short_id": "4bdcef51",
"model": "haiku-4.5",
- "score": 0.305,
- "pc1": 1.5369,
- "pc2": -2.1996,
- "pc3": 0.2026,
- "pc4": -0.1647,
- "pc5": 0.0101,
- "pc6": 0.1834,
- "pc7": 0.3572,
- "pc8": 0.0,
- "pc9": 0.0008,
- "pc10": 0.3541,
+ "score": 0.62,
+ "pc1": 2.2422,
+ "pc2": -2.2851,
+ "pc3": -0.3909,
+ "pc4": 0.2642,
+ "pc5": 0.2208,
+ "pc6": -0.0464,
+ "pc7": -0.1345,
+ "pc8": 0.0505,
+ "pc9": 0.0999,
+ "pc10": -0.0268,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run5",
"short_id": "4db28f22",
"model": "haiku-4.5",
- "score": 0.155,
- "pc1": 1.5369,
- "pc2": -2.1996,
- "pc3": 0.2026,
- "pc4": -0.1647,
- "pc5": 0.0101,
- "pc6": 0.1834,
- "pc7": 0.3572,
- "pc8": 0.0,
- "pc9": 0.0008,
- "pc10": 0.3541,
+ "score": 0.735,
+ "pc1": 2.2422,
+ "pc2": -2.2851,
+ "pc3": -0.3909,
+ "pc4": 0.2642,
+ "pc5": 0.2208,
+ "pc6": -0.0464,
+ "pc7": -0.1345,
+ "pc8": 0.0505,
+ "pc9": 0.0999,
+ "pc10": -0.0268,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run6",
"short_id": "6b13f05b",
"model": "haiku-4.5",
- "score": 0.675,
- "pc1": 1.5369,
- "pc2": -2.1996,
- "pc3": 0.2026,
- "pc4": -0.1647,
- "pc5": 0.0101,
- "pc6": 0.1834,
- "pc7": 0.3572,
- "pc8": 0.0,
- "pc9": 0.0008,
- "pc10": 0.3541,
+ "score": 0.705,
+ "pc1": 2.2422,
+ "pc2": -2.2851,
+ "pc3": -0.3909,
+ "pc4": 0.2642,
+ "pc5": 0.2208,
+ "pc6": -0.0464,
+ "pc7": -0.1345,
+ "pc8": 0.0505,
+ "pc9": 0.0999,
+ "pc10": -0.0268,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=off_prompt=detailed_prov=anth_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "e5a1fdcc",
"model": "haiku-4.5",
- "score": 0.355,
- "pc1": 0.1908,
- "pc2": 0.8933,
- "pc3": -0.3546,
- "pc4": -1.3713,
- "pc5": -2.6055,
- "pc6": 0.0891,
- "pc7": 0.1452,
- "pc8": -0.0,
- "pc9": -0.0327,
- "pc10": 1.3121,
+ "score": 0.95,
+ "pc1": 0.9679,
+ "pc2": 0.9233,
+ "pc3": -0.4896,
+ "pc4": 2.189,
+ "pc5": -2.3566,
+ "pc6": -0.0095,
+ "pc7": 0.6976,
+ "pc8": -0.1446,
+ "pc9": -0.2438,
+ "pc10": 0.4147,
"config_summary": "effort=high, prompt_style=detailed, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=canvas_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "671f2f16",
- "model": "haiku-4.5",
- "score": 0.325,
- "pc1": -1.5783,
- "pc2": 0.0777,
- "pc3": 0.4201,
- "pc4": 0.1858,
- "pc5": 0.7381,
- "pc6": 3.8462,
- "pc7": 4.2767,
- "pc8": 0.0,
- "pc9": -0.0132,
- "pc10": 3.2757,
- "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
- },
- {
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=dom_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "6134c96d",
- "model": "haiku-4.5",
- "score": 0.325,
- "pc1": -1.6398,
- "pc2": 0.146,
- "pc3": -0.1974,
- "pc4": 0.2622,
- "pc5": 0.864,
- "pc6": 3.9454,
- "pc7": 4.0963,
- "pc8": 0.0,
- "pc9": -0.0032,
- "pc10": 3.0738,
- "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
- },
- {
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=none_strat=cv_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "17cc50c2",
"model": "haiku-4.5",
- "score": 0.155,
- "pc1": -0.507,
- "pc2": -0.7147,
- "pc3": 0.2776,
- "pc4": 0.1159,
- "pc5": -0.0057,
- "pc6": -0.1358,
- "pc7": 0.0496,
- "pc8": 0.0,
- "pc9": -0.0161,
- "pc10": 0.3273,
+ "score": 0.535,
+ "pc1": 0.244,
+ "pc2": -0.9073,
+ "pc3": 0.3077,
+ "pc4": -0.2955,
+ "pc5": -0.4224,
+ "pc6": -0.0115,
+ "pc7": 0.2069,
+ "pc8": -0.1303,
+ "pc9": 0.0423,
+ "pc10": -0.5017,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=creative_validate"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=none_strat=delegate_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "efb51112",
- "model": "haiku-4.5",
- "score": 0.305,
- "pc1": -0.4688,
- "pc2": -0.7611,
- "pc3": 0.9219,
- "pc4": 0.0144,
- "pc5": -0.0973,
- "pc6": 0.0586,
- "pc7": 0.2558,
- "pc8": -0.0,
- "pc9": -0.0217,
- "pc10": 0.4145,
- "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=delegate"
- },
- {
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=none_strat=iterate_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "0d11620e",
"model": "haiku-4.5",
- "score": 0.275,
- "pc1": -0.4989,
- "pc2": -0.7215,
- "pc3": 0.4199,
- "pc4": 0.085,
- "pc5": -0.0087,
- "pc6": 0.0317,
- "pc7": 0.1284,
- "pc8": 0.0,
- "pc9": -0.0148,
- "pc10": 0.3131,
+ "score": 0.72,
+ "pc1": 0.2269,
+ "pc2": -0.8953,
+ "pc3": 0.4069,
+ "pc4": -0.0988,
+ "pc5": -0.3059,
+ "pc6": -0.3484,
+ "pc7": 0.4146,
+ "pc8": -0.2461,
+ "pc9": -0.329,
+ "pc10": -0.2557,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=iterate"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=none_strat=none_tst=none_tedit=off_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "03d2b4a7",
"model": "haiku-4.5",
- "score": 0.855,
- "pc1": 0.4979,
- "pc2": 1.1813,
- "pc3": 0.782,
- "pc4": 0.3127,
- "pc5": 1.1629,
- "pc6": 0.3065,
- "pc7": 1.2484,
- "pc8": 0.0,
- "pc9": 0.0429,
- "pc10": -1.1069,
+ "score": 0.92,
+ "pc1": 1.0966,
+ "pc2": 1.1714,
+ "pc3": 0.6647,
+ "pc4": -0.859,
+ "pc5": 0.7741,
+ "pc6": -0.0653,
+ "pc7": -0.1125,
+ "pc8": -0.4937,
+ "pc9": 0.3714,
+ "pc10": -2.1219,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=none_strat=none_tst=none_tedit=on_tglob=off_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "40ab6d27",
"model": "haiku-4.5",
- "score": 0.295,
- "pc1": 0.3213,
- "pc2": 0.9379,
- "pc3": 0.8576,
- "pc4": -1.4633,
- "pc5": 2.2717,
- "pc6": 0.5823,
- "pc7": 1.7379,
- "pc8": 0.0,
- "pc9": 0.0756,
- "pc10": -1.9198,
+ "score": 0.895,
+ "pc1": 0.8424,
+ "pc2": 0.8505,
+ "pc3": 1.3914,
+ "pc4": 0.62,
+ "pc5": 2.4188,
+ "pc6": -0.1089,
+ "pc7": -0.5657,
+ "pc8": 0.2389,
+ "pc9": 0.7161,
+ "pc10": -2.6955,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=off_tread=on_twrite=on_web=on_run1",
"short_id": "8a258788",
"model": "haiku-4.5",
- "score": 0.78,
- "pc1": 0.4315,
- "pc2": 1.1292,
- "pc3": 0.5514,
- "pc4": -0.5458,
- "pc5": 1.9406,
- "pc6": -0.1641,
- "pc7": -0.659,
- "pc8": -0.0,
- "pc9": -0.0458,
- "pc10": 1.5974,
+ "score": 0.92,
+ "pc1": 1.1204,
+ "pc2": 1.1613,
+ "pc3": 0.8737,
+ "pc4": -0.0463,
+ "pc5": 2.0598,
+ "pc6": -0.2592,
+ "pc7": -0.6655,
+ "pc8": 0.3349,
+ "pc9": -0.1101,
+ "pc10": 1.4976,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=off_twrite=on_web=on_run1",
"short_id": "030815a1",
"model": "haiku-4.5",
- "score": 0.305,
- "pc1": 0.5576,
- "pc2": 1.1674,
- "pc3": 0.4638,
- "pc4": -1.4818,
- "pc5": -0.6736,
- "pc6": 0.3191,
- "pc7": 1.0265,
- "pc8": 0.0,
- "pc9": 0.0069,
- "pc10": 0.0921,
+ "score": 0.73,
+ "pc1": 1.1175,
+ "pc2": 1.1546,
+ "pc3": 0.6052,
+ "pc4": 1.5121,
+ "pc5": -0.3121,
+ "pc6": 0.3425,
+ "pc7": -0.0045,
+ "pc8": 0.3142,
+ "pc9": 0.136,
+ "pc10": -0.7558,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=off_web=on_run1",
"short_id": "7d789f16",
"model": "haiku-4.5",
- "score": 0.305,
- "pc1": 0.4746,
- "pc2": 1.1356,
- "pc3": 0.6451,
- "pc4": 1.0947,
- "pc5": 1.6588,
- "pc6": 0.0076,
- "pc7": -0.0672,
- "pc8": -0.0,
- "pc9": 0.0126,
- "pc10": -0.263,
+ "score": 0.625,
+ "pc1": 1.122,
+ "pc2": 1.1525,
+ "pc3": 0.2776,
+ "pc4": -1.5759,
+ "pc5": 1.122,
+ "pc6": -0.4395,
+ "pc7": 0.2353,
+ "pc8": 0.0253,
+ "pc9": -0.225,
+ "pc10": 0.3981,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "ddb0ec43",
"model": "haiku-4.5",
- "score": 0.41,
- "pc1": -0.6349,
- "pc2": -0.1821,
- "pc3": 0.2781,
- "pc4": -0.0343,
- "pc5": 0.16,
- "pc6": 0.1542,
- "pc7": 0.3712,
- "pc8": 0.0,
- "pc9": 0.0033,
- "pc10": 0.1807,
+ "score": 0.505,
+ "pc1": 0.0131,
+ "pc2": -0.3204,
+ "pc3": 0.2653,
+ "pc4": -0.0573,
+ "pc5": 0.064,
+ "pc6": -0.1054,
+ "pc7": 0.0632,
+ "pc8": -0.0107,
+ "pc9": 0.0252,
+ "pc10": -0.1605,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=none_strat=plan_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "d09227cd",
- "model": "haiku-4.5",
- "score": 0.325,
- "pc1": -0.4871,
- "pc2": -0.7352,
- "pc3": 0.6202,
- "pc4": 0.0518,
- "pc5": -0.0338,
- "pc6": 0.1164,
- "pc7": 0.1989,
- "pc8": 0.0,
- "pc9": -0.016,
- "pc10": 0.3337,
- "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=plan_first"
- },
- {
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=none_strat=review_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "54f12a41",
- "model": "haiku-4.5",
- "score": 0.255,
- "pc1": -0.4407,
- "pc2": -0.7646,
- "pc3": 0.6365,
- "pc4": 0.0513,
- "pc5": -0.02,
- "pc6": 0.2034,
- "pc7": 0.3904,
- "pc8": 0.0,
- "pc9": -0.0133,
- "pc10": 0.4569,
- "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=review"
- },
- {
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=none_strat=split_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "d5bdcb08",
- "model": "haiku-4.5",
- "score": 0.3,
- "pc1": -0.4688,
- "pc2": -0.7611,
- "pc3": 0.9219,
- "pc4": 0.0144,
- "pc5": -0.0973,
- "pc6": 0.0586,
- "pc7": 0.2558,
- "pc8": 0.0,
- "pc9": -0.0217,
- "pc10": 0.4145,
- "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=split_work"
- },
- {
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "d654ce03",
- "model": "haiku-4.5",
- "score": 0.3,
- "pc1": 0.4083,
- "pc2": -1.2232,
- "pc3": 0.3073,
- "pc4": 0.0554,
- "pc5": -0.0254,
- "pc6": 0.1324,
- "pc7": 0.3027,
- "pc8": 0.0,
- "pc9": -0.0043,
- "pc10": 0.3924,
- "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
- },
- {
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=svg_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "536e0111",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run5",
+ "short_id": "79675074",
"model": "haiku-4.5",
- "score": 0.325,
- "pc1": -1.5783,
- "pc2": 0.0777,
- "pc3": 0.4201,
- "pc4": 0.1858,
- "pc5": 0.7381,
- "pc6": 3.8462,
- "pc7": 4.2767,
- "pc8": 0.0,
- "pc9": -0.0132,
- "pc10": 3.2757,
+ "score": 0.5,
+ "pc1": 0.0131,
+ "pc2": -0.3204,
+ "pc3": 0.2653,
+ "pc4": -0.0573,
+ "pc5": 0.064,
+ "pc6": -0.1054,
+ "pc7": 0.0632,
+ "pc8": -0.0107,
+ "pc9": 0.0252,
+ "pc10": -0.1605,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=webgl_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "a481cf35",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run6",
+ "short_id": "c0d3fd49",
"model": "haiku-4.5",
- "score": 0.325,
- "pc1": -1.6082,
- "pc2": 0.1114,
- "pc3": 0.1134,
- "pc4": 0.2235,
- "pc5": 0.7999,
- "pc6": 3.8909,
- "pc7": 4.1825,
- "pc8": 0.0,
- "pc9": -0.0082,
- "pc10": 3.1717,
+ "score": 0.84,
+ "pc1": 0.0131,
+ "pc2": -0.3204,
+ "pc3": 0.2653,
+ "pc4": -0.0573,
+ "pc5": 0.064,
+ "pc6": -0.1054,
+ "pc7": 0.0632,
+ "pc8": -0.0107,
+ "pc9": 0.0252,
+ "pc10": -0.1605,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "79675074",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run7",
+ "short_id": "1fbd2965",
"model": "haiku-4.5",
- "score": 0.155,
- "pc1": -0.6349,
- "pc2": -0.1821,
- "pc3": 0.2781,
- "pc4": -0.0343,
- "pc5": 0.16,
- "pc6": 0.1542,
- "pc7": 0.3712,
- "pc8": 0.0,
- "pc9": 0.0033,
- "pc10": 0.1807,
+ "score": 0.85,
+ "pc1": 0.0131,
+ "pc2": -0.3204,
+ "pc3": 0.2653,
+ "pc4": -0.0573,
+ "pc5": 0.064,
+ "pc6": -0.1054,
+ "pc7": 0.0632,
+ "pc8": -0.0107,
+ "pc9": 0.0252,
+ "pc10": -0.1605,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
- "short_id": "c0d3fd49",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=none_strat=plan_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "d09227cd",
"model": "haiku-4.5",
- "score": 0.34,
- "pc1": -0.6349,
- "pc2": -0.1821,
- "pc3": 0.2781,
- "pc4": -0.0343,
- "pc5": 0.16,
- "pc6": 0.1542,
- "pc7": 0.3712,
- "pc8": 0.0,
- "pc9": 0.0033,
- "pc10": 0.1807,
- "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ "score": 0.75,
+ "pc1": 0.2253,
+ "pc2": -0.9178,
+ "pc3": 0.2389,
+ "pc4": -0.1748,
+ "pc5": -0.3549,
+ "pc6": 0.134,
+ "pc7": 0.2173,
+ "pc8": 0.0139,
+ "pc9": -0.0699,
+ "pc10": -0.0917,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=plan_first"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
- "short_id": "1fbd2965",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "d654ce03",
"model": "haiku-4.5",
- "score": 0.34,
- "pc1": -0.6349,
- "pc2": -0.1821,
- "pc3": 0.2781,
- "pc4": -0.0343,
- "pc5": 0.16,
- "pc6": 0.1542,
- "pc7": 0.3712,
- "pc8": 0.0,
- "pc9": 0.0033,
- "pc10": 0.1807,
- "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ "score": 0.8,
+ "pc1": 1.0641,
+ "pc2": -1.3285,
+ "pc3": -0.0988,
+ "pc4": -0.0227,
+ "pc5": -0.0187,
+ "pc6": -0.0466,
+ "pc7": 0.0326,
+ "pc8": -0.0233,
+ "pc9": 0.0163,
+ "pc10": -0.0435,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run5",
"short_id": "c9b0a190",
"model": "haiku-4.5",
- "score": 0.76,
- "pc1": 0.4083,
- "pc2": -1.2232,
- "pc3": 0.3073,
- "pc4": 0.0554,
- "pc5": -0.0254,
- "pc6": 0.1324,
- "pc7": 0.3027,
- "pc8": 0.0,
- "pc9": -0.0043,
- "pc10": 0.3924,
+ "score": 0.9,
+ "pc1": 1.0641,
+ "pc2": -1.3285,
+ "pc3": -0.0988,
+ "pc4": -0.0227,
+ "pc5": -0.0187,
+ "pc6": -0.0466,
+ "pc7": 0.0326,
+ "pc8": -0.0233,
+ "pc9": 0.0163,
+ "pc10": -0.0435,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run6",
"short_id": "c31b514e",
"model": "haiku-4.5",
- "score": 0.715,
- "pc1": 0.4083,
- "pc2": -1.2232,
- "pc3": 0.3073,
- "pc4": 0.0554,
- "pc5": -0.0254,
- "pc6": 0.1324,
- "pc7": 0.3027,
- "pc8": 0.0,
- "pc9": -0.0043,
- "pc10": 0.3924,
+ "score": 0.92,
+ "pc1": 1.0641,
+ "pc2": -1.3285,
+ "pc3": -0.0988,
+ "pc4": -0.0227,
+ "pc5": -0.0187,
+ "pc6": -0.0466,
+ "pc7": 0.0326,
+ "pc8": -0.0233,
+ "pc9": 0.0163,
+ "pc10": -0.0435,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run7",
"short_id": "8de1a3c2",
"model": "haiku-4.5",
- "score": 0.415,
- "pc1": 0.4083,
- "pc2": -1.2232,
- "pc3": 0.3073,
- "pc4": 0.0554,
- "pc5": -0.0254,
- "pc6": 0.1324,
- "pc7": 0.3027,
- "pc8": 0.0,
- "pc9": -0.0043,
- "pc10": 0.3924,
+ "score": 0.765,
+ "pc1": 1.0641,
+ "pc2": -1.3285,
+ "pc3": -0.0988,
+ "pc4": -0.0227,
+ "pc5": -0.0187,
+ "pc6": -0.0466,
+ "pc7": 0.0326,
+ "pc8": -0.0233,
+ "pc9": 0.0163,
+ "pc10": -0.0435,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=detailed_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=kimi25_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "5d8c8a9f",
+ "model": "kimi-k2.5",
+ "score": 0.625,
+ "pc1": -1.681,
+ "pc2": -0.1252,
+ "pc3": 3.061,
+ "pc4": -0.6772,
+ "pc5": -0.9887,
+ "pc6": 0.0006,
+ "pc7": 0.6996,
+ "pc8": -0.6345,
+ "pc9": -0.1268,
+ "pc10": -0.7318,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=kimi25_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "605e4afa",
+ "model": "kimi-k2.5",
+ "score": 0.605,
+ "pc1": -1.681,
+ "pc2": -0.1252,
+ "pc3": 3.061,
+ "pc4": -0.6772,
+ "pc5": -0.9887,
+ "pc6": 0.0006,
+ "pc7": 0.6996,
+ "pc8": -0.6345,
+ "pc9": -0.1268,
+ "pc10": -0.7318,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=kimi25_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "ed113d25",
+ "model": "kimi-k2.5",
+ "score": 0.47,
+ "pc1": -1.681,
+ "pc2": -0.1252,
+ "pc3": 3.061,
+ "pc4": -0.6772,
+ "pc5": -0.9887,
+ "pc6": 0.0006,
+ "pc7": 0.6996,
+ "pc8": -0.6345,
+ "pc9": -0.1268,
+ "pc10": -0.7318,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=mmx27_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "4a2436b3",
+ "model": "minimax-m2.7",
+ "score": 0.7,
+ "pc1": -1.6773,
+ "pc2": -0.1396,
+ "pc3": 3.1882,
+ "pc4": -0.6718,
+ "pc5": -0.5996,
+ "pc6": 0.1881,
+ "pc7": 0.3655,
+ "pc8": -0.5516,
+ "pc9": -0.4313,
+ "pc10": -0.0909,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=mmx27_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "4cb74ec4",
+ "model": "minimax-m2.7",
+ "score": 0.81,
+ "pc1": -1.6773,
+ "pc2": -0.1396,
+ "pc3": 3.1882,
+ "pc4": -0.6718,
+ "pc5": -0.5996,
+ "pc6": 0.1881,
+ "pc7": 0.3655,
+ "pc8": -0.5516,
+ "pc9": -0.4313,
+ "pc10": -0.0909,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=mmx27_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "368df7f1",
+ "model": "minimax-m2.7",
+ "score": 0.665,
+ "pc1": -1.6773,
+ "pc2": -0.1396,
+ "pc3": 3.1882,
+ "pc4": -0.6718,
+ "pc5": -0.5996,
+ "pc6": 0.1881,
+ "pc7": 0.3655,
+ "pc8": -0.5516,
+ "pc9": -0.4313,
+ "pc10": -0.0909,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=detailed_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run4",
"short_id": "9cd7d12a",
"model": "opus-4.6",
- "score": 0.305,
- "pc1": 2.2554,
- "pc2": -1.7454,
- "pc3": -0.7088,
- "pc4": -1.7411,
- "pc5": -2.796,
- "pc6": 0.0404,
- "pc7": -0.1124,
- "pc8": -0.0,
- "pc9": -0.0371,
- "pc10": 1.3606,
+ "score": 0.805,
+ "pc1": 3.0228,
+ "pc2": -1.7786,
+ "pc3": -1.2163,
+ "pc4": 2.8174,
+ "pc5": -2.1226,
+ "pc6": 0.1144,
+ "pc7": 0.3011,
+ "pc8": -0.0216,
+ "pc9": -0.2293,
+ "pc10": 0.6397,
"config_summary": "effort=high, prompt_style=detailed, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=detailed_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=detailed_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run5",
"short_id": "28abb304",
"model": "opus-4.6",
- "score": 0.205,
- "pc1": 2.2554,
- "pc2": -1.7454,
- "pc3": -0.7088,
- "pc4": -1.7411,
- "pc5": -2.796,
- "pc6": 0.0404,
- "pc7": -0.1124,
- "pc8": -0.0,
- "pc9": -0.0371,
- "pc10": 1.3606,
+ "score": 0.765,
+ "pc1": 3.0228,
+ "pc2": -1.7786,
+ "pc3": -1.2163,
+ "pc4": 2.8174,
+ "pc5": -2.1226,
+ "pc6": 0.1144,
+ "pc7": 0.3011,
+ "pc8": -0.0216,
+ "pc9": -0.2293,
+ "pc10": 0.6397,
"config_summary": "effort=high, prompt_style=detailed, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=detailed_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=detailed_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run6",
"short_id": "30bc2917",
"model": "opus-4.6",
- "score": 0.305,
- "pc1": 2.2554,
- "pc2": -1.7454,
- "pc3": -0.7088,
- "pc4": -1.7411,
- "pc5": -2.796,
- "pc6": 0.0404,
- "pc7": -0.1124,
- "pc8": -0.0,
- "pc9": -0.0371,
- "pc10": 1.3606,
+ "score": 0.815,
+ "pc1": 3.0228,
+ "pc2": -1.7786,
+ "pc3": -1.2163,
+ "pc4": 2.8174,
+ "pc5": -2.1226,
+ "pc6": 0.1144,
+ "pc7": 0.3011,
+ "pc8": -0.0216,
+ "pc9": -0.2293,
+ "pc10": 0.6397,
"config_summary": "effort=high, prompt_style=detailed, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run4",
"short_id": "b9ce8930",
"model": "opus-4.6",
- "score": 0.315,
- "pc1": 0.3865,
- "pc2": -1.7797,
- "pc3": -0.1052,
- "pc4": -0.4937,
- "pc5": 0.155,
- "pc6": 0.1272,
- "pc7": 0.1821,
- "pc8": 0.0,
- "pc9": 0.0066,
- "pc10": 0.0175,
+ "score": 0.655,
+ "pc1": 1.017,
+ "pc2": -2.0143,
+ "pc3": -0.0975,
+ "pc4": 0.5365,
+ "pc5": 0.3807,
+ "pc6": -0.0404,
+ "pc7": -0.3028,
+ "pc8": 0.125,
+ "pc9": 0.0487,
+ "pc10": -0.0525,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run5",
"short_id": "6c694ce9",
"model": "opus-4.6",
- "score": 0.405,
- "pc1": 0.3865,
- "pc2": -1.7797,
- "pc3": -0.1052,
- "pc4": -0.4937,
- "pc5": 0.155,
- "pc6": 0.1272,
- "pc7": 0.1821,
- "pc8": 0.0,
- "pc9": 0.0066,
- "pc10": 0.0175,
+ "score": 0.935,
+ "pc1": 1.017,
+ "pc2": -2.0143,
+ "pc3": -0.0975,
+ "pc4": 0.5365,
+ "pc5": 0.3807,
+ "pc6": -0.0404,
+ "pc7": -0.3028,
+ "pc8": 0.125,
+ "pc9": 0.0487,
+ "pc10": -0.0525,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run6",
"short_id": "83b4415b",
"model": "opus-4.6",
- "score": 0.895,
- "pc1": 0.3865,
- "pc2": -1.7797,
- "pc3": -0.1052,
- "pc4": -0.4937,
- "pc5": 0.155,
- "pc6": 0.1272,
- "pc7": 0.1821,
- "pc8": 0.0,
- "pc9": 0.0066,
- "pc10": 0.0175,
+ "score": 0.84,
+ "pc1": 1.017,
+ "pc2": -2.0143,
+ "pc3": -0.0975,
+ "pc4": 0.5365,
+ "pc5": 0.3807,
+ "pc6": -0.0404,
+ "pc7": -0.3028,
+ "pc8": 0.125,
+ "pc9": 0.0487,
+ "pc10": -0.0525,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=off_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=off_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run4",
"short_id": "37932d12",
"model": "opus-4.6",
- "score": 0.315,
- "pc1": 2.5625,
- "pc2": -1.4574,
- "pc3": 0.4278,
- "pc4": -0.0571,
- "pc5": 0.9724,
- "pc6": 0.2578,
- "pc7": 0.9907,
- "pc8": 0.0,
- "pc9": 0.0386,
- "pc10": -1.0584,
+ "score": 0.655,
+ "pc1": 3.1516,
+ "pc2": -1.5305,
+ "pc3": -0.062,
+ "pc4": -0.2306,
+ "pc5": 1.0081,
+ "pc6": 0.0586,
+ "pc7": -0.509,
+ "pc8": -0.3707,
+ "pc9": 0.3859,
+ "pc10": -1.8969,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=off_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=off_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run5",
"short_id": "b53d8e6f",
"model": "opus-4.6",
- "score": 0.315,
- "pc1": 2.5625,
- "pc2": -1.4574,
- "pc3": 0.4278,
- "pc4": -0.0571,
- "pc5": 0.9724,
- "pc6": 0.2578,
- "pc7": 0.9907,
- "pc8": 0.0,
- "pc9": 0.0386,
- "pc10": -1.0584,
+ "score": 0.625,
+ "pc1": 3.1516,
+ "pc2": -1.5305,
+ "pc3": -0.062,
+ "pc4": -0.2306,
+ "pc5": 1.0081,
+ "pc6": 0.0586,
+ "pc7": -0.509,
+ "pc8": -0.3707,
+ "pc9": 0.3859,
+ "pc10": -1.8969,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=off_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=off_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run6",
"short_id": "53a9f7eb",
"model": "opus-4.6",
- "score": 0.28,
- "pc1": 2.5625,
- "pc2": -1.4574,
- "pc3": 0.4278,
- "pc4": -0.0571,
- "pc5": 0.9724,
- "pc6": 0.2578,
- "pc7": 0.9907,
- "pc8": 0.0,
- "pc9": 0.0386,
- "pc10": -1.0584,
+ "score": 0.78,
+ "pc1": 3.1516,
+ "pc2": -1.5305,
+ "pc3": -0.062,
+ "pc4": -0.2306,
+ "pc5": 1.0081,
+ "pc6": 0.0586,
+ "pc7": -0.509,
+ "pc8": -0.3707,
+ "pc9": 0.3859,
+ "pc10": -1.8969,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=off_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=off_tgrep=on_tread=on_twrite=on_web=on_run4",
"short_id": "71eeae15",
"model": "opus-4.6",
- "score": 0.43,
- "pc1": 2.3859,
- "pc2": -1.7008,
- "pc3": 0.5034,
- "pc4": -1.833,
- "pc5": 2.0811,
- "pc6": 0.5336,
- "pc7": 1.4802,
- "pc8": 0.0,
- "pc9": 0.0713,
- "pc10": -1.8713,
+ "score": 0.93,
+ "pc1": 2.8973,
+ "pc2": -1.8514,
+ "pc3": 0.6646,
+ "pc4": 1.2484,
+ "pc5": 2.6528,
+ "pc6": 0.015,
+ "pc7": -0.9622,
+ "pc8": 0.3619,
+ "pc9": 0.7306,
+ "pc10": -2.4705,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=off_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=off_tgrep=on_tread=on_twrite=on_web=on_run5",
"short_id": "868a617f",
"model": "opus-4.6",
- "score": 0.28,
- "pc1": 2.3859,
- "pc2": -1.7008,
- "pc3": 0.5034,
- "pc4": -1.833,
- "pc5": 2.0811,
- "pc6": 0.5336,
- "pc7": 1.4802,
- "pc8": 0.0,
- "pc9": 0.0713,
- "pc10": -1.8713,
+ "score": 0.825,
+ "pc1": 2.8973,
+ "pc2": -1.8514,
+ "pc3": 0.6646,
+ "pc4": 1.2484,
+ "pc5": 2.6528,
+ "pc6": 0.015,
+ "pc7": -0.9622,
+ "pc8": 0.3619,
+ "pc9": 0.7306,
+ "pc10": -2.4705,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=off_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=off_tgrep=on_tread=on_twrite=on_web=on_run6",
"short_id": "8c6cb19c",
"model": "opus-4.6",
- "score": 0.805,
- "pc1": 2.3859,
- "pc2": -1.7008,
- "pc3": 0.5034,
- "pc4": -1.833,
- "pc5": 2.0811,
- "pc6": 0.5336,
- "pc7": 1.4802,
- "pc8": 0.0,
- "pc9": 0.0713,
- "pc10": -1.8713,
+ "score": 0.79,
+ "pc1": 2.8973,
+ "pc2": -1.8514,
+ "pc3": 0.6646,
+ "pc4": 1.2484,
+ "pc5": 2.6528,
+ "pc6": 0.015,
+ "pc7": -0.9622,
+ "pc8": 0.3619,
+ "pc9": 0.7306,
+ "pc10": -2.4705,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=off_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=off_tread=on_twrite=on_web=on_run4",
"short_id": "68a6572f",
"model": "opus-4.6",
- "score": 0.475,
- "pc1": 2.4961,
- "pc2": -1.5095,
- "pc3": 0.1973,
- "pc4": -0.9155,
- "pc5": 1.7501,
- "pc6": -0.2128,
- "pc7": -0.9167,
- "pc8": -0.0,
- "pc9": -0.0501,
- "pc10": 1.6459,
+ "score": 0.765,
+ "pc1": 3.1754,
+ "pc2": -1.5406,
+ "pc3": 0.147,
+ "pc4": 0.582,
+ "pc5": 2.2939,
+ "pc6": -0.1353,
+ "pc7": -1.0621,
+ "pc8": 0.4579,
+ "pc9": -0.0955,
+ "pc10": 1.7226,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=off_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=off_tread=on_twrite=on_web=on_run5",
"short_id": "00b5cb8a",
"model": "opus-4.6",
- "score": 0.365,
- "pc1": 2.4961,
- "pc2": -1.5095,
- "pc3": 0.1973,
- "pc4": -0.9155,
- "pc5": 1.7501,
- "pc6": -0.2128,
- "pc7": -0.9167,
- "pc8": -0.0,
- "pc9": -0.0501,
- "pc10": 1.6459,
+ "score": 0.915,
+ "pc1": 3.1754,
+ "pc2": -1.5406,
+ "pc3": 0.147,
+ "pc4": 0.582,
+ "pc5": 2.2939,
+ "pc6": -0.1353,
+ "pc7": -1.0621,
+ "pc8": 0.4579,
+ "pc9": -0.0955,
+ "pc10": 1.7226,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=off_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=off_tread=on_twrite=on_web=on_run6",
"short_id": "e2cb7f2b",
"model": "opus-4.6",
- "score": 0.865,
- "pc1": 2.4961,
- "pc2": -1.5095,
- "pc3": 0.1973,
- "pc4": -0.9155,
- "pc5": 1.7501,
- "pc6": -0.2128,
- "pc7": -0.9167,
- "pc8": -0.0,
- "pc9": -0.0501,
- "pc10": 1.6459,
+ "score": 0.915,
+ "pc1": 3.1754,
+ "pc2": -1.5406,
+ "pc3": 0.147,
+ "pc4": 0.582,
+ "pc5": 2.2939,
+ "pc6": -0.1353,
+ "pc7": -1.0621,
+ "pc8": 0.4579,
+ "pc9": -0.0955,
+ "pc10": 1.7226,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=off_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=off_twrite=on_web=on_run4",
"short_id": "4d465534",
"model": "opus-4.6",
- "score": 0.765,
- "pc1": 2.6222,
- "pc2": -1.4713,
- "pc3": 0.1097,
- "pc4": -1.8515,
- "pc5": -0.8641,
- "pc6": 0.2704,
- "pc7": 0.7689,
- "pc8": 0.0,
- "pc9": 0.0026,
- "pc10": 0.1406,
+ "score": 0.97,
+ "pc1": 3.1725,
+ "pc2": -1.5473,
+ "pc3": -0.1216,
+ "pc4": 2.1405,
+ "pc5": -0.0781,
+ "pc6": 0.4664,
+ "pc7": -0.401,
+ "pc8": 0.4372,
+ "pc9": 0.1505,
+ "pc10": -0.5308,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=off_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=off_twrite=on_web=on_run5",
"short_id": "330aae5e",
"model": "opus-4.6",
- "score": 0.205,
- "pc1": 2.6222,
- "pc2": -1.4713,
- "pc3": 0.1097,
- "pc4": -1.8515,
- "pc5": -0.8641,
- "pc6": 0.2704,
- "pc7": 0.7689,
- "pc8": 0.0,
- "pc9": 0.0026,
- "pc10": 0.1406,
+ "score": 0.595,
+ "pc1": 3.1725,
+ "pc2": -1.5473,
+ "pc3": -0.1216,
+ "pc4": 2.1405,
+ "pc5": -0.0781,
+ "pc6": 0.4664,
+ "pc7": -0.401,
+ "pc8": 0.4372,
+ "pc9": 0.1505,
+ "pc10": -0.5308,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=off_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=off_twrite=on_web=on_run6",
"short_id": "a59bd13b",
"model": "opus-4.6",
- "score": 0.315,
- "pc1": 2.6222,
- "pc2": -1.4713,
- "pc3": 0.1097,
- "pc4": -1.8515,
- "pc5": -0.8641,
- "pc6": 0.2704,
- "pc7": 0.7689,
- "pc8": 0.0,
- "pc9": 0.0026,
- "pc10": 0.1406,
+ "score": 0.78,
+ "pc1": 3.1725,
+ "pc2": -1.5473,
+ "pc3": -0.1216,
+ "pc4": 2.1405,
+ "pc5": -0.0781,
+ "pc6": 0.4664,
+ "pc7": -0.401,
+ "pc8": 0.4372,
+ "pc9": 0.1505,
+ "pc10": -0.5308,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=off_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=off_web=on_run4",
"short_id": "6c4adfb0",
"model": "opus-4.6",
- "score": 0.865,
- "pc1": 2.5392,
- "pc2": -1.5031,
- "pc3": 0.2909,
- "pc4": 0.725,
- "pc5": 1.4683,
- "pc6": -0.0411,
- "pc7": -0.3248,
- "pc8": -0.0,
- "pc9": 0.0082,
- "pc10": -0.2145,
+ "score": 0.955,
+ "pc1": 3.1769,
+ "pc2": -1.5494,
+ "pc3": -0.4492,
+ "pc4": -0.9475,
+ "pc5": 1.356,
+ "pc6": -0.3156,
+ "pc7": -0.1612,
+ "pc8": 0.1483,
+ "pc9": -0.2104,
+ "pc10": 0.6231,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=off_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=off_web=on_run5",
"short_id": "e5199e69",
"model": "opus-4.6",
- "score": 0.91,
- "pc1": 2.5392,
- "pc2": -1.5031,
- "pc3": 0.2909,
- "pc4": 0.725,
- "pc5": 1.4683,
- "pc6": -0.0411,
- "pc7": -0.3248,
- "pc8": -0.0,
- "pc9": 0.0082,
- "pc10": -0.2145,
+ "score": 0.945,
+ "pc1": 3.1769,
+ "pc2": -1.5494,
+ "pc3": -0.4492,
+ "pc4": -0.9475,
+ "pc5": 1.356,
+ "pc6": -0.3156,
+ "pc7": -0.1612,
+ "pc8": 0.1483,
+ "pc9": -0.2104,
+ "pc10": 0.6231,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=off_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=off_web=on_run6",
"short_id": "c049fcf5",
"model": "opus-4.6",
- "score": 0.245,
- "pc1": 2.5392,
- "pc2": -1.5031,
- "pc3": 0.2909,
- "pc4": 0.725,
- "pc5": 1.4683,
- "pc6": -0.0411,
- "pc7": -0.3248,
- "pc8": -0.0,
- "pc9": 0.0082,
- "pc10": -0.2145,
+ "score": 0.55,
+ "pc1": 3.1769,
+ "pc2": -1.5494,
+ "pc3": -0.4492,
+ "pc4": -0.9475,
+ "pc5": 1.356,
+ "pc6": -0.3156,
+ "pc7": -0.1612,
+ "pc8": 0.1483,
+ "pc9": -0.2104,
+ "pc10": 0.6231,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=off_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=off_run4",
"short_id": "feb7d705",
"model": "opus-4.6",
- "score": 0.315,
- "pc1": 2.4525,
- "pc2": -1.2071,
- "pc3": -0.4554,
- "pc4": -0.7727,
- "pc5": -1.5139,
- "pc6": 0.0229,
- "pc7": -0.0209,
- "pc8": -0.0,
- "pc9": 0.0006,
- "pc10": 0.0135,
+ "score": 0.64,
+ "pc1": 3.108,
+ "pc2": -1.2069,
+ "pc3": -0.79,
+ "pc4": 1.596,
+ "pc5": -1.1095,
+ "pc6": -0.0991,
+ "pc7": 0.1436,
+ "pc8": -0.2935,
+ "pc9": -0.126,
+ "pc10": 0.465,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=off_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=off_run5",
"short_id": "3c9d94f5",
"model": "opus-4.6",
- "score": 0.315,
- "pc1": 2.4525,
- "pc2": -1.2071,
- "pc3": -0.4554,
- "pc4": -0.7727,
- "pc5": -1.5139,
- "pc6": 0.0229,
- "pc7": -0.0209,
- "pc8": -0.0,
- "pc9": 0.0006,
- "pc10": 0.0135,
+ "score": 0.95,
+ "pc1": 3.108,
+ "pc2": -1.2069,
+ "pc3": -0.79,
+ "pc4": 1.596,
+ "pc5": -1.1095,
+ "pc6": -0.0991,
+ "pc7": 0.1436,
+ "pc8": -0.2935,
+ "pc9": -0.126,
+ "pc10": 0.465,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=off_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=off_run6",
"short_id": "1a10ac67",
"model": "opus-4.6",
- "score": 0.475,
- "pc1": 2.4525,
- "pc2": -1.2071,
- "pc3": -0.4554,
- "pc4": -0.7727,
- "pc5": -1.5139,
- "pc6": 0.0229,
- "pc7": -0.0209,
- "pc8": -0.0,
- "pc9": 0.0006,
- "pc10": 0.0135,
+ "score": 0.92,
+ "pc1": 3.108,
+ "pc2": -1.2069,
+ "pc3": -0.79,
+ "pc4": 1.596,
+ "pc5": -1.1095,
+ "pc6": -0.0991,
+ "pc7": 0.1436,
+ "pc8": -0.2935,
+ "pc9": -0.126,
+ "pc10": 0.465,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run4",
"short_id": "67153cc8",
"model": "opus-4.6",
- "score": 0.315,
- "pc1": 1.4297,
- "pc2": -2.8208,
- "pc3": -0.076,
- "pc4": -0.404,
- "pc5": -0.0305,
- "pc6": 0.1055,
- "pc7": 0.1136,
- "pc8": 0.0,
- "pc9": -0.001,
- "pc10": 0.2292,
+ "score": 0.625,
+ "pc1": 2.068,
+ "pc2": -3.0223,
+ "pc3": -0.4615,
+ "pc4": 0.5711,
+ "pc5": 0.298,
+ "pc6": 0.0184,
+ "pc7": -0.3333,
+ "pc8": 0.1123,
+ "pc9": 0.0397,
+ "pc10": 0.0645,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run5",
"short_id": "cde3d475",
"model": "opus-4.6",
- "score": 0.385,
- "pc1": 1.4297,
- "pc2": -2.8208,
- "pc3": -0.076,
- "pc4": -0.404,
- "pc5": -0.0305,
- "pc6": 0.1055,
- "pc7": 0.1136,
- "pc8": 0.0,
- "pc9": -0.001,
- "pc10": 0.2292,
+ "score": 0.835,
+ "pc1": 2.068,
+ "pc2": -3.0223,
+ "pc3": -0.4615,
+ "pc4": 0.5711,
+ "pc5": 0.298,
+ "pc6": 0.0184,
+ "pc7": -0.3333,
+ "pc8": 0.1123,
+ "pc9": 0.0397,
+ "pc10": 0.0645,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run6",
"short_id": "b7e96026",
"model": "opus-4.6",
- "score": 0.88,
- "pc1": 1.4297,
- "pc2": -2.8208,
- "pc3": -0.076,
- "pc4": -0.404,
- "pc5": -0.0305,
- "pc6": 0.1055,
- "pc7": 0.1136,
- "pc8": 0.0,
- "pc9": -0.001,
- "pc10": 0.2292,
+ "score": 0.78,
+ "pc1": 2.068,
+ "pc2": -3.0223,
+ "pc3": -0.4615,
+ "pc4": 0.5711,
+ "pc5": 0.298,
+ "pc6": 0.0184,
+ "pc7": -0.3333,
+ "pc8": 0.1123,
+ "pc9": 0.0397,
+ "pc10": 0.0645,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=off_prompt=simple_prov=anth_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "835cad49",
"model": "opus-4.6",
- "score": 0.385,
- "pc1": -0.742,
- "pc2": -0.8032,
- "pc3": -0.0005,
- "pc4": -0.2735,
- "pc5": 0.1195,
- "pc6": 0.0763,
- "pc7": 0.1277,
- "pc8": 0.0,
- "pc9": 0.0014,
- "pc10": 0.0558,
+ "score": 0.835,
+ "pc1": -0.1611,
+ "pc2": -1.0576,
+ "pc3": 0.1947,
+ "pc4": 0.2496,
+ "pc5": 0.1412,
+ "pc6": -0.0406,
+ "pc7": -0.1356,
+ "pc8": 0.0512,
+ "pc9": -0.0349,
+ "pc10": -0.0692,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=off_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=off_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run4",
"short_id": "886f5323",
"model": "opus-4.6",
- "score": 0.49,
- "pc1": 0.3012,
- "pc2": -1.8443,
- "pc3": 0.0286,
- "pc4": -0.1838,
- "pc5": -0.066,
- "pc6": 0.0545,
- "pc7": 0.0592,
- "pc8": 0.0,
- "pc9": -0.0062,
- "pc10": 0.2675,
+ "score": 0.935,
+ "pc1": 0.89,
+ "pc2": -2.0657,
+ "pc3": -0.1693,
+ "pc4": 0.2841,
+ "pc5": 0.0585,
+ "pc6": 0.0183,
+ "pc7": -0.1662,
+ "pc8": 0.0385,
+ "pc9": -0.0438,
+ "pc10": 0.0478,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=off_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=off_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run5",
"short_id": "d6549fa2",
"model": "opus-4.6",
- "score": 0.825,
- "pc1": 0.3012,
- "pc2": -1.8443,
- "pc3": 0.0286,
- "pc4": -0.1838,
- "pc5": -0.066,
- "pc6": 0.0545,
- "pc7": 0.0592,
- "pc8": 0.0,
- "pc9": -0.0062,
- "pc10": 0.2675,
+ "score": 0.795,
+ "pc1": 0.89,
+ "pc2": -2.0657,
+ "pc3": -0.1693,
+ "pc4": 0.2841,
+ "pc5": 0.0585,
+ "pc6": 0.0183,
+ "pc7": -0.1662,
+ "pc8": 0.0385,
+ "pc9": -0.0438,
+ "pc10": 0.0478,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=off_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=off_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run6",
"short_id": "6ccb77f1",
"model": "opus-4.6",
- "score": 0.46,
- "pc1": 0.3012,
- "pc2": -1.8443,
- "pc3": 0.0286,
- "pc4": -0.1838,
- "pc5": -0.066,
- "pc6": 0.0545,
- "pc7": 0.0592,
- "pc8": 0.0,
- "pc9": -0.0062,
- "pc10": 0.2675,
+ "score": 0.835,
+ "pc1": 0.89,
+ "pc2": -2.0657,
+ "pc3": -0.1693,
+ "pc4": 0.2841,
+ "pc5": 0.0585,
+ "pc6": 0.0183,
+ "pc7": -0.1662,
+ "pc8": 0.0385,
+ "pc9": -0.0438,
+ "pc10": 0.0478,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=qwen36p_pw=avail_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "2940c4cb",
"model": "qwen-3.6-plus",
- "score": 0.305,
- "pc1": -1.3753,
- "pc2": -0.6531,
- "pc3": 2.2639,
- "pc4": -0.437,
- "pc5": -0.3596,
- "pc6": -0.4872,
- "pc7": -0.3791,
- "pc8": -0.0,
- "pc9": -0.033,
- "pc10": -0.162,
+ "score": 0.9,
+ "pc1": -0.4412,
+ "pc2": -1.0587,
+ "pc3": 2.9701,
+ "pc4": -0.5762,
+ "pc5": -0.9328,
+ "pc6": 0.4663,
+ "pc7": 0.0109,
+ "pc8": -0.1872,
+ "pc9": 0.1343,
+ "pc10": 0.0852,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=qwen36p_pw=inst_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "e797a7a2",
"model": "qwen-3.6-plus",
- "score": 0.37,
- "pc1": -2.3222,
- "pc2": -0.1443,
- "pc3": 2.3225,
- "pc4": -0.359,
- "pc5": -0.3674,
- "pc6": -0.6112,
- "pc7": -0.6271,
- "pc8": 0.0,
- "pc9": -0.0415,
- "pc10": -0.3252,
+ "score": 0.905,
+ "pc1": -1.2895,
+ "pc2": -0.6521,
+ "pc3": 3.5077,
+ "pc4": -0.9108,
+ "pc5": -1.1426,
+ "pc6": 0.3436,
+ "pc7": 0.4384,
+ "pc8": -0.0154,
+ "pc9": -0.1542,
+ "pc10": -0.0231,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=qwen36p_pw=off_prompt=detailed_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "2860212a",
- "model": "qwen-3.6-plus",
- "score": 0.325,
- "pc1": -1.6782,
- "pc2": 1.3987,
- "pc3": 1.7358,
- "pc4": -1.554,
- "pc5": -3.1606,
- "pc6": -0.6032,
- "pc7": -0.6596,
- "pc8": -0.0,
- "pc9": -0.0742,
- "pc10": 1.0076,
- "config_summary": "effort=high, prompt_style=detailed, language=typescript, max_budget=low"
- },
- {
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=qwen36p_pw=off_prompt=simple_prov=or_rndr=none_strat=cv_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "438b74fe",
"model": "qwen-3.6-plus",
- "score": 0.355,
- "pc1": -2.376,
- "pc2": -0.2093,
- "pc3": 2.368,
- "pc4": -0.0667,
- "pc5": -0.5608,
- "pc6": -0.8281,
- "pc7": -0.7552,
- "pc8": -0.0,
- "pc9": -0.0576,
- "pc10": 0.0229,
+ "score": 0.5,
+ "pc1": -1.3883,
+ "pc2": -0.6889,
+ "pc3": 3.3048,
+ "pc4": -1.1014,
+ "pc5": -1.6588,
+ "pc6": 0.5601,
+ "pc7": 0.3218,
+ "pc8": -0.3807,
+ "pc9": 0.0678,
+ "pc10": -0.2727,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=creative_validate"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=qwen36p_pw=off_prompt=simple_prov=or_rndr=none_strat=delegate_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "6873ee5b",
- "model": "qwen-3.6-plus",
- "score": 0.41,
- "pc1": -2.3378,
- "pc2": -0.2556,
- "pc3": 3.0124,
- "pc4": -0.1682,
- "pc5": -0.6524,
- "pc6": -0.6337,
- "pc7": -0.549,
- "pc8": -0.0,
- "pc9": -0.0631,
- "pc10": 0.1101,
- "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=delegate"
- },
- {
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=qwen36p_pw=off_prompt=simple_prov=or_rndr=none_strat=iterate_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "69976c08",
"model": "qwen-3.6-plus",
- "score": 0.37,
- "pc1": -2.3679,
- "pc2": -0.2161,
- "pc3": 2.5104,
- "pc4": -0.0976,
- "pc5": -0.5638,
- "pc6": -0.6605,
- "pc7": -0.6765,
- "pc8": -0.0,
- "pc9": -0.0563,
- "pc10": 0.0086,
+ "score": 0.5,
+ "pc1": -1.4054,
+ "pc2": -0.6769,
+ "pc3": 3.404,
+ "pc4": -0.9046,
+ "pc5": -1.5422,
+ "pc6": 0.2232,
+ "pc7": 0.5294,
+ "pc8": -0.4965,
+ "pc9": -0.3035,
+ "pc10": -0.0267,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=iterate"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=qwen36p_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=off_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "29796092",
"model": "qwen-3.6-plus",
- "score": 0.33,
- "pc1": -1.3711,
- "pc2": 1.6867,
- "pc3": 2.8724,
- "pc4": 0.1301,
- "pc5": 0.6078,
- "pc6": -0.3858,
- "pc7": 0.4435,
- "pc8": 0.0,
- "pc9": 0.0014,
- "pc10": -1.4114,
+ "score": 0.49,
+ "pc1": -0.5357,
+ "pc2": 1.3897,
+ "pc3": 3.6618,
+ "pc4": -1.6648,
+ "pc5": -0.4623,
+ "pc6": 0.5064,
+ "pc7": 0.0023,
+ "pc8": -0.744,
+ "pc9": 0.3969,
+ "pc10": -1.8929,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=qwen36p_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=off_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "70ec796c",
"model": "qwen-3.6-plus",
- "score": 0.325,
- "pc1": -1.5477,
- "pc2": 1.4433,
- "pc3": 2.948,
- "pc4": -1.6459,
- "pc5": 1.7165,
- "pc6": -0.11,
- "pc7": 0.933,
- "pc8": 0.0,
- "pc9": 0.0342,
- "pc10": -2.2242,
- "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
- },
- {
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=qwen36p_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=off_tread=on_twrite=on_web=on_run1",
- "short_id": "e0a7d71a",
- "model": "qwen-3.6-plus",
- "score": 0.325,
- "pc1": -1.4375,
- "pc2": 1.6346,
- "pc3": 2.6418,
- "pc4": -0.7284,
- "pc5": 1.3855,
- "pc6": -0.8564,
- "pc7": -1.4639,
- "pc8": -0.0,
- "pc9": -0.0872,
- "pc10": 1.293,
+ "score": 0.665,
+ "pc1": -0.79,
+ "pc2": 1.0688,
+ "pc3": 4.3884,
+ "pc4": -0.1858,
+ "pc5": 1.1825,
+ "pc6": 0.4628,
+ "pc7": -0.4509,
+ "pc8": -0.0115,
+ "pc9": 0.7416,
+ "pc10": -2.4665,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=qwen36p_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=off_twrite=on_web=on_run1",
"short_id": "45e1ddec",
"model": "qwen-3.6-plus",
- "score": 0.33,
- "pc1": -1.3114,
- "pc2": 1.6728,
- "pc3": 2.5543,
- "pc4": -1.6644,
- "pc5": -1.2287,
- "pc6": -0.3732,
- "pc7": 0.2217,
- "pc8": 0.0,
- "pc9": -0.0346,
- "pc10": -0.2123,
- "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
- },
- {
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=qwen36p_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=off_web=on_run1",
- "short_id": "179ad7a0",
- "model": "qwen-3.6-plus",
- "score": 0.3,
- "pc1": -1.3944,
- "pc2": 1.641,
- "pc3": 2.7355,
- "pc4": 0.9121,
- "pc5": 1.1037,
- "pc6": -0.6847,
- "pc7": -0.872,
- "pc8": -0.0,
- "pc9": -0.0289,
- "pc10": -0.5675,
+ "score": 0.855,
+ "pc1": -0.5148,
+ "pc2": 1.3729,
+ "pc3": 3.6022,
+ "pc4": 0.7063,
+ "pc5": -1.5484,
+ "pc6": 0.9142,
+ "pc7": 0.1103,
+ "pc8": 0.0638,
+ "pc9": 0.1615,
+ "pc10": -0.5268,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=qwen36p_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=off_run1",
"short_id": "b5af3c93",
"model": "qwen-3.6-plus",
- "score": 0.77,
- "pc1": -1.4811,
- "pc2": 1.9371,
- "pc3": 1.9891,
- "pc4": -0.5856,
- "pc5": -1.8785,
- "pc6": -0.6207,
- "pc7": -0.5681,
- "pc8": -0.0,
- "pc9": -0.0365,
- "pc10": -0.3395,
+ "score": 0.715,
+ "pc1": -0.5793,
+ "pc2": 1.7134,
+ "pc3": 2.9338,
+ "pc4": 0.1618,
+ "pc5": -2.5799,
+ "pc6": 0.3486,
+ "pc7": 0.6549,
+ "pc8": -0.6669,
+ "pc9": -0.115,
+ "pc10": 0.469,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=qwen36p_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "3146a5e9",
"model": "qwen-3.6-plus",
- "score": 0.385,
- "pc1": -2.5039,
- "pc2": 0.3234,
- "pc3": 2.3685,
- "pc4": -0.2169,
- "pc5": -0.3951,
- "pc6": -0.5381,
- "pc7": -0.4336,
- "pc8": -0.0,
- "pc9": -0.0382,
- "pc10": -0.1237,
+ "score": 0.665,
+ "pc1": -1.6192,
+ "pc2": -0.1021,
+ "pc3": 3.2623,
+ "pc4": -0.8631,
+ "pc5": -1.1724,
+ "pc6": 0.4662,
+ "pc7": 0.178,
+ "pc8": -0.261,
+ "pc9": 0.0507,
+ "pc10": 0.0685,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=qwen36p_pw=off_prompt=simple_prov=or_rndr=none_strat=plan_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "78a1905c",
"model": "qwen-3.6-plus",
- "score": 0.37,
- "pc1": -2.3561,
- "pc2": -0.2298,
- "pc3": 2.7106,
- "pc4": -0.1308,
- "pc5": -0.5889,
- "pc6": -0.5759,
- "pc7": -0.6059,
- "pc8": -0.0,
- "pc9": -0.0575,
- "pc10": 0.0292,
+ "score": 0.835,
+ "pc1": -1.4071,
+ "pc2": -0.6995,
+ "pc3": 3.236,
+ "pc4": -0.9806,
+ "pc5": -1.5913,
+ "pc6": 0.7056,
+ "pc7": 0.3321,
+ "pc8": -0.2365,
+ "pc9": -0.0444,
+ "pc10": 0.1374,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=plan_first"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=qwen36p_pw=off_prompt=simple_prov=or_rndr=none_strat=split_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "01aed128",
"model": "qwen-3.6-plus",
- "score": 0.255,
- "pc1": -2.3378,
- "pc2": -0.2556,
- "pc3": 3.0124,
- "pc4": -0.1682,
- "pc5": -0.6524,
- "pc6": -0.6337,
- "pc7": -0.549,
- "pc8": 0.0,
- "pc9": -0.0631,
- "pc10": 0.1101,
+ "score": 0.5,
+ "pc1": -1.4487,
+ "pc2": -0.6591,
+ "pc3": 3.2373,
+ "pc4": -0.9777,
+ "pc5": -1.4148,
+ "pc6": 0.6852,
+ "pc7": 0.197,
+ "pc8": -0.2228,
+ "pc9": -0.2421,
+ "pc10": 0.0657,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=split_work"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=qwen36p_pw=off_prompt=simple_prov=or_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "0a9479c0",
"model": "qwen-3.6-plus",
- "score": 0.385,
- "pc1": -1.4607,
- "pc2": -0.7177,
- "pc3": 2.3977,
- "pc4": -0.1272,
- "pc5": -0.5805,
- "pc6": -0.5599,
- "pc7": -0.5021,
- "pc8": -0.0,
- "pc9": -0.0458,
- "pc10": 0.0879,
+ "score": 0.93,
+ "pc1": -0.5682,
+ "pc2": -1.1101,
+ "pc3": 2.8983,
+ "pc4": -0.8286,
+ "pc5": -1.2551,
+ "pc6": 0.525,
+ "pc7": 0.1475,
+ "pc8": -0.2737,
+ "pc9": 0.0418,
+ "pc10": 0.1855,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=detailed_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=detailed_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run4",
"short_id": "de9c4cc0",
"model": "sonnet-4.6",
- "score": 0.155,
- "pc1": 2.2459,
- "pc2": -1.7396,
- "pc3": -0.7066,
- "pc4": -1.7408,
- "pc5": -2.7938,
- "pc6": 0.0421,
- "pc7": -0.1088,
- "pc8": -0.0,
- "pc9": -0.0371,
- "pc10": 1.3619,
+ "score": 0.605,
+ "pc1": 3.0149,
+ "pc2": -1.7705,
+ "pc3": -1.2124,
+ "pc4": 2.8375,
+ "pc5": -2.1601,
+ "pc6": 0.1782,
+ "pc7": 0.3822,
+ "pc8": -0.1585,
+ "pc9": -0.0835,
+ "pc10": 0.6852,
"config_summary": "effort=high, prompt_style=detailed, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=detailed_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=detailed_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run5",
"short_id": "536bc021",
"model": "sonnet-4.6",
- "score": 0.18,
- "pc1": 2.2459,
- "pc2": -1.7396,
- "pc3": -0.7066,
- "pc4": -1.7408,
- "pc5": -2.7938,
- "pc6": 0.0421,
- "pc7": -0.1088,
- "pc8": -0.0,
- "pc9": -0.0371,
- "pc10": 1.3619,
+ "score": 0.675,
+ "pc1": 3.0149,
+ "pc2": -1.7705,
+ "pc3": -1.2124,
+ "pc4": 2.8375,
+ "pc5": -2.1601,
+ "pc6": 0.1782,
+ "pc7": 0.3822,
+ "pc8": -0.1585,
+ "pc9": -0.0835,
+ "pc10": 0.6852,
"config_summary": "effort=high, prompt_style=detailed, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=detailed_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=detailed_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run6",
"short_id": "92665abf",
"model": "sonnet-4.6",
- "score": 0.715,
- "pc1": 2.2459,
- "pc2": -1.7396,
- "pc3": -0.7066,
- "pc4": -1.7408,
- "pc5": -2.7938,
- "pc6": 0.0421,
- "pc7": -0.1088,
- "pc8": -0.0,
- "pc9": -0.0371,
- "pc10": 1.3619,
+ "score": 0.86,
+ "pc1": 3.0149,
+ "pc2": -1.7705,
+ "pc3": -1.2124,
+ "pc4": 2.8375,
+ "pc5": -2.1601,
+ "pc6": 0.1782,
+ "pc7": 0.3822,
+ "pc8": -0.1585,
+ "pc9": -0.0835,
+ "pc10": 0.6852,
"config_summary": "effort=high, prompt_style=detailed, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run4",
"short_id": "d2c1efc6",
"model": "sonnet-4.6",
- "score": 0.305,
- "pc1": 0.377,
- "pc2": -1.7738,
- "pc3": -0.103,
- "pc4": -0.4934,
- "pc5": 0.1571,
- "pc6": 0.1289,
- "pc7": 0.1858,
- "pc8": 0.0,
- "pc9": 0.0066,
- "pc10": 0.0188,
+ "score": 0.975,
+ "pc1": 1.009,
+ "pc2": -2.0061,
+ "pc3": -0.0936,
+ "pc4": 0.5566,
+ "pc5": 0.3431,
+ "pc6": 0.0234,
+ "pc7": -0.2217,
+ "pc8": -0.012,
+ "pc9": 0.1944,
+ "pc10": -0.007,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run5",
"short_id": "b9741b31",
"model": "sonnet-4.6",
- "score": 0.315,
- "pc1": 0.377,
- "pc2": -1.7738,
- "pc3": -0.103,
- "pc4": -0.4934,
- "pc5": 0.1571,
- "pc6": 0.1289,
- "pc7": 0.1858,
- "pc8": 0.0,
- "pc9": 0.0066,
- "pc10": 0.0188,
+ "score": 0.685,
+ "pc1": 1.009,
+ "pc2": -2.0061,
+ "pc3": -0.0936,
+ "pc4": 0.5566,
+ "pc5": 0.3431,
+ "pc6": 0.0234,
+ "pc7": -0.2217,
+ "pc8": -0.012,
+ "pc9": 0.1944,
+ "pc10": -0.007,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run6",
"short_id": "b683745c",
"model": "sonnet-4.6",
- "score": 0.425,
- "pc1": 0.377,
- "pc2": -1.7738,
- "pc3": -0.103,
- "pc4": -0.4934,
- "pc5": 0.1571,
- "pc6": 0.1289,
- "pc7": 0.1858,
- "pc8": 0.0,
- "pc9": 0.0066,
- "pc10": 0.0188,
+ "score": 0.87,
+ "pc1": 1.009,
+ "pc2": -2.0061,
+ "pc3": -0.0936,
+ "pc4": 0.5566,
+ "pc5": 0.3431,
+ "pc6": 0.0234,
+ "pc7": -0.2217,
+ "pc8": -0.012,
+ "pc9": 0.1944,
+ "pc10": -0.007,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=off_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=off_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run4",
"short_id": "c13f247e",
"model": "sonnet-4.6",
- "score": 0.49,
- "pc1": 2.553,
- "pc2": -1.4515,
- "pc3": 0.43,
- "pc4": -0.0568,
- "pc5": 0.9745,
- "pc6": 0.2595,
- "pc7": 0.9944,
- "pc8": 0.0,
- "pc9": 0.0386,
- "pc10": -1.0571,
+ "score": 0.97,
+ "pc1": 3.1436,
+ "pc2": -1.5224,
+ "pc3": -0.0581,
+ "pc4": -0.2105,
+ "pc5": 0.9705,
+ "pc6": 0.1225,
+ "pc7": -0.4279,
+ "pc8": -0.5076,
+ "pc9": 0.5317,
+ "pc10": -1.8514,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=off_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=off_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run5",
"short_id": "0f0815e0",
"model": "sonnet-4.6",
- "score": 0.475,
- "pc1": 2.553,
- "pc2": -1.4515,
- "pc3": 0.43,
- "pc4": -0.0568,
- "pc5": 0.9745,
- "pc6": 0.2595,
- "pc7": 0.9944,
- "pc8": 0.0,
- "pc9": 0.0386,
- "pc10": -1.0571,
+ "score": 0.945,
+ "pc1": 3.1436,
+ "pc2": -1.5224,
+ "pc3": -0.0581,
+ "pc4": -0.2105,
+ "pc5": 0.9705,
+ "pc6": 0.1225,
+ "pc7": -0.4279,
+ "pc8": -0.5076,
+ "pc9": 0.5317,
+ "pc10": -1.8514,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=off_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=off_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run6",
"short_id": "f967cca3",
"model": "sonnet-4.6",
- "score": 0.385,
- "pc1": 2.553,
- "pc2": -1.4515,
- "pc3": 0.43,
- "pc4": -0.0568,
- "pc5": 0.9745,
- "pc6": 0.2595,
- "pc7": 0.9944,
- "pc8": 0.0,
- "pc9": 0.0386,
- "pc10": -1.0571,
+ "score": 0.835,
+ "pc1": 3.1436,
+ "pc2": -1.5224,
+ "pc3": -0.0581,
+ "pc4": -0.2105,
+ "pc5": 0.9705,
+ "pc6": 0.1225,
+ "pc7": -0.4279,
+ "pc8": -0.5076,
+ "pc9": 0.5317,
+ "pc10": -1.8514,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=off_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=off_tgrep=on_tread=on_twrite=on_web=on_run4",
"short_id": "9378b63f",
"model": "sonnet-4.6",
- "score": 0.76,
- "pc1": 2.3764,
- "pc2": -1.695,
- "pc3": 0.5056,
- "pc4": -1.8327,
- "pc5": 2.0833,
- "pc6": 0.5353,
- "pc7": 1.4839,
- "pc8": 0.0,
- "pc9": 0.0713,
- "pc10": -1.87,
+ "score": 0.975,
+ "pc1": 2.8894,
+ "pc2": -1.8433,
+ "pc3": 0.6685,
+ "pc4": 1.2685,
+ "pc5": 2.6153,
+ "pc6": 0.0789,
+ "pc7": -0.8811,
+ "pc8": 0.2249,
+ "pc9": 0.8764,
+ "pc10": -2.425,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=off_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=off_tgrep=on_tread=on_twrite=on_web=on_run5",
"short_id": "63d07a83",
"model": "sonnet-4.6",
- "score": 0.75,
- "pc1": 2.3764,
- "pc2": -1.695,
- "pc3": 0.5056,
- "pc4": -1.8327,
- "pc5": 2.0833,
- "pc6": 0.5353,
- "pc7": 1.4839,
- "pc8": 0.0,
- "pc9": 0.0713,
- "pc10": -1.87,
+ "score": 0.955,
+ "pc1": 2.8894,
+ "pc2": -1.8433,
+ "pc3": 0.6685,
+ "pc4": 1.2685,
+ "pc5": 2.6153,
+ "pc6": 0.0789,
+ "pc7": -0.8811,
+ "pc8": 0.2249,
+ "pc9": 0.8764,
+ "pc10": -2.425,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=off_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=off_tgrep=on_tread=on_twrite=on_web=on_run6",
"short_id": "89f5d666",
"model": "sonnet-4.6",
- "score": 0.255,
- "pc1": 2.3764,
- "pc2": -1.695,
- "pc3": 0.5056,
- "pc4": -1.8327,
- "pc5": 2.0833,
- "pc6": 0.5353,
- "pc7": 1.4839,
- "pc8": 0.0,
- "pc9": 0.0713,
- "pc10": -1.87,
+ "score": 0.795,
+ "pc1": 2.8894,
+ "pc2": -1.8433,
+ "pc3": 0.6685,
+ "pc4": 1.2685,
+ "pc5": 2.6153,
+ "pc6": 0.0789,
+ "pc7": -0.8811,
+ "pc8": 0.2249,
+ "pc9": 0.8764,
+ "pc10": -2.425,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=off_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=off_tread=on_twrite=on_web=on_run4",
"short_id": "222c497a",
"model": "sonnet-4.6",
- "score": 0.44,
- "pc1": 2.4866,
- "pc2": -1.5036,
- "pc3": 0.1995,
- "pc4": -0.9152,
- "pc5": 1.7523,
- "pc6": -0.2111,
- "pc7": -0.913,
- "pc8": -0.0,
- "pc9": -0.0501,
- "pc10": 1.6472,
+ "score": 0.975,
+ "pc1": 3.1674,
+ "pc2": -1.5325,
+ "pc3": 0.1509,
+ "pc4": 0.6021,
+ "pc5": 2.2563,
+ "pc6": -0.0715,
+ "pc7": -0.9809,
+ "pc8": 0.3209,
+ "pc9": 0.0503,
+ "pc10": 1.7681,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=off_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=off_tread=on_twrite=on_web=on_run5",
"short_id": "a0b46dce",
"model": "sonnet-4.6",
- "score": 0.72,
- "pc1": 2.4866,
- "pc2": -1.5036,
- "pc3": 0.1995,
- "pc4": -0.9152,
- "pc5": 1.7523,
- "pc6": -0.2111,
- "pc7": -0.913,
- "pc8": -0.0,
- "pc9": -0.0501,
- "pc10": 1.6472,
+ "score": 0.93,
+ "pc1": 3.1674,
+ "pc2": -1.5325,
+ "pc3": 0.1509,
+ "pc4": 0.6021,
+ "pc5": 2.2563,
+ "pc6": -0.0715,
+ "pc7": -0.9809,
+ "pc8": 0.3209,
+ "pc9": 0.0503,
+ "pc10": 1.7681,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=off_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=off_tread=on_twrite=on_web=on_run6",
"short_id": "9d5d71af",
"model": "sonnet-4.6",
- "score": 0.41,
- "pc1": 2.4866,
- "pc2": -1.5036,
- "pc3": 0.1995,
- "pc4": -0.9152,
- "pc5": 1.7523,
- "pc6": -0.2111,
- "pc7": -0.913,
- "pc8": -0.0,
- "pc9": -0.0501,
- "pc10": 1.6472,
+ "score": 0.7,
+ "pc1": 3.1674,
+ "pc2": -1.5325,
+ "pc3": 0.1509,
+ "pc4": 0.6021,
+ "pc5": 2.2563,
+ "pc6": -0.0715,
+ "pc7": -0.9809,
+ "pc8": 0.3209,
+ "pc9": 0.0503,
+ "pc10": 1.7681,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=off_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=off_twrite=on_web=on_run4",
"short_id": "3bbc243e",
"model": "sonnet-4.6",
- "score": 0.365,
- "pc1": 2.6127,
- "pc2": -1.4655,
- "pc3": 0.1119,
- "pc4": -1.8513,
- "pc5": -0.8619,
- "pc6": 0.2721,
- "pc7": 0.7725,
- "pc8": 0.0,
- "pc9": 0.0026,
- "pc10": 0.1419,
+ "score": 0.835,
+ "pc1": 3.1645,
+ "pc2": -1.5392,
+ "pc3": -0.1177,
+ "pc4": 2.1606,
+ "pc5": -0.1156,
+ "pc6": 0.5303,
+ "pc7": -0.3199,
+ "pc8": 0.3002,
+ "pc9": 0.2963,
+ "pc10": -0.4853,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=off_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=off_twrite=on_web=on_run5",
"short_id": "ada76b96",
"model": "sonnet-4.6",
- "score": 0.28,
- "pc1": 2.6127,
- "pc2": -1.4655,
- "pc3": 0.1119,
- "pc4": -1.8513,
- "pc5": -0.8619,
- "pc6": 0.2721,
- "pc7": 0.7725,
- "pc8": 0.0,
- "pc9": 0.0026,
- "pc10": 0.1419,
+ "score": 0.835,
+ "pc1": 3.1645,
+ "pc2": -1.5392,
+ "pc3": -0.1177,
+ "pc4": 2.1606,
+ "pc5": -0.1156,
+ "pc6": 0.5303,
+ "pc7": -0.3199,
+ "pc8": 0.3002,
+ "pc9": 0.2963,
+ "pc10": -0.4853,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=off_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=off_twrite=on_web=on_run6",
"short_id": "3ca73775",
"model": "sonnet-4.6",
- "score": 0.495,
- "pc1": 2.6127,
- "pc2": -1.4655,
- "pc3": 0.1119,
- "pc4": -1.8513,
- "pc5": -0.8619,
- "pc6": 0.2721,
- "pc7": 0.7725,
- "pc8": 0.0,
- "pc9": 0.0026,
- "pc10": 0.1419,
+ "score": 0.835,
+ "pc1": 3.1645,
+ "pc2": -1.5392,
+ "pc3": -0.1177,
+ "pc4": 2.1606,
+ "pc5": -0.1156,
+ "pc6": 0.5303,
+ "pc7": -0.3199,
+ "pc8": 0.3002,
+ "pc9": 0.2963,
+ "pc10": -0.4853,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=off_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=off_web=on_run4",
"short_id": "225f2763",
"model": "sonnet-4.6",
- "score": 0.33,
- "pc1": 2.5297,
- "pc2": -1.4972,
- "pc3": 0.2932,
- "pc4": 0.7252,
- "pc5": 1.4704,
- "pc6": -0.0393,
- "pc7": -0.3212,
- "pc8": -0.0,
- "pc9": 0.0082,
- "pc10": -0.2132,
+ "score": 1.0,
+ "pc1": 3.169,
+ "pc2": -1.5413,
+ "pc3": -0.4453,
+ "pc4": -0.9274,
+ "pc5": 1.3185,
+ "pc6": -0.2518,
+ "pc7": -0.0801,
+ "pc8": 0.0113,
+ "pc9": -0.0647,
+ "pc10": 0.6686,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=off_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=off_web=on_run5",
"short_id": "0bee082b",
"model": "sonnet-4.6",
- "score": 0.34,
- "pc1": 2.5297,
- "pc2": -1.4972,
- "pc3": 0.2932,
- "pc4": 0.7252,
- "pc5": 1.4704,
- "pc6": -0.0393,
- "pc7": -0.3212,
- "pc8": -0.0,
- "pc9": 0.0082,
- "pc10": -0.2132,
+ "score": 0.61,
+ "pc1": 3.169,
+ "pc2": -1.5413,
+ "pc3": -0.4453,
+ "pc4": -0.9274,
+ "pc5": 1.3185,
+ "pc6": -0.2518,
+ "pc7": -0.0801,
+ "pc8": 0.0113,
+ "pc9": -0.0647,
+ "pc10": 0.6686,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=off_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=off_web=on_run6",
"short_id": "81d1772b",
"model": "sonnet-4.6",
- "score": 0.28,
- "pc1": 2.5297,
- "pc2": -1.4972,
- "pc3": 0.2932,
- "pc4": 0.7252,
- "pc5": 1.4704,
- "pc6": -0.0393,
- "pc7": -0.3212,
- "pc8": -0.0,
- "pc9": 0.0082,
- "pc10": -0.2132,
+ "score": 0.895,
+ "pc1": 3.169,
+ "pc2": -1.5413,
+ "pc3": -0.4453,
+ "pc4": -0.9274,
+ "pc5": 1.3185,
+ "pc6": -0.2518,
+ "pc7": -0.0801,
+ "pc8": 0.0113,
+ "pc9": -0.0647,
+ "pc10": 0.6686,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=off_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=off_run4",
"short_id": "f91e3319",
"model": "sonnet-4.6",
- "score": 0.28,
- "pc1": 2.443,
- "pc2": -1.2012,
- "pc3": -0.4532,
- "pc4": -0.7724,
- "pc5": -1.5118,
- "pc6": 0.0246,
- "pc7": -0.0173,
- "pc8": -0.0,
- "pc9": 0.0006,
- "pc10": 0.0148,
+ "score": 0.61,
+ "pc1": 3.1001,
+ "pc2": -1.1988,
+ "pc3": -0.7861,
+ "pc4": 1.6161,
+ "pc5": -1.1471,
+ "pc6": -0.0352,
+ "pc7": 0.2247,
+ "pc8": -0.4305,
+ "pc9": 0.0198,
+ "pc10": 0.5105,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=off_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=off_run5",
"short_id": "6a1b6728",
"model": "sonnet-4.6",
- "score": 0.325,
- "pc1": 2.443,
- "pc2": -1.2012,
- "pc3": -0.4532,
- "pc4": -0.7724,
- "pc5": -1.5118,
- "pc6": 0.0246,
- "pc7": -0.0173,
- "pc8": -0.0,
- "pc9": 0.0006,
- "pc10": 0.0148,
+ "score": 0.61,
+ "pc1": 3.1001,
+ "pc2": -1.1988,
+ "pc3": -0.7861,
+ "pc4": 1.6161,
+ "pc5": -1.1471,
+ "pc6": -0.0352,
+ "pc7": 0.2247,
+ "pc8": -0.4305,
+ "pc9": 0.0198,
+ "pc10": 0.5105,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=off_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=off_run6",
"short_id": "5a0dcfdc",
"model": "sonnet-4.6",
- "score": 0.28,
- "pc1": 2.443,
- "pc2": -1.2012,
- "pc3": -0.4532,
- "pc4": -0.7724,
- "pc5": -1.5118,
- "pc6": 0.0246,
- "pc7": -0.0173,
- "pc8": -0.0,
- "pc9": 0.0006,
- "pc10": 0.0148,
+ "score": 0.835,
+ "pc1": 3.1001,
+ "pc2": -1.1988,
+ "pc3": -0.7861,
+ "pc4": 1.6161,
+ "pc5": -1.1471,
+ "pc6": -0.0352,
+ "pc7": 0.2247,
+ "pc8": -0.4305,
+ "pc9": 0.0198,
+ "pc10": 0.5105,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run4",
"short_id": "f333a385",
"model": "sonnet-4.6",
- "score": 0.155,
- "pc1": 1.4202,
- "pc2": -2.8149,
- "pc3": -0.0738,
- "pc4": -0.4037,
- "pc5": -0.0283,
- "pc6": 0.1072,
- "pc7": 0.1172,
- "pc8": -0.0,
- "pc9": -0.001,
- "pc10": 0.2305,
+ "score": 0.61,
+ "pc1": 2.0601,
+ "pc2": -3.0142,
+ "pc3": -0.4576,
+ "pc4": 0.5912,
+ "pc5": 0.2604,
+ "pc6": 0.0823,
+ "pc7": -0.2522,
+ "pc8": -0.0246,
+ "pc9": 0.1855,
+ "pc10": 0.11,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run5",
"short_id": "edfd3f04",
"model": "sonnet-4.6",
- "score": 0.33,
- "pc1": 1.4202,
- "pc2": -2.8149,
- "pc3": -0.0738,
- "pc4": -0.4037,
- "pc5": -0.0283,
- "pc6": 0.1072,
- "pc7": 0.1172,
- "pc8": -0.0,
- "pc9": -0.001,
- "pc10": 0.2305,
+ "score": 0.915,
+ "pc1": 2.0601,
+ "pc2": -3.0142,
+ "pc3": -0.4576,
+ "pc4": 0.5912,
+ "pc5": 0.2604,
+ "pc6": 0.0823,
+ "pc7": -0.2522,
+ "pc8": -0.0246,
+ "pc9": 0.1855,
+ "pc10": 0.11,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run6",
"short_id": "dec59666",
"model": "sonnet-4.6",
- "score": 0.41,
- "pc1": 1.4202,
- "pc2": -2.8149,
- "pc3": -0.0738,
- "pc4": -0.4037,
- "pc5": -0.0283,
- "pc6": 0.1072,
- "pc7": 0.1172,
- "pc8": -0.0,
- "pc9": -0.001,
- "pc10": 0.2305,
+ "score": 0.835,
+ "pc1": 2.0601,
+ "pc2": -3.0142,
+ "pc3": -0.4576,
+ "pc4": 0.5912,
+ "pc5": 0.2604,
+ "pc6": 0.0823,
+ "pc7": -0.2522,
+ "pc8": -0.0246,
+ "pc9": 0.1855,
+ "pc10": 0.11,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=off_prompt=simple_prov=anth_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "9f634fd1",
"model": "sonnet-4.6",
- "score": 0.225,
- "pc1": -0.7515,
- "pc2": -0.7974,
- "pc3": 0.0017,
- "pc4": -0.2733,
- "pc5": 0.1216,
- "pc6": 0.078,
- "pc7": 0.1313,
- "pc8": 0.0,
- "pc9": 0.0014,
- "pc10": 0.0571,
+ "score": 0.95,
+ "pc1": -0.169,
+ "pc2": -1.0495,
+ "pc3": 0.1986,
+ "pc4": 0.2697,
+ "pc5": 0.1036,
+ "pc6": 0.0233,
+ "pc7": -0.0545,
+ "pc8": -0.0858,
+ "pc9": 0.1109,
+ "pc10": -0.0237,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=off_prompt=simple_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=off_prompt=simple_prov=anth_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
"short_id": "81d56cf5",
"model": "sonnet-4.6",
- "score": 0.42,
- "pc1": -0.7515,
- "pc2": -0.7974,
- "pc3": 0.0017,
- "pc4": -0.2733,
- "pc5": 0.1216,
- "pc6": 0.078,
- "pc7": 0.1313,
- "pc8": 0.0,
- "pc9": 0.0014,
- "pc10": 0.0571,
+ "score": 0.835,
+ "pc1": -0.169,
+ "pc2": -1.0495,
+ "pc3": 0.1986,
+ "pc4": 0.2697,
+ "pc5": 0.1036,
+ "pc6": 0.0233,
+ "pc7": -0.0545,
+ "pc8": -0.0858,
+ "pc9": 0.1109,
+ "pc10": -0.0237,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=off_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=off_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run4",
"short_id": "6a78fb22",
"model": "sonnet-4.6",
- "score": 0.8,
- "pc1": 0.2917,
- "pc2": -1.8385,
- "pc3": 0.0308,
- "pc4": -0.1836,
- "pc5": -0.0638,
- "pc6": 0.0562,
- "pc7": 0.0628,
- "pc8": -0.0,
- "pc9": -0.0062,
- "pc10": 0.2688,
+ "score": 0.955,
+ "pc1": 0.882,
+ "pc2": -2.0576,
+ "pc3": -0.1654,
+ "pc4": 0.3042,
+ "pc5": 0.0209,
+ "pc6": 0.0821,
+ "pc7": -0.0851,
+ "pc8": -0.0985,
+ "pc9": 0.102,
+ "pc10": 0.0933,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=off_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=off_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run5",
"short_id": "4b3f7365",
"model": "sonnet-4.6",
- "score": 0.315,
- "pc1": 0.2917,
- "pc2": -1.8385,
- "pc3": 0.0308,
- "pc4": -0.1836,
- "pc5": -0.0638,
- "pc6": 0.0562,
- "pc7": 0.0628,
- "pc8": -0.0,
- "pc9": -0.0062,
- "pc10": 0.2688,
+ "score": 0.835,
+ "pc1": 0.882,
+ "pc2": -2.0576,
+ "pc3": -0.1654,
+ "pc4": 0.3042,
+ "pc5": 0.0209,
+ "pc6": 0.0821,
+ "pc7": -0.0851,
+ "pc8": -0.0985,
+ "pc9": 0.102,
+ "pc10": 0.0933,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=off_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=off_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run6",
"short_id": "fa4f71b7",
"model": "sonnet-4.6",
- "score": 0.355,
- "pc1": 0.2917,
- "pc2": -1.8385,
- "pc3": 0.0308,
- "pc4": -0.1836,
- "pc5": -0.0638,
- "pc6": 0.0562,
- "pc7": 0.0628,
- "pc8": -0.0,
- "pc9": -0.0062,
- "pc10": 0.2688,
+ "score": 0.835,
+ "pc1": 0.882,
+ "pc2": -2.0576,
+ "pc3": -0.1654,
+ "pc4": 0.3042,
+ "pc5": 0.0209,
+ "pc6": 0.0821,
+ "pc7": -0.0851,
+ "pc8": -0.0985,
+ "pc9": 0.102,
+ "pc10": 0.0933,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=uns_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "3108fdb3",
"model": "gemma-4-26b",
- "score": 0.355,
- "pc1": -2.8733,
- "pc2": -0.3899,
- "pc3": 1.1262,
- "pc4": -0.7272,
- "pc5": 0.3524,
- "pc6": -2.7715,
- "pc7": 0.9962,
- "pc8": -0.0,
- "pc9": -0.0435,
- "pc10": -0.0044,
+ "score": 0.485,
+ "pc1": -1.6761,
+ "pc2": -1.0086,
+ "pc3": 4.2268,
+ "pc4": -0.1793,
+ "pc5": -0.7101,
+ "pc6": -1.8131,
+ "pc7": 2.1606,
+ "pc8": 1.479,
+ "pc9": -0.4707,
+ "pc10": 0.214,
+ "config_summary": "effort=high, prompt_style=simple, language=unspecified, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=uns_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "b8454ec4",
+ "model": "gemma-4-26b",
+ "score": 0.485,
+ "pc1": -1.6761,
+ "pc2": -1.0086,
+ "pc3": 4.2268,
+ "pc4": -0.1793,
+ "pc5": -0.7101,
+ "pc6": -1.8131,
+ "pc7": 2.1606,
+ "pc8": 1.479,
+ "pc9": -0.4707,
+ "pc10": 0.214,
"config_summary": "effort=high, prompt_style=simple, language=unspecified, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=uns_lint=on_budget=low_model=glm45air_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "ba5e058a",
"model": "glm-4.5-air",
- "score": 0.355,
- "pc1": -2.9102,
- "pc2": -0.0489,
- "pc3": -2.4494,
- "pc4": -0.3072,
- "pc5": 0.8526,
- "pc6": -2.5349,
- "pc7": 0.7746,
- "pc8": 0.0,
- "pc9": 0.0233,
- "pc10": -0.7449,
+ "score": 0.81,
+ "pc1": -2.1545,
+ "pc2": -0.6455,
+ "pc3": 0.5852,
+ "pc4": 0.416,
+ "pc5": -0.2651,
+ "pc6": -2.4473,
+ "pc7": 0.8947,
+ "pc8": 2.0459,
+ "pc9": -0.2336,
+ "pc10": 0.3892,
"config_summary": "effort=high, prompt_style=simple, language=unspecified, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=uns_lint=on_budget=low_model=glm45air_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
"short_id": "961a7131",
"model": "glm-4.5-air",
- "score": 0.38,
- "pc1": -2.9102,
- "pc2": -0.0489,
- "pc3": -2.4494,
- "pc4": -0.3072,
- "pc5": 0.8526,
- "pc6": -2.5349,
- "pc7": 0.7746,
- "pc8": 0.0,
- "pc9": 0.0233,
- "pc10": -0.7449,
+ "score": 0.45,
+ "pc1": -2.1545,
+ "pc2": -0.6455,
+ "pc3": 0.5852,
+ "pc4": 0.416,
+ "pc5": -0.2651,
+ "pc6": -2.4473,
+ "pc7": 0.8947,
+ "pc8": 2.0459,
+ "pc9": -0.2336,
+ "pc10": 0.3892,
"config_summary": "effort=high, prompt_style=simple, language=unspecified, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=uns_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "299b6c41",
"model": "glm-4.7",
- "score": 0.38,
- "pc1": -2.8351,
- "pc2": -0.0231,
- "pc3": -2.7944,
- "pc4": -0.2469,
- "pc5": 0.8604,
- "pc6": -3.2871,
- "pc7": 0.373,
- "pc8": -0.0,
- "pc9": -0.0008,
- "pc10": -0.5532,
+ "score": 0.9,
+ "pc1": -2.1725,
+ "pc2": -0.5981,
+ "pc3": 0.5239,
+ "pc4": 0.5118,
+ "pc5": 0.1102,
+ "pc6": -2.3068,
+ "pc7": 1.841,
+ "pc8": 1.5763,
+ "pc9": -0.2015,
+ "pc10": 0.3508,
"config_summary": "effort=high, prompt_style=simple, language=unspecified, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=uns_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
"short_id": "0693e74d",
"model": "glm-4.7",
- "score": 0.38,
- "pc1": -2.8351,
- "pc2": -0.0231,
- "pc3": -2.7944,
- "pc4": -0.2469,
- "pc5": 0.8604,
- "pc6": -3.2871,
- "pc7": 0.373,
- "pc8": -0.0,
- "pc9": -0.0008,
- "pc10": -0.5532,
+ "score": 0.87,
+ "pc1": -2.1725,
+ "pc2": -0.5981,
+ "pc3": 0.5239,
+ "pc4": 0.5118,
+ "pc5": 0.1102,
+ "pc6": -2.3068,
+ "pc7": 1.841,
+ "pc8": 1.5763,
+ "pc9": -0.2015,
+ "pc10": 0.3508,
"config_summary": "effort=high, prompt_style=simple, language=unspecified, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=uns_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
"short_id": "255de2c3",
"model": "glm-4.7",
- "score": 0.38,
- "pc1": -2.8351,
- "pc2": -0.0231,
- "pc3": -2.7944,
- "pc4": -0.2469,
- "pc5": 0.8604,
- "pc6": -3.2871,
- "pc7": 0.373,
- "pc8": -0.0,
- "pc9": -0.0008,
- "pc10": -0.5532,
+ "score": 0.895,
+ "pc1": -2.1725,
+ "pc2": -0.5981,
+ "pc3": 0.5239,
+ "pc4": 0.5118,
+ "pc5": 0.1102,
+ "pc6": -2.3068,
+ "pc7": 1.841,
+ "pc8": 1.5763,
+ "pc9": -0.2015,
+ "pc10": 0.3508,
"config_summary": "effort=high, prompt_style=simple, language=unspecified, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=uns_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "a1c761c9",
"model": "glm-5.1",
- "score": 0.38,
- "pc1": -2.8604,
- "pc2": 0.0568,
- "pc3": -2.8156,
- "pc4": -0.3165,
- "pc5": 0.9958,
- "pc6": -2.4701,
- "pc7": 0.5713,
- "pc8": -0.0,
- "pc9": 0.0142,
- "pc10": -0.7518,
+ "score": 0.785,
+ "pc1": -2.305,
+ "pc2": -0.5987,
+ "pc3": 0.2794,
+ "pc4": 0.5367,
+ "pc5": 0.1088,
+ "pc6": -1.7966,
+ "pc7": 1.2981,
+ "pc8": 2.0829,
+ "pc9": -0.1628,
+ "pc10": 0.398,
"config_summary": "effort=high, prompt_style=simple, language=unspecified, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=uns_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
"short_id": "c2541fee",
"model": "glm-5.1",
- "score": 0.38,
- "pc1": -2.8604,
- "pc2": 0.0568,
- "pc3": -2.8156,
- "pc4": -0.3165,
- "pc5": 0.9958,
- "pc6": -2.4701,
- "pc7": 0.5713,
- "pc8": -0.0,
- "pc9": 0.0142,
- "pc10": -0.7518,
+ "score": 0.785,
+ "pc1": -2.305,
+ "pc2": -0.5987,
+ "pc3": 0.2794,
+ "pc4": 0.5367,
+ "pc5": 0.1088,
+ "pc6": -1.7966,
+ "pc7": 1.2981,
+ "pc8": 2.0829,
+ "pc9": -0.1628,
+ "pc10": 0.398,
"config_summary": "effort=high, prompt_style=simple, language=unspecified, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=uns_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
"short_id": "d61bbd6f",
"model": "glm-5.1",
- "score": 0.305,
- "pc1": -2.8604,
- "pc2": 0.0568,
- "pc3": -2.8156,
- "pc4": -0.3165,
- "pc5": 0.9958,
- "pc6": -2.4701,
- "pc7": 0.5713,
- "pc8": -0.0,
- "pc9": 0.0142,
- "pc10": -0.7518,
+ "score": 0.785,
+ "pc1": -2.305,
+ "pc2": -0.5987,
+ "pc3": 0.2794,
+ "pc4": 0.5367,
+ "pc5": 0.1088,
+ "pc6": -1.7966,
+ "pc7": 1.2981,
+ "pc8": 2.0829,
+ "pc9": -0.1628,
+ "pc10": 0.398,
"config_summary": "effort=high, prompt_style=simple, language=unspecified, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=uns_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=uns_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
"short_id": "7a348b81",
"model": "haiku-4.5",
- "score": 0.485,
- "pc1": 1.2055,
- "pc2": -2.9113,
- "pc3": -1.0158,
- "pc4": -0.6987,
- "pc5": 0.6832,
- "pc6": -2.5555,
- "pc7": 1.2337,
- "pc8": 0.0,
- "pc9": -0.0003,
- "pc10": -0.0013,
+ "score": 0.785,
+ "pc1": 2.1504,
+ "pc2": -3.2569,
+ "pc3": 0.4962,
+ "pc4": 0.7601,
+ "pc5": 0.2191,
+ "pc6": -2.0371,
+ "pc7": 1.2676,
+ "pc8": 1.9207,
+ "pc9": -0.0303,
+ "pc10": 0.4239,
"config_summary": "effort=high, prompt_style=simple, language=unspecified, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=uns_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=uns_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run4",
"short_id": "8fe72fce",
"model": "haiku-4.5",
- "score": 0.515,
- "pc1": 1.2055,
- "pc2": -2.9113,
- "pc3": -1.0158,
- "pc4": -0.6987,
- "pc5": 0.6832,
- "pc6": -2.5555,
- "pc7": 1.2337,
- "pc8": 0.0,
- "pc9": -0.0003,
- "pc10": -0.0013,
+ "score": 0.95,
+ "pc1": 2.1504,
+ "pc2": -3.2569,
+ "pc3": 0.4962,
+ "pc4": 0.7601,
+ "pc5": 0.2191,
+ "pc6": -2.0371,
+ "pc7": 1.2676,
+ "pc8": 1.9207,
+ "pc9": -0.0303,
+ "pc10": 0.4239,
"config_summary": "effort=high, prompt_style=simple, language=unspecified, max_budget=low, strategy=use_subagents"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=uns_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "7f20d924",
"model": "haiku-4.5",
- "score": 0.205,
- "pc1": -0.9662,
- "pc2": -0.8938,
- "pc3": -0.9403,
- "pc4": -0.5683,
- "pc5": 0.8332,
- "pc6": -2.5847,
- "pc7": 1.2477,
- "pc8": 0.0,
- "pc9": 0.0022,
- "pc10": -0.1747,
+ "score": 0.715,
+ "pc1": -0.0787,
+ "pc2": -1.2922,
+ "pc3": 1.1524,
+ "pc4": 0.4386,
+ "pc5": 0.0623,
+ "pc6": -2.0961,
+ "pc7": 1.4654,
+ "pc8": 1.8595,
+ "pc9": -0.1049,
+ "pc10": 0.2902,
"config_summary": "effort=high, prompt_style=simple, language=unspecified, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=uns_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=uns_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run4",
"short_id": "8932f117",
"model": "opus-4.6",
- "score": 0.47,
- "pc1": 1.0984,
- "pc2": -3.5325,
- "pc3": -1.2944,
- "pc4": -0.938,
- "pc5": 0.6427,
- "pc6": -2.6334,
- "pc7": 0.9901,
- "pc8": 0.0,
- "pc9": -0.0021,
- "pc10": -0.1262,
+ "score": 0.785,
+ "pc1": 1.9762,
+ "pc2": -3.9941,
+ "pc3": 0.4256,
+ "pc4": 1.067,
+ "pc5": 0.2963,
+ "pc6": -1.9722,
+ "pc7": 1.0688,
+ "pc8": 1.9825,
+ "pc9": -0.0904,
+ "pc10": 0.5152,
"config_summary": "effort=high, prompt_style=simple, language=unspecified, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=uns_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=uns_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run5",
"short_id": "52f8ab88",
"model": "opus-4.6",
- "score": 0.5,
- "pc1": 1.0984,
- "pc2": -3.5325,
- "pc3": -1.2944,
- "pc4": -0.938,
- "pc5": 0.6427,
- "pc6": -2.6334,
- "pc7": 0.9901,
- "pc8": 0.0,
- "pc9": -0.0021,
- "pc10": -0.1262,
+ "score": 0.945,
+ "pc1": 1.9762,
+ "pc2": -3.9941,
+ "pc3": 0.4256,
+ "pc4": 1.067,
+ "pc5": 0.2963,
+ "pc6": -1.9722,
+ "pc7": 1.0688,
+ "pc8": 1.9825,
+ "pc9": -0.0904,
+ "pc10": 0.5152,
"config_summary": "effort=high, prompt_style=simple, language=unspecified, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=uns_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=uns_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run6",
"short_id": "d6187c89",
"model": "opus-4.6",
- "score": 0.5,
- "pc1": 1.0984,
- "pc2": -3.5325,
- "pc3": -1.2944,
- "pc4": -0.938,
- "pc5": 0.6427,
- "pc6": -2.6334,
- "pc7": 0.9901,
- "pc8": 0.0,
- "pc9": -0.0021,
- "pc10": -0.1262,
+ "score": 0.945,
+ "pc1": 1.9762,
+ "pc2": -3.9941,
+ "pc3": 0.4256,
+ "pc4": 1.067,
+ "pc5": 0.2963,
+ "pc6": -1.9722,
+ "pc7": 1.0688,
+ "pc8": 1.9825,
+ "pc9": -0.0904,
+ "pc10": 0.5152,
"config_summary": "effort=high, prompt_style=simple, language=unspecified, max_budget=low, strategy=use_subagents"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=uns_lint=on_budget=low_model=qwen36p_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "1e83d6cf",
"model": "qwen-3.6-plus",
- "score": 0.38,
- "pc1": -2.8352,
- "pc2": -0.3884,
- "pc3": 1.1502,
- "pc4": -0.7509,
- "pc5": 0.2781,
- "pc6": -3.277,
- "pc7": 0.4429,
- "pc8": -0.0,
- "pc9": -0.0393,
- "pc10": -0.4791,
+ "score": 0.925,
+ "pc1": -1.711,
+ "pc2": -1.0738,
+ "pc3": 4.1494,
+ "pc4": -0.3672,
+ "pc5": -1.1741,
+ "pc6": -1.5245,
+ "pc7": 1.5802,
+ "pc8": 1.6092,
+ "pc9": -0.0794,
+ "pc10": 0.5192,
"config_summary": "effort=high, prompt_style=simple, language=unspecified, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=uns_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=uns_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run4",
"short_id": "a1f49ced",
"model": "sonnet-4.6",
- "score": 0.485,
- "pc1": 1.0889,
- "pc2": -3.5266,
- "pc3": -1.2922,
- "pc4": -0.9378,
- "pc5": 0.6448,
- "pc6": -2.6317,
- "pc7": 0.9937,
- "pc8": -0.0,
- "pc9": -0.0021,
- "pc10": -0.1248,
+ "score": 0.975,
+ "pc1": 1.9683,
+ "pc2": -3.986,
+ "pc3": 0.4295,
+ "pc4": 1.0871,
+ "pc5": 0.2587,
+ "pc6": -1.9083,
+ "pc7": 1.15,
+ "pc8": 1.8455,
+ "pc9": 0.0554,
+ "pc10": 0.5607,
"config_summary": "effort=high, prompt_style=simple, language=unspecified, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=uns_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=uns_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run5",
"short_id": "414139b2",
"model": "sonnet-4.6",
- "score": 0.5,
- "pc1": 1.0889,
- "pc2": -3.5266,
- "pc3": -1.2922,
- "pc4": -0.9378,
- "pc5": 0.6448,
- "pc6": -2.6317,
- "pc7": 0.9937,
- "pc8": -0.0,
- "pc9": -0.0021,
- "pc10": -0.1248,
+ "score": 0.785,
+ "pc1": 1.9683,
+ "pc2": -3.986,
+ "pc3": 0.4295,
+ "pc4": 1.0871,
+ "pc5": 0.2587,
+ "pc6": -1.9083,
+ "pc7": 1.15,
+ "pc8": 1.8455,
+ "pc9": 0.0554,
+ "pc10": 0.5607,
"config_summary": "effort=high, prompt_style=simple, language=unspecified, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=uns_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=uns_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run6",
"short_id": "ad21bf3b",
"model": "sonnet-4.6",
- "score": 0.365,
- "pc1": 1.0889,
- "pc2": -3.5266,
- "pc3": -1.2922,
- "pc4": -0.9378,
- "pc5": 0.6448,
- "pc6": -2.6317,
- "pc7": 0.9937,
- "pc8": -0.0,
- "pc9": -0.0021,
- "pc10": -0.1248,
+ "score": 0.785,
+ "pc1": 1.9683,
+ "pc2": -3.986,
+ "pc3": 0.4295,
+ "pc4": 1.0871,
+ "pc5": 0.2587,
+ "pc6": -1.9083,
+ "pc7": 1.15,
+ "pc8": 1.8455,
+ "pc9": 0.0554,
+ "pc10": 0.5607,
"config_summary": "effort=high, prompt_style=simple, language=unspecified, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "211866f9",
- "model": "gemma-4-26b",
- "score": 0.325,
- "pc1": -1.7429,
- "pc2": 1.1632,
- "pc3": 2.0512,
- "pc4": 0.9412,
- "pc5": -2.6408,
- "pc6": 0.2311,
- "pc7": 1.3727,
- "pc8": 0.0,
- "pc9": 0.0347,
- "pc10": -2.0578,
- "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
- },
- {
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=low_model=glm45air_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "179f583c",
"model": "glm-4.5-air",
- "score": 0.33,
- "pc1": -1.7798,
- "pc2": 1.5042,
- "pc3": -1.5244,
- "pc4": 1.3612,
- "pc5": -2.1405,
- "pc6": 0.4677,
- "pc7": 1.1511,
- "pc8": 0.0,
- "pc9": 0.1016,
- "pc10": -2.7983,
+ "score": 0.645,
+ "pc1": -1.0732,
+ "pc2": 1.2996,
+ "pc3": -1.2443,
+ "pc4": -0.6112,
+ "pc5": -2.7968,
+ "pc6": -0.252,
+ "pc7": -0.2152,
+ "pc8": -0.1438,
+ "pc9": 0.176,
+ "pc10": -2.6791,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=low_model=glm45air_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
"short_id": "ea686a12",
"model": "glm-4.5-air",
- "score": 0.155,
- "pc1": -1.7798,
- "pc2": 1.5042,
- "pc3": -1.5244,
- "pc4": 1.3612,
- "pc5": -2.1405,
- "pc6": 0.4677,
- "pc7": 1.1511,
- "pc8": 0.0,
- "pc9": 0.1016,
- "pc10": -2.7983,
+ "score": 0.825,
+ "pc1": -1.0732,
+ "pc2": 1.2996,
+ "pc3": -1.2443,
+ "pc4": -0.6112,
+ "pc5": -2.7968,
+ "pc6": -0.252,
+ "pc7": -0.2152,
+ "pc8": -0.1438,
+ "pc9": 0.176,
+ "pc10": -2.6791,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=low_model=glm45air_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
"short_id": "fa02f9f7",
"model": "glm-4.5-air",
- "score": 0.18,
- "pc1": -1.7798,
- "pc2": 1.5042,
- "pc3": -1.5244,
- "pc4": 1.3612,
- "pc5": -2.1405,
- "pc6": 0.4677,
- "pc7": 1.1511,
- "pc8": 0.0,
- "pc9": 0.1016,
- "pc10": -2.7983,
+ "score": 0.825,
+ "pc1": -1.0732,
+ "pc2": 1.2996,
+ "pc3": -1.2443,
+ "pc4": -0.6112,
+ "pc5": -2.7968,
+ "pc6": -0.252,
+ "pc7": -0.2152,
+ "pc8": -0.1438,
+ "pc9": 0.176,
+ "pc10": -2.6791,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "586b5641",
+ "model": "glm-4.7",
+ "score": 0.69,
+ "pc1": -1.0912,
+ "pc2": 1.347,
+ "pc3": -1.3056,
+ "pc4": -0.5155,
+ "pc5": -2.4215,
+ "pc6": -0.1114,
+ "pc7": 0.7311,
+ "pc8": -0.6135,
+ "pc9": 0.2081,
+ "pc10": -2.7175,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
"short_id": "7c1248e2",
"model": "glm-4.7",
- "score": 0.315,
- "pc1": -1.7046,
- "pc2": 1.53,
- "pc3": -1.8694,
- "pc4": 1.4215,
- "pc5": -2.1327,
- "pc6": -0.2845,
- "pc7": 0.7495,
- "pc8": 0.0,
- "pc9": 0.0775,
- "pc10": -2.6066,
+ "score": 0.715,
+ "pc1": -1.0912,
+ "pc2": 1.347,
+ "pc3": -1.3056,
+ "pc4": -0.5155,
+ "pc5": -2.4215,
+ "pc6": -0.1114,
+ "pc7": 0.7311,
+ "pc8": -0.6135,
+ "pc9": 0.2081,
+ "pc10": -2.7175,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
"short_id": "c924670c",
"model": "glm-4.7",
- "score": 0.305,
- "pc1": -1.7046,
- "pc2": 1.53,
- "pc3": -1.8694,
- "pc4": 1.4215,
- "pc5": -2.1327,
- "pc6": -0.2845,
- "pc7": 0.7495,
- "pc8": 0.0,
- "pc9": 0.0775,
- "pc10": -2.6066,
+ "score": 0.61,
+ "pc1": -1.0912,
+ "pc2": 1.347,
+ "pc3": -1.3056,
+ "pc4": -0.5155,
+ "pc5": -2.4215,
+ "pc6": -0.1114,
+ "pc7": 0.7311,
+ "pc8": -0.6135,
+ "pc9": 0.2081,
+ "pc10": -2.7175,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "187c67ef",
"model": "glm-5.1",
- "score": 0.255,
- "pc1": -1.7299,
- "pc2": 1.6099,
- "pc3": -1.8906,
- "pc4": 1.3519,
- "pc5": -1.9974,
- "pc6": 0.5325,
- "pc7": 0.9478,
- "pc8": 0.0,
- "pc9": 0.0925,
- "pc10": -2.8052,
+ "score": 0.835,
+ "pc1": -1.2238,
+ "pc2": 1.3464,
+ "pc3": -1.5501,
+ "pc4": -0.4905,
+ "pc5": -2.423,
+ "pc6": 0.3988,
+ "pc7": 0.1881,
+ "pc8": -0.1068,
+ "pc9": 0.2468,
+ "pc10": -2.6703,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
"short_id": "5ca32e79",
"model": "glm-5.1",
- "score": 0.155,
- "pc1": -1.7299,
- "pc2": 1.6099,
- "pc3": -1.8906,
- "pc4": 1.3519,
- "pc5": -1.9974,
- "pc6": 0.5325,
- "pc7": 0.9478,
- "pc8": 0.0,
- "pc9": 0.0925,
- "pc10": -2.8052,
+ "score": 0.605,
+ "pc1": -1.2238,
+ "pc2": 1.3464,
+ "pc3": -1.5501,
+ "pc4": -0.4905,
+ "pc5": -2.423,
+ "pc6": 0.3988,
+ "pc7": 0.1881,
+ "pc8": -0.1068,
+ "pc9": 0.2468,
+ "pc10": -2.6703,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
"short_id": "9d78ce6d",
"model": "glm-5.1",
- "score": 0.37,
- "pc1": -1.7299,
- "pc2": 1.6099,
- "pc3": -1.8906,
- "pc4": 1.3519,
- "pc5": -1.9974,
- "pc6": 0.5325,
- "pc7": 0.9478,
- "pc8": 0.0,
- "pc9": 0.0925,
- "pc10": -2.8052,
+ "score": 0.785,
+ "pc1": -1.2238,
+ "pc2": 1.3464,
+ "pc3": -1.5501,
+ "pc4": -0.4905,
+ "pc5": -2.423,
+ "pc6": 0.3988,
+ "pc7": 0.1881,
+ "pc8": -0.1068,
+ "pc9": 0.2468,
+ "pc10": -2.6703,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=detailed_rndr=none_strat=none_tst=none_tedit=off_tglob=off_tgrep=on_tread=off_twrite=on_web=off_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=detailed_prov=anth_rndr=none_strat=none_tst=none_tedit=off_tglob=off_tgrep=on_tread=off_twrite=on_web=off_run4",
"short_id": "0feabf41",
"model": "haiku-4.5",
- "score": 0.47,
- "pc1": 6.4226,
- "pc2": 6.2047,
- "pc3": 0.137,
- "pc4": -3.3555,
- "pc5": -4.0926,
- "pc6": 1.0665,
- "pc7": 4.2171,
- "pc8": 0.0,
- "pc9": 0.1668,
- "pc10": -4.8274,
+ "score": 0.76,
+ "pc1": 7.1926,
+ "pc2": 6.8932,
+ "pc3": -0.1871,
+ "pc4": 4.4146,
+ "pc5": -3.3692,
+ "pc6": 0.5626,
+ "pc7": 0.4273,
+ "pc8": -0.7047,
+ "pc9": 1.1014,
+ "pc10": -6.8775,
"config_summary": "effort=high, prompt_style=detailed, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=detailed_rndr=none_strat=none_tst=none_tedit=off_tglob=off_tgrep=on_tread=off_twrite=on_web=off_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=detailed_prov=anth_rndr=none_strat=none_tst=none_tedit=off_tglob=off_tgrep=on_tread=off_twrite=on_web=off_run5",
"short_id": "4c7db3b9",
"model": "haiku-4.5",
- "score": 0.485,
- "pc1": 6.4226,
- "pc2": 6.2047,
- "pc3": 0.137,
- "pc4": -3.3555,
- "pc5": -4.0926,
- "pc6": 1.0665,
- "pc7": 4.2171,
- "pc8": 0.0,
- "pc9": 0.1668,
- "pc10": -4.8274,
+ "score": 0.95,
+ "pc1": 7.1926,
+ "pc2": 6.8932,
+ "pc3": -0.1871,
+ "pc4": 4.4146,
+ "pc5": -3.3692,
+ "pc6": 0.5626,
+ "pc7": 0.4273,
+ "pc8": -0.7047,
+ "pc9": 1.1014,
+ "pc10": -6.8775,
"config_summary": "effort=high, prompt_style=detailed, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=detailed_rndr=none_strat=none_tst=none_tedit=off_tglob=off_tgrep=on_tread=off_twrite=on_web=off_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=detailed_prov=anth_rndr=none_strat=none_tst=none_tedit=off_tglob=off_tgrep=on_tread=off_twrite=on_web=off_run6",
"short_id": "40f9a902",
"model": "haiku-4.5",
- "score": 0.79,
- "pc1": 6.4226,
- "pc2": 6.2047,
- "pc3": 0.137,
- "pc4": -3.3555,
- "pc5": -4.0926,
- "pc6": 1.0665,
- "pc7": 4.2171,
- "pc8": 0.0,
- "pc9": 0.1668,
- "pc10": -4.8274,
+ "score": 0.89,
+ "pc1": 7.1926,
+ "pc2": 6.8932,
+ "pc3": -0.1871,
+ "pc4": 4.4146,
+ "pc5": -3.3692,
+ "pc6": 0.5626,
+ "pc7": 0.4273,
+ "pc8": -0.7047,
+ "pc9": 1.1014,
+ "pc10": -6.8775,
"config_summary": "effort=high, prompt_style=detailed, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run4",
"short_id": "e2e04e75",
"model": "haiku-4.5",
- "score": 0.305,
- "pc1": 2.336,
- "pc2": -1.3582,
- "pc3": -0.0908,
- "pc4": 0.9697,
- "pc5": -2.3099,
- "pc6": 0.4471,
- "pc7": 1.6101,
- "pc8": 0.0,
- "pc9": 0.078,
- "pc10": -2.0547,
+ "score": 0.875,
+ "pc1": 3.2316,
+ "pc2": -1.3118,
+ "pc3": -1.3333,
+ "pc4": -0.2671,
+ "pc5": -2.3126,
+ "pc6": 0.1583,
+ "pc7": 0.1577,
+ "pc8": -0.269,
+ "pc9": 0.3793,
+ "pc10": -2.6445,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run5",
"short_id": "b04257bc",
"model": "haiku-4.5",
- "score": 0.28,
- "pc1": 2.336,
- "pc2": -1.3582,
- "pc3": -0.0908,
- "pc4": 0.9697,
- "pc5": -2.3099,
- "pc6": 0.4471,
- "pc7": 1.6101,
- "pc8": 0.0,
- "pc9": 0.078,
- "pc10": -2.0547,
+ "score": 0.66,
+ "pc1": 3.2316,
+ "pc2": -1.3118,
+ "pc3": -1.3333,
+ "pc4": -0.2671,
+ "pc5": -2.3126,
+ "pc6": 0.1583,
+ "pc7": 0.1577,
+ "pc8": -0.269,
+ "pc9": 0.3793,
+ "pc10": -2.6445,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run6",
"short_id": "9b0e0479",
"model": "haiku-4.5",
- "score": 0.155,
- "pc1": 2.336,
- "pc2": -1.3582,
- "pc3": -0.0908,
- "pc4": 0.9697,
- "pc5": -2.3099,
- "pc6": 0.4471,
- "pc7": 1.6101,
- "pc8": 0.0,
- "pc9": 0.078,
- "pc10": -2.0547,
+ "score": 0.67,
+ "pc1": 3.2316,
+ "pc2": -1.3118,
+ "pc3": -1.3333,
+ "pc4": -0.2671,
+ "pc5": -2.3126,
+ "pc6": 0.1583,
+ "pc7": 0.1577,
+ "pc8": -0.269,
+ "pc9": 0.3793,
+ "pc10": -2.6445,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "83f0bb2a",
"model": "haiku-4.5",
- "score": 0.305,
- "pc1": 0.1643,
- "pc2": 0.6593,
- "pc3": -0.0153,
- "pc4": 1.1001,
- "pc5": -2.16,
- "pc6": 0.4179,
- "pc7": 1.6242,
- "pc8": 0.0,
- "pc9": 0.0805,
- "pc10": -2.2281,
+ "score": 0.66,
+ "pc1": 1.0025,
+ "pc2": 0.653,
+ "pc3": -0.6771,
+ "pc4": -0.5886,
+ "pc5": -2.4694,
+ "pc6": 0.0993,
+ "pc7": 0.3554,
+ "pc8": -0.3302,
+ "pc9": 0.3047,
+ "pc10": -2.7782,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run4",
"short_id": "daaf1998",
"model": "opus-4.6",
- "score": 0.365,
- "pc1": 2.2289,
- "pc2": -1.9794,
- "pc3": -0.3694,
- "pc4": 0.7304,
- "pc5": -2.3505,
- "pc6": 0.3692,
- "pc7": 1.3666,
- "pc8": 0.0,
- "pc9": 0.0761,
- "pc10": -2.1796,
+ "score": 0.84,
+ "pc1": 3.0575,
+ "pc2": -2.049,
+ "pc3": -1.4039,
+ "pc4": 0.0398,
+ "pc5": -2.2354,
+ "pc6": 0.2232,
+ "pc7": -0.0411,
+ "pc8": -0.2072,
+ "pc9": 0.3192,
+ "pc10": -2.5532,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run5",
"short_id": "f3f3cd51",
"model": "opus-4.6",
- "score": 0.755,
- "pc1": 2.2289,
- "pc2": -1.9794,
- "pc3": -0.3694,
- "pc4": 0.7304,
- "pc5": -2.3505,
- "pc6": 0.3692,
- "pc7": 1.3666,
- "pc8": 0.0,
- "pc9": 0.0761,
- "pc10": -2.1796,
+ "score": 0.975,
+ "pc1": 3.0575,
+ "pc2": -2.049,
+ "pc3": -1.4039,
+ "pc4": 0.0398,
+ "pc5": -2.2354,
+ "pc6": 0.2232,
+ "pc7": -0.0411,
+ "pc8": -0.2072,
+ "pc9": 0.3192,
+ "pc10": -2.5532,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run6",
"short_id": "bdd519b4",
"model": "opus-4.6",
- "score": 0.46,
- "pc1": 2.2289,
- "pc2": -1.9794,
- "pc3": -0.3694,
- "pc4": 0.7304,
- "pc5": -2.3505,
- "pc6": 0.3692,
- "pc7": 1.3666,
- "pc8": 0.0,
- "pc9": 0.0761,
- "pc10": -2.1796,
+ "score": 0.95,
+ "pc1": 3.0575,
+ "pc2": -2.049,
+ "pc3": -1.4039,
+ "pc4": 0.0398,
+ "pc5": -2.2354,
+ "pc6": 0.2232,
+ "pc7": -0.0411,
+ "pc8": -0.2072,
+ "pc9": 0.3192,
+ "pc10": -2.5532,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=low_model=qwen36p_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "20a18690",
"model": "qwen-3.6-plus",
- "score": 0.33,
- "pc1": -1.7047,
- "pc2": 1.1647,
- "pc3": 2.0752,
- "pc4": 0.9175,
- "pc5": -2.7151,
- "pc6": -0.2744,
- "pc7": 0.8194,
- "pc8": 0.0,
- "pc9": 0.039,
- "pc10": -2.5325,
+ "score": 0.685,
+ "pc1": -0.6298,
+ "pc2": 0.8713,
+ "pc3": 2.3199,
+ "pc4": -1.3944,
+ "pc5": -3.7058,
+ "pc6": 0.6709,
+ "pc7": 0.4702,
+ "pc8": -0.5805,
+ "pc9": 0.3302,
+ "pc10": -2.5492,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run4",
"short_id": "92501938",
"model": "sonnet-4.6",
- "score": 0.415,
- "pc1": 2.2194,
- "pc2": -1.9735,
- "pc3": -0.3672,
- "pc4": 0.7307,
- "pc5": -2.3484,
- "pc6": 0.3709,
- "pc7": 1.3702,
- "pc8": 0.0,
- "pc9": 0.0761,
- "pc10": -2.1783,
+ "score": 0.805,
+ "pc1": 3.0495,
+ "pc2": -2.0408,
+ "pc3": -1.4,
+ "pc4": 0.0599,
+ "pc5": -2.273,
+ "pc6": 0.287,
+ "pc7": 0.04,
+ "pc8": -0.3442,
+ "pc9": 0.465,
+ "pc10": -2.5077,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run5",
"short_id": "12f4a113",
"model": "sonnet-4.6",
- "score": 0.29,
- "pc1": 2.2194,
- "pc2": -1.9735,
- "pc3": -0.3672,
- "pc4": 0.7307,
- "pc5": -2.3484,
- "pc6": 0.3709,
- "pc7": 1.3702,
- "pc8": 0.0,
- "pc9": 0.0761,
- "pc10": -2.1783,
+ "score": 0.97,
+ "pc1": 3.0495,
+ "pc2": -2.0408,
+ "pc3": -1.4,
+ "pc4": 0.0599,
+ "pc5": -2.273,
+ "pc6": 0.287,
+ "pc7": 0.04,
+ "pc8": -0.3442,
+ "pc9": 0.465,
+ "pc10": -2.5077,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run6",
"short_id": "6031abcf",
"model": "sonnet-4.6",
- "score": 0.315,
- "pc1": 2.2194,
- "pc2": -1.9735,
- "pc3": -0.3672,
- "pc4": 0.7307,
- "pc5": -2.3484,
- "pc6": 0.3709,
- "pc7": 1.3702,
- "pc8": 0.0,
- "pc9": 0.0761,
- "pc10": -2.1783,
+ "score": 0.82,
+ "pc1": 3.0495,
+ "pc2": -2.0408,
+ "pc3": -1.4,
+ "pc4": 0.0599,
+ "pc5": -2.273,
+ "pc6": 0.287,
+ "pc7": 0.04,
+ "pc8": -0.3442,
+ "pc9": 0.465,
+ "pc10": -2.5077,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=sv_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "eba9a5d5",
- "model": "gemma-4-26b",
- "score": 0.325,
- "pc1": -3.49,
- "pc2": 0.5264,
- "pc3": 5.1288,
- "pc4": -0.4289,
- "pc5": -0.9392,
- "pc6": -0.9682,
- "pc7": -0.3883,
- "pc8": 0.0,
- "pc9": -12.5861,
- "pc10": -0.5153,
- "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
- },
- {
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=sv_hlang=en_lang=ts_lint=on_budget=low_model=glm45air_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "fadc2681",
"model": "glm-4.5-air",
- "score": 0.33,
- "pc1": -3.5269,
- "pc2": 0.8674,
- "pc3": 1.5532,
- "pc4": -0.009,
- "pc5": -0.439,
- "pc6": -0.7316,
- "pc7": -0.6099,
- "pc8": 0.0,
- "pc9": -12.5193,
- "pc10": -1.2557,
- "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
- },
- {
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=sv_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "9ec8bb27",
- "model": "haiku-4.5",
- "score": 0.325,
- "pc1": -1.5829,
- "pc2": 0.0225,
- "pc3": 3.0624,
- "pc4": -0.27,
- "pc5": -0.4584,
- "pc6": -0.7814,
- "pc7": -0.1368,
- "pc8": 0.0,
- "pc9": -12.5404,
- "pc10": -0.6855,
- "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
- },
- {
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=sv_hlang=en_lang=ts_lint=on_budget=low_model=qwen36p_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "4a42d14a",
- "model": "qwen-3.6-plus",
- "score": 0.325,
- "pc1": -3.4519,
- "pc2": 0.5279,
- "pc3": 5.1528,
- "pc4": -0.4526,
- "pc5": -1.0135,
- "pc6": -1.4737,
- "pc7": -0.9417,
- "pc8": 0.0,
- "pc9": -12.5819,
- "pc10": -0.9899,
+ "score": 0.785,
+ "pc1": -2.9653,
+ "pc2": 0.6501,
+ "pc3": -1.6918,
+ "pc4": -0.0491,
+ "pc5": 0.4543,
+ "pc6": -0.8946,
+ "pc7": -6.069,
+ "pc8": 8.5934,
+ "pc9": 1.4539,
+ "pc10": -4.2224,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=sv_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "44bdca2e",
+ "model": "glm-5.1",
+ "score": 0.81,
+ "pc1": -3.1159,
+ "pc2": 0.6968,
+ "pc3": -1.9976,
+ "pc4": 0.0717,
+ "pc5": 0.8282,
+ "pc6": -0.2438,
+ "pc7": -5.6657,
+ "pc8": 8.6305,
+ "pc9": 1.5247,
+ "pc10": -4.2136,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=sv_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "039adf80",
+ "model": "glm-5.1",
+ "score": 0.61,
+ "pc1": -3.1159,
+ "pc2": 0.6968,
+ "pc3": -1.9976,
+ "pc4": 0.0717,
+ "pc5": 0.8282,
+ "pc6": -0.2438,
+ "pc7": -5.6657,
+ "pc8": 8.6305,
+ "pc9": 1.5247,
+ "pc10": -4.2136,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=sv_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "b21b62e8",
+ "model": "glm-5.1",
+ "score": 0.635,
+ "pc1": -3.1159,
+ "pc2": 0.6968,
+ "pc3": -1.9976,
+ "pc4": 0.0717,
+ "pc5": 0.8282,
+ "pc6": -0.2438,
+ "pc7": -5.6657,
+ "pc8": 8.6305,
+ "pc9": 1.5247,
+ "pc10": -4.2136,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=max_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "165fc6e4",
"model": "gemma-4-26b",
- "score": 0.425,
- "pc1": -2.6075,
- "pc2": -0.6916,
- "pc3": 2.0886,
- "pc4": -1.0269,
- "pc5": -0.1616,
- "pc6": 3.9969,
- "pc7": -4.0123,
- "pc8": -0.0,
- "pc9": -0.0084,
- "pc10": -1.8233,
+ "score": 0.5,
+ "pc1": -1.5985,
+ "pc2": -1.0992,
+ "pc3": 3.9135,
+ "pc4": -0.1272,
+ "pc5": -0.1303,
+ "pc6": 3.551,
+ "pc7": -1.245,
+ "pc8": -4.1142,
+ "pc9": -0.5701,
+ "pc10": -0.1224,
+ "config_summary": "effort=max, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=max_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "d2e96e2c",
+ "model": "gemma-4-26b",
+ "score": 0.475,
+ "pc1": -1.5985,
+ "pc2": -1.0992,
+ "pc3": 3.9135,
+ "pc4": -0.1272,
+ "pc5": -0.1303,
+ "pc6": 3.551,
+ "pc7": -1.245,
+ "pc8": -4.1142,
+ "pc9": -0.5701,
+ "pc10": -0.1224,
"config_summary": "effort=max, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=max_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm45air_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "d179f825",
"model": "glm-4.5-air",
- "score": 0.18,
- "pc1": -2.6444,
- "pc2": -0.3506,
- "pc3": -1.487,
- "pc4": -0.6069,
- "pc5": 0.3386,
- "pc6": 4.2336,
- "pc7": -4.2339,
- "pc8": -0.0,
- "pc9": 0.0585,
- "pc10": -2.5638,
+ "score": 0.47,
+ "pc1": -2.0768,
+ "pc2": -0.736,
+ "pc3": 0.2719,
+ "pc4": 0.4681,
+ "pc5": 0.3146,
+ "pc6": 2.9168,
+ "pc7": -2.5108,
+ "pc8": -3.5473,
+ "pc9": -0.333,
+ "pc10": 0.0529,
+ "config_summary": "effort=max, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=max_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "ef24fb84",
+ "model": "glm-4.7",
+ "score": 0.73,
+ "pc1": -2.0948,
+ "pc2": -0.6887,
+ "pc3": 0.2106,
+ "pc4": 0.5638,
+ "pc5": 0.6899,
+ "pc6": 3.0573,
+ "pc7": -1.5646,
+ "pc8": -4.0169,
+ "pc9": -0.3009,
+ "pc10": 0.0145,
+ "config_summary": "effort=max, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=max_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "1e9c0a3b",
+ "model": "glm-4.7",
+ "score": 0.635,
+ "pc1": -2.0948,
+ "pc2": -0.6887,
+ "pc3": 0.2106,
+ "pc4": 0.5638,
+ "pc5": 0.6899,
+ "pc6": 3.0573,
+ "pc7": -1.5646,
+ "pc8": -4.0169,
+ "pc9": -0.3009,
+ "pc10": 0.0145,
+ "config_summary": "effort=max, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=max_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "76c2aa85",
+ "model": "glm-4.7",
+ "score": 0.705,
+ "pc1": -2.0948,
+ "pc2": -0.6887,
+ "pc3": 0.2106,
+ "pc4": 0.5638,
+ "pc5": 0.6899,
+ "pc6": 3.0573,
+ "pc7": -1.5646,
+ "pc8": -4.0169,
+ "pc9": -0.3009,
+ "pc10": 0.0145,
"config_summary": "effort=max, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=max_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "e128b57c",
"model": "glm-5.1",
- "score": 0.34,
- "pc1": -2.5946,
- "pc2": -0.2449,
- "pc3": -1.8532,
- "pc4": -0.6162,
- "pc5": 0.4817,
- "pc6": 4.2984,
- "pc7": -4.4372,
- "pc8": -0.0,
- "pc9": 0.0494,
- "pc10": -2.5706,
+ "score": 0.91,
+ "pc1": -2.2274,
+ "pc2": -0.6893,
+ "pc3": -0.0339,
+ "pc4": 0.5888,
+ "pc5": 0.6885,
+ "pc6": 3.5675,
+ "pc7": -2.1075,
+ "pc8": -3.5103,
+ "pc9": -0.2622,
+ "pc10": 0.0617,
"config_summary": "effort=max, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=max_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
"short_id": "025bcc22",
"model": "glm-5.1",
- "score": 0.34,
- "pc1": -2.5946,
- "pc2": -0.2449,
- "pc3": -1.8532,
- "pc4": -0.6162,
- "pc5": 0.4817,
- "pc6": 4.2984,
- "pc7": -4.4372,
- "pc8": -0.0,
- "pc9": 0.0494,
- "pc10": -2.5706,
+ "score": 0.825,
+ "pc1": -2.2274,
+ "pc2": -0.6893,
+ "pc3": -0.0339,
+ "pc4": 0.5888,
+ "pc5": 0.6885,
+ "pc6": 3.5675,
+ "pc7": -2.1075,
+ "pc8": -3.5103,
+ "pc9": -0.2622,
+ "pc10": 0.0617,
"config_summary": "effort=max, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=max_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
"short_id": "cd3f3c84",
"model": "glm-5.1",
- "score": 0.34,
- "pc1": -2.5946,
- "pc2": -0.2449,
- "pc3": -1.8532,
- "pc4": -0.6162,
- "pc5": 0.4817,
- "pc6": 4.2984,
- "pc7": -4.4372,
- "pc8": -0.0,
- "pc9": 0.0494,
- "pc10": -2.5706,
+ "score": 0.5,
+ "pc1": -2.2274,
+ "pc2": -0.6893,
+ "pc3": -0.0339,
+ "pc4": 0.5888,
+ "pc5": 0.6885,
+ "pc6": 3.5675,
+ "pc7": -2.1075,
+ "pc8": -3.5103,
+ "pc9": -0.2622,
+ "pc10": 0.0617,
"config_summary": "effort=max, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=max_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=max_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run4",
"short_id": "7e61c670",
"model": "haiku-4.5",
- "score": 0.715,
- "pc1": 1.4714,
- "pc2": -3.213,
- "pc3": -0.0534,
- "pc4": -0.9984,
- "pc5": 0.1692,
- "pc6": 4.2129,
- "pc7": -3.7748,
- "pc8": -0.0,
- "pc9": 0.0349,
- "pc10": -1.8201,
+ "score": 0.725,
+ "pc1": 2.228,
+ "pc2": -3.3475,
+ "pc3": 0.1829,
+ "pc4": 0.8122,
+ "pc5": 0.7989,
+ "pc6": 3.3271,
+ "pc7": -2.1379,
+ "pc8": -3.6725,
+ "pc9": -0.1297,
+ "pc10": 0.0875,
"config_summary": "effort=max, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=max_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=max_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run5",
"short_id": "6b33ee07",
"model": "haiku-4.5",
- "score": 0.34,
- "pc1": 1.4714,
- "pc2": -3.213,
- "pc3": -0.0534,
- "pc4": -0.9984,
- "pc5": 0.1692,
- "pc6": 4.2129,
- "pc7": -3.7748,
- "pc8": -0.0,
- "pc9": 0.0349,
- "pc10": -1.8201,
+ "score": 0.82,
+ "pc1": 2.228,
+ "pc2": -3.3475,
+ "pc3": 0.1829,
+ "pc4": 0.8122,
+ "pc5": 0.7989,
+ "pc6": 3.3271,
+ "pc7": -2.1379,
+ "pc8": -3.6725,
+ "pc9": -0.1297,
+ "pc10": 0.0875,
"config_summary": "effort=max, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=max_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=max_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run6",
"short_id": "89be04d9",
"model": "haiku-4.5",
- "score": 0.155,
- "pc1": 1.4714,
- "pc2": -3.213,
- "pc3": -0.0534,
- "pc4": -0.9984,
- "pc5": 0.1692,
- "pc6": 4.2129,
- "pc7": -3.7748,
- "pc8": -0.0,
- "pc9": 0.0349,
- "pc10": -1.8201,
+ "score": 0.655,
+ "pc1": 2.228,
+ "pc2": -3.3475,
+ "pc3": 0.1829,
+ "pc4": 0.8122,
+ "pc5": 0.7989,
+ "pc6": 3.3271,
+ "pc7": -2.1379,
+ "pc8": -3.6725,
+ "pc9": -0.1297,
+ "pc10": 0.0875,
+ "config_summary": "effort=max, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=max_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run4",
+ "short_id": "59e8da6e",
+ "model": "opus-4.6",
+ "score": 0.835,
+ "pc1": 2.0539,
+ "pc2": -4.0846,
+ "pc3": 0.1123,
+ "pc4": 1.1191,
+ "pc5": 0.876,
+ "pc6": 3.3919,
+ "pc7": -2.3367,
+ "pc8": -3.6107,
+ "pc9": -0.1898,
+ "pc10": 0.1788,
+ "config_summary": "effort=max, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=max_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run5",
+ "short_id": "f501a861",
+ "model": "opus-4.6",
+ "score": 0.835,
+ "pc1": 2.0539,
+ "pc2": -4.0846,
+ "pc3": 0.1123,
+ "pc4": 1.1191,
+ "pc5": 0.876,
+ "pc6": 3.3919,
+ "pc7": -2.3367,
+ "pc8": -3.6107,
+ "pc9": -0.1898,
+ "pc10": 0.1788,
+ "config_summary": "effort=max, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=max_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run6",
+ "short_id": "9720d53e",
+ "model": "opus-4.6",
+ "score": 0.795,
+ "pc1": 2.0539,
+ "pc2": -4.0846,
+ "pc3": 0.1123,
+ "pc4": 1.1191,
+ "pc5": 0.876,
+ "pc6": 3.3919,
+ "pc7": -2.3367,
+ "pc8": -3.6107,
+ "pc9": -0.1898,
+ "pc10": 0.1788,
+ "config_summary": "effort=max, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=max_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=qwen36p_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "09b8d56a",
+ "model": "qwen-3.6-plus",
+ "score": 0.5,
+ "pc1": -1.6334,
+ "pc2": -1.1644,
+ "pc3": 3.8361,
+ "pc4": -0.3151,
+ "pc5": -0.5943,
+ "pc6": 3.8396,
+ "pc7": -1.8254,
+ "pc8": -3.984,
+ "pc9": -0.1788,
+ "pc10": 0.1829,
+ "config_summary": "effort=max, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=max_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run4",
+ "short_id": "5d88e9c7",
+ "model": "sonnet-4.6",
+ "score": 0.775,
+ "pc1": 2.0459,
+ "pc2": -4.0765,
+ "pc3": 0.1162,
+ "pc4": 1.1392,
+ "pc5": 0.8385,
+ "pc6": 3.4558,
+ "pc7": -2.2556,
+ "pc8": -3.7477,
+ "pc9": -0.044,
+ "pc10": 0.2244,
+ "config_summary": "effort=max, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=max_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run5",
+ "short_id": "20dc3752",
+ "model": "sonnet-4.6",
+ "score": 0.97,
+ "pc1": 2.0459,
+ "pc2": -4.0765,
+ "pc3": 0.1162,
+ "pc4": 1.1392,
+ "pc5": 0.8385,
+ "pc6": 3.4558,
+ "pc7": -2.2556,
+ "pc8": -3.7477,
+ "pc9": -0.044,
+ "pc10": 0.2244,
+ "config_summary": "effort=max, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=max_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run6",
+ "short_id": "4905874d",
+ "model": "sonnet-4.6",
+ "score": 0.85,
+ "pc1": 2.0459,
+ "pc2": -4.0765,
+ "pc3": 0.1162,
+ "pc4": 1.1392,
+ "pc5": 0.8385,
+ "pc6": 3.4558,
+ "pc7": -2.2556,
+ "pc8": -3.7477,
+ "pc9": -0.044,
+ "pc10": 0.2244,
"config_summary": "effort=max, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=max_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "59e8da6e",
- "model": "opus-4.6",
- "score": 0.39,
- "pc1": 1.3642,
- "pc2": -3.8342,
- "pc3": -0.332,
- "pc4": -1.2377,
- "pc5": 0.1286,
- "pc6": 4.135,
- "pc7": -4.0184,
- "pc8": -0.0,
- "pc9": 0.033,
- "pc10": -1.945,
- "config_summary": "effort=max, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=specific_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm45air_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "20ecfcc4",
+ "model": "glm-4.5-air",
+ "score": 0.485,
+ "pc1": -2.9306,
+ "pc2": 0.5848,
+ "pc3": 0.2131,
+ "pc4": -0.7299,
+ "pc5": -2.6031,
+ "pc6": 0.9935,
+ "pc7": -3.9674,
+ "pc8": 1.5192,
+ "pc9": 6.8653,
+ "pc10": 2.4628,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=specific_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "aff304c1",
+ "model": "glm-5.1",
+ "score": 0.48,
+ "pc1": -3.0811,
+ "pc2": 0.6315,
+ "pc3": -0.0927,
+ "pc4": -0.6091,
+ "pc5": -2.2292,
+ "pc6": 1.6442,
+ "pc7": -3.5641,
+ "pc8": 1.5562,
+ "pc9": 6.9361,
+ "pc10": 2.4716,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=specific_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "1005e419",
+ "model": "glm-5.1",
+ "score": 0.635,
+ "pc1": -3.0811,
+ "pc2": 0.6315,
+ "pc3": -0.0927,
+ "pc4": -0.6091,
+ "pc5": -2.2292,
+ "pc6": 1.6442,
+ "pc7": -3.5641,
+ "pc8": 1.5562,
+ "pc9": 6.9361,
+ "pc10": 2.4716,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=specific_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "80b5cf08",
+ "model": "glm-5.1",
+ "score": 0.835,
+ "pc1": -3.0811,
+ "pc2": 0.6315,
+ "pc3": -0.0927,
+ "pc4": -0.6091,
+ "pc5": -2.2292,
+ "pc6": 1.6442,
+ "pc7": -3.5641,
+ "pc8": 1.5562,
+ "pc9": 6.9361,
+ "pc10": 2.4716,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=specific_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=qwen36p_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "fb0c6aef",
+ "model": "qwen-3.6-plus",
+ "score": 0.665,
+ "pc1": -2.4872,
+ "pc2": 0.1564,
+ "pc3": 3.7773,
+ "pc4": -1.5131,
+ "pc5": -3.5121,
+ "pc6": 1.9164,
+ "pc7": -3.282,
+ "pc8": 1.0825,
+ "pc9": 7.0195,
+ "pc10": 2.5928,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=vague_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm45air_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "a7393fb0",
+ "model": "glm-4.5-air",
+ "score": 0.615,
+ "pc1": -2.9292,
+ "pc2": 0.5618,
+ "pc3": 0.3056,
+ "pc4": -0.6549,
+ "pc5": -2.6372,
+ "pc6": 1.2746,
+ "pc7": -4.1902,
+ "pc8": 1.9195,
+ "pc9": 6.6569,
+ "pc10": 2.7341,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=vague_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "c0ca12f7",
+ "model": "glm-5.1",
+ "score": 0.785,
+ "pc1": -3.0798,
+ "pc2": 0.6086,
+ "pc3": -0.0001,
+ "pc4": -0.5341,
+ "pc5": -2.2633,
+ "pc6": 1.9254,
+ "pc7": -3.7868,
+ "pc8": 1.9566,
+ "pc9": 6.7277,
+ "pc10": 2.7429,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=vague_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "ae8a9e3a",
+ "model": "glm-5.1",
+ "score": 0.68,
+ "pc1": -3.0798,
+ "pc2": 0.6086,
+ "pc3": -0.0001,
+ "pc4": -0.5341,
+ "pc5": -2.2633,
+ "pc6": 1.9254,
+ "pc7": -3.7868,
+ "pc8": 1.9566,
+ "pc9": 6.7277,
+ "pc10": 2.7429,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=vague_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "3e78199f",
+ "model": "glm-5.1",
+ "score": 0.785,
+ "pc1": -3.0798,
+ "pc2": 0.6086,
+ "pc3": -0.0001,
+ "pc4": -0.5341,
+ "pc5": -2.2633,
+ "pc6": 1.9254,
+ "pc7": -3.7868,
+ "pc8": 1.9566,
+ "pc9": 6.7277,
+ "pc10": 2.7429,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=vague_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=qwen36p_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "602fba4b",
+ "model": "qwen-3.6-plus",
+ "score": 0.945,
+ "pc1": -2.4858,
+ "pc2": 0.1334,
+ "pc3": 3.8699,
+ "pc4": -1.4381,
+ "pc5": -3.5462,
+ "pc6": 2.1975,
+ "pc7": -3.5047,
+ "pc8": 1.4828,
+ "pc9": 6.811,
+ "pc10": 2.8641,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=lor100k_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "f4281547",
+ "model": "glm-4.7",
+ "score": 0.78,
+ "pc1": -3.0234,
+ "pc2": 0.7188,
+ "pc3": -1.961,
+ "pc4": 0.4308,
+ "pc5": 1.6696,
+ "pc6": 2.0641,
+ "pc7": 2.8791,
+ "pc8": -0.0176,
+ "pc9": 0.1517,
+ "pc10": -0.1076,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=lor100k_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "083647f8",
+ "model": "glm-4.7",
+ "score": 0.66,
+ "pc1": -3.0234,
+ "pc2": 0.7188,
+ "pc3": -1.961,
+ "pc4": 0.4308,
+ "pc5": 1.6696,
+ "pc6": 2.0641,
+ "pc7": 2.8791,
+ "pc8": -0.0176,
+ "pc9": 0.1517,
+ "pc10": -0.1076,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=lor100k_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "c8f6a35c",
+ "model": "glm-4.7",
+ "score": 0.78,
+ "pc1": -3.0234,
+ "pc2": 0.7188,
+ "pc3": -1.961,
+ "pc4": 0.4308,
+ "pc5": 1.6696,
+ "pc6": 2.0641,
+ "pc7": 2.8791,
+ "pc8": -0.0176,
+ "pc9": 0.1517,
+ "pc10": -0.1076,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=lor100k_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "32860f58",
+ "model": "glm-5.1",
+ "score": 0.75,
+ "pc1": -3.1559,
+ "pc2": 0.7182,
+ "pc3": -2.2055,
+ "pc4": 0.4558,
+ "pc5": 1.6682,
+ "pc6": 2.5743,
+ "pc7": 2.3362,
+ "pc8": 0.4891,
+ "pc9": 0.1904,
+ "pc10": -0.0604,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=lor100k_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "3813f826",
+ "model": "glm-5.1",
+ "score": 0.5,
+ "pc1": -3.1559,
+ "pc2": 0.7182,
+ "pc3": -2.2055,
+ "pc4": 0.4558,
+ "pc5": 1.6682,
+ "pc6": 2.5743,
+ "pc7": 2.3362,
+ "pc8": 0.4891,
+ "pc9": 0.1904,
+ "pc10": -0.0604,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=lor100k_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "699cf77b",
+ "model": "glm-5.1",
+ "score": 0.635,
+ "pc1": -3.1559,
+ "pc2": 0.7182,
+ "pc3": -2.2055,
+ "pc4": 0.4558,
+ "pc5": 1.6682,
+ "pc6": 2.5743,
+ "pc7": 2.3362,
+ "pc8": 0.4891,
+ "pc9": 0.1904,
+ "pc10": -0.0604,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=lor10k_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "2ae87d54",
+ "model": "glm-4.7",
+ "score": 0.64,
+ "pc1": -3.0216,
+ "pc2": 0.7279,
+ "pc3": -1.9054,
+ "pc4": 0.3277,
+ "pc5": 1.8174,
+ "pc6": 2.0233,
+ "pc7": 3.0886,
+ "pc8": 0.206,
+ "pc9": 0.1952,
+ "pc10": 0.1062,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=lor10k_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "64b059c8",
+ "model": "glm-4.7",
+ "score": 0.765,
+ "pc1": -3.0216,
+ "pc2": 0.7279,
+ "pc3": -1.9054,
+ "pc4": 0.3277,
+ "pc5": 1.8174,
+ "pc6": 2.0233,
+ "pc7": 3.0886,
+ "pc8": 0.206,
+ "pc9": 0.1952,
+ "pc10": 0.1062,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=lor10k_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "c273dfb3",
+ "model": "glm-4.7",
+ "score": 0.68,
+ "pc1": -3.0216,
+ "pc2": 0.7279,
+ "pc3": -1.9054,
+ "pc4": 0.3277,
+ "pc5": 1.8174,
+ "pc6": 2.0233,
+ "pc7": 3.0886,
+ "pc8": 0.206,
+ "pc9": 0.1952,
+ "pc10": 0.1062,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=lor10k_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "bc23f2b0",
+ "model": "glm-5.1",
+ "score": 0.785,
+ "pc1": -3.1541,
+ "pc2": 0.7273,
+ "pc3": -2.1499,
+ "pc4": 0.3527,
+ "pc5": 1.816,
+ "pc6": 2.5335,
+ "pc7": 2.5456,
+ "pc8": 0.7126,
+ "pc9": 0.2339,
+ "pc10": 0.1534,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=lor10k_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "1e9fac18",
+ "model": "glm-5.1",
+ "score": 0.625,
+ "pc1": -3.1541,
+ "pc2": 0.7273,
+ "pc3": -2.1499,
+ "pc4": 0.3527,
+ "pc5": 1.816,
+ "pc6": 2.5335,
+ "pc7": 2.5456,
+ "pc8": 0.7126,
+ "pc9": 0.2339,
+ "pc10": 0.1534,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=lor10k_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "0c02f27a",
+ "model": "glm-5.1",
+ "score": 1.0,
+ "pc1": -3.1541,
+ "pc2": 0.7273,
+ "pc3": -2.1499,
+ "pc4": 0.3527,
+ "pc5": 1.816,
+ "pc6": 2.5335,
+ "pc7": 2.5456,
+ "pc8": 0.7126,
+ "pc9": 0.2339,
+ "pc10": 0.1534,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=lor1k_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "b0889b2f",
+ "model": "glm-5.1",
+ "score": 0.795,
+ "pc1": -3.1632,
+ "pc2": 0.7125,
+ "pc3": -2.3615,
+ "pc4": 0.2187,
+ "pc5": 1.6386,
+ "pc6": 3.0802,
+ "pc7": 2.1325,
+ "pc8": 0.725,
+ "pc9": 0.2078,
+ "pc10": 0.1965,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=max_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
- "short_id": "f501a861",
- "model": "opus-4.6",
- "score": 0.355,
- "pc1": 1.3642,
- "pc2": -3.8342,
- "pc3": -0.332,
- "pc4": -1.2377,
- "pc5": 0.1286,
- "pc6": 4.135,
- "pc7": -4.0184,
- "pc8": -0.0,
- "pc9": 0.033,
- "pc10": -1.945,
- "config_summary": "effort=max, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
+ "run_id": "tetris_arch=none_ctx=none_noise=lor1k_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "3e650991",
+ "model": "glm-5.1",
+ "score": 0.73,
+ "pc1": -3.1632,
+ "pc2": 0.7125,
+ "pc3": -2.3615,
+ "pc4": 0.2187,
+ "pc5": 1.6386,
+ "pc6": 3.0802,
+ "pc7": 2.1325,
+ "pc8": 0.725,
+ "pc9": 0.2078,
+ "pc10": 0.1965,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=max_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
- "short_id": "9720d53e",
- "model": "opus-4.6",
- "score": 0.75,
- "pc1": 1.3642,
- "pc2": -3.8342,
- "pc3": -0.332,
- "pc4": -1.2377,
- "pc5": 0.1286,
- "pc6": 4.135,
- "pc7": -4.0184,
- "pc8": -0.0,
- "pc9": 0.033,
- "pc10": -1.945,
- "config_summary": "effort=max, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
+ "run_id": "tetris_arch=none_ctx=none_noise=lor1k_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "527ae718",
+ "model": "glm-5.1",
+ "score": 0.81,
+ "pc1": -3.1632,
+ "pc2": 0.7125,
+ "pc3": -2.3615,
+ "pc4": 0.2187,
+ "pc5": 1.6386,
+ "pc6": 3.0802,
+ "pc7": 2.1325,
+ "pc8": 0.725,
+ "pc9": 0.2078,
+ "pc10": 0.1965,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=lor50k_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "5759a070",
+ "model": "glm-4.7",
+ "score": 0.305,
+ "pc1": -3.0217,
+ "pc2": 0.7232,
+ "pc3": -1.8507,
+ "pc4": 0.4951,
+ "pc5": 1.8957,
+ "pc6": 1.9906,
+ "pc7": 3.2101,
+ "pc8": 0.0592,
+ "pc9": 0.0451,
+ "pc10": 0.1581,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=max_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=qwen36p_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "09b8d56a",
- "model": "qwen-3.6-plus",
- "score": 0.255,
- "pc1": -2.5694,
- "pc2": -0.69,
- "pc3": 2.1126,
- "pc4": -1.0506,
- "pc5": -0.236,
- "pc6": 3.4914,
- "pc7": -4.5656,
- "pc8": -0.0,
- "pc9": -0.0042,
- "pc10": -2.298,
- "config_summary": "effort=max, prompt_style=simple, language=typescript, max_budget=low"
+ "run_id": "tetris_arch=none_ctx=none_noise=lor50k_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "71592253",
+ "model": "glm-4.7",
+ "score": 0.715,
+ "pc1": -3.0217,
+ "pc2": 0.7232,
+ "pc3": -1.8507,
+ "pc4": 0.4951,
+ "pc5": 1.8957,
+ "pc6": 1.9906,
+ "pc7": 3.2101,
+ "pc8": 0.0592,
+ "pc9": 0.0451,
+ "pc10": 0.1581,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=max_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "5d88e9c7",
- "model": "sonnet-4.6",
- "score": 0.75,
- "pc1": 1.3547,
- "pc2": -3.8283,
- "pc3": -0.3298,
- "pc4": -1.2375,
- "pc5": 0.1308,
- "pc6": 4.1368,
- "pc7": -4.0148,
- "pc8": -0.0,
- "pc9": 0.033,
- "pc10": -1.9437,
- "config_summary": "effort=max, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
+ "run_id": "tetris_arch=none_ctx=none_noise=lor50k_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "0cd7b5c0",
+ "model": "glm-4.7",
+ "score": 0.46,
+ "pc1": -3.0217,
+ "pc2": 0.7232,
+ "pc3": -1.8507,
+ "pc4": 0.4951,
+ "pc5": 1.8957,
+ "pc6": 1.9906,
+ "pc7": 3.2101,
+ "pc8": 0.0592,
+ "pc9": 0.0451,
+ "pc10": 0.1581,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=max_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
- "short_id": "20dc3752",
- "model": "sonnet-4.6",
- "score": 0.74,
- "pc1": 1.3547,
- "pc2": -3.8283,
- "pc3": -0.3298,
- "pc4": -1.2375,
- "pc5": 0.1308,
- "pc6": 4.1368,
- "pc7": -4.0148,
- "pc8": -0.0,
- "pc9": 0.033,
- "pc10": -1.9437,
- "config_summary": "effort=max, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
+ "run_id": "tetris_arch=none_ctx=none_noise=lor50k_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "f0919def",
+ "model": "glm-5.1",
+ "score": 0.73,
+ "pc1": -3.1542,
+ "pc2": 0.7226,
+ "pc3": -2.0952,
+ "pc4": 0.5201,
+ "pc5": 1.8943,
+ "pc6": 2.5008,
+ "pc7": 2.6672,
+ "pc8": 0.5658,
+ "pc9": 0.0839,
+ "pc10": 0.2053,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=max_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
- "short_id": "4905874d",
- "model": "sonnet-4.6",
- "score": 0.75,
- "pc1": 1.3547,
- "pc2": -3.8283,
- "pc3": -0.3298,
- "pc4": -1.2375,
- "pc5": 0.1308,
- "pc6": 4.1368,
- "pc7": -4.0148,
- "pc8": -0.0,
- "pc9": 0.033,
- "pc10": -1.9437,
- "config_summary": "effort=max, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
+ "run_id": "tetris_arch=none_ctx=none_noise=lor50k_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "374c9fe4",
+ "model": "glm-5.1",
+ "score": 1.0,
+ "pc1": -3.1542,
+ "pc2": 0.7226,
+ "pc3": -2.0952,
+ "pc4": 0.5201,
+ "pc5": 1.8943,
+ "pc6": 2.5008,
+ "pc7": 2.6672,
+ "pc8": 0.5658,
+ "pc9": 0.0839,
+ "pc10": 0.2053,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=lor50k_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "120783c1",
+ "model": "glm-5.1",
+ "score": 0.835,
+ "pc1": -3.1542,
+ "pc2": 0.7226,
+ "pc3": -2.0952,
+ "pc4": 0.5201,
+ "pc5": 1.8943,
+ "pc6": 2.5008,
+ "pc7": 2.6672,
+ "pc8": 0.5658,
+ "pc9": 0.0839,
+ "pc10": 0.2053,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=specific_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "3be19fa3",
- "model": "gemma-4-26b",
- "score": 0.325,
- "pc1": -3.4972,
- "pc2": 0.5282,
- "pc3": 5.187,
- "pc4": -0.4356,
- "pc5": -0.9644,
- "pc6": -1.0677,
- "pc7": -0.5496,
- "pc8": 7.0631,
- "pc9": 3.1667,
- "pc10": -0.0884,
+ "run_id": "tetris_arch=none_ctx=none_noise=wiki100k_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "e12838e5",
+ "model": "glm-5.1",
+ "score": 0.86,
+ "pc1": -3.168,
+ "pc2": 0.7065,
+ "pc3": -2.2847,
+ "pc4": 0.3532,
+ "pc5": 1.3758,
+ "pc6": 2.8603,
+ "pc7": 2.0599,
+ "pc8": 0.1306,
+ "pc9": 0.0984,
+ "pc10": -0.5269,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=wiki100k_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "cac6bb65",
+ "model": "glm-5.1",
+ "score": 0.625,
+ "pc1": -3.168,
+ "pc2": 0.7065,
+ "pc3": -2.2847,
+ "pc4": 0.3532,
+ "pc5": 1.3758,
+ "pc6": 2.8603,
+ "pc7": 2.0599,
+ "pc8": 0.1306,
+ "pc9": 0.0984,
+ "pc10": -0.5269,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=wiki100k_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "3a8321c5",
+ "model": "glm-5.1",
+ "score": 0.585,
+ "pc1": -3.168,
+ "pc2": 0.7065,
+ "pc3": -2.2847,
+ "pc4": 0.3532,
+ "pc5": 1.3758,
+ "pc6": 2.8603,
+ "pc7": 2.0599,
+ "pc8": 0.1306,
+ "pc9": 0.0984,
+ "pc10": -0.5269,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=wiki10k_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "8b81a68b",
+ "model": "glm-5.1",
+ "score": 0.87,
+ "pc1": -3.1617,
+ "pc2": 0.7088,
+ "pc3": -2.0745,
+ "pc4": 0.479,
+ "pc5": 1.6978,
+ "pc6": 2.7241,
+ "pc7": 2.5295,
+ "pc8": 1.5962,
+ "pc9": 0.0216,
+ "pc10": -0.0555,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=specific_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm45air_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "20ecfcc4",
- "model": "glm-4.5-air",
- "score": 0.28,
- "pc1": -3.5341,
- "pc2": 0.8692,
- "pc3": 1.6114,
- "pc4": -0.0156,
- "pc5": -0.4642,
- "pc6": -0.8311,
- "pc7": -0.7712,
- "pc8": 7.0631,
- "pc9": 3.2335,
- "pc10": -0.8288,
- "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
- },
- {
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=specific_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "bca4f2f3",
- "model": "haiku-4.5",
- "score": 0.325,
- "pc1": -1.5901,
- "pc2": 0.0243,
- "pc3": 3.1206,
- "pc4": -0.2767,
- "pc5": -0.4836,
- "pc6": -0.8809,
- "pc7": -0.2981,
- "pc8": 7.0631,
- "pc9": 3.2124,
- "pc10": -0.2586,
+ "run_id": "tetris_arch=none_ctx=none_noise=wiki10k_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "bb9af51e",
+ "model": "glm-5.1",
+ "score": 0.785,
+ "pc1": -3.1617,
+ "pc2": 0.7088,
+ "pc3": -2.0745,
+ "pc4": 0.479,
+ "pc5": 1.6978,
+ "pc6": 2.7241,
+ "pc7": 2.5295,
+ "pc8": 1.5962,
+ "pc9": 0.0216,
+ "pc10": -0.0555,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=wiki10k_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "9bda026f",
+ "model": "glm-5.1",
+ "score": 0.59,
+ "pc1": -3.1617,
+ "pc2": 0.7088,
+ "pc3": -2.0745,
+ "pc4": 0.479,
+ "pc5": 1.6978,
+ "pc6": 2.7241,
+ "pc7": 2.5295,
+ "pc8": 1.5962,
+ "pc9": 0.0216,
+ "pc10": -0.0555,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=specific_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=qwen36p_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "fb0c6aef",
- "model": "qwen-3.6-plus",
- "score": 0.31,
- "pc1": -3.4591,
- "pc2": 0.5298,
- "pc3": 5.211,
- "pc4": -0.4593,
- "pc5": -1.0387,
- "pc6": -1.5732,
- "pc7": -1.103,
- "pc8": 7.0631,
- "pc9": 3.1709,
- "pc10": -0.563,
- "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
- },
- {
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=vague_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "6560e960",
- "model": "gemma-4-26b",
- "score": 0.325,
- "pc1": -3.4972,
- "pc2": 0.5282,
- "pc3": 5.187,
- "pc4": -0.4356,
- "pc5": -0.9644,
- "pc6": -1.0677,
- "pc7": -0.5496,
- "pc8": 7.0631,
- "pc9": 3.1667,
- "pc10": -0.0884,
+ "run_id": "tetris_arch=none_ctx=none_noise=wiki1k_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "0f274b03",
+ "model": "glm-5.1",
+ "score": 0.93,
+ "pc1": -3.163,
+ "pc2": 0.7039,
+ "pc3": -2.4136,
+ "pc4": 0.4368,
+ "pc5": 1.5766,
+ "pc6": 2.9118,
+ "pc7": 2.22,
+ "pc8": 1.0117,
+ "pc9": -0.0752,
+ "pc10": -0.2549,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=wiki1k_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "485a520f",
+ "model": "glm-5.1",
+ "score": 0.785,
+ "pc1": -3.163,
+ "pc2": 0.7039,
+ "pc3": -2.4136,
+ "pc4": 0.4368,
+ "pc5": 1.5766,
+ "pc6": 2.9118,
+ "pc7": 2.22,
+ "pc8": 1.0117,
+ "pc9": -0.0752,
+ "pc10": -0.2549,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=wiki1k_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "7a7443d8",
+ "model": "glm-5.1",
+ "score": 0.835,
+ "pc1": -3.163,
+ "pc2": 0.7039,
+ "pc3": -2.4136,
+ "pc4": 0.4368,
+ "pc5": 1.5766,
+ "pc6": 2.9118,
+ "pc7": 2.22,
+ "pc8": 1.0117,
+ "pc9": -0.0752,
+ "pc10": -0.2549,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=vague_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm45air_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "a7393fb0",
- "model": "glm-4.5-air",
- "score": 0.23,
- "pc1": -3.5341,
- "pc2": 0.8692,
- "pc3": 1.6114,
- "pc4": -0.0156,
- "pc5": -0.4642,
- "pc6": -0.8311,
- "pc7": -0.7712,
- "pc8": 7.0631,
- "pc9": 3.2335,
- "pc10": -0.8288,
- "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
- },
- {
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=vague_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "ec236ed9",
- "model": "haiku-4.5",
- "score": 0.325,
- "pc1": -1.5901,
- "pc2": 0.0243,
- "pc3": 3.1206,
- "pc4": -0.2767,
- "pc5": -0.4836,
- "pc6": -0.8809,
- "pc7": -0.2981,
- "pc8": 7.0631,
- "pc9": 3.2124,
- "pc10": -0.2586,
+ "run_id": "tetris_arch=none_ctx=none_noise=wiki50k_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "0bde7ee4",
+ "model": "glm-5.1",
+ "score": 0.695,
+ "pc1": -3.1585,
+ "pc2": 0.7227,
+ "pc3": -2.1192,
+ "pc4": 0.4551,
+ "pc5": 1.9137,
+ "pc6": 2.7416,
+ "pc7": 2.3863,
+ "pc8": 1.0697,
+ "pc9": -0.1127,
+ "pc10": 0.5701,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=none_noise=wiki50k_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "3021ad25",
+ "model": "glm-5.1",
+ "score": 0.835,
+ "pc1": -3.1585,
+ "pc2": 0.7227,
+ "pc3": -2.1192,
+ "pc4": 0.4551,
+ "pc5": 1.9137,
+ "pc6": 2.7416,
+ "pc7": 2.3863,
+ "pc8": 1.0697,
+ "pc9": -0.1127,
+ "pc10": 0.5701,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=vague_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=qwen36p_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "602fba4b",
- "model": "qwen-3.6-plus",
- "score": 0.77,
- "pc1": -3.4591,
- "pc2": 0.5298,
- "pc3": 5.211,
- "pc4": -0.4593,
- "pc5": -1.0387,
- "pc6": -1.5732,
- "pc7": -1.103,
- "pc8": 7.0631,
- "pc9": 3.1709,
- "pc10": -0.563,
+ "run_id": "tetris_arch=none_ctx=none_noise=wiki50k_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "f34781bd",
+ "model": "glm-5.1",
+ "score": 0.975,
+ "pc1": -3.1585,
+ "pc2": 0.7227,
+ "pc3": -2.1192,
+ "pc4": 0.4551,
+ "pc5": 1.9137,
+ "pc6": 2.7416,
+ "pc7": 2.3863,
+ "pc8": 1.0697,
+ "pc9": -0.1127,
+ "pc10": 0.5701,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=none_tst=none_tedit=off_tglob=off_tgrep=off_tread=on_twrite=off_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=none_tst=none_tedit=off_tglob=off_tgrep=off_tread=on_twrite=off_web=on_run4",
"short_id": "1e3f4cdb",
"model": "haiku-4.5",
- "score": 0.59,
- "pc1": 6.6173,
- "pc2": 6.1061,
- "pc3": 1.7415,
- "pc4": 1.1918,
- "pc5": 7.3419,
- "pc6": -0.2971,
- "pc7": -0.9647,
- "pc8": -0.0,
- "pc9": 0.0054,
- "pc10": -0.1751,
+ "score": 0.845,
+ "pc1": 7.3027,
+ "pc2": 6.7229,
+ "pc3": 1.8427,
+ "pc4": -3.6129,
+ "pc5": 6.9115,
+ "pc6": -0.6175,
+ "pc7": -1.6293,
+ "pc8": 0.6499,
+ "pc9": 0.4101,
+ "pc10": 1.1397,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=none_tst=none_tedit=off_tglob=off_tgrep=off_tread=on_twrite=off_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=none_tst=none_tedit=off_tglob=off_tgrep=off_tread=on_twrite=off_web=on_run5",
"short_id": "c7b0bb6b",
"model": "haiku-4.5",
- "score": 0.565,
- "pc1": 6.6173,
- "pc2": 6.1061,
- "pc3": 1.7415,
- "pc4": 1.1918,
- "pc5": 7.3419,
- "pc6": -0.2971,
- "pc7": -0.9647,
- "pc8": -0.0,
- "pc9": 0.0054,
- "pc10": -0.1751,
+ "score": 0.775,
+ "pc1": 7.3027,
+ "pc2": 6.7229,
+ "pc3": 1.8427,
+ "pc4": -3.6129,
+ "pc5": 6.9115,
+ "pc6": -0.6175,
+ "pc7": -1.6293,
+ "pc8": 0.6499,
+ "pc9": 0.4101,
+ "pc10": 1.1397,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=none_tst=none_tedit=off_tglob=off_tgrep=off_tread=on_twrite=off_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=none_tst=none_tedit=off_tglob=off_tgrep=off_tread=on_twrite=off_web=on_run6",
"short_id": "bbb70053",
"model": "haiku-4.5",
- "score": 0.715,
- "pc1": 6.6173,
- "pc2": 6.1061,
- "pc3": 1.7415,
- "pc4": 1.1918,
- "pc5": 7.3419,
- "pc6": -0.2971,
- "pc7": -0.9647,
- "pc8": -0.0,
- "pc9": 0.0054,
- "pc10": -0.1751,
+ "score": 0.805,
+ "pc1": 7.3027,
+ "pc2": 6.7229,
+ "pc3": 1.8427,
+ "pc4": -3.6129,
+ "pc5": 6.9115,
+ "pc6": -0.6175,
+ "pc7": -1.6293,
+ "pc8": 0.6499,
+ "pc9": 0.4101,
+ "pc10": 1.1397,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=high_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=high_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run4",
"short_id": "77966846",
"model": "haiku-4.5",
- "score": 0.255,
- "pc1": 3.1598,
- "pc2": -1.516,
- "pc3": 0.5613,
- "pc4": 6.0975,
- "pc5": -0.3133,
- "pc6": -0.1858,
- "pc7": -0.626,
- "pc8": -0.0,
- "pc9": -0.0503,
- "pc10": 1.6554,
+ "score": 0.75,
+ "pc1": 4.1553,
+ "pc2": -1.5253,
+ "pc3": -2.3548,
+ "pc4": -6.249,
+ "pc5": -0.9253,
+ "pc6": 0.153,
+ "pc7": 0.6073,
+ "pc8": 0.2824,
+ "pc9": -0.3021,
+ "pc10": 1.2512,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=high, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=high_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=high_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run5",
"short_id": "f6426aae",
"model": "haiku-4.5",
- "score": 0.405,
- "pc1": 3.1598,
- "pc2": -1.516,
- "pc3": 0.5613,
- "pc4": 6.0975,
- "pc5": -0.3133,
- "pc6": -0.1858,
- "pc7": -0.626,
- "pc8": -0.0,
- "pc9": -0.0503,
- "pc10": 1.6554,
+ "score": 0.945,
+ "pc1": 4.1553,
+ "pc2": -1.5253,
+ "pc3": -2.3548,
+ "pc4": -6.249,
+ "pc5": -0.9253,
+ "pc6": 0.153,
+ "pc7": 0.6073,
+ "pc8": 0.2824,
+ "pc9": -0.3021,
+ "pc10": 1.2512,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=high, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=high_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=high_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run6",
"short_id": "f86cae22",
"model": "haiku-4.5",
- "score": 0.155,
- "pc1": 3.1598,
- "pc2": -1.516,
- "pc3": 0.5613,
- "pc4": 6.0975,
- "pc5": -0.3133,
- "pc6": -0.1858,
- "pc7": -0.626,
- "pc8": -0.0,
- "pc9": -0.0503,
- "pc10": 1.6554,
+ "score": 0.735,
+ "pc1": 4.1553,
+ "pc2": -1.5253,
+ "pc3": -2.3548,
+ "pc4": -6.249,
+ "pc5": -0.9253,
+ "pc6": 0.153,
+ "pc7": 0.6073,
+ "pc8": 0.2824,
+ "pc9": -0.3021,
+ "pc10": 1.2512,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=high, strategy=use_subagents"
},
{
"run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "7e5bb7c3",
"model": "gemma-4-26b",
- "score": 0.325,
- "pc1": -1.5496,
- "pc2": 0.9833,
- "pc3": 2.5645,
- "pc4": 2.6526,
- "pc5": 0.1492,
- "pc6": -0.2184,
- "pc7": -0.5794,
- "pc8": -0.0,
- "pc9": -0.0533,
- "pc10": 0.5997,
+ "score": 0.485,
+ "pc1": -0.5165,
+ "pc2": 0.7262,
+ "pc3": 2.5894,
+ "pc4": -3.778,
+ "pc5": -0.6605,
+ "pc6": 0.0886,
+ "pc7": 0.8285,
+ "pc8": -0.2823,
+ "pc9": -0.426,
+ "pc10": 0.9359,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm45air_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "0f8c8b62",
"model": "glm-4.5-air",
- "score": 0.155,
- "pc1": -1.5865,
- "pc2": 1.3243,
- "pc3": -1.0111,
- "pc4": 3.0726,
- "pc5": 0.6495,
- "pc6": 0.0182,
- "pc7": -0.8011,
- "pc8": -0.0,
- "pc9": 0.0136,
- "pc10": -0.1407,
+ "score": 0.67,
+ "pc1": -0.9948,
+ "pc2": 1.0893,
+ "pc3": -1.0522,
+ "pc4": -3.1828,
+ "pc5": -0.2155,
+ "pc6": -0.5457,
+ "pc7": -0.4374,
+ "pc8": 0.2845,
+ "pc9": -0.1888,
+ "pc10": 1.1111,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm45air_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
"short_id": "b13700b7",
"model": "glm-4.5-air",
- "score": 0.305,
- "pc1": -1.5865,
- "pc2": 1.3243,
- "pc3": -1.0111,
- "pc4": 3.0726,
- "pc5": 0.6495,
- "pc6": 0.0182,
- "pc7": -0.8011,
- "pc8": -0.0,
- "pc9": 0.0136,
- "pc10": -0.1407,
+ "score": 0.735,
+ "pc1": -0.9948,
+ "pc2": 1.0893,
+ "pc3": -1.0522,
+ "pc4": -3.1828,
+ "pc5": -0.2155,
+ "pc6": -0.5457,
+ "pc7": -0.4374,
+ "pc8": 0.2845,
+ "pc9": -0.1888,
+ "pc10": 1.1111,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "8d789027",
"model": "glm-4.7",
- "score": 0.38,
- "pc1": -1.5113,
- "pc2": 1.3501,
- "pc3": -1.3561,
- "pc4": 3.1329,
- "pc5": 0.6573,
- "pc6": -0.734,
- "pc7": -1.2026,
- "pc8": -0.0,
- "pc9": -0.0106,
- "pc10": 0.0509,
+ "score": 0.755,
+ "pc1": -1.0129,
+ "pc2": 1.1367,
+ "pc3": -1.1135,
+ "pc4": -3.087,
+ "pc5": 0.1598,
+ "pc6": -0.4051,
+ "pc7": 0.5089,
+ "pc8": -0.1851,
+ "pc9": -0.1568,
+ "pc10": 1.0727,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "bb561270",
+ "model": "glm-4.7",
+ "score": 0.715,
+ "pc1": -1.0129,
+ "pc2": 1.1367,
+ "pc3": -1.1135,
+ "pc4": -3.087,
+ "pc5": 0.1598,
+ "pc6": -0.4051,
+ "pc7": 0.5089,
+ "pc8": -0.1851,
+ "pc9": -0.1568,
+ "pc10": 1.0727,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm47_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "485c959f",
+ "model": "glm-4.7",
+ "score": 0.92,
+ "pc1": -1.0129,
+ "pc2": 1.1367,
+ "pc3": -1.1135,
+ "pc4": -3.087,
+ "pc5": 0.1598,
+ "pc6": -0.4051,
+ "pc7": 0.5089,
+ "pc8": -0.1851,
+ "pc9": -0.1568,
+ "pc10": 1.0727,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "7fc5f846",
"model": "glm-5.1",
- "score": 0.365,
- "pc1": -1.5366,
- "pc2": 1.43,
- "pc3": -1.3772,
- "pc4": 3.0632,
- "pc5": 0.7926,
- "pc6": 0.083,
- "pc7": -1.0043,
- "pc8": -0.0,
- "pc9": 0.0045,
- "pc10": -0.1476,
+ "score": 0.975,
+ "pc1": -1.1454,
+ "pc2": 1.1361,
+ "pc3": -1.358,
+ "pc4": -3.062,
+ "pc5": 0.1584,
+ "pc6": 0.1051,
+ "pc7": -0.034,
+ "pc8": 0.3216,
+ "pc9": -0.118,
+ "pc10": 1.1199,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
"short_id": "8d7679dc",
"model": "glm-5.1",
- "score": 0.255,
- "pc1": -1.5366,
- "pc2": 1.43,
- "pc3": -1.3772,
- "pc4": 3.0632,
- "pc5": 0.7926,
- "pc6": 0.083,
- "pc7": -1.0043,
- "pc8": -0.0,
- "pc9": 0.0045,
- "pc10": -0.1476,
+ "score": 0.78,
+ "pc1": -1.1454,
+ "pc2": 1.1361,
+ "pc3": -1.358,
+ "pc4": -3.062,
+ "pc5": 0.1584,
+ "pc6": 0.1051,
+ "pc7": -0.034,
+ "pc8": 0.3216,
+ "pc9": -0.118,
+ "pc10": 1.1199,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
"short_id": "8d96f61d",
"model": "glm-5.1",
- "score": 0.255,
- "pc1": -1.5366,
- "pc2": 1.43,
- "pc3": -1.3772,
- "pc4": 3.0632,
- "pc5": 0.7926,
- "pc6": 0.083,
- "pc7": -1.0043,
- "pc8": -0.0,
- "pc9": 0.0045,
- "pc10": -0.1476,
+ "score": 0.705,
+ "pc1": -1.1454,
+ "pc2": 1.1361,
+ "pc3": -1.358,
+ "pc4": -3.062,
+ "pc5": 0.1584,
+ "pc6": 0.1051,
+ "pc7": -0.034,
+ "pc8": 0.3216,
+ "pc9": -0.118,
+ "pc10": 1.1199,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run4",
"short_id": "8bb02c7c",
"model": "haiku-4.5",
- "score": 0.305,
- "pc1": 2.5293,
- "pc2": -1.5381,
- "pc3": 0.4226,
- "pc4": 2.681,
- "pc5": 0.4801,
- "pc6": -0.0024,
- "pc7": -0.342,
- "pc8": -0.0,
- "pc9": -0.01,
- "pc10": 0.6029,
+ "score": 0.72,
+ "pc1": 3.31,
+ "pc2": -1.5221,
+ "pc3": -1.1412,
+ "pc4": -2.8386,
+ "pc5": 0.2687,
+ "pc6": -0.1354,
+ "pc7": -0.0644,
+ "pc8": 0.1594,
+ "pc9": 0.0145,
+ "pc10": 1.1458,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run5",
"short_id": "b1b1424a",
"model": "haiku-4.5",
- "score": 0.225,
- "pc1": 2.5293,
- "pc2": -1.5381,
- "pc3": 0.4226,
- "pc4": 2.681,
- "pc5": 0.4801,
- "pc6": -0.0024,
- "pc7": -0.342,
- "pc8": -0.0,
- "pc9": -0.01,
- "pc10": 0.6029,
+ "score": 0.565,
+ "pc1": 3.31,
+ "pc2": -1.5221,
+ "pc3": -1.1412,
+ "pc4": -2.8386,
+ "pc5": 0.2687,
+ "pc6": -0.1354,
+ "pc7": -0.0644,
+ "pc8": 0.1594,
+ "pc9": 0.0145,
+ "pc10": 1.1458,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run6",
"short_id": "d9899ed8",
"model": "haiku-4.5",
- "score": 0.7,
- "pc1": 2.5293,
- "pc2": -1.5381,
- "pc3": 0.4226,
- "pc4": 2.681,
- "pc5": 0.4801,
- "pc6": -0.0024,
- "pc7": -0.342,
- "pc8": -0.0,
- "pc9": -0.01,
- "pc10": 0.6029,
+ "score": 0.75,
+ "pc1": 3.31,
+ "pc2": -1.5221,
+ "pc3": -1.1412,
+ "pc4": -2.8386,
+ "pc5": 0.2687,
+ "pc6": -0.1354,
+ "pc7": -0.0644,
+ "pc8": 0.1594,
+ "pc9": 0.0145,
+ "pc10": 1.1458,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run4",
"short_id": "19d7fd45",
"model": "opus-4.6",
- "score": 0.39,
- "pc1": 2.4222,
- "pc2": -2.1592,
- "pc3": 0.1439,
- "pc4": 2.4418,
- "pc5": 0.4395,
- "pc6": -0.0803,
- "pc7": -0.5855,
- "pc8": -0.0,
- "pc9": -0.0119,
- "pc10": 0.478,
+ "score": 0.835,
+ "pc1": 3.1359,
+ "pc2": -2.2593,
+ "pc3": -1.2118,
+ "pc4": -2.5317,
+ "pc5": 0.3459,
+ "pc6": -0.0705,
+ "pc7": -0.2633,
+ "pc8": 0.2212,
+ "pc9": -0.0456,
+ "pc10": 1.2371,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run5",
"short_id": "e10bfa92",
"model": "opus-4.6",
- "score": 0.825,
- "pc1": 2.4222,
- "pc2": -2.1592,
- "pc3": 0.1439,
- "pc4": 2.4418,
- "pc5": 0.4395,
- "pc6": -0.0803,
- "pc7": -0.5855,
- "pc8": -0.0,
- "pc9": -0.0119,
- "pc10": 0.478,
+ "score": 0.865,
+ "pc1": 3.1359,
+ "pc2": -2.2593,
+ "pc3": -1.2118,
+ "pc4": -2.5317,
+ "pc5": 0.3459,
+ "pc6": -0.0705,
+ "pc7": -0.2633,
+ "pc8": 0.2212,
+ "pc9": -0.0456,
+ "pc10": 1.2371,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run6",
"short_id": "b060d46a",
"model": "opus-4.6",
- "score": 0.765,
- "pc1": 2.4222,
- "pc2": -2.1592,
- "pc3": 0.1439,
- "pc4": 2.4418,
- "pc5": 0.4395,
- "pc6": -0.0803,
- "pc7": -0.5855,
- "pc8": -0.0,
- "pc9": -0.0119,
- "pc10": 0.478,
+ "score": 0.97,
+ "pc1": 3.1359,
+ "pc2": -2.2593,
+ "pc3": -1.2118,
+ "pc4": -2.5317,
+ "pc5": 0.3459,
+ "pc6": -0.0705,
+ "pc7": -0.2633,
+ "pc8": 0.2212,
+ "pc9": -0.0456,
+ "pc10": 1.2371,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
"run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=qwen36p_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "cc48cc6a",
"model": "qwen-3.6-plus",
- "score": 0.3,
- "pc1": -1.5114,
- "pc2": 0.9849,
- "pc3": 2.5885,
- "pc4": 2.6289,
- "pc5": 0.0749,
- "pc6": -0.7239,
- "pc7": -1.1328,
- "pc8": -0.0,
- "pc9": -0.0491,
- "pc10": 0.1251,
+ "score": 0.665,
+ "pc1": -0.5514,
+ "pc2": 0.661,
+ "pc3": 2.5121,
+ "pc4": -3.966,
+ "pc5": -1.1245,
+ "pc6": 0.3772,
+ "pc7": 0.2481,
+ "pc8": -0.1522,
+ "pc9": -0.0347,
+ "pc10": 1.2411,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
- "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run4",
"short_id": "7d8d44d6",
"model": "sonnet-4.6",
- "score": 0.28,
- "pc1": 2.4127,
- "pc2": -2.1534,
- "pc3": 0.1461,
- "pc4": 2.442,
- "pc5": 0.4416,
- "pc6": -0.0786,
- "pc7": -0.5819,
- "pc8": -0.0,
- "pc9": -0.0119,
- "pc10": 0.4793,
+ "score": 0.835,
+ "pc1": 3.1279,
+ "pc2": -2.2512,
+ "pc3": -1.2078,
+ "pc4": -2.5117,
+ "pc5": 0.3083,
+ "pc6": -0.0067,
+ "pc7": -0.1821,
+ "pc8": 0.0842,
+ "pc9": 0.1001,
+ "pc10": 1.2826,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run5",
"short_id": "837ded2f",
"model": "sonnet-4.6",
- "score": 0.43,
- "pc1": 2.4127,
- "pc2": -2.1534,
- "pc3": 0.1461,
- "pc4": 2.442,
- "pc5": 0.4416,
- "pc6": -0.0786,
- "pc7": -0.5819,
- "pc8": -0.0,
- "pc9": -0.0119,
- "pc10": 0.4793,
+ "score": 0.97,
+ "pc1": 3.1279,
+ "pc2": -2.2512,
+ "pc3": -1.2078,
+ "pc4": -2.5117,
+ "pc5": 0.3083,
+ "pc6": -0.0067,
+ "pc7": -0.1821,
+ "pc8": 0.0842,
+ "pc9": 0.1001,
+ "pc10": 1.2826,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=sonnet46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run6",
"short_id": "f9d8871e",
"model": "sonnet-4.6",
- "score": 0.315,
- "pc1": 2.4127,
- "pc2": -2.1534,
- "pc3": 0.1461,
- "pc4": 2.442,
- "pc5": 0.4416,
- "pc6": -0.0786,
- "pc7": -0.5819,
- "pc8": -0.0,
- "pc9": -0.0119,
- "pc10": 0.4793,
+ "score": 0.655,
+ "pc1": 3.1279,
+ "pc2": -2.2512,
+ "pc3": -1.2078,
+ "pc4": -2.5117,
+ "pc5": 0.3083,
+ "pc6": -0.0067,
+ "pc7": -0.1821,
+ "pc8": 0.0842,
+ "pc9": 0.1001,
+ "pc10": 1.2826,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=off_budget=low_model=haiku45_pw=avail_prompt=detailed_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=off_tread=off_twrite=off_web=off_run1",
+ "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=off_budget=low_model=haiku45_pw=avail_prompt=detailed_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=off_tread=off_twrite=off_web=off_run4",
"short_id": "195c0c1f",
"model": "haiku-4.5",
"score": 0.65,
- "pc1": 9.4117,
- "pc2": 7.4615,
- "pc3": -0.4325,
- "pc4": 0.3446,
- "pc5": -3.3606,
- "pc6": -0.6183,
- "pc7": -1.7293,
- "pc8": -0.0,
- "pc9": -0.0678,
- "pc10": 1.843,
+ "pc1": 10.5296,
+ "pc2": 8.5596,
+ "pc3": -1.7326,
+ "pc4": 0.8554,
+ "pc5": -2.9738,
+ "pc6": 0.0357,
+ "pc7": 0.4806,
+ "pc8": 0.3363,
+ "pc9": -0.6803,
+ "pc10": 3.5158,
"config_summary": "effort=high, prompt_style=detailed, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=off_budget=low_model=haiku45_pw=avail_prompt=detailed_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=off_tread=off_twrite=off_web=off_run2",
+ "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=off_budget=low_model=haiku45_pw=avail_prompt=detailed_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=off_tread=off_twrite=off_web=off_run5",
"short_id": "18bcc1ad",
"model": "haiku-4.5",
- "score": 0.47,
- "pc1": 9.4117,
- "pc2": 7.4615,
- "pc3": -0.4325,
- "pc4": 0.3446,
- "pc5": -3.3606,
- "pc6": -0.6183,
- "pc7": -1.7293,
- "pc8": -0.0,
- "pc9": -0.0678,
- "pc10": 1.843,
+ "score": 0.95,
+ "pc1": 10.5296,
+ "pc2": 8.5596,
+ "pc3": -1.7326,
+ "pc4": 0.8554,
+ "pc5": -2.9738,
+ "pc6": 0.0357,
+ "pc7": 0.4806,
+ "pc8": 0.3363,
+ "pc9": -0.6803,
+ "pc10": 3.5158,
"config_summary": "effort=high, prompt_style=detailed, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=off_budget=low_model=haiku45_pw=avail_prompt=detailed_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=off_tread=off_twrite=off_web=off_run3",
+ "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=off_budget=low_model=haiku45_pw=avail_prompt=detailed_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=off_tread=off_twrite=off_web=off_run6",
"short_id": "93e8feea",
"model": "haiku-4.5",
- "score": 0.405,
- "pc1": 9.4117,
- "pc2": 7.4615,
- "pc3": -0.4325,
- "pc4": 0.3446,
- "pc5": -3.3606,
- "pc6": -0.6183,
- "pc7": -1.7293,
- "pc8": -0.0,
- "pc9": -0.0678,
- "pc10": 1.843,
+ "score": 0.835,
+ "pc1": 10.5296,
+ "pc2": 8.5596,
+ "pc3": -1.7326,
+ "pc4": 0.8554,
+ "pc5": -2.9738,
+ "pc6": 0.0357,
+ "pc7": 0.4806,
+ "pc8": 0.3363,
+ "pc9": -0.6803,
+ "pc10": 3.5158,
"config_summary": "effort=high, prompt_style=detailed, language=typescript, max_budget=low, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=high_model=haiku45_pw=off_prompt=simple_rndr=none_strat=usub_tst=none_tedit=off_tglob=on_tgrep=on_tread=on_twrite=off_web=off_run1",
+ "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=high_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=off_tglob=on_tgrep=on_tread=on_twrite=off_web=off_run4",
"short_id": "67825cfa",
"model": "haiku-4.5",
- "score": 0.65,
- "pc1": 6.0953,
- "pc2": 4.5966,
- "pc3": 0.864,
- "pc4": 8.5591,
- "pc5": -1.6507,
- "pc6": -0.0498,
- "pc7": 0.8766,
- "pc8": 0.0,
- "pc9": 0.0723,
- "pc10": -2.6621,
+ "score": 0.645,
+ "pc1": 7.1991,
+ "pc2": 5.1848,
+ "pc3": -2.9218,
+ "pc4": -8.3626,
+ "pc5": -3.3377,
+ "pc6": -0.0538,
+ "pc7": 1.54,
+ "pc8": -0.9638,
+ "pc9": -0.1758,
+ "pc10": -2.3854,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=high, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=high_model=haiku45_pw=off_prompt=simple_rndr=none_strat=usub_tst=none_tedit=off_tglob=on_tgrep=on_tread=on_twrite=off_web=off_run2",
+ "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=high_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=off_tglob=on_tgrep=on_tread=on_twrite=off_web=off_run5",
"short_id": "ccc32a02",
"model": "haiku-4.5",
- "score": 0.155,
- "pc1": 6.0953,
- "pc2": 4.5966,
- "pc3": 0.864,
- "pc4": 8.5591,
- "pc5": -1.6507,
- "pc6": -0.0498,
- "pc7": 0.8766,
- "pc8": 0.0,
- "pc9": 0.0723,
- "pc10": -2.6621,
+ "score": 0.765,
+ "pc1": 7.1991,
+ "pc2": 5.1848,
+ "pc3": -2.9218,
+ "pc4": -8.3626,
+ "pc5": -3.3377,
+ "pc6": -0.0538,
+ "pc7": 1.54,
+ "pc8": -0.9638,
+ "pc9": -0.1758,
+ "pc10": -2.3854,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=high, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=high_model=haiku45_pw=off_prompt=simple_rndr=none_strat=usub_tst=none_tedit=off_tglob=on_tgrep=on_tread=on_twrite=off_web=off_run3",
+ "run_id": "tetris_arch=none_ctx=provided_noise=clean_dsgn=none_eff=high_echk=none_hlang=es_lang=ts_lint=on_budget=high_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=off_tglob=on_tgrep=on_tread=on_twrite=off_web=off_run6",
"short_id": "edcf7c7c",
"model": "haiku-4.5",
- "score": 0.155,
- "pc1": 6.0953,
- "pc2": 4.5966,
- "pc3": 0.864,
- "pc4": 8.5591,
- "pc5": -1.6507,
- "pc6": -0.0498,
- "pc7": 0.8766,
- "pc8": 0.0,
- "pc9": 0.0723,
- "pc10": -2.6621,
+ "score": 0.885,
+ "pc1": 7.1991,
+ "pc2": 5.1848,
+ "pc3": -2.9218,
+ "pc4": -8.3626,
+ "pc5": -3.3377,
+ "pc6": -0.0538,
+ "pc7": 1.54,
+ "pc8": -0.9638,
+ "pc9": -0.1758,
+ "pc10": -2.3854,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=high, strategy=use_subagents"
},
{
- "run_id": "tetris_arch=sep_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "b75222f6",
- "model": "gemma-4-26b",
- "score": 0.325,
- "pc1": -3.4972,
- "pc2": 0.5282,
- "pc3": 5.187,
- "pc4": -0.4356,
- "pc5": -0.9644,
- "pc6": -1.0677,
- "pc7": -0.5496,
- "pc8": -7.0631,
- "pc9": 3.1667,
- "pc10": -0.0884,
- "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
- },
- {
"run_id": "tetris_arch=sep_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm45air_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "ec92f0b3",
"model": "glm-4.5-air",
- "score": 0.33,
- "pc1": -3.5341,
- "pc2": 0.8692,
- "pc3": 1.6114,
- "pc4": -0.0156,
- "pc5": -0.4642,
- "pc6": -0.8311,
- "pc7": -0.7712,
- "pc8": -7.0631,
- "pc9": 3.2335,
- "pc10": -0.8288,
- "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
- },
- {
- "run_id": "tetris_arch=sep_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=haiku45_pw=off_prompt=simple_prov=anth_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
- "short_id": "549e7976",
- "model": "haiku-4.5",
- "score": 0.325,
- "pc1": -1.5901,
- "pc2": 0.0243,
- "pc3": 3.1206,
- "pc4": -0.2767,
- "pc5": -0.4836,
- "pc6": -0.8809,
- "pc7": -0.2981,
- "pc8": -7.0631,
- "pc9": 3.2124,
- "pc10": -0.2586,
+ "score": 0.66,
+ "pc1": -2.9399,
+ "pc2": 0.6057,
+ "pc3": -0.5649,
+ "pc4": -0.3143,
+ "pc5": -1.5399,
+ "pc6": 0.3819,
+ "pc7": -5.3219,
+ "pc8": 1.6749,
+ "pc9": -7.3416,
+ "pc10": 0.7491,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=sep_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
+ "short_id": "100a4faf",
+ "model": "glm-5.1",
+ "score": 0.81,
+ "pc1": -3.0905,
+ "pc2": 0.6525,
+ "pc3": -0.8706,
+ "pc4": -0.1935,
+ "pc5": -1.166,
+ "pc6": 1.0326,
+ "pc7": -4.9186,
+ "pc8": 1.7119,
+ "pc9": -7.2708,
+ "pc10": 0.7579,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=sep_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run2",
+ "short_id": "2ef3a411",
+ "model": "glm-5.1",
+ "score": 0.5,
+ "pc1": -3.0905,
+ "pc2": 0.6525,
+ "pc3": -0.8706,
+ "pc4": -0.1935,
+ "pc5": -1.166,
+ "pc6": 1.0326,
+ "pc7": -4.9186,
+ "pc8": 1.7119,
+ "pc9": -7.2708,
+ "pc10": 0.7579,
+ "config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
+ },
+ {
+ "run_id": "tetris_arch=sep_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=glm51_pw=off_prompt=simple_prov=zai_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run3",
+ "short_id": "7ed01455",
+ "model": "glm-5.1",
+ "score": 0.43,
+ "pc1": -3.0905,
+ "pc2": 0.6525,
+ "pc3": -0.8706,
+ "pc4": -0.1935,
+ "pc5": -1.166,
+ "pc6": 1.0326,
+ "pc7": -4.9186,
+ "pc8": 1.7119,
+ "pc9": -7.2708,
+ "pc10": 0.7579,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
},
{
"run_id": "tetris_arch=sep_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=on_budget=low_model=qwen36p_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
"short_id": "eade1121",
"model": "qwen-3.6-plus",
- "score": 0.58,
- "pc1": -3.4591,
- "pc2": 0.5298,
- "pc3": 5.211,
- "pc4": -0.4593,
- "pc5": -1.0387,
- "pc6": -1.5732,
- "pc7": -1.103,
- "pc8": -7.0631,
- "pc9": 3.1709,
- "pc10": -0.563,
+ "score": 0.79,
+ "pc1": -2.4965,
+ "pc2": 0.1774,
+ "pc3": 2.9994,
+ "pc4": -1.0975,
+ "pc5": -2.4488,
+ "pc6": 1.3047,
+ "pc7": -4.6365,
+ "pc8": 1.2382,
+ "pc9": -7.1874,
+ "pc10": 0.8791,
"config_summary": "effort=high, prompt_style=simple, language=typescript, max_budget=low"
}
],
@@ -6765,1166 +8765,1334 @@
{
"feature": "model_gemma-4-26b",
"axis": "model",
- "pc1": -0.1133,
- "pc2": 0.0317,
- "pc3": 0.3095,
- "pc4": -0.0199,
- "pc5": -0.048,
- "pc6": 0.0271,
- "pc7": 0.0555,
- "pc8": -0.0,
- "pc9": -0.0057,
- "pc10": 0.0845
+ "pc1": -0.0426,
+ "pc2": 0.0172,
+ "pc3": 0.397,
+ "pc4": -0.0709,
+ "pc5": -0.0505,
+ "pc6": 0.0128,
+ "pc7": 0.115,
+ "pc8": -0.0465,
+ "pc9": -0.0574,
+ "pc10": -0.0266
},
{
"feature": "model_glm-4.5-air",
"axis": "model",
- "pc1": -0.1226,
- "pc2": 0.0681,
- "pc3": -0.1217,
- "pc4": 0.0325,
- "pc5": 0.0022,
- "pc6": 0.0501,
- "pc7": 0.0207,
- "pc8": 0.0,
- "pc9": 0.0051,
- "pc10": -0.0528
+ "pc1": -0.0743,
+ "pc2": 0.0449,
+ "pc3": -0.0507,
+ "pc4": -0.0089,
+ "pc5": -0.0736,
+ "pc6": -0.1118,
+ "pc7": -0.1512,
+ "pc8": 0.0343,
+ "pc9": -0.0071,
+ "pc10": -0.0023
},
{
"feature": "model_glm-4.7",
"axis": "model",
- "pc1": -0.0838,
- "pc2": 0.064,
- "pc3": -0.1912,
- "pc4": 0.0428,
- "pc5": 0.0039,
- "pc6": -0.1513,
- "pc7": -0.0859,
- "pc8": -0.0,
- "pc9": -0.0019,
- "pc10": 0.0049
+ "pc1": -0.1062,
+ "pc2": 0.0745,
+ "pc3": -0.0974,
+ "pc4": 0.0184,
+ "pc5": 0.0432,
+ "pc6": -0.0856,
+ "pc7": 0.1505,
+ "pc8": -0.1154,
+ "pc9": -0.0072,
+ "pc10": -0.0025
},
{
"feature": "model_glm-5.1",
"axis": "model",
- "pc1": -0.1237,
- "pc2": 0.1157,
- "pc3": -0.2692,
- "pc4": 0.0341,
- "pc5": 0.053,
- "pc6": 0.0806,
- "pc7": -0.0478,
- "pc8": -0.0,
- "pc9": 0.0027,
- "pc10": -0.0632
+ "pc1": -0.1809,
+ "pc2": 0.0882,
+ "pc3": -0.2168,
+ "pc4": 0.0251,
+ "pc5": 0.0599,
+ "pc6": 0.1092,
+ "pc7": -0.0633,
+ "pc8": 0.0986,
+ "pc9": 0.0112,
+ "pc10": 0.0167
},
{
"feature": "model_haiku-4.5",
"axis": "model",
- "pc1": 0.1908,
- "pc2": 0.0503,
- "pc3": 0.0871,
- "pc4": 0.0354,
- "pc5": 0.0191,
- "pc6": 0.0337,
- "pc7": 0.0998,
- "pc8": 0.0,
- "pc9": 0.0011,
- "pc10": 0.0556
+ "pc1": 0.2215,
+ "pc2": 0.0613,
+ "pc3": -0.0257,
+ "pc4": -0.038,
+ "pc5": 0.0179,
+ "pc6": -0.0147,
+ "pc7": 0.0071,
+ "pc8": 0.012,
+ "pc9": 0.0087,
+ "pc10": -0.0212
+ },
+ {
+ "feature": "model_kimi-k2.5",
+ "axis": "model",
+ "pc1": -0.0188,
+ "pc2": -0.0022,
+ "pc3": 0.0852,
+ "pc4": -0.0216,
+ "pc5": -0.0338,
+ "pc6": 0.0,
+ "pc7": 0.0257,
+ "pc8": -0.0237,
+ "pc9": -0.0048,
+ "pc10": -0.0282
+ },
+ {
+ "feature": "model_minimax-m2.7",
+ "axis": "model",
+ "pc1": -0.0188,
+ "pc2": -0.0024,
+ "pc3": 0.0888,
+ "pc4": -0.0214,
+ "pc5": -0.0205,
+ "pc6": 0.0069,
+ "pc7": 0.0134,
+ "pc8": -0.0206,
+ "pc9": -0.0164,
+ "pc10": -0.0035
},
{
"feature": "model_opus-4.6",
"axis": "model",
- "pc1": 0.1116,
- "pc2": -0.1715,
- "pc3": -0.0269,
- "pc4": -0.0536,
- "pc5": 0.0011,
- "pc6": -0.0003,
- "pc7": -0.0051,
- "pc8": 0.0,
- "pc9": 0.0002,
- "pc10": 0.0008
+ "pc1": 0.1238,
+ "pc2": -0.1728,
+ "pc3": -0.0404,
+ "pc4": 0.0657,
+ "pc5": 0.0358,
+ "pc6": -0.0005,
+ "pc7": -0.0377,
+ "pc8": 0.0176,
+ "pc9": -0.0001,
+ "pc10": 0.0092
},
{
"feature": "model_qwen-3.6-plus",
"axis": "model",
- "pc1": -0.0953,
- "pc2": 0.0298,
- "pc3": 0.2932,
- "pc4": -0.0246,
- "pc5": -0.0637,
- "pc6": -0.1049,
- "pc7": -0.0908,
- "pc8": -0.0,
- "pc9": -0.0042,
- "pc10": -0.0438
+ "pc1": -0.0381,
+ "pc2": -0.0001,
+ "pc3": 0.2581,
+ "pc4": -0.0909,
+ "pc5": -0.148,
+ "pc6": 0.0672,
+ "pc7": -0.0274,
+ "pc8": -0.0065,
+ "pc9": 0.0325,
+ "pc10": 0.0219
},
{
"feature": "model_sonnet-4.6",
"axis": "model",
- "pc1": 0.1093,
- "pc2": -0.1709,
- "pc3": -0.0264,
- "pc4": -0.0539,
- "pc5": 0.0018,
- "pc6": 0.0003,
- "pc7": -0.0039,
- "pc8": -0.0,
- "pc9": 0.0002,
- "pc10": 0.0012
+ "pc1": 0.1222,
+ "pc2": -0.1723,
+ "pc3": -0.0391,
+ "pc4": 0.0686,
+ "pc5": 0.0302,
+ "pc6": 0.0097,
+ "pc7": -0.0246,
+ "pc8": -0.005,
+ "pc9": 0.0244,
+ "pc10": 0.0167
},
{
"feature": "effort_high",
"axis": "effort",
- "pc1": 0.0063,
- "pc2": 0.0971,
- "pc3": 0.0245,
- "pc4": 0.0799,
- "pc5": -0.0152,
- "pc6": -0.386,
- "pc7": 0.3958,
- "pc8": 0.0,
- "pc9": -0.0033,
- "pc10": 0.2083
+ "pc1": 0.0013,
+ "pc2": 0.1002,
+ "pc3": -0.0513,
+ "pc4": -0.0539,
+ "pc5": -0.0512,
+ "pc6": -0.3167,
+ "pc7": 0.188,
+ "pc8": 0.3588,
+ "pc9": 0.0227,
+ "pc10": -0.0088
},
{
"feature": "effort_max",
"axis": "effort",
- "pc1": -0.0063,
- "pc2": -0.0971,
- "pc3": -0.0245,
- "pc4": -0.0799,
- "pc5": 0.0152,
- "pc6": 0.386,
- "pc7": -0.3958,
- "pc8": -0.0,
- "pc9": 0.0033,
- "pc10": -0.2083
+ "pc1": -0.0013,
+ "pc2": -0.1002,
+ "pc3": 0.0513,
+ "pc4": 0.0539,
+ "pc5": 0.0512,
+ "pc6": 0.3167,
+ "pc7": -0.188,
+ "pc8": -0.3588,
+ "pc9": -0.0227,
+ "pc10": 0.0088
},
{
"feature": "prompt_style_detailed",
"axis": "prompt_style",
- "pc1": 0.1079,
- "pc2": 0.1406,
- "pc3": -0.0827,
- "pc4": -0.1748,
- "pc5": -0.3615,
- "pc6": -0.0085,
- "pc7": -0.0295,
- "pc8": -0.0,
- "pc9": -0.0047,
- "pc10": 0.1479
+ "pc1": 0.1121,
+ "pc2": 0.1459,
+ "pc3": -0.0809,
+ "pc4": 0.2672,
+ "pc5": -0.2802,
+ "pc6": 0.0146,
+ "pc7": 0.0675,
+ "pc8": -0.0136,
+ "pc9": -0.0302,
+ "pc10": 0.0717
},
{
"feature": "prompt_style_simple",
"axis": "prompt_style",
- "pc1": -0.1079,
- "pc2": -0.1406,
- "pc3": 0.0827,
- "pc4": 0.1748,
- "pc5": 0.3615,
- "pc6": 0.0085,
- "pc7": 0.0295,
- "pc8": 0.0,
- "pc9": 0.0047,
- "pc10": -0.1479
+ "pc1": -0.1121,
+ "pc2": -0.1459,
+ "pc3": 0.0809,
+ "pc4": -0.2672,
+ "pc5": 0.2802,
+ "pc6": -0.0146,
+ "pc7": -0.0675,
+ "pc8": 0.0136,
+ "pc9": 0.0302,
+ "pc10": -0.0717
},
{
"feature": "language_javascript",
"axis": "language",
- "pc1": -0.0237,
- "pc2": -0.0829,
- "pc3": -0.1091,
- "pc4": -0.0589,
- "pc5": 0.0662,
- "pc6": -0.2734,
- "pc7": 0.097,
- "pc8": -0.0,
- "pc9": -0.0003,
- "pc10": -0.0271
+ "pc1": -0.0052,
+ "pc2": -0.0979,
+ "pc3": 0.0942,
+ "pc4": 0.0565,
+ "pc5": -0.0075,
+ "pc6": -0.2044,
+ "pc7": 0.1595,
+ "pc8": 0.1631,
+ "pc9": -0.02,
+ "pc10": 0.0254
},
{
"feature": "language_typescript",
"axis": "language",
- "pc1": 0.0449,
- "pc2": 0.1114,
- "pc3": 0.1754,
- "pc4": 0.0821,
- "pc5": -0.0997,
- "pc6": 0.4074,
- "pc7": -0.1348,
- "pc8": 0.0,
- "pc9": 0.0003,
- "pc10": 0.049
+ "pc1": 0.0109,
+ "pc2": 0.1364,
+ "pc3": -0.1234,
+ "pc4": -0.0761,
+ "pc5": 0.0064,
+ "pc6": 0.2872,
+ "pc7": -0.2122,
+ "pc8": -0.248,
+ "pc9": 0.0248,
+ "pc10": -0.0487
},
{
"feature": "language_unspecified",
"axis": "language",
- "pc1": -0.0381,
- "pc2": -0.0708,
- "pc3": -0.1325,
- "pc4": -0.0543,
- "pc5": 0.0712,
- "pc6": -0.2882,
- "pc7": 0.089,
- "pc8": -0.0,
- "pc9": -0.0,
- "pc10": -0.0402
+ "pc1": -0.0099,
+ "pc2": -0.0908,
+ "pc3": 0.0764,
+ "pc4": 0.0488,
+ "pc5": -0.0014,
+ "pc6": -0.1931,
+ "pc7": 0.1339,
+ "pc8": 0.1804,
+ "pc9": -0.0142,
+ "pc10": 0.0423
},
{
"feature": "human_language_en",
"axis": "human_language",
- "pc1": -0.1045,
- "pc2": -0.11,
- "pc3": 0.0384,
- "pc4": -0.1483,
- "pc5": 0.3033,
- "pc6": -0.0345,
- "pc7": -0.1638,
- "pc8": -0.0,
- "pc9": -0.0101,
- "pc10": 0.3149
+ "pc1": -0.1146,
+ "pc2": -0.1134,
+ "pc3": 0.1152,
+ "pc4": 0.0583,
+ "pc5": 0.2954,
+ "pc6": -0.0182,
+ "pc7": -0.0435,
+ "pc8": 0.0409,
+ "pc9": -0.0283,
+ "pc10": 0.2968
},
{
"feature": "human_language_es",
"axis": "human_language",
- "pc1": 0.1045,
- "pc2": 0.11,
- "pc3": -0.0384,
- "pc4": 0.1483,
- "pc5": -0.3033,
- "pc6": 0.0345,
- "pc7": 0.1638,
- "pc8": 0.0,
- "pc9": 0.0101,
- "pc10": -0.3149
+ "pc1": 0.1146,
+ "pc2": 0.1134,
+ "pc3": -0.1152,
+ "pc4": -0.0583,
+ "pc5": -0.2954,
+ "pc6": 0.0182,
+ "pc7": 0.0435,
+ "pc8": -0.0409,
+ "pc9": 0.0283,
+ "pc10": -0.2968
},
{
"feature": "tool_read_off",
"axis": "tool_read",
- "pc1": 0.1508,
- "pc2": 0.1707,
- "pc3": 0.0235,
- "pc4": -0.1831,
- "pc5": -0.1054,
- "pc6": 0.0209,
- "pc7": 0.0829,
- "pc8": 0.0,
- "pc9": 0.0005,
- "pc10": -0.0112
+ "pc1": 0.1319,
+ "pc2": 0.1774,
+ "pc3": 0.0365,
+ "pc4": 0.1892,
+ "pc5": -0.0493,
+ "pc6": 0.0454,
+ "pc7": -0.0064,
+ "pc8": 0.0271,
+ "pc9": 0.0141,
+ "pc10": -0.0787
},
{
"feature": "tool_read_on",
"axis": "tool_read",
- "pc1": -0.1508,
- "pc2": -0.1707,
- "pc3": -0.0235,
- "pc4": 0.1831,
- "pc5": 0.1054,
- "pc6": -0.0209,
- "pc7": -0.0829,
- "pc8": -0.0,
- "pc9": -0.0005,
- "pc10": 0.0112
+ "pc1": -0.1319,
+ "pc2": -0.1774,
+ "pc3": -0.0365,
+ "pc4": -0.1892,
+ "pc5": 0.0493,
+ "pc6": -0.0454,
+ "pc7": 0.0064,
+ "pc8": -0.0271,
+ "pc9": -0.0141,
+ "pc10": 0.0787
},
{
"feature": "tool_write_off",
"axis": "tool_write",
- "pc1": 0.1473,
- "pc2": 0.1749,
- "pc3": 0.0487,
- "pc4": 0.1499,
- "pc5": 0.199,
- "pc6": -0.0195,
- "pc7": -0.0582,
- "pc8": -0.0,
- "pc9": 0.0012,
- "pc10": -0.0589
+ "pc1": 0.1362,
+ "pc2": 0.1811,
+ "pc3": 0.0097,
+ "pc4": -0.1903,
+ "pc5": 0.1378,
+ "pc6": -0.0387,
+ "pc7": 0.006,
+ "pc8": 0.0051,
+ "pc9": -0.0239,
+ "pc10": 0.0672
},
{
"feature": "tool_write_on",
"axis": "tool_write",
- "pc1": -0.1473,
- "pc2": -0.1749,
- "pc3": -0.0487,
- "pc4": -0.1499,
- "pc5": -0.199,
- "pc6": 0.0195,
- "pc7": 0.0582,
- "pc8": 0.0,
- "pc9": -0.0012,
- "pc10": 0.0589
+ "pc1": -0.1362,
+ "pc2": -0.1811,
+ "pc3": -0.0097,
+ "pc4": 0.1903,
+ "pc5": -0.1378,
+ "pc6": 0.0387,
+ "pc7": -0.006,
+ "pc8": -0.0051,
+ "pc9": 0.0239,
+ "pc10": -0.0672
},
{
"feature": "tool_edit_off",
"axis": "tool_edit",
- "pc1": 0.1527,
- "pc2": 0.1838,
- "pc3": 0.0679,
- "pc4": 0.0468,
- "pc5": 0.1352,
- "pc6": 0.0205,
- "pc7": 0.1182,
- "pc8": 0.0,
- "pc9": 0.0053,
- "pc10": -0.1735
+ "pc1": 0.1371,
+ "pc2": 0.1884,
+ "pc3": 0.0539,
+ "pc4": -0.1019,
+ "pc5": 0.0958,
+ "pc6": 0.0057,
+ "pc7": -0.0182,
+ "pc8": -0.0458,
+ "pc9": 0.0419,
+ "pc10": -0.2448
},
{
"feature": "tool_edit_on",
"axis": "tool_edit",
- "pc1": -0.1527,
- "pc2": -0.1838,
- "pc3": -0.0679,
- "pc4": -0.0468,
- "pc5": -0.1352,
- "pc6": -0.0205,
- "pc7": -0.1182,
- "pc8": -0.0,
- "pc9": -0.0053,
- "pc10": 0.1735
+ "pc1": -0.1371,
+ "pc2": -0.1884,
+ "pc3": -0.0539,
+ "pc4": 0.1019,
+ "pc5": -0.0958,
+ "pc6": -0.0057,
+ "pc7": 0.0182,
+ "pc8": 0.0458,
+ "pc9": -0.0419,
+ "pc10": 0.2448
},
{
"feature": "tool_glob_off",
"axis": "tool_glob",
- "pc1": 0.1167,
- "pc2": 0.1367,
- "pc3": 0.0707,
- "pc4": -0.1744,
- "pc5": 0.2577,
- "pc6": 0.0522,
- "pc7": 0.1668,
- "pc8": 0.0,
- "pc9": 0.0088,
- "pc10": -0.2563
+ "pc1": 0.0974,
+ "pc2": 0.1379,
+ "pc3": 0.1318,
+ "pc4": 0.0809,
+ "pc5": 0.2741,
+ "pc6": -0.0024,
+ "pc7": -0.0769,
+ "pc8": 0.0208,
+ "pc9": 0.0813,
+ "pc10": -0.3012
},
{
"feature": "tool_glob_on",
"axis": "tool_glob",
- "pc1": -0.1167,
- "pc2": -0.1367,
- "pc3": -0.0707,
- "pc4": 0.1744,
- "pc5": -0.2577,
- "pc6": -0.0522,
- "pc7": -0.1668,
- "pc8": -0.0,
- "pc9": -0.0088,
- "pc10": 0.2563
+ "pc1": -0.0974,
+ "pc2": -0.1379,
+ "pc3": -0.1318,
+ "pc4": -0.0809,
+ "pc5": -0.2741,
+ "pc6": 0.0024,
+ "pc7": 0.0769,
+ "pc8": -0.0208,
+ "pc9": -0.0813,
+ "pc10": 0.3012
},
{
"feature": "tool_grep_off",
"axis": "tool_grep",
- "pc1": 0.1394,
- "pc2": 0.1714,
- "pc3": 0.0357,
- "pc4": -0.0669,
- "pc5": 0.2328,
- "pc6": -0.0416,
- "pc7": -0.1347,
- "pc8": -0.0,
- "pc9": -0.0064,
- "pc10": 0.1852
+ "pc1": 0.1324,
+ "pc2": 0.1768,
+ "pc3": 0.0708,
+ "pc4": 0.002,
+ "pc5": 0.2375,
+ "pc6": -0.0166,
+ "pc7": -0.0801,
+ "pc8": 0.0444,
+ "pc9": -0.0158,
+ "pc10": 0.2046
},
{
"feature": "tool_grep_on",
"axis": "tool_grep",
- "pc1": -0.1394,
- "pc2": -0.1714,
- "pc3": -0.0357,
- "pc4": 0.0669,
- "pc5": -0.2328,
- "pc6": 0.0416,
- "pc7": 0.1347,
- "pc8": 0.0,
- "pc9": 0.0064,
- "pc10": -0.1852
+ "pc1": -0.1324,
+ "pc2": -0.1768,
+ "pc3": -0.0708,
+ "pc4": -0.002,
+ "pc5": -0.2375,
+ "pc6": 0.0166,
+ "pc7": 0.0801,
+ "pc8": -0.0444,
+ "pc9": 0.0158,
+ "pc10": -0.2046
},
{
"feature": "linter_off",
"axis": "linter",
- "pc1": 0.125,
- "pc2": 0.215,
- "pc3": -0.0542,
- "pc4": -0.1348,
- "pc5": 0.0408,
- "pc6": -0.0623,
- "pc7": -0.2115,
- "pc8": -0.0,
- "pc9": -0.0093,
- "pc10": 0.2667
+ "pc1": 0.1215,
+ "pc2": 0.2165,
+ "pc3": 0.0565,
+ "pc4": 0.124,
+ "pc5": 0.0565,
+ "pc6": -0.0045,
+ "pc7": -0.0215,
+ "pc8": 0.0352,
+ "pc9": -0.0403,
+ "pc10": 0.3256
},
{
"feature": "linter_on",
"axis": "linter",
- "pc1": -0.125,
- "pc2": -0.215,
- "pc3": 0.0542,
- "pc4": 0.1348,
- "pc5": -0.0408,
- "pc6": 0.0623,
- "pc7": 0.2115,
- "pc8": 0.0,
- "pc9": 0.0093,
- "pc10": -0.2667
+ "pc1": -0.1215,
+ "pc2": -0.2165,
+ "pc3": -0.0565,
+ "pc4": -0.124,
+ "pc5": -0.0565,
+ "pc6": 0.0045,
+ "pc7": 0.0215,
+ "pc8": -0.0352,
+ "pc9": 0.0403,
+ "pc10": -0.3256
},
{
"feature": "playwright_available",
"axis": "playwright",
- "pc1": 0.2836,
- "pc2": -0.2416,
- "pc3": -0.0259,
- "pc4": -0.054,
- "pc5": 0.0086,
- "pc6": 0.0138,
- "pc7": 0.0162,
- "pc8": 0.0,
- "pc9": 0.0013,
- "pc10": -0.0072
+ "pc1": 0.2853,
+ "pc2": -0.2259,
+ "pc3": -0.0774,
+ "pc4": 0.072,
+ "pc5": 0.0576,
+ "pc6": 0.0032,
+ "pc7": -0.0467,
+ "pc8": 0.0137,
+ "pc9": 0.0244,
+ "pc10": 0.0033
},
{
"feature": "playwright_instructed",
"axis": "playwright",
- "pc1": -0.0415,
- "pc2": 0.002,
- "pc3": 0.0007,
- "pc4": -0.0036,
- "pc5": 0.0011,
- "pc6": -0.0108,
- "pc7": -0.0241,
- "pc8": 0.0,
- "pc9": -0.0006,
- "pc10": -0.0199
+ "pc1": -0.0348,
+ "pc2": -0.0113,
+ "pc3": 0.0624,
+ "pc4": -0.0186,
+ "pc5": -0.0154,
+ "pc6": -0.0075,
+ "pc7": 0.0375,
+ "pc8": 0.0079,
+ "pc9": -0.0243,
+ "pc10": -0.0147
},
{
"feature": "playwright_off",
"axis": "playwright",
- "pc1": -0.273,
- "pc2": 0.2401,
- "pc3": 0.0257,
- "pc4": 0.0546,
- "pc5": -0.0089,
- "pc6": -0.0113,
- "pc7": -0.0107,
- "pc8": -0.0,
- "pc9": -0.0012,
- "pc10": 0.0117
+ "pc1": -0.2701,
+ "pc2": 0.2257,
+ "pc3": 0.0571,
+ "pc4": -0.0652,
+ "pc5": -0.052,
+ "pc6": -0.0008,
+ "pc7": 0.0345,
+ "pc8": -0.0159,
+ "pc9": -0.0166,
+ "pc10": 0.0013
},
{
"feature": "context_file_none",
"axis": "context_file",
- "pc1": -0.1297,
- "pc2": -0.0865,
- "pc3": -0.0288,
- "pc4": -0.372,
- "pc5": -0.0614,
- "pc6": 0.0243,
- "pc7": 0.0914,
- "pc8": 0.0,
- "pc9": 0.0014,
- "pc10": -0.0325
+ "pc1": -0.1276,
+ "pc2": -0.0912,
+ "pc3": 0.0909,
+ "pc4": 0.3681,
+ "pc5": -0.0019,
+ "pc6": 0.0141,
+ "pc7": -0.0121,
+ "pc8": -0.0114,
+ "pc9": 0.015,
+ "pc10": -0.134
},
{
"feature": "context_file_provided",
"axis": "context_file",
- "pc1": 0.1297,
- "pc2": 0.0865,
- "pc3": 0.0288,
- "pc4": 0.372,
- "pc5": 0.0614,
- "pc6": -0.0243,
- "pc7": -0.0914,
- "pc8": -0.0,
- "pc9": -0.0014,
- "pc10": 0.0325
+ "pc1": 0.1276,
+ "pc2": 0.0912,
+ "pc3": -0.0909,
+ "pc4": -0.3681,
+ "pc5": 0.0019,
+ "pc6": -0.0141,
+ "pc7": 0.0121,
+ "pc8": 0.0114,
+ "pc9": -0.015,
+ "pc10": 0.134
},
{
"feature": "web_search_off",
"axis": "web_search",
- "pc1": 0.1418,
- "pc2": 0.2238,
- "pc3": -0.0526,
- "pc4": -0.0511,
- "pc5": -0.2057,
- "pc6": -0.0115,
- "pc7": -0.0187,
- "pc8": -0.0,
- "pc9": 0.0002,
- "pc10": -0.0299
+ "pc1": 0.1334,
+ "pc2": 0.2309,
+ "pc3": -0.0424,
+ "pc4": 0.1218,
+ "pc5": -0.1833,
+ "pc6": -0.0076,
+ "pc7": 0.0585,
+ "pc8": -0.0415,
+ "pc9": -0.0196,
+ "pc10": 0.0375
},
{
"feature": "web_search_on",
"axis": "web_search",
- "pc1": -0.1418,
- "pc2": -0.2238,
- "pc3": 0.0526,
- "pc4": 0.0511,
- "pc5": 0.2057,
- "pc6": 0.0115,
- "pc7": 0.0187,
- "pc8": 0.0,
- "pc9": -0.0002,
- "pc10": 0.0299
+ "pc1": -0.1334,
+ "pc2": -0.2309,
+ "pc3": 0.0424,
+ "pc4": -0.1218,
+ "pc5": 0.1833,
+ "pc6": 0.0076,
+ "pc7": -0.0585,
+ "pc8": 0.0415,
+ "pc9": 0.0196,
+ "pc10": -0.0375
},
{
"feature": "max_budget_high",
"axis": "max_budget",
- "pc1": 0.0755,
- "pc2": 0.0026,
- "pc3": 0.0166,
- "pc4": 0.409,
- "pc5": -0.095,
- "pc6": -0.022,
- "pc7": -0.034,
- "pc8": -0.0,
- "pc9": -0.0048,
- "pc10": 0.126
+ "pc1": 0.0894,
+ "pc2": 0.0001,
+ "pc3": -0.1318,
+ "pc4": -0.3599,
+ "pc5": -0.1306,
+ "pc6": 0.029,
+ "pc7": 0.0728,
+ "pc8": 0.0036,
+ "pc9": -0.0312,
+ "pc10": 0.0121
},
{
"feature": "max_budget_low",
"axis": "max_budget",
- "pc1": -0.0755,
- "pc2": -0.0026,
- "pc3": -0.0166,
- "pc4": -0.409,
- "pc5": 0.095,
- "pc6": 0.022,
- "pc7": 0.034,
- "pc8": 0.0,
- "pc9": 0.0048,
- "pc10": -0.126
+ "pc1": -0.0894,
+ "pc2": -0.0001,
+ "pc3": 0.1318,
+ "pc4": 0.3599,
+ "pc5": 0.1306,
+ "pc6": -0.029,
+ "pc7": -0.0728,
+ "pc8": -0.0036,
+ "pc9": 0.0312,
+ "pc10": -0.0121
},
{
"feature": "strategy_creative_validate",
"axis": "strategy",
- "pc1": -0.0446,
- "pc2": -0.0022,
- "pc3": -0.0069,
- "pc4": 0.0131,
- "pc5": -0.0081,
- "pc6": -0.035,
- "pc7": -0.0355,
- "pc8": 0.0,
- "pc9": -0.0018,
- "pc10": 0.0043
+ "pc1": -0.0273,
+ "pc2": -0.0119,
+ "pc3": 0.0297,
+ "pc4": -0.0228,
+ "pc5": -0.0387,
+ "pc6": 0.0006,
+ "pc7": 0.0215,
+ "pc8": -0.0162,
+ "pc9": -0.0037,
+ "pc10": -0.0275
},
{
"feature": "strategy_delegate",
"axis": "strategy",
- "pc1": -0.03,
- "pc2": -0.0063,
- "pc3": 0.0594,
- "pc4": -0.0002,
- "pc5": -0.0153,
- "pc6": -0.0071,
- "pc7": -0.0062,
- "pc8": -0.0,
- "pc9": -0.0019,
- "pc10": 0.012
+ "pc1": -0.0325,
+ "pc2": -0.0065,
+ "pc3": -0.0106,
+ "pc4": -0.009,
+ "pc5": -0.0196,
+ "pc6": 0.0056,
+ "pc7": 0.031,
+ "pc8": -0.015,
+ "pc9": -0.0132,
+ "pc10": 0.0083
},
{
"feature": "strategy_iterate",
"axis": "strategy",
- "pc1": -0.0403,
- "pc2": -0.0028,
- "pc3": 0.011,
- "pc4": 0.0084,
- "pc5": -0.0078,
- "pc6": -0.0119,
- "pc7": -0.0232,
- "pc8": -0.0,
- "pc9": -0.0015,
- "pc10": 0.0023
+ "pc1": -0.0341,
+ "pc2": -0.013,
+ "pc3": 0.0418,
+ "pc4": -0.0147,
+ "pc5": -0.0371,
+ "pc6": -0.0179,
+ "pc7": 0.0394,
+ "pc8": -0.0243,
+ "pc9": -0.0328,
+ "pc10": -0.0144
},
{
"feature": "strategy_none",
"axis": "strategy",
- "pc1": -0.2321,
- "pc2": 0.2578,
- "pc3": -0.0258,
- "pc4": -0.0254,
- "pc5": 0.0523,
- "pc6": 0.0126,
- "pc7": 0.0267,
- "pc8": 0.0,
- "pc9": 0.0029,
- "pc10": -0.0569
+ "pc1": -0.2215,
+ "pc2": 0.2427,
+ "pc3": 0.0706,
+ "pc4": 0.0046,
+ "pc5": 0.0381,
+ "pc6": -0.0163,
+ "pc7": -0.0064,
+ "pc8": 0.0055,
+ "pc9": 0.0138,
+ "pc10": -0.021
},
{
"feature": "strategy_plan_first",
"axis": "strategy",
- "pc1": -0.0355,
- "pc2": -0.0041,
- "pc3": 0.0325,
- "pc4": 0.0039,
- "pc5": -0.01,
- "pc6": -0.0014,
- "pc7": -0.0133,
- "pc8": -0.0,
- "pc9": -0.0015,
- "pc10": 0.0044
+ "pc1": -0.033,
+ "pc2": -0.0124,
+ "pc3": 0.0173,
+ "pc4": -0.0157,
+ "pc5": -0.0352,
+ "pc6": 0.0142,
+ "pc7": 0.0205,
+ "pc8": -0.0033,
+ "pc9": -0.0114,
+ "pc10": -0.0011
},
{
"feature": "strategy_review",
"axis": "strategy",
- "pc1": -0.0236,
- "pc2": -0.0058,
- "pc3": 0.0267,
- "pc4": 0.003,
- "pc5": -0.0065,
- "pc6": 0.0065,
- "pc7": 0.0063,
- "pc8": 0.0,
- "pc9": -0.0009,
- "pc10": 0.0141
+ "pc1": -0.0273,
+ "pc2": -0.0065,
+ "pc3": 0.0053,
+ "pc4": -0.0105,
+ "pc5": -0.0159,
+ "pc6": 0.0216,
+ "pc7": -0.0038,
+ "pc8": 0.0146,
+ "pc9": -0.0072,
+ "pc10": -0.0233
},
{
"feature": "strategy_split_work",
"axis": "strategy",
- "pc1": -0.03,
- "pc2": -0.0063,
- "pc3": 0.0594,
- "pc4": -0.0002,
- "pc5": -0.0153,
- "pc6": -0.0071,
- "pc7": -0.0062,
- "pc8": 0.0,
- "pc9": -0.0019,
- "pc10": 0.012
+ "pc1": -0.0274,
+ "pc2": -0.0065,
+ "pc3": 0.0073,
+ "pc4": -0.0115,
+ "pc5": -0.0205,
+ "pc6": 0.016,
+ "pc7": -0.0052,
+ "pc8": 0.0072,
+ "pc9": -0.0159,
+ "pc10": -0.0016
},
{
"feature": "strategy_use_subagents",
"axis": "strategy",
- "pc1": 0.2833,
- "pc2": -0.257,
- "pc3": -0.0111,
- "pc4": 0.019,
- "pc5": -0.0395,
- "pc6": 0.0017,
- "pc7": -0.0074,
- "pc8": -0.0,
- "pc9": -0.0008,
- "pc10": 0.0478
+ "pc1": 0.2807,
+ "pc2": -0.2405,
+ "pc3": -0.1005,
+ "pc4": 0.0173,
+ "pc5": 0.0047,
+ "pc6": 0.009,
+ "pc7": -0.0231,
+ "pc8": 0.0062,
+ "pc9": 0.0082,
+ "pc10": 0.0374
},
{
"feature": "design_guidance_none",
"axis": "design_guidance",
- "pc1": 0.0678,
- "pc2": -0.0147,
- "pc3": -0.2017,
- "pc4": 0.0172,
- "pc5": 0.0457,
- "pc6": 0.0735,
- "pc7": 0.0475,
- "pc8": -0.5013,
- "pc9": -0.2278,
- "pc10": 0.0312
+ "pc1": 0.0604,
+ "pc2": -0.0165,
+ "pc3": -0.0404,
+ "pc4": 0.0455,
+ "pc5": 0.1618,
+ "pc6": -0.115,
+ "pc7": 0.2498,
+ "pc8": -0.1135,
+ "pc9": -0.4778,
+ "pc10": -0.1866
},
{
"feature": "design_guidance_specific",
"axis": "design_guidance",
- "pc1": -0.0477,
- "pc2": 0.0103,
- "pc3": 0.1419,
- "pc4": -0.0121,
- "pc5": -0.0321,
- "pc6": -0.0517,
- "pc7": -0.0334,
- "pc8": 0.3526,
- "pc9": 0.1602,
- "pc10": -0.0219
+ "pc1": -0.0425,
+ "pc2": 0.0119,
+ "pc3": 0.0267,
+ "pc4": -0.0335,
+ "pc5": -0.1131,
+ "pc6": 0.0743,
+ "pc7": -0.1705,
+ "pc8": 0.0702,
+ "pc9": 0.3413,
+ "pc10": 0.1245
},
{
"feature": "design_guidance_vague",
"axis": "design_guidance",
- "pc1": -0.0477,
- "pc2": 0.0103,
- "pc3": 0.1419,
- "pc4": -0.0121,
- "pc5": -0.0321,
- "pc6": -0.0517,
- "pc7": -0.0334,
- "pc8": 0.3526,
- "pc9": 0.1602,
- "pc10": -0.0219
+ "pc1": -0.0425,
+ "pc2": 0.0113,
+ "pc3": 0.0301,
+ "pc4": -0.0305,
+ "pc5": -0.1146,
+ "pc6": 0.0876,
+ "pc7": -0.1811,
+ "pc8": 0.0895,
+ "pc9": 0.331,
+ "pc10": 0.138
},
{
"feature": "architecture_best_practices",
"axis": "architecture",
- "pc1": -0.0477,
- "pc2": 0.0103,
- "pc3": 0.1419,
- "pc4": -0.0121,
- "pc5": -0.0321,
- "pc6": -0.0517,
- "pc7": -0.0334,
- "pc8": -0.3526,
- "pc9": 0.1602,
- "pc10": -0.0219
+ "pc1": -0.0398,
+ "pc2": 0.0132,
+ "pc3": -0.0286,
+ "pc4": -0.0023,
+ "pc5": -0.0413,
+ "pc6": 0.0189,
+ "pc7": -0.2321,
+ "pc8": 0.0759,
+ "pc9": -0.333,
+ "pc10": -0.0135
},
{
"feature": "architecture_none",
"axis": "architecture",
- "pc1": 0.0678,
- "pc2": -0.0147,
- "pc3": -0.2017,
- "pc4": 0.0172,
- "pc5": 0.0457,
- "pc6": 0.0735,
- "pc7": 0.0475,
- "pc8": 0.5013,
- "pc9": -0.2278,
- "pc10": 0.0312
+ "pc1": 0.0585,
+ "pc2": -0.0181,
+ "pc3": 0.0201,
+ "pc4": 0.0138,
+ "pc5": 0.0772,
+ "pc6": -0.0466,
+ "pc7": 0.3313,
+ "pc8": -0.109,
+ "pc9": 0.4907,
+ "pc10": -0.0201
},
{
"feature": "architecture_separation",
"axis": "architecture",
- "pc1": -0.0477,
- "pc2": 0.0103,
- "pc3": 0.1419,
- "pc4": -0.0121,
- "pc5": -0.0321,
- "pc6": -0.0517,
- "pc7": -0.0334,
- "pc8": -0.3526,
- "pc9": 0.1602,
- "pc10": -0.0219
+ "pc1": -0.0426,
+ "pc2": 0.0123,
+ "pc3": -0.0013,
+ "pc4": -0.0164,
+ "pc5": -0.0661,
+ "pc6": 0.0453,
+ "pc7": -0.2348,
+ "pc8": 0.0777,
+ "pc9": -0.3575,
+ "pc10": 0.039
},
{
"feature": "error_checking_none",
"axis": "error_checking",
- "pc1": 0.0476,
- "pc2": -0.0103,
- "pc3": -0.1397,
- "pc4": 0.0118,
- "pc5": 0.031,
- "pc6": 0.047,
- "pc7": 0.0255,
- "pc8": -0.0,
- "pc9": 0.6295,
- "pc10": 0.0435
+ "pc1": 0.0398,
+ "pc2": -0.0138,
+ "pc3": 0.0618,
+ "pc4": -0.0015,
+ "pc5": -0.029,
+ "pc6": 0.0172,
+ "pc7": 0.2448,
+ "pc8": -0.3718,
+ "pc9": -0.0662,
+ "pc10": 0.188
},
{
"feature": "error_checking_self_verify",
"axis": "error_checking",
- "pc1": -0.0476,
- "pc2": 0.0103,
- "pc3": 0.1397,
- "pc4": -0.0118,
- "pc5": -0.031,
- "pc6": -0.047,
- "pc7": -0.0255,
- "pc8": 0.0,
- "pc9": -0.6295,
- "pc10": -0.0435
+ "pc1": -0.0398,
+ "pc2": 0.0138,
+ "pc3": -0.0618,
+ "pc4": 0.0015,
+ "pc5": 0.029,
+ "pc6": -0.0172,
+ "pc7": -0.2448,
+ "pc8": 0.3718,
+ "pc9": 0.0662,
+ "pc10": -0.188
+ },
+ {
+ "feature": "context_noise_clean",
+ "axis": "context_noise",
+ "pc1": 0.1196,
+ "pc2": -0.0427,
+ "pc3": 0.2027,
+ "pc4": -0.0448,
+ "pc5": -0.2013,
+ "pc6": -0.3187,
+ "pc7": -0.3203,
+ "pc8": -0.076,
+ "pc9": -0.0123,
+ "pc10": -0.0046
+ },
+ {
+ "feature": "context_noise_lorem_100k",
+ "axis": "context_noise",
+ "pc1": -0.0491,
+ "pc2": 0.0177,
+ "pc3": -0.0823,
+ "pc4": 0.02,
+ "pc5": 0.0808,
+ "pc6": 0.1204,
+ "pc7": 0.1359,
+ "pc8": 0.0125,
+ "pc9": 0.0092,
+ "pc10": -0.0046
+ },
+ {
+ "feature": "context_noise_lorem_10k",
+ "axis": "context_noise",
+ "pc1": -0.0491,
+ "pc2": 0.018,
+ "pc3": -0.0801,
+ "pc4": 0.0154,
+ "pc5": 0.088,
+ "pc6": 0.1183,
+ "pc7": 0.1468,
+ "pc8": 0.0243,
+ "pc9": 0.0116,
+ "pc10": 0.0071
+ },
+ {
+ "feature": "context_noise_lorem_1k",
+ "axis": "context_noise",
+ "pc1": -0.0354,
+ "pc2": 0.0124,
+ "pc3": -0.0658,
+ "pc4": 0.007,
+ "pc5": 0.0559,
+ "pc6": 0.1128,
+ "pc7": 0.0783,
+ "pc8": 0.0271,
+ "pc9": 0.0079,
+ "pc10": 0.0076
+ },
+ {
+ "feature": "context_noise_lorem_50k",
+ "axis": "context_noise",
+ "pc1": -0.0491,
+ "pc2": 0.0178,
+ "pc3": -0.0779,
+ "pc4": 0.0229,
+ "pc5": 0.0918,
+ "pc6": 0.1166,
+ "pc7": 0.1531,
+ "pc8": 0.0165,
+ "pc9": 0.0035,
+ "pc10": 0.0099
+ },
+ {
+ "feature": "context_noise_wikipedia_100k",
+ "axis": "context_noise",
+ "pc1": -0.0355,
+ "pc2": 0.0123,
+ "pc3": -0.0636,
+ "pc4": 0.0113,
+ "pc5": 0.047,
+ "pc6": 0.1047,
+ "pc7": 0.0757,
+ "pc8": 0.0049,
+ "pc9": 0.0037,
+ "pc10": -0.0203
+ },
+ {
+ "feature": "context_noise_wikipedia_10k",
+ "axis": "context_noise",
+ "pc1": -0.0354,
+ "pc2": 0.0123,
+ "pc3": -0.0578,
+ "pc4": 0.0153,
+ "pc5": 0.058,
+ "pc6": 0.0997,
+ "pc7": 0.0929,
+ "pc8": 0.0596,
+ "pc9": 0.0008,
+ "pc10": -0.0021
+ },
+ {
+ "feature": "context_noise_wikipedia_1k",
+ "axis": "context_noise",
+ "pc1": -0.0354,
+ "pc2": 0.0123,
+ "pc3": -0.0672,
+ "pc4": 0.0139,
+ "pc5": 0.0538,
+ "pc6": 0.1066,
+ "pc7": 0.0815,
+ "pc8": 0.0377,
+ "pc9": -0.0029,
+ "pc10": -0.0098
+ },
+ {
+ "feature": "context_noise_wikipedia_50k",
+ "axis": "context_noise",
+ "pc1": -0.0354,
+ "pc2": 0.0126,
+ "pc3": -0.059,
+ "pc4": 0.0145,
+ "pc5": 0.0653,
+ "pc6": 0.1004,
+ "pc7": 0.0876,
+ "pc8": 0.0399,
+ "pc9": -0.0043,
+ "pc10": 0.022
},
{
"feature": "renderer_canvas",
"axis": "renderer",
- "pc1": -0.0391,
- "pc2": 0.0096,
- "pc3": 0.0197,
- "pc4": 0.0078,
- "pc5": 0.022,
- "pc6": 0.1561,
- "pc7": 0.1714,
- "pc8": 0.0,
- "pc9": -0.0009,
- "pc10": 0.1371
+ "pc1": -0.0525,
+ "pc2": 0.0189,
+ "pc3": -0.0714,
+ "pc4": 0.0183,
+ "pc5": 0.0428,
+ "pc6": -0.246,
+ "pc7": -0.0636,
+ "pc8": -0.1893,
+ "pc9": 0.0478,
+ "pc10": -0.0147
},
{
"feature": "renderer_dom",
"axis": "renderer",
- "pc1": -0.0626,
- "pc2": 0.0219,
- "pc3": -0.048,
- "pc4": 0.0203,
- "pc5": 0.0464,
- "pc6": 0.2321,
- "pc7": 0.2193,
- "pc8": 0.0,
- "pc9": -0.0001,
- "pc10": 0.1684
+ "pc1": -0.0446,
+ "pc2": 0.0155,
+ "pc3": -0.0638,
+ "pc4": 0.0061,
+ "pc5": 0.0322,
+ "pc6": -0.193,
+ "pc7": -0.086,
+ "pc8": -0.1726,
+ "pc9": 0.0425,
+ "pc10": -0.0031
},
{
"feature": "renderer_none",
"axis": "renderer",
- "pc1": 0.0977,
- "pc2": -0.0295,
- "pc3": 0.0166,
- "pc4": -0.0259,
- "pc5": -0.0643,
- "pc6": -0.3752,
- "pc7": -0.3826,
- "pc8": -0.0,
- "pc9": 0.0012,
- "pc10": -0.3003
+ "pc1": 0.097,
+ "pc2": -0.0341,
+ "pc3": 0.143,
+ "pc4": -0.022,
+ "pc5": -0.0696,
+ "pc6": 0.4243,
+ "pc7": 0.1334,
+ "pc8": 0.3402,
+ "pc9": -0.089,
+ "pc10": -0.0005
},
{
"feature": "renderer_svg",
"axis": "renderer",
- "pc1": -0.0391,
- "pc2": 0.0096,
- "pc3": 0.0197,
- "pc4": 0.0078,
- "pc5": 0.022,
- "pc6": 0.1561,
- "pc7": 0.1714,
- "pc8": 0.0,
- "pc9": -0.0009,
- "pc10": 0.1371
+ "pc1": -0.0525,
+ "pc2": 0.0186,
+ "pc3": -0.0799,
+ "pc4": 0.01,
+ "pc5": 0.0316,
+ "pc6": -0.2235,
+ "pc7": -0.0619,
+ "pc8": -0.1822,
+ "pc9": 0.046,
+ "pc10": 0.0082
},
{
"feature": "renderer_webgl",
"axis": "renderer",
- "pc1": -0.0481,
- "pc2": 0.0145,
- "pc3": -0.0081,
- "pc4": 0.0127,
- "pc5": 0.0316,
- "pc6": 0.1845,
- "pc7": 0.1882,
- "pc8": 0.0,
- "pc9": -0.0006,
- "pc10": 0.1477
+ "pc1": -0.0401,
+ "pc2": 0.0136,
+ "pc3": -0.0657,
+ "pc4": 0.0075,
+ "pc5": 0.0296,
+ "pc6": -0.1632,
+ "pc7": -0.0523,
+ "pc8": -0.1176,
+ "pc9": 0.0383,
+ "pc10": 0.0133
},
{
"feature": "provider_anthropic",
"axis": "provider",
- "pc1": 0.3174,
- "pc2": -0.1892,
- "pc3": 0.0399,
- "pc4": -0.0423,
- "pc5": 0.0187,
- "pc6": 0.0295,
- "pc7": 0.0812,
- "pc8": 0.0,
- "pc9": 0.0012,
- "pc10": 0.05
+ "pc1": 0.3272,
+ "pc2": -0.168,
+ "pc3": -0.0699,
+ "pc4": 0.0544,
+ "pc5": 0.0553,
+ "pc6": -0.0056,
+ "pc7": -0.0334,
+ "pc8": 0.0172,
+ "pc9": 0.0221,
+ "pc10": -0.0004
},
{
"feature": "provider_openrouter",
"axis": "provider",
- "pc1": -0.1545,
- "pc2": 0.0455,
- "pc3": 0.4453,
- "pc4": -0.0328,
- "pc5": -0.082,
- "pc6": -0.0538,
- "pc7": -0.022,
- "pc8": -0.0,
- "pc9": -0.0073,
- "pc10": 0.0336
+ "pc1": -0.0649,
+ "pc2": 0.0128,
+ "pc3": 0.5085,
+ "pc4": -0.1197,
+ "pc5": -0.1394,
+ "pc6": 0.0512,
+ "pc7": 0.0849,
+ "pc8": -0.0509,
+ "pc9": -0.0317,
+ "pc10": -0.0155
},
{
"feature": "provider_zai",
"axis": "provider",
- "pc1": -0.2198,
- "pc2": 0.1672,
- "pc3": -0.3882,
- "pc4": 0.0706,
- "pc5": 0.0436,
- "pc6": 0.0102,
- "pc7": -0.0699,
- "pc8": -0.0,
- "pc9": 0.0044,
- "pc10": -0.0795
+ "pc1": -0.273,
+ "pc2": 0.1544,
+ "pc3": -0.2845,
+ "pc4": 0.0301,
+ "pc5": 0.0428,
+ "pc6": -0.03,
+ "pc7": -0.0264,
+ "pc8": 0.0186,
+ "pc9": 0.0005,
+ "pc10": 0.0111
}
],
"axis_importance": [
{
"axis": "model",
- "pc1": 0.9503,
- "pc2": 0.702,
- "pc3": 1.3251,
- "pc4": 0.297,
- "pc5": 0.1928,
- "pc6": 0.4483,
- "pc7": 0.4096,
- "pc8": 0.0,
- "pc9": 0.0211,
- "pc10": 0.3066,
- "total": 4.6528
+ "pc1": 0.9473,
+ "pc2": 0.6359,
+ "pc3": 1.2991,
+ "pc4": 0.4296,
+ "pc5": 0.5134,
+ "pc6": 0.4184,
+ "pc7": 0.616,
+ "pc8": 0.3801,
+ "pc9": 0.1698,
+ "pc10": 0.1489,
+ "total": 5.5585
+ },
+ {
+ "axis": "context_noise",
+ "pc1": 0.4439,
+ "pc2": 0.1581,
+ "pc3": 0.7564,
+ "pc4": 0.165,
+ "pc5": 0.7419,
+ "pc6": 1.1984,
+ "pc7": 1.1721,
+ "pc8": 0.2984,
+ "pc9": 0.0562,
+ "pc10": 0.0882,
+ "total": 5.0786
},
{
"axis": "renderer",
"pc1": 0.2866,
- "pc2": 0.0852,
- "pc3": 0.112,
- "pc4": 0.0744,
- "pc5": 0.1863,
- "pc6": 1.104,
- "pc7": 1.133,
- "pc8": 0.0,
- "pc9": 0.0037,
- "pc10": 0.8907,
- "total": 3.8759
+ "pc2": 0.1007,
+ "pc3": 0.4238,
+ "pc4": 0.0639,
+ "pc5": 0.2059,
+ "pc6": 1.25,
+ "pc7": 0.3973,
+ "pc8": 1.0018,
+ "pc9": 0.2636,
+ "pc10": 0.0398,
+ "total": 4.0334
},
{
"axis": "design_guidance",
- "pc1": 0.1632,
- "pc2": 0.0353,
- "pc3": 0.4856,
- "pc4": 0.0414,
- "pc5": 0.11,
- "pc6": 0.1768,
- "pc7": 0.1143,
- "pc8": 1.2066,
- "pc9": 0.5482,
- "pc10": 0.075,
- "total": 2.9564
+ "pc1": 0.1453,
+ "pc2": 0.0397,
+ "pc3": 0.0972,
+ "pc4": 0.1095,
+ "pc5": 0.3895,
+ "pc6": 0.2769,
+ "pc7": 0.6014,
+ "pc8": 0.2732,
+ "pc9": 1.1501,
+ "pc10": 0.4491,
+ "total": 3.5319
},
{
"axis": "architecture",
- "pc1": 0.1632,
- "pc2": 0.0353,
- "pc3": 0.4856,
- "pc4": 0.0414,
- "pc5": 0.11,
- "pc6": 0.1768,
- "pc7": 0.1143,
- "pc8": 1.2066,
- "pc9": 0.5482,
- "pc10": 0.075,
- "total": 2.9564
- },
- {
- "axis": "provider",
- "pc1": 0.6916,
- "pc2": 0.4019,
- "pc3": 0.8734,
- "pc4": 0.1456,
- "pc5": 0.1443,
- "pc6": 0.0934,
- "pc7": 0.173,
- "pc8": 0.0,
- "pc9": 0.0129,
- "pc10": 0.1631,
- "total": 2.6992
+ "pc1": 0.141,
+ "pc2": 0.0437,
+ "pc3": 0.05,
+ "pc4": 0.0325,
+ "pc5": 0.1846,
+ "pc6": 0.1108,
+ "pc7": 0.7982,
+ "pc8": 0.2626,
+ "pc9": 1.1812,
+ "pc10": 0.0726,
+ "total": 2.8772
},
{
"axis": "language",
- "pc1": 0.1067,
- "pc2": 0.2652,
- "pc3": 0.4171,
- "pc4": 0.1953,
- "pc5": 0.2371,
- "pc6": 0.9691,
- "pc7": 0.3208,
- "pc8": 0.0,
- "pc9": 0.0006,
+ "pc1": 0.0259,
+ "pc2": 0.3251,
+ "pc3": 0.2939,
+ "pc4": 0.1814,
+ "pc5": 0.0153,
+ "pc6": 0.6847,
+ "pc7": 0.5056,
+ "pc8": 0.5915,
+ "pc9": 0.0591,
"pc10": 0.1164,
- "total": 2.6283
+ "total": 2.7989
+ },
+ {
+ "axis": "provider",
+ "pc1": 0.6651,
+ "pc2": 0.3353,
+ "pc3": 0.8628,
+ "pc4": 0.2042,
+ "pc5": 0.2375,
+ "pc6": 0.0869,
+ "pc7": 0.1447,
+ "pc8": 0.0867,
+ "pc9": 0.0543,
+ "pc10": 0.027,
+ "total": 2.7045
},
{
"axis": "tool_glob",
- "pc1": 0.2334,
- "pc2": 0.2733,
- "pc3": 0.1414,
- "pc4": 0.3488,
- "pc5": 0.5154,
- "pc6": 0.1045,
- "pc7": 0.3335,
- "pc8": 0.0,
- "pc9": 0.0177,
- "pc10": 0.5127,
- "total": 2.4807
+ "pc1": 0.1949,
+ "pc2": 0.2757,
+ "pc3": 0.2637,
+ "pc4": 0.1618,
+ "pc5": 0.5482,
+ "pc6": 0.0047,
+ "pc7": 0.1538,
+ "pc8": 0.0415,
+ "pc9": 0.1625,
+ "pc10": 0.6025,
+ "total": 2.4093
},
{
- "axis": "human_language",
- "pc1": 0.2089,
- "pc2": 0.22,
- "pc3": 0.0767,
- "pc4": 0.2966,
- "pc5": 0.6065,
- "pc6": 0.0689,
- "pc7": 0.3276,
- "pc8": 0.0,
- "pc9": 0.0202,
- "pc10": 0.6297,
- "total": 2.4551
+ "axis": "strategy",
+ "pc1": 0.6838,
+ "pc2": 0.5401,
+ "pc3": 0.2831,
+ "pc4": 0.1062,
+ "pc5": 0.2097,
+ "pc6": 0.1011,
+ "pc7": 0.151,
+ "pc8": 0.0924,
+ "pc9": 0.1062,
+ "pc10": 0.1347,
+ "total": 2.4083
},
{
"axis": "effort",
- "pc1": 0.0125,
- "pc2": 0.1942,
- "pc3": 0.049,
- "pc4": 0.1597,
- "pc5": 0.0305,
- "pc6": 0.7721,
- "pc7": 0.7917,
- "pc8": 0.0,
- "pc9": 0.0065,
- "pc10": 0.4166,
- "total": 2.4328
+ "pc1": 0.0027,
+ "pc2": 0.2003,
+ "pc3": 0.1027,
+ "pc4": 0.1078,
+ "pc5": 0.1023,
+ "pc6": 0.6333,
+ "pc7": 0.3761,
+ "pc8": 0.7175,
+ "pc9": 0.0454,
+ "pc10": 0.0176,
+ "total": 2.3057
},
{
- "axis": "linter",
- "pc1": 0.25,
- "pc2": 0.43,
- "pc3": 0.1083,
- "pc4": 0.2697,
- "pc5": 0.0815,
- "pc6": 0.1246,
- "pc7": 0.423,
- "pc8": 0.0,
- "pc9": 0.0186,
- "pc10": 0.5333,
- "total": 2.239
+ "axis": "human_language",
+ "pc1": 0.2293,
+ "pc2": 0.2268,
+ "pc3": 0.2304,
+ "pc4": 0.1165,
+ "pc5": 0.5908,
+ "pc6": 0.0364,
+ "pc7": 0.0869,
+ "pc8": 0.0818,
+ "pc9": 0.0565,
+ "pc10": 0.5937,
+ "total": 2.2491
},
{
"axis": "prompt_style",
- "pc1": 0.2159,
- "pc2": 0.2811,
- "pc3": 0.1654,
- "pc4": 0.3496,
- "pc5": 0.723,
- "pc6": 0.017,
- "pc7": 0.0591,
- "pc8": 0.0,
- "pc9": 0.0094,
- "pc10": 0.2958,
- "total": 2.1163
+ "pc1": 0.2242,
+ "pc2": 0.2919,
+ "pc3": 0.1618,
+ "pc4": 0.5344,
+ "pc5": 0.5604,
+ "pc6": 0.0292,
+ "pc7": 0.135,
+ "pc8": 0.0272,
+ "pc9": 0.0605,
+ "pc10": 0.1433,
+ "total": 2.1679
},
{
- "axis": "strategy",
- "pc1": 0.7193,
- "pc2": 0.5422,
- "pc3": 0.233,
- "pc4": 0.0733,
- "pc5": 0.1548,
- "pc6": 0.0832,
- "pc7": 0.1248,
- "pc8": 0.0,
- "pc9": 0.0133,
- "pc10": 0.1539,
- "total": 2.0978
+ "axis": "error_checking",
+ "pc1": 0.0797,
+ "pc2": 0.0276,
+ "pc3": 0.1237,
+ "pc4": 0.0031,
+ "pc5": 0.058,
+ "pc6": 0.0344,
+ "pc7": 0.4896,
+ "pc8": 0.7436,
+ "pc9": 0.1325,
+ "pc10": 0.3761,
+ "total": 2.0683
},
{
- "axis": "tool_grep",
- "pc1": 0.2788,
- "pc2": 0.3428,
- "pc3": 0.0714,
- "pc4": 0.1337,
- "pc5": 0.4655,
- "pc6": 0.0832,
- "pc7": 0.2693,
- "pc8": 0.0,
- "pc9": 0.0128,
- "pc10": 0.3704,
- "total": 2.0279
+ "axis": "linter",
+ "pc1": 0.2431,
+ "pc2": 0.433,
+ "pc3": 0.113,
+ "pc4": 0.248,
+ "pc5": 0.113,
+ "pc6": 0.009,
+ "pc7": 0.0429,
+ "pc8": 0.0704,
+ "pc9": 0.0807,
+ "pc10": 0.6512,
+ "total": 2.0043
},
{
- "axis": "error_checking",
- "pc1": 0.0952,
- "pc2": 0.0205,
- "pc3": 0.2795,
- "pc4": 0.0237,
- "pc5": 0.0621,
- "pc6": 0.0939,
- "pc7": 0.051,
- "pc8": 0.0,
- "pc9": 1.259,
- "pc10": 0.0869,
- "total": 1.9718
+ "axis": "tool_grep",
+ "pc1": 0.2648,
+ "pc2": 0.3536,
+ "pc3": 0.1416,
+ "pc4": 0.004,
+ "pc5": 0.475,
+ "pc6": 0.0332,
+ "pc7": 0.1603,
+ "pc8": 0.0888,
+ "pc9": 0.0317,
+ "pc10": 0.4093,
+ "total": 1.9623
},
{
"axis": "tool_edit",
- "pc1": 0.3053,
- "pc2": 0.3675,
- "pc3": 0.1358,
- "pc4": 0.0935,
- "pc5": 0.2703,
- "pc6": 0.0411,
- "pc7": 0.2364,
- "pc8": 0.0,
- "pc9": 0.0107,
- "pc10": 0.3471,
- "total": 1.8077
+ "pc1": 0.2742,
+ "pc2": 0.3768,
+ "pc3": 0.1078,
+ "pc4": 0.2039,
+ "pc5": 0.1916,
+ "pc6": 0.0115,
+ "pc7": 0.0365,
+ "pc8": 0.0916,
+ "pc9": 0.0839,
+ "pc10": 0.4895,
+ "total": 1.8673
},
{
- "axis": "tool_write",
- "pc1": 0.2946,
- "pc2": 0.3499,
- "pc3": 0.0974,
- "pc4": 0.2998,
- "pc5": 0.398,
- "pc6": 0.0389,
- "pc7": 0.1164,
- "pc8": 0.0,
- "pc9": 0.0025,
- "pc10": 0.1178,
- "total": 1.7153
+ "axis": "playwright",
+ "pc1": 0.5901,
+ "pc2": 0.4629,
+ "pc3": 0.1969,
+ "pc4": 0.1558,
+ "pc5": 0.125,
+ "pc6": 0.0115,
+ "pc7": 0.1187,
+ "pc8": 0.0374,
+ "pc9": 0.0653,
+ "pc10": 0.0192,
+ "total": 1.7828
},
{
- "axis": "context_file",
- "pc1": 0.2595,
- "pc2": 0.1729,
- "pc3": 0.0575,
- "pc4": 0.744,
- "pc5": 0.1229,
- "pc6": 0.0486,
- "pc7": 0.1828,
- "pc8": 0.0,
- "pc9": 0.0028,
- "pc10": 0.065,
- "total": 1.656
+ "axis": "web_search",
+ "pc1": 0.2667,
+ "pc2": 0.4619,
+ "pc3": 0.0847,
+ "pc4": 0.2437,
+ "pc5": 0.3666,
+ "pc6": 0.0152,
+ "pc7": 0.1171,
+ "pc8": 0.083,
+ "pc9": 0.0393,
+ "pc10": 0.075,
+ "total": 1.7532
},
{
- "axis": "max_budget",
- "pc1": 0.151,
- "pc2": 0.0053,
- "pc3": 0.0332,
- "pc4": 0.8181,
- "pc5": 0.19,
- "pc6": 0.0439,
- "pc7": 0.068,
- "pc8": 0.0,
- "pc9": 0.0096,
- "pc10": 0.252,
- "total": 1.5711
+ "axis": "context_file",
+ "pc1": 0.2551,
+ "pc2": 0.1824,
+ "pc3": 0.1818,
+ "pc4": 0.7362,
+ "pc5": 0.0039,
+ "pc6": 0.0282,
+ "pc7": 0.0242,
+ "pc8": 0.0227,
+ "pc9": 0.03,
+ "pc10": 0.2679,
+ "total": 1.7324
},
{
- "axis": "tool_read",
- "pc1": 0.3016,
- "pc2": 0.3413,
- "pc3": 0.047,
- "pc4": 0.3662,
- "pc5": 0.2109,
- "pc6": 0.0417,
- "pc7": 0.1657,
- "pc8": 0.0,
- "pc9": 0.0009,
- "pc10": 0.0224,
- "total": 1.4977
+ "axis": "max_budget",
+ "pc1": 0.1789,
+ "pc2": 0.0003,
+ "pc3": 0.2636,
+ "pc4": 0.7197,
+ "pc5": 0.2613,
+ "pc6": 0.058,
+ "pc7": 0.1457,
+ "pc8": 0.0072,
+ "pc9": 0.0623,
+ "pc10": 0.0241,
+ "total": 1.7211
},
{
- "axis": "web_search",
- "pc1": 0.2837,
- "pc2": 0.4475,
- "pc3": 0.1052,
- "pc4": 0.1023,
- "pc5": 0.4114,
- "pc6": 0.0229,
- "pc7": 0.0373,
- "pc8": 0.0,
- "pc9": 0.0005,
- "pc10": 0.0598,
- "total": 1.4706
+ "axis": "tool_write",
+ "pc1": 0.2724,
+ "pc2": 0.3623,
+ "pc3": 0.0193,
+ "pc4": 0.3806,
+ "pc5": 0.2756,
+ "pc6": 0.0774,
+ "pc7": 0.0121,
+ "pc8": 0.0102,
+ "pc9": 0.0478,
+ "pc10": 0.1344,
+ "total": 1.5921
},
{
- "axis": "playwright",
- "pc1": 0.5982,
- "pc2": 0.4837,
- "pc3": 0.0523,
- "pc4": 0.1121,
- "pc5": 0.0186,
- "pc6": 0.0359,
- "pc7": 0.051,
- "pc8": 0.0,
- "pc9": 0.0032,
- "pc10": 0.0388,
- "total": 1.3938
+ "axis": "tool_read",
+ "pc1": 0.2638,
+ "pc2": 0.3548,
+ "pc3": 0.0731,
+ "pc4": 0.3783,
+ "pc5": 0.0986,
+ "pc6": 0.0907,
+ "pc7": 0.0129,
+ "pc8": 0.0542,
+ "pc9": 0.0282,
+ "pc10": 0.1573,
+ "total": 1.5119
}
]
}
\ No newline at end of file