loop-benchmarking

Controlled experiments across agentic coding configurations. Same task, one variable, what actually works.
git clone https://git.shiptheloop.com/loop-benchmarking.git
Log | Files | Refs | README

c1013100.json (1129B)


      1 {
      2   "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=ts_lint=off_budget=low_model=gemma426b_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
      3   "short_id": "c1013100",
      4   "label": "Calibration (gemma-4-26b, en)",
      5   "notes": "",
      6   "human_tested_at": "2026-04-16",
      7   "human_tests": {
      8     "game_loads": false,
      9     "game_starts": false,
     10     "auto_drop": null,
     11     "move_left": null,
     12     "move_right": null,
     13     "move_down": null,
     14     "rotate": null,
     15     "hard_drop": null,
     16     "all_pieces_rotate": null,
     17     "piece_locks": null,
     18     "new_piece_spawns": null,
     19     "multiple_pieces": null,
     20     "line_clear": null,
     21     "score_increases_on_clear": null,
     22     "score_element_visible": null,
     23     "game_over": null,
     24     "playable_30s": null,
     25     "multi_line_clear": null,
     26     "score_scaling": null,
     27     "level_progression": null,
     28     "speed_progression": null,
     29     "next_piece_preview": null,
     30     "game_over_display": null,
     31     "counter_clockwise_rotation": null,
     32     "soft_drop_distinct": null,
     33     "rendering_clean": null
     34   }
     35 }

Impressum · Datenschutz