loop-benchmarking

Controlled experiments across agentic coding configurations. Same task, one variable, what actually works.
git clone https://git.shiptheloop.com/loop-benchmarking.git
Log | Files | Refs | README

6f157de1.json (1151B)


      1 {
      2   "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=js_lint=on_budget=low_model=opus46_pw=avail_prompt=simple_prov=anth_rndr=none_strat=usub_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run6",
      3   "short_id": "6f157de1",
      4   "label": "Calibration (opus-4.6, en)",
      5   "notes": "",
      6   "human_tested_at": "2026-04-16",
      7   "human_tests": {
      8     "game_loads": true,
      9     "game_starts": true,
     10     "auto_drop": true,
     11     "move_left": true,
     12     "move_right": true,
     13     "move_down": true,
     14     "rotate": true,
     15     "hard_drop": true,
     16     "all_pieces_rotate": true,
     17     "piece_locks": true,
     18     "new_piece_spawns": true,
     19     "multiple_pieces": true,
     20     "line_clear": true,
     21     "score_increases_on_clear": null,
     22     "score_element_visible": null,
     23     "game_over": true,
     24     "playable_30s": true,
     25     "multi_line_clear": true,
     26     "score_scaling": null,
     27     "level_progression": null,
     28     "speed_progression": null,
     29     "next_piece_preview": true,
     30     "game_over_display": true,
     31     "counter_clockwise_rotation": true,
     32     "soft_drop_distinct": null,
     33     "rendering_clean": null,
     34     "score_changes": true
     35   }
     36 }

Impressum · Datenschutz