loop-benchmarking

Controlled experiments across agentic coding configurations: the same task, with one variable changed at a time, to see what actually works.
git clone https://git.shiptheloop.com/loop-benchmarking.git
Log | Files | Refs | README

2763232d.json (1153B)


      1 {
      2   "run_id": "tetris_arch=none_ctx=none_noise=clean_dsgn=none_eff=high_echk=none_hlang=en_lang=js_lint=on_budget=low_model=qwen36p_pw=off_prompt=simple_prov=or_rndr=none_strat=none_tst=none_tedit=on_tglob=on_tgrep=on_tread=on_twrite=on_web=on_run1",
      3   "short_id": "2763232d",
      4   "label": "Calibration (qwen-3.6-plus, en)",
      5   "notes": "",
      6   "human_tested_at": "2026-04-16",
      7   "human_tests": {
      8     "game_loads": true,
      9     "game_starts": true,
     10     "auto_drop": true,
     11     "move_left": true,
     12     "move_right": true,
     13     "move_down": true,
     14     "rotate": true,
     15     "hard_drop": true,
     16     "all_pieces_rotate": null,
     17     "piece_locks": true,
     18     "new_piece_spawns": true,
     19     "multiple_pieces": true,
     20     "line_clear": true,
     21     "score_increases_on_clear": null,
     22     "score_element_visible": null,
     23     "game_over": true,
     24     "playable_30s": true,
     25     "multi_line_clear": true,
     26     "score_scaling": null,
     27     "level_progression": null,
     28     "speed_progression": null,
     29     "next_piece_preview": true,
     30     "game_over_display": true,
     31     "counter_clockwise_rotation": true,
     32     "soft_drop_distinct": true,
     33     "rendering_clean": null,
     34     "score_changes": true
     35   }
     36 }

Impressum · Datenschutz