bird-bench

Version: parity

BIRD SQL parity subset (150 tasks, seed 42). Original benchmark: https://huggingface.co/datasets/birdsql/bird_sql_dev_20251106. Adapter: https://github.com/laude-institute/harbor/tree/main/adapters/bird-bench.

uvx harbor run -d bird-bench@parity

Tasks (150)

california_schools__13
uvx harbor run -d bird-bench@parity -t california_schools__13
82d1fb0
california_schools__23
uvx harbor run -d bird-bench@parity -t california_schools__23
82d1fb0
california_schools__3
uvx harbor run -d bird-bench@parity -t california_schools__3
82d1fb0
california_schools__37
uvx harbor run -d bird-bench@parity -t california_schools__37
82d1fb0
california_schools__43
uvx harbor run -d bird-bench@parity -t california_schools__43
82d1fb0
california_schools__65
uvx harbor run -d bird-bench@parity -t california_schools__65
82d1fb0
california_schools__74
uvx harbor run -d bird-bench@parity -t california_schools__74
82d1fb0
california_schools__75
uvx harbor run -d bird-bench@parity -t california_schools__75
82d1fb0
california_schools__87
uvx harbor run -d bird-bench@parity -t california_schools__87
82d1fb0
card_games__350
uvx harbor run -d bird-bench@parity -t card_games__350
82d1fb0
card_games__362
uvx harbor run -d bird-bench@parity -t card_games__362
82d1fb0
card_games__402
uvx harbor run -d bird-bench@parity -t card_games__402
82d1fb0
card_games__410
uvx harbor run -d bird-bench@parity -t card_games__410
82d1fb0
card_games__412
uvx harbor run -d bird-bench@parity -t card_games__412
82d1fb0
card_games__438
uvx harbor run -d bird-bench@parity -t card_games__438
82d1fb0
card_games__444
uvx harbor run -d bird-bench@parity -t card_games__444
82d1fb0
card_games__445
uvx harbor run -d bird-bench@parity -t card_games__445
82d1fb0
card_games__450
uvx harbor run -d bird-bench@parity -t card_games__450
82d1fb0
card_games__451
uvx harbor run -d bird-bench@parity -t card_games__451
82d1fb0
card_games__454
uvx harbor run -d bird-bench@parity -t card_games__454
82d1fb0
card_games__458
uvx harbor run -d bird-bench@parity -t card_games__458
82d1fb0
card_games__469
uvx harbor run -d bird-bench@parity -t card_games__469
82d1fb0
card_games__474
uvx harbor run -d bird-bench@parity -t card_games__474
82d1fb0
card_games__487
uvx harbor run -d bird-bench@parity -t card_games__487
82d1fb0
codebase_community__542
uvx harbor run -d bird-bench@parity -t codebase_community__542
82d1fb0
codebase_community__545
uvx harbor run -d bird-bench@parity -t codebase_community__545
82d1fb0
codebase_community__570
uvx harbor run -d bird-bench@parity -t codebase_community__570
82d1fb0
codebase_community__575
uvx harbor run -d bird-bench@parity -t codebase_community__575
82d1fb0
codebase_community__579
uvx harbor run -d bird-bench@parity -t codebase_community__579
82d1fb0
codebase_community__599
uvx harbor run -d bird-bench@parity -t codebase_community__599
82d1fb0
codebase_community__602
uvx harbor run -d bird-bench@parity -t codebase_community__602
82d1fb0
codebase_community__620
uvx harbor run -d bird-bench@parity -t codebase_community__620
82d1fb0
codebase_community__634
uvx harbor run -d bird-bench@parity -t codebase_community__634
82d1fb0
codebase_community__639
uvx harbor run -d bird-bench@parity -t codebase_community__639
82d1fb0
codebase_community__643
uvx harbor run -d bird-bench@parity -t codebase_community__643
82d1fb0
codebase_community__678
uvx harbor run -d bird-bench@parity -t codebase_community__678
82d1fb0
codebase_community__681
uvx harbor run -d bird-bench@parity -t codebase_community__681
82d1fb0
codebase_community__688
uvx harbor run -d bird-bench@parity -t codebase_community__688
82d1fb0
codebase_community__697
uvx harbor run -d bird-bench@parity -t codebase_community__697
82d1fb0
codebase_community__712
uvx harbor run -d bird-bench@parity -t codebase_community__712
82d1fb0
codebase_community__715
uvx harbor run -d bird-bench@parity -t codebase_community__715
82d1fb0
debit_card_specializing__1478
uvx harbor run -d bird-bench@parity -t debit_card_specializing__1478
82d1fb0
debit_card_specializing__1485
uvx harbor run -d bird-bench@parity -t debit_card_specializing__1485
82d1fb0
debit_card_specializing__1488
uvx harbor run -d bird-bench@parity -t debit_card_specializing__1488
82d1fb0
debit_card_specializing__1493
uvx harbor run -d bird-bench@parity -t debit_card_specializing__1493
82d1fb0
debit_card_specializing__1501
uvx harbor run -d bird-bench@parity -t debit_card_specializing__1501
82d1fb0
debit_card_specializing__1502
uvx harbor run -d bird-bench@parity -t debit_card_specializing__1502
82d1fb0
debit_card_specializing__1532
uvx harbor run -d bird-bench@parity -t debit_card_specializing__1532
82d1fb0
european_football_2__1026
uvx harbor run -d bird-bench@parity -t european_football_2__1026
82d1fb0
european_football_2__1030
uvx harbor run -d bird-bench@parity -t european_football_2__1030
82d1fb0
european_football_2__1041
uvx harbor run -d bird-bench@parity -t european_football_2__1041
82d1fb0
european_football_2__1050
uvx harbor run -d bird-bench@parity -t european_football_2__1050
82d1fb0
european_football_2__1058
uvx harbor run -d bird-bench@parity -t european_football_2__1058
82d1fb0
european_football_2__1062
uvx harbor run -d bird-bench@parity -t european_football_2__1062
82d1fb0
european_football_2__1066
uvx harbor run -d bird-bench@parity -t european_football_2__1066
82d1fb0
european_football_2__1084
uvx harbor run -d bird-bench@parity -t european_football_2__1084
82d1fb0
european_football_2__1090
uvx harbor run -d bird-bench@parity -t european_football_2__1090
82d1fb0
european_football_2__1093
uvx harbor run -d bird-bench@parity -t european_football_2__1093
82d1fb0
european_football_2__1112
uvx harbor run -d bird-bench@parity -t european_football_2__1112
82d1fb0
european_football_2__1116
uvx harbor run -d bird-bench@parity -t european_football_2__1116
82d1fb0
european_football_2__1133
uvx harbor run -d bird-bench@parity -t european_football_2__1133
82d1fb0
european_football_2__1141
uvx harbor run -d bird-bench@parity -t european_football_2__1141
82d1fb0
financial__110
uvx harbor run -d bird-bench@parity -t financial__110
82d1fb0
financial__117
uvx harbor run -d bird-bench@parity -t financial__117
82d1fb0
financial__118
uvx harbor run -d bird-bench@parity -t financial__118
82d1fb0
financial__132
uvx harbor run -d bird-bench@parity -t financial__132
82d1fb0
financial__158
uvx harbor run -d bird-bench@parity -t financial__158
82d1fb0
financial__181
uvx harbor run -d bird-bench@parity -t financial__181
82d1fb0
financial__193
uvx harbor run -d bird-bench@parity -t financial__193
82d1fb0
financial__89
uvx harbor run -d bird-bench@parity -t financial__89
82d1fb0
financial__90
uvx harbor run -d bird-bench@parity -t financial__90
82d1fb0
formula_1__1007
uvx harbor run -d bird-bench@parity -t formula_1__1007
82d1fb0
formula_1__848
uvx harbor run -d bird-bench@parity -t formula_1__848
82d1fb0
formula_1__876
uvx harbor run -d bird-bench@parity -t formula_1__876
82d1fb0
formula_1__891
uvx harbor run -d bird-bench@parity -t formula_1__891
82d1fb0
formula_1__900
uvx harbor run -d bird-bench@parity -t formula_1__900
82d1fb0
formula_1__902
uvx harbor run -d bird-bench@parity -t formula_1__902
82d1fb0
formula_1__905
uvx harbor run -d bird-bench@parity -t formula_1__905
82d1fb0
formula_1__912
uvx harbor run -d bird-bench@parity -t formula_1__912
82d1fb0
formula_1__924
uvx harbor run -d bird-bench@parity -t formula_1__924
82d1fb0
formula_1__931
uvx harbor run -d bird-bench@parity -t formula_1__931
82d1fb0
formula_1__936
uvx harbor run -d bird-bench@parity -t formula_1__936
82d1fb0
formula_1__938
uvx harbor run -d bird-bench@parity -t formula_1__938
82d1fb0
formula_1__965
uvx harbor run -d bird-bench@parity -t formula_1__965
82d1fb0
formula_1__972
uvx harbor run -d bird-bench@parity -t formula_1__972
82d1fb0
formula_1__975
uvx harbor run -d bird-bench@parity -t formula_1__975
82d1fb0
formula_1__976
uvx harbor run -d bird-bench@parity -t formula_1__976
82d1fb0
formula_1__989
uvx harbor run -d bird-bench@parity -t formula_1__989
82d1fb0
student_club__1329
uvx harbor run -d bird-bench@parity -t student_club__1329
82d1fb0
student_club__1330
uvx harbor run -d bird-bench@parity -t student_club__1330
82d1fb0
student_club__1336
uvx harbor run -d bird-bench@parity -t student_club__1336
82d1fb0
student_club__1342
uvx harbor run -d bird-bench@parity -t student_club__1342
82d1fb0
student_club__1350
uvx harbor run -d bird-bench@parity -t student_club__1350
82d1fb0
student_club__1357
uvx harbor run -d bird-bench@parity -t student_club__1357
82d1fb0
student_club__1367
uvx harbor run -d bird-bench@parity -t student_club__1367
82d1fb0
student_club__1368
uvx harbor run -d bird-bench@parity -t student_club__1368
82d1fb0
student_club__1385
uvx harbor run -d bird-bench@parity -t student_club__1385
82d1fb0
student_club__1405
uvx harbor run -d bird-bench@parity -t student_club__1405
82d1fb0
student_club__1418
uvx harbor run -d bird-bench@parity -t student_club__1418
82d1fb0
student_club__1419
uvx harbor run -d bird-bench@parity -t student_club__1419
82d1fb0