bird-bench
Version: parity. BIRD SQL parity subset (150 tasks, seed 42). Original benchmark: https://huggingface.co/datasets/birdsql/bird_sql_dev_20251106. Adapter: https://github.com/laude-institute/harbor/tree/main/adapters/bird-bench.
uvx harbor run -d bird-bench@parity
Tasks (150)
california_schools__13
uvx harbor run -d bird-bench@parity -t california_schools__13  # b05ea1d
california_schools__23
uvx harbor run -d bird-bench@parity -t california_schools__23  # b05ea1d
california_schools__3
uvx harbor run -d bird-bench@parity -t california_schools__3  # b05ea1d
california_schools__37
uvx harbor run -d bird-bench@parity -t california_schools__37  # b05ea1d
california_schools__43
uvx harbor run -d bird-bench@parity -t california_schools__43  # b05ea1d
california_schools__65
uvx harbor run -d bird-bench@parity -t california_schools__65  # b05ea1d
california_schools__74
uvx harbor run -d bird-bench@parity -t california_schools__74  # b05ea1d
california_schools__75
uvx harbor run -d bird-bench@parity -t california_schools__75  # b05ea1d
california_schools__87
uvx harbor run -d bird-bench@parity -t california_schools__87  # b05ea1d
card_games__350
uvx harbor run -d bird-bench@parity -t card_games__350  # b05ea1d
card_games__362
uvx harbor run -d bird-bench@parity -t card_games__362  # b05ea1d
card_games__402
uvx harbor run -d bird-bench@parity -t card_games__402  # b05ea1d
card_games__410
uvx harbor run -d bird-bench@parity -t card_games__410  # b05ea1d
card_games__412
uvx harbor run -d bird-bench@parity -t card_games__412  # b05ea1d
card_games__438
uvx harbor run -d bird-bench@parity -t card_games__438  # b05ea1d
card_games__444
uvx harbor run -d bird-bench@parity -t card_games__444  # b05ea1d
card_games__445
uvx harbor run -d bird-bench@parity -t card_games__445  # b05ea1d
card_games__450
uvx harbor run -d bird-bench@parity -t card_games__450  # b05ea1d
card_games__451
uvx harbor run -d bird-bench@parity -t card_games__451  # b05ea1d
card_games__454
uvx harbor run -d bird-bench@parity -t card_games__454  # b05ea1d
card_games__458
uvx harbor run -d bird-bench@parity -t card_games__458  # b05ea1d
card_games__469
uvx harbor run -d bird-bench@parity -t card_games__469  # b05ea1d
card_games__474
uvx harbor run -d bird-bench@parity -t card_games__474  # b05ea1d
card_games__487
uvx harbor run -d bird-bench@parity -t card_games__487  # b05ea1d
codebase_community__542
uvx harbor run -d bird-bench@parity -t codebase_community__542  # b05ea1d
codebase_community__545
uvx harbor run -d bird-bench@parity -t codebase_community__545  # b05ea1d
codebase_community__570
uvx harbor run -d bird-bench@parity -t codebase_community__570  # b05ea1d
codebase_community__575
uvx harbor run -d bird-bench@parity -t codebase_community__575  # b05ea1d
codebase_community__579
uvx harbor run -d bird-bench@parity -t codebase_community__579  # b05ea1d
codebase_community__599
uvx harbor run -d bird-bench@parity -t codebase_community__599  # b05ea1d
codebase_community__602
uvx harbor run -d bird-bench@parity -t codebase_community__602  # b05ea1d
codebase_community__620
uvx harbor run -d bird-bench@parity -t codebase_community__620  # b05ea1d
codebase_community__634
uvx harbor run -d bird-bench@parity -t codebase_community__634  # b05ea1d
codebase_community__639
uvx harbor run -d bird-bench@parity -t codebase_community__639  # b05ea1d
codebase_community__643
uvx harbor run -d bird-bench@parity -t codebase_community__643  # b05ea1d
codebase_community__678
uvx harbor run -d bird-bench@parity -t codebase_community__678  # b05ea1d
codebase_community__681
uvx harbor run -d bird-bench@parity -t codebase_community__681  # b05ea1d
codebase_community__688
uvx harbor run -d bird-bench@parity -t codebase_community__688  # b05ea1d
codebase_community__697
uvx harbor run -d bird-bench@parity -t codebase_community__697  # b05ea1d
codebase_community__712
uvx harbor run -d bird-bench@parity -t codebase_community__712  # b05ea1d
codebase_community__715
uvx harbor run -d bird-bench@parity -t codebase_community__715  # b05ea1d
debit_card_specializing__1478
uvx harbor run -d bird-bench@parity -t debit_card_specializing__1478  # b05ea1d
debit_card_specializing__1485
uvx harbor run -d bird-bench@parity -t debit_card_specializing__1485  # b05ea1d
debit_card_specializing__1488
uvx harbor run -d bird-bench@parity -t debit_card_specializing__1488  # b05ea1d
debit_card_specializing__1493
uvx harbor run -d bird-bench@parity -t debit_card_specializing__1493  # b05ea1d
debit_card_specializing__1501
uvx harbor run -d bird-bench@parity -t debit_card_specializing__1501  # b05ea1d
debit_card_specializing__1502
uvx harbor run -d bird-bench@parity -t debit_card_specializing__1502  # b05ea1d
debit_card_specializing__1532
uvx harbor run -d bird-bench@parity -t debit_card_specializing__1532  # b05ea1d
european_football_2__1026
uvx harbor run -d bird-bench@parity -t european_football_2__1026  # b05ea1d
european_football_2__1030
uvx harbor run -d bird-bench@parity -t european_football_2__1030  # b05ea1d
european_football_2__1041
uvx harbor run -d bird-bench@parity -t european_football_2__1041  # b05ea1d
european_football_2__1050
uvx harbor run -d bird-bench@parity -t european_football_2__1050  # b05ea1d
european_football_2__1058
uvx harbor run -d bird-bench@parity -t european_football_2__1058  # b05ea1d
european_football_2__1062
uvx harbor run -d bird-bench@parity -t european_football_2__1062  # b05ea1d
european_football_2__1066
uvx harbor run -d bird-bench@parity -t european_football_2__1066  # b05ea1d
european_football_2__1084
uvx harbor run -d bird-bench@parity -t european_football_2__1084  # b05ea1d
european_football_2__1090
uvx harbor run -d bird-bench@parity -t european_football_2__1090  # b05ea1d
european_football_2__1093
uvx harbor run -d bird-bench@parity -t european_football_2__1093  # b05ea1d
european_football_2__1112
uvx harbor run -d bird-bench@parity -t european_football_2__1112  # b05ea1d
european_football_2__1116
uvx harbor run -d bird-bench@parity -t european_football_2__1116  # b05ea1d
european_football_2__1133
uvx harbor run -d bird-bench@parity -t european_football_2__1133  # b05ea1d
european_football_2__1141
uvx harbor run -d bird-bench@parity -t european_football_2__1141  # b05ea1d
financial__110
uvx harbor run -d bird-bench@parity -t financial__110  # b05ea1d
financial__117
uvx harbor run -d bird-bench@parity -t financial__117  # b05ea1d
financial__118
uvx harbor run -d bird-bench@parity -t financial__118  # b05ea1d
financial__132
uvx harbor run -d bird-bench@parity -t financial__132  # b05ea1d
financial__158
uvx harbor run -d bird-bench@parity -t financial__158  # b05ea1d
financial__181
uvx harbor run -d bird-bench@parity -t financial__181  # b05ea1d
financial__193
uvx harbor run -d bird-bench@parity -t financial__193  # b05ea1d
financial__89
uvx harbor run -d bird-bench@parity -t financial__89  # b05ea1d
financial__90
uvx harbor run -d bird-bench@parity -t financial__90  # b05ea1d
formula_1__1007
uvx harbor run -d bird-bench@parity -t formula_1__1007  # b05ea1d
formula_1__848
uvx harbor run -d bird-bench@parity -t formula_1__848  # b05ea1d
formula_1__876
uvx harbor run -d bird-bench@parity -t formula_1__876  # b05ea1d
formula_1__891
uvx harbor run -d bird-bench@parity -t formula_1__891  # b05ea1d
formula_1__900
uvx harbor run -d bird-bench@parity -t formula_1__900  # b05ea1d
formula_1__902
uvx harbor run -d bird-bench@parity -t formula_1__902  # b05ea1d
formula_1__905
uvx harbor run -d bird-bench@parity -t formula_1__905  # b05ea1d
formula_1__912
uvx harbor run -d bird-bench@parity -t formula_1__912  # b05ea1d
formula_1__924
uvx harbor run -d bird-bench@parity -t formula_1__924  # b05ea1d
formula_1__931
uvx harbor run -d bird-bench@parity -t formula_1__931  # b05ea1d
formula_1__936
uvx harbor run -d bird-bench@parity -t formula_1__936  # b05ea1d
formula_1__938
uvx harbor run -d bird-bench@parity -t formula_1__938  # b05ea1d
formula_1__965
uvx harbor run -d bird-bench@parity -t formula_1__965  # b05ea1d
formula_1__972
uvx harbor run -d bird-bench@parity -t formula_1__972  # b05ea1d
formula_1__975
uvx harbor run -d bird-bench@parity -t formula_1__975  # b05ea1d
formula_1__976
uvx harbor run -d bird-bench@parity -t formula_1__976  # b05ea1d
formula_1__989
uvx harbor run -d bird-bench@parity -t formula_1__989  # b05ea1d
student_club__1329
uvx harbor run -d bird-bench@parity -t student_club__1329  # b05ea1d
student_club__1330
uvx harbor run -d bird-bench@parity -t student_club__1330  # b05ea1d
student_club__1336
uvx harbor run -d bird-bench@parity -t student_club__1336  # b05ea1d
student_club__1342
uvx harbor run -d bird-bench@parity -t student_club__1342  # b05ea1d
student_club__1350
uvx harbor run -d bird-bench@parity -t student_club__1350  # b05ea1d
student_club__1357
uvx harbor run -d bird-bench@parity -t student_club__1357  # b05ea1d
student_club__1367
uvx harbor run -d bird-bench@parity -t student_club__1367  # b05ea1d
student_club__1368
uvx harbor run -d bird-bench@parity -t student_club__1368  # b05ea1d
student_club__1385
uvx harbor run -d bird-bench@parity -t student_club__1385  # b05ea1d
student_club__1405
uvx harbor run -d bird-bench@parity -t student_club__1405  # b05ea1d
student_club__1418
uvx harbor run -d bird-bench@parity -t student_club__1418  # b05ea1d
student_club__1419
uvx harbor run -d bird-bench@parity -t student_club__1419  # b05ea1d