swtbench-verified

v1.0

SWTBench Verified - Software Testing Benchmark for code generation

harbor run -d swtbench-verified@1.0

Tasks (433)

pytest-dev__pytest-5840
harbor run -d swtbench-verified@1.0 -t pytest-dev__pytest-5840
e39578f
pytest-dev__pytest-6197
harbor run -d swtbench-verified@1.0 -t pytest-dev__pytest-6197
e39578f
pytest-dev__pytest-6202
harbor run -d swtbench-verified@1.0 -t pytest-dev__pytest-6202
e39578f
pytest-dev__pytest-7236
harbor run -d swtbench-verified@1.0 -t pytest-dev__pytest-7236
e39578f
pytest-dev__pytest-7324
harbor run -d swtbench-verified@1.0 -t pytest-dev__pytest-7324
e39578f
pytest-dev__pytest-7432
harbor run -d swtbench-verified@1.0 -t pytest-dev__pytest-7432
e39578f
pytest-dev__pytest-7521
harbor run -d swtbench-verified@1.0 -t pytest-dev__pytest-7521
e39578f
pytest-dev__pytest-7982
harbor run -d swtbench-verified@1.0 -t pytest-dev__pytest-7982
e39578f
scikit-learn__scikit-learn-10297
harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-10297
e39578f
scikit-learn__scikit-learn-10844
harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-10844
e39578f
scikit-learn__scikit-learn-10908
harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-10908
e39578f
scikit-learn__scikit-learn-11310
harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-11310
e39578f
scikit-learn__scikit-learn-11578
harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-11578
e39578f
scikit-learn__scikit-learn-12585
harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-12585
e39578f
scikit-learn__scikit-learn-12682
harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-12682
e39578f
scikit-learn__scikit-learn-12973
harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-12973
e39578f
scikit-learn__scikit-learn-13124
harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-13124
e39578f
scikit-learn__scikit-learn-13135
harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-13135
e39578f
scikit-learn__scikit-learn-13142
harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-13142
e39578f
scikit-learn__scikit-learn-13328
harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-13328
e39578f
scikit-learn__scikit-learn-13439
harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-13439
e39578f
scikit-learn__scikit-learn-13496
harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-13496
e39578f
scikit-learn__scikit-learn-13779
harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-13779
e39578f
scikit-learn__scikit-learn-14053
harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-14053
e39578f
scikit-learn__scikit-learn-14087
harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-14087
e39578f
scikit-learn__scikit-learn-14141
harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-14141
e39578f
scikit-learn__scikit-learn-14496
harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-14496
e39578f
scikit-learn__scikit-learn-14629
harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-14629
e39578f
scikit-learn__scikit-learn-14894
harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-14894
e39578f
scikit-learn__scikit-learn-14983
harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-14983
e39578f
scikit-learn__scikit-learn-15100
harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-15100
e39578f
scikit-learn__scikit-learn-9288
harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-9288
e39578f
sphinx-doc__sphinx-10449
harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-10449
e39578f
sphinx-doc__sphinx-10466
harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-10466
e39578f
sphinx-doc__sphinx-10614
harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-10614
e39578f
sphinx-doc__sphinx-10673
harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-10673
e39578f
sphinx-doc__sphinx-11445
harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-11445
e39578f
sphinx-doc__sphinx-11510
harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-11510
e39578f
sphinx-doc__sphinx-8459
harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-8459
e39578f
sphinx-doc__sphinx-8475
harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-8475
e39578f
sphinx-doc__sphinx-8548
harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-8548
e39578f
sphinx-doc__sphinx-8551
harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-8551
e39578f
sphinx-doc__sphinx-8593
harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-8593
e39578f
sphinx-doc__sphinx-8595
harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-8595
e39578f
sphinx-doc__sphinx-8621
harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-8621
e39578f
sphinx-doc__sphinx-8638
harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-8638
e39578f
sphinx-doc__sphinx-8721
harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-8721
e39578f
sphinx-doc__sphinx-9229
harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-9229
e39578f
sphinx-doc__sphinx-9230
harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-9230
e39578f
sphinx-doc__sphinx-9258
harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-9258
e39578f
sphinx-doc__sphinx-9281
harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-9281
e39578f
sphinx-doc__sphinx-9320
harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-9320
e39578f
sphinx-doc__sphinx-9367
harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-9367
e39578f
sphinx-doc__sphinx-9461
harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-9461
e39578f
sphinx-doc__sphinx-9591
harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-9591
e39578f
sphinx-doc__sphinx-9602
harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-9602
e39578f
sphinx-doc__sphinx-9658
harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-9658
e39578f
sphinx-doc__sphinx-9673
harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-9673
e39578f
sphinx-doc__sphinx-9698
harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-9698
e39578f
sphinx-doc__sphinx-9711
harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-9711
e39578f
sympy__sympy-11618
harbor run -d swtbench-verified@1.0 -t sympy__sympy-11618
e39578f
sympy__sympy-12096
harbor run -d swtbench-verified@1.0 -t sympy__sympy-12096
e39578f
sympy__sympy-12419
harbor run -d swtbench-verified@1.0 -t sympy__sympy-12419
e39578f
sympy__sympy-12481
harbor run -d swtbench-verified@1.0 -t sympy__sympy-12481
e39578f
sympy__sympy-12489
harbor run -d swtbench-verified@1.0 -t sympy__sympy-12489
e39578f
sympy__sympy-13031
harbor run -d swtbench-verified@1.0 -t sympy__sympy-13031
e39578f
sympy__sympy-13372
harbor run -d swtbench-verified@1.0 -t sympy__sympy-13372
e39578f
sympy__sympy-13480
harbor run -d swtbench-verified@1.0 -t sympy__sympy-13480
e39578f
sympy__sympy-13551
harbor run -d swtbench-verified@1.0 -t sympy__sympy-13551
e39578f
sympy__sympy-13615
harbor run -d swtbench-verified@1.0 -t sympy__sympy-13615
e39578f
sympy__sympy-13647
harbor run -d swtbench-verified@1.0 -t sympy__sympy-13647
e39578f
sympy__sympy-13757
harbor run -d swtbench-verified@1.0 -t sympy__sympy-13757
e39578f
sympy__sympy-13798
harbor run -d swtbench-verified@1.0 -t sympy__sympy-13798
e39578f
sympy__sympy-13852
harbor run -d swtbench-verified@1.0 -t sympy__sympy-13852
e39578f
sympy__sympy-13877
harbor run -d swtbench-verified@1.0 -t sympy__sympy-13877
e39578f
sympy__sympy-13974
harbor run -d swtbench-verified@1.0 -t sympy__sympy-13974
e39578f
sympy__sympy-14248
harbor run -d swtbench-verified@1.0 -t sympy__sympy-14248
e39578f
sympy__sympy-14531
harbor run -d swtbench-verified@1.0 -t sympy__sympy-14531
e39578f
sympy__sympy-14711
harbor run -d swtbench-verified@1.0 -t sympy__sympy-14711
e39578f
sympy__sympy-14976
harbor run -d swtbench-verified@1.0 -t sympy__sympy-14976
e39578f
sympy__sympy-15017
harbor run -d swtbench-verified@1.0 -t sympy__sympy-15017
e39578f
sympy__sympy-15345
harbor run -d swtbench-verified@1.0 -t sympy__sympy-15345
e39578f
sympy__sympy-15349
harbor run -d swtbench-verified@1.0 -t sympy__sympy-15349
e39578f
sympy__sympy-15599
harbor run -d swtbench-verified@1.0 -t sympy__sympy-15599
e39578f
sympy__sympy-15809
harbor run -d swtbench-verified@1.0 -t sympy__sympy-15809
e39578f
sympy__sympy-15875
harbor run -d swtbench-verified@1.0 -t sympy__sympy-15875
e39578f
sympy__sympy-15976
harbor run -d swtbench-verified@1.0 -t sympy__sympy-15976
e39578f
sympy__sympy-16450
harbor run -d swtbench-verified@1.0 -t sympy__sympy-16450
e39578f
sympy__sympy-16597
harbor run -d swtbench-verified@1.0 -t sympy__sympy-16597
e39578f
sympy__sympy-16766
harbor run -d swtbench-verified@1.0 -t sympy__sympy-16766
e39578f
sympy__sympy-16792
harbor run -d swtbench-verified@1.0 -t sympy__sympy-16792
e39578f
sympy__sympy-16886
harbor run -d swtbench-verified@1.0 -t sympy__sympy-16886
e39578f
sympy__sympy-17139
harbor run -d swtbench-verified@1.0 -t sympy__sympy-17139
e39578f
sympy__sympy-17318
harbor run -d swtbench-verified@1.0 -t sympy__sympy-17318
e39578f
sympy__sympy-17630
harbor run -d swtbench-verified@1.0 -t sympy__sympy-17630
e39578f
sympy__sympy-17655
harbor run -d swtbench-verified@1.0 -t sympy__sympy-17655
e39578f
sympy__sympy-18189
harbor run -d swtbench-verified@1.0 -t sympy__sympy-18189
e39578f
sympy__sympy-18199
harbor run -d swtbench-verified@1.0 -t sympy__sympy-18199
e39578f
sympy__sympy-18211
harbor run -d swtbench-verified@1.0 -t sympy__sympy-18211
e39578f
sympy__sympy-18698
harbor run -d swtbench-verified@1.0 -t sympy__sympy-18698
e39578f