swtbench-verified

v1.0

SWTBench Verified - Software Testing Benchmark for code generation

uvx harbor run -d swtbench-verified@1.0

Tasks (433)

pytest-dev__pytest-5840
uvx harbor run -d swtbench-verified@1.0 -t pytest-dev__pytest-5840
e39578f
pytest-dev__pytest-6197
uvx harbor run -d swtbench-verified@1.0 -t pytest-dev__pytest-6197
e39578f
pytest-dev__pytest-6202
uvx harbor run -d swtbench-verified@1.0 -t pytest-dev__pytest-6202
e39578f
pytest-dev__pytest-7236
uvx harbor run -d swtbench-verified@1.0 -t pytest-dev__pytest-7236
e39578f
pytest-dev__pytest-7324
uvx harbor run -d swtbench-verified@1.0 -t pytest-dev__pytest-7324
e39578f
pytest-dev__pytest-7432
uvx harbor run -d swtbench-verified@1.0 -t pytest-dev__pytest-7432
e39578f
pytest-dev__pytest-7521
uvx harbor run -d swtbench-verified@1.0 -t pytest-dev__pytest-7521
e39578f
pytest-dev__pytest-7982
uvx harbor run -d swtbench-verified@1.0 -t pytest-dev__pytest-7982
e39578f
scikit-learn__scikit-learn-10297
uvx harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-10297
e39578f
scikit-learn__scikit-learn-10844
uvx harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-10844
e39578f
scikit-learn__scikit-learn-10908
uvx harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-10908
e39578f
scikit-learn__scikit-learn-11310
uvx harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-11310
e39578f
scikit-learn__scikit-learn-11578
uvx harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-11578
e39578f
scikit-learn__scikit-learn-12585
uvx harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-12585
e39578f
scikit-learn__scikit-learn-12682
uvx harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-12682
e39578f
scikit-learn__scikit-learn-12973
uvx harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-12973
e39578f
scikit-learn__scikit-learn-13124
uvx harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-13124
e39578f
scikit-learn__scikit-learn-13135
uvx harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-13135
e39578f
scikit-learn__scikit-learn-13142
uvx harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-13142
e39578f
scikit-learn__scikit-learn-13328
uvx harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-13328
e39578f
scikit-learn__scikit-learn-13439
uvx harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-13439
e39578f
scikit-learn__scikit-learn-13496
uvx harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-13496
e39578f
scikit-learn__scikit-learn-13779
uvx harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-13779
e39578f
scikit-learn__scikit-learn-14053
uvx harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-14053
e39578f
scikit-learn__scikit-learn-14087
uvx harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-14087
e39578f
scikit-learn__scikit-learn-14141
uvx harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-14141
e39578f
scikit-learn__scikit-learn-14496
uvx harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-14496
e39578f
scikit-learn__scikit-learn-14629
uvx harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-14629
e39578f
scikit-learn__scikit-learn-14894
uvx harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-14894
e39578f
scikit-learn__scikit-learn-14983
uvx harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-14983
e39578f
scikit-learn__scikit-learn-15100
uvx harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-15100
e39578f
scikit-learn__scikit-learn-9288
uvx harbor run -d swtbench-verified@1.0 -t scikit-learn__scikit-learn-9288
e39578f
sphinx-doc__sphinx-10449
uvx harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-10449
e39578f
sphinx-doc__sphinx-10466
uvx harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-10466
e39578f
sphinx-doc__sphinx-10614
uvx harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-10614
e39578f
sphinx-doc__sphinx-10673
uvx harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-10673
e39578f
sphinx-doc__sphinx-11445
uvx harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-11445
e39578f
sphinx-doc__sphinx-11510
uvx harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-11510
e39578f
sphinx-doc__sphinx-8459
uvx harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-8459
e39578f
sphinx-doc__sphinx-8475
uvx harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-8475
e39578f
sphinx-doc__sphinx-8548
uvx harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-8548
e39578f
sphinx-doc__sphinx-8551
uvx harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-8551
e39578f
sphinx-doc__sphinx-8593
uvx harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-8593
e39578f
sphinx-doc__sphinx-8595
uvx harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-8595
e39578f
sphinx-doc__sphinx-8621
uvx harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-8621
e39578f
sphinx-doc__sphinx-8638
uvx harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-8638
e39578f
sphinx-doc__sphinx-8721
uvx harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-8721
e39578f
sphinx-doc__sphinx-9229
uvx harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-9229
e39578f
sphinx-doc__sphinx-9230
uvx harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-9230
e39578f
sphinx-doc__sphinx-9258
uvx harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-9258
e39578f
sphinx-doc__sphinx-9281
uvx harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-9281
e39578f
sphinx-doc__sphinx-9320
uvx harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-9320
e39578f
sphinx-doc__sphinx-9367
uvx harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-9367
e39578f
sphinx-doc__sphinx-9461
uvx harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-9461
e39578f
sphinx-doc__sphinx-9591
uvx harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-9591
e39578f
sphinx-doc__sphinx-9602
uvx harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-9602
e39578f
sphinx-doc__sphinx-9658
uvx harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-9658
e39578f
sphinx-doc__sphinx-9673
uvx harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-9673
e39578f
sphinx-doc__sphinx-9698
uvx harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-9698
e39578f
sphinx-doc__sphinx-9711
uvx harbor run -d swtbench-verified@1.0 -t sphinx-doc__sphinx-9711
e39578f
sympy__sympy-11618
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-11618
e39578f
sympy__sympy-12096
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-12096
e39578f
sympy__sympy-12419
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-12419
e39578f
sympy__sympy-12481
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-12481
e39578f
sympy__sympy-12489
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-12489
e39578f
sympy__sympy-13031
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-13031
e39578f
sympy__sympy-13372
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-13372
e39578f
sympy__sympy-13480
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-13480
e39578f
sympy__sympy-13551
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-13551
e39578f
sympy__sympy-13615
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-13615
e39578f
sympy__sympy-13647
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-13647
e39578f
sympy__sympy-13757
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-13757
e39578f
sympy__sympy-13798
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-13798
e39578f
sympy__sympy-13852
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-13852
e39578f
sympy__sympy-13877
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-13877
e39578f
sympy__sympy-13974
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-13974
e39578f
sympy__sympy-14248
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-14248
e39578f
sympy__sympy-14531
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-14531
e39578f
sympy__sympy-14711
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-14711
e39578f
sympy__sympy-14976
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-14976
e39578f
sympy__sympy-15017
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-15017
e39578f
sympy__sympy-15345
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-15345
e39578f
sympy__sympy-15349
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-15349
e39578f
sympy__sympy-15599
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-15599
e39578f
sympy__sympy-15809
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-15809
e39578f
sympy__sympy-15875
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-15875
e39578f
sympy__sympy-15976
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-15976
e39578f
sympy__sympy-16450
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-16450
e39578f
sympy__sympy-16597
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-16597
e39578f
sympy__sympy-16766
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-16766
e39578f
sympy__sympy-16792
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-16792
e39578f
sympy__sympy-16886
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-16886
e39578f
sympy__sympy-17139
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-17139
e39578f
sympy__sympy-17318
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-17318
e39578f
sympy__sympy-17630
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-17630
e39578f
sympy__sympy-17655
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-17655
e39578f
sympy__sympy-18189
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-18189
e39578f
sympy__sympy-18199
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-18199
e39578f
sympy__sympy-18211
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-18211
e39578f
sympy__sympy-18698
uvx harbor run -d swtbench-verified@1.0 -t sympy__sympy-18698
e39578f