cooperbench

v1.0

CooperBench is a multi-agent cooperation benchmark: 652 feature pairs across 12 repositories, each pair requiring two agents to coordinate via messaging.

uvx harbor run -d cooperbench@1.0

Tasks (652)

cb-click-t2800-f3-5
uvx harbor run -d cooperbench@1.0 -t cb-click-t2800-f3-5
d6a644d
cb-click-t2800-f3-6
uvx harbor run -d cooperbench@1.0 -t cb-click-t2800-f3-6
d6a644d
cb-click-t2800-f3-7
uvx harbor run -d cooperbench@1.0 -t cb-click-t2800-f3-7
d6a644d
cb-click-t2800-f4-5
uvx harbor run -d cooperbench@1.0 -t cb-click-t2800-f4-5
d6a644d
cb-click-t2800-f4-6
uvx harbor run -d cooperbench@1.0 -t cb-click-t2800-f4-6
d6a644d
cb-click-t2800-f4-7
uvx harbor run -d cooperbench@1.0 -t cb-click-t2800-f4-7
d6a644d
cb-click-t2800-f5-6
uvx harbor run -d cooperbench@1.0 -t cb-click-t2800-f5-6
d6a644d
cb-click-t2800-f5-7
uvx harbor run -d cooperbench@1.0 -t cb-click-t2800-f5-7
d6a644d
cb-click-t2800-f6-7
uvx harbor run -d cooperbench@1.0 -t cb-click-t2800-f6-7
d6a644d
cb-click-t2956-f1-2
uvx harbor run -d cooperbench@1.0 -t cb-click-t2956-f1-2
d6a644d
cb-click-t2956-f1-3
uvx harbor run -d cooperbench@1.0 -t cb-click-t2956-f1-3
d6a644d
cb-click-t2956-f1-4
uvx harbor run -d cooperbench@1.0 -t cb-click-t2956-f1-4
d6a644d
cb-click-t2956-f1-5
uvx harbor run -d cooperbench@1.0 -t cb-click-t2956-f1-5
d6a644d
cb-click-t2956-f1-6
uvx harbor run -d cooperbench@1.0 -t cb-click-t2956-f1-6
d6a644d
cb-click-t2956-f1-7
uvx harbor run -d cooperbench@1.0 -t cb-click-t2956-f1-7
d6a644d
cb-click-t2956-f1-8
uvx harbor run -d cooperbench@1.0 -t cb-click-t2956-f1-8
d6a644d
cb-click-t2956-f2-3
uvx harbor run -d cooperbench@1.0 -t cb-click-t2956-f2-3
d6a644d
cb-click-t2956-f2-4
uvx harbor run -d cooperbench@1.0 -t cb-click-t2956-f2-4
d6a644d
cb-click-t2956-f2-5
uvx harbor run -d cooperbench@1.0 -t cb-click-t2956-f2-5
d6a644d
cb-click-t2956-f2-6
uvx harbor run -d cooperbench@1.0 -t cb-click-t2956-f2-6
d6a644d
cb-click-t2956-f2-7
uvx harbor run -d cooperbench@1.0 -t cb-click-t2956-f2-7
d6a644d
cb-click-t2956-f2-8
uvx harbor run -d cooperbench@1.0 -t cb-click-t2956-f2-8
d6a644d
cb-click-t2956-f3-4
uvx harbor run -d cooperbench@1.0 -t cb-click-t2956-f3-4
d6a644d
cb-click-t2956-f3-5
uvx harbor run -d cooperbench@1.0 -t cb-click-t2956-f3-5
d6a644d
cb-click-t2956-f3-6
uvx harbor run -d cooperbench@1.0 -t cb-click-t2956-f3-6
d6a644d
cb-click-t2956-f3-7
uvx harbor run -d cooperbench@1.0 -t cb-click-t2956-f3-7
d6a644d
cb-click-t2956-f3-8
uvx harbor run -d cooperbench@1.0 -t cb-click-t2956-f3-8
d6a644d
cb-click-t2956-f4-5
uvx harbor run -d cooperbench@1.0 -t cb-click-t2956-f4-5
d6a644d
cb-click-t2956-f4-6
uvx harbor run -d cooperbench@1.0 -t cb-click-t2956-f4-6
d6a644d
cb-click-t2956-f4-7
uvx harbor run -d cooperbench@1.0 -t cb-click-t2956-f4-7
d6a644d
cb-click-t2956-f4-8
uvx harbor run -d cooperbench@1.0 -t cb-click-t2956-f4-8
d6a644d
cb-click-t2956-f5-6
uvx harbor run -d cooperbench@1.0 -t cb-click-t2956-f5-6
d6a644d
cb-click-t2956-f5-7
uvx harbor run -d cooperbench@1.0 -t cb-click-t2956-f5-7
d6a644d
cb-click-t2956-f5-8
uvx harbor run -d cooperbench@1.0 -t cb-click-t2956-f5-8
d6a644d
cb-click-t2956-f6-7
uvx harbor run -d cooperbench@1.0 -t cb-click-t2956-f6-7
d6a644d
cb-click-t2956-f6-8
uvx harbor run -d cooperbench@1.0 -t cb-click-t2956-f6-8
d6a644d
cb-click-t2956-f7-8
uvx harbor run -d cooperbench@1.0 -t cb-click-t2956-f7-8
d6a644d
cb-datasets-t3997-f1-2
uvx harbor run -d cooperbench@1.0 -t cb-datasets-t3997-f1-2
d6a644d
cb-datasets-t3997-f1-3
uvx harbor run -d cooperbench@1.0 -t cb-datasets-t3997-f1-3
d6a644d
cb-datasets-t3997-f1-4
uvx harbor run -d cooperbench@1.0 -t cb-datasets-t3997-f1-4
d6a644d
cb-datasets-t3997-f1-5
uvx harbor run -d cooperbench@1.0 -t cb-datasets-t3997-f1-5
d6a644d
cb-datasets-t3997-f2-3
uvx harbor run -d cooperbench@1.0 -t cb-datasets-t3997-f2-3
d6a644d
cb-datasets-t3997-f2-4
uvx harbor run -d cooperbench@1.0 -t cb-datasets-t3997-f2-4
d6a644d
cb-datasets-t3997-f2-5
uvx harbor run -d cooperbench@1.0 -t cb-datasets-t3997-f2-5
d6a644d
cb-datasets-t3997-f3-4
uvx harbor run -d cooperbench@1.0 -t cb-datasets-t3997-f3-4
d6a644d
cb-datasets-t3997-f3-5
uvx harbor run -d cooperbench@1.0 -t cb-datasets-t3997-f3-5
d6a644d
cb-datasets-t3997-f4-5
uvx harbor run -d cooperbench@1.0 -t cb-datasets-t3997-f4-5
d6a644d
cb-datasets-t6252-f1-2
uvx harbor run -d cooperbench@1.0 -t cb-datasets-t6252-f1-2
d6a644d
cb-datasets-t6252-f1-3
uvx harbor run -d cooperbench@1.0 -t cb-datasets-t6252-f1-3
d6a644d
cb-datasets-t6252-f1-4
uvx harbor run -d cooperbench@1.0 -t cb-datasets-t6252-f1-4
d6a644d
cb-datasets-t6252-f1-5
uvx harbor run -d cooperbench@1.0 -t cb-datasets-t6252-f1-5
d6a644d
cb-datasets-t6252-f1-6
uvx harbor run -d cooperbench@1.0 -t cb-datasets-t6252-f1-6
d6a644d
cb-datasets-t6252-f2-3
uvx harbor run -d cooperbench@1.0 -t cb-datasets-t6252-f2-3
d6a644d
cb-datasets-t6252-f2-4
uvx harbor run -d cooperbench@1.0 -t cb-datasets-t6252-f2-4
d6a644d
cb-datasets-t6252-f2-5
uvx harbor run -d cooperbench@1.0 -t cb-datasets-t6252-f2-5
d6a644d
cb-datasets-t6252-f2-6
uvx harbor run -d cooperbench@1.0 -t cb-datasets-t6252-f2-6
d6a644d
cb-datasets-t6252-f3-4
uvx harbor run -d cooperbench@1.0 -t cb-datasets-t6252-f3-4
d6a644d
cb-datasets-t6252-f3-5
uvx harbor run -d cooperbench@1.0 -t cb-datasets-t6252-f3-5
d6a644d
cb-datasets-t6252-f3-6
uvx harbor run -d cooperbench@1.0 -t cb-datasets-t6252-f3-6
d6a644d
cb-datasets-t6252-f4-5
uvx harbor run -d cooperbench@1.0 -t cb-datasets-t6252-f4-5
d6a644d
cb-datasets-t6252-f4-6
uvx harbor run -d cooperbench@1.0 -t cb-datasets-t6252-f4-6
d6a644d
cb-datasets-t6252-f5-6
uvx harbor run -d cooperbench@1.0 -t cb-datasets-t6252-f5-6
d6a644d
cb-datasets-t7309-f1-2
uvx harbor run -d cooperbench@1.0 -t cb-datasets-t7309-f1-2
d6a644d
cb-dirty-equals-t43-f1-2
uvx harbor run -d cooperbench@1.0 -t cb-dirty-equals-t43-f1-2
d6a644d
cb-dirty-equals-t43-f1-3
uvx harbor run -d cooperbench@1.0 -t cb-dirty-equals-t43-f1-3
d6a644d
cb-dirty-equals-t43-f1-4
uvx harbor run -d cooperbench@1.0 -t cb-dirty-equals-t43-f1-4
d6a644d
cb-dirty-equals-t43-f1-5
uvx harbor run -d cooperbench@1.0 -t cb-dirty-equals-t43-f1-5
d6a644d
cb-dirty-equals-t43-f1-6
uvx harbor run -d cooperbench@1.0 -t cb-dirty-equals-t43-f1-6
d6a644d
cb-dirty-equals-t43-f1-7
uvx harbor run -d cooperbench@1.0 -t cb-dirty-equals-t43-f1-7
d6a644d
cb-dirty-equals-t43-f1-8
uvx harbor run -d cooperbench@1.0 -t cb-dirty-equals-t43-f1-8
d6a644d
cb-dirty-equals-t43-f1-9
uvx harbor run -d cooperbench@1.0 -t cb-dirty-equals-t43-f1-9
d6a644d
cb-dirty-equals-t43-f2-3
uvx harbor run -d cooperbench@1.0 -t cb-dirty-equals-t43-f2-3
d6a644d
cb-dirty-equals-t43-f2-4
uvx harbor run -d cooperbench@1.0 -t cb-dirty-equals-t43-f2-4
d6a644d
cb-dirty-equals-t43-f2-5
uvx harbor run -d cooperbench@1.0 -t cb-dirty-equals-t43-f2-5
d6a644d
cb-dirty-equals-t43-f2-6
uvx harbor run -d cooperbench@1.0 -t cb-dirty-equals-t43-f2-6
d6a644d
cb-dirty-equals-t43-f2-7
uvx harbor run -d cooperbench@1.0 -t cb-dirty-equals-t43-f2-7
d6a644d
cb-dirty-equals-t43-f2-8
uvx harbor run -d cooperbench@1.0 -t cb-dirty-equals-t43-f2-8
d6a644d
cb-dirty-equals-t43-f2-9
uvx harbor run -d cooperbench@1.0 -t cb-dirty-equals-t43-f2-9
d6a644d
cb-dirty-equals-t43-f3-4
uvx harbor run -d cooperbench@1.0 -t cb-dirty-equals-t43-f3-4
d6a644d
cb-dirty-equals-t43-f3-5
uvx harbor run -d cooperbench@1.0 -t cb-dirty-equals-t43-f3-5
d6a644d
cb-dirty-equals-t43-f3-6
uvx harbor run -d cooperbench@1.0 -t cb-dirty-equals-t43-f3-6
d6a644d
cb-dirty-equals-t43-f3-7
uvx harbor run -d cooperbench@1.0 -t cb-dirty-equals-t43-f3-7
d6a644d
cb-dirty-equals-t43-f3-8
uvx harbor run -d cooperbench@1.0 -t cb-dirty-equals-t43-f3-8
d6a644d
cb-dirty-equals-t43-f3-9
uvx harbor run -d cooperbench@1.0 -t cb-dirty-equals-t43-f3-9
d6a644d
cb-dirty-equals-t43-f4-5
uvx harbor run -d cooperbench@1.0 -t cb-dirty-equals-t43-f4-5
d6a644d
cb-dirty-equals-t43-f4-6
uvx harbor run -d cooperbench@1.0 -t cb-dirty-equals-t43-f4-6
d6a644d
cb-dirty-equals-t43-f4-7
uvx harbor run -d cooperbench@1.0 -t cb-dirty-equals-t43-f4-7
d6a644d
cb-dirty-equals-t43-f4-8
uvx harbor run -d cooperbench@1.0 -t cb-dirty-equals-t43-f4-8
d6a644d
cb-dirty-equals-t43-f4-9
uvx harbor run -d cooperbench@1.0 -t cb-dirty-equals-t43-f4-9
d6a644d
cb-dirty-equals-t43-f5-6
uvx harbor run -d cooperbench@1.0 -t cb-dirty-equals-t43-f5-6
d6a644d
cb-dirty-equals-t43-f5-7
uvx harbor run -d cooperbench@1.0 -t cb-dirty-equals-t43-f5-7
d6a644d
cb-dirty-equals-t43-f5-8
uvx harbor run -d cooperbench@1.0 -t cb-dirty-equals-t43-f5-8
d6a644d
cb-dirty-equals-t43-f5-9
uvx harbor run -d cooperbench@1.0 -t cb-dirty-equals-t43-f5-9
d6a644d
cb-dirty-equals-t43-f6-7
uvx harbor run -d cooperbench@1.0 -t cb-dirty-equals-t43-f6-7
d6a644d
cb-dirty-equals-t43-f6-8
uvx harbor run -d cooperbench@1.0 -t cb-dirty-equals-t43-f6-8
d6a644d
cb-dirty-equals-t43-f6-9
uvx harbor run -d cooperbench@1.0 -t cb-dirty-equals-t43-f6-9
d6a644d
cb-dirty-equals-t43-f7-8
uvx harbor run -d cooperbench@1.0 -t cb-dirty-equals-t43-f7-8
d6a644d
cb-dirty-equals-t43-f7-9
uvx harbor run -d cooperbench@1.0 -t cb-dirty-equals-t43-f7-9
d6a644d
cb-dirty-equals-t43-f8-9
uvx harbor run -d cooperbench@1.0 -t cb-dirty-equals-t43-f8-9
d6a644d
cb-dspy-t8394-f1-2
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8394-f1-2
d6a644d