cooperbench
v1.0
CooperBench: multi-agent cooperation benchmark. 652 feature pairs across 12 repos, each requiring two agents to coordinate via messaging.
uvx harbor run -d cooperbench@1.0
Tasks (652)
cb-chi-t26-f1-2
uvx harbor run -d cooperbench@1.0 -t cb-chi-t26-f1-2d6a644d
cb-chi-t26-f1-3
uvx harbor run -d cooperbench@1.0 -t cb-chi-t26-f1-3d6a644d
cb-chi-t26-f1-4
uvx harbor run -d cooperbench@1.0 -t cb-chi-t26-f1-4d6a644d
cb-chi-t26-f2-3
uvx harbor run -d cooperbench@1.0 -t cb-chi-t26-f2-3d6a644d
cb-chi-t26-f2-4
uvx harbor run -d cooperbench@1.0 -t cb-chi-t26-f2-4d6a644d
cb-chi-t26-f3-4
uvx harbor run -d cooperbench@1.0 -t cb-chi-t26-f3-4d6a644d
cb-chi-t27-f1-2
uvx harbor run -d cooperbench@1.0 -t cb-chi-t27-f1-2d6a644d
cb-chi-t27-f1-3
uvx harbor run -d cooperbench@1.0 -t cb-chi-t27-f1-3d6a644d
cb-chi-t27-f1-4
uvx harbor run -d cooperbench@1.0 -t cb-chi-t27-f1-4d6a644d
cb-chi-t27-f2-3
uvx harbor run -d cooperbench@1.0 -t cb-chi-t27-f2-3d6a644d
cb-chi-t27-f2-4
uvx harbor run -d cooperbench@1.0 -t cb-chi-t27-f2-4d6a644d
cb-chi-t27-f3-4
uvx harbor run -d cooperbench@1.0 -t cb-chi-t27-f3-4d6a644d
cb-chi-t56-f1-2
uvx harbor run -d cooperbench@1.0 -t cb-chi-t56-f1-2d6a644d
cb-chi-t56-f1-3
uvx harbor run -d cooperbench@1.0 -t cb-chi-t56-f1-3d6a644d
cb-chi-t56-f1-4
uvx harbor run -d cooperbench@1.0 -t cb-chi-t56-f1-4d6a644d
cb-chi-t56-f1-5
uvx harbor run -d cooperbench@1.0 -t cb-chi-t56-f1-5d6a644d
cb-chi-t56-f2-3
uvx harbor run -d cooperbench@1.0 -t cb-chi-t56-f2-3d6a644d
cb-chi-t56-f2-4
uvx harbor run -d cooperbench@1.0 -t cb-chi-t56-f2-4d6a644d
cb-chi-t56-f2-5
uvx harbor run -d cooperbench@1.0 -t cb-chi-t56-f2-5d6a644d
cb-chi-t56-f3-4
uvx harbor run -d cooperbench@1.0 -t cb-chi-t56-f3-4d6a644d
cb-chi-t56-f3-5
uvx harbor run -d cooperbench@1.0 -t cb-chi-t56-f3-5d6a644d
cb-chi-t56-f4-5
uvx harbor run -d cooperbench@1.0 -t cb-chi-t56-f4-5d6a644d
cb-click-t2068-f1-10
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f1-10d6a644d
cb-click-t2068-f1-11
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f1-11d6a644d
cb-click-t2068-f1-12
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f1-12d6a644d
cb-click-t2068-f1-2
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f1-2d6a644d
cb-click-t2068-f1-3
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f1-3d6a644d
cb-click-t2068-f1-4
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f1-4d6a644d
cb-click-t2068-f1-5
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f1-5d6a644d
cb-click-t2068-f1-6
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f1-6d6a644d
cb-click-t2068-f1-7
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f1-7d6a644d
cb-click-t2068-f1-8
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f1-8d6a644d
cb-click-t2068-f1-9
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f1-9d6a644d
cb-click-t2068-f10-11
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f10-11d6a644d
cb-click-t2068-f10-12
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f10-12d6a644d
cb-click-t2068-f11-12
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f11-12d6a644d
cb-click-t2068-f2-10
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f2-10d6a644d
cb-click-t2068-f2-11
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f2-11d6a644d
cb-click-t2068-f2-12
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f2-12d6a644d
cb-click-t2068-f2-3
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f2-3d6a644d
cb-click-t2068-f2-4
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f2-4d6a644d
cb-click-t2068-f2-5
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f2-5d6a644d
cb-click-t2068-f2-6
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f2-6d6a644d
cb-click-t2068-f2-7
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f2-7d6a644d
cb-click-t2068-f2-8
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f2-8d6a644d
cb-click-t2068-f2-9
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f2-9d6a644d
cb-click-t2068-f3-10
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f3-10d6a644d
cb-click-t2068-f3-11
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f3-11d6a644d
cb-click-t2068-f3-12
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f3-12d6a644d
cb-click-t2068-f3-4
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f3-4d6a644d
cb-click-t2068-f3-5
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f3-5d6a644d
cb-click-t2068-f3-6
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f3-6d6a644d
cb-click-t2068-f3-7
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f3-7d6a644d
cb-click-t2068-f3-8
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f3-8d6a644d
cb-click-t2068-f3-9
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f3-9d6a644d
cb-click-t2068-f4-10
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f4-10d6a644d
cb-click-t2068-f4-11
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f4-11d6a644d
cb-click-t2068-f4-12
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f4-12d6a644d
cb-click-t2068-f4-5
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f4-5d6a644d
cb-click-t2068-f4-6
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f4-6d6a644d
cb-click-t2068-f4-7
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f4-7d6a644d
cb-click-t2068-f4-8
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f4-8d6a644d
cb-click-t2068-f4-9
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f4-9d6a644d
cb-click-t2068-f5-10
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f5-10d6a644d
cb-click-t2068-f5-11
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f5-11d6a644d
cb-click-t2068-f5-12
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f5-12d6a644d
cb-click-t2068-f5-6
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f5-6d6a644d
cb-click-t2068-f5-7
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f5-7d6a644d
cb-click-t2068-f5-8
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f5-8d6a644d
cb-click-t2068-f5-9
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f5-9d6a644d
cb-click-t2068-f6-10
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f6-10d6a644d
cb-click-t2068-f6-11
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f6-11d6a644d
cb-click-t2068-f6-12
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f6-12d6a644d
cb-click-t2068-f6-7
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f6-7d6a644d
cb-click-t2068-f6-8
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f6-8d6a644d
cb-click-t2068-f6-9
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f6-9d6a644d
cb-click-t2068-f7-10
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f7-10d6a644d
cb-click-t2068-f7-11
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f7-11d6a644d
cb-click-t2068-f7-12
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f7-12d6a644d
cb-click-t2068-f7-8
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f7-8d6a644d
cb-click-t2068-f7-9
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f7-9d6a644d
cb-click-t2068-f8-10
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f8-10d6a644d
cb-click-t2068-f8-11
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f8-11d6a644d
cb-click-t2068-f8-12
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f8-12d6a644d
cb-click-t2068-f8-9
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f8-9d6a644d
cb-click-t2068-f9-10
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f9-10d6a644d
cb-click-t2068-f9-11
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f9-11d6a644d
cb-click-t2068-f9-12
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f9-12d6a644d
cb-click-t2800-f1-2
uvx harbor run -d cooperbench@1.0 -t cb-click-t2800-f1-2d6a644d
cb-click-t2800-f1-3
uvx harbor run -d cooperbench@1.0 -t cb-click-t2800-f1-3d6a644d
cb-click-t2800-f1-4
uvx harbor run -d cooperbench@1.0 -t cb-click-t2800-f1-4d6a644d
cb-click-t2800-f1-5
uvx harbor run -d cooperbench@1.0 -t cb-click-t2800-f1-5d6a644d
cb-click-t2800-f1-6
uvx harbor run -d cooperbench@1.0 -t cb-click-t2800-f1-6d6a644d
cb-click-t2800-f1-7
uvx harbor run -d cooperbench@1.0 -t cb-click-t2800-f1-7d6a644d
cb-click-t2800-f2-3
uvx harbor run -d cooperbench@1.0 -t cb-click-t2800-f2-3d6a644d
cb-click-t2800-f2-4
uvx harbor run -d cooperbench@1.0 -t cb-click-t2800-f2-4d6a644d
cb-click-t2800-f2-5
uvx harbor run -d cooperbench@1.0 -t cb-click-t2800-f2-5d6a644d
cb-click-t2800-f2-6
uvx harbor run -d cooperbench@1.0 -t cb-click-t2800-f2-6d6a644d
cb-click-t2800-f2-7
uvx harbor run -d cooperbench@1.0 -t cb-click-t2800-f2-7d6a644d
cb-click-t2800-f3-4
uvx harbor run -d cooperbench@1.0 -t cb-click-t2800-f3-4d6a644d