cooperbench

v1.0

CooperBench is a multi-agent cooperation benchmark: 652 feature pairs across 12 repos, each pair requiring two agents to coordinate via messaging.

uvx harbor run -d cooperbench@1.0

Tasks (652)

cb-chi-t26-f1-2
uvx harbor run -d cooperbench@1.0 -t cb-chi-t26-f1-2
d6a644d
cb-chi-t26-f1-3
uvx harbor run -d cooperbench@1.0 -t cb-chi-t26-f1-3
d6a644d
cb-chi-t26-f1-4
uvx harbor run -d cooperbench@1.0 -t cb-chi-t26-f1-4
d6a644d
cb-chi-t26-f2-3
uvx harbor run -d cooperbench@1.0 -t cb-chi-t26-f2-3
d6a644d
cb-chi-t26-f2-4
uvx harbor run -d cooperbench@1.0 -t cb-chi-t26-f2-4
d6a644d
cb-chi-t26-f3-4
uvx harbor run -d cooperbench@1.0 -t cb-chi-t26-f3-4
d6a644d
cb-chi-t27-f1-2
uvx harbor run -d cooperbench@1.0 -t cb-chi-t27-f1-2
d6a644d
cb-chi-t27-f1-3
uvx harbor run -d cooperbench@1.0 -t cb-chi-t27-f1-3
d6a644d
cb-chi-t27-f1-4
uvx harbor run -d cooperbench@1.0 -t cb-chi-t27-f1-4
d6a644d
cb-chi-t27-f2-3
uvx harbor run -d cooperbench@1.0 -t cb-chi-t27-f2-3
d6a644d
cb-chi-t27-f2-4
uvx harbor run -d cooperbench@1.0 -t cb-chi-t27-f2-4
d6a644d
cb-chi-t27-f3-4
uvx harbor run -d cooperbench@1.0 -t cb-chi-t27-f3-4
d6a644d
cb-chi-t56-f1-2
uvx harbor run -d cooperbench@1.0 -t cb-chi-t56-f1-2
d6a644d
cb-chi-t56-f1-3
uvx harbor run -d cooperbench@1.0 -t cb-chi-t56-f1-3
d6a644d
cb-chi-t56-f1-4
uvx harbor run -d cooperbench@1.0 -t cb-chi-t56-f1-4
d6a644d
cb-chi-t56-f1-5
uvx harbor run -d cooperbench@1.0 -t cb-chi-t56-f1-5
d6a644d
cb-chi-t56-f2-3
uvx harbor run -d cooperbench@1.0 -t cb-chi-t56-f2-3
d6a644d
cb-chi-t56-f2-4
uvx harbor run -d cooperbench@1.0 -t cb-chi-t56-f2-4
d6a644d
cb-chi-t56-f2-5
uvx harbor run -d cooperbench@1.0 -t cb-chi-t56-f2-5
d6a644d
cb-chi-t56-f3-4
uvx harbor run -d cooperbench@1.0 -t cb-chi-t56-f3-4
d6a644d
cb-chi-t56-f3-5
uvx harbor run -d cooperbench@1.0 -t cb-chi-t56-f3-5
d6a644d
cb-chi-t56-f4-5
uvx harbor run -d cooperbench@1.0 -t cb-chi-t56-f4-5
d6a644d
cb-click-t2068-f1-10
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f1-10
d6a644d
cb-click-t2068-f1-11
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f1-11
d6a644d
cb-click-t2068-f1-12
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f1-12
d6a644d
cb-click-t2068-f1-2
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f1-2
d6a644d
cb-click-t2068-f1-3
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f1-3
d6a644d
cb-click-t2068-f1-4
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f1-4
d6a644d
cb-click-t2068-f1-5
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f1-5
d6a644d
cb-click-t2068-f1-6
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f1-6
d6a644d
cb-click-t2068-f1-7
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f1-7
d6a644d
cb-click-t2068-f1-8
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f1-8
d6a644d
cb-click-t2068-f1-9
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f1-9
d6a644d
cb-click-t2068-f10-11
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f10-11
d6a644d
cb-click-t2068-f10-12
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f10-12
d6a644d
cb-click-t2068-f11-12
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f11-12
d6a644d
cb-click-t2068-f2-10
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f2-10
d6a644d
cb-click-t2068-f2-11
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f2-11
d6a644d
cb-click-t2068-f2-12
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f2-12
d6a644d
cb-click-t2068-f2-3
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f2-3
d6a644d
cb-click-t2068-f2-4
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f2-4
d6a644d
cb-click-t2068-f2-5
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f2-5
d6a644d
cb-click-t2068-f2-6
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f2-6
d6a644d
cb-click-t2068-f2-7
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f2-7
d6a644d
cb-click-t2068-f2-8
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f2-8
d6a644d
cb-click-t2068-f2-9
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f2-9
d6a644d
cb-click-t2068-f3-10
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f3-10
d6a644d
cb-click-t2068-f3-11
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f3-11
d6a644d
cb-click-t2068-f3-12
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f3-12
d6a644d
cb-click-t2068-f3-4
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f3-4
d6a644d
cb-click-t2068-f3-5
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f3-5
d6a644d
cb-click-t2068-f3-6
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f3-6
d6a644d
cb-click-t2068-f3-7
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f3-7
d6a644d
cb-click-t2068-f3-8
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f3-8
d6a644d
cb-click-t2068-f3-9
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f3-9
d6a644d
cb-click-t2068-f4-10
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f4-10
d6a644d
cb-click-t2068-f4-11
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f4-11
d6a644d
cb-click-t2068-f4-12
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f4-12
d6a644d
cb-click-t2068-f4-5
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f4-5
d6a644d
cb-click-t2068-f4-6
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f4-6
d6a644d
cb-click-t2068-f4-7
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f4-7
d6a644d
cb-click-t2068-f4-8
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f4-8
d6a644d
cb-click-t2068-f4-9
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f4-9
d6a644d
cb-click-t2068-f5-10
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f5-10
d6a644d
cb-click-t2068-f5-11
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f5-11
d6a644d
cb-click-t2068-f5-12
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f5-12
d6a644d
cb-click-t2068-f5-6
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f5-6
d6a644d
cb-click-t2068-f5-7
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f5-7
d6a644d
cb-click-t2068-f5-8
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f5-8
d6a644d
cb-click-t2068-f5-9
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f5-9
d6a644d
cb-click-t2068-f6-10
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f6-10
d6a644d
cb-click-t2068-f6-11
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f6-11
d6a644d
cb-click-t2068-f6-12
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f6-12
d6a644d
cb-click-t2068-f6-7
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f6-7
d6a644d
cb-click-t2068-f6-8
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f6-8
d6a644d
cb-click-t2068-f6-9
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f6-9
d6a644d
cb-click-t2068-f7-10
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f7-10
d6a644d
cb-click-t2068-f7-11
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f7-11
d6a644d
cb-click-t2068-f7-12
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f7-12
d6a644d
cb-click-t2068-f7-8
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f7-8
d6a644d
cb-click-t2068-f7-9
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f7-9
d6a644d
cb-click-t2068-f8-10
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f8-10
d6a644d
cb-click-t2068-f8-11
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f8-11
d6a644d
cb-click-t2068-f8-12
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f8-12
d6a644d
cb-click-t2068-f8-9
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f8-9
d6a644d
cb-click-t2068-f9-10
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f9-10
d6a644d
cb-click-t2068-f9-11
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f9-11
d6a644d
cb-click-t2068-f9-12
uvx harbor run -d cooperbench@1.0 -t cb-click-t2068-f9-12
d6a644d
cb-click-t2800-f1-2
uvx harbor run -d cooperbench@1.0 -t cb-click-t2800-f1-2
d6a644d
cb-click-t2800-f1-3
uvx harbor run -d cooperbench@1.0 -t cb-click-t2800-f1-3
d6a644d
cb-click-t2800-f1-4
uvx harbor run -d cooperbench@1.0 -t cb-click-t2800-f1-4
d6a644d
cb-click-t2800-f1-5
uvx harbor run -d cooperbench@1.0 -t cb-click-t2800-f1-5
d6a644d
cb-click-t2800-f1-6
uvx harbor run -d cooperbench@1.0 -t cb-click-t2800-f1-6
d6a644d
cb-click-t2800-f1-7
uvx harbor run -d cooperbench@1.0 -t cb-click-t2800-f1-7
d6a644d
cb-click-t2800-f2-3
uvx harbor run -d cooperbench@1.0 -t cb-click-t2800-f2-3
d6a644d
cb-click-t2800-f2-4
uvx harbor run -d cooperbench@1.0 -t cb-click-t2800-f2-4
d6a644d
cb-click-t2800-f2-5
uvx harbor run -d cooperbench@1.0 -t cb-click-t2800-f2-5
d6a644d
cb-click-t2800-f2-6
uvx harbor run -d cooperbench@1.0 -t cb-click-t2800-f2-6
d6a644d
cb-click-t2800-f2-7
uvx harbor run -d cooperbench@1.0 -t cb-click-t2800-f2-7
d6a644d
cb-click-t2800-f3-4
uvx harbor run -d cooperbench@1.0 -t cb-click-t2800-f3-4
d6a644d