cooperbench

v1.0

CooperBench is a multi-agent cooperation benchmark: 652 feature pairs across 12 repositories, each of which requires two agents to coordinate via messaging.

uvx harbor run -d cooperbench@1.0

Tasks (652)

cb-dspy-t8394-f1-3
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8394-f1-3
d6a644d
cb-dspy-t8394-f1-4
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8394-f1-4
d6a644d
cb-dspy-t8394-f1-5
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8394-f1-5
d6a644d
cb-dspy-t8394-f2-3
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8394-f2-3
d6a644d
cb-dspy-t8394-f2-4
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8394-f2-4
d6a644d
cb-dspy-t8394-f2-5
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8394-f2-5
d6a644d
cb-dspy-t8394-f3-4
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8394-f3-4
d6a644d
cb-dspy-t8394-f3-5
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8394-f3-5
d6a644d
cb-dspy-t8394-f4-5
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8394-f4-5
d6a644d
cb-dspy-t8563-f1-2
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8563-f1-2
d6a644d
cb-dspy-t8563-f1-3
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8563-f1-3
d6a644d
cb-dspy-t8563-f1-4
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8563-f1-4
d6a644d
cb-dspy-t8563-f1-5
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8563-f1-5
d6a644d
cb-dspy-t8563-f1-6
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8563-f1-6
d6a644d
cb-dspy-t8563-f2-3
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8563-f2-3
d6a644d
cb-dspy-t8563-f2-4
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8563-f2-4
d6a644d
cb-dspy-t8563-f2-5
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8563-f2-5
d6a644d
cb-dspy-t8563-f2-6
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8563-f2-6
d6a644d
cb-dspy-t8563-f3-4
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8563-f3-4
d6a644d
cb-dspy-t8563-f3-5
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8563-f3-5
d6a644d
cb-dspy-t8563-f3-6
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8563-f3-6
d6a644d
cb-dspy-t8563-f4-5
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8563-f4-5
d6a644d
cb-dspy-t8563-f4-6
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8563-f4-6
d6a644d
cb-dspy-t8563-f5-6
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8563-f5-6
d6a644d
cb-dspy-t8587-f1-2
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8587-f1-2
d6a644d
cb-dspy-t8587-f1-3
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8587-f1-3
d6a644d
cb-dspy-t8587-f1-4
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8587-f1-4
d6a644d
cb-dspy-t8587-f1-5
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8587-f1-5
d6a644d
cb-dspy-t8587-f1-6
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8587-f1-6
d6a644d
cb-dspy-t8587-f2-3
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8587-f2-3
d6a644d
cb-dspy-t8587-f2-4
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8587-f2-4
d6a644d
cb-dspy-t8587-f2-5
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8587-f2-5
d6a644d
cb-dspy-t8587-f2-6
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8587-f2-6
d6a644d
cb-dspy-t8587-f3-4
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8587-f3-4
d6a644d
cb-dspy-t8587-f3-5
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8587-f3-5
d6a644d
cb-dspy-t8587-f3-6
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8587-f3-6
d6a644d
cb-dspy-t8587-f4-5
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8587-f4-5
d6a644d
cb-dspy-t8587-f4-6
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8587-f4-6
d6a644d
cb-dspy-t8587-f5-6
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8587-f5-6
d6a644d
cb-dspy-t8635-f1-2
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8635-f1-2
d6a644d
cb-dspy-t8635-f1-3
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8635-f1-3
d6a644d
cb-dspy-t8635-f1-4
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8635-f1-4
d6a644d
cb-dspy-t8635-f1-5
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8635-f1-5
d6a644d
cb-dspy-t8635-f1-6
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8635-f1-6
d6a644d
cb-dspy-t8635-f2-3
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8635-f2-3
d6a644d
cb-dspy-t8635-f2-4
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8635-f2-4
d6a644d
cb-dspy-t8635-f2-5
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8635-f2-5
d6a644d
cb-dspy-t8635-f2-6
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8635-f2-6
d6a644d
cb-dspy-t8635-f3-4
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8635-f3-4
d6a644d
cb-dspy-t8635-f3-5
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8635-f3-5
d6a644d
cb-dspy-t8635-f3-6
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8635-f3-6
d6a644d
cb-dspy-t8635-f4-5
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8635-f4-5
d6a644d
cb-dspy-t8635-f4-6
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8635-f4-6
d6a644d
cb-dspy-t8635-f5-6
uvx harbor run -d cooperbench@1.0 -t cb-dspy-t8635-f5-6
d6a644d
cb-jinja-t1465-f1-10
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f1-10
d6a644d
cb-jinja-t1465-f1-2
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f1-2
d6a644d
cb-jinja-t1465-f1-3
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f1-3
d6a644d
cb-jinja-t1465-f1-4
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f1-4
d6a644d
cb-jinja-t1465-f1-5
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f1-5
d6a644d
cb-jinja-t1465-f1-6
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f1-6
d6a644d
cb-jinja-t1465-f1-7
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f1-7
d6a644d
cb-jinja-t1465-f1-8
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f1-8
d6a644d
cb-jinja-t1465-f1-9
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f1-9
d6a644d
cb-jinja-t1465-f2-10
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f2-10
d6a644d
cb-jinja-t1465-f2-3
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f2-3
d6a644d
cb-jinja-t1465-f2-4
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f2-4
d6a644d
cb-jinja-t1465-f2-5
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f2-5
d6a644d
cb-jinja-t1465-f2-6
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f2-6
d6a644d
cb-jinja-t1465-f2-7
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f2-7
d6a644d
cb-jinja-t1465-f2-8
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f2-8
d6a644d
cb-jinja-t1465-f2-9
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f2-9
d6a644d
cb-jinja-t1465-f3-10
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f3-10
d6a644d
cb-jinja-t1465-f3-4
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f3-4
d6a644d
cb-jinja-t1465-f3-5
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f3-5
d6a644d
cb-jinja-t1465-f3-6
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f3-6
d6a644d
cb-jinja-t1465-f3-7
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f3-7
d6a644d
cb-jinja-t1465-f3-8
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f3-8
d6a644d
cb-jinja-t1465-f3-9
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f3-9
d6a644d
cb-jinja-t1465-f4-10
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f4-10
d6a644d
cb-jinja-t1465-f4-5
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f4-5
d6a644d
cb-jinja-t1465-f4-6
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f4-6
d6a644d
cb-jinja-t1465-f4-7
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f4-7
d6a644d
cb-jinja-t1465-f4-8
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f4-8
d6a644d
cb-jinja-t1465-f4-9
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f4-9
d6a644d
cb-jinja-t1465-f5-10
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f5-10
d6a644d
cb-jinja-t1465-f5-6
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f5-6
d6a644d
cb-jinja-t1465-f5-7
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f5-7
d6a644d
cb-jinja-t1465-f5-8
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f5-8
d6a644d
cb-jinja-t1465-f5-9
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f5-9
d6a644d
cb-jinja-t1465-f6-10
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f6-10
d6a644d
cb-jinja-t1465-f6-7
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f6-7
d6a644d
cb-jinja-t1465-f6-8
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f6-8
d6a644d
cb-jinja-t1465-f6-9
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f6-9
d6a644d
cb-jinja-t1465-f7-10
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f7-10
d6a644d
cb-jinja-t1465-f7-8
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f7-8
d6a644d
cb-jinja-t1465-f7-9
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f7-9
d6a644d
cb-jinja-t1465-f8-10
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f8-10
d6a644d
cb-jinja-t1465-f8-9
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f8-9
d6a644d
cb-jinja-t1465-f9-10
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1465-f9-10
d6a644d
cb-jinja-t1559-f1-10
uvx harbor run -d cooperbench@1.0 -t cb-jinja-t1559-f1-10
d6a644d