Skip to content

Commit 1c8b775

Browse files
authored
Merge pull request #1 from cooperbench/faq_section
Faq section
2 parents 6bd6174 + 043d7bd commit 1c8b775

File tree

4 files changed

+158
-1
lines changed

4 files changed

+158
-1
lines changed

src/components/FAQ.astro

Lines changed: 11 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,11 @@
1+
---
2+
export interface Props {
3+
className?: string;
4+
}
5+
6+
const { className = "" } = Astro.props;
7+
---
8+
9+
<div class={`space-y-3 mb-8 not-prose ${className}`}>
10+
<slot />
11+
</div>

src/components/FAQItem.astro

Lines changed: 45 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,45 @@
1+
---
2+
export interface Props {
3+
question: string;
4+
icon?: 'wrench' | 'chart' | 'sparkles';
5+
defaultOpen?: boolean;
6+
}
7+
8+
const { question, icon, defaultOpen = false } = Astro.props;
9+
10+
const icons = {
11+
wrench: `<svg class="w-5 h-5 text-stone-500 flex-shrink-0" fill="none" stroke="currentColor" viewBox="0 0 24 24"><path stroke-linecap="round" stroke-linejoin="round" stroke-width="1.5" d="M11.42 15.17L17.25 21A2.652 2.652 0 0021 17.25l-5.877-5.877M11.42 15.17l2.496-3.03c.317-.384.74-.626 1.208-.766M11.42 15.17l-4.655 5.653a2.548 2.548 0 11-3.586-3.586l6.837-5.63m5.108-.233c.55-.164 1.163-.188 1.743-.14a4.5 4.5 0 004.486-6.336l-3.276 3.277a3.004 3.004 0 01-2.25-2.25l3.276-3.276a4.5 4.5 0 00-6.336 4.486c.091 1.076-.071 2.264-.904 2.95l-.102.085m-1.745 1.437L5.909 7.5H4.5L2.25 3.75l1.5-1.5L7.5 4.5v1.409l4.26 4.26m-1.745 1.437l1.745-1.437m6.615 8.206L15.75 15.75M4.867 19.125h.008v.008h-.008v-.008z" /></svg>`,
12+
chart: `<svg class="w-5 h-5 text-stone-500 flex-shrink-0" fill="none" stroke="currentColor" viewBox="0 0 24 24"><path stroke-linecap="round" stroke-linejoin="round" stroke-width="1.5" d="M3.75 3v11.25A2.25 2.25 0 006 16.5h2.25M3.75 3h-1.5m1.5 0h16.5m0 0h1.5m-1.5 0v11.25A2.25 2.25 0 0118 16.5h-2.25m-7.5 0h7.5m-7.5 0l-1 3m8.5-3l1 3m0 0l.5 1.5m-.5-1.5h-9.5m0 0l-.5 1.5m.75-9l3-3 2.148 2.148A12.061 12.061 0 0116.5 7.605" /></svg>`,
13+
sparkles: `<svg class="w-5 h-5 text-stone-500 flex-shrink-0" fill="none" stroke="currentColor" viewBox="0 0 24 24"><path stroke-linecap="round" stroke-linejoin="round" stroke-width="1.5" d="M9.813 15.904L9 18.75l-.813-2.846a4.5 4.5 0 00-3.09-3.09L2.25 12l2.846-.813a4.5 4.5 0 003.09-3.09L9 5.25l.813 2.846a4.5 4.5 0 003.09 3.09L15.75 12l-2.846.813a4.5 4.5 0 00-3.09 3.09zM18.259 8.715L18 9.75l-.259-1.035a3.375 3.375 0 00-2.455-2.456L14.25 6l1.036-.259a3.375 3.375 0 002.455-2.456L18 2.25l.259 1.035a3.375 3.375 0 002.456 2.456L21.75 6l-1.035.259a3.375 3.375 0 00-2.456 2.456zM16.894 20.567L16.5 21.75l-.394-1.183a2.25 2.25 0 00-1.423-1.423L13.5 18.75l1.183-.394a2.25 2.25 0 001.423-1.423l.394-1.183.394 1.183a2.25 2.25 0 001.423 1.423l1.183.394-1.183.394a2.25 2.25 0 00-1.423 1.423z" /></svg>`
14+
};
15+
---
16+
17+
<details class="group bg-stone-100 rounded-2xl overflow-hidden border border-stone-200" open={defaultOpen}>
18+
<summary class="flex items-center gap-4 p-5 cursor-pointer hover:bg-stone-200 transition-colors">
19+
<svg
20+
class="w-4 h-4 text-stone-400 group-open:rotate-90 transition-transform flex-shrink-0"
21+
fill="currentColor"
22+
viewBox="0 0 20 20"
23+
>
24+
<path
25+
fill-rule="evenodd"
26+
d="M7.21 14.77a.75.75 0 01.02-1.06L11.168 10 7.23 6.29a.75.75 0 111.04-1.08l4.5 4.25a.75.75 0 010 1.08l-4.5 4.25a.75.75 0 01-1.06-.02z"
27+
clip-rule="evenodd"
28+
/>
29+
</svg>
30+
{icon && <Fragment set:html={icons[icon]} />}
31+
<span class="font-semibold text-stone-900">{question}</span>
32+
</summary>
33+
<div class="px-5 pb-5 pl-14 text-stone-600 [&>p]:mb-3 [&>p:last-child]:mb-0">
34+
<slot />
35+
</div>
36+
</details>
37+
38+
<style>
39+
summary {
40+
list-style: none;
41+
}
42+
summary::-webkit-details-marker {
43+
display: none;
44+
}
45+
</style>

src/content/blog/curse-of-coordination.mdx

Lines changed: 20 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -9,6 +9,9 @@ authors:
99
image: "/static/images/hao_zhu.png"
1010
---
1111

12+
import FAQ from '../../components/FAQ.astro';
13+
import FAQItem from '../../components/FAQItem.astro';
14+
1215
{/* TL;DR */}
1316
<div className="mb-10 not-prose py-6 px-6 bg-blue-50 rounded-xl">
1417
<p className="text-xs font-semibold text-blue-900 uppercase tracking-wider mb-3">
@@ -219,3 +222,20 @@ And that's what makes us hopeful. These emergent coordination behaviors give us
219222
Even better, CooperBench isn't just a dataset. It's a live environment. You can drop models in, pair them up, and let them learn to work together through trial and error. The same tasks that expose failures today can be the training ground that fixes them.
220223

221224
The bottleneck for multi-agent systems isn't raw ability. It's social intelligence. But social intelligence can be taught. And now we have a place to teach it.
225+
226+
## FAQ
227+
228+
<FAQ>
229+
<FAQItem question="Wouldn't better orchestration solve this?" icon="wrench">
230+
<p>CooperBench is a general benchmark for evaluating how well agents cooperate when each has its own individual task.</p>
231+
<p>We can definitely see how clever orchestration techniques can help agents perform better on CooperBench. If you are interested in submitting to our benchmark, let us know.</p>
232+
<p>However, our bet is that, in the long run, agents' native ability to coordinate will be more important than any external scaffolding. Scaffolding requires human architects to design the right structures for each new domain. Native ability lets agents figure it out themselves.</p>
233+
<p>We are happy to be proven wrong though!</p>
234+
</FAQItem>
235+
236+
<FAQItem question="Can this actually be improved?" icon="sparkles">
237+
<p>We think so. In successful traces, agents spontaneously developed coordination strategies: dividing roles, claiming resources, negotiating before acting. These behaviors emerged without prompting.</p>
238+
<p>What's missing is reliability. Effective coordination requires <em>theory of mind</em>: tracking what your partner knows, believes, and intends. Current models struggle to maintain these partner models across extended interactions.</p>
239+
<p>CooperBench provides hundreds of examples where coordination succeeds and fails. That's a training signal for the pragmatic and social reasoning that collaboration requires.</p>
240+
</FAQItem>
241+
</FAQ>

src/layouts/BlogPostLayout.astro

Lines changed: 82 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -55,7 +55,7 @@ const { frontmatter, headings } = Astro.props;
5555
<TableOfContents headings={headings} />
5656

5757
<!-- Article Body -->
58-
<div class="prose prose-lg max-w-none">
58+
<div class="max-w-none blog-content">
5959
<slot />
6060
</div>
6161

@@ -126,6 +126,87 @@ const { frontmatter, headings } = Astro.props;
126126
</main>
127127
</BaseLayout>
128128

129+
<style is:global>
130+
.blog-content {
131+
font-size: 1rem;
132+
line-height: 1.8;
133+
color: #4b5563;
134+
}
135+
136+
.blog-content h2 {
137+
font-size: 1.75rem;
138+
font-weight: 700;
139+
color: #111827;
140+
margin-top: 2.5rem;
141+
margin-bottom: 1rem;
142+
line-height: 1.3;
143+
letter-spacing: -0.025em;
144+
}
145+
146+
.blog-content h3 {
147+
font-size: 1.25rem;
148+
font-weight: 600;
149+
color: #1f2937;
150+
margin-top: 2rem;
151+
margin-bottom: 0.75rem;
152+
line-height: 1.4;
153+
}
154+
155+
.blog-content h4 {
156+
font-size: 1.0625rem;
157+
font-weight: 600;
158+
color: #374151;
159+
margin-top: 1.5rem;
160+
margin-bottom: 0.5rem;
161+
}
162+
163+
.blog-content p {
164+
margin-bottom: 1.25rem;
165+
}
166+
167+
.blog-content strong {
168+
color: #1f2937;
169+
font-weight: 600;
170+
}
171+
172+
.blog-content em {
173+
color: #374151;
174+
}
175+
176+
.blog-content figcaption {
177+
font-size: 0.8125rem;
178+
color: #6b7280;
179+
margin-top: 0.75rem;
180+
}
181+
182+
.blog-content blockquote {
183+
font-size: 0.9375rem;
184+
border-left: 3px solid #d1d5db;
185+
padding-left: 1rem;
186+
color: #6b7280;
187+
font-style: normal;
188+
}
189+
190+
.blog-content ul, .blog-content ol {
191+
margin-top: 0.75rem;
192+
margin-bottom: 1.25rem;
193+
}
194+
195+
.blog-content li {
196+
margin-bottom: 0.375rem;
197+
}
198+
199+
.blog-content a {
200+
color: #2563eb;
201+
text-decoration: underline;
202+
text-underline-offset: 2px;
203+
}
204+
205+
.blog-content a:hover {
206+
color: #1d4ed8;
207+
}
208+
</style>
209+
129210
<script>
130211
const scrollBtn = document.querySelector(".scroll-to-top");
131212
if (scrollBtn) {

0 commit comments

Comments
 (0)