Skip to content

Commit 16117c7

Browse files
committed
Deploying to gh-pages from @ c20633f 🚀
1 parent b4004a9 commit 16117c7

File tree

6,963 files changed

+8854
-8854
lines changed

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

6,963 files changed

+8854
-8854
lines changed

404.html

Lines changed: 1 addition & 1 deletion
Large diffs are not rendered by default.

404/index.html

Lines changed: 1 addition & 1 deletion
Large diffs are not rendered by default.

__next.!KGhvbWUp.__PAGE__.txt

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -2,6 +2,6 @@
22
2:I[1215,["/jj-benchmark/_next/static/chunks/f04c4ae3c299e41d.js","/jj-benchmark/_next/static/chunks/7b3532f74521bafe.js"],"default"]
33
4:I[75049,["/jj-benchmark/_next/static/chunks/d2c13bb33c4fcd54.js","/jj-benchmark/_next/static/chunks/c21188132e0e0d48.js"],"OutletBoundary"]
44
5:"$Sreact.suspense"
5-
0:{"buildId":"zYbV-FSlGw5lIkET42KmM","rsc":["$","$1","c",{"children":[["$","div",null,{"className":"min-h-screen bg-background text-foreground font-sans selection:bg-primary/20","children":[["$","div",null,{"className":"fixed inset-0 -z-10 h-full w-full bg-background bg-[radial-gradient(#2a2a2a_1px,transparent_1px)] [background-size:16px_16px] [mask-image:radial-gradient(ellipse_50%_50%_at_50%_50%,#000_70%,transparent_100%)] opacity-20 dark:opacity-40"}],["$","div",null,{"className":"container mx-auto px-4 py-16 max-w-6xl","children":[["$","div",null,{"className":"text-center mb-16 space-y-6","children":[["$","div",null,{"className":"inline-flex items-center justify-center p-1.5 rounded-full bg-secondary/50 backdrop-blur-sm border border-border mb-4","children":[["$","span",null,{"className":"flex h-2 w-2 rounded-full bg-emerald-500 mx-2 animate-pulse"}],["$","span",null,{"className":"text-xs font-medium px-2","children":"Live Benchmarks"}]]}],["$","h1",null,{"className":"text-5xl md:text-7xl font-bold tracking-tight bg-clip-text text-transparent bg-gradient-to-b from-foreground to-foreground/50 pb-2","children":"JJ Benchmark"}],["$","p",null,{"className":"text-lg text-muted-foreground max-w-2xl mx-auto leading-relaxed","children":"Performance results of AI coding models on Jujutsu tasks, measuring success rate and execution time with high precision."}],["$","div",null,{"className":"flex items-center justify-center gap-6 text-sm text-muted-foreground pt-4","children":[["$","a",null,{"href":"https://github.com/TabbyML/jj-benchmark","target":"_blank","rel":"noopener noreferrer","className":"flex items-center gap-2 hover:text-primary transition-colors","children":[["$","svg",null,{"xmlns":"http://www.w3.org/2000/svg","width":24,"height":24,"viewBox":"0 0 24 24","fill":"none","stroke":"currentColor","strokeWidth":2,"strokeLinecap":"round","strokeLinejoin":"round","className":"lucide lucide-github w-4 h-4","aria-hidden":"true","children":[["$","path","tonef",{"d":"M15 22v-4a4.8 4.8 0 0 0-1-3.5c3 0 6-2 6-5.5.08-1.25-.27-2.48-1-3.5.28-1.15.28-2.35 0-3.5 0 0-1 0-3 1.5-2.64-.5-5.36-.5-8 0C6 2 5 2 5 2c-.3 1.15-.3 2.35 0 3.5A5.403 5.403 0 0 0 4 9c0 3.5 3 5.5 6 5.5-.39.49-.68 1.05-.85 1.65-.17.6-.22 1.23-.15 1.85v4"}],["$","path","9comsn",{"d":"M9 18c-4.51 2-5-2-7-2"}],"$undefined"]}],["$","span",null,{"children":"View on GitHub"}]]}],["$","div",null,{"className":"h-4 w-px bg-border"}],["$","span",null,{"className":"flex items-center gap-2","children":[["$","svg",null,{"xmlns":"http://www.w3.org/2000/svg","width":24,"height":24,"viewBox":"0 0 24 24","fill":"none","stroke":"currentColor","strokeWidth":2,"strokeLinecap":"round","strokeLinejoin":"round","className":"lucide lucide-terminal w-4 h-4","aria-hidden":"true","children":[["$","path","baeox8",{"d":"M12 19h8"}],["$","path","1yngyt",{"d":"m4 17 6-6-6-6"}],"$undefined"]}],["$","span",null,{"children":["Last run: ","3/16/2026"]}]]}]]}]]}],["$","$L2",null,{"data":[{"id":"1","model":"claude-4-6-sonnet","agent":"Pochi","passedEvals":58,"successRate":92,"avgLatency":128.78561904761906,"isNew":true},{"id":"2","model":"claude-opus-4-6","agent":"Pochi","passedEvals":55,"successRate":87,"avgLatency":102.30577777777775,"isNew":false},{"id":"3","model":"gemini-3.1-pro","agent":"Pochi","passedEvals":53,"successRate":84,"avgLatency":267.562365079365,"isNew":false},{"id":"4","model":"gpt-5.2-codex","agent":"Pochi","passedEvals":52,"successRate":83,"avgLatency":120.62274603174605,"isNew":false},{"id":"5","model":"gpt-5.4","agent":"Pochi","passedEvals":51,"successRate":81,"avgLatency":77.60012698412699,"isNew":false},{"id":"6","model":"kimi-k2.5","agent":"Pochi","passedEvals":50,"successRate":79,"avgLatency":241.03384126984136,"isNew":false},{"id":"7","model":"gemini-3-flash","agent":"Pochi","passedEvals":46,"successRate":73,"avgLatency":207.24031746031756,"isNew":false},{"id":"8","model":"glm-4.7","agent":"Pochi","passedEvals":44,"successRate":70,"avgLatency":185.81307936507937,"isNew":false},{"id":"9","model":"qwen3-coder-480b-A35b-instruct","agent":"Pochi","passedEvals":43,"successRate":68,"avgLatency":124.88849206349207,"isNew":false},{"id":"10","model":"glm-4.7-flash","agent":"Pochi","passedEvals":33,"successRate":52,"avgLatency":114.15141269841268,"isNew":false}]}]]}]]}],[["$","script","script-0",{"src":"/jj-benchmark/_next/static/chunks/f04c4ae3c299e41d.js","async":true}],["$","script","script-1",{"src":"/jj-benchmark/_next/static/chunks/7b3532f74521bafe.js","async":true}]],"$L3"]}],"loading":null,"isPartial":false}
5+
0:{"buildId":"6mp5GVY9QrOEBN6V4ojsn","rsc":["$","$1","c",{"children":[["$","div",null,{"className":"min-h-screen bg-background text-foreground font-sans selection:bg-primary/20","children":[["$","div",null,{"className":"fixed inset-0 -z-10 h-full w-full bg-background bg-[radial-gradient(#2a2a2a_1px,transparent_1px)] [background-size:16px_16px] [mask-image:radial-gradient(ellipse_50%_50%_at_50%_50%,#000_70%,transparent_100%)] opacity-20 dark:opacity-40"}],["$","div",null,{"className":"container mx-auto px-4 py-16 max-w-6xl","children":[["$","div",null,{"className":"text-center mb-16 space-y-6","children":[["$","div",null,{"className":"inline-flex items-center justify-center p-1.5 rounded-full bg-secondary/50 backdrop-blur-sm border border-border mb-4","children":[["$","span",null,{"className":"flex h-2 w-2 rounded-full bg-emerald-500 mx-2 animate-pulse"}],["$","span",null,{"className":"text-xs font-medium px-2","children":"Live Benchmarks"}]]}],["$","h1",null,{"className":"text-5xl md:text-7xl font-bold tracking-tight bg-clip-text text-transparent bg-gradient-to-b from-foreground to-foreground/50 pb-2","children":"JJ Benchmark"}],["$","p",null,{"className":"text-lg text-muted-foreground max-w-2xl mx-auto leading-relaxed","children":"Performance results of AI coding models on Jujutsu tasks, measuring success rate and execution time with high precision."}],["$","div",null,{"className":"flex items-center justify-center gap-6 text-sm text-muted-foreground pt-4","children":[["$","a",null,{"href":"https://github.com/TabbyML/jj-benchmark","target":"_blank","rel":"noopener noreferrer","className":"flex items-center gap-2 hover:text-primary transition-colors","children":[["$","svg",null,{"xmlns":"http://www.w3.org/2000/svg","width":24,"height":24,"viewBox":"0 0 24 24","fill":"none","stroke":"currentColor","strokeWidth":2,"strokeLinecap":"round","strokeLinejoin":"round","className":"lucide lucide-github w-4 h-4","aria-hidden":"true","children":[["$","path","tonef",{"d":"M15 22v-4a4.8 4.8 0 0 0-1-3.5c3 0 6-2 6-5.5.08-1.25-.27-2.48-1-3.5.28-1.15.28-2.35 0-3.5 0 0-1 0-3 1.5-2.64-.5-5.36-.5-8 0C6 2 5 2 5 2c-.3 1.15-.3 2.35 0 3.5A5.403 5.403 0 0 0 4 9c0 3.5 3 5.5 6 5.5-.39.49-.68 1.05-.85 1.65-.17.6-.22 1.23-.15 1.85v4"}],["$","path","9comsn",{"d":"M9 18c-4.51 2-5-2-7-2"}],"$undefined"]}],["$","span",null,{"children":"View on GitHub"}]]}],["$","div",null,{"className":"h-4 w-px bg-border"}],["$","span",null,{"className":"flex items-center gap-2","children":[["$","svg",null,{"xmlns":"http://www.w3.org/2000/svg","width":24,"height":24,"viewBox":"0 0 24 24","fill":"none","stroke":"currentColor","strokeWidth":2,"strokeLinecap":"round","strokeLinejoin":"round","className":"lucide lucide-terminal w-4 h-4","aria-hidden":"true","children":[["$","path","baeox8",{"d":"M12 19h8"}],["$","path","1yngyt",{"d":"m4 17 6-6-6-6"}],"$undefined"]}],["$","span",null,{"children":["Last run: ","3/17/2026"]}]]}]]}]]}],["$","$L2",null,{"data":[{"id":"1","model":"claude-4-6-sonnet","agent":"Pochi","passedEvals":58,"successRate":92,"avgLatency":128.78561904761906,"isNew":true},{"id":"2","model":"claude-opus-4-6","agent":"Pochi","passedEvals":55,"successRate":87,"avgLatency":102.30577777777775,"isNew":false},{"id":"3","model":"gemini-3.1-pro","agent":"Pochi","passedEvals":53,"successRate":84,"avgLatency":267.562365079365,"isNew":false},{"id":"4","model":"gpt-5.2-codex","agent":"Pochi","passedEvals":52,"successRate":83,"avgLatency":120.62274603174605,"isNew":false},{"id":"5","model":"gpt-5.4","agent":"Pochi","passedEvals":51,"successRate":81,"avgLatency":77.60012698412699,"isNew":false},{"id":"6","model":"kimi-k2.5","agent":"Pochi","passedEvals":50,"successRate":79,"avgLatency":241.03384126984136,"isNew":false},{"id":"7","model":"gemini-3-flash","agent":"Pochi","passedEvals":46,"successRate":73,"avgLatency":207.24031746031756,"isNew":false},{"id":"8","model":"glm-4.7","agent":"Pochi","passedEvals":44,"successRate":70,"avgLatency":185.81307936507937,"isNew":false},{"id":"9","model":"qwen3-coder-480b-A35b-instruct","agent":"Pochi","passedEvals":43,"successRate":68,"avgLatency":124.88849206349207,"isNew":false},{"id":"10","model":"glm-4.7-flash","agent":"Pochi","passedEvals":33,"successRate":52,"avgLatency":114.15141269841268,"isNew":false}]}]]}]]}],[["$","script","script-0",{"src":"/jj-benchmark/_next/static/chunks/f04c4ae3c299e41d.js","async":true}],["$","script","script-1",{"src":"/jj-benchmark/_next/static/chunks/7b3532f74521bafe.js","async":true}]],"$L3"]}],"loading":null,"isPartial":false}
66
3:["$","$L4",null,{"children":["$","$5",null,{"name":"Next.MetadataOutlet","children":"$@6"}]}]
77
6:null

__next.!KGhvbWUp.txt

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
11
1:"$Sreact.fragment"
22
2:I[36064,["/jj-benchmark/_next/static/chunks/d2c13bb33c4fcd54.js","/jj-benchmark/_next/static/chunks/c21188132e0e0d48.js"],"default"]
33
3:I[81497,["/jj-benchmark/_next/static/chunks/d2c13bb33c4fcd54.js","/jj-benchmark/_next/static/chunks/c21188132e0e0d48.js"],"default"]
4-
0:{"buildId":"zYbV-FSlGw5lIkET42KmM","rsc":["$","$1","c",{"children":[null,["$","$L2",null,{"parallelRouterKey":"children","template":["$","$L3",null,{}],"notFound":[[["$","title",null,{"children":"404: This page could not be found."}],["$","div",null,{"style":{"fontFamily":"system-ui,\"Segoe UI\",Roboto,Helvetica,Arial,sans-serif,\"Apple Color Emoji\",\"Segoe UI Emoji\"","height":"100vh","textAlign":"center","display":"flex","flexDirection":"column","alignItems":"center","justifyContent":"center"},"children":["$","div",null,{"children":[["$","style",null,{"dangerouslySetInnerHTML":{"__html":"body{color:#000;background:#fff;margin:0}.next-error-h1{border-right:1px solid rgba(0,0,0,.3)}@media (prefers-color-scheme:dark){body{color:#fff;background:#000}.next-error-h1{border-right:1px solid rgba(255,255,255,.3)}}"}}],["$","h1",null,{"className":"next-error-h1","style":{"display":"inline-block","margin":"0 20px 0 0","padding":"0 23px 0 0","fontSize":24,"fontWeight":500,"verticalAlign":"top","lineHeight":"49px"},"children":404}],["$","div",null,{"style":{"display":"inline-block"},"children":["$","h2",null,{"style":{"fontSize":14,"fontWeight":400,"lineHeight":"49px","margin":0},"children":"This page could not be found."}]}]]}]}]],[]]}]]}],"loading":null,"isPartial":false}
4+
0:{"buildId":"6mp5GVY9QrOEBN6V4ojsn","rsc":["$","$1","c",{"children":[null,["$","$L2",null,{"parallelRouterKey":"children","template":["$","$L3",null,{}],"notFound":[[["$","title",null,{"children":"404: This page could not be found."}],["$","div",null,{"style":{"fontFamily":"system-ui,\"Segoe UI\",Roboto,Helvetica,Arial,sans-serif,\"Apple Color Emoji\",\"Segoe UI Emoji\"","height":"100vh","textAlign":"center","display":"flex","flexDirection":"column","alignItems":"center","justifyContent":"center"},"children":["$","div",null,{"children":[["$","style",null,{"dangerouslySetInnerHTML":{"__html":"body{color:#000;background:#fff;margin:0}.next-error-h1{border-right:1px solid rgba(0,0,0,.3)}@media (prefers-color-scheme:dark){body{color:#fff;background:#000}.next-error-h1{border-right:1px solid rgba(255,255,255,.3)}}"}}],["$","h1",null,{"className":"next-error-h1","style":{"display":"inline-block","margin":"0 20px 0 0","padding":"0 23px 0 0","fontSize":24,"fontWeight":500,"verticalAlign":"top","lineHeight":"49px"},"children":404}],["$","div",null,{"style":{"display":"inline-block"},"children":["$","h2",null,{"style":{"fontSize":14,"fontWeight":400,"lineHeight":"49px","margin":0},"children":"This page could not be found."}]}]]}]}]],[]]}]]}],"loading":null,"isPartial":false}

0 commit comments

Comments
 (0)