File tree 14 files changed +80
-14
lines changed
14 files changed +80
-14
lines changed Original file line number Diff line number Diff line change 12
12
13
13
14
14
<link rel="icon" href="/assets/images/favicon.png">
15
- <meta name="generator" content="mkdocs-1.6.1, mkdocs-material-9.5.42">
15
+ <meta name="generator" content="mkdocs-1.6.1, mkdocs-material-9.5.43">
16
16
17
17
18
18
Original file line number Diff line number Diff line change 12
12
13
13
14
14
<link rel="icon" href="../assets/images/favicon.png">
15
- <meta name="generator" content="mkdocs-1.6.1, mkdocs-material-9.5.42">
15
+ <meta name="generator" content="mkdocs-1.6.1, mkdocs-material-9.5.43">
16
16
17
17
18
18
Original file line number Diff line number Diff line change 12
12
13
13
14
14
<link rel="icon" href="../../assets/images/favicon.png">
15
- <meta name="generator" content="mkdocs-1.6.1, mkdocs-material-9.5.42">
15
+ <meta name="generator" content="mkdocs-1.6.1, mkdocs-material-9.5.43">
16
16
17
17
18
18
Original file line number Diff line number Diff line change 12
12
13
13
14
14
<link rel="icon" href="../assets/images/favicon.png">
15
- <meta name="generator" content="mkdocs-1.6.1, mkdocs-material-9.5.42">
15
+ <meta name="generator" content="mkdocs-1.6.1, mkdocs-material-9.5.43">
16
16
17
17
18
18
Original file line number Diff line number Diff line change 12
12
13
13
14
14
<link rel="icon" href="../../assets/images/favicon.png">
15
- <meta name="generator" content="mkdocs-1.6.1, mkdocs-material-9.5.42">
15
+ <meta name="generator" content="mkdocs-1.6.1, mkdocs-material-9.5.43">
16
16
17
17
18
18
Original file line number Diff line number Diff line change 12
12
13
13
14
14
<link rel="icon" href="../../assets/images/favicon.png">
15
- <meta name="generator" content="mkdocs-1.6.1, mkdocs-material-9.5.42">
15
+ <meta name="generator" content="mkdocs-1.6.1, mkdocs-material-9.5.43">
16
16
17
17
18
18
Original file line number Diff line number Diff line change 16
16
17
17
18
18
<link rel="icon" href="../assets/images/favicon.png">
19
- <meta name="generator" content="mkdocs-1.6.1, mkdocs-material-9.5.42">
19
+ <meta name="generator" content="mkdocs-1.6.1, mkdocs-material-9.5.43">
20
20
21
21
22
22
Original file line number Diff line number Diff line change 16
16
17
17
18
18
<link rel="icon" href="../assets/images/favicon.png">
19
- <meta name="generator" content="mkdocs-1.6.1, mkdocs-material-9.5.42">
19
+ <meta name="generator" content="mkdocs-1.6.1, mkdocs-material-9.5.43">
20
20
21
21
22
22
Original file line number Diff line number Diff line change 14
14
15
15
16
16
<link rel="icon" href="assets/images/favicon.png">
17
- <meta name="generator" content="mkdocs-1.6.1, mkdocs-material-9.5.42">
17
+ <meta name="generator" content="mkdocs-1.6.1, mkdocs-material-9.5.43">
18
18
19
19
20
20
Original file line number Diff line number Diff line change 14
14
15
15
16
16
<link rel="icon" href="../assets/images/favicon.png">
17
- <meta name="generator" content="mkdocs-1.6.1, mkdocs-material-9.5.42">
17
+ <meta name="generator" content="mkdocs-1.6.1, mkdocs-material-9.5.43">
18
18
19
19
20
20
546
546
547
547
<h1 id="leaderboard">Leaderboard</h1>
548
548
<p><center></p>
549
- <p>Under construction</p>
549
+ <h1 id="scicode-leaderboard">SciCode Leaderboard</h1>
550
+ <table>
551
+ <thead>
552
+ <tr>
553
+ <th>Model</th>
554
+ <th>Main Problem Resolve Rate</th>
555
+ </tr>
556
+ </thead>
557
+ <tbody>
558
+ <tr>
559
+ <td>OpenAI o1-preview</td>
560
+ <td>7.7%</td>
561
+ </tr>
562
+ <tr>
563
+ <td>Claude3.5-Sonnet</td>
564
+ <td>4.6%</td>
565
+ </tr>
566
+ <tr>
567
+ <td>Deepseek-Coder-v2</td>
568
+ <td>3.1%</td>
569
+ </tr>
570
+ <tr>
571
+ <td>GPT-4o</td>
572
+ <td>1.5%</td>
573
+ </tr>
574
+ <tr>
575
+ <td>GPT-4-Turbo</td>
576
+ <td>1.5%</td>
577
+ </tr>
578
+ <tr>
579
+ <td>OpenAI o1-mini</td>
580
+ <td>1.5%</td>
581
+ </tr>
582
+ <tr>
583
+ <td>Gemini 1.5 Pro</td>
584
+ <td>1.5%</td>
585
+ </tr>
586
+ <tr>
587
+ <td>Claude3-Opus</td>
588
+ <td>1.5%</td>
589
+ </tr>
590
+ <tr>
591
+ <td>Claude3-Sonnet</td>
592
+ <td>1.5%</td>
593
+ </tr>
594
+ <tr>
595
+ <td>Qwen2-72B-Instruct</td>
596
+ <td>1.5%</td>
597
+ </tr>
598
+ <tr>
599
+ <td>Llama-3.1-405B-Instruct</td>
600
+ <td>0%</td>
601
+ </tr>
602
+ <tr>
603
+ <td>Llama-3.1-70B-Instruct</td>
604
+ <td>0%</td>
605
+ </tr>
606
+ <tr>
607
+ <td>Mixtral-8x22B-Instruct</td>
608
+ <td>0%</td>
609
+ </tr>
610
+ <tr>
611
+ <td>Llama-3-70B-Chat</td>
612
+ <td>0%</td>
613
+ </tr>
614
+ </tbody>
615
+ </table>
550
616
<!-- Once you've added the results to the submission repository,
551
617
bring back the table here -->
552
618
<!-- include-markdown "leaderboard_table.md" -->
Original file line number Diff line number Diff line change 12
12
13
13
14
14
<link rel="icon" href="../assets/images/favicon.png">
15
- <meta name="generator" content="mkdocs-1.6.1, mkdocs-material-9.5.42">
15
+ <meta name="generator" content="mkdocs-1.6.1, mkdocs-material-9.5.43">
16
16
17
17
18
18
Original file line number Diff line number Diff line change 16
16
17
17
18
18
<link rel="icon" href="../assets/images/favicon.png">
19
- <meta name="generator" content="mkdocs-1.6.1, mkdocs-material-9.5.42">
19
+ <meta name="generator" content="mkdocs-1.6.1, mkdocs-material-9.5.43">
20
20
21
21
22
22
Load Diff Large diffs are not rendered by default.
You can’t perform that action at this time.
0 commit comments