@@ -552,88 +552,88 @@ <h1 id="scicode-leaderboard">SciCode Leaderboard</h1>
552
552
< tr >
553
553
< th > Models</ th >
554
554
< th > Main Problem Resolve Rate</ th >
555
- < th > < span style ="background- color:lightgrey "> Subproblem</ span > </ th >
555
+ < th > < span style ="color:grey "> Subproblem</ span > </ th >
556
556
</ tr >
557
557
</ thead >
558
558
< tbody >
559
559
< tr >
560
560
< td > 🥇 OpenAI o1-preview</ td >
561
- < td > < div align ="center "> 7.7</ div > </ td >
562
- < td > < div align ="center " style ="background- color:lightgrey "> 28.5</ div > </ td >
561
+ < td > < div align ="center "> < strong > 7.7</ strong > </ div > </ td >
562
+ < td > < div align ="center " style ="color:grey "> 28.5</ div > </ td >
563
563
</ tr >
564
564
< tr >
565
565
< td > 🥈 Claude3.5-Sonnet</ td >
566
- < td > < div align ="center "> 4.6</ div > </ td >
567
- < td > < div align ="center " style ="background- color:lightgrey "> 26.0</ div > </ td >
566
+ < td > < div align ="center "> < strong > 4.6</ strong > </ div > </ td >
567
+ < td > < div align ="center " style ="color:grey "> 26.0</ div > </ td >
568
568
</ tr >
569
569
< tr >
570
570
< td > 🥉 Claude3.5-Sonnet (new)</ td >
571
- < td > < div align ="center "> 4.6</ div > </ td >
572
- < td > < div align ="center " style ="background- color:lightgrey "> 25.3</ div > </ td >
571
+ < td > < div align ="center "> < strong > 4.6</ strong > </ div > </ td >
572
+ < td > < div align ="center " style ="color:grey "> 25.3</ div > </ td >
573
573
</ tr >
574
574
< tr >
575
575
< td > Deepseek-Coder-v2</ td >
576
- < td > < div align ="center "> 3.1</ div > </ td >
577
- < td > < div align ="center " style ="background- color:lightgrey "> 21.2</ div > </ td >
576
+ < td > < div align ="center "> < strong > 3.1</ strong > </ div > </ td >
577
+ < td > < div align ="center " style ="color:grey "> 21.2</ div > </ td >
578
578
</ tr >
579
579
< tr >
580
580
< td > GPT-4o</ td >
581
- < td > < div align ="center "> 1.5</ div > </ td >
582
- < td > < div align ="center " style ="background- color:lightgrey "> 25.0</ div > </ td >
581
+ < td > < div align ="center "> < strong > 1.5</ strong > </ div > </ td >
582
+ < td > < div align ="center " style ="color:grey "> 25.0</ div > </ td >
583
583
</ tr >
584
584
< tr >
585
585
< td > GPT-4-Turbo</ td >
586
- < td > < div align ="center "> 1.5</ div > </ td >
587
- < td > < div align ="center " style ="background- color:lightgrey "> 22.9</ div > </ td >
586
+ < td > < div align ="center "> < strong > 1.5</ strong > </ div > </ td >
587
+ < td > < div align ="center " style ="color:grey "> 22.9</ div > </ td >
588
588
</ tr >
589
589
< tr >
590
590
< td > OpenAI o1-mini</ td >
591
- < td > < div align ="center "> 1.5</ div > </ td >
592
- < td > < div align ="center " style ="background- color:lightgrey "> 22.2</ div > </ td >
591
+ < td > < div align ="center "> < strong > 1.5</ strong > </ div > </ td >
592
+ < td > < div align ="center " style ="color:grey "> 22.2</ div > </ td >
593
593
</ tr >
594
594
< tr >
595
595
< td > Gemini 1.5 Pro</ td >
596
- < td > < div align ="center "> 1.5</ div > </ td >
597
- < td > < div align ="center " style ="background- color:lightgrey "> 21.9</ div > </ td >
596
+ < td > < div align ="center "> < strong > 1.5</ strong > </ div > </ td >
597
+ < td > < div align ="center " style ="color:grey "> 21.9</ div > </ td >
598
598
</ tr >
599
599
< tr >
600
600
< td > Claude3-Opus</ td >
601
- < td > < div align ="center "> 1.5</ div > </ td >
602
- < td > < div align ="center " style ="background- color:lightgrey "> 21.5</ div > </ td >
601
+ < td > < div align ="center "> < strong > 1.5</ strong > </ div > </ td >
602
+ < td > < div align ="center " style ="color:grey "> 21.5</ div > </ td >
603
603
</ tr >
604
604
< tr >
605
605
< td > Llama-3.1-405B-Chat</ td >
606
- < td > < div align ="center "> 1.5</ div > </ td >
607
- < td > < div align ="center " style ="background- color:lightgrey "> 19.8</ div > </ td >
606
+ < td > < div align ="center "> < strong > 1.5</ strong > </ div > </ td >
607
+ < td > < div align ="center " style ="color:grey "> 19.8</ div > </ td >
608
608
</ tr >
609
609
< tr >
610
610
< td > Claude3-Sonnet</ td >
611
- < td > < div align ="center "> 1.5</ div > </ td >
612
- < td > < div align ="center " style ="background- color:lightgrey "> 17.0</ div > </ td >
611
+ < td > < div align ="center "> < strong > 1.5</ strong > </ div > </ td >
612
+ < td > < div align ="center " style ="color:grey "> 17.0</ div > </ td >
613
613
</ tr >
614
614
< tr >
615
615
< td > Qwen2-72B-Instruct</ td >
616
- < td > < div align ="center "> 1.5</ div > </ td >
617
- < td > < div align ="center " style ="background- color:lightgrey "> 17.0</ div > </ td >
616
+ < td > < div align ="center "> < strong > 1.5</ strong > </ div > </ td >
617
+ < td > < div align ="center " style ="color:grey "> 17.0</ div > </ td >
618
618
</ tr >
619
619
< tr >
620
620
< td > Llama-3.1-70B-Chat</ td >
621
- < td > < div align ="center "> 0.0</ div > </ td >
622
- < td > < div align ="center " style ="background- color:lightgrey "> 17.0</ div > </ td >
621
+ < td > < div align ="center "> < strong > 0.0</ strong > </ div > </ td >
622
+ < td > < div align ="center " style ="color:grey "> 17.0</ div > </ td >
623
623
</ tr >
624
624
< tr >
625
625
< td > Mixtral-8x22B-Instruct</ td >
626
- < td > < div align ="center "> 0.0</ div > </ td >
627
- < td > < div align ="center " style ="background- color:lightgrey "> 16.3</ div > </ td >
626
+ < td > < div align ="center "> < strong > 0.0</ strong > </ div > </ td >
627
+ < td > < div align ="center " style ="color:grey "> 16.3</ div > </ td >
628
628
</ tr >
629
629
< tr >
630
630
< td > Llama-3-70B-Chat</ td >
631
- < td > < div align ="center "> 0.0</ div > </ td >
632
- < td > < div align ="center " style ="background- color:lightgrey "> 14.6</ div > </ td >
631
+ < td > < div align ="center "> < strong > 0.0</ strong > </ div > </ td >
632
+ < td > < div align ="center " style ="color:grey "> 14.6</ div > </ td >
633
633
</ tr >
634
634
</ tbody >
635
635
</ table >
636
- < p > Note: If the models tie in the Main Problem resolve rate, we will then compare the Subproblems.</ p >
636
+ < p > < strong > Note: When models tie on the Main Problem resolve rate, they are ranked by their Subproblem resolve rate.</ strong > </ p >
637
637
<!-- Once you've added the results to the submission repository,
638
638
bring back the table here -->
639
639
<!-- include-markdown "leaderboard_table.md" -->
0 commit comments