1+ < div style ="padding: 1rem 0 ">
2+ < div style ="display:flex;flex-wrap:wrap;gap:10px;margin-bottom:1.5rem ">
3+ < div style ="background:var(--color-background-secondary);border-radius:var(--border-radius-md);padding:.75rem 1rem;flex:1;min-width:120px ">
4+ < div style ="font-size:12px;color:var(--color-text-secondary);margin-bottom:4px "> Recall</ div >
5+ < div style ="font-size:22px;font-weight:500;color:var(--color-text-primary) "> 0.862</ div >
6+ </ div >
7+ < div style ="background:var(--color-background-secondary);border-radius:var(--border-radius-md);padding:.75rem 1rem;flex:1;min-width:120px ">
8+ < div style ="font-size:12px;color:var(--color-text-secondary);margin-bottom:4px "> F1</ div >
9+ < div style ="font-size:22px;font-weight:500;color:var(--color-text-primary) "> 0.804</ div >
10+ </ div >
11+ < div style ="background:var(--color-background-secondary);border-radius:var(--border-radius-md);padding:.75rem 1rem;flex:1;min-width:120px ">
12+ < div style ="font-size:12px;color:var(--color-text-secondary);margin-bottom:4px "> Tokens removed</ div >
13+ < div style ="font-size:22px;font-weight:500;color:var(--color-text-primary) "> 91.5%</ div >
14+ </ div >
15+ < div style ="background:var(--color-background-secondary);border-radius:var(--border-radius-md);padding:.75rem 1rem;flex:1;min-width:120px ">
16+ < div style ="font-size:12px;color:var(--color-text-secondary);margin-bottom:4px "> vs Qwen 35B recall</ div >
17+ < div style ="font-size:22px;font-weight:500;color:var(--color-text-primary) "> +11.3pp</ div >
18+ </ div >
19+ </ div >
20+
21+ < div style ="display:flex;gap:16px;flex-wrap:wrap;margin-bottom:.75rem;font-size:12px;color:var(--color-text-secondary) ">
22+ < span style ="display:flex;align-items:center;gap:5px "> < span style ="width:10px;height:10px;border-radius:2px;background:#7F77DD "> </ span > Squeez-2B (ours)</ span >
23+ < span style ="display:flex;align-items:center;gap:5px "> < span style ="width:10px;height:10px;border-radius:2px;background:#1D9E75 "> </ span > Qwen 3.5 35B A3B</ span >
24+ < span style ="display:flex;align-items:center;gap:5px "> < span style ="width:10px;height:10px;border-radius:2px;background:#378ADD "> </ span > Kimi K2</ span >
25+ < span style ="display:flex;align-items:center;gap:5px "> < span style ="width:10px;height:10px;border-radius:2px;background:#888780 "> </ span > Qwen 3.5 2B base</ span >
26+ < span style ="display:flex;align-items:center;gap:5px "> < span style ="width:10px;height:10px;border-radius:2px;background:#D3D1C7 "> </ span > Heuristics</ span >
27+ </ div >
28+
29+ < div style ="position:relative;height:300px;width:100% ">
30+ < canvas id ="mainChart "> </ canvas >
31+ </ div >
32+ </ div >
33+ < script src ="https://cdnjs.cloudflare.com/ajax/libs/Chart.js/4.4.1/chart.umd.js "> </ script >
34+ < script >
35+ const labels = [ 'Squeez-2B' , 'Qwen 35B A3B' , 'Kimi K2' , 'Qwen 3.5 2B base' , 'BM25' , 'First-N' , 'Random' , 'Last-N' ] ;
36+ const recall = [ 0.8624 , 0.7498 , 0.5286 , 0.5299 , 0.2172 , 0.1445 , 0.1009 , 0.0503 ] ;
37+ const f1 = [ 0.8035 , 0.7254 , 0.6827 , 0.5482 , 0.2314 , 0.1570 , 0.1966 , 0.1393 ] ;
38+ const colors = [ '#7F77DD' , '#1D9E75' , '#378ADD' , '#888780' , '#D3D1C7' , '#D3D1C7' , '#D3D1C7' , '#D3D1C7' ] ;
39+ const f1colors = colors . map ( c => c + 'aa' ) ;
40+
41+ new Chart ( document . getElementById ( 'mainChart' ) , {
42+ type : 'bar' ,
43+ data : {
44+ labels,
45+ datasets : [
46+ { label : 'Recall' , data : recall , backgroundColor : colors , borderRadius : 4 , borderSkipped : false , barPercentage : 0.45 , categoryPercentage : 0.85 } ,
47+ { label : 'F1' , data : f1 , backgroundColor : f1colors , borderRadius : 4 , borderSkipped : false , barPercentage : 0.45 , categoryPercentage : 0.85 }
48+ ]
49+ } ,
50+ options : {
51+ responsive : true ,
52+ maintainAspectRatio : false ,
53+ plugins : {
54+ legend : { display : false } ,
55+ tooltip : {
56+ callbacks : {
57+ label : ctx => ` ${ ctx . dataset . label } : ${ ctx . parsed . y . toFixed ( 3 ) } `
58+ }
59+ }
60+ } ,
61+ scales : {
62+ y : {
63+ min : 0 , max : 1 ,
64+ ticks : { color : '#888780' , font : { size : 11 } , callback : v => v . toFixed ( 1 ) } ,
65+ grid : { color : 'rgba(136,135,128,0.12)' } ,
66+ border : { display : false }
67+ } ,
68+ x : {
69+ ticks : { color : '#888780' , font : { size : 11 } , maxRotation : 20 } ,
70+ grid : { display : false } ,
71+ border : { display : false }
72+ }
73+ }
74+ }
75+ } ) ;
76+ </ script >
0 commit comments