-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathwave15_16_bench.json
More file actions
80 lines (80 loc) · 2.16 KB
/
wave15_16_bench.json
File metadata and controls
80 lines (80 loc) · 2.16 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
{
"ada_serve": {
"get_gamma_tight_mean_us": 0.9136096341535449,
"get_gamma_relaxed_mean_us": 0.8304266957566142
},
"conf_spec": {
"verify_step_flat_mean_us": 131.89301802776754,
"verify_step_peaked_mean_us": 127.55730585195124,
"speedup_peaked_vs_flat": 1.0339903084880808
},
"seq_packing": {
"pack_short_mean_us": 2754.269145661965,
"pack_long_mean_us": 43442.320797475986
},
"meta_reasoner": {
"compute_entropy_mean_us": 448.64398054778576,
"step_mean_us": 0.12037414126098156
},
"yoco": {
"append_mean_us": 0.5921470001339912,
"get_shared_kv_mean_us": 2230.5147512815893
},
"cla": {
"schedule_from_config_mean_us": 19.488262478262186
},
"kvsharer": {
"record_layer_kv_mean_us": 21.99302799999714,
"compute_share_map_mean_us": 9653.354207985103
},
"diffkv": {
"get_policy_mean_us": 1.3691647909581661,
"record_attention_mean_us": 5.658150534145534
},
"paris_kv": {
"encode_mean_us": 29.439809964969754,
"decode_mean_us": 3.897286718711257,
"online_update_mean_us": 107.18385048676282
},
"kvtuner": {
"search_mean_us": 4212.210872210562
},
"dovetail": {
"verify_one_mean_us": 602.4091276340187
},
"pipo": {
"run_layer_mean_us": 1376.2445945758373
},
"mobile_moe": {
"route_single_mean_us": 14.881356712430716,
"route_batch_32_mean_us": 486.74682318232954
},
"online_sd": {
"record_mean_us": 1.4046194264665246,
"should_update_mean_us": 0.16073868609964848
},
"lookahead_reasoning": {
"run_cycle_mean_us": 13.650477631017566
},
"sparse_spec": {
"pillar_update_mean_us": 1.2022118316963315,
"top_k_indices_mean_us": 24.385556753259152
},
"fr_spec": {
"forward_mean_us": 4095.0087434612215,
"compress_logits_mean_us": 12.583496747538447,
"expand_logits_mean_us": 21.783086471259594,
"compression_ratio": 0.25
},
"long_spec": {
"head_forward_mean_us": 12434.656594414264
},
"forelen": {
"egtp_predict_mean_us": 99.12135696504265,
"plp_update_mean_us": 1.42301213927567
},
"rasd": {
"corpus_search_mean_us": 0.7165118586272001,
"build_retrieval_tree_mean_us": 1.8304085824638605
}
}