Skip to content

Commit 5e90395

Browse files
Add Llama 3.1 to special unit dict (#2150)
1 parent e216af0 commit 5e90395

File tree

1 file changed

+5 -17 lines changed

1 file changed

+5 -17 lines changed

tools/submission/submission_checker.py

+5 -17
Original file line number | Diff line number | Diff line change
@@ -1914,50 +1914,38 @@ def log_result(
19141914
notes = notes + system_json.get("sw_notes")
19151915
special_unit_dict = {
19161916
"gptj-99": {
1917-
"SingleStream": "Latency (ms)",
1918-
"MultiStream": "Latency (ms)",
19191917
"Offline": "Tokens/s",
19201918
"Server": "Tokens/s",
19211919
},
19221920
"gptj-99.9": {
1923-
"SingleStream": "Latency (ms)",
1924-
"MultiStream": "Latency (ms)",
19251921
"Offline": "Tokens/s",
19261922
"Server": "Tokens/s",
19271923
},
19281924
"llama2-70b-99": {
1929-
"SingleStream": "Latency (ms)",
1930-
"MultiStream": "Latency (ms)",
19311925
"Offline": "Tokens/s",
19321926
"Server": "Tokens/s",
19331927
},
19341928
"llama2-70b-99.9": {
1935-
"SingleStream": "Latency (ms)",
1936-
"MultiStream": "Latency (ms)",
19371929
"Offline": "Tokens/s",
19381930
"Server": "Tokens/s",
19391931
},
19401932
"llama2-70b-interactive-99": {
1941-
"SingleStream": "Latency (ms)",
1942-
"MultiStream": "Latency (ms)",
19431933
"Offline": "Tokens/s",
19441934
"Server": "Tokens/s",
19451935
},
19461936
"llama2-70b-interactive-99.9": {
1947-
"SingleStream": "Latency (ms)",
1948-
"MultiStream": "Latency (ms)",
1937+
"Offline": "Tokens/s",
1938+
"Server": "Tokens/s",
1939+
},
1940+
"llama3.1-405b": {
19491941
"Offline": "Tokens/s",
19501942
"Server": "Tokens/s",
19511943
},
19521944
"mixtral-8x7b": {
1953-
"SingleStream": "Latency (ms)",
1954-
"MultiStream": "Latency (ms)",
19551945
"Offline": "Tokens/s",
19561946
"Server": "Tokens/s",
19571947
},
19581948
"llama3.1-405b": {
1959-
"SingleStream": "Latency (ms)",
1960-
"MultiStream": "Latency (ms)",
19611949
"Offline": "Tokens/s",
19621950
"Server": "Tokens/s",
19631951
},
@@ -1977,7 +1965,7 @@ def log_result(
19771965
if config.version == "v4.0":
19781966
unit = unit_dict[scenario_fixed]
19791967
else:
1980-
unit = special_unit_dict.get(mlperf_model, unit_dict)[scenario_fixed]
1968+
unit = special_unit_dict.get(mlperf_model, unit_dict).get(scenario_fixed, unit_dict[scenario_fixed])
19811969
power_unit = power_unit_dict[scenario_fixed]
19821970

19831971
if (power_metric <= 0) or (

0 commit comments

Comments (0)