@@ -1914,50 +1914,38 @@ def log_result(
1914
1914
notes = notes + system_json .get ("sw_notes" )
1915
1915
special_unit_dict = {
1916
1916
"gptj-99" : {
1917
- "SingleStream" : "Latency (ms)" ,
1918
- "MultiStream" : "Latency (ms)" ,
1919
1917
"Offline" : "Tokens/s" ,
1920
1918
"Server" : "Tokens/s" ,
1921
1919
},
1922
1920
"gptj-99.9" : {
1923
- "SingleStream" : "Latency (ms)" ,
1924
- "MultiStream" : "Latency (ms)" ,
1925
1921
"Offline" : "Tokens/s" ,
1926
1922
"Server" : "Tokens/s" ,
1927
1923
},
1928
1924
"llama2-70b-99" : {
1929
- "SingleStream" : "Latency (ms)" ,
1930
- "MultiStream" : "Latency (ms)" ,
1931
1925
"Offline" : "Tokens/s" ,
1932
1926
"Server" : "Tokens/s" ,
1933
1927
},
1934
1928
"llama2-70b-99.9" : {
1935
- "SingleStream" : "Latency (ms)" ,
1936
- "MultiStream" : "Latency (ms)" ,
1937
1929
"Offline" : "Tokens/s" ,
1938
1930
"Server" : "Tokens/s" ,
1939
1931
},
1940
1932
"llama2-70b-interactive-99" : {
1941
- "SingleStream" : "Latency (ms)" ,
1942
- "MultiStream" : "Latency (ms)" ,
1943
1933
"Offline" : "Tokens/s" ,
1944
1934
"Server" : "Tokens/s" ,
1945
1935
},
1946
1936
"llama2-70b-interactive-99.9" : {
1947
- "SingleStream" : "Latency (ms)" ,
1948
- "MultiStream" : "Latency (ms)" ,
1937
+ "Offline" : "Tokens/s" ,
1938
+ "Server" : "Tokens/s" ,
1939
+ },
1940
+ "llama3.1-405b" : {
1949
1941
"Offline" : "Tokens/s" ,
1950
1942
"Server" : "Tokens/s" ,
1951
1943
},
1952
1944
"mixtral-8x7b" : {
1953
- "SingleStream" : "Latency (ms)" ,
1954
- "MultiStream" : "Latency (ms)" ,
1955
1945
"Offline" : "Tokens/s" ,
1956
1946
"Server" : "Tokens/s" ,
1957
1947
},
1958
1948
"llama3.1-405b" : {
1959
- "SingleStream" : "Latency (ms)" ,
1960
- "MultiStream" : "Latency (ms)" ,
1961
1949
"Offline" : "Tokens/s" ,
1962
1950
"Server" : "Tokens/s" ,
1963
1951
},
@@ -1977,7 +1965,7 @@ def log_result(
1977
1965
if config .version == "v4.0" :
1978
1966
unit = unit_dict [scenario_fixed ]
1979
1967
else :
1980
- unit = special_unit_dict .get (mlperf_model , unit_dict )[scenario_fixed ]
1968
+ unit = special_unit_dict .get (mlperf_model , unit_dict ). get ( scenario_fixed , unit_dict [scenario_fixed ])
1981
1969
power_unit = power_unit_dict [scenario_fixed ]
1982
1970
1983
1971
if (power_metric <= 0 ) or (
0 commit comments