@@ -53,6 +53,7 @@ TestSettingsInternal::TestSettingsInternal(
53
53
use_token_latencies(requested.use_token_latencies),
54
54
server_ttft_latency(requested.server_ttft_latency),
55
55
server_tpot_latency(requested.server_tpot_latency),
56
+ server_constant_gen(requested.server_constant_gen),
56
57
infer_token_latencies(requested.infer_token_latencies),
57
58
token_latency_scaling_factor(requested.token_latency_scaling_factor) {
58
59
// Target QPS, target latency, and max_async_queries.
@@ -305,6 +306,8 @@ void LogRequestedTestSettings(const TestSettings &s) {
305
306
s.server_max_async_queries );
306
307
MLPERF_LOG (detail, " requested_server_num_issue_query_threads" ,
307
308
s.server_num_issue_query_threads );
309
+ MLPERF_LOG (detail, " requested_server_constant_gen" ,
310
+ s.server_constant_gen );
308
311
break ;
309
312
case TestScenario::Offline:
310
313
MLPERF_LOG (detail, " requested_offline_expected_qps" ,
@@ -452,6 +455,8 @@ void TestSettingsInternal::LogEffectiveSettings() const {
452
455
s.performance_sample_count );
453
456
MLPERF_LOG (detail, " effective_sample_concatenate_permutation" ,
454
457
s.sample_concatenate_permutation );
458
+ MLPERF_LOG (detail, " effective_server_constant_gen" ,
459
+ s.server_constant_gen );
455
460
#else
456
461
detail (" " );
457
462
detail (" Effective Settings:" );
@@ -772,6 +777,8 @@ int TestSettings::FromConfig(const std::string &path, const std::string &model,
772
777
server_coalesce_queries = (val == 0 ) ? false : true ;
773
778
if (lookupkv (model, " Server" , " max_async_queries" , &val, nullptr ))
774
779
server_max_async_queries = int (val);
780
+ if (lookupkv (model, " Server" , " constant_gen" , &val, nullptr ))
781
+ server_constant_gen = (val == 0 ) ? false : true ;
775
782
776
783
lookupkv (model, scenario, " min_duration" , &min_duration_ms, nullptr );
777
784
lookupkv (model, scenario, " max_duration" , &max_duration_ms, nullptr );
0 commit comments