@@ -53,6 +53,7 @@ TestSettingsInternal::TestSettingsInternal(
5353 use_token_latencies(requested.use_token_latencies),
5454 server_ttft_latency(requested.server_ttft_latency),
5555 server_tpot_latency(requested.server_tpot_latency),
56+ server_constant_gen(requested.server_constant_gen),
5657 infer_token_latencies(requested.infer_token_latencies),
5758 token_latency_scaling_factor(requested.token_latency_scaling_factor) {
5859 // Target QPS, target latency, and max_async_queries.
@@ -305,6 +306,8 @@ void LogRequestedTestSettings(const TestSettings &s) {
305306 s.server_max_async_queries );
306307 MLPERF_LOG (detail, " requested_server_num_issue_query_threads" ,
307308 s.server_num_issue_query_threads );
309+ MLPERF_LOG (detail, " requested_server_constant_gen" ,
310+ s.server_constant_gen );
308311 break ;
309312 case TestScenario::Offline:
310313 MLPERF_LOG (detail, " requested_offline_expected_qps" ,
@@ -452,6 +455,8 @@ void TestSettingsInternal::LogEffectiveSettings() const {
452455 s.performance_sample_count );
453456 MLPERF_LOG (detail, " effective_sample_concatenate_permutation" ,
454457 s.sample_concatenate_permutation );
458+ MLPERF_LOG (detail, " effective_server_constant_gen" ,
459+ s.server_constant_gen );
455460#else
456461 detail (" " );
457462 detail (" Effective Settings:" );
@@ -772,6 +777,8 @@ int TestSettings::FromConfig(const std::string &path, const std::string &model,
772777 server_coalesce_queries = (val == 0 ) ? false : true ;
773778 if (lookupkv (model, " Server" , " max_async_queries" , &val, nullptr ))
774779 server_max_async_queries = int (val);
780+ if (lookupkv (model, " Server" , " constant_gen" , &val, nullptr ))
781+ server_constant_gen = (val == 0 ) ? false : true ;
775782
776783 lookupkv (model, scenario, " min_duration" , &min_duration_ms, nullptr );
777784 lookupkv (model, scenario, " max_duration" , &max_duration_ms, nullptr );
0 commit comments