We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 7b82fb7, commit 5ceda8e (Copy full SHA for 5ceda8e)
src/cpp/src/module_genai/modules/md_text_to_speech/models/qwen3_omni.cpp
@@ -207,6 +207,11 @@ void TextToSpeechImpl_Qwen3Omni::load_code_predictor_models(const ov::AnyMap& tt
207
GENAI_INFO("TextToSpeechModule[" + module_desc->name +
208
"]: sample_codec_token_greedy_search is enabled, will use greedy decoding in sample_codec_token");
209
merge_code_predictor_ov_models(ar_models, sce_models);
210
+ if (m_enable_merge_ov_models) {
211
+ // Release original infer requests to save memory since they won't be used anymore.
212
+ m_code_predictor_ar_infers.clear();
213
+ m_code_predictor_single_codec_embed_infers.clear();
214
+ }
215
}
216
217
0 commit comments