File tree Expand file tree Collapse file tree
src/rkllama/api/models/audio Expand file tree Collapse file tree Original file line number Diff line number Diff line change 11# RKLLama: LLM Server and Client for Rockchip 3588/3576
22
3- ### [ Version: 0.0.66 ] ( #New-Version )
3+ ### [ Version: 0.0.67 ] ( #New-Version )
44
55Video demo ( version 0.0.1 ):
66
Original file line number Diff line number Diff line change 11[project ]
22name = " rkllama"
3- version = " 0.0.66 "
3+ version = " 0.0.67 "
44authors = [
55 { name =" NotPunchnox" , email =" punchnoxpro@gmail.com" },
66 { name =" TomJacobsUK" , email =" tom@tomjacobs.co.uk" },
Original file line number Diff line number Diff line change @@ -206,8 +206,9 @@ def phoneme_ids_to_audio(
206206 )
207207
208208 # Get the encoder outputs
209+ g = None # In case of Multispeaker Voice
209210 if speaker_id is not None :
210- z , y_mask , _ = encoder_output
211+ z , y_mask , g = encoder_output
211212 else :
212213 z , y_mask = encoder_output
213214
@@ -241,6 +242,10 @@ def phoneme_ids_to_audio(
241242 # Construct inputs for RKNN decoder model
242243 inputs_chunk = [zc .astype (np .float32 ), yc .astype (np .float32 )]
243244
245+ # For multispeaker models, we need to add the channel info generated by the encoder
246+ if g is not None :
247+ inputs_chunk .append (g )
248+
244249 # Run RKNN decoder inference on the chunk
245250 result = self .session_rknn .inference (inputs = inputs_chunk , data_format = "nchw" )
246251
You can’t perform that action at this time.
0 commit comments