@@ -364,7 +364,8 @@ def bert_vits2_infer(self, state, encode=True):
364
364
# if state["lang"] == "auto":
365
365
# state["lang"] = classify_language(state["text"], target_languages=model.lang)
366
366
if state ["lang" ] == "auto" :
367
- sentences_list = split_languages (state ["text" ], state ["speaker_lang" ])
367
+ sentences_list = split_languages (state ["text" ], state ["speaker_lang" ], expand_abbreviations = True ,
368
+ expand_hyphens = True )
368
369
else :
369
370
sentences_list = [(state ["text" ], state ["lang" ])]
370
371
audios = []
@@ -404,7 +405,8 @@ def stream_bert_vits2_infer(self, state, fname=None):
404
405
state ["text" ] = re .sub (r'\s+' , ' ' , state ["text" ]).strip ()
405
406
sampling_rate = model .sampling_rate
406
407
407
- sentences_list = split_languages (state ["text" ], state ["speaker_lang" ])
408
+ sentences_list = split_languages (state ["text" ], state ["speaker_lang" ], expand_abbreviations = True ,
409
+ expand_hyphens = True )
408
410
409
411
# audios = []
410
412
@@ -499,15 +501,15 @@ def gpt_sovits_infer(self, state, encode=True):
499
501
infer_func = model .infer
500
502
501
503
audio = infer_func (text = state .get ("text" ),
502
- lang = state .get ("lang" ),
503
- reference_audio = state .get ("reference_audio" ),
504
- reference_audio_sr = state .get ("reference_audio_sr" ),
505
- prompt_text = state .get ("prompt_text" ),
506
- prompt_lang = state .get ("prompt_lang" ),
507
- top_k = state .get ("top_k" ),
508
- top_p = state .get ("top_p" ),
509
- temperature = state .get ("temperature" ),
510
- )
504
+ lang = state .get ("lang" ),
505
+ reference_audio = state .get ("reference_audio" ),
506
+ reference_audio_sr = state .get ("reference_audio_sr" ),
507
+ prompt_text = state .get ("prompt_text" ),
508
+ prompt_lang = state .get ("prompt_lang" ),
509
+ top_k = state .get ("top_k" ),
510
+ top_p = state .get ("top_p" ),
511
+ temperature = state .get ("temperature" ),
512
+ )
511
513
sampling_rate = model .sampling_rate
512
514
513
515
return self .encode (sampling_rate , audio , state ["format" ]) if encode else audio
0 commit comments