mirror of
https://github.com/SWivid/F5-TTS.git
synced 2026-01-15 06:23:22 -08:00
@@ -33,8 +33,6 @@ Install other packages:
|
||||
pip install -r requirements.txt
|
||||
```
|
||||
|
||||
**Note**: install a numpy version below 2.0, e.g. `pip install numpy==1.22.0`.
|
||||
|
||||
## Prepare Dataset
|
||||
|
||||
Example data processing scripts are provided for Emilia and Wenetspeech4TTS; you may tailor your own, along with a matching Dataset class in `model/dataset.py`.
|
||||
|
||||
@@ -280,7 +280,7 @@ def infer_batch(ref_audio, ref_text, gen_text_batches, exp_name, remove_silence,
|
||||
|
||||
return (target_sample_rate, final_wave), spectrogram_path
|
||||
|
||||
def infer(ref_audio_orig, ref_text, gen_text, exp_name, remove_silence, custom_split_words):
|
||||
def infer(ref_audio_orig, ref_text, gen_text, exp_name, remove_silence, custom_split_words=''):
|
||||
if not custom_split_words.strip():
|
||||
custom_words = [word.strip() for word in custom_split_words.split(',')]
|
||||
global SPLIT_WORDS
|
||||
|
||||
@@ -12,6 +12,7 @@ jieba
|
||||
jiwer
|
||||
librosa
|
||||
matplotlib
|
||||
numpy==1.23.5
|
||||
pydub
|
||||
pypinyin
|
||||
safetensors
|
||||
|
||||
Reference in New Issue
Block a user