forked from dusty-nv/jetson-containers
-
Notifications
You must be signed in to change notification settings - Fork 0
/
test_voices.py
47 lines (34 loc) · 1.61 KB
/
test_voices.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
#!/usr/bin/env python3
import os
import torch
import pprint
from TTS.api import TTS
# Enumerate the voices of a Coqui TTS model and synthesize a sample WAV for
# each one, so the voices can be compared by ear.

# Run on the GPU when PyTorch can see one, otherwise fall back to the CPU.
device = "cuda" if torch.cuda.is_available() else "cpu"

#print(TTS().list_models())

# Model to load and the language code passed to every synthesis call.
model = "tts_models/multilingual/multi-dataset/xtts_v2"  # "tts_models/multilingual/multi-dataset/xtts_v1.1"
language = 'en'

# Reference clip passed to tts_to_file() when the model is NOT multi-speaker.
# It was previously referenced without ever being defined (NameError).
# NOTE(review): None is assumed to match the library default for
# `speaker_wav`; set it to a WAV path to supply a reference voice.
speaker_wav = None

# Directory that receives the generated WAV files.
output_dir = "/data/audio/tts"

print(f"Loading TTS model {model}")

tts = TTS(model).to(device)

# Looked up once; used for the debug dumps and for the speaker loop below.
speaker_manager = tts.synthesizer.tts_model.speaker_manager

print(dir(speaker_manager))
print(speaker_manager)

print(f"\nMulti-speaker: {tts.is_multi_speaker}")

if tts.is_multi_speaker:
    print(f"\nSpeakers: {speaker_manager.name_to_id}")

print(f"\nLanguages: {tts.synthesizer.tts_model.language_manager.name_to_id}")

# Text to speech to a file
prompts = [
    "Hello there, how are you today?",
    "The weather is 76 degrees out and sunny.",
    "Your first meeting is in an hour downtown, with normal traffic.",
    "Can I interest you in anything quick for breakfast?",
]

if tts.is_multi_speaker:
    # One combined utterance per speaker keeps it to a single file per voice.
    prompts = [' '.join(prompts)]  #+ prompts

# Create the output directory up front so the first write cannot fail on a
# fresh data volume.
os.makedirs(output_dir, exist_ok=True)

model_name = os.path.basename(model)

for speaker in speaker_manager.speakers:
    speaker_slug = speaker.lower().replace(' ', '_')

    for prompt_idx, prompt in enumerate(prompts):
        # With several prompts per speaker, add the prompt index so they do
        # not overwrite each other. With a single prompt the file name is
        # exactly what it has always been.
        suffix = f"_{prompt_idx}" if len(prompts) > 1 else ""
        wav = os.path.join(output_dir, f"{model_name}_offline_{speaker_slug}{suffix}.wav")

        print(f'\ngenerating "{prompt}" speaker="{speaker}" lang="{language}" wav="{wav}"\n')

        if tts.is_multi_speaker:
            tts.tts_to_file(text=prompt, speaker=speaker, language=language, file_path=wav)
        else:
            tts.tts_to_file(text=prompt, speaker_wav=speaker_wav, language=language, file_path=wav)