Commit
·
41c25c6
1
Parent(s):
02dd47f
Update README.md
Browse files
README.md
CHANGED
|
@@ -51,6 +51,19 @@ model = HifiGanModel.restore_from(restore_path=path)
|
|
| 51 |
```
|
| 52 |
import soundfile as sf
|
| 53 |
parsed = spec_generator.parse("You can type your sentence here to get nemo to produce speech.")
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 54 |
spectrogram = spec_generator.generate_spectrogram(tokens=parsed,speaker=92)
|
| 55 |
audio = model.convert_spectrogram_to_audio(spec=spectrogram)
|
| 56 |
sf.write("speech.wav", audio.to('cpu').detach().numpy()[0], 44100)
|
|
@@ -75,7 +88,7 @@ FastPitch multispeaker is a fully-parallel text-to-speech model based on FastSpe
|
|
| 75 |
|
| 76 |
## Training
|
| 77 |
|
| 78 |
-
The NeMo toolkit [3] was used for training the models for 1000 epochs.
|
| 79 |
|
| 80 |
## Datasets
|
| 81 |
|
|
|
|
| 51 |
```
|
| 52 |
import soundfile as sf
|
| 53 |
parsed = spec_generator.parse("You can type your sentence here to get nemo to produce speech.")
|
| 54 |
+
"""
|
| 55 |
+
Available speaker IDs (pass one as the `speaker` argument below):
|
| 56 |
+
92 Cori Samuel
|
| 57 |
+
6097 Phil Benson
|
| 58 |
+
9017 John Van Stan
|
| 59 |
+
6670 Mike Pelton
|
| 60 |
+
6671 Tony Oliva
|
| 61 |
+
8051 Maria Kasper
|
| 62 |
+
9136 Helen Taylor
|
| 63 |
+
11614 Sylviamb
|
| 64 |
+
11697 Celine Major
|
| 65 |
+
12787 LikeManyWaters
|
| 66 |
+
"""
|
| 67 |
spectrogram = spec_generator.generate_spectrogram(tokens=parsed,speaker=92)
|
| 68 |
audio = model.convert_spectrogram_to_audio(spec=spectrogram)
|
| 69 |
sf.write("speech.wav", audio.to('cpu').detach().numpy()[0], 44100)
|
|
|
|
| 88 |
|
| 89 |
## Training
|
| 90 |
|
| 91 |
+
The NeMo toolkit [3] was used for training the models for 1000 epochs.
|
| 92 |
|
| 93 |
## Datasets
|
| 94 |
|