mirror of https://github.com/malarinv/tacotron2
Compare commits
2 Commits
dde35048b7
...
5a30069f0a
| Author | SHA1 | Date |
|---|---|---|
|
|
5a30069f0a | |
|
|
dcc9ab3625 |
33
taco2/tts.py
33
taco2/tts.py
|
|
@@ -5,6 +5,8 @@ import numpy as np
|
|||
import torch
|
||||
import pyaudio
|
||||
import klepto
|
||||
import argparse
|
||||
from pathlib import Path
|
||||
from .model import Tacotron2
|
||||
from glow import WaveGlow
|
||||
from .hparams import HParams
|
||||
|
|
@@ -14,7 +16,8 @@ from .denoiser import Denoiser
|
|||
from .audio_processing import griffin_lim, postprocess_audio
|
||||
|
||||
TTS_SAMPLE_RATE = 22050
|
||||
OUTPUT_SAMPLE_RATE = 16000
|
||||
OUTPUT_SAMPLE_RATE = 22050
|
||||
# OUTPUT_SAMPLE_RATE = 16000
|
||||
|
||||
# config from
|
||||
# https://github.com/NVIDIA/waveglow/blob/master/config.json
|
||||
|
|
@@ -116,7 +119,7 @@ class TTSModel(object):
|
|||
audio = audio.cpu().numpy()
|
||||
|
||||
return postprocess_audio(
|
||||
audio, src_rate=TTS_SAMPLE_RATE, dst_rate=OUTPUT_SAMPLE_RATE
|
||||
audio, tempo=0.6, src_rate=TTS_SAMPLE_RATE, dst_rate=OUTPUT_SAMPLE_RATE
|
||||
)
|
||||
|
||||
|
||||
|
|
@@ -133,10 +136,7 @@ def player_gen():
|
|||
return play_device
|
||||
|
||||
|
||||
def repl():
|
||||
tts_model = TTSModel(
|
||||
"/Users/malar/Work/tacotron2_r4_83000.pt", "/Users/malar/Work/waveglow_484000"
|
||||
)
|
||||
def repl(tts_model):
|
||||
player = player_gen()
|
||||
|
||||
def loop():
|
||||
|
|
@@ -148,7 +148,26 @@ def repl():
|
|||
|
||||
|
||||
def main():
|
||||
interactive_loop = repl()
|
||||
parser = argparse.ArgumentParser(
|
||||
formatter_class=argparse.ArgumentDefaultsHelpFormatter
|
||||
)
|
||||
parser.add_argument(
|
||||
"-t",
|
||||
"--tacotron2_path",
|
||||
type=Path,
|
||||
default="./tacotron.pt",
|
||||
help="Path to a tacotron2 model",
|
||||
)
|
||||
parser.add_argument(
|
||||
"-w",
|
||||
"--waveglow_path",
|
||||
type=Path,
|
||||
default="./waveglow_256channels.pt",
|
||||
help="Path to a waveglow model",
|
||||
)
|
||||
args = parser.parse_args()
|
||||
tts_model = TTSModel(**vars(args))
|
||||
interactive_loop = repl(tts_model)
|
||||
while True:
|
||||
interactive_loop()
|
||||
|
||||
|
|
|
|||
Loading…
Reference in New Issue