From 1d3e8b2901c60124d440569f9868d8d3023e6a09 Mon Sep 17 00:00:00 2001 From: Michael Hansen Date: Mon, 30 Oct 2023 11:34:13 -0500 Subject: [PATCH] Add extra options to infer script --- src/python/piper_train/infer.py | 7 ++++++- 1 file changed, 6 insertions(+), 1 deletion(-) diff --git a/src/python/piper_train/infer.py b/src/python/piper_train/infer.py index bc535d5..378af21 100644 --- a/src/python/piper_train/infer.py +++ b/src/python/piper_train/infer.py @@ -24,6 +24,11 @@ def main(): ) parser.add_argument("--output-dir", required=True, help="Path to write WAV files") parser.add_argument("--sample-rate", type=int, default=22050) + # + parser.add_argument("--noise-scale", type=float, default=0.667) + parser.add_argument("--length-scale", type=float, default=1.0) + parser.add_argument("--noise-w", type=float, default=0.8) + # args = parser.parse_args() args.output_dir = Path(args.output_dir) @@ -49,7 +54,7 @@ def main(): text = torch.LongTensor(phoneme_ids).unsqueeze(0) text_lengths = torch.LongTensor([len(phoneme_ids)]) - scales = [0.667, 1.0, 0.8] + scales = [args.noise_scale, args.length_scale, args.noise_w] sid = torch.LongTensor([speaker_id]) if speaker_id is not None else None start_time = time.perf_counter()