Tune MeloTTS speed and prosody defaults

This commit is contained in:
2026-05-03 18:24:39 +09:00
parent 46a6b926df
commit f5194f55a1
6 changed files with 53 additions and 6 deletions

View File

@@ -1,4 +1,4 @@
-FROM python:3.10-slim
+FROM python:3.11-slim
ENV PYTHONUNBUFFERED=1

View File

@@ -11,6 +11,9 @@ def main() -> None:
parser.add_argument("--language", default="KR")
parser.add_argument("--speaker", default="KR")
parser.add_argument("--speed", type=float, default=1.0)
+parser.add_argument("--sdp-ratio", type=float, default=0.2)
+parser.add_argument("--noise-scale", type=float, default=0.6)
+parser.add_argument("--noise-scale-w", type=float, default=0.8)
parser.add_argument("--device", default="cpu")
args = parser.parse_args()
@@ -29,6 +32,9 @@ def main() -> None:
speaker_ids[args.speaker],
str(output_path),
speed=args.speed,
+sdp_ratio=args.sdp_ratio,
+noise_scale=args.noise_scale,
+noise_scale_w=args.noise_scale_w,
)