From de910380bcc41249d7e4857b46f46fa83f2335b4 Mon Sep 17 00:00:00 2001 From: Shivam Mehta Date: Mon, 27 May 2024 13:40:02 +0200 Subject: [PATCH] Fixing batched synthesis for multispeaker model --- matcha/cli.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/matcha/cli.py b/matcha/cli.py index 635c586..7daf130 100644 --- a/matcha/cli.py +++ b/matcha/cli.py @@ -326,12 +326,13 @@ def batched_synthesis(args, device, model, vocoder, denoiser, texts, spk): for i, batch in enumerate(dataloader): i = i + 1 start_t = dt.datetime.now() + b = batch["x"].shape[0] output = model.synthesise( batch["x"].to(device), batch["x_lengths"].to(device), n_timesteps=args.steps, temperature=args.temperature, - spks=spk, + spks=spk.expand(b) if spk is not None else spk, length_scale=args.speaking_rate, )