Fixing batched synthesis for multispeaker model

2026-02-05 18:29:19 +08:00 · 2024-05-27 13:40:02 +02:00
parent aa496aa13f
commit de910380bc
1 changed file with 2 additions and 1 deletion
--- a/matcha/cli.py
+++ b/matcha/cli.py
@@ -326,12 +326,13 @@ def batched_synthesis(args, device, model, vocoder, denoiser, texts, spk):
    for i, batch in enumerate(dataloader):
        i = i + 1
        start_t = dt.datetime.now()
+        b = batch["x"].shape[0]
        output = model.synthesise(
            batch["x"].to(device),
            batch["x_lengths"].to(device),
            n_timesteps=args.steps,
            temperature=args.temperature,
-            spks=spk,
+            spks=spk.expand(b) if spk is not None else spk,
            length_scale=args.speaking_rate,
        )