feat: windows infer & gradio (#312)

* fix: windows infer

* docs: update readme

* docs: update readme

* feat: v1.5 gradio for windows&linux

* fix: dependencies

* feat: windows infer & gradio

---------

Co-authored-by: NeRF-Factory <zzhizhou66@gmail.com>
Author: Zhizhou Zhong
Date: 2025-04-12 23:22:22 +08:00
Committed by: GitHub
Parent: 36163fccbd
Commit: 67e7ee3c73
14 changed files with 613 additions and 245 deletions


@@ -49,8 +49,9 @@ class AudioProcessor:
         whisper_feature = []
         # Process multiple 30s mel input features
         for input_feature in whisper_input_features:
-            audio_feats = whisper.encoder(input_feature.to(device), output_hidden_states=True).hidden_states
-            audio_feats = torch.stack(audio_feats, dim=2).to(weight_dtype)
+            input_feature = input_feature.to(device).to(weight_dtype)
+            audio_feats = whisper.encoder(input_feature, output_hidden_states=True).hidden_states
+            audio_feats = torch.stack(audio_feats, dim=2)
             whisper_feature.append(audio_feats)
         whisper_feature = torch.cat(whisper_feature, dim=1)
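
The hunk above fixes a dtype mismatch: the Whisper encoder weights are cast to weight_dtype (typically fp16 on GPU), so the mel input must be moved to the same device and dtype before the forward pass; the stacked hidden states then already carry weight_dtype and need no trailing cast. A minimal sketch of the pattern, assuming the Hugging Face Whisper encoder that AudioProcessor wraps (the "openai/whisper-tiny" checkpoint and the variable names are illustrative, not the project's exact code):

import torch
from transformers import WhisperModel

device = "cuda" if torch.cuda.is_available() else "cpu"
weight_dtype = torch.float16 if device == "cuda" else torch.float32

# encoder weights moved to the target device/dtype once, up front
whisper = WhisperModel.from_pretrained("openai/whisper-tiny").to(device, weight_dtype).eval()

# one 30 s log-mel chunk, (batch, n_mels, frames) = (1, 80, 3000), produced in fp32
input_feature = torch.randn(1, 80, 3000)

# cast the input before the forward pass so fp16 weights never receive an fp32 tensor
input_feature = input_feature.to(device).to(weight_dtype)
with torch.no_grad():
    hidden = whisper.encoder(input_feature, output_hidden_states=True).hidden_states
    audio_feats = torch.stack(hidden, dim=2)  # already in weight_dtype, no extra cast needed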


@@ -8,26 +8,18 @@ from einops import rearrange
 import shutil
 import os.path as osp
-ffmpeg_path = os.getenv('FFMPEG_PATH')
-if ffmpeg_path is None:
-    print("please download ffmpeg-static and export to FFMPEG_PATH. \nFor example: export FFMPEG_PATH=/musetalk/ffmpeg-4.4-amd64-static")
-elif ffmpeg_path not in os.getenv('PATH'):
-    print("add ffmpeg to path")
-    os.environ["PATH"] = f"{ffmpeg_path}:{os.environ['PATH']}"
 from musetalk.models.vae import VAE
 from musetalk.models.unet import UNet,PositionalEncoding
 def load_all_model(
-    unet_model_path="./models/musetalk/pytorch_model.bin",
-    vae_type="sd-vae-ft-mse",
-    unet_config="./models/musetalk/musetalk.json",
+    unet_model_path=os.path.join("models", "musetalkV15", "unet.pth"),
+    vae_type="sd-vae",
+    unet_config=os.path.join("models", "musetalkV15", "musetalk.json"),
     device=None,
 ):
     vae = VAE(
-        model_path = f"./models/{vae_type}/",
+        model_path = os.path.join("models", vae_type),
     )
     print(f"load unet model from {unet_model_path}")
     unet = UNet(
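
This hunk makes model loading portable to Windows: hard-coded "./models/..." strings with forward slashes become os.path.join calls, the defaults move to the v1.5 weights (musetalkV15/unet.pth, sd-vae), and the POSIX-only ffmpeg PATH export (which joins with a hard-coded ":") appears to be dropped from this module. A small sketch of the cross-platform idiom, assuming FFMPEG_PATH is still read somewhere else; this helper is illustrative, not the project's exact code:

import os

# build model paths with the platform separator instead of hard-coding "/"
unet_model_path = os.path.join("models", "musetalkV15", "unet.pth")  # models\musetalkV15\unet.pth on Windows

# prepend ffmpeg to PATH with os.pathsep (";" on Windows, ":" elsewhere),
# instead of the hard-coded ":" the removed block used
ffmpeg_path = os.getenv("FFMPEG_PATH")
if ffmpeg_path and ffmpeg_path not in os.environ.get("PATH", ""):
    os.environ["PATH"] = ffmpeg_path + os.pathsep + os.environ["PATH"]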