Spaces:

Francke
/

LatentSync

Running

Francke committed 18 days ago

Commit

53da172

1 Parent(s): bc75124

cpu

Files changed (1) hide show

app.py CHANGED Viewed

@@ -109,7 +109,7 @@ def main(video_path, audio_path, progress=gr.Progress(track_tqdm=True)):
     else:
         raise NotImplementedError("cross_attention_dim must be 768 or 384")
-    audio_encoder = Audio2Feature(model_path=whisper_model_path, device="cuda", num_frames=config.data.num_frames)
     vae = AutoencoderKL.from_pretrained("stabilityai/sd-vae-ft-mse", torch_dtype=torch.float16)
     vae.config.scaling_factor = 0.18215

     else:
         raise NotImplementedError("cross_attention_dim must be 768 or 384")
+    audio_encoder = Audio2Feature(model_path=whisper_model_path, device="cpu", num_frames=config.data.num_frames)
     vae = AutoencoderKL.from_pretrained("stabilityai/sd-vae-ft-mse", torch_dtype=torch.float16)
     vae.config.scaling_factor = 0.18215