Spaces:
Running
Running
cpu
Browse files
app.py
CHANGED
@@ -109,7 +109,7 @@ def main(video_path, audio_path, progress=gr.Progress(track_tqdm=True)):
|
|
109 |
else:
|
110 |
raise NotImplementedError("cross_attention_dim must be 768 or 384")
|
111 |
|
112 |
-
audio_encoder = Audio2Feature(model_path=whisper_model_path, device="
|
113 |
|
114 |
vae = AutoencoderKL.from_pretrained("stabilityai/sd-vae-ft-mse", torch_dtype=torch.float16)
|
115 |
vae.config.scaling_factor = 0.18215
|
|
|
109 |
else:
|
110 |
raise NotImplementedError("cross_attention_dim must be 768 or 384")
|
111 |
|
112 |
+
audio_encoder = Audio2Feature(model_path=whisper_model_path, device="cpu", num_frames=config.data.num_frames)
|
113 |
|
114 |
vae = AutoencoderKL.from_pretrained("stabilityai/sd-vae-ft-mse", torch_dtype=torch.float16)
|
115 |
vae.config.scaling_factor = 0.18215
|