Spaces:

smartfeed
/

test_video

Running on Zero

App Files Files Community

zhiweili committed 24 days ago

Commit

708a6ea

1 Parent(s): 05483e9

add app_i2v

Browse files

Files changed (4) hide show

app.py +6 -3
app_i2v.py +104 -0
app_video.py → app_t2v.py +3 -8
video_model.py +9 -0

app.py CHANGED Viewed

@@ -1,10 +1,13 @@
 import gradio as gr
-from app_video import create_demo as create_demo_face
 with gr.Blocks(css="style.css") as demo:
     with gr.Tabs():
-        with gr.Tab(label="Video"):
-            create_demo_face()
 demo.launch()

 import gradio as gr
+from app_t2v import create_demo as create_demo_t2v
+from app_i2v import create_demo as create_demo_i2v
+# Top-level UI: one tab per generation mode; each tab body is built by the
+# corresponding module's create_demo() while its gr.Tab context is active.
 with gr.Blocks(css="style.css") as demo:
     with gr.Tabs():
+        with gr.Tab(label="tx2vid"):
+            create_demo_t2v()
+        with gr.Tab(label="img2vid"):
+            create_demo_i2v()
 demo.launch()

app_i2v.py ADDED Viewed

	@@ -0,0 +1,104 @@

+import spaces
+import gradio as gr
+import time
+import torch
+import gc
+import tempfile
+from diffusers.utils import export_to_video, load_image
+from video_model import video_pipe
+device = "cuda" if torch.cuda.is_available() else "cpu"
+def create_demo() -> gr.Blocks:
+    """Build the image-to-video UI: image upload, prompt boxes and a generate button.
+
+    Returns:
+        The ``gr.Blocks`` container holding the components and the click wiring.
+    """
+    def get_time_cost(run_task_time, time_cost_str):
+        """Extend the timing trail with the milliseconds elapsed since the last mark.
+
+        Args:
+            run_task_time: Previous mark in epoch milliseconds, or 0 on the first call.
+            time_cost_str: Trail accumulated so far.
+
+        Returns:
+            ``(now_ms, updated_trail)``. The first call only records ``'start'``;
+            later calls append ``'-->'`` followed by the elapsed milliseconds.
+        """
+        now_time = int(time.time()*1000)
+        if run_task_time == 0:
+            time_cost_str = 'start'
+        else:
+            if time_cost_str != '':
+                time_cost_str += '-->'
+            time_cost_str += f'{now_time - run_task_time}'
+        return now_time, time_cost_str
+    @spaces.GPU(duration=60)
+    def image_to_video(
+        image_path: str,
+        prompt: str,
+        negative_prompt: str,
+        width: int = 768,
+        height: int = 512,
+        num_frames: int = 121,
+        frame_rate: int = 25,
+        num_inference_steps: int = 30,
+        seed: int = 8,
+        progress=gr.Progress(),
+    ):
+        """Run the shared video pipeline on the uploaded image and export an .mp4.
+
+        Args:
+            image_path: Value of the "Input Image" file component.
+            prompt: Text describing the desired video.
+            negative_prompt: Text describing what to avoid.
+            width: Width passed to the pipeline.
+            height: Height passed to the pipeline.
+            num_frames: Number of frames requested from the pipeline.
+            frame_rate: Frames per second used when writing the video file.
+            num_inference_steps: Step count passed to the pipeline.
+            seed: Seed for the torch generator, for reproducible runs.
+            progress: Gradio progress tracker (not used directly in the body).
+
+        Returns:
+            ``(output_path, time_cost_str)``: path of the written .mp4 and the timing trail.
+
+        Raises:
+            gr.Error: If no input image was provided.
+        """
+        # Without an upload there is nothing to load; surface a readable UI
+        # error instead of an exception from load_image.
+        if not image_path:
+            raise gr.Error("Please upload an input image first.")
+        generator = torch.Generator(device=device).manual_seed(seed)
+        input_image = load_image(image_path)
+        run_task_time = 0
+        time_cost_str = ''
+        run_task_time, time_cost_str = get_time_cost(run_task_time, time_cost_str)
+        try:
+            with torch.no_grad():
+                # NOTE(review): video_pipe is created from LTXPipeline in
+                # video_model.py; confirm that pipeline accepts `image`
+                # (diffusers also ships a separate LTXImageToVideoPipeline).
+                # NOTE(review): frame_rate is only used for the export below,
+                # not passed to the pipeline - confirm that is intended.
+                video = video_pipe(
+                    image=input_image,
+                    prompt=prompt,
+                    negative_prompt=negative_prompt,
+                    generator=generator,
+                    width=width,
+                    height=height,
+                    num_frames=num_frames,
+                    num_inference_steps=num_inference_steps,
+                ).frames[0]
+        finally:
+            # Release cached GPU memory whether or not generation succeeded.
+            torch.cuda.empty_cache()
+            gc.collect()
+        run_task_time, time_cost_str = get_time_cost(run_task_time, time_cost_str)
+        # tempfile.mktemp is deprecated and race-prone: it only returns a name.
+        # Create the file atomically and keep it so Gradio can serve it.
+        with tempfile.NamedTemporaryFile(suffix=".mp4", delete=False) as tmp_file:
+            output_path = tmp_file.name
+        export_to_video(video, output_path, fps=frame_rate)
+        del video
+        torch.cuda.empty_cache()
+        return output_path, time_cost_str
+    with gr.Blocks() as demo:
+        with gr.Row():
+            with gr.Column():
+                i2vid_image_path = gr.File(label="Input Image")
+                i2vid_prompt = gr.Textbox(
+                    label="Enter Your Prompt",
+                    placeholder="Describe the video you want to generate (minimum 50 characters)...",
+                    value="A woman with long brown hair and light skin smiles at another woman with long blonde hair. The woman with brown hair wears a black jacket and has a small, barely noticeable mole on her right cheek. The camera angle is a close-up, focused on the woman with brown hair's face. The lighting is warm and natural, likely from the setting sun, casting a soft glow on the scene. The scene appears to be real-life footage.",
+                    lines=5,
+                )
+                i2vid_negative_prompt = gr.Textbox(
+                    label="Enter Negative Prompt",
+                    placeholder="Describe what you don't want in the video...",
+                    value="low quality, worst quality, deformed, distorted, disfigured, motion smear, motion artifacts, fused fingers, bad anatomy, weird hand, ugly",
+                    lines=2,
+                )
+                i2vid_generate = gr.Button(
+                    "Generate Video",
+                    variant="primary",
+                    size="lg",
+                )
+            with gr.Column():
+                i2vid_output = gr.Video(label="Generated Output")
+                i2vid_generated_cost = gr.Textbox(label="Time cost by step (ms):", visible=True, interactive=False)
+        # Only the image and the two prompts are wired as inputs, so the
+        # remaining image_to_video parameters keep their declared defaults.
+        i2vid_generate.click(
+            fn=image_to_video,
+            inputs=[i2vid_image_path, i2vid_prompt, i2vid_negative_prompt],
+            outputs=[i2vid_output, i2vid_generated_cost],
+        )
+    return demo

app_video.py → app_t2v.py RENAMED Viewed

@@ -4,18 +4,13 @@ import time
 import torch
 import gc
 import tempfile
-import numpy as np
-import cv2
-from diffusers import LTXPipeline
-from diffusers.utils import export_to_video
 device = "cuda" if torch.cuda.is_available() else "cpu"
-pipe = LTXPipeline.from_pretrained("Lightricks/LTX-Video", torch_dtype=torch.bfloat16)
-pipe.to(device)
 def create_demo() -> gr.Blocks:
     @spaces.GPU(duration=60)
@@ -36,7 +31,7 @@ def create_demo() -> gr.Blocks:
         run_task_time, time_cost_str = get_time_cost(run_task_time, time_cost_str)
         try:
             with torch.no_grad():
-                video = pipe(
                     prompt=prompt,
                     negative_prompt=negative_prompt,
                     generator=generator,

 import torch
 import gc
 import tempfile
+from diffusers.utils import export_to_video, load_image
+from video_model import video_pipe
 device = "cuda" if torch.cuda.is_available() else "cpu"
 def create_demo() -> gr.Blocks:
     @spaces.GPU(duration=60)
         run_task_time, time_cost_str = get_time_cost(run_task_time, time_cost_str)
         try:
             with torch.no_grad():
+                video = video_pipe(
                     prompt=prompt,
                     negative_prompt=negative_prompt,
                     generator=generator,

video_model.py ADDED Viewed

	@@ -0,0 +1,9 @@

+import torch
+from diffusers import LTXPipeline
+# Use the GPU when torch reports one, otherwise fall back to the CPU.
+device = "cuda" if torch.cuda.is_available() else "cpu"
+# Load the LTX-Video pipeline once, at import time, in bfloat16; the demo
+# modules import this single `video_pipe` object instead of loading their own.
+video_pipe = LTXPipeline.from_pretrained("Lightricks/LTX-Video", torch_dtype=torch.bfloat16)
+video_pipe.to(device)