Spaces:

becteur92
/

smollvm

Paused

App Files Community

youssef committed about 22 hours ago

Commit

c9f0527

1 Parent(s): 3ad5e22

fix dockerfile

Browse files

Files changed (2) hide show

Dockerfile +1 -0
src/video_processor/processor.py +31 -23

Dockerfile CHANGED Viewed

@@ -1,4 +1,5 @@
 FROM nvidia/cuda:12.3.2-cudnn9-devel-ubuntu22.04
 ENV DEBIAN_FRONTEND=noninteractive
 RUN apt-get update && \
     apt-get upgrade -y && \

 FROM nvidia/cuda:12.3.2-cudnn9-devel-ubuntu22.04
 ENV DEBIAN_FRONTEND=noninteractive
 RUN apt-get update && \
     apt-get upgrade -y && \

src/video_processor/processor.py CHANGED Viewed

@@ -65,34 +65,42 @@ class VideoAnalyzer:
     def analyze_segment(self, video_path: str, start_time: float) -> str:
         """Analyze a single video segment."""
         messages = [
             {
-                "role": "system",
-                "content": [{"type": "text", "text": """You are a detailed video analysis assistant. Analyze and describe:
-1. People: their appearance, actions, and interactions
-2. Environment: location, weather, time of day, lighting
-3. Objects: key items, their positions and movements
-4. Text: any visible text, signs, or captions
-5. Events: what is happening in sequence
-6. Visual details: colors, patterns, visual effects
-Be specific about timing and details to enable searching through the video later."""}]
-            },
             {
-                "role": "user",
-                "content": [
-                    {"type": "video", "path": video_path},
-                    {"type": "text", "text": """Describe this segment comprehensively. Include:
-- Who appears and what are they doing?
-- What is the environment and weather like?
-- What objects or items are visible?
-- Is there any text visible on screen?
-- What actions or events are occurring?
-- Note any significant visual details
-Be specific about all visual elements to enable searching later."""}
-                ]
             }
         ]
         inputs = self.processor.apply_chat_template(
             messages,
             add_generation_prompt=True,

     def analyze_segment(self, video_path: str, start_time: float) -> str:
         """Analyze a single video segment."""
         messages = [
+    {
+        "role": "system",
+        "content": [
             {
+                "type": "text",
+                "text": (
+                    "You are an AI specialized in video content analysis. "
+                    "Your task is to watch the provided video segment and generate a detailed, structured description focusing on the following elements:\n"
+                    "1. **People and Their Actions:** Identify all individuals, their appearances, and describe their activities or interactions.\n"
+                    "2. **Environment and Setting:** Describe the location, time of day, weather conditions, and any notable background details.\n"
+                    "3. **Objects and Their Positions:** List prominent objects, their attributes, and spatial relationships within the scene.\n"
+                    "4. **On-Screen Text:** Transcribe any visible text, including signs, labels, or subtitles, and specify their locations.\n"
+                    "5. **Key Events and Timing:** Outline significant events, actions, or changes, along with their timestamps.\n\n"
+                    "Provide the information in a clear and concise manner, using bullet points or numbered lists where appropriate."
+                )
+            }
+        ]
+    },
+    {
+        "role": "user",
+        "content": [
+            {"type": "video", "path": video_path},
             {
+                "type": "text",
+                "text": (
+                    "Please analyze the attached video segment and provide a structured description as per the guidelines above. "
+                    "If certain elements are not present in the video, you may omit them from your response."
+                )
             }
         ]
+    }
+]
         inputs = self.processor.apply_chat_template(
             messages,
             add_generation_prompt=True,