Commit 6b8e3c4 · jens committed
depth estimation
1 parent: 0ef8343

Files changed:
- app.py +7 -10
- inference.py +55 -0
- requirements.txt +2 -1
- tests.py +0 -0
app.py CHANGED
@@ -1,20 +1,17 @@
 import gradio as gr
 from segment_anything import SamAutomaticMaskGenerator, sam_model_registry
 import supervision as sv
+from inference import DepthPredictor, SegmentPredictor



 def snap(image, video):
-
-
-
-
-
-
-    mask_annotator = sv.MaskAnnotator()
-    detections = sv.Detections.from_sam(sam_result=sam_result)
-    annotated_image = mask_annotator.annotate(scene=image.copy(), detections=detections)
-    return [annotated_image, video]
+    depth_predictor = DepthPredictor()
+    #segment_predictor = SegmentPredictor()
+    #sam_result = segment_predictor.predict(image)
+    depth_result = depth_predictor.predict(image)
+
+    return [depth_result, video]


 demo = gr.Interface(
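The diff view cuts off at the opening of demo = gr.Interface(. For orientation only, here is a minimal sketch of how snap could plausibly be wired up; the component choices below are assumptions, not part of the commit, though gr.Image(type="pil") is at least consistent with DepthPredictor.predict, which reads image.size and therefore expects a PIL image:

# hypothetical continuation of app.py; the real component list is not shown in the diff
demo = gr.Interface(
    fn=snap,
    inputs=[gr.Image(type="pil"), gr.Video()],
    outputs=[gr.Image(), gr.Video()],
)

if __name__ == "__main__":
    demo.launch()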
inference.py ADDED
@@ -0,0 +1,55 @@
+from transformers import DPTImageProcessor, DPTForDepthEstimation
+from segment_anything import SamAutomaticMaskGenerator, sam_model_registry
+import gradio as gr
+import supervision as sv
+import torch
+import numpy as np
+from PIL import Image
+import requests
+
+
+class DepthPredictor:
+    def __init__(self):
+        self.device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
+        # the image processor is not a torch module, so it has no .to() and stays on CPU
+        self.processor = DPTImageProcessor.from_pretrained("Intel/dpt-large")
+        self.model = DPTForDepthEstimation.from_pretrained("Intel/dpt-large").to(self.device)
+        self.model.eval()
+
+    def predict(self, image):
+        # prepare the (PIL) image for the model
+        inputs = self.processor(images=image, return_tensors="pt").to(self.device)
+        with torch.no_grad():
+            outputs = self.model(**inputs)
+            predicted_depth = outputs.predicted_depth
+
+        # interpolate back to the original image size
+        prediction = torch.nn.functional.interpolate(
+            predicted_depth.unsqueeze(1),
+            size=image.size[::-1],
+            mode="bicubic",
+            align_corners=False,
+        )
+
+        # visualize the prediction as an 8-bit grayscale image
+        output = prediction.squeeze().cpu().numpy()
+        formatted = (output * 255 / np.max(output)).astype("uint8")
+        depth = Image.fromarray(formatted)
+        return depth
+
+
+class SegmentPredictor:
+    def __init__(self):
+        MODEL_TYPE = "vit_b"
+        checkpoint = "sam_vit_b_01ec64.pth"
+        sam = sam_model_registry[MODEL_TYPE](checkpoint=checkpoint)
+        self.mask_generator = SamAutomaticMaskGenerator(sam)
+
+    def predict(self, image):
+        sam_result = self.mask_generator.generate(image)
+        mask_annotator = sv.MaskAnnotator()
+        detections = sv.Detections.from_sam(sam_result=sam_result)
+        annotated_image = mask_annotator.annotate(scene=image.copy(), detections=detections)
+        return [annotated_image]
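A minimal usage sketch for the two new classes, assuming a local example.jpg and the SAM checkpoint sam_vit_b_01ec64.pth in the working directory. Note the input-type asymmetry: DepthPredictor.predict reads image.size, so it wants a PIL image, while SamAutomaticMaskGenerator.generate wants an (H, W, 3) uint8 numpy array:

from PIL import Image
import numpy as np

from inference import DepthPredictor, SegmentPredictor

image = Image.open("example.jpg").convert("RGB")  # hypothetical input file

depth = DepthPredictor().predict(image)   # PIL image in, grayscale PIL depth map out
depth.save("depth.png")

annotated = SegmentPredictor().predict(np.array(image))[0]  # numpy array in, [annotated image] out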
requirements.txt CHANGED
@@ -4,4 +4,5 @@ segment-anything
 supervision
 torch
 torchvision
-opencv-python
+opencv-python
+transformers
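One gap requirements.txt cannot cover: SegmentPredictor hard-codes the checkpoint sam_vit_b_01ec64.pth, which pip does not install. A sketch of fetching it with requests (which inference.py already imports but never uses), from the official segment-anything release URL for the ViT-B weights:

import requests

# official download location for the SAM ViT-B checkpoint
url = "https://dl.fbaipublicfiles.com/segment_anything/sam_vit_b_01ec64.pth"
with open("sam_vit_b_01ec64.pth", "wb") as f:
    f.write(requests.get(url).content)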
tests.py ADDED
File without changes (empty file)