manfredmichael committed
Commit · 93c1293
1 Parent(s): d95d48a

Add pipeline
- .gitignore +4 -0
- app.py +101 -0
- pipelines.py +218 -0
.gitignore ADDED
@@ -0,0 +1,4 @@
+__pycache__/
+temps/*
+runs/*
+.ipynb_checkpoints/
app.py ADDED
@@ -0,0 +1,101 @@
+import os
+import time
+import uuid
+
+import numpy as np
+import streamlit as st
+from PIL import Image
+
+from utils import st_file_selector, img2base64
+from pipelines import ImagePipeline, VideoPipeline
+
+DEBUG = True
+
+
+def main():
+    st.markdown("###")
+    uploaded_file = st.file_uploader('Upload a picture', type=['mp4', 'jpg', 'jpeg', 'png'], accept_multiple_files=False)
+
+    with st.spinner('Loading samples...'):
+        while not os.path.isdir("sample_files"):
+            time.sleep(1)
+    st.markdown("### or")
+    selected_file = st_file_selector(st, path='sample_files', key='selected', label='Choose a sample image/video')
+
+    if uploaded_file:
+        random_id = uuid.uuid1()
+        base_folder = "temps"
+        filename = "{}.{}".format(random_id, uploaded_file.type.split("/")[-1])
+        file_type = uploaded_file.type.split("/")[0]
+        filepath = f"{base_folder}/{filename}"
+        if DEBUG:
+            st.write(filepath)
+        if uploaded_file.type == 'video/mp4':
+            with open(filepath, mode='wb') as f:
+                f.write(uploaded_file.read())
+            video_path = filepath
+            st.video(uploaded_file)
+        else:
+            img = Image.open(uploaded_file).convert('RGB')
+            st.image(img)
+    elif selected_file:
+        base_folder = "sample_files"
+        file_type = selected_file.split(".")[-1]
+        filepath = f"{base_folder}/{selected_file}"
+
+        if file_type == 'mp4':
+            with open(filepath, 'rb') as video_file:
+                st.video(video_file.read())
+            video_path = filepath
+        else:
+            img = Image.open(filepath).convert('RGB')
+            st.image(img)
+    else:
+        return
+
+    annotated_img = None
+    with st.spinner(f'Analyzing {file_type}...'):
+        if file_type in ('video', 'mp4'):
+            result = video_pipeline(video_path)
+        else:
+            result, annotated_img = image_pipeline({'images': [img2base64(np.array(img))]}, draw_bbox=True)
+
+    if annotated_img is not None:
+        st.image(annotated_img)
+
+    if 'incorrectly' in result['message']:
+        st.error(result['message'], icon="🚨")
+    else:
+        st.success(result['message'], icon="✅")
+
+    st.divider()
+    st.write('## Response JSON')
+    st.write(result)
+
+
+def setup():
+    if not os.path.isdir("temps"):
+        os.makedirs("temps")
+
+
+if __name__ == "__main__":
+    image_pipeline = ImagePipeline()
+    video_pipeline = VideoPipeline()
+
+    st.title("Improper Mask Wearing Detection")
+    setup()
+    main()
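Both files import helpers (st_file_selector, img2base64, readb64) from a utils module that is not part of this commit. A minimal sketch of what those helpers plausibly look like, so the diff reads self-contained; the names and signatures come from the calls above, but the bodies here are assumptions, not the committed code:

# utils.py: hypothetical sketch, not the committed file
import base64
import os

import cv2
import numpy as np


def img2base64(img):
    # Assumed: RGB numpy array -> base64-encoded JPEG string
    _, buffer = cv2.imencode('.jpg', cv2.cvtColor(img, cv2.COLOR_RGB2BGR))
    return base64.b64encode(buffer.tobytes()).decode('utf-8')


def readb64(encoded):
    # Assumed: base64 string -> RGB numpy array
    data = np.frombuffer(base64.b64decode(encoded), dtype=np.uint8)
    return cv2.cvtColor(cv2.imdecode(data, cv2.IMREAD_COLOR), cv2.COLOR_BGR2RGB)


def st_file_selector(st, path='.', key=None, label='Select a file'):
    # Assumed: a Streamlit selectbox over the files under `path`
    return st.selectbox(label, sorted(os.listdir(path)), key=key)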
pipelines.py ADDED
@@ -0,0 +1,218 @@
+from ultralytics import YOLO
+import numpy as np
+import cv2
+import torch
+
+from utils import readb64
+
+model_int8 = YOLO('weights/best.torchscript', task='detect')
+
+labels = {
+    0: 'mask_weared_incorrect',
+    1: 'with_mask',
+    2: 'without_mask',
+}
+
+
+def inference_on_image(path):
+    results = model_int8(path)
+
+    # cv2.imread takes an IMREAD_* flag, not a color-conversion code
+    img = cv2.imread(path)
+    for box in results[0].boxes:
+        img = draw_bbox_prediction(img, box)
+
+    cv2.imshow('Detected Image', img)
+    cv2.waitKey(0)
+    cv2.destroyAllWindows()
+
+    return results
+
+
+def inference_on_video(path, vid_stride=10):
+    results = model_int8(path, vid_stride=vid_stride, stream=True)
+
+    cap = cv2.VideoCapture(path)
+
+    frame_counter = 0
+    while True:
+        ret, img = cap.read()
+        if ret:
+            # Run detection every vid_stride frames; reuse the latest
+            # result to annotate the frames in between.
+            if frame_counter % vid_stride == 0:
+                result = next(results)
+            for box in result.boxes:
+                img = draw_bbox_prediction(img, box)
+        else:
+            cap.release()
+            break
+
+        cv2.imshow('Detected Image', img)
+        frame_counter += 1
+
+        k = cv2.waitKey(5) & 0xFF
+        if k == 27:  # Esc quits
+            cap.release()
+            cv2.destroyAllWindows()
+            break
+
+    return results
+
+
+def draw_bbox_prediction(img, box):
+    cls = int(box.cls.item())
+    confidence = box.conf.item()
+    label = labels[cls]
+
+    x1, y1, x2, y2 = map(int, list(box.xyxy.numpy()[0]))
+    # Scale line thickness and font size with the box width
+    scaler = (x2 - x1) / (640 / 8)
+    cv2.rectangle(img, (x1, y1), (x2, y2), (0, 102, 255), max(1, int(2 * scaler)))
+    img = cv2.rectangle(img, (x1, y1 - int(20 * scaler)), (x1 + (x2 - x1) * 3, y1), (0, 102, 255), -1)
+    img = cv2.putText(img, "{}: {:.3f}".format(label, confidence), (x1, y1 - 5),
+                      cv2.FONT_HERSHEY_SIMPLEX, 0.6 * scaler, (255, 255, 255), max(1, int(scaler)))
+    return img
+
+
+class ImagePipeline:
+    def __init__(self, device='cpu', gpu_id=0, weights='weights/best.torchscript'):
+        self.model = YOLO(weights, task='detect')
+
+    def preprocess(self, data):
+        image_base64 = data.pop("images", data)
+
+        if not isinstance(image_base64, list):
+            image_base64 = [image_base64]
+        elif len(image_base64) > 1:
+            raise Exception("ImagePipeline only accepts 1 image/frame")
+
+        images = [readb64(image) for image in image_base64]
+        return images
+
+    def inference(self, images):
+        results = self.model(images[0])
+        return results
+
+    def get_response(self, inference_result):
+        response = []
+
+        # Classes 0 (mask_weared_incorrect) and 2 (without_mask) signal a problem
+        if not set([0, 2]).intersection(inference_result[0].boxes.cls.numpy()):
+            message = "Everyone is wearing a mask correctly"
+        else:
+            message = "Someone is not wearing a mask or is wearing a mask incorrectly"
+
+        for i, result in enumerate(inference_result):
+            for xywhn, cls, conf in zip(
+                result.boxes.xywhn,
+                result.boxes.cls,
+                result.boxes.conf
+            ):
+                xywhn = list(xywhn.numpy())
+                response.append({
+                    'xywhn': {
+                        'x': float(xywhn[0]),
+                        'y': float(xywhn[1]),
+                        'w': float(xywhn[2]),
+                        'h': float(xywhn[3]),
+                    },
+                    'class': cls.item(),
+                    'confidence': conf.item(),
+                })
+
+        return {'results': response,
+                'message': message}
+
+    def draw_bbox(self, images, inference_result):
+        img = np.array(images[0])
+        boxes = list(inference_result[0].boxes)
+        boxes.reverse()
+
+        for box in boxes:
+            img = draw_bbox_prediction(img, box)
+
+        return img
+
+    def __call__(self, data, config_payload=None, draw_bbox=False):
+        images = self.preprocess(data)
+        inference_result = self.inference(images)
+        response = self.get_response(inference_result)
+        if draw_bbox:
+            annotated_img = self.draw_bbox(images, inference_result)
+            return response, annotated_img
+        return response
+
+
+class VideoPipeline:
+    def __init__(self, device='cpu', gpu_id=0, weights='weights/best.torchscript'):
+        self.model = YOLO(weights, task='detect')
+
+    def preprocess(self, data):
+        return data
+
+    def inference(self, video_path, vid_stride=30):
+        results = self.model(video_path, vid_stride=vid_stride)
+        return results
+
+    def get_response(self, inference_result):
+        response = []
+
+        # Default message; overridden if any sampled frame contains a problem class
+        message = "Everyone is wearing a mask correctly"
+
+        for i, result in enumerate(inference_result):
+            if set([0, 2]).intersection(result.boxes.cls.numpy()):
+                message = "Someone is not wearing a mask or is wearing a mask incorrectly"
+
+            for xywhn, cls, conf in zip(
+                result.boxes.xywhn,
+                result.boxes.cls,
+                result.boxes.conf
+            ):
+                xywhn = list(xywhn.numpy())
+                response.append({
+                    'xywhn': {
+                        'x': float(xywhn[0]),
+                        'y': float(xywhn[1]),
+                        'w': float(xywhn[2]),
+                        'h': float(xywhn[3]),
+                    },
+                    'class': cls.item(),
+                    'confidence': conf.item(),
+                })
+
+        return {'results': response,
+                'message': message}
+
+    def __call__(self, data, config_payload=None):
+        data = self.preprocess(data)
+        inference_result = self.inference(data)
+        response = self.get_response(inference_result)
+        return response
+
+
+if __name__ == '__main__':
+    import argparse
+
+    parser = argparse.ArgumentParser(formatter_class=argparse.ArgumentDefaultsHelpFormatter)
+    parser.add_argument('--input_type',
+                        default='image',
+                        const='image',
+                        nargs='?',
+                        choices=['image', 'video'],
+                        help='type of input (default: %(default)s)')
+    parser.add_argument("-p", "--path", help="filepath")
+    args = parser.parse_args()
+
+    if args.input_type == 'image':
+        results = inference_on_image(args.path)
+    elif args.input_type == 'video':
+        results = inference_on_video(args.path)
+
+    print(results)
+
+
+# Examples
+# python pipelines.py --input_type image --path sample_files/image-1.jpeg
+# python pipelines.py --input_type video --path sample_files/video-1.mp4