Added CoreML support
chiefMarlin committed Aug 18, 2023
1 parent b8dbc70 commit 187c884
Showing 6 changed files with 294 additions and 72 deletions.
13 changes: 11 additions & 2 deletions README.md
@@ -14,7 +14,7 @@ Firescrew is a cutting-edge application written in Go that enables real-time obj
## Key Features
- **Real-Time Motion Detection**: Firescrew can detect motion from a live feed and provide real-time alerts.
- **Object Identification**: Identify specific objects like cars and people in real-time.
- **Model Flexibility**: Firescrew can use the latest YOLOv8 model or Coral EdgeTPU models for enhanced performance.
- **Model Flexibility**: Firescrew can use the latest YOLOv8 model, MobileNET with a Coral TPU, or YOLOv8s with CoreML (Mac only) for enhanced performance.
- **Performance**: Firescrew takes full advantage of Go's concurrency handling and speed, providing a high-performance solution for real-time image processing.
- **RTSP Network Camera Support**: Firescrew is compatible with RTSP network cameras, extending its applicability in a wide range of scenarios.
- **MQTT/Webhook/Script/Slack**: Firescrew can send events to MQTT/Webhook/Script/Slack for further processing.
@@ -23,6 +23,7 @@ Firescrew is a cutting-edge application written in Go that enables real-time obj

```
Things added/fixed in last 3 days:
- Added CoreML YoloV8s (Mac only)
- Added MQTT/Webhook/ScriptHook/Slack support!
- Added ffprobe timeout/Fixed MQTT port in template/Added docs page
- Added inference statistics and much more!
@@ -163,6 +164,15 @@ You can do this by running the following command:
pip3 install pycoral numpy Pillow
```
## Running YOLOv8s with CoreML (Mac only)
This has been tested on `M1/M2 macOS 13.4.1`; it works with `python3.10` but not `3.11`.
```bash
git clone https://github.com/8ff/firescrew && cd firescrew/assets
pip3.10 install coremltools Pillow
./objectDetectServerCoreML.py
```
Now, in your config.json file, set `"networkObjectDetectServer": "addr:8555"`, where `addr` is the IP of the machine running the above script, as shown in the example below.
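For example, if the Mac running objectDetectServerCoreML.py is reachable at `192.168.1.50` (an illustrative address), the relevant part of config.json would look like this (other fields omitted):
```json
{
  "networkObjectDetectServer": "192.168.1.50:8555"
}
```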
## RTSP Camera Stream URLs
Firescrew supports two different RTSP camera streams: a low resolution stream (`deviceUrl`) and a high resolution stream (`hiResDeviceUrl`). These streams are used for different purposes and should be set up accordingly.
The `deviceUrl` should be set to a low resolution video feed, typically around 640x360. This stream is used for motion detection. Note that the resolution of this stream significantly impacts the CPU usage. A higher resolution will lead to more CPU usage, so it is recommended to keep this stream at a lower resolution.
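As a sketch, assuming a camera at `192.168.1.20` whose substream is around 640x360 and whose main stream is full resolution (both URLs are placeholders; check your camera's documentation for the actual paths), the two entries in config.json might look like:
```json
{
  "deviceUrl": "rtsp://192.168.1.20:554/substream",
  "hiResDeviceUrl": "rtsp://192.168.1.20:554/mainstream"
}
```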
@@ -305,7 +315,6 @@ Your insights and perspectives are vital in shaping the future of Firescrew. Tog


## Roadmap
- Build a doc site
- GetDimensions Web UI
- Add benchmarks
- Add uploading footage to S3 compatible cloud host
assets/objectDetectServerCoral.py: file mode changed 100644 → 100755 (no content changes).
195 changes: 195 additions & 0 deletions assets/objectDetectServerCoreML.py
@@ -0,0 +1,195 @@
#!/usr/bin/env python3.10
# This runs on python 3.10
# pip3.10 install coremltools Pillow

import coremltools as ct
import numpy as np
import PIL.Image
import socket
import threading
import io
import json
import time
import traceback


# Load the Core ML model
# model_path = "./YOLOv3.mlmodel"
model_path = "./yolov8s.mlmodel"
model = ct.models.MLModel(model_path)
# print model details
# print(model)

# COCO-style label map used by this server; class indices without an entry are skipped
class_labels = {
0: 'person',
1: 'bicycle',
2: 'car',
3: 'motorcycle',
4: 'airplane',
5: 'bus',
6: 'train',
7: 'truck',
8: 'boat',
9: 'traffic light',
10: 'fire hydrant',
12: 'stop sign',
13: 'parking meter',
14: 'bench',
15: 'bird',
16: 'cat',
17: 'dog',
18: 'horse',
19: 'sheep',
20: 'cow',
21: 'elephant',
22: 'bear',
23: 'zebra',
24: 'giraffe',
26: 'backpack',
27: 'umbrella',
30: 'handbag',
31: 'tie',
32: 'suitcase',
33: 'frisbee',
34: 'skis',
35: 'snowboard',
36: 'sports ball',
37: 'kite',
38: 'baseball bat',
39: 'baseball glove',
40: 'skateboard',
41: 'surfboard',
42: 'tennis racket',
43: 'bottle',
45: 'wine glass',
46: 'cup',
47: 'fork',
48: 'knife',
49: 'spoon',
50: 'bowl',
51: 'banana',
52: 'apple',
53: 'sandwich',
54: 'orange',
55: 'broccoli',
56: 'carrot',
57: 'hot dog',
58: 'pizza',
59: 'donut',
60: 'cake',
61: 'chair',
62: 'couch',
63: 'potted plant',
64: 'bed',
66: 'dining table',
69: 'toilet',
71: 'tv',
72: 'laptop',
73: 'mouse',
74: 'remote',
75: 'keyboard',
76: 'cell phone',
77: 'microwave',
78: 'oven',
79: 'toaster',
80: 'sink',
81: 'refrigerator',
83: 'book',
84: 'clock',
85: 'vase',
86: 'scissors',
87: 'teddy bear',
88: 'hair drier',
89: 'toothbrush',
}

def load_image(data, resize_to=None):
    # Decode the JPEG bytes; if resize_to is given, paste the frame onto a blank
    # canvas of that size (no scaling), left-aligned and vertically centered.
    img = PIL.Image.open(io.BytesIO(data))
if resize_to is not None:
img_resized = PIL.Image.new('RGB', resize_to)
img_resized.paste(img, (0, (resize_to[1] - img.size[1]) // 2))
img = img_resized
img_np = np.array(img).astype(np.float32)
return img_np, img


def recvall(sock, count):
buf = b''
while count:
newbuf = sock.recv(count)
if not newbuf: return None
buf += newbuf
count -= len(newbuf)
return buf

def handle_client(conn):
try:
        while True:
            # Each request is a 4-byte big-endian length prefix followed by the raw JPEG frame
            frame_len_bytes = conn.recv(4)
            if not frame_len_bytes:
                break
            frame_len = int.from_bytes(frame_len_bytes, 'big')
frame_data = recvall(conn, frame_len)
if frame_data is None:
break

# Load and resize the image
img_np, img_resized = load_image(frame_data, resize_to=(640, 640))

# Run the model
out_dict = model.predict({'image': img_resized})

            # Extract the results.
            # The exported YOLOv8 model (with NMS) is expected to return:
            #   confidence:  (num_detections, num_classes)
            #   coordinates: (num_detections, 4) as normalized [x_center, y_center, width, height]
            predictions = []
            for det_idx, class_confidences in enumerate(out_dict['confidence']):
                class_id = int(np.argmax(class_confidences))
                confidence = float(class_confidences[class_id])
                if confidence <= 0 or class_id not in class_labels:
                    continue
                x_center, y_center, width, height = out_dict['coordinates'][det_idx]
                x_center *= 640  # Scale back to the 640x640 model input
                y_center = (y_center * 640) - 140  # Undo the vertical letterbox offset (assumes a 640x360 source frame)
                width *= 640  # Scale back to the 640x640 model input
                height = (height * 640) / 2  # Empirically halved to compensate for the letterboxing
                left = int(x_center - (width / 2))
                top = int(y_center - (height / 2))
                right = int(x_center + (width / 2))
                bottom = int(y_center + (height / 2))
                predictions.append({
                    'object': class_id + 1,
                    'class_name': class_labels[class_id],
                    'box': [left, top, right, bottom],
                    'confidence': confidence,
                })

# Convert the predictions to a JSON string
predictions_json = json.dumps(predictions)

            # Send the results back to the client as a newline-terminated JSON array
            conn.sendall((predictions_json + '\n').encode())
except Exception as e:
print(f"Exception handling client: {e}")
traceback.print_exc() # Print the full traceback
finally:
print("Closing connection")
conn.close()


def main():
LISTEN_ADDR = "0.0.0.0"
LISTEN_PORT = 8555

s = socket.socket(socket.AF_INET, socket.SOCK_STREAM)
s.setsockopt(socket.SOL_SOCKET, socket.SO_REUSEADDR, 1)
s.bind((LISTEN_ADDR, LISTEN_PORT))
s.listen(5)

print(f"Server is listening on {LISTEN_ADDR}:{LISTEN_PORT}")

while True:
conn, addr = s.accept()
print(f"Got connection from {addr}")
thread = threading.Thread(target=handle_client, args=(conn,))
thread.start()

if __name__ == "__main__":
main()
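The server above speaks a simple wire protocol: the client sends a 4-byte big-endian length prefix followed by the raw JPEG frame, and reads back a newline-terminated JSON array of predictions. A minimal test client sketch (the frame path and server address are placeholders, not part of the repository):
```python
#!/usr/bin/env python3
# Minimal test client for objectDetectServerCoreML.py (illustrative only).
# Assumes a JPEG frame at ./frame.jpg and the server listening on 127.0.0.1:8555.
import json
import socket

with open("frame.jpg", "rb") as f:
    frame = f.read()

with socket.create_connection(("127.0.0.1", 8555)) as sock:
    # 4-byte big-endian length prefix, then the raw JPEG bytes
    sock.sendall(len(frame).to_bytes(4, "big") + frame)

    # The server replies with one JSON array per frame, terminated by '\n'
    buf = b""
    while not buf.endswith(b"\n"):
        chunk = sock.recv(4096)
        if not chunk:
            break
        buf += chunk

predictions = json.loads(buf.decode() or "[]")
for p in predictions:
    print(p["class_name"], p["confidence"], p["box"])
```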
Binary file added: assets/yolov8s.mlmodel
Binary file added: doc/src/desktop.afdesign
