# wyzely-detect/wyzely_detect/__main__.py

# import face_recognition
from pathlib import Path

import cv2

# import hjson as json
import torch
from ultralytics import YOLO

from .utils import notify, utils
from .utils.cli_args import argparser

# strftime/strptime-style timestamp pattern (not referenced elsewhere in this module's visible code).
DATETIME_FORMAT = "%Y-%m-%d %H:%M:%S"
# Parsed command-line arguments; assigned in main() from argparser.parse_args().
args = None

# Shared detection state that main() passes to, and receives back from,
# notify.thing_detected().
#   "objects": filled in by main() on the first result with one entry per model
#              class name, each holding last_detection_time, detection_duration
#              and last_notification_time (all initially None).
#   "peoples": never populated in this module; presumably managed by
#              notify.thing_detected() for recognized faces - verify in notify.py.
objects_and_peoples = {
    "objects": {},
    "peoples": {},
}


def main():
    """Run the detection loop on a video stream or capture device.

    Parses the command-line arguments, loads the YOLOv8 nano model, opens the
    video source (``args.url`` if given, otherwise ``args.capture_device``) and
    then, for every frame read:

    * runs the model on a copy of the frame scaled by ``args.run_scale``;
    * if ``args.faces_directory`` is an existing directory, calls
      ``utils.recognize_face`` and reports any match via
      ``notify.thing_detected`` with ``detection_type="peoples"``;
    * reports every detected box that passes the confidence and
      ``args.detect_object`` filters via ``notify.thing_detected`` with
      ``detection_type="objects"``;
    * draws the collected boxes with ``utils.plot_label`` and, unless
      ``args.no_display`` is set, shows the frame in a window.

    The loop ends when ``q`` is pressed or when the video source stops
    delivering frames. The capture handle and any OpenCV windows are released
    on every exit path, including exceptions.

    Side effects: rebinds the module-level ``args`` and ``objects_and_peoples``.
    """
    global objects_and_peoples
    global args
    # RUN_BY_COMPOSE = os.getenv("RUN_BY_COMPOSE") # Replace this with code to check for gpu

    args = argparser.parse_args()

    # Check if a CUDA GPU is available. If it is, set it via torch. If not, fall back to cpu
    # https://github.com/ultralytics/ultralytics/issues/3084#issuecomment-1732433168
    # Currently, I have been unable to set up Poetry to use GPU for Torch
    for device_index in range(torch.cuda.device_count()):
        print(torch.cuda.get_device_properties(device_index).name)
    if torch.cuda.is_available():
        torch.cuda.set_device(0)
        print("Set CUDA device")
    else:
        print("No CUDA device available, using CPU")

    model = YOLO("yolov8n.pt")

    # Depending on if the user wants to use a stream or a capture device,
    # set the video capture to the appropriate source
    if args.url:
        video_capture = cv2.VideoCapture(args.url)
    else:
        video_capture = cv2.VideoCapture(args.capture_device)

    # Everything after the capture is opened runs under try/finally so the
    # handle and windows are released even if processing a frame raises.
    try:
        # Eliminate lag by setting the buffer size to 1
        # This makes it so that the video capture will only grab the most recent frame
        # However, this means that the video may be choppy
        video_capture.set(cv2.CAP_PROP_BUFFERSIZE, 1)

        # Print the resolution of the video
        print(
            f"Video resolution: {video_capture.get(cv2.CAP_PROP_FRAME_WIDTH)}x{video_capture.get(cv2.CAP_PROP_FRAME_HEIGHT)}"  # noqa: E501
        )

        print("Beginning video capture...")
        while True:
            # Grab a single frame of video
            ret, frame = video_capture.read()
            if not ret or frame is None:
                # The source is closed, ended, or failed to deliver a frame;
                # cv2.resize() would raise on a missing frame, so stop cleanly.
                print("Failed to read a frame from the video source, stopping")
                break

            # Resize frame of video to a smaller size for faster recognition processing
            run_frame = cv2.resize(
                frame, (0, 0), fx=args.run_scale, fy=args.run_scale
            )
            # view_frame = cv2.resize(frame, (0, 0), fx=args.view_scale, fy=args.view_scale)

            results = model(run_frame, verbose=False)

            # Re-checked on every frame so the faces directory can appear or
            # disappear while the program is running.
            path_to_faces = Path(args.faces_directory)
            path_to_faces_exists = path_to_faces.is_dir()

            for i, r in enumerate(results):
                # list of dicts with each dict containing a label, x1, y1, x2, y2
                plot_boxes = []

                # The following is stuff for people
                # This is still in the for loop as each result, no matter if anything is detected, will be present.
                # Thus, there will always be one result (r)

                # Only run if path_to_faces exists
                if path_to_faces_exists:
                    if face_details := utils.recognize_face(
                        path_to_directory=path_to_faces,
                        run_frame=run_frame,
                        min_confidence=args.face_confidence_threshold,
                    ):
                        plot_boxes.append(face_details)
                        objects_and_peoples = notify.thing_detected(
                            thing_name=face_details["label"],
                            objects_and_peoples=objects_and_peoples,
                            detection_type="peoples",
                            detection_window=args.detection_window,
                            detection_duration=args.detection_duration,
                            notification_window=args.notification_window,
                            ntfy_url=args.ntfy_url,
                        )

                # The following is stuff for objects
                # Setup dictionary of object names (only while it is still empty or None)
                if not objects_and_peoples["objects"]:
                    # Build a fresh dict rather than assigning into the old
                    # value, so a None placeholder is handled as well as {}.
                    objects_and_peoples["objects"] = {
                        name: {
                            "last_detection_time": None,
                            "detection_duration": None,
                            # "first_detection_time": None,
                            "last_notification_time": None,
                        }
                        for name in r.names.values()
                    }
                    # Also, make sure that the objects to detect are names the model knows.
                    # The lookup must be against the "objects" sub-dict: the top-level
                    # dict only has the keys "objects" and "peoples".
                    for obj in args.detect_object:
                        if obj not in objects_and_peoples["objects"]:
                            print(
                                f"Warning: {obj} is not in the list of objects the model can detect!"
                            )

                for box in r.boxes:
                    # Get the name of the object
                    class_id = r.names[box.cls[0].item()]
                    # Get the coordinates of the object
                    cords = box.xyxy[0].tolist()
                    cords = [round(x) for x in cords]
                    # Get the confidence
                    conf = round(box.conf[0].item(), 2)

                    if conf < args.object_confidence_threshold or (
                        class_id not in args.detect_object and args.detect_object != []
                    ):
                        # If the confidence is too low
                        # or if the object is not in the list of objects to detect and the list of objects to detect is not empty
                        # then skip this iteration
                        continue

                    # Add the object to the list of objects to plot
                    plot_boxes.append(
                        {
                            "label": class_id,
                            "x1": cords[0],
                            "y1": cords[1],
                            "x2": cords[2],
                            "y2": cords[3],
                        }
                    )

                    objects_and_peoples = notify.thing_detected(
                        thing_name=class_id,
                        objects_and_peoples=objects_and_peoples,
                        detection_type="objects",
                        detection_window=args.detection_window,
                        detection_duration=args.detection_duration,
                        notification_window=args.notification_window,
                        ntfy_url=args.ntfy_url,
                    )

                # To debug plotting, use r.plot() to cross reference the bounding boxes drawn by the plot_label() and r.plot()
                frame_to_show = utils.plot_label(
                    boxes=plot_boxes,
                    full_frame=frame,
                    # full_frame=r.plot(),
                    run_scale=args.run_scale,
                    view_scale=args.view_scale,
                )

                # Display the resulting frame
                if not args.no_display:
                    cv2.imshow(f"Video{i}", frame_to_show)

            # Hit 'q' on the keyboard to quit!
            if cv2.waitKey(1) & 0xFF == ord("q"):
                break
    finally:
        # Release handle to the webcam
        print("Releasing video capture")
        video_capture.release()
        cv2.destroyAllWindows()


# Allow the module to be executed directly as a script as well as imported.
if __name__ == "__main__":
    main()
Simple object detection 2023-10-02 01:56:40 +01:00			`# import face_recognition`
			`from pathlib import Path`
Move argparse code to `cli_args.py` 2023-10-27 16:54:36 +01:00
			`import cv2`
Added notification stuff 2023-10-05 03:03:11 +01:00
Simple object detection 2023-10-02 01:56:40 +01:00			`# import hjson as json`
			`import torch`
			`from ultralytics import YOLO`

Move argparse code to `cli_args.py` 2023-10-27 16:54:36 +01:00			`from .utils import notify, utils`
			`from .utils.cli_args import argparser`
Simple object detection 2023-10-02 01:56:40 +01:00
			`DATETIME_FORMAT = "%Y-%m-%d %H:%M:%S"`
			`args = None`

Manage timers in notify.py 2023-10-14 21:40:36 +01:00			`objects_and_peoples = {`
			`"objects": {},`
			`"peoples": {},`
			`}`
Added notification stuff 2023-10-05 03:03:11 +01:00

Simple object detection 2023-10-02 01:56:40 +01:00			`def main():`
Manage timers in notify.py 2023-10-14 21:40:36 +01:00			`global objects_and_peoples`
Simple object detection 2023-10-02 01:56:40 +01:00			`global args`
			`# RUN_BY_COMPOSE = os.getenv("RUN_BY_COMPOSE") # Replace this with code to check for gpu`

Added flags for timers 2023-10-06 02:17:31 +01:00
Simple object detection 2023-10-02 01:56:40 +01:00			`args = argparser.parse_args()`

Changed repo URL and added repo to pyproject.toml 2023-10-22 22:53:29 +01:00			`# Check if a CUDA GPU is available. If it is, set it via torch. If not, set it to cpu`
Simple object detection 2023-10-02 01:56:40 +01:00			`# https://github.com/ultralytics/ultralytics/issues/3084#issuecomment-1732433168`
Added notification stuff 2023-10-05 03:03:11 +01:00			`# Currently, I have been unable to set up Poetry to use GPU for Torch`
Turn off verbose output Also print object type 2023-10-04 03:03:39 +01:00			`for i in range(torch.cuda.device_count()):`
			`print(torch.cuda.get_device_properties(i).name)`
			`if torch.cuda.is_available():`
Simple object detection 2023-10-02 01:56:40 +01:00			`torch.cuda.set_device(0)`
			`print("Set CUDA device")`
Added notification stuff 2023-10-05 03:03:11 +01:00			`else:`
Simple object detection 2023-10-02 01:56:40 +01:00			`print("No CUDA device available, using CPU")`
Added notification stuff 2023-10-05 03:03:11 +01:00
Simple object detection 2023-10-02 01:56:40 +01:00			`model = YOLO("yolov8n.pt")`

Add `--url` Don't use Pytorch GPU 2023-10-06 00:40:53 +01:00			`# Depending on if the user wants to use a stream or a capture device,`
			`# Set the video capture to the appropriate source`
			`if args.url:`
			`video_capture = cv2.VideoCapture(args.url)`
			`else:`
			`video_capture = cv2.VideoCapture(args.capture_device)`

Simple object detection 2023-10-02 01:56:40 +01:00			`# Eliminate lag by setting the buffer size to 1`
			`# This makes it so that the video capture will only grab the most recent frame`
			`# However, this means that the video may be choppy`
			`video_capture.set(cv2.CAP_PROP_BUFFERSIZE, 1)`

			`# Print the resolution of the video`
			`print(`
			`f"Video resolution: {video_capture.get(cv2.CAP_PROP_FRAME_WIDTH)}x{video_capture.get(cv2.CAP_PROP_FRAME_HEIGHT)}" # noqa: E501`
			`)`

			`print("Beginning video capture...")`
			`while True:`
			`# Grab a single frame of video`
			`ret, frame = video_capture.read()`
			`# Only process every other frame of video to save time`
			`# Resize frame of video to a smaller size for faster recognition processing`
			`run_frame = cv2.resize(frame, (0, 0), fx=args.run_scale, fy=args.run_scale)`
Manually plot boxes, rather than using `r.plot()` 2023-10-13 23:44:38 +01:00			`# view_frame = cv2.resize(frame, (0, 0), fx=args.view_scale, fy=args.view_scale)`
Added notification stuff 2023-10-05 03:03:11 +01:00
Turn off verbose output Also print object type 2023-10-04 03:03:39 +01:00			`results = model(run_frame, verbose=False)`
Check if face directory exists; switch to ArcFace Other fixes: * Improve error handling during face recognition * Change VS Code run configuration name * Update `deepface-test.ipynb` * Reset version to `0.1.0` (not pushed to PyPi yet) 2023-10-22 18:02:07 +01:00
			`path_to_faces = Path(args.faces_directory)`
Format code 2023-10-22 22:54:30 +01:00			`path_to_faces_exists = path_to_faces.is_dir()`
Check if face directory exists; switch to ArcFace Other fixes: * Improve error handling during face recognition * Change VS Code run configuration name * Update `deepface-test.ipynb` * Reset version to `0.1.0` (not pushed to PyPi yet) 2023-10-22 18:02:07 +01:00
Manually plot boxes, rather than using `r.plot()` 2023-10-13 23:44:38 +01:00			`for i, r in enumerate(results):`
			`# list of dicts with each dict containing a label, x1, y1, x2, y2`
			`plot_boxes = []`
Fix facial recognition Scaling still seems to be imperfect 2023-10-14 23:37:42 +01:00
			`# The following is stuff for people`
			`# This is still in the for loop as each result, no matter if anything is detected, will be present.`
			`# Thus, there will always be one result (r)`
Check if face directory exists; switch to ArcFace Other fixes: * Improve error handling during face recognition * Change VS Code run configuration name * Update `deepface-test.ipynb` * Reset version to `0.1.0` (not pushed to PyPi yet) 2023-10-22 18:02:07 +01:00
			`# Only run if path_to_faces exists`
			`# May be better to check every iteration, but this also works`
			`if path_to_faces_exists:`
			`if face_details := utils.recognize_face(`
Add `--face-confidence-threshold` 2023-10-27 17:23:44 +01:00			`path_to_directory=path_to_faces, run_frame=run_frame, min_confidence=args.face_confidence_threshold`
Check if face directory exists; switch to ArcFace Other fixes: * Improve error handling during face recognition * Change VS Code run configuration name * Update `deepface-test.ipynb` * Reset version to `0.1.0` (not pushed to PyPi yet) 2023-10-22 18:02:07 +01:00			`):`
			`plot_boxes.append(face_details)`
			`objects_and_peoples = notify.thing_detected(`
			`thing_name=face_details["label"],`
			`objects_and_peoples=objects_and_peoples,`
			`detection_type="peoples",`
			`detection_window=args.detection_window,`
			`detection_duration=args.detection_duration,`
			`notification_window=args.notification_window,`
			`ntfy_url=args.ntfy_url,`
			`)`
Fix facial recognition Scaling still seems to be imperfect 2023-10-14 23:37:42 +01:00
			`# The following is stuff for objects`
Added notification stuff 2023-10-05 03:03:11 +01:00			`# Setup dictionary of object names`
Fixed scaling :tada: 2023-10-15 01:25:27 +01:00			`if (`
			`objects_and_peoples["objects"] == {}`
			`or objects_and_peoples["objects"] is None`
			`):`
Added notification stuff 2023-10-05 03:03:11 +01:00			`for name in r.names.values():`
Manage timers in notify.py 2023-10-14 21:40:36 +01:00			`objects_and_peoples["objects"][name] = {`
Added notification stuff 2023-10-05 03:03:11 +01:00			`"last_detection_time": None,`
			`"detection_duration": None,`
			`# "first_detection_time": None,`
Don't spam notifications 2023-10-06 01:12:42 +01:00			`"last_notification_time": None,`
Actually (?) fixed notification spam! 2023-10-06 02:00:12 +01:00			`}`
Manage timers in notify.py 2023-10-14 21:40:36 +01:00			`# Also, make sure that the objects to detect are in the list of objects_and_peoples`
Optionally only detect specific objects 2023-10-14 00:13:46 +01:00			`# If it isn't, print a warning`
			`for obj in args.detect_object:`
Manage timers in notify.py 2023-10-14 21:40:36 +01:00			`if obj not in objects_and_peoples:`
Format 2023-10-14 00:16:55 +01:00			`print(`
			`f"Warning: {obj} is not in the list of objects the model can detect!"`
			`)`

Turn off verbose output Also print object type 2023-10-04 03:03:39 +01:00			`for box in r.boxes:`
			`# Get the name of the object`
			`class_id = r.names[box.cls[0].item()]`
			`# Get the coordinates of the object`
			`cords = box.xyxy[0].tolist()`
			`cords = [round(x) for x in cords]`
			`# Get the confidence`
			`conf = round(box.conf[0].item(), 2)`
			`# Print it out, adding a spacer between each object`
Added notification stuff 2023-10-05 03:03:11 +01:00			`# print("Object type:", class_id)`
			`# print("Coordinates:", cords)`
			`# print("Probability:", conf)`
			`# print("---")`

Actually (?) fixed notification spam! 2023-10-06 02:00:12 +01:00			`# Now do stuff (if conf > 0.5)`
Add `--face-confidence-threshold` 2023-10-27 17:23:44 +01:00			`if conf < args.object_confidence_threshold or (`
Format 2023-10-14 00:16:55 +01:00			`class_id not in args.detect_object and args.detect_object != []`
			`):`
Optionally only detect specific objects 2023-10-14 00:13:46 +01:00			`# If the confidence is too low`
			`# or if the object is not in the list of objects to detect and the list of objects to detect is not empty`
			`# then skip this iteration`
Actually (?) fixed notification spam! 2023-10-06 02:00:12 +01:00			`continue`

Manually plot boxes, rather than using `r.plot()` 2023-10-13 23:44:38 +01:00			`# Add the object to the list of objects to plot`
			`plot_boxes.append(`
			`{`
			`"label": class_id,`
			`"x1": cords[0],`
			`"y1": cords[1],`
			`"x2": cords[2],`
			`"y2": cords[3],`
			`}`
			`)`

Fixed scaling :tada: 2023-10-15 01:25:27 +01:00			`objects_and_peoples = notify.thing_detected(`
Manage timers in notify.py 2023-10-14 21:40:36 +01:00			`thing_name=class_id,`
			`objects_and_peoples=objects_and_peoples,`
			`detection_type="objects",`
			`detection_window=args.detection_window,`
			`detection_duration=args.detection_duration,`
			`notification_window=args.notification_window,`
			`ntfy_url=args.ntfy_url,`
			`)`
Added notification stuff 2023-10-05 03:03:11 +01:00
Fixed scaling :tada: 2023-10-15 01:25:27 +01:00			`# To debug plotting, use r.plot() to cross reference the bounding boxes drawn by the plot_label() and r.plot()`
Manually plot boxes, rather than using `r.plot()` 2023-10-13 23:44:38 +01:00			`frame_to_show = utils.plot_label(`
			`boxes=plot_boxes,`
			`full_frame=frame,`
			`# full_frame=r.plot(),`
			`run_scale=args.run_scale,`
			`view_scale=args.view_scale,`
			`)`
Format 2023-10-14 00:16:55 +01:00
Manually plot boxes, rather than using `r.plot()` 2023-10-13 23:44:38 +01:00			`# Display the resulting frame`
			`# cv2.imshow("", r)`
Fixed Docker support and updated README.md 2023-10-15 04:31:48 +01:00			`if not args.no_display:`
			`cv2.imshow(f"Video{i}", frame_to_show)`
Simple object detection 2023-10-02 01:56:40 +01:00
			`# Hit 'q' on the keyboard to quit!`
			`if cv2.waitKey(1) & 0xFF == ord("q"):`
			`break`

			`# Release handle to the webcam`
			`print("Releasing video capture")`
			`video_capture.release()`
			`cv2.destroyAllWindows()`

Fixed scaling :tada: 2023-10-15 01:25:27 +01:00
Allow program to be run as a script 2023-10-14 21:46:42 +01:00			`if __name__ == "__main__":`
			`main()`