wyzely-detect/main.py

import datetime
import face_recognition
import cv2
import numpy as np
from dotenv import load_dotenv
import os
import json
import pathlib
import requests
import time


load_dotenv()
URL = os.getenv("URL")
RUN_SCALE = os.getenv("RUN_SCALE")
VIEW_SCALE = os.getenv("VIEW_SCALE")
DATETIME_FORMAT = "%Y-%m-%d %H:%M:%S"
# RUN_SCALE = 0.25
# VIEW_SCALE = 0.75
DISPLAY = False
RUN_BY_COMPOSE = os.getenv("RUN_BY_COMPOSE")
NTFY_URL = os.getenv("NTFY_URL")


def find_face_from_name(name):
    for face in config["faces"]:
        if config["faces"][face]["name"] == name:
            return face
    return None


def write_config():
    with open(config_path, "w") as config_file:
        json.dump(config, config_file, indent=4)


print("Hello, world!")

# Initialize some variables
face_locations = []
face_encodings = []
face_names = []
known_face_encodings = []
known_face_names = []
process_this_frame = True

# Load the config file, if it does not exist or is blank, create it
config = {
    # If RUN_BY_COMPOSE is true, set url to rtsp://wyze-bridge:8554/wyze_cam_name, otherwise set it to "rtsp://localhost:8554/wyze_cam_name"
    "URL": "rtsp://localhost:8554/wyze_cam_name"
    if not RUN_BY_COMPOSE
    else "rtsp://bridge:8554/wyze_cam_name",
    "run_scale": "0.25",
    "view_scale": "0.75",
    "faces": {
        "example1": {"image": "config/example1.jpg", "last_seen": ""},
        "example2": {"image": "config/example2.jpg", "last_seen": ""},
    },
    "ntfy_url": "https://ntfy.sh/example",
    "display": True,
}
config_path = pathlib.Path("config/config.json")
if config_path.exists():
    with open(config_path, "r") as config_file:
        config = json.load(config_file)
else:
    with open(config_path, "w") as config_file:
        json.dump(config, config_file, indent=4)
    print("Config file created, please edit it and restart the program")
    print("For relative paths, use the format config/example.jpg")
    exit()


if URL:
    config["URL"] = URL
else:
    URL = config["URL"]
if RUN_SCALE:
    config["RUN_SCALE"] = RUN_SCALE
else:
    RUN_SCALE = float(config["RUN_SCALE"])
if VIEW_SCALE:
    config["VIEW_SCALE"] = VIEW_SCALE
else:
    VIEW_SCALE = float(config["VIEW_SCALE"])
if DISPLAY:
    config["DISPLAY"] = DISPLAY
else:
    DISPLAY = config["display"]
if NTFY_URL:
    config["ntfy_url"] = NTFY_URL
else:
    NTFY_URL = config["ntfy_url"]
print(f"Current config: {config}")

for face in config["faces"]:
    # Load a sample picture and learn how to recognize it.
    image = face_recognition.load_image_file(config["faces"][face]["image"])
    face_encoding = face_recognition.face_encodings(image)[0]
    known_face_encodings.append(face_encoding)
    # Append the key to the list of known face names
    known_face_names.append(face)

video_capture = cv2.VideoCapture(URL)
# Eliminate lag by setting the buffer size to 1
# This makes it so that the video capture will only grab the most recent frame
# However, this means that the video may be choppy
video_capture.set(cv2.CAP_PROP_BUFFERSIZE, 1)

# Print the resolution of the video
print(
    f"Video resolution: {video_capture.get(cv2.CAP_PROP_FRAME_WIDTH)}x{video_capture.get(cv2.CAP_PROP_FRAME_HEIGHT)}"
)

print("Beginning video capture...")
while True:
    # Grab a single frame of video
    ret, frame = video_capture.read()
    # Only process every other frame of video to save time
    # Resize frame of video to a smaller size for faster face recognition processing
    run_frame = cv2.resize(frame, (0, 0), fx=RUN_SCALE, fy=RUN_SCALE)
    view_frame = cv2.resize(frame, (0, 0), fx=VIEW_SCALE, fy=VIEW_SCALE)
    # Convert the image from BGR color (which OpenCV uses) to RGB color (which face_recognition uses)
    rgb_run_frame = run_frame[:, :, ::-1]
    # Find all the faces and face encodings in the current frame of video
    # model cnn is gpu accelerated, but hog is cpu only
    face_locations = face_recognition.face_locations(
        rgb_run_frame, model="hog"
    )  # This crashes the program without output on my laptop when it's running without Docker compose
    face_encodings = face_recognition.face_encodings(rgb_run_frame, face_locations)
    face_names = []
    for face_encoding in face_encodings:
        # See if the face is a match for the known face(s)
        matches = face_recognition.compare_faces(known_face_encodings, face_encoding)
        name = "Unknown"
        # Or instead, use the known face with the smallest distance to the new face
        face_distances = face_recognition.face_distance(
            known_face_encodings, face_encoding
        )
        best_match_index = np.argmin(face_distances)
        if matches[best_match_index]:
            name = known_face_names[best_match_index]
            last_seen = config["faces"][name]["last_seen"]
            # If it's never been seen, set the last seen time to x+5 seconds ago so it will be seen
            # Kind of a hacky way to do it, but it works... hopefully
            if last_seen == "":
                print(f"{name} has been seen for the first time")
                config["faces"][name]["last_seen"] = (
                    datetime.datetime.now() - datetime.timedelta(seconds=15)
                ).strftime(DATETIME_FORMAT)
                write_config()
            # Check if the face has been seen in the last 5 seconds
            if datetime.datetime.now() - datetime.datetime.strptime(
                last_seen, DATETIME_FORMAT
            ) > datetime.timedelta(seconds=10):
                print(f"{name} has been seen")
                # Send a notification
                print(f"Sending notification to{NTFY_URL}")
                requests.post(
                    NTFY_URL,
                    data=f'"{name}" has been seen',
                    headers={
                        "Title": "Face Detected",
                        "Priority": "urgent",
                        "Tags": "neutral_face",
                    },
                )
            # Update the last seen time
            config["faces"][name]["last_seen"] = datetime.datetime.now().strftime(
                DATETIME_FORMAT
            )
            # print("Writing config...")
            write_config()
        face_names.append(name)
    # Display the results
    # Iterate over each face found in the frame to draw a box around it
    # Zip is used to iterate over two lists at the same time
    for (top, right, bottom, left), name in zip(face_locations, face_names):
        # print(f"Face found at {top}, {right}, {bottom}, {left} with name {name}")
        # Scale back up face locations since the frame we detected in was scaled to 1/4 size
        top = int(top * (VIEW_SCALE / RUN_SCALE))
        right = int(right * (VIEW_SCALE / RUN_SCALE))
        bottom = int(bottom * (VIEW_SCALE / RUN_SCALE))
        left = int(left * (VIEW_SCALE / RUN_SCALE))

        # Draw a box around the face
        cv2.rectangle(view_frame, (left, top), (right, bottom), (0, 0, 255), 2)

        # Draw a label with a name below the face
        cv2.rectangle(
            view_frame, (left, bottom - 35), (right, bottom), (0, 0, 255), cv2.FILLED
        )
        font = cv2.FONT_HERSHEY_DUPLEX
        cv2.putText(
            view_frame, name, (left + 6, bottom - 6), font, 1.0, (255, 255, 255), 1
        )

    # Display the resulting image if DISPLAY is set to true
    if config["display"]:
        cv2.imshow("Scaled View", view_frame)

    # Hit 'q' on the keyboard to quit!
    if cv2.waitKey(1) & 0xFF == ord("q"):
        break

# Release handle to the webcam
print("Releasing video capture")
video_capture.release()
cv2.destroyAllWindows()
Initial commit 2022-12-17 21:54:47 +00:00			`import datetime`
			`import face_recognition`
			`import cv2`
			`import numpy as np`
			`from dotenv import load_dotenv`
			`import os`
			`import json`
			`import pathlib`
Made some more progress on Docker Compose 2022-12-18 04:26:08 +00:00			`import requests`
			`import time`
Initial commit 2022-12-17 21:54:47 +00:00

			`load_dotenv()`
			`URL = os.getenv("URL")`
			`RUN_SCALE = os.getenv("RUN_SCALE")`
			`VIEW_SCALE = os.getenv("VIEW_SCALE")`
			`DATETIME_FORMAT = "%Y-%m-%d %H:%M:%S"`
			`# RUN_SCALE = 0.25`
			`# VIEW_SCALE = 0.75`
Made displaying video optional 2022-12-17 22:09:39 +00:00			`DISPLAY = False`
Worked on Docker Compose 2022-12-18 03:55:17 +00:00			`RUN_BY_COMPOSE = os.getenv("RUN_BY_COMPOSE")`
Added support for `ntfy.sh` 2022-12-18 19:07:11 +00:00			`NTFY_URL = os.getenv("NTFY_URL")`
Initial commit 2022-12-17 21:54:47 +00:00

			`def find_face_from_name(name):`
			`for face in config["faces"]:`
			`if config["faces"][face]["name"] == name:`
			`return face`
			`return None`


			`def write_config():`
			`with open(config_path, "w") as config_file:`
			`json.dump(config, config_file, indent=4)`


Made some more progress Commiting to update the current Docker image on ghcr 2022-12-18 18:14:31 +00:00			`print("Hello, world!")`

Initial commit 2022-12-17 21:54:47 +00:00			`# Initialize some variables`
			`face_locations = []`
			`face_encodings = []`
			`face_names = []`
			`known_face_encodings = []`
			`known_face_names = []`
			`process_this_frame = True`

			`# Load the config file, if it does not exist or is blank, create it`
			`config = {`
Worked on Docker Compose 2022-12-18 03:55:17 +00:00			`# If RUN_BY_COMPOSE is true, set url to rtsp://wyze-bridge:8554/wyze_cam_name, otherwise set it to "rtsp://localhost:8554/wyze_cam_name"`
Added support for `ntfy.sh` 2022-12-18 19:07:11 +00:00			`"URL": "rtsp://localhost:8554/wyze_cam_name"`
			`if not RUN_BY_COMPOSE`
			`else "rtsp://bridge:8554/wyze_cam_name",`
Made displaying video optional 2022-12-17 22:09:39 +00:00			`"run_scale": "0.25",`
			`"view_scale": "0.75",`
Initial commit 2022-12-17 21:54:47 +00:00			`"faces": {`
Use `config/` for images + config.json 2022-12-18 00:19:10 +00:00			`"example1": {"image": "config/example1.jpg", "last_seen": ""},`
			`"example2": {"image": "config/example2.jpg", "last_seen": ""},`
Initial commit 2022-12-17 21:54:47 +00:00			`},`
Added support for `ntfy.sh` 2022-12-18 19:07:11 +00:00			`"ntfy_url": "https://ntfy.sh/example",`
			`"display": True,`
Initial commit 2022-12-17 21:54:47 +00:00			`}`
Use `config/` for images + config.json 2022-12-18 00:19:10 +00:00			`config_path = pathlib.Path("config/config.json")`
Initial commit 2022-12-17 21:54:47 +00:00			`if config_path.exists():`
			`with open(config_path, "r") as config_file:`
			`config = json.load(config_file)`
			`else:`
			`with open(config_path, "w") as config_file:`
			`json.dump(config, config_file, indent=4)`
			`print("Config file created, please edit it and restart the program")`
Use `config/` for images + config.json 2022-12-18 00:19:10 +00:00			`print("For relative paths, use the format config/example.jpg")`
Initial commit 2022-12-17 21:54:47 +00:00			`exit()`


			`if URL:`
			`config["URL"] = URL`
			`else:`
			`URL = config["URL"]`
			`if RUN_SCALE:`
			`config["RUN_SCALE"] = RUN_SCALE`
			`else:`
			`RUN_SCALE = float(config["RUN_SCALE"])`
			`if VIEW_SCALE:`
			`config["VIEW_SCALE"] = VIEW_SCALE`
			`else:`
			`VIEW_SCALE = float(config["VIEW_SCALE"])`
Made displaying video optional 2022-12-17 22:09:39 +00:00			`if DISPLAY:`
			`config["DISPLAY"] = DISPLAY`
			`else:`
			`DISPLAY = config["display"]`
Added support for `ntfy.sh` 2022-12-18 19:07:11 +00:00			`if NTFY_URL:`
			`config["ntfy_url"] = NTFY_URL`
			`else:`
			`NTFY_URL = config["ntfy_url"]`
Made displaying video optional 2022-12-17 22:09:39 +00:00			`print(f"Current config: {config}")`
Initial commit 2022-12-17 21:54:47 +00:00
			`for face in config["faces"]:`
			`# Load a sample picture and learn how to recognize it.`
			`image = face_recognition.load_image_file(config["faces"][face]["image"])`
			`face_encoding = face_recognition.face_encodings(image)[0]`
			`known_face_encodings.append(face_encoding)`
			`# Append the key to the list of known face names`
			`known_face_names.append(face)`

			`video_capture = cv2.VideoCapture(URL)`
			`# Eliminate lag by setting the buffer size to 1`
			`# This makes it so that the video capture will only grab the most recent frame`
			`# However, this means that the video may be choppy`
			`video_capture.set(cv2.CAP_PROP_BUFFERSIZE, 1)`

Made some more progress on Docker Compose 2022-12-18 04:26:08 +00:00			`# Print the resolution of the video`
Added support for `ntfy.sh` 2022-12-18 19:07:11 +00:00			`print(`
			`f"Video resolution: {video_capture.get(cv2.CAP_PROP_FRAME_WIDTH)}x{video_capture.get(cv2.CAP_PROP_FRAME_HEIGHT)}"`
			`)`
Made some more progress on Docker Compose 2022-12-18 04:26:08 +00:00
Added support for `ntfy.sh` 2022-12-18 19:07:11 +00:00			`print("Beginning video capture...")`
Initial commit 2022-12-17 21:54:47 +00:00			`while True:`
			`# Grab a single frame of video`
			`ret, frame = video_capture.read()`
			`# Only process every other frame of video to save time`
Added support for `ntfy.sh` 2022-12-18 19:07:11 +00:00			`# Resize frame of video to a smaller size for faster face recognition processing`
			`run_frame = cv2.resize(frame, (0, 0), fx=RUN_SCALE, fy=RUN_SCALE)`
			`view_frame = cv2.resize(frame, (0, 0), fx=VIEW_SCALE, fy=VIEW_SCALE)`
			`# Convert the image from BGR color (which OpenCV uses) to RGB color (which face_recognition uses)`
			`rgb_run_frame = run_frame[:, :, ::-1]`
			`# Find all the faces and face encodings in the current frame of video`
			`# model cnn is gpu accelerated, but hog is cpu only`
Fixed rapid notifications 2022-12-18 19:44:42 +00:00			`face_locations = face_recognition.face_locations(`
			`rgb_run_frame, model="hog"`
			`) # This crashes the program without output on my laptop when it's running without Docker compose`
Added support for `ntfy.sh` 2022-12-18 19:07:11 +00:00			`face_encodings = face_recognition.face_encodings(rgb_run_frame, face_locations)`
			`face_names = []`
			`for face_encoding in face_encodings:`
			`# See if the face is a match for the known face(s)`
			`matches = face_recognition.compare_faces(known_face_encodings, face_encoding)`
			`name = "Unknown"`
			`# Or instead, use the known face with the smallest distance to the new face`
			`face_distances = face_recognition.face_distance(`
			`known_face_encodings, face_encoding`
			`)`
			`best_match_index = np.argmin(face_distances)`
			`if matches[best_match_index]:`
			`name = known_face_names[best_match_index]`
			`last_seen = config["faces"][name]["last_seen"]`
			`# If it's never been seen, set the last seen time to x+5 seconds ago so it will be seen`
			`# Kind of a hacky way to do it, but it works... hopefully`
			`if last_seen == "":`
Fixed rapid notifications 2022-12-18 19:44:42 +00:00			`print(f"{name} has been seen for the first time")`
Added support for `ntfy.sh` 2022-12-18 19:07:11 +00:00			`config["faces"][name]["last_seen"] = (`
			`datetime.datetime.now() - datetime.timedelta(seconds=15)`
			`).strftime(DATETIME_FORMAT)`
			`write_config()`
			`# Check if the face has been seen in the last 5 seconds`
			`if datetime.datetime.now() - datetime.datetime.strptime(`
			`last_seen, DATETIME_FORMAT`
			`) > datetime.timedelta(seconds=10):`
			`print(f"{name} has been seen")`
Fixed rapid notifications 2022-12-18 19:44:42 +00:00			`# Send a notification`
			`print(f"Sending notification to{NTFY_URL}")`
			`requests.post(`
			`NTFY_URL,`
			`data=f'"{name}" has been seen',`
			`headers={`
			`"Title": "Face Detected",`
			`"Priority": "urgent",`
			`"Tags": "neutral_face",`
			`},`
			`)`
Added support for `ntfy.sh` 2022-12-18 19:07:11 +00:00			`# Update the last seen time`
			`config["faces"][name]["last_seen"] = datetime.datetime.now().strftime(`
			`DATETIME_FORMAT`
Initial commit 2022-12-17 21:54:47 +00:00			`)`
Don't keep printing `writing configuration` A better solution would be to store it in memory (config with last seen) And every x seconds, write it 2022-12-18 19:55:52 +00:00			`# print("Writing config...")`
Added support for `ntfy.sh` 2022-12-18 19:07:11 +00:00			`write_config()`
			`face_names.append(name)`
Initial commit 2022-12-17 21:54:47 +00:00			`# Display the results`
			`# Iterate over each face found in the frame to draw a box around it`
			`# Zip is used to iterate over two lists at the same time`
			`for (top, right, bottom, left), name in zip(face_locations, face_names):`
Removed `face found at ...` notice It was originally for debugging 2022-12-18 19:15:43 +00:00			`# print(f"Face found at {top}, {right}, {bottom}, {left} with name {name}")`
Initial commit 2022-12-17 21:54:47 +00:00			`# Scale back up face locations since the frame we detected in was scaled to 1/4 size`
			`top = int(top * (VIEW_SCALE / RUN_SCALE))`
			`right = int(right * (VIEW_SCALE / RUN_SCALE))`
			`bottom = int(bottom * (VIEW_SCALE / RUN_SCALE))`
			`left = int(left * (VIEW_SCALE / RUN_SCALE))`

			`# Draw a box around the face`
			`cv2.rectangle(view_frame, (left, top), (right, bottom), (0, 0, 255), 2)`

			`# Draw a label with a name below the face`
			`cv2.rectangle(`
			`view_frame, (left, bottom - 35), (right, bottom), (0, 0, 255), cv2.FILLED`
			`)`
			`font = cv2.FONT_HERSHEY_DUPLEX`
			`cv2.putText(`
			`view_frame, name, (left + 6, bottom - 6), font, 1.0, (255, 255, 255), 1`
			`)`

Made displaying video optional 2022-12-17 22:09:39 +00:00			`# Display the resulting image if DISPLAY is set to true`
Worked on Docker Compose 2022-12-18 03:55:17 +00:00			`if config["display"]:`
Made displaying video optional 2022-12-17 22:09:39 +00:00			`cv2.imshow("Scaled View", view_frame)`
Initial commit 2022-12-17 21:54:47 +00:00
			`# Hit 'q' on the keyboard to quit!`
			`if cv2.waitKey(1) & 0xFF == ord("q"):`
			`break`

			`# Release handle to the webcam`
Added support for `ntfy.sh` 2022-12-18 19:07:11 +00:00			`print("Releasing video capture")`
Initial commit 2022-12-17 21:54:47 +00:00			`video_capture.release()`
			`cv2.destroyAllWindows()`