scripts/run_detection.py

# Copyright 2025 Yakhyokhuja Valikhujaev
# Author: Yakhyokhuja Valikhujaev
# GitHub: https://github.com/yakhyo

"""Face detection on image or webcam.

Usage:
    python run_detection.py --image path/to/image.jpg
    python run_detection.py --webcam
"""

from __future__ import annotations

import argparse
import os

import cv2

from uniface.detection import SCRFD, RetinaFace, YOLOv5Face
from uniface.visualization import draw_detections


def process_image(detector, image_path: str, threshold: float = 0.6, save_dir: str = 'outputs') -> None:
    """Detect faces in one image file and save the annotated result.

    The output is written to ``<save_dir>/<input stem>_out.jpg``. The image is
    saved even when no faces are found (in that case nothing is drawn on it).

    Args:
        detector: Object exposing ``detect(image)`` that returns a sequence of
            face objects with ``bbox``, ``confidence`` and ``landmarks``
            attributes.
        image_path: Path of the image to read with ``cv2.imread``.
        threshold: Forwarded to ``draw_detections`` as ``vis_threshold``.
        save_dir: Directory for the output file; created if it does not exist.

    Returns:
        None. Load and save failures are reported on stdout instead of raising.
    """
    image = cv2.imread(image_path)
    # cv2.imread signals an unreadable/missing file by returning None.
    if image is None:
        print(f"Error: Failed to load image from '{image_path}'")
        return

    faces = detector.detect(image)

    if faces:
        bboxes = [face.bbox for face in faces]
        scores = [face.confidence for face in faces]
        landmarks = [face.landmarks for face in faces]
        # NOTE(review): the return value is unused, so draw_detections is
        # presumably drawing onto `image` in place -- confirm in uniface.
        draw_detections(image, bboxes, scores, landmarks, vis_threshold=threshold)

    os.makedirs(save_dir, exist_ok=True)
    stem = os.path.splitext(os.path.basename(image_path))[0]
    output_path = os.path.join(save_dir, f'{stem}_out.jpg')

    # cv2.imwrite reports failure through its boolean result; do not claim
    # success unless the file was actually written.
    if not cv2.imwrite(output_path, image):
        print(f"Error: Failed to save output to '{output_path}'")
        return
    print(f'Output saved: {output_path}')


def run_webcam(detector, threshold: float = 0.6) -> None:
    """Run face detection on the default webcam and show the annotated feed.

    Frames are mirrored horizontally, annotated with the detections and a
    face counter, and displayed in a window titled 'Face Detection'. The loop
    ends when 'q' is pressed or when a frame cannot be read.

    Args:
        detector: Object exposing ``detect(frame)`` that returns a sequence of
            face objects with ``bbox``, ``confidence`` and ``landmarks``
            attributes.
        threshold: Forwarded to ``draw_detections`` as ``vis_threshold``.
    """
    cap = cv2.VideoCapture(0)  # 0 = default webcam
    if not cap.isOpened():
        print('Cannot open webcam')
        return

    print("Press 'q' to quit")

    try:
        while True:
            ret, frame = cap.read()
            # Check the read result BEFORE touching the frame: on failure the
            # frame is not a valid image and cv2.flip would raise.
            if not ret:
                break
            frame = cv2.flip(frame, 1)  # mirror for natural interaction

            faces = detector.detect(frame)

            # unpack face data for visualization
            bboxes = [f.bbox for f in faces]
            scores = [f.confidence for f in faces]
            landmarks = [f.landmarks for f in faces]
            draw_detections(
                image=frame,
                bboxes=bboxes,
                scores=scores,
                landmarks=landmarks,
                vis_threshold=threshold,
                draw_score=True,
                fancy_bbox=True,
            )

            cv2.putText(
                frame,
                f'Faces: {len(faces)}',
                (10, 30),
                cv2.FONT_HERSHEY_SIMPLEX,
                1,
                (0, 255, 0),
                2,
            )
            cv2.imshow('Face Detection', frame)

            # waitKey also pumps the GUI event loop; mask to the low byte
            # before comparing against the key code.
            if cv2.waitKey(1) & 0xFF == ord('q'):
                break
    finally:
        # Always free the camera and close the window, even if detection or
        # drawing raised part-way through the loop.
        cap.release()
        cv2.destroyAllWindows()


def main():
    """Parse command-line options, build the chosen detector and run it.

    Exits through ``parser.error`` when neither ``--image`` nor ``--webcam``
    is supplied. When both are supplied, the webcam mode takes precedence.
    """
    parser = argparse.ArgumentParser(description='Run face detection')
    parser.add_argument('--image', type=str, help='Path to input image')
    parser.add_argument('--webcam', action='store_true', help='Use webcam')
    parser.add_argument(
        '--method',
        type=str,
        default='retinaface',
        choices=['retinaface', 'scrfd', 'yolov5face'],
    )
    parser.add_argument('--threshold', type=float, default=0.25, help='Visualization threshold')
    parser.add_argument('--save_dir', type=str, default='outputs')
    args = parser.parse_args()

    # At least one input source is required.
    if not (args.image or args.webcam):
        parser.error('Either --image or --webcam must be specified')

    def _make_yolov5face():
        # Imported lazily so the weights enum is only loaded for this method.
        from uniface.constants import YOLOv5FaceWeights

        return YOLOv5Face(model_name=YOLOv5FaceWeights.YOLOV5M)

    # `choices` restricts --method to three values, so anything that is not
    # retinaface/scrfd falls through to the YOLOv5 factory.
    factories = {'retinaface': RetinaFace, 'scrfd': SCRFD}
    detector = factories.get(args.method, _make_yolov5face)()

    if args.webcam:
        run_webcam(detector, args.threshold)
        return
    process_image(detector, args.image, args.threshold, args.save_dir)


if __name__ == '__main__':
    main()
refactor: Standardize naming conventions (#47) * refactor: Standardize naming conventions * chore: Update the version and re-run experiments * chore: Improve code quality tooling and documentation - Add pre-commit job to CI workflow for automated linting on PRs - Update uniface/__init__.py with copyright header, module docstring, and logically grouped exports - Revise CONTRIBUTING.md to reflect pre-commit handles all formatting - Remove redundant ruff check from CI (now handled by pre-commit) - Update build job Python version to 3.11 (matches requires-python) 2025-12-30 00:20:34 +09:00			`# Copyright 2025 Yakhyokhuja Valikhujaev`
			`# Author: Yakhyokhuja Valikhujaev`
			`# GitHub: https://github.com/yakhyo`

			`"""Face detection on image or webcam.`

			`Usage:`
			`python run_detection.py --image path/to/image.jpg`
			`python run_detection.py --webcam`
			`"""`

			`from __future__ import annotations`
ref: Update some refactoring files for testing 2025-11-25 23:19:45 +09:00
			`import argparse`
feat: Add model name signature and several more updates 2025-03-26 11:55:56 +09:00			`import os`
ref: Update some refactoring files for testing 2025-11-25 23:19:45 +09:00
feat: Add model name signature and several more updates 2025-03-26 11:55:56 +09:00			`import cv2`

feat: Add YOLOv5 face detection support (#26) * feat: Add YOLOv5 face detection model * docs: Update docs, add new model information * feat: Add YOLOv5 face detection model * test: Add testing and running 2025-12-03 23:35:56 +09:00			`from uniface.detection import SCRFD, RetinaFace, YOLOv5Face`
feat: Update recognition, landmark modules 2025-07-02 18:52:28 +09:00			`from uniface.visualization import draw_detections`
feat: Add model name signature and several more updates 2025-03-26 11:55:56 +09:00

feat: Enhace emotion inference speed on ARM and add FaceAnalyzer, Face classes for ease of use. (#25) * feat: Update linting and type annotations, return types in detect * feat: add face analyzer and face classes * chore: Update the format and clean up some docstrings * docs: Update usage documentation * feat: Change AgeGender model output to 0, 1 instead of string (Female, Male) * test: Update testing code * feat: Add Apple silicon backend for torchscript inference * feat: Add face analyzer example and add run emotion for testing 2025-11-30 20:32:07 +09:00			`def process_image(detector, image_path: str, threshold: float = 0.6, save_dir: str = 'outputs'):`
feat: Add model name signature and several more updates 2025-03-26 11:55:56 +09:00			`image = cv2.imread(image_path)`
			`if image is None:`
ref: Add comprehensive test suite and enhance model functionality - Add new test files for age_gender, factory, landmark, recognition, scrfd, and utils - Add new scripts for age_gender, landmarks, and video detection - Update documentation in README.md, MODELS.md, QUICKSTART.md - Improve model constants and face utilities - Update detection models (retinaface, scrfd) with enhanced functionality - Update project configuration in pyproject.toml 2025-11-15 21:09:37 +09:00			`print(f"Error: Failed to load image from '{image_path}'")`
feat: Add model name signature and several more updates 2025-03-26 11:55:56 +09:00			`return`

feat: Update recognition, landmark modules 2025-07-02 18:52:28 +09:00			`faces = detector.detect(image)`
improve logging system with verbose flag - silent by default (only warnings/errors) - add --verbose flag to all scripts - add enable_logging() function for library users - cleaner output for end users 2025-11-08 01:15:25 +09:00
feat: Update recognition, landmark modules 2025-07-02 18:52:28 +09:00			`if faces:`
refactor: Standardize naming conventions (#47) * refactor: Standardize naming conventions * chore: Update the version and re-run experiments * chore: Improve code quality tooling and documentation - Add pre-commit job to CI workflow for automated linting on PRs - Update uniface/__init__.py with copyright header, module docstring, and logically grouped exports - Revise CONTRIBUTING.md to reflect pre-commit handles all formatting - Remove redundant ruff check from CI (now handled by pre-commit) - Update build job Python version to 3.11 (matches requires-python) 2025-12-30 00:20:34 +09:00			`bboxes = [face.bbox for face in faces]`
			`scores = [face.confidence for face in faces]`
			`landmarks = [face.landmarks for face in faces]`
ref: Update some refactoring files for testing 2025-11-25 23:19:45 +09:00			`draw_detections(image, bboxes, scores, landmarks, vis_threshold=threshold)`
feat: Add model name signature and several more updates 2025-03-26 11:55:56 +09:00
			`os.makedirs(save_dir, exist_ok=True)`
feat: Enhace emotion inference speed on ARM and add FaceAnalyzer, Face classes for ease of use. (#25) * feat: Update linting and type annotations, return types in detect * feat: add face analyzer and face classes * chore: Update the format and clean up some docstrings * docs: Update usage documentation * feat: Change AgeGender model output to 0, 1 instead of string (Female, Male) * test: Update testing code * feat: Add Apple silicon backend for torchscript inference * feat: Add face analyzer example and add run emotion for testing 2025-11-30 20:32:07 +09:00			`output_path = os.path.join(save_dir, f'{os.path.splitext(os.path.basename(image_path))[0]}_out.jpg')`
feat: Add model name signature and several more updates 2025-03-26 11:55:56 +09:00			`cv2.imwrite(output_path, image)`
feat: Enhace emotion inference speed on ARM and add FaceAnalyzer, Face classes for ease of use. (#25) * feat: Update linting and type annotations, return types in detect * feat: add face analyzer and face classes * chore: Update the format and clean up some docstrings * docs: Update usage documentation * feat: Change AgeGender model output to 0, 1 instead of string (Female, Male) * test: Update testing code * feat: Add Apple silicon backend for torchscript inference * feat: Add face analyzer example and add run emotion for testing 2025-11-30 20:32:07 +09:00			`print(f'Output saved: {output_path}')`
feat: Add model name signature and several more updates 2025-03-26 11:55:56 +09:00

ref: Update some refactoring files for testing 2025-11-25 23:19:45 +09:00			`def run_webcam(detector, threshold: float = 0.6):`
			`cap = cv2.VideoCapture(0) # 0 = default webcam`
			`if not cap.isOpened():`
feat: Enhace emotion inference speed on ARM and add FaceAnalyzer, Face classes for ease of use. (#25) * feat: Update linting and type annotations, return types in detect * feat: add face analyzer and face classes * chore: Update the format and clean up some docstrings * docs: Update usage documentation * feat: Change AgeGender model output to 0, 1 instead of string (Female, Male) * test: Update testing code * feat: Add Apple silicon backend for torchscript inference * feat: Add face analyzer example and add run emotion for testing 2025-11-30 20:32:07 +09:00			`print('Cannot open webcam')`
ref: Update some refactoring files for testing 2025-11-25 23:19:45 +09:00			`return`

			`print("Press 'q' to quit")`
feat: Add model name signature and several more updates 2025-03-26 11:55:56 +09:00
ref: Update some refactoring files for testing 2025-11-25 23:19:45 +09:00			`while True:`
			`ret, frame = cap.read()`
			`frame = cv2.flip(frame, 1) # mirror for natural interaction`
			`if not ret:`
			`break`

			`faces = detector.detect(frame)`

			`# unpack face data for visualization`
refactor: Standardize naming conventions (#47) * refactor: Standardize naming conventions * chore: Update the version and re-run experiments * chore: Improve code quality tooling and documentation - Add pre-commit job to CI workflow for automated linting on PRs - Update uniface/__init__.py with copyright header, module docstring, and logically grouped exports - Revise CONTRIBUTING.md to reflect pre-commit handles all formatting - Remove redundant ruff check from CI (now handled by pre-commit) - Update build job Python version to 3.11 (matches requires-python) 2025-12-30 00:20:34 +09:00			`bboxes = [f.bbox for f in faces]`
			`scores = [f.confidence for f in faces]`
			`landmarks = [f.landmarks for f in faces]`
feat: Add yolov5n, update docs and ruff code format 2025-12-11 01:02:18 +09:00			`draw_detections(`
			`image=frame,`
			`bboxes=bboxes,`
			`scores=scores,`
			`landmarks=landmarks,`
			`vis_threshold=threshold,`
			`draw_score=True,`
			`fancy_bbox=True,`
			`)`
ref: Update some refactoring files for testing 2025-11-25 23:19:45 +09:00
chore: Code style formatting changes 2025-11-26 00:05:24 +09:00			`cv2.putText(`
			`frame,`
feat: Enhace emotion inference speed on ARM and add FaceAnalyzer, Face classes for ease of use. (#25) * feat: Update linting and type annotations, return types in detect * feat: add face analyzer and face classes * chore: Update the format and clean up some docstrings * docs: Update usage documentation * feat: Change AgeGender model output to 0, 1 instead of string (Female, Male) * test: Update testing code * feat: Add Apple silicon backend for torchscript inference * feat: Add face analyzer example and add run emotion for testing 2025-11-30 20:32:07 +09:00			`f'Faces: {len(faces)}',`
chore: Code style formatting changes 2025-11-26 00:05:24 +09:00			`(10, 30),`
			`cv2.FONT_HERSHEY_SIMPLEX,`
			`1,`
			`(0, 255, 0),`
			`2,`
			`)`
feat: Enhace emotion inference speed on ARM and add FaceAnalyzer, Face classes for ease of use. (#25) * feat: Update linting and type annotations, return types in detect * feat: add face analyzer and face classes * chore: Update the format and clean up some docstrings * docs: Update usage documentation * feat: Change AgeGender model output to 0, 1 instead of string (Female, Male) * test: Update testing code * feat: Add Apple silicon backend for torchscript inference * feat: Add face analyzer example and add run emotion for testing 2025-11-30 20:32:07 +09:00			`cv2.imshow('Face Detection', frame)`
ref: Update some refactoring files for testing 2025-11-25 23:19:45 +09:00
feat: Enhace emotion inference speed on ARM and add FaceAnalyzer, Face classes for ease of use. (#25) * feat: Update linting and type annotations, return types in detect * feat: add face analyzer and face classes * chore: Update the format and clean up some docstrings * docs: Update usage documentation * feat: Change AgeGender model output to 0, 1 instead of string (Female, Male) * test: Update testing code * feat: Add Apple silicon backend for torchscript inference * feat: Add face analyzer example and add run emotion for testing 2025-11-30 20:32:07 +09:00			`if cv2.waitKey(1) & 0xFF == ord('q'):`
ref: Update some refactoring files for testing 2025-11-25 23:19:45 +09:00			`break`

			`cap.release()`
			`cv2.destroyAllWindows()`


			`def main():`
feat: Enhace emotion inference speed on ARM and add FaceAnalyzer, Face classes for ease of use. (#25) * feat: Update linting and type annotations, return types in detect * feat: add face analyzer and face classes * chore: Update the format and clean up some docstrings * docs: Update usage documentation * feat: Change AgeGender model output to 0, 1 instead of string (Female, Male) * test: Update testing code * feat: Add Apple silicon backend for torchscript inference * feat: Add face analyzer example and add run emotion for testing 2025-11-30 20:32:07 +09:00			`parser = argparse.ArgumentParser(description='Run face detection')`
			`parser.add_argument('--image', type=str, help='Path to input image')`
			`parser.add_argument('--webcam', action='store_true', help='Use webcam')`
feat: Add YOLOv5 face detection support (#26) * feat: Add YOLOv5 face detection model * docs: Update docs, add new model information * feat: Add YOLOv5 face detection model * test: Add testing and running 2025-12-03 23:35:56 +09:00			`parser.add_argument('--method', type=str, default='retinaface', choices=['retinaface', 'scrfd', 'yolov5face'])`
			`parser.add_argument('--threshold', type=float, default=0.25, help='Visualization threshold')`
feat: Enhace emotion inference speed on ARM and add FaceAnalyzer, Face classes for ease of use. (#25) * feat: Update linting and type annotations, return types in detect * feat: add face analyzer and face classes * chore: Update the format and clean up some docstrings * docs: Update usage documentation * feat: Change AgeGender model output to 0, 1 instead of string (Female, Male) * test: Update testing code * feat: Add Apple silicon backend for torchscript inference * feat: Add face analyzer example and add run emotion for testing 2025-11-30 20:32:07 +09:00			`parser.add_argument('--save_dir', type=str, default='outputs')`
feat: Add model name signature and several more updates 2025-03-26 11:55:56 +09:00			`args = parser.parse_args()`

ref: Update some refactoring files for testing 2025-11-25 23:19:45 +09:00			`if not args.image and not args.webcam:`
feat: Enhace emotion inference speed on ARM and add FaceAnalyzer, Face classes for ease of use. (#25) * feat: Update linting and type annotations, return types in detect * feat: add face analyzer and face classes * chore: Update the format and clean up some docstrings * docs: Update usage documentation * feat: Change AgeGender model output to 0, 1 instead of string (Female, Male) * test: Update testing code * feat: Add Apple silicon backend for torchscript inference * feat: Add face analyzer example and add run emotion for testing 2025-11-30 20:32:07 +09:00			`parser.error('Either --image or --webcam must be specified')`
ref: Update some refactoring files for testing 2025-11-25 23:19:45 +09:00
feat: Add YOLOv5 face detection support (#26) * feat: Add YOLOv5 face detection model * docs: Update docs, add new model information * feat: Add YOLOv5 face detection model * test: Add testing and running 2025-12-03 23:35:56 +09:00			`if args.method == 'retinaface':`
			`detector = RetinaFace()`
			`elif args.method == 'scrfd':`
			`detector = SCRFD()`
			`else:`
			`from uniface.constants import YOLOv5FaceWeights`
feat: Update examples and some minor changes to UniFace API (#28) * chore: Style changes and create jupyter notebook template * docs: Update docstring for detection * feat: Keyword only for common parameters: model_name, conf_thresh, nms_thresh, input_size * chore: Update drawing and let the conf text optional for drawing * feat: add fancy bbox draw * docs: Add examples of using UniFace * feat: Add version to all examples 2025-12-07 19:51:08 +09:00
feat: Add 2D Gaze estimation models (#34) * feat: Add Gaze Estimation, update docs and Add example notebook, inference code * docs: Update README.md 2025-12-14 14:07:46 +09:00			`detector = YOLOv5Face(model_name=YOLOv5FaceWeights.YOLOV5M)`
improve logging system with verbose flag - silent by default (only warnings/errors) - add --verbose flag to all scripts - add enable_logging() function for library users - cleaner output for end users 2025-11-08 01:15:25 +09:00
ref: Update some refactoring files for testing 2025-11-25 23:19:45 +09:00			`if args.webcam:`
			`run_webcam(detector, args.threshold)`
ref: Add comprehensive test suite and enhance model functionality - Add new test files for age_gender, factory, landmark, recognition, scrfd, and utils - Add new scripts for age_gender, landmarks, and video detection - Update documentation in README.md, MODELS.md, QUICKSTART.md - Improve model constants and face utilities - Update detection models (retinaface, scrfd) with enhanced functionality - Update project configuration in pyproject.toml 2025-11-15 21:09:37 +09:00			`else:`
ref: Update some refactoring files for testing 2025-11-25 23:19:45 +09:00			`process_image(detector, args.image, args.threshold, args.save_dir)`
feat: Add model name signature and several more updates 2025-03-26 11:55:56 +09:00

feat: Enhace emotion inference speed on ARM and add FaceAnalyzer, Face classes for ease of use. (#25) * feat: Update linting and type annotations, return types in detect * feat: add face analyzer and face classes * chore: Update the format and clean up some docstrings * docs: Update usage documentation * feat: Change AgeGender model output to 0, 1 instead of string (Female, Male) * test: Update testing code * feat: Add Apple silicon backend for torchscript inference * feat: Add face analyzer example and add run emotion for testing 2025-11-30 20:32:07 +09:00			`if __name__ == '__main__':`
feat: Add model name signature and several more updates 2025-03-26 11:55:56 +09:00			`main()`