# scripts/run_video_detection.py

# Face detection on video files
# Usage: python run_video_detection.py --input video.mp4 --output output.mp4

import argparse
from pathlib import Path

import cv2
from tqdm import tqdm

from uniface import SCRFD, RetinaFace
from uniface.visualization import draw_detections


def process_video(
    detector,
    input_path: str,
    output_path: str,
    threshold: float = 0.6,
    show_preview: bool = False,
):
    """Run face detection on each frame of a video and write an annotated copy.

    Args:
        detector: Object exposing ``detect(frame)``. Each returned item is
            indexed with the ``'bbox'``, ``'confidence'`` and ``'landmarks'`` keys.
        input_path: Path of the video to read.
        output_path: Path of the annotated video to write (``mp4v`` codec).
        threshold: Forwarded to ``draw_detections`` as ``vis_threshold``.
        show_preview: When true, display each annotated frame in a window;
            pressing ``q`` stops processing early.

    Returns:
        None. Failure to open the input or to create the output is reported
        with a printed message and an early return.
    """
    cap = cv2.VideoCapture(input_path)
    if not cap.isOpened():
        print(f"Error: Cannot open video file '{input_path}'")
        return

    out = None
    frame_count = 0
    total_faces = 0

    # try/finally so the capture, the writer and any preview window are
    # released even when detection or drawing raises mid-video.
    try:
        # get video properties
        total_frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
        fps = cap.get(cv2.CAP_PROP_FPS)
        width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
        height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))

        print(f'Input: {input_path} ({width}x{height}, {fps:.1f} fps, {total_frames} frames)')
        print(f'Output: {output_path}')

        fourcc = cv2.VideoWriter_fourcc(*'mp4v')  # codec for .mp4
        out = cv2.VideoWriter(output_path, fourcc, fps, (width, height))

        if not out.isOpened():
            print(f"Error: Cannot create output video '{output_path}'")
            return

        # The reported frame count is container metadata and may be missing
        # (<= 0) or inaccurate, so it only sizes the progress bar; the loop
        # itself runs until the capture stops returning frames.
        progress_total = total_frames if total_frames > 0 else None
        with tqdm(total=progress_total, desc='Processing', unit='frames') as progress:
            while True:
                ret, frame = cap.read()
                if not ret:
                    break

                frame_count += 1
                faces = detector.detect(frame)
                total_faces += len(faces)

                bboxes = [f['bbox'] for f in faces]
                scores = [f['confidence'] for f in faces]
                landmarks = [f['landmarks'] for f in faces]
                # Return value is unused and the same frame is written below,
                # so this presumably draws onto ``frame`` in place.
                draw_detections(
                    image=frame,
                    bboxes=bboxes,
                    scores=scores,
                    landmarks=landmarks,
                    vis_threshold=threshold,
                    fancy_bbox=True,
                )

                cv2.putText(
                    frame,
                    f'Faces: {len(faces)}',
                    (10, 30),
                    cv2.FONT_HERSHEY_SIMPLEX,
                    1,
                    (0, 255, 0),
                    2,
                )
                out.write(frame)
                progress.update(1)

                if show_preview:
                    cv2.imshow("Processing - Press 'q' to cancel", frame)
                    if cv2.waitKey(1) & 0xFF == ord('q'):
                        print('\nCancelled by user')
                        break
    finally:
        cap.release()
        if out is not None:
            out.release()
        if show_preview:
            cv2.destroyAllWindows()

    avg_faces = total_faces / frame_count if frame_count > 0 else 0
    print(f'\nDone! {frame_count} frames, {total_faces} faces ({avg_faces:.1f} avg/frame)')
    print(f'Saved: {output_path}')


def main():
    """Parse command-line arguments and run face detection on the input video.

    Raises:
        SystemExit: With status 1 when the input path does not exist, so that
            shell callers can detect the failure. argparse raises it as well
            for invalid or missing arguments.
    """
    parser = argparse.ArgumentParser(description='Process video with face detection')
    parser.add_argument('--input', type=str, required=True, help='Input video path')
    parser.add_argument('--output', type=str, required=True, help='Output video path')
    parser.add_argument(
        '--detector',
        type=str,
        default='retinaface',
        choices=['retinaface', 'scrfd'],
        help='Face detector to use',
    )
    parser.add_argument('--threshold', type=float, default=0.6, help='Visualization threshold')
    parser.add_argument('--preview', action='store_true', help='Show live preview')
    args = parser.parse_args()

    if not Path(args.input).exists():
        print(f"Error: Input file '{args.input}' does not exist")
        # Exit non-zero instead of returning, otherwise the process reports success.
        raise SystemExit(1)

    # Create the output directory up front so the video writer can open the file.
    Path(args.output).parent.mkdir(parents=True, exist_ok=True)

    detector = RetinaFace() if args.detector == 'retinaface' else SCRFD()
    process_video(detector, args.input, args.output, args.threshold, args.preview)


# Run the CLI only when this file is executed as a script, not when imported.
if __name__ == '__main__':
    main()
ref: Update some refactoring files for testing 2025-11-25 23:19:45 +09:00			`# Face detection on video files`
			`# Usage: python run_video_detection.py --input video.mp4 --output output.mp4`
ref: Add comprehensive test suite and enhance model functionality - Add new test files for age_gender, factory, landmark, recognition, scrfd, and utils - Add new scripts for age_gender, landmarks, and video detection - Update documentation in README.md, MODELS.md, QUICKSTART.md - Improve model constants and face utilities - Update detection models (retinaface, scrfd) with enhanced functionality - Update project configuration in pyproject.toml 2025-11-15 21:09:37 +09:00
			`import argparse`
			`from pathlib import Path`
ref: Update some refactoring files for testing 2025-11-25 23:19:45 +09:00
			`import cv2`
ref: Add comprehensive test suite and enhance model functionality - Add new test files for age_gender, factory, landmark, recognition, scrfd, and utils - Add new scripts for age_gender, landmarks, and video detection - Update documentation in README.md, MODELS.md, QUICKSTART.md - Improve model constants and face utilities - Update detection models (retinaface, scrfd) with enhanced functionality - Update project configuration in pyproject.toml 2025-11-15 21:09:37 +09:00			`from tqdm import tqdm`

ref: Update some refactoring files for testing 2025-11-25 23:19:45 +09:00			`from uniface import SCRFD, RetinaFace`
ref: Add comprehensive test suite and enhance model functionality - Add new test files for age_gender, factory, landmark, recognition, scrfd, and utils - Add new scripts for age_gender, landmarks, and video detection - Update documentation in README.md, MODELS.md, QUICKSTART.md - Improve model constants and face utilities - Update detection models (retinaface, scrfd) with enhanced functionality - Update project configuration in pyproject.toml 2025-11-15 21:09:37 +09:00			`from uniface.visualization import draw_detections`


chore: Code style formatting changes 2025-11-26 00:05:24 +09:00			`def process_video(`
			`detector,`
			`input_path: str,`
			`output_path: str,`
			`threshold: float = 0.6,`
			`show_preview: bool = False,`
			`):`
ref: Add comprehensive test suite and enhance model functionality - Add new test files for age_gender, factory, landmark, recognition, scrfd, and utils - Add new scripts for age_gender, landmarks, and video detection - Update documentation in README.md, MODELS.md, QUICKSTART.md - Improve model constants and face utilities - Update detection models (retinaface, scrfd) with enhanced functionality - Update project configuration in pyproject.toml 2025-11-15 21:09:37 +09:00			`cap = cv2.VideoCapture(input_path)`
			`if not cap.isOpened():`
			`print(f"Error: Cannot open video file '{input_path}'")`
			`return`

ref: Update some refactoring files for testing 2025-11-25 23:19:45 +09:00			`# get video properties`
ref: Add comprehensive test suite and enhance model functionality - Add new test files for age_gender, factory, landmark, recognition, scrfd, and utils - Add new scripts for age_gender, landmarks, and video detection - Update documentation in README.md, MODELS.md, QUICKSTART.md - Improve model constants and face utilities - Update detection models (retinaface, scrfd) with enhanced functionality - Update project configuration in pyproject.toml 2025-11-15 21:09:37 +09:00			`total_frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))`
ref: Update some refactoring files for testing 2025-11-25 23:19:45 +09:00			`fps = cap.get(cv2.CAP_PROP_FPS)`
ref: Add comprehensive test suite and enhance model functionality - Add new test files for age_gender, factory, landmark, recognition, scrfd, and utils - Add new scripts for age_gender, landmarks, and video detection - Update documentation in README.md, MODELS.md, QUICKSTART.md - Improve model constants and face utilities - Update detection models (retinaface, scrfd) with enhanced functionality - Update project configuration in pyproject.toml 2025-11-15 21:09:37 +09:00			`width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))`
			`height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))`

feat: Enhace emotion inference speed on ARM and add FaceAnalyzer, Face classes for ease of use. (#25) * feat: Update linting and type annotations, return types in detect * feat: add face analyzer and face classes * chore: Update the format and clean up some docstrings * docs: Update usage documentation * feat: Change AgeGender model output to 0, 1 instead of string (Female, Male) * test: Update testing code * feat: Add Apple silicon backend for torchscript inference * feat: Add face analyzer example and add run emotion for testing 2025-11-30 20:32:07 +09:00			`print(f'Input: {input_path} ({width}x{height}, {fps:.1f} fps, {total_frames} frames)')`
			`print(f'Output: {output_path}')`
ref: Add comprehensive test suite and enhance model functionality - Add new test files for age_gender, factory, landmark, recognition, scrfd, and utils - Add new scripts for age_gender, landmarks, and video detection - Update documentation in README.md, MODELS.md, QUICKSTART.md - Improve model constants and face utilities - Update detection models (retinaface, scrfd) with enhanced functionality - Update project configuration in pyproject.toml 2025-11-15 21:09:37 +09:00
feat: Enhace emotion inference speed on ARM and add FaceAnalyzer, Face classes for ease of use. (#25) * feat: Update linting and type annotations, return types in detect * feat: add face analyzer and face classes * chore: Update the format and clean up some docstrings * docs: Update usage documentation * feat: Change AgeGender model output to 0, 1 instead of string (Female, Male) * test: Update testing code * feat: Add Apple silicon backend for torchscript inference * feat: Add face analyzer example and add run emotion for testing 2025-11-30 20:32:07 +09:00			`fourcc = cv2.VideoWriter_fourcc(*'mp4v') # codec for .mp4`
ref: Update some refactoring files for testing 2025-11-25 23:19:45 +09:00			`out = cv2.VideoWriter(output_path, fourcc, fps, (width, height))`
ref: Add comprehensive test suite and enhance model functionality - Add new test files for age_gender, factory, landmark, recognition, scrfd, and utils - Add new scripts for age_gender, landmarks, and video detection - Update documentation in README.md, MODELS.md, QUICKSTART.md - Improve model constants and face utilities - Update detection models (retinaface, scrfd) with enhanced functionality - Update project configuration in pyproject.toml 2025-11-15 21:09:37 +09:00
			`if not out.isOpened():`
			`print(f"Error: Cannot create output video '{output_path}'")`
			`cap.release()`
			`return`

			`frame_count = 0`
			`total_faces = 0`

feat: Enhace emotion inference speed on ARM and add FaceAnalyzer, Face classes for ease of use. (#25) * feat: Update linting and type annotations, return types in detect * feat: add face analyzer and face classes * chore: Update the format and clean up some docstrings * docs: Update usage documentation * feat: Change AgeGender model output to 0, 1 instead of string (Female, Male) * test: Update testing code * feat: Add Apple silicon backend for torchscript inference * feat: Add face analyzer example and add run emotion for testing 2025-11-30 20:32:07 +09:00			`for _ in tqdm(range(total_frames), desc='Processing', unit='frames'):`
ref: Update some refactoring files for testing 2025-11-25 23:19:45 +09:00			`ret, frame = cap.read()`
			`if not ret:`
			`break`
ref: Add comprehensive test suite and enhance model functionality - Add new test files for age_gender, factory, landmark, recognition, scrfd, and utils - Add new scripts for age_gender, landmarks, and video detection - Update documentation in README.md, MODELS.md, QUICKSTART.md - Improve model constants and face utilities - Update detection models (retinaface, scrfd) with enhanced functionality - Update project configuration in pyproject.toml 2025-11-15 21:09:37 +09:00
ref: Update some refactoring files for testing 2025-11-25 23:19:45 +09:00			`frame_count += 1`
			`faces = detector.detect(frame)`
			`total_faces += len(faces)`
ref: Add comprehensive test suite and enhance model functionality - Add new test files for age_gender, factory, landmark, recognition, scrfd, and utils - Add new scripts for age_gender, landmarks, and video detection - Update documentation in README.md, MODELS.md, QUICKSTART.md - Improve model constants and face utilities - Update detection models (retinaface, scrfd) with enhanced functionality - Update project configuration in pyproject.toml 2025-11-15 21:09:37 +09:00
feat: Enhace emotion inference speed on ARM and add FaceAnalyzer, Face classes for ease of use. (#25) * feat: Update linting and type annotations, return types in detect * feat: add face analyzer and face classes * chore: Update the format and clean up some docstrings * docs: Update usage documentation * feat: Change AgeGender model output to 0, 1 instead of string (Female, Male) * test: Update testing code * feat: Add Apple silicon backend for torchscript inference * feat: Add face analyzer example and add run emotion for testing 2025-11-30 20:32:07 +09:00			`bboxes = [f['bbox'] for f in faces]`
			`scores = [f['confidence'] for f in faces]`
			`landmarks = [f['landmarks'] for f in faces]`
feat: Add yolov5n, update docs and ruff code format 2025-12-11 01:02:18 +09:00			`draw_detections(`
			`image=frame, bboxes=bboxes, scores=scores, landmarks=landmarks, vis_threshold=threshold, fancy_bbox=True`
			`)`
ref: Add comprehensive test suite and enhance model functionality - Add new test files for age_gender, factory, landmark, recognition, scrfd, and utils - Add new scripts for age_gender, landmarks, and video detection - Update documentation in README.md, MODELS.md, QUICKSTART.md - Improve model constants and face utilities - Update detection models (retinaface, scrfd) with enhanced functionality - Update project configuration in pyproject.toml 2025-11-15 21:09:37 +09:00
chore: Code style formatting changes 2025-11-26 00:05:24 +09:00			`cv2.putText(`
			`frame,`
feat: Enhace emotion inference speed on ARM and add FaceAnalyzer, Face classes for ease of use. (#25) * feat: Update linting and type annotations, return types in detect * feat: add face analyzer and face classes * chore: Update the format and clean up some docstrings * docs: Update usage documentation * feat: Change AgeGender model output to 0, 1 instead of string (Female, Male) * test: Update testing code * feat: Add Apple silicon backend for torchscript inference * feat: Add face analyzer example and add run emotion for testing 2025-11-30 20:32:07 +09:00			`f'Faces: {len(faces)}',`
chore: Code style formatting changes 2025-11-26 00:05:24 +09:00			`(10, 30),`
			`cv2.FONT_HERSHEY_SIMPLEX,`
			`1,`
			`(0, 255, 0),`
			`2,`
			`)`
ref: Update some refactoring files for testing 2025-11-25 23:19:45 +09:00			`out.write(frame)`
ref: Add comprehensive test suite and enhance model functionality - Add new test files for age_gender, factory, landmark, recognition, scrfd, and utils - Add new scripts for age_gender, landmarks, and video detection - Update documentation in README.md, MODELS.md, QUICKSTART.md - Improve model constants and face utilities - Update detection models (retinaface, scrfd) with enhanced functionality - Update project configuration in pyproject.toml 2025-11-15 21:09:37 +09:00
			`if show_preview:`
ref: Update some refactoring files for testing 2025-11-25 23:19:45 +09:00			`cv2.imshow("Processing - Press 'q' to cancel", frame)`
feat: Enhace emotion inference speed on ARM and add FaceAnalyzer, Face classes for ease of use. (#25) * feat: Update linting and type annotations, return types in detect * feat: add face analyzer and face classes * chore: Update the format and clean up some docstrings * docs: Update usage documentation * feat: Change AgeGender model output to 0, 1 instead of string (Female, Male) * test: Update testing code * feat: Add Apple silicon backend for torchscript inference * feat: Add face analyzer example and add run emotion for testing 2025-11-30 20:32:07 +09:00			`if cv2.waitKey(1) & 0xFF == ord('q'):`
			`print('\nCancelled by user')`
ref: Update some refactoring files for testing 2025-11-25 23:19:45 +09:00			`break`
ref: Add comprehensive test suite and enhance model functionality - Add new test files for age_gender, factory, landmark, recognition, scrfd, and utils - Add new scripts for age_gender, landmarks, and video detection - Update documentation in README.md, MODELS.md, QUICKSTART.md - Improve model constants and face utilities - Update detection models (retinaface, scrfd) with enhanced functionality - Update project configuration in pyproject.toml 2025-11-15 21:09:37 +09:00
ref: Update some refactoring files for testing 2025-11-25 23:19:45 +09:00			`cap.release()`
			`out.release()`
			`if show_preview:`
			`cv2.destroyAllWindows()`

			`avg_faces = total_faces / frame_count if frame_count > 0 else 0`
feat: Enhace emotion inference speed on ARM and add FaceAnalyzer, Face classes for ease of use. (#25) * feat: Update linting and type annotations, return types in detect * feat: add face analyzer and face classes * chore: Update the format and clean up some docstrings * docs: Update usage documentation * feat: Change AgeGender model output to 0, 1 instead of string (Female, Male) * test: Update testing code * feat: Add Apple silicon backend for torchscript inference * feat: Add face analyzer example and add run emotion for testing 2025-11-30 20:32:07 +09:00			`print(f'\nDone! {frame_count} frames, {total_faces} faces ({avg_faces:.1f} avg/frame)')`
			`print(f'Saved: {output_path}')`
ref: Add comprehensive test suite and enhance model functionality - Add new test files for age_gender, factory, landmark, recognition, scrfd, and utils - Add new scripts for age_gender, landmarks, and video detection - Update documentation in README.md, MODELS.md, QUICKSTART.md - Improve model constants and face utilities - Update detection models (retinaface, scrfd) with enhanced functionality - Update project configuration in pyproject.toml 2025-11-15 21:09:37 +09:00

			`def main():`
feat: Enhace emotion inference speed on ARM and add FaceAnalyzer, Face classes for ease of use. (#25) * feat: Update linting and type annotations, return types in detect * feat: add face analyzer and face classes * chore: Update the format and clean up some docstrings * docs: Update usage documentation * feat: Change AgeGender model output to 0, 1 instead of string (Female, Male) * test: Update testing code * feat: Add Apple silicon backend for torchscript inference * feat: Add face analyzer example and add run emotion for testing 2025-11-30 20:32:07 +09:00			`parser = argparse.ArgumentParser(description='Process video with face detection')`
			`parser.add_argument('--input', type=str, required=True, help='Input video path')`
			`parser.add_argument('--output', type=str, required=True, help='Output video path')`
			`parser.add_argument('--detector', type=str, default='retinaface', choices=['retinaface', 'scrfd'])`
			`parser.add_argument('--threshold', type=float, default=0.6, help='Visualization threshold')`
			`parser.add_argument('--preview', action='store_true', help='Show live preview')`
ref: Add comprehensive test suite and enhance model functionality - Add new test files for age_gender, factory, landmark, recognition, scrfd, and utils - Add new scripts for age_gender, landmarks, and video detection - Update documentation in README.md, MODELS.md, QUICKSTART.md - Improve model constants and face utilities - Update detection models (retinaface, scrfd) with enhanced functionality - Update project configuration in pyproject.toml 2025-11-15 21:09:37 +09:00			`args = parser.parse_args()`

			`if not Path(args.input).exists():`
			`print(f"Error: Input file '{args.input}' does not exist")`
			`return`

ref: Update some refactoring files for testing 2025-11-25 23:19:45 +09:00			`Path(args.output).parent.mkdir(parents=True, exist_ok=True)`

feat: Enhace emotion inference speed on ARM and add FaceAnalyzer, Face classes for ease of use. (#25) * feat: Update linting and type annotations, return types in detect * feat: add face analyzer and face classes * chore: Update the format and clean up some docstrings * docs: Update usage documentation * feat: Change AgeGender model output to 0, 1 instead of string (Female, Male) * test: Update testing code * feat: Add Apple silicon backend for torchscript inference * feat: Add face analyzer example and add run emotion for testing 2025-11-30 20:32:07 +09:00			`detector = RetinaFace() if args.detector == 'retinaface' else SCRFD()`
ref: Update some refactoring files for testing 2025-11-25 23:19:45 +09:00			`process_video(detector, args.input, args.output, args.threshold, args.preview)`
ref: Add comprehensive test suite and enhance model functionality - Add new test files for age_gender, factory, landmark, recognition, scrfd, and utils - Add new scripts for age_gender, landmarks, and video detection - Update documentation in README.md, MODELS.md, QUICKSTART.md - Improve model constants and face utilities - Update detection models (retinaface, scrfd) with enhanced functionality - Update project configuration in pyproject.toml 2025-11-15 21:09:37 +09:00

feat: Enhace emotion inference speed on ARM and add FaceAnalyzer, Face classes for ease of use. (#25) * feat: Update linting and type annotations, return types in detect * feat: add face analyzer and face classes * chore: Update the format and clean up some docstrings * docs: Update usage documentation * feat: Change AgeGender model output to 0, 1 instead of string (Female, Male) * test: Update testing code * feat: Add Apple silicon backend for torchscript inference * feat: Add face analyzer example and add run emotion for testing 2025-11-30 20:32:07 +09:00			`if __name__ == '__main__':`
ref: Add comprehensive test suite and enhance model functionality - Add new test files for age_gender, factory, landmark, recognition, scrfd, and utils - Add new scripts for age_gender, landmarks, and video detection - Update documentation in README.md, MODELS.md, QUICKSTART.md - Improve model constants and face utilities - Update detection models (retinaface, scrfd) with enhanced functionality - Update project configuration in pyproject.toml 2025-11-15 21:09:37 +09:00			`main()`