-
Notifications
You must be signed in to change notification settings - Fork 57
/
crop_mouth.py
37 lines (29 loc) · 1.38 KB
/
crop_mouth.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
#! /usr/bin/env python
# -*- coding: utf-8 -*-
# Copyright 2023 Imperial College London (Pingchuan Ma)
# Apache 2.0 (http://www.apache.org/licenses/LICENSE-2.0)
import os
import cv2
import hydra
import torchvision
from pipelines.detectors.mediapipe.detector import LandmarksDetector
from pipelines.data.data_module import AVSRDataLoader
def save2vid(filename, vid, frames_per_second):
os.makedirs(os.path.dirname(filename), exist_ok=True)
torchvision.io.write_video(filename, vid, frames_per_second)
@hydra.main(version_base=None, config_path="hydra_configs", config_name="default")
def main(cfg):
if cfg.detector == "mediapipe":
from pipelines.detectors.mediapipe.detector import LandmarksDetector
landmarks_detector = LandmarksDetector()
if cfg.detector == "retinaface":
from pipelines.detectors.retinaface.detector import LandmarksDetector
landmarks_detector = LandmarksDetector()
dataloader = AVSRDataLoader(modality="video", speed_rate=1, transform=False, detector=cfg.detector, convert_gray=False)
landmarks = landmarks_detector(cfg.data_filename)
data = dataloader.load_data(cfg.data_filename, landmarks)
fps = cv2.VideoCapture(cfg.data_filename).get(cv2.CAP_PROP_FPS)
save2vid(cfg.dst_filename, data, fps)
print(f"The mouth images have been cropped and saved to {cfg.dst_filename}")
if __name__ == "__main__":
main()