Next (#502)

* Validate the overrides from facefusion.ini * Break down cli testing * Remove architecture lookup to support old driver * Remove architecture lookup to support old driver * Remove hwaccel auto * Respect the output video resolution * Bump next version * Full directml support (#501) * Introduce conditional thread management for DML support * Finish migration to thread helpers * Introduce dynamic frame colorizer sizes * Introduce dynamic frame colorizer sizes * Add 192x192 to frame colorizer * Fix async audio
2024-04-19 13:35:36 +02:00
parent 092dfbb796
commit 4efa5b2c6e
30 changed files with 350 additions and 191 deletions
--- a/facefusion/face_analyser.py
+++ b/facefusion/face_analyser.py
@@ -1,6 +1,5 @@
 from typing import Any, Optional, List, Tuple
 from time import sleep
-import threading
 import cv2
 import numpy
 import onnxruntime
@@ -13,12 +12,11 @@ from facefusion.face_store import get_static_faces, set_static_faces
 from facefusion.execution import apply_execution_provider_options
 from facefusion.download import conditional_download
 from facefusion.filesystem import resolve_relative_path, is_file
+from facefusion.thread_helper import thread_lock, thread_semaphore, conditional_thread_semaphore
 from facefusion.typing import VisionFrame, Face, FaceSet, FaceAnalyserOrder, FaceAnalyserAge, FaceAnalyserGender, ModelSet, BoundingBox, FaceLandmarkSet, FaceLandmark5, FaceLandmark68, Score, FaceScoreSet, Embedding
 from facefusion.vision import resize_frame_resolution, unpack_resolution

 FACE_ANALYSER = None
-THREAD_SEMAPHORE : threading.Semaphore = threading.Semaphore()
-THREAD_LOCK : threading.Lock = threading.Lock()
 MODELS : ModelSet =\
 {
 	'face_detector_retinaface':
@@ -85,7 +83,7 @@ def get_face_analyser() -> Any:
 	face_detectors = {}
 	face_landmarkers = {}

-	with THREAD_LOCK:
+	with thread_lock():
 		while process_manager.is_checking():
 			sleep(0.5)
 		if FACE_ANALYSER is None:
@@ -185,7 +183,7 @@ def detect_with_retinaface(vision_frame : VisionFrame, face_detector_size : str)
 	score_list = []

 	detect_vision_frame = prepare_detect_frame(temp_vision_frame, face_detector_size)
-	with THREAD_SEMAPHORE:
+	with thread_semaphore():
 		detections = face_detector.run(None,
 		{
 			face_detector.get_inputs()[0].name: detect_vision_frame
@@ -227,7 +225,7 @@ def detect_with_scrfd(vision_frame : VisionFrame, face_detector_size : str) -> T
 	score_list = []

 	detect_vision_frame = prepare_detect_frame(temp_vision_frame, face_detector_size)
-	with THREAD_SEMAPHORE:
+	with thread_semaphore():
 		detections = face_detector.run(None,
 		{
 			face_detector.get_inputs()[0].name: detect_vision_frame
@@ -266,7 +264,7 @@ def detect_with_yoloface(vision_frame : VisionFrame, face_detector_size : str) -
 	score_list = []

 	detect_vision_frame = prepare_detect_frame(temp_vision_frame, face_detector_size)
-	with THREAD_SEMAPHORE:
+	with thread_semaphore():
 		detections = face_detector.run(None,
 		{
 			face_detector.get_inputs()[0].name: detect_vision_frame
@@ -304,7 +302,7 @@ def detect_with_yunet(vision_frame : VisionFrame, face_detector_size : str) -> T

 	face_detector.setInputSize((temp_vision_frame.shape[1], temp_vision_frame.shape[0]))
 	face_detector.setScoreThreshold(facefusion.globals.face_detector_score)
-	with THREAD_SEMAPHORE:
+	with thread_semaphore():
 		_, detections = face_detector.detect(temp_vision_frame)
 	if numpy.any(detections):
 		for detection in detections:
@@ -380,10 +378,11 @@ def calc_embedding(temp_vision_frame : VisionFrame, face_landmark_5 : FaceLandma
 	crop_vision_frame = crop_vision_frame / 127.5 - 1
 	crop_vision_frame = crop_vision_frame[:, :, ::-1].transpose(2, 0, 1).astype(numpy.float32)
 	crop_vision_frame = numpy.expand_dims(crop_vision_frame, axis = 0)
-	embedding = face_recognizer.run(None,
-	{
-		face_recognizer.get_inputs()[0].name: crop_vision_frame
-	})[0]
+	with conditional_thread_semaphore(facefusion.globals.execution_providers):
+		embedding = face_recognizer.run(None,
+		{
+			face_recognizer.get_inputs()[0].name: crop_vision_frame
+		})[0]
 	embedding = embedding.ravel()
 	normed_embedding = embedding / numpy.linalg.norm(embedding)
 	return embedding, normed_embedding
@@ -399,10 +398,11 @@ def detect_face_landmark_68(temp_vision_frame : VisionFrame, bounding_box : Boun
 		crop_vision_frame[:, :, 0] = cv2.createCLAHE(clipLimit = 2).apply(crop_vision_frame[:, :, 0])
 	crop_vision_frame = cv2.cvtColor(crop_vision_frame, cv2.COLOR_Lab2RGB)
 	crop_vision_frame = crop_vision_frame.transpose(2, 0, 1).astype(numpy.float32) / 255.0
-	face_landmark_68, face_heatmap = face_landmarker.run(None,
-	{
-		face_landmarker.get_inputs()[0].name: [ crop_vision_frame ]
-	})
+	with conditional_thread_semaphore(facefusion.globals.execution_providers):
+		face_landmark_68, face_heatmap = face_landmarker.run(None,
+		{
+			face_landmarker.get_inputs()[0].name: [ crop_vision_frame ]
+		})
 	face_landmark_68 = face_landmark_68[:, :, :2][0] / 64
 	face_landmark_68 = face_landmark_68.reshape(1, -1, 2) * 256
 	face_landmark_68 = cv2.transform(face_landmark_68, cv2.invertAffineTransform(affine_matrix))
@@ -416,10 +416,11 @@ def expand_face_landmark_68_from_5(face_landmark_5 : FaceLandmark5) -> FaceLandm
 	face_landmarker = get_face_analyser().get('face_landmarkers').get('68_5')
 	affine_matrix = estimate_matrix_by_face_landmark_5(face_landmark_5, 'ffhq_512', (1, 1))
 	face_landmark_5 = cv2.transform(face_landmark_5.reshape(1, -1, 2), affine_matrix).reshape(-1, 2)
-	face_landmark_68_5 = face_landmarker.run(None,
-	{
-		face_landmarker.get_inputs()[0].name: [ face_landmark_5 ]
-	})[0][0]
+	with conditional_thread_semaphore(facefusion.globals.execution_providers):
+		face_landmark_68_5 = face_landmarker.run(None,
+		{
+			face_landmarker.get_inputs()[0].name: [ face_landmark_5 ]
+		})[0][0]
 	face_landmark_68_5 = cv2.transform(face_landmark_68_5.reshape(1, -1, 2), cv2.invertAffineTransform(affine_matrix)).reshape(-1, 2)
 	return face_landmark_68_5

@@ -432,10 +433,11 @@ def detect_gender_age(temp_vision_frame : VisionFrame, bounding_box : BoundingBo
 	crop_vision_frame, affine_matrix = warp_face_by_translation(temp_vision_frame, translation, scale, (96, 96))
 	crop_vision_frame = crop_vision_frame[:, :, ::-1].transpose(2, 0, 1).astype(numpy.float32)
 	crop_vision_frame = numpy.expand_dims(crop_vision_frame, axis = 0)
-	prediction = gender_age.run(None,
-	{
-		gender_age.get_inputs()[0].name: crop_vision_frame
-	})[0][0]
+	with conditional_thread_semaphore(facefusion.globals.execution_providers):
+		prediction = gender_age.run(None,
+		{
+			gender_age.get_inputs()[0].name: crop_vision_frame
+		})[0][0]
 	gender = int(numpy.argmax(prediction[:2]))
 	age = int(numpy.round(prediction[2] * 100))
 	return gender, age