Next (#107)

* Allow passing the onnxruntime to install.py * Fix CI * Disallow none execution providers in the UI * Use CV2 to detect fps * Respect trim on videos with audio * Respect trim on videos with audio (finally) * Implement caching to speed up preview and webcam * Define webcam UI and webcam performance * Remove layout from components * Add primary buttons * Extract benchmark and webcam settings * Introduce compact UI settings * Caching for IO and **** prediction * Caching for IO and **** prediction * Introduce face analyser caching * Fix some typing * Improve setup for benchmark * Clear image cache via post process * Fix settings in UI, Simplify restore_audio() using shortest * Select resolution and fps via webcam ui * Introduce read_static_image() to stop caching temp images * Use DirectShow under Windows * Multi-threading for webcam * Fix typing * Refactor frame processor * Refactor webcam processing * Avoid warnings due capture.isOpened() * Resume downloads (#110) * Introduce resumable downloads * Fix CURL commands * Break execution_settings into pieces * Cosmetic changes on cv2 webcam * Update Gradio * Move face cache to own file * Uniform namings for threading * Fix sorting of get_temp_frame_paths(), extend get_temp_frames_pattern() * Minor changes from the review * Looks stable to tme * Update the disclaimer * Update the disclaimer * Update the disclaimer
2026-06-13 07:47:48 +02:00 · 2023-09-19 11:21:18 +02:00
parent 7f69889c95
commit 66ea4928f8
45 changed files with 866 additions and 588 deletions
@@ -57,16 +57,19 @@ def clear_frame_processors_modules() -> None:
 	FRAME_PROCESSORS_MODULES = []


-def multi_process_frame(source_path : str, temp_frame_paths : List[str], process_frames: Callable[[str, List[str], Any], None], update: Callable[[], None]) -> None:
-	with ThreadPoolExecutor(max_workers = facefusion.globals.execution_thread_count) as executor:
-		futures = []
-		queue = create_queue(temp_frame_paths)
-		queue_per_future = max(len(temp_frame_paths) // facefusion.globals.execution_thread_count * facefusion.globals.execution_queue_count, 1)
-		while not queue.empty():
-			future = executor.submit(process_frames, source_path, pick_queue(queue, queue_per_future), update)
-			futures.append(future)
-		for future in as_completed(futures):
-			future.result()
+def multi_process_frames(source_path : str, temp_frame_paths : List[str], process_frames : Callable[[str, List[str], Callable[[], None]], None]) -> None:
+	progress_bar_format = '{l_bar}{bar}| {n_fmt}/{total_fmt} [{elapsed}<{remaining}, {rate_fmt}{postfix}]'
+	with tqdm(total = len(temp_frame_paths), desc = wording.get('processing'), unit = 'frame', dynamic_ncols = True, bar_format = progress_bar_format) as progress:
+		with ThreadPoolExecutor(max_workers = facefusion.globals.execution_thread_count) as executor:
+			futures = []
+			queue_temp_frame_paths : Queue[str] = create_queue(temp_frame_paths)
+			queue_per_future = max(len(temp_frame_paths) // facefusion.globals.execution_thread_count * facefusion.globals.execution_queue_count, 1)
+			while not queue_temp_frame_paths.empty():
+				payload_temp_frame_paths = pick_queue(queue_temp_frame_paths, queue_per_future)
+				future = executor.submit(process_frames, source_path, payload_temp_frame_paths, lambda: update_progress(progress))
+				futures.append(future)
+			for future_done in as_completed(futures):
+				future_done.result()


 def create_queue(temp_frame_paths : List[str]) -> Queue[str]:
@@ -84,13 +87,6 @@ def pick_queue(queue : Queue[str], queue_per_future : int) -> List[str]:
 	return queues


-def process_video(source_path : str, frame_paths : List[str], process_frames : Callable[[str, List[str], Any], None]) -> None:
-	progress_bar_format = '{l_bar}{bar}| {n_fmt}/{total_fmt} [{elapsed}<{remaining}, {rate_fmt}{postfix}]'
-	total = len(frame_paths)
-	with tqdm(total = total, desc = wording.get('processing'), unit = 'frame', dynamic_ncols = True, bar_format = progress_bar_format) as progress:
-		multi_process_frame(source_path, frame_paths, process_frames, lambda: update_progress(progress))
-
-
 def update_progress(progress : Any = None) -> None:
 	process = psutil.Process(os.getpid())
 	memory_usage = process.memory_info().rss / 1024 / 1024 / 1024
@@ -1,5 +1,4 @@
 from typing import Any, List, Callable
-import cv2
 import threading
 from gfpgan.utils import GFPGANer

@@ -9,10 +8,11 @@ from facefusion.core import update_status
 from facefusion.face_analyser import get_many_faces
 from facefusion.typing import Frame, Face, ProcessMode
 from facefusion.utilities import conditional_download, resolve_relative_path, is_image, is_video
+from facefusion.vision import read_image, read_static_image, write_image

 FRAME_PROCESSOR = None
-THREAD_SEMAPHORE = threading.Semaphore()
-THREAD_LOCK = threading.Lock()
+THREAD_SEMAPHORE : threading.Semaphore = threading.Semaphore()
+THREAD_LOCK : threading.Lock = threading.Lock()
 NAME = 'FACEFUSION.FRAME_PROCESSOR.FACE_ENHANCER'


@@ -54,6 +54,7 @@ def pre_process(mode : ProcessMode) -> bool:

 def post_process() -> None:
 	clear_frame_processor()
+	read_static_image.cache_clear()


 def enhance_face(target_face : Face, temp_frame : Frame) -> Frame:
@@ -83,20 +84,19 @@ def process_frame(source_face : Face, reference_face : Face, temp_frame : Frame)
 	return temp_frame


-def process_frames(source_path : str, temp_frame_paths : List[str], update: Callable[[], None]) -> None:
+def process_frames(source_path : str, temp_frame_paths : List[str], update_progress: Callable[[], None]) -> None:
 	for temp_frame_path in temp_frame_paths:
-		temp_frame = cv2.imread(temp_frame_path)
+		temp_frame = read_image(temp_frame_path)
 		result_frame = process_frame(None, None, temp_frame)
-		cv2.imwrite(temp_frame_path, result_frame)
-		if update:
-			update()
+		write_image(temp_frame_path, result_frame)
+		update_progress()


 def process_image(source_path : str, target_path : str, output_path : str) -> None:
-	target_frame = cv2.imread(target_path)
+	target_frame = read_static_image(target_path)
 	result_frame = process_frame(None, None, target_frame)
-	cv2.imwrite(output_path, result_frame)
+	write_image(output_path, result_frame)


 def process_video(source_path : str, temp_frame_paths : List[str]) -> None:
-	facefusion.processors.frame.core.process_video(None, temp_frame_paths, process_frames)
+	facefusion.processors.frame.core.multi_process_frames(None, temp_frame_paths, process_frames)
@@ -1,5 +1,4 @@
 from typing import Any, List, Callable
-import cv2
 import insightface
 import threading

@@ -11,9 +10,10 @@ from facefusion.face_analyser import get_one_face, get_many_faces, find_similar_
 from facefusion.face_reference import get_face_reference, set_face_reference
 from facefusion.typing import Face, Frame, ProcessMode
 from facefusion.utilities import conditional_download, resolve_relative_path, is_image, is_video
+from facefusion.vision import read_image, read_static_image, write_image

 FRAME_PROCESSOR = None
-THREAD_LOCK = threading.Lock()
+THREAD_LOCK : threading.Lock = threading.Lock()
 NAME = 'FACEFUSION.FRAME_PROCESSOR.FACE_SWAPPER'


@@ -43,7 +43,7 @@ def pre_process(mode : ProcessMode) -> bool:
 	if not is_image(facefusion.globals.source_path):
 		update_status(wording.get('select_image_source') + wording.get('exclamation_mark'), NAME)
 		return False
-	elif not get_one_face(cv2.imread(facefusion.globals.source_path)):
+	elif not get_one_face(read_static_image(facefusion.globals.source_path)):
 		update_status(wording.get('no_source_face_detected') + wording.get('exclamation_mark'), NAME)
 		return False
 	if mode in [ 'output', 'preview' ] and not is_image(facefusion.globals.target_path) and not is_video(facefusion.globals.target_path):
@@ -56,6 +56,7 @@ def pre_process(mode : ProcessMode) -> bool:

 def post_process() -> None:
 	clear_frame_processor()
+	read_static_image.cache_clear()


 def swap_face(source_face : Face, target_face : Face, temp_frame : Frame) -> Frame:
@@ -76,32 +77,31 @@ def process_frame(source_face : Face, reference_face : Face, temp_frame : Frame)
 	return temp_frame


-def process_frames(source_path : str, temp_frame_paths : List[str], update: Callable[[], None]) -> None:
-	source_face = get_one_face(cv2.imread(source_path))
+def process_frames(source_path : str, temp_frame_paths : List[str], update_progress: Callable[[], None]) -> None:
+	source_face = get_one_face(read_static_image(source_path))
 	reference_face = get_face_reference() if 'reference' in facefusion.globals.face_recognition else None
 	for temp_frame_path in temp_frame_paths:
-		temp_frame = cv2.imread(temp_frame_path)
+		temp_frame = read_image(temp_frame_path)
 		result_frame = process_frame(source_face, reference_face, temp_frame)
-		cv2.imwrite(temp_frame_path, result_frame)
-		if update:
-			update()
+		write_image(temp_frame_path, result_frame)
+		update_progress()


 def process_image(source_path : str, target_path : str, output_path : str) -> None:
-	source_face = get_one_face(cv2.imread(source_path))
-	target_frame = cv2.imread(target_path)
+	source_face = get_one_face(read_static_image(source_path))
+	target_frame = read_static_image(target_path)
 	reference_face = get_one_face(target_frame, facefusion.globals.reference_face_position) if 'reference' in facefusion.globals.face_recognition else None
 	result_frame = process_frame(source_face, reference_face, target_frame)
-	cv2.imwrite(output_path, result_frame)
+	write_image(output_path, result_frame)


 def process_video(source_path : str, temp_frame_paths : List[str]) -> None:
 	conditional_set_face_reference(temp_frame_paths)
-	frame_processors.process_video(source_path, temp_frame_paths, process_frames)
+	frame_processors.multi_process_frames(source_path, temp_frame_paths, process_frames)


 def conditional_set_face_reference(temp_frame_paths : List[str]) -> None:
 	if 'reference' in facefusion.globals.face_recognition and not get_face_reference():
-		reference_frame = cv2.imread(temp_frame_paths[facefusion.globals.reference_frame_number])
+		reference_frame = read_static_image(temp_frame_paths[facefusion.globals.reference_frame_number])
 		reference_face = get_one_face(reference_frame, facefusion.globals.reference_face_position)
 		set_face_reference(reference_face)
@@ -1,5 +1,4 @@
 from typing import Any, List, Callable
-import cv2
 import threading
 from basicsr.archs.rrdbnet_arch import RRDBNet
 from realesrgan import RealESRGANer
@@ -10,10 +9,11 @@ from facefusion import wording, utilities
 from facefusion.core import update_status
 from facefusion.typing import Frame, Face, ProcessMode
 from facefusion.utilities import conditional_download, resolve_relative_path
+from facefusion.vision import read_image, read_static_image, write_image

 FRAME_PROCESSOR = None
-THREAD_SEMAPHORE = threading.Semaphore()
-THREAD_LOCK = threading.Lock()
+THREAD_SEMAPHORE : threading.Semaphore = threading.Semaphore()
+THREAD_LOCK : threading.Lock = threading.Lock()
 NAME = 'FACEFUSION.FRAME_PROCESSOR.FRAME_ENHANCER'


@@ -63,6 +63,7 @@ def pre_process(mode : ProcessMode) -> bool:

 def post_process() -> None:
 	clear_frame_processor()
+	read_static_image.cache_clear()


 def enhance_frame(temp_frame : Frame) -> Frame:
@@ -75,20 +76,19 @@ def process_frame(source_face : Face, reference_face : Face, temp_frame : Frame)
 	return enhance_frame(temp_frame)


-def process_frames(source_path : str, temp_frame_paths : List[str], update: Callable[[], None]) -> None:
+def process_frames(source_path : str, temp_frame_paths : List[str], update_progress: Callable[[], None]) -> None:
 	for temp_frame_path in temp_frame_paths:
-		temp_frame = cv2.imread(temp_frame_path)
+		temp_frame = read_image(temp_frame_path)
 		result_frame = process_frame(None, None, temp_frame)
-		cv2.imwrite(temp_frame_path, result_frame)
-		if update:
-			update()
+		write_image(temp_frame_path, result_frame)
+		update_progress()


 def process_image(source_path : str, target_path : str, output_path : str) -> None:
-	target_frame = cv2.imread(target_path)
+	target_frame = read_static_image(target_path)
 	result = process_frame(None, None, target_frame)
-	cv2.imwrite(output_path, result)
+	write_image(output_path, result)


 def process_video(source_path : str, temp_frame_paths : List[str]) -> None:
-	frame_processors.process_video(None, temp_frame_paths, process_frames)
+	frame_processors.multi_process_frames(None, temp_frame_paths, process_frames)