diff --git a/README.md b/README.md new file mode 100644 index 0000000..8d019fa --- /dev/null +++ b/README.md @@ -0,0 +1,65 @@ +Take a video and replace the face in it with a face of your choice. You only need one image of the desired face. No dataset, no training. + +That's it, that's the software. + +![demo-gif](demo.gif) + +## Installation +> Do not create any issues regarding installation problems. I am only responsible for issues in this program, use google for help. + +1. install `python`, `pip` and `git` +2. install `ffmpeg` +3. run the following commands in terminal: +``` +git clone https://github.com/s0md3v/roop +cd roop +pip3 install -r requirements.txt +``` + +### Do you have a decent GPU? +If you have a good enough GPU, you can use it to speed up the face-swapping process by running `run.py` with `--gpu` flag. +If you plan on doing, you will need to install the appropriate `onnxruntime-*` package as follows: + +#### NVIDIA +``` +pip3 install onnxruntime-gpu +``` +#### AMD +``` +git clone https://github.com/microsoft/onnxruntime +cd onnxruntime +./build.sh --config Release --build_wheel --update --build --parallel --cmake_extra_defines CMAKE_PREFIX_PATH=/opt/rocm/lib/cmake ONNXRUNTIME_VERSION=$ONNXRUNTIME_VERSION onnxruntime_BUILD_UNIT_TESTS=off --use_rocm --rocm_home=/opt/rocm +pip install build/Linux/Release/dist/*.whl +``` + +## Usage +> Note: When you run this program for the first time, it will download some models ~300MB in size. + +Executing `python run.py` command will launch this window: + +Choose a face (image with desired face) and the target image/video (image/video in which you want to replace the face) and click on `Start`. The output will be saved in `output.mp4` file. + +Don't touch the FPS checkbox unless you know what you are doing. + +Additional command line arguments are given below: +``` +-h, --help show this help message and exit +-f SOURCE_IMG, --face SOURCE_IMG + use this face +-t TARGET_PATH, --target TARGET_PATH + replace this face +--keep-fps keep original fps +--gpu use gpu +--keep-frames don't delete frames directory +``` + +Looking for a CLI mode? Using the -f/--face argument will make the program in cli mode. + +## Future plans +- [ ] Replace a selective face throughout the video +- [ ] Support for replacing multiple faces + +## Credits +- [ffmpeg](https://ffmpeg.org/): for making video related operations easy +- [deepinsight](https://github.com/deepinsight): for their [insightface](https://github.com/deepinsight/insightface) project which provided a well-made library and models. +- and all developers behind libraries used in this project. diff --git a/core/__init__.py b/core/__init__.py new file mode 100644 index 0000000..8d1c8b6 --- /dev/null +++ b/core/__init__.py @@ -0,0 +1 @@ + diff --git a/core/config.py b/core/config.py new file mode 100644 index 0000000..1edf36c --- /dev/null +++ b/core/config.py @@ -0,0 +1,9 @@ +import insightface + +face_analyser = insightface.app.FaceAnalysis(name='buffalo_l', providers=['CUDAExecutionProvider', 'ROCMExecutionProvider', 'CPUExecutionProvider']) +face_analyser.prepare(ctx_id=0, det_size=(640, 640)) + + +def get_face(img_data): + analysed = face_analyser.get(img_data) + return sorted(analysed, key=lambda x: x.bbox[0])[0] diff --git a/core/processor.py b/core/processor.py new file mode 100644 index 0000000..a7c5265 --- /dev/null +++ b/core/processor.py @@ -0,0 +1,28 @@ +import cv2 +import insightface +from core.config import get_face +from core.utils import rreplace + +face_swapper = insightface.model_zoo.get_model('inswapper_128.onnx', providers=['CUDAExecutionProvider', 'ROCMExecutionProvider', 'CPUExecutionProvider']) + + +def process_video(source_img, frame_paths): + source_face = get_face(cv2.imread(source_img)) + for frame_path in frame_paths: + frame = cv2.imread(frame_path) + try: + face = get_face(frame) + result = face_swapper.get(frame, face, source_face, paste_back=True) + cv2.imwrite(frame_path, result) + except Exception as e: + pass + + +def process_img(source_img, target_path): + frame = cv2.imread(target_path) + face = get_face(frame) + source_face = get_face(cv2.imread(source_img)) + result = face_swapper.get(frame, face, source_face, paste_back=True) + target_path = rreplace(target_path, "/", "/swapped-", 1) if "/" in target_path else "swapped-"+target_path + print(target_path) + cv2.imwrite(target_path, result) diff --git a/core/utils.py b/core/utils.py new file mode 100644 index 0000000..8cdeb0e --- /dev/null +++ b/core/utils.py @@ -0,0 +1,46 @@ +import os +import shutil + +def run_command(command, mode="silent"): + if mode == "debug": + return os.system(command) + return os.popen(command).read() + +def detect_fps(input_path): + output = os.popen(f"ffprobe -v error -select_streams v -of default=noprint_wrappers=1:nokey=1 -show_entries stream=r_frame_rate {input_path}").read() + if "/" in output: + try: + return int(output.split("/")[0]) // int(output.split("/")[1]) + except: + pass + return 60 + + +def set_fps(input_path, output_path, fps): + os.system(f"ffmpeg -i {input_path} -filter:v fps=fps={fps} {output_path}") + + +def create_video(video_name, fps, output_dir): + os.system(f"ffmpeg -framerate {fps} -pattern_type glob -i '{output_dir}/*.png' -c:v libx264 -pix_fmt yuv420p -y {output_dir}/output.mp4") + + +def extract_frames(input_path, output_dir): + os.system(f"ffmpeg -i {input_path} '{output_dir}/%04d.png'") + + +def add_audio(current_dir, output_dir, target_path, keep_frames): + video = target_path.split("/")[-1] + video_name = video.split(".")[0] + os.system(f"ffmpeg -i {output_dir}/output.mp4 -i {output_dir}/{video} -c:v copy -map 0:v:0 -map 1:a:0 -y {current_dir}/swapped-{video_name}.mp4") + if not os.path.isfile(current_dir + "/swapped-" + video_name + ".mp4"): + shutil.move(output_dir + "/output.mp4", current_dir + "/swapped-" + video_name + ".mp4") + if not keep_frames: + shutil.rmtree(output_dir) + + +def is_img(path): + return path.lower().endswith(("png", "jpg", "jpeg", "bmp")) + +def rreplace(s, old, new, occurrence): + li = s.rsplit(old, occurrence) + return new.join(li) diff --git a/demo.gif b/demo.gif new file mode 100644 index 0000000..4ec0085 Binary files /dev/null and b/demo.gif differ diff --git a/requirements.txt b/requirements.txt new file mode 100644 index 0000000..9143efe --- /dev/null +++ b/requirements.txt @@ -0,0 +1,4 @@ +numpy +opencv-python +onnx +insightface diff --git a/run.py b/run.py new file mode 100644 index 0000000..62bb92e --- /dev/null +++ b/run.py @@ -0,0 +1,113 @@ +import glob +import argparse +import multiprocessing as mp +import os +from pathlib import Path +import tkinter as tk +from tkinter import filedialog +from core.processor import process_video, process_img +from core.utils import is_img, detect_fps, set_fps, create_video, add_audio, extract_frames +import webbrowser +import psutil +import shutil + +pool = None +args = {} + +parser = argparse.ArgumentParser() +parser.add_argument('-f', '--face', help='use this face', dest='source_img') +parser.add_argument('-t', '--target', help='replace this face', dest='target_path') +parser.add_argument('--keep-fps', help='maintain original fps', dest='keep_fps', action='store_true', default=False) +parser.add_argument('--gpu', help='use gpu', dest='gpu', action='store_true', default=False) +parser.add_argument('--keep-frames', help='keep frames directory', dest='keep_frames', action='store_true', default=False) + +for name, value in vars(parser.parse_args()).items(): + args[name] = value + +def start_processing(): + if args['gpu']: + process_video(args['source_img'], args["frame_paths"]) + return + frame_paths = args["frame_paths"] + n = len(frame_paths)//(psutil.cpu_count()-1) + processes = [] + for i in range(0, len(frame_paths), n): + p = pool.apply_async(process_video, args=(args['source_img'], frame_paths[i:i+n],)) + processes.append(p) + for p in processes: + p.get() + pool.close() + pool.join() + + +def select_face(): + args['source_img'] = filedialog.askopenfilename(title="Select a face") + + +def select_target(): + args['target_path'] = filedialog.askopenfilename(title="Select a target") + + +def toggle_fps_limit(): + args['keep_fps'] = limit_fps.get() != True + + +def start(): + global pool + pool = mp.Pool(psutil.cpu_count()-1) + current_dir = os.getcwd() + target_path = args['target_path'] + if is_img(target_path): + process_img(args['source_img'], target_path) + return + video_name = target_path.split("/")[-1].split(".")[0] + output_dir = current_dir + "/" + video_name + Path(output_dir).mkdir(exist_ok=True) + fps = detect_fps(target_path) + if not args['keep_fps'] and fps > 30: + this_path = output_dir + "/" + video_name + ".mp4" + set_fps(target_path, this_path, 30) + target_path, fps = this_path, 30 + else: + shutil.copy(target_path, output_dir) + extract_frames(target_path, output_dir) + args['frame_paths'] = tuple(sorted( + glob.glob(output_dir + "/*.png"), + key=lambda x: int(x.split("/")[-1].replace(".png", "")) + )) + start_processing() + create_video(video_name, fps, output_dir) + add_audio(current_dir, output_dir, target_path, args['keep_frames']) + + +if __name__ == "__main__": + if args['source_img']: + start() + quit() + window = tk.Tk() + window.geometry("600x200") + window.title("roop") + + # Contact information + support_link = tk.Label(window, text="Support the project ^_^", fg="red", cursor="hand2") + support_link.pack(padx=10, pady=10) + support_link.bind("", lambda e: webbrowser.open("https://github.com/sponsors/s0md3v")) + + # Select a face button + face_button = tk.Button(window, text="Select a face", command=select_face) + face_button.pack(side=tk.LEFT, padx=10, pady=10) + + # Select a target button + target_button = tk.Button(window, text="Select a target", command=select_target) + target_button.pack(side=tk.RIGHT, padx=10, pady=10) + + # FPS limit checkbox + limit_fps = tk.IntVar() + fps_checkbox = tk.Checkbutton(window, text="Limit FPS to 30", variable=limit_fps, command=toggle_fps_limit, font=("Arial", 8)) + fps_checkbox.pack(side=tk.BOTTOM) + fps_checkbox.select() + + # Start button + start_button = tk.Button(window, text="Start", bg="green", command=start) + start_button.pack(side=tk.BOTTOM, padx=10, pady=10) + window.mainloop()