FaceSwap / roop /ui.py
supArs's picture
Upload 48 files
43adbb1
raw
history blame
41.4 kB
import os
import time
import gradio as gr
import cv2
import pathlib
import shutil
import roop.globals
import roop.metadata
import roop.utilities as util
from roop.face_util import extract_face_images
from roop.capturer import get_video_frame, get_video_frame_total, get_image_frame
from roop.ProcessEntry import ProcessEntry
# Set to True by restart() and on_cam_toggle(); run() polls it to leave its wait loop.
restart_server = False
# Whether the Live Cam tab creates its webcam widgets; read in run(), written by on_cam_toggle().
live_cam_active = False
# Only RECENT_DIRECTORY_SOURCE is written in this file (by on_srcimg_changed()).
RECENT_DIRECTORY_SOURCE = None
RECENT_DIRECTORY_TARGET = None
RECENT_DIRECTORY_OUTPUT = None
# Latest result of extract_face_images(); entries are indexed as [0] = face, [1] = face image.
SELECTION_FACES_DATA = None
# Last source image path handled by on_srcimg_changed(), used to ignore repeated events.
last_image = None
# Gallery thumbnails kept alongside roop.globals.INPUT_FACES / roop.globals.TARGET_FACES.
input_thumbs = []
target_thumbs = []
# True while the face-selection gallery feeds the input faces, False for target faces.
IS_INPUT = True
# Indices recorded by the gallery select handlers.
SELECTED_FACE_INDEX = 0
SELECTED_INPUT_FACE_INDEX = 0
SELECTED_TARGET_FACE_INDEX = 0
# Placeholders; run() stores Checkbox components in keep_frames/skip_audio and
# start_swap() later overwrites those two with the submitted values.
roop.globals.keep_fps = None
roop.globals.keep_frames = None
roop.globals.skip_audio = None
roop.globals.use_batch = None
# UI component handles assigned inside run().
input_faces = None
target_faces = None
face_selection = None
fake_cam_image = None
# Last frame returned by on_stream_swap_cam().
current_cam_image = None
# Busy flag used by on_stream_swap_cam() to skip frames while a swap is running.
cam_swapping = False
camthread = None
# Index of the target file currently shown in the preview.
selected_preview_index = 0
# True while start_swap() is running the batch; preview handlers return early then.
is_processing = False
# One ProcessEntry per target file (filename, startframe, endframe, fps).
list_files_process : list[ProcessEntry] = []
def prepare_environment():
    """Create the output and temp folders below the current working directory.

    Stores the absolute output folder in ``roop.globals.output_path`` and
    points the ``TEMP``, ``TMP`` and ``GRADIO_TEMP_DIR`` environment variables
    at the temp folder.
    """
    output_dir = os.path.abspath(os.path.join(os.getcwd(), "output"))
    roop.globals.output_path = output_dir
    os.makedirs(output_dir, exist_ok=True)

    temp_dir = os.path.abspath(os.path.join(os.getcwd(), "temp"))
    os.environ["TEMP"] = temp_dir
    os.environ["TMP"] = temp_dir
    os.makedirs(temp_dir, exist_ok=True)
    os.environ["GRADIO_TEMP_DIR"] = temp_dir
def run():
# Builds the Gradio Blocks UI, wires all event handlers, launches the server and
# then waits until restart_server becomes True or the main thread is interrupted.
from roop.core import suggest_execution_providers, decode_execution_providers, set_display_ui
global input_faces, target_faces, face_selection, fake_cam_image, restart_server, live_cam_active, on_settings_changed
prepare_environment()
# Static choice lists used by the Settings tab widgets below.
available_themes = ["Default", "gradio/glass", "gradio/monochrome", "gradio/seafoam", "gradio/soft", "gstaff/xkcd", "freddyaboulton/dracula_revamped", "ysharma/steampunk"]
image_formats = ['jpg','png', 'webp']
video_formats = ['avi','mkv', 'mp4', 'webm']
video_codecs = ['libx264', 'libx265', 'libvpx-vp9', 'h264_nvenc', 'hevc_nvenc']
providerlist = suggest_execution_providers()
# NOTE(review): created once, outside the while loop below, so it is never
# emptied between UI rebuilds - confirm stale controls are harmless after a restart.
settings_controls = []
live_cam_active = roop.globals.CFG.live_cam_start_active
set_display_ui(show_msg)
roop.globals.execution_providers = decode_execution_providers([roop.globals.CFG.provider])
print(f'Using provider {roop.globals.execution_providers} - Device:{util.get_device()}')
run_server = True
mycss = """
span {color: var(--block-info-text-color)}
#fixedheight {
max-height: 238.4px;
overflow-y: auto !important;
}
"""
# Server loop: the UI is built and launched while run_server stays True.
while run_server:
# An empty server name and a non-positive port are both passed to launch() as None.
server_name = roop.globals.CFG.server_name
if server_name is None or len(server_name) < 1:
server_name = None
server_port = roop.globals.CFG.server_port
if server_port <= 0:
server_port = None
# ssl_verify is turned off only when the server name is exactly '0.0.0.0'.
ssl_verify = False if server_name == '0.0.0.0' else True
with gr.Blocks(title=f'{roop.metadata.name} {roop.metadata.version}', theme=roop.globals.CFG.selected_theme, css=mycss) as ui:
with gr.Row(variant='compact'):
gr.Markdown(f"### [{roop.metadata.name} {roop.metadata.version}](https://github.com/C0untFloyd/roop-unleashed)")
gr.HTML(util.create_version_html(), elem_id="versions")
with gr.Tab("🎭 Face Swap"):
with gr.Row(variant='panel'):
with gr.Column(scale=2):
with gr.Row():
with gr.Column(min_width=160):
input_faces = gr.Gallery(label="Input faces", allow_preview=True, preview=True, height=128, object_fit="scale-down")
mask_top = gr.Slider(0, 256, value=0, label="Offset Face Top", step=1.0, interactive=True)
bt_remove_selected_input_face = gr.Button("❌ Remove selected", size='sm')
bt_clear_input_faces = gr.Button("πŸ’₯ Clear all", variant='stop', size='sm')
with gr.Column(min_width=160):
target_faces = gr.Gallery(label="Target faces", allow_preview=True, preview=True, height=128, object_fit="scale-down")
bt_remove_selected_target_face = gr.Button("❌ Remove selected", size='sm')
bt_add_local = gr.Button('Add local files from', size='sm')
local_folder = gr.Textbox(show_label=False, placeholder="/content/", interactive=True)
with gr.Row(variant='panel'):
bt_srcimg = gr.Image(label='Source Face Image', type='filepath', tool=None, height=233)
bt_destfiles = gr.Files(label='Target File(s)', file_count="multiple", elem_id='filelist', height=233)
with gr.Row(variant='panel'):
gr.Markdown('')
forced_fps = gr.Slider(minimum=0, maximum=120, value=0, label="Video FPS", info='Overrides detected fps if not 0', step=1.0, interactive=True, container=True)
with gr.Column(scale=2):
previewimage = gr.Image(label="Preview Image", height=576, interactive=False)
with gr.Row(variant='panel'):
fake_preview = gr.Checkbox(label="Face swap frames", value=False)
bt_refresh_preview = gr.Button("πŸ”„ Refresh", variant='secondary', size='sm')
bt_use_face_from_preview = gr.Button("Use Face from this Frame", variant='primary', size='sm')
with gr.Row():
preview_frame_num = gr.Slider(0, 0, value=0, label="Frame Number", step=1.0, interactive=True)
with gr.Row():
text_frame_clip = gr.Markdown('Processing frame range [0 - 0]')
# on_set_frame() receives these button labels and checks whether they end with 'start'.
set_frame_start = gr.Button("β¬… Set as Start", size='sm')
set_frame_end = gr.Button("➑ Set as End", size='sm')
# Hidden row shown by the face handlers when more than one face was detected.
with gr.Row(visible=False) as dynamic_face_selection:
with gr.Column(scale=2):
face_selection = gr.Gallery(label="Detected faces", allow_preview=True, preview=True, height=256, object_fit="scale-down")
with gr.Column():
bt_faceselect = gr.Button("β˜‘ Use selected face", size='sm')
bt_cancelfaceselect = gr.Button("Done", size='sm')
with gr.Column():
gr.Markdown(' ')
with gr.Row(variant='panel'):
with gr.Column(scale=1):
selected_face_detection = gr.Dropdown(["First found", "All faces", "Selected face", "All female", "All male"], value="First found", label="Select face selection for swapping")
max_face_distance = gr.Slider(0.01, 1.0, value=0.65, label="Max Face Similarity Threshold")
# NOTE(review): the default "In-Memory" is not one of the listed choices, while
# start_swap() compares the submitted value against exactly "In-Memory" - confirm.
video_swapping_method = gr.Dropdown(["Extract Frames to media","In-Memory processing"], value="In-Memory", label="Select video processing method", interactive=True)
# These two globals hold the Checkbox components here; they are passed as inputs to start_swap().
roop.globals.keep_frames = gr.Checkbox(label="Keep Frames (relevant only when extracting frames)", value=False)
roop.globals.skip_audio = gr.Checkbox(label="Skip audio", value=False)
with gr.Column(scale=1):
selected_enhancer = gr.Dropdown(["None", "Codeformer", "DMDNet", "GFPGAN"], value="None", label="Select post-processing")
blend_ratio = gr.Slider(0.0, 1.0, value=0.65, label="Original/Enhanced image blend ratio")
with gr.Column(scale=1):
chk_useclip = gr.Checkbox(label="Use Text Masking", value=False)
clip_text = gr.Textbox(label="List of objects to mask and restore back on fake image", placeholder="cup,hands,hair,banana" ,elem_id='tooltip')
gr.Dropdown(["Clip2Seg"], value="Clip2Seg", label="Engine")
bt_preview_mask = gr.Button("πŸ‘₯ Show Mask Preview", variant='secondary')
with gr.Row(variant='panel'):
with gr.Column():
bt_start = gr.Button("β–Ά Start", variant='primary')
gr.Button("πŸ‘€ Open Output Folder", size='sm').click(fn=lambda: util.open_folder(roop.globals.output_path))
with gr.Column():
bt_stop = gr.Button("⏹ Stop", variant='secondary')
with gr.Column(scale=2):
gr.Markdown(' ')
with gr.Row(variant='panel'):
with gr.Column():
resultfiles = gr.Files(label='Processed File(s)', interactive=False)
with gr.Column():
resultimage = gr.Image(type='filepath', label='Final Image', interactive=False, )
with gr.Tab("πŸŽ₯ Live Cam"):
with gr.Row():
with gr.Column(scale=2):
cam_toggle = gr.Checkbox(label='Activate', value=live_cam_active)
with gr.Column(scale=1):
vcam_toggle = gr.Checkbox(label='Stream to virtual camera', value=False)
with gr.Column(scale=1):
camera_num = gr.Slider(0, 2, value=0, label="Camera Number", step=1.0, interactive=True)
# The webcam widgets are only created when live cam is active at build time.
if live_cam_active:
with gr.Row():
with gr.Column():
cam = gr.Webcam(label='Camera', source='webcam', mirror_webcam=True, interactive=True, streaming=False)
with gr.Column():
fake_cam_image = gr.Image(label='Fake Camera Output', interactive=False)
with gr.Tab("πŸŽ‰ Extras"):
with gr.Row():
files_to_process = gr.Files(label='File(s) to process', file_count="multiple")
# with gr.Row(variant='panel'):
# with gr.Accordion(label="Post process", open=False):
# with gr.Column():
# selected_post_enhancer = gr.Dropdown(["None", "Codeformer", "GFPGAN"], value="None", label="Select post-processing")
# with gr.Column():
# gr.Button("Start").click(fn=lambda: gr.Info('Not yet implemented...'))
with gr.Row(variant='panel'):
with gr.Accordion(label="Video/GIF", open=False):
with gr.Row(variant='panel'):
with gr.Column():
gr.Markdown("""
# Cut video
Be aware that this means re-encoding the video which might take a longer time.
Encoding uses your configuration from the Settings Tab.
""")
with gr.Column():
cut_start_time = gr.Slider(0, 1000000, value=0, label="Start Frame", step=1.0, interactive=True)
with gr.Column():
cut_end_time = gr.Slider(1, 1000000, value=1, label="End Frame", step=1.0, interactive=True)
with gr.Column():
start_cut_video = gr.Button("Start")
# with gr.Row(variant='panel'):
# with gr.Column():
# gr.Markdown("""
# # Join videos
# This also re-encodes the videos like cutting above.
# """)
# with gr.Column():
# start_join_videos = gr.Button("Start")
with gr.Row(variant='panel'):
gr.Markdown("Extract frames from video")
start_extract_frames = gr.Button("Start")
with gr.Row(variant='panel'):
gr.Markdown("Create video from image files")
gr.Button("Start").click(fn=lambda: gr.Info('Not yet implemented...'))
with gr.Row(variant='panel'):
gr.Markdown("Create GIF from video")
start_create_gif = gr.Button("Create GIF")
with gr.Row():
extra_files_output = gr.Files(label='Resulting output files', file_count="multiple")
with gr.Tab("βš™ Settings"):
with gr.Row():
with gr.Column():
themes = gr.Dropdown(available_themes, label="Theme", info="Change needs complete restart", value=roop.globals.CFG.selected_theme)
with gr.Column():
# Controls appended to settings_controls use their elem_id as the CFG attribute
# name (see on_settings_changed()).
settings_controls.append(gr.Checkbox(label="Public Server", value=roop.globals.CFG.server_share, elem_id='server_share', interactive=True))
settings_controls.append(gr.Checkbox(label='Clear output folder before each run', value=roop.globals.CFG.clear_output, elem_id='clear_output', interactive=True))
output_template = gr.Textbox(label="Filename Output Template", info="(file extension is added automatically)", lines=1, placeholder='{file}_{time}', value=roop.globals.CFG.output_template)
with gr.Column():
input_server_name = gr.Textbox(label="Server Name", lines=1, info="Leave blank to run locally", value=roop.globals.CFG.server_name)
with gr.Column():
input_server_port = gr.Number(label="Server Port", precision=0, info="Leave at 0 to use default", value=roop.globals.CFG.server_port)
with gr.Row():
with gr.Column():
settings_controls.append(gr.Dropdown(providerlist, label="Provider", value=roop.globals.CFG.provider, elem_id='provider', interactive=True))
chk_det_size = gr.Checkbox(label="Use default Det-Size", value=True, elem_id='default_det_size', interactive=True)
settings_controls.append(gr.Checkbox(label="Force CPU for Face Analyser", value=roop.globals.CFG.force_cpu, elem_id='force_cpu', interactive=True))
max_threads = gr.Slider(1, 32, value=roop.globals.CFG.max_threads, label="Max. Number of Threads", info='default: 3', step=1.0, interactive=True)
with gr.Column():
memory_limit = gr.Slider(0, 128, value=roop.globals.CFG.memory_limit, label="Max. Memory to use (Gb)", info='0 meaning no limit', step=1.0, interactive=True)
settings_controls.append(gr.Dropdown(image_formats, label="Image Output Format", info='default: png', value=roop.globals.CFG.output_image_format, elem_id='output_image_format', interactive=True))
with gr.Column():
settings_controls.append(gr.Dropdown(video_codecs, label="Video Codec", info='default: libx264', value=roop.globals.CFG.output_video_codec, elem_id='output_video_codec', interactive=True))
settings_controls.append(gr.Dropdown(video_formats, label="Video Output Format", info='default: mp4', value=roop.globals.CFG.output_video_format, elem_id='output_video_format', interactive=True))
video_quality = gr.Slider(0, 100, value=roop.globals.CFG.video_quality, label="Video Quality (crf)", info='default: 14', step=1.0, interactive=True)
with gr.Column():
button_apply_restart = gr.Button("Restart Server", variant='primary')
settings_controls.append(gr.Checkbox(label='Start with active live cam', value=roop.globals.CFG.live_cam_start_active, elem_id='live_cam_start_active', interactive=True))
button_clean_temp = gr.Button("Clean temp folder")
button_apply_settings = gr.Button("Apply Settings")
# Event wiring. previewinputs matches the parameter order of on_preview_frame_changed().
previewinputs = [preview_frame_num, bt_destfiles, fake_preview, selected_enhancer, selected_face_detection,
max_face_distance, blend_ratio, chk_useclip, clip_text]
input_faces.select(on_select_input_face, None, None).then(fn=on_preview_frame_changed, inputs=previewinputs, outputs=[previewimage, mask_top])
bt_remove_selected_input_face.click(fn=remove_selected_input_face, outputs=[input_faces])
bt_srcimg.change(fn=on_srcimg_changed, show_progress='full', inputs=bt_srcimg, outputs=[dynamic_face_selection, face_selection, input_faces])
mask_top.input(fn=on_mask_top_changed, inputs=[mask_top], show_progress='hidden')
target_faces.select(on_select_target_face, None, None)
bt_remove_selected_target_face.click(fn=remove_selected_target_face, outputs=[target_faces])
forced_fps.change(fn=on_fps_changed, inputs=[forced_fps], show_progress='hidden')
bt_destfiles.change(fn=on_destfiles_changed, inputs=[bt_destfiles], outputs=[preview_frame_num, text_frame_clip], show_progress='hidden').then(fn=on_preview_frame_changed, inputs=previewinputs, outputs=[previewimage, mask_top], show_progress='full')
bt_destfiles.select(fn=on_destfiles_selected, outputs=[preview_frame_num, text_frame_clip, forced_fps], show_progress='hidden').then(fn=on_preview_frame_changed, inputs=previewinputs, outputs=[previewimage, mask_top], show_progress='hidden')
bt_destfiles.clear(fn=on_clear_destfiles, outputs=[target_faces])
resultfiles.select(fn=on_resultfiles_selected, inputs=[resultfiles], outputs=[resultimage])
face_selection.select(on_select_face, None, None)
bt_faceselect.click(fn=on_selected_face, outputs=[input_faces, target_faces, selected_face_detection])
bt_cancelfaceselect.click(fn=on_end_face_selection, outputs=[dynamic_face_selection, face_selection])
bt_clear_input_faces.click(fn=on_clear_input_faces, outputs=[input_faces])
chk_det_size.select(fn=on_option_changed)
bt_add_local.click(fn=on_add_local_folder, inputs=[local_folder], outputs=[bt_destfiles])
bt_preview_mask.click(fn=on_preview_mask, inputs=[preview_frame_num, bt_destfiles, clip_text], outputs=[previewimage])
# The start event handle is kept so that the stop button can cancel it.
start_event = bt_start.click(fn=start_swap,
inputs=[selected_enhancer, selected_face_detection, roop.globals.keep_frames,
roop.globals.skip_audio, max_face_distance, blend_ratio, chk_useclip, clip_text,video_swapping_method],
outputs=[bt_start, resultfiles]).then(fn=on_resultfiles_finished, inputs=[resultfiles], outputs=[resultimage])
bt_stop.click(fn=stop_swap, cancels=[start_event])
bt_refresh_preview.click(fn=on_preview_frame_changed, inputs=previewinputs, outputs=[previewimage, mask_top])
fake_preview.change(fn=on_preview_frame_changed, inputs=previewinputs, outputs=[previewimage, mask_top])
preview_frame_num.change(fn=on_preview_frame_changed, inputs=previewinputs, outputs=[previewimage, mask_top], show_progress='hidden')
bt_use_face_from_preview.click(fn=on_use_face_from_selected, show_progress='full', inputs=[bt_destfiles, preview_frame_num], outputs=[dynamic_face_selection, face_selection, target_faces, selected_face_detection])
set_frame_start.click(fn=on_set_frame, inputs=[set_frame_start, preview_frame_num], outputs=[text_frame_clip])
set_frame_end.click(fn=on_set_frame, inputs=[set_frame_end, preview_frame_num], outputs=[text_frame_clip])
# Live Cam
cam_toggle.change(fn=on_cam_toggle, inputs=[cam_toggle])
if live_cam_active:
vcam_toggle.change(fn=on_vcam_toggle, inputs=[vcam_toggle, camera_num], outputs=[cam, fake_cam_image])
cam.stream(on_stream_swap_cam, inputs=[cam, selected_enhancer, blend_ratio], outputs=[fake_cam_image], preprocess=True, postprocess=True, show_progress="hidden")
# Extras
start_cut_video.click(fn=on_cut_video, inputs=[files_to_process, cut_start_time, cut_end_time], outputs=[extra_files_output])
# start_join_videos.click(fn=on_join_videos, inputs=[files_to_process], outputs=[extra_files_output])
start_extract_frames.click(fn=on_extract_frames, inputs=[files_to_process], outputs=[extra_files_output])
start_create_gif.click(fn=on_create_gif, inputs=[files_to_process], outputs=[extra_files_output])
# Settings
for s in settings_controls:
s.select(fn=on_settings_changed)
# The sliders pass their CFG attribute name through the lambda's default argument.
max_threads.input(fn=lambda a,b='max_threads':on_settings_changed_misc(a,b), inputs=[max_threads])
memory_limit.input(fn=lambda a,b='memory_limit':on_settings_changed_misc(a,b), inputs=[memory_limit])
video_quality.input(fn=lambda a,b='video_quality':on_settings_changed_misc(a,b), inputs=[video_quality])
button_clean_temp.click(fn=clean_temp, outputs=[bt_srcimg, input_faces, target_faces, bt_destfiles])
button_apply_settings.click(apply_settings, inputs=[themes, input_server_name, input_server_port, output_template])
button_apply_restart.click(restart)
restart_server = False
# prevent_thread_lock=True makes launch() return, so this thread can poll restart_server below.
try:
ui.queue().launch(inbrowser=True, server_name=server_name, server_port=server_port, share=roop.globals.CFG.server_share, ssl_verify=ssl_verify, prevent_thread_lock=True, show_error=True)
# NOTE(review): bare except - any launch failure is swallowed without a message;
# restart_server=True then skips the wait loop and run_server=False ends the outer loop.
except:
restart_server = True
run_server = False
# Idle until a handler sets restart_server (restart(), on_cam_toggle()).
try:
while restart_server == False:
time.sleep(1.0)
except (KeyboardInterrupt, OSError):
print("Keyboard interruption in main thread... closing server.")
run_server = False
ui.close()
def on_mask_top_changed(mask_top):
    """Store the new top-mask offset on the currently selected input face.

    Does nothing when the selected index does not address an existing entry
    of ``roop.globals.INPUT_FACES``.
    """
    faces = roop.globals.INPUT_FACES
    if SELECTED_INPUT_FACE_INDEX >= len(faces):
        return
    faces[SELECTED_INPUT_FACE_INDEX].mask_top = mask_top
def on_option_changed(evt: gr.SelectData):
    """Copy a checkbox/dropdown change onto the matching ``roop.globals`` attribute.

    The attribute name is the ``elem_id`` of the component that fired the
    event. Checkboxes supply ``evt.selected``, dropdowns supply ``evt.value``.

    Raises:
        gr.Error: if the component type is not handled or ``roop.globals``
            has no attribute with that name.
    """
    component = evt.target
    attribname = component.elem_id

    if isinstance(component, gr.Checkbox):
        source_field = 'selected'
    elif isinstance(component, gr.Dropdown):
        source_field = 'value'
    else:
        source_field = None

    if source_field is not None and hasattr(roop.globals, attribname):
        setattr(roop.globals, attribname, getattr(evt, source_field))
        return

    raise gr.Error(f'Unhandled Setting for {evt.target}')
def on_settings_changed_misc(new_val, attribname):
    """Assign ``new_val`` to the ``roop.globals.CFG`` attribute named ``attribname``.

    Unknown attribute names are only reported on stdout; nothing is created.
    """
    config = roop.globals.CFG
    if not hasattr(config, attribname):
        print("Didn't find attrib!")
        return
    setattr(config, attribname, new_val)
def on_settings_changed(evt: gr.SelectData):
    """Copy a checkbox/dropdown change onto the matching ``roop.globals.CFG`` attribute.

    The attribute name is the ``elem_id`` of the component that fired the
    event. Checkboxes supply ``evt.selected``, dropdowns supply ``evt.value``.

    Raises:
        gr.Error: if the component type is not handled or the configuration
            has no attribute with that name.
    """
    component = evt.target
    attribname = component.elem_id

    if isinstance(component, gr.Checkbox):
        source_field = 'selected'
    elif isinstance(component, gr.Dropdown):
        source_field = 'value'
    else:
        source_field = None

    if source_field is not None and hasattr(roop.globals.CFG, attribname):
        setattr(roop.globals.CFG, attribname, getattr(evt, source_field))
        return

    raise gr.Error(f'Unhandled Setting for {evt.target}')
def on_add_local_folder(folder):
    """Return the files ``util.get_local_files_from_folder`` finds in ``folder``.

    Shows a warning when the helper returns ``None``; the (possibly ``None``)
    result is returned unchanged either way.
    """
    found = util.get_local_files_from_folder(folder)
    if found is not None:
        return found
    gr.Warning("Empty folder or folder not found!")
    return found
def on_srcimg_changed(imgsrc, progress=gr.Progress()):
    """Extract the faces of a newly chosen source image.

    Args:
        imgsrc: Path of the source image, or ``None`` when it was cleared.
        progress: Gradio progress tracker.

    Returns:
        A 3-tuple of updates for (face selection container, detected-faces
        gallery, input-faces gallery). With exactly one detected face it is
        added to the input faces directly; with several, the selection
        gallery is shown so the user can pick.

    Raises:
        gr.Error: if no face was found (this includes paths that
            ``util.is_image`` rejects).
    """
    global RECENT_DIRECTORY_SOURCE, SELECTION_FACES_DATA, IS_INPUT, input_thumbs, last_image

    IS_INPUT = True

    # Ignore a cleared image and repeated events for the image already handled.
    if imgsrc is None or last_image == imgsrc:
        return gr.Column.update(visible=False), None, input_thumbs

    last_image = imgsrc
    progress(0, desc="Retrieving faces from image")
    thumbs = []
    if util.is_image(imgsrc):
        roop.globals.source_path = imgsrc
        RECENT_DIRECTORY_SOURCE = os.path.dirname(imgsrc)
        SELECTION_FACES_DATA = extract_face_images(imgsrc, (False, 0))
        progress(0.5, desc="Retrieving faces from image")
        # Each entry is indexed as [0] = face object, [1] = face image.
        thumbs = [convert_to_gradio(entry[1]) for entry in SELECTION_FACES_DATA]

    progress(1.0, desc="Retrieving faces from image")
    if not thumbs:
        raise gr.Error('No faces detected!')

    if len(thumbs) == 1:
        face = SELECTION_FACES_DATA[0][0]
        face.mask_top = 0
        roop.globals.INPUT_FACES.append(face)
        input_thumbs.append(thumbs[0])
        return gr.Column.update(visible=False), None, input_thumbs

    return gr.Column.update(visible=True), thumbs, gr.Gallery.update(visible=True)
def on_select_input_face(evt: gr.SelectData):
    """Remember which entry of the input-faces gallery was clicked."""
    global SELECTED_INPUT_FACE_INDEX

    clicked_index = evt.index
    SELECTED_INPUT_FACE_INDEX = clicked_index
def remove_selected_input_face():
    """Drop the selected input face and its thumbnail.

    Each list is only touched when the selected index addresses an existing
    entry. Returns the (module-level) thumbnail list for the gallery.
    """
    global input_thumbs, SELECTED_INPUT_FACE_INDEX

    position = SELECTED_INPUT_FACE_INDEX
    if position < len(roop.globals.INPUT_FACES):
        roop.globals.INPUT_FACES.pop(position)
    if position < len(input_thumbs):
        input_thumbs.pop(position)
    return input_thumbs
def on_select_target_face(evt: gr.SelectData):
    """Remember which entry of the target-faces gallery was clicked."""
    global SELECTED_TARGET_FACE_INDEX

    clicked_index = evt.index
    SELECTED_TARGET_FACE_INDEX = clicked_index
def remove_selected_target_face():
    """Drop the selected target face and its thumbnail.

    Each list is only touched when the selected index addresses an existing
    entry. Returns the (module-level) thumbnail list for the gallery.
    """
    global target_thumbs, SELECTED_TARGET_FACE_INDEX

    position = SELECTED_TARGET_FACE_INDEX
    if position < len(roop.globals.TARGET_FACES):
        roop.globals.TARGET_FACES.pop(position)
    if position < len(target_thumbs):
        target_thumbs.pop(position)
    return target_thumbs
def on_use_face_from_selected(files, frame_num):
    """Extract target faces from the file/frame currently shown in the preview.

    Args:
        files: Value of the target Files component (objects with ``.name``).
        frame_num: Frame to analyse when the file is a video or GIF.

    Returns:
        A 4-tuple of updates for (face selection row, detected-faces gallery,
        target-faces gallery, face detection dropdown). With exactly one
        detected face it is added to the target faces directly and the
        dropdown switches to 'Selected face'.
    """
    global IS_INPUT, SELECTION_FACES_DATA

    IS_INPUT = False
    thumbs = []

    # Without a previewed file there is nothing to analyse; previously this
    # crashed with a TypeError/IndexError.
    if files is None or selected_preview_index >= len(files):
        gr.Info('No faces detected!')
        return gr.Row.update(visible=False), None, target_thumbs, gr.Dropdown.update(visible=True)

    target = files[selected_preview_index].name
    roop.globals.target_path = target
    is_gif = target.lower().endswith('gif')

    # Still images are read directly, videos and GIFs at the chosen frame.
    if util.is_image(target) and not is_gif:
        frame_spec = (False, 0)
    elif util.is_video(target) or is_gif:
        frame_spec = (True, frame_num)
    else:
        frame_spec = None

    if frame_spec is not None:
        SELECTION_FACES_DATA = extract_face_images(target, frame_spec)
        if len(SELECTION_FACES_DATA) > 0:
            # Each entry is indexed as [0] = face object, [1] = face image.
            thumbs = [convert_to_gradio(entry[1]) for entry in SELECTION_FACES_DATA]
        else:
            gr.Info('No faces detected!')
            roop.globals.target_path = None

    if len(thumbs) == 1:
        roop.globals.TARGET_FACES.append(SELECTION_FACES_DATA[0][0])
        target_thumbs.append(thumbs[0])
        return gr.Row.update(visible=False), None, target_thumbs, gr.Dropdown.update(value='Selected face')

    return gr.Row.update(visible=True), thumbs, gr.Gallery.update(visible=True), gr.Dropdown.update(visible=True)
def on_select_face(evt: gr.SelectData):  # SelectData is a subclass of EventData
    """Remember which entry of the detected-faces gallery was clicked."""
    global SELECTED_FACE_INDEX

    clicked_index = evt.index
    SELECTED_FACE_INDEX = clicked_index
def on_selected_face():
    """Add the face picked in the detected-faces gallery to the active list.

    Depending on ``IS_INPUT`` the face goes to the input or to the target
    faces.

    Returns:
        A 3-tuple of updates for (input-faces gallery, target-faces gallery,
        face detection dropdown).
    """
    global IS_INPUT, SELECTED_FACE_INDEX, SELECTION_FACES_DATA, input_thumbs, target_thumbs

    # The stored index can be stale (left over from an earlier detection with
    # more faces) or no detection may have run yet; indexing would raise.
    if SELECTION_FACES_DATA is None or SELECTED_FACE_INDEX >= len(SELECTION_FACES_DATA):
        gr.Warning('No face selected!')
        return gr.Gallery.update(visible=True), gr.Gallery.update(visible=True), gr.Dropdown.update(visible=True)

    # Entries are indexed as [0] = face object, [1] = face image.
    face, face_image = SELECTION_FACES_DATA[SELECTED_FACE_INDEX][:2]
    thumbnail = convert_to_gradio(face_image)

    if IS_INPUT:
        face.mask_top = 0
        roop.globals.INPUT_FACES.append(face)
        input_thumbs.append(thumbnail)
        return input_thumbs, gr.Gallery.update(visible=True), gr.Dropdown.update(visible=True)

    roop.globals.TARGET_FACES.append(face)
    target_thumbs.append(thumbnail)
    return gr.Gallery.update(visible=True), target_thumbs, gr.Dropdown.update(value='Selected face')
# bt_faceselect.click(fn=on_selected_face, outputs=[dynamic_face_selection, face_selection, input_faces, target_faces])
def on_end_face_selection():
    """Hide the face selection container and empty its gallery."""
    hide_container = gr.Column.update(visible=False)
    return hide_container, None
def on_preview_frame_changed(frame_num, files, fake_preview, enhancer, detection, face_distance, blend_ratio, use_clip, clip_text):
    """Render the preview image for the selected target file and frame.

    Args:
        frame_num: Frame to show when the file is a video or GIF.
        files: Value of the target Files component (objects with ``.name``).
        fake_preview: When true and input faces exist, the frame is swapped.
        enhancer: Selected post-processing name.
        detection: Face selection dropdown text (see ``translate_swap_mode``).
        face_distance: Similarity threshold.
        blend_ratio: Original/enhanced blend ratio.
        use_clip: Whether text masking is requested.
        clip_text: Text masking prompt; may be ``None`` or empty.

    Returns:
        ``(image or None, mask_top)`` where ``mask_top`` is the offset stored
        on the selected input face (0 when there is none).
    """
    global SELECTED_INPUT_FACE_INDEX, is_processing
    from roop.core import live_swap

    mask_top = 0
    if len(roop.globals.INPUT_FACES) > SELECTED_INPUT_FACE_INDEX:
        selected_face = roop.globals.INPUT_FACES[SELECTED_INPUT_FACE_INDEX]
        if hasattr(selected_face, 'mask_top'):
            mask_top = selected_face.mask_top
        else:
            selected_face.mask_top = mask_top

    if is_processing or files is None or selected_preview_index >= len(files) or frame_num is None:
        return None, mask_top

    filename = files[selected_preview_index].name
    if util.is_video(filename) or filename.lower().endswith('gif'):
        current_frame = get_video_frame(filename, frame_num)
    else:
        current_frame = get_image_frame(filename)
    if current_frame is None:
        return None, mask_top

    time.sleep(0.2)
    if not fake_preview or len(roop.globals.INPUT_FACES) < 1:
        return convert_to_gradio(current_frame), mask_top

    roop.globals.face_swap_mode = translate_swap_mode(detection)
    roop.globals.selected_enhancer = enhancer
    roop.globals.distance_threshold = face_distance
    roop.globals.blend_ratio = blend_ratio

    # Text masking needs a prompt. The original condition parsed as
    # "(use_clip and clip_text is None) or len(clip_text) < 1" and therefore
    # called len(None) whenever masking was off and the prompt was None.
    if use_clip and not clip_text:
        use_clip = False

    roop.globals.execution_threads = roop.globals.CFG.max_threads
    current_frame = live_swap(current_frame, roop.globals.face_swap_mode, use_clip, clip_text, SELECTED_INPUT_FACE_INDEX)
    if current_frame is None:
        return None, mask_top
    return convert_to_gradio(current_frame), mask_top
def gen_processing_text(start, end):
    """Return the label text describing the frame range ``start`` to ``end``."""
    label = f'Processing frame range [{start} - {end}]'
    return label
def on_set_frame(sender:str, frame_num):
    """Set the start or end frame of the previewed file's processing range.

    Args:
        sender: Label of the button that fired the event; a label ending in
            'start' (case-insensitive) sets the start frame, anything else
            sets the end frame.
        frame_num: Frame currently shown in the preview.

    Returns:
        The frame-range text for the updated entry, or the ``[0 - 0]`` text
        when there is no entry or its end frame is 0.
    """
    global selected_preview_index, list_files_process

    idx = selected_preview_index
    # Clicking the buttons before any target file is registered used to raise
    # an IndexError.
    if idx >= len(list_files_process):
        return gen_processing_text(0, 0)

    entry = list_files_process[idx]
    if entry.endframe == 0:
        return gen_processing_text(0, 0)

    # Clamp so that the start never passes the end and vice versa.
    if sender.lower().endswith('start'):
        entry.startframe = min(frame_num, entry.endframe)
    else:
        entry.endframe = max(frame_num, entry.startframe)

    return gen_processing_text(entry.startframe, entry.endframe)
def on_preview_mask(frame_num, files, clip_text):
    """Render the text-mask preview for the selected target file and frame.

    Args:
        frame_num: Frame to use when the file is a video or GIF.
        files: Value of the target Files component (objects with ``.name``).
        clip_text: Text masking prompt handed to ``preview_mask``.

    Returns:
        The mask preview image, or ``None`` while processing is running, when
        no file is available or when the frame could not be read.
    """
    from roop.core import preview_mask
    global is_processing

    # Same guards as the regular preview; without them a click with no target
    # files raised a TypeError/IndexError.
    if is_processing or files is None or selected_preview_index >= len(files) or frame_num is None:
        return None

    filename = files[selected_preview_index].name
    if util.is_video(filename) or filename.lower().endswith('gif'):
        current_frame = get_video_frame(filename, frame_num)
    else:
        current_frame = get_image_frame(filename)
    if current_frame is None:
        return None

    current_frame = preview_mask(current_frame, clip_text)
    return convert_to_gradio(current_frame)
def on_clear_input_faces():
    """Empty the input faces and their thumbnails; return the thumbnail list."""
    global input_thumbs

    for collection in (input_thumbs, roop.globals.INPUT_FACES):
        collection.clear()
    return input_thumbs
def on_clear_destfiles():
    """Empty the target faces and their thumbnails; return the thumbnail list."""
    global target_thumbs

    for collection in (roop.globals.TARGET_FACES, target_thumbs):
        collection.clear()
    return target_thumbs
def translate_swap_mode(dropdown_text):
    """Map the face selection dropdown text to the internal swap mode name.

    Any text without an explicit mapping yields ``"all"``.
    """
    known_modes = {
        "Selected face": "selected",
        "First found": "first",
        "All female": "all_female",
        "All male": "all_male",
    }
    return known_modes.get(dropdown_text, "all")
def start_swap( enhancer, detection, keep_frames, skip_audio, face_distance, blend_ratio,
                use_clip, clip_text, processing_method, progress=gr.Progress(track_tqdm=False)):
    """Run the batch face swap over all registered target files.

    This is a generator: every ``yield`` delivers a
    ``(start button update, result files)`` pair to the UI.

    Args:
        enhancer: Selected post-processing name.
        detection: Face selection dropdown text (see ``translate_swap_mode``).
        keep_frames: Keep extracted frames.
        skip_audio: Skip the audio track.
        face_distance: Similarity threshold.
        blend_ratio: Original/enhanced blend ratio.
        use_clip: Whether text masking is requested.
        clip_text: Text masking prompt; may be ``None`` or empty.
        processing_method: Video processing dropdown text.
        progress: Gradio progress tracker handed to ``batch_process``.

    Raises:
        gr.Error: if 'Selected face' mode is chosen without any target face.
    """
    from roop.core import batch_process
    global is_processing, list_files_process

    # A plain "return value" inside a generator never reaches Gradio, so the
    # early exit has to yield its outputs.
    if not list_files_process:
        yield gr.Button.update(variant="primary"), None
        return

    if roop.globals.CFG.clear_output:
        shutil.rmtree(roop.globals.output_path)
    prepare_environment()

    roop.globals.selected_enhancer = enhancer
    roop.globals.target_path = None
    roop.globals.distance_threshold = face_distance
    roop.globals.blend_ratio = blend_ratio
    roop.globals.keep_frames = keep_frames
    roop.globals.skip_audio = skip_audio
    roop.globals.face_swap_mode = translate_swap_mode(detection)

    # Text masking needs a prompt. The original condition parsed as
    # "(use_clip and clip_text is None) or len(clip_text) < 1" and therefore
    # called len(None) whenever masking was off and the prompt was None.
    if use_clip and not clip_text:
        use_clip = False

    # gr.Error is an exception: it only reaches the user when raised.
    if roop.globals.face_swap_mode == 'selected' and len(roop.globals.TARGET_FACES) < 1:
        raise gr.Error('No Target Face selected!')

    # The dropdown offers "In-Memory processing" while its default value is
    # "In-Memory"; accept both spellings.
    in_memory = isinstance(processing_method, str) and processing_method.startswith("In-Memory")

    is_processing = True
    try:
        yield gr.Button.update(variant="secondary"), None
        roop.globals.execution_threads = roop.globals.CFG.max_threads
        roop.globals.video_encoder = roop.globals.CFG.output_video_codec
        roop.globals.video_quality = roop.globals.CFG.video_quality
        roop.globals.max_memory = roop.globals.CFG.memory_limit if roop.globals.CFG.memory_limit > 0 else None
        batch_process(list_files_process, use_clip, clip_text, in_memory, progress)
    finally:
        # Always release the flag, otherwise a failed or cancelled run would
        # leave the preview handlers disabled.
        is_processing = False

    outdir = pathlib.Path(roop.globals.output_path)
    outfiles = [item for item in outdir.rglob("*") if item.is_file()]
    if len(outfiles) > 0:
        yield gr.Button.update(variant="primary"),gr.Files.update(value=outfiles)
    else:
        yield gr.Button.update(variant="primary"),None
def stop_swap():
    """Clear the ``roop.globals.processing`` flag and tell the user to wait."""
    abort_notice = 'Aborting processing - please wait for the remaining threads to be stopped'
    roop.globals.processing = False
    gr.Info(abort_notice)
def on_fps_changed(fps):
    """Store the forced fps on the previewed file's entry.

    Nothing happens when no files are registered or the entry's end frame is
    below 1.
    """
    global selected_preview_index, list_files_process

    if len(list_files_process) < 1:
        return
    entry = list_files_process[selected_preview_index]
    if entry.endframe < 1:
        return
    entry.fps = fps
def on_destfiles_changed(destfiles):
    """Rebuild the processing list after the target files changed.

    Args:
        destfiles: Value of the target Files component (objects with
            ``.name``), or ``None``/empty when it was cleared.

    Returns:
        ``(frame slider update, frame-range text)`` for the first file.
    """
    global selected_preview_index, list_files_process

    if destfiles is None or len(destfiles) < 1:
        list_files_process.clear()
        return gr.Slider.update(value=0, maximum=0), ''

    # The handler receives the complete file list, so appending to the old
    # list duplicated entries and shifted them against the indices used for
    # the Files value. Rebuild in place, reusing entries of files that are
    # still present so their frame range and fps survive.
    known_entries = {entry.filename: entry for entry in list_files_process}
    list_files_process[:] = [
        known_entries.get(f.name) or ProcessEntry(f.name, 0, 0, 0)
        for f in destfiles
    ]

    selected_preview_index = 0
    entry = list_files_process[selected_preview_index]
    filename = entry.filename

    if util.is_video(filename) or filename.lower().endswith('gif'):
        total_frames = get_video_frame_total(filename)
    else:
        total_frames = 0

    # Only initialise the end frame; a reused entry keeps the range the user set.
    if entry.endframe == 0:
        entry.endframe = total_frames

    if total_frames > 0:
        return gr.Slider.update(value=entry.startframe, maximum=total_frames), gen_processing_text(entry.startframe, entry.endframe)
    return gr.Slider.update(value=0, maximum=total_frames), ''
def on_destfiles_selected(evt: gr.SelectData):
    """Switch the preview to the clicked target file.

    Returns:
        ``(frame slider update, frame-range text, fps)`` for the selected
        entry. For videos and GIFs an end frame of 0 is initialised to the
        total frame count.
    """
    global selected_preview_index, list_files_process

    if evt is not None:
        selected_preview_index = evt.index

    entry = list_files_process[selected_preview_index]
    filename = entry.filename
    fps = entry.fps

    total_frames = 0
    if util.is_video(filename) or filename.lower().endswith('gif'):
        total_frames = get_video_frame_total(filename)
        if entry.endframe == 0:
            entry.endframe = total_frames

    if total_frames <= 0:
        return gr.Slider.update(value=0, maximum=total_frames), gen_processing_text(0,0), fps

    slider = gr.Slider.update(value=entry.startframe, maximum=total_frames)
    return slider, gen_processing_text(entry.startframe, entry.endframe), fps
def on_resultfiles_selected(evt: gr.SelectData, files):
    """Return a preview image for the clicked result file.

    Videos and GIFs are previewed by their frame 0, other files are read as
    images.
    """
    filename = files[evt.index].name
    is_clip = util.is_video(filename) or filename.lower().endswith('gif')
    current_frame = get_video_frame(filename, 0) if is_clip else get_image_frame(filename)
    return convert_to_gradio(current_frame)
def on_resultfiles_finished(files):
    """Return a preview image for the first result file, or ``None`` without files.

    Videos and GIFs are previewed by their frame 0, other files are read as
    images.
    """
    if files is None or len(files) < 1:
        return None

    filename = files[0].name
    is_clip = util.is_video(filename) or filename.lower().endswith('gif')
    current_frame = get_video_frame(filename, 0) if is_clip else get_image_frame(filename)
    return convert_to_gradio(current_frame)
def on_cam_toggle(state):
    """Record the live-cam setting and request a server restart.

    Args:
        state: New value of the 'Activate' checkbox.
    """
    # The previous imports (Thread, virtualcamera, cam_active) and the
    # camthread global were never used here and have been dropped.
    global live_cam_active, restart_server

    live_cam_active = state
    gr.Warning('Server will be restarted for this change!')
    restart_server = True
def on_vcam_toggle(state, num):
    """Start or stop the virtual camera.

    Args:
        state: True to start streaming, False to stop.
        num: Camera number handed to ``start_virtual_cam``.

    Returns:
        ``(webcam update, None)``; the webcam is made non-interactive while
        the virtual camera runs.
    """
    from roop.virtualcam import stop_virtual_cam, start_virtual_cam

    if not state:
        stop_virtual_cam()
        return gr.Webcam.update(interactive=True, mirror_webcam=True), None

    start_virtual_cam(num)
    return gr.Webcam.update(interactive=False), None
def on_stream_swap_cam(camimage, enhancer, blend_ratio):
    """Swap faces on a streamed webcam frame.

    Args:
        camimage: Current webcam frame.
        enhancer: Selected post-processing name.
        blend_ratio: Original/enhanced blend ratio.

    Returns:
        The most recent output frame. While a previous swap is still running
        the incoming frame is skipped and the last result is returned again.
    """
    from roop.core import live_swap
    global current_cam_image, cam_swapping

    roop.globals.selected_enhancer = enhancer
    roop.globals.blend_ratio = blend_ratio

    if not cam_swapping:
        cam_swapping = True
        try:
            if len(roop.globals.INPUT_FACES) > 0:
                current_cam_image = live_swap(camimage, "all", False, None, SELECTED_INPUT_FACE_INDEX)
            else:
                current_cam_image = camimage
        finally:
            # Release the busy flag even when the swap raises; otherwise every
            # later frame would be skipped.
            cam_swapping = False
    return current_cam_image
def on_cut_video(files, cut_start_frame, cut_end_frame):
    """Cut every given video to the frame range and return the created files.

    Args:
        files: Value of the Files component (objects with ``.name``) or ``None``.
        cut_start_frame: First frame to keep.
        cut_end_frame: Last frame to keep.

    Returns:
        List of the output files that exist after cutting, or ``None`` when
        ``files`` is ``None``.
    """
    if files is None:
        return None

    resultfiles = []
    for tf in files:
        source = tf.name
        destfile = util.get_destfilename_from_path(source, roop.globals.output_path, '_cut')
        util.cut_video(source, destfile, cut_start_frame, cut_end_frame)
        if os.path.isfile(destfile):
            resultfiles.append(destfile)
        else:
            # gr.Error is an exception and was only constructed here, which
            # showed nothing. A warning reports the failure and still lets
            # the remaining files be processed.
            gr.Warning('Cutting video failed!')
    return resultfiles
def on_join_videos(files):
    """Join the given videos into one file named after the first input.

    Args:
        files: Value of the Files component (objects with ``.name``) or ``None``.

    Returns:
        A list holding the joined file when it exists (empty otherwise), or
        ``None`` when no files were given.
    """
    # An empty list previously crashed on filenames[0].
    if not files:
        return None

    filenames = [f.name for f in files]
    destfile = util.get_destfilename_from_path(filenames[0], roop.globals.output_path, '_join')
    util.join_videos(filenames, destfile)

    resultfiles = []
    if os.path.isfile(destfile):
        resultfiles.append(destfile)
    else:
        # gr.Error is an exception and was only constructed here, which showed
        # nothing; a warning actually reaches the user.
        gr.Warning('Joining videos failed!')
    return resultfiles
def on_extract_frames(files):
    """Extract the frames of every given video and list the resulting files.

    Returns:
        List of the regular files found in each folder returned by
        ``util.extract_frames``, or ``None`` when ``files`` is ``None``.
    """
    if files is None:
        return None

    resultfiles = []
    for tf in files:
        resfolder = util.extract_frames(tf.name)
        candidates = (os.path.join(resfolder, entry) for entry in os.listdir(resfolder))
        resultfiles.extend(path for path in candidates if os.path.isfile(path))
    return resultfiles
def on_create_gif(files):
    """Create a GIF from every given video.

    Args:
        files: Value of the Files component (objects with ``.name``) or ``None``.

    Returns:
        List of the created GIF files, or ``None`` when ``files`` is ``None``.
        Previously only the last GIF was returned and an empty list raised an
        UnboundLocalError.
    """
    if files is None:
        return None

    resultfiles = []
    for tf in files:
        source = tf.name
        # Use the configured output folder like the other Extras handlers
        # instead of a path relative to the current working directory.
        gifname = util.get_destfilename_from_path(source, roop.globals.output_path, '.gif')
        util.create_gif_from_video(source, gifname)
        if os.path.isfile(gifname):
            resultfiles.append(gifname)
        else:
            gr.Warning('Creating GIF failed!')
    return resultfiles
def clean_temp():
    """Delete the temp folder and reset all face selections.

    Returns:
        Four ``None`` values clearing the source image, both face galleries
        and the target files.
    """
    global input_thumbs, target_thumbs, last_image

    temp_dir = os.environ["TEMP"]
    # A missing folder (e.g. removed by hand) must not abort the clean-up;
    # prepare_environment() recreates it either way.
    if os.path.isdir(temp_dir):
        shutil.rmtree(temp_dir)
    prepare_environment()

    input_thumbs.clear()
    roop.globals.INPUT_FACES.clear()
    roop.globals.TARGET_FACES.clear()
    target_thumbs.clear()
    # Forget the last source image, otherwise selecting the same image again
    # after the clean-up would be ignored by on_srcimg_changed().
    last_image = None

    gr.Info('Temp Files removed')
    return None,None,None,None
def apply_settings(themes, input_server_name, input_server_port, output_template):
    """Copy the Settings tab values into the configuration and save it.

    Args:
        themes: Selected theme name.
        input_server_name: Server name text.
        input_server_port: Server port number.
        output_template: Output filename template.
    """
    config = roop.globals.CFG
    config.selected_theme = themes
    config.server_name = input_server_name
    config.server_port = input_server_port
    config.output_template = output_template
    config.save()
    show_msg('Settings saved')
def restart():
    """Request a server restart by raising the module-level ``restart_server`` flag."""
    global restart_server

    restart_requested = True
    restart_server = restart_requested
def show_msg(msg: str):
    """Show ``msg`` to the user as a Gradio info notification."""
    text = msg
    gr.Info(text)
# Gradio wants Images in RGB
def convert_to_gradio(image):
    """Convert a BGR image to RGB for display; ``None`` is passed through."""
    if image is not None:
        return cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
    return None