# coding: utf-8

"""
All configs for user
"""

from dataclasses import dataclass
import tyro
from typing_extensions import Annotated
from typing import Optional, Literal

from .base_config import PrintableConfig, make_abs_path


@dataclass(repr=False)  # use repr from PrintableConfig
class ArgumentConfig(PrintableConfig):
    ########## input arguments ##########
    source: Annotated[str, tyro.conf.arg(aliases=["-s"])] = make_abs_path('../../assets/examples/source/s0.jpg')  # path to the source portrait (human/animal) or video (human)
    driving: Annotated[str, tyro.conf.arg(aliases=["-d"])] = make_abs_path('../../assets/examples/driving/d0.mp4')  # path to the driving video or template (.pkl format)
    output_dir: Annotated[str, tyro.conf.arg(aliases=["-o"])] = 'animations/'  # directory to save the output video

    ########## inference arguments ##########
    flag_use_half_precision: bool = True  # whether to use half precision (FP16); if black boxes appear, it may be due to GPU incompatibility, so set this to False
    flag_crop_driving_video: bool = False  # whether to crop the driving video, if the given driving info is a video
    device_id: int = 0  # gpu device id
    flag_force_cpu: bool = False  # force cpu inference, WIP!
    flag_normalize_lip: bool = False  # whether to set the lips to the closed state before animation; only takes effect when flag_eye_retargeting and flag_lip_retargeting are False
    flag_source_video_eye_retargeting: bool = False  # when the input is a source video, whether to make the eye-open scalar of each frame match the first source frame before animation; only takes effect when flag_eye_retargeting and flag_lip_retargeting are False, and may cause inter-frame jitter
    flag_eye_retargeting: bool = False  # not recommended to be True, WIP; whether to transfer the eyes-open ratio of each driving frame to the source image or the corresponding source frame
    flag_lip_retargeting: bool = False  # not recommended to be True, WIP; whether to transfer the lip-open ratio of each driving frame to the source image or the corresponding source frame
    flag_stitching: bool = True  # recommended True if head movement is small; set to False if head movement is large or the source image is an animal
    flag_relative_motion: bool = True  # whether to use relative motion
    flag_pasteback: bool = True  # whether to paste back/stitch the animated face crop from the face-cropping space into the original image space
    flag_do_crop: bool = True  # whether to crop the source portrait or video to the face-cropping space
    driving_option: Literal["expression-friendly", "pose-friendly"] = "expression-friendly"  # "expression-friendly" adapts the driving motion with a global multiplier and can be used when the source is a human image
    driving_multiplier: float = 1.0  # used only when driving_option is "expression-friendly"
    driving_smooth_observation_variance: float = 3e-7  # smoothing strength for the animated video when the input is a source video; the larger the number, the smoother the result, but too much smoothing loses motion accuracy
    audio_priority: Literal['source', 'driving'] = 'driving'  # whether to use the audio from the source or the driving video
    animation_region: Literal["exp", "pose", "lip", "eyes", "all"] = "all"  # the region where the animation is performed: "exp" means the expression, "pose" means the head pose, "all" means all regions

    ########## source crop arguments ##########
    det_thresh: float = 0.15  # face detection threshold
    scale: float = 2.3  # crop scale factor; the larger the scale, the smaller the ratio of the face area within the crop
    vx_ratio: float = 0  # the ratio to shift the face left or right in the cropping space
    vy_ratio: float = -0.125  # the ratio to shift the face up or down in the cropping space
    flag_do_rot: bool = True  # whether to apply rotation when flag_do_crop is True
    source_max_dim: int = 1280  # the max height/width of the source image or video; you can raise it to a larger number, e.g., 1920
    source_division: int = 2  # make sure the height and width of the source image or video are divisible by this number

    ########## driving crop arguments ##########
    scale_crop_driving_video: float = 2.2  # scale factor for cropping the driving video
    vx_ratio_crop_driving_video: float = 0.  # adjust the x offset of the driving video crop
    vy_ratio_crop_driving_video: float = -0.1  # adjust the y offset of the driving video crop

    ########## gradio arguments ##########
    server_port: Annotated[int, tyro.conf.arg(aliases=["-p"])] = 8890  # port for the gradio server
    share: bool = False  # whether to share the server publicly
    server_name: Optional[str] = "127.0.0.1"  # local server name; use "0.0.0.0" to listen on all interfaces
    flag_do_torch_compile: bool = False  # whether to use torch.compile to accelerate generation
    gradio_temp_dir: Optional[str] = None  # directory to save gradio temp files
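

# Minimal usage sketch (an assumption: configs like this are typically parsed
# with tyro.cli, and the module/import path here is illustrative -- the
# project's real entrypoint may differ):
if __name__ == "__main__":
    # Parse command-line flags into the dataclass; tyro derives flags from the
    # field names and aliases above, e.g.:
    #   python -m src.config.argument_config -s my.jpg -d my.mp4
    args = tyro.cli(ArgumentConfig)
    print(args)  # repr comes from PrintableConfig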