Spaces:
Running
on
Zero
Running
on
Zero
"""Constants used throughout the HunyuanVideo-Foley project.""" | |
from typing import Dict, List | |
# Model configuration | |
DEFAULT_AUDIO_SAMPLE_RATE = 48000 | |
DEFAULT_VIDEO_FPS = 25 | |
DEFAULT_AUDIO_CHANNELS = 2 | |
# Video processing | |
MAX_VIDEO_DURATION_SECONDS = 15.0 | |
MIN_VIDEO_DURATION_SECONDS = 1.0 | |
# Audio processing | |
AUDIO_VAE_LATENT_DIM = 128 | |
AUDIO_FRAME_RATE = 75 # frames per second in latent space | |
# Visual features | |
FPS_VISUAL: Dict[str, int] = { | |
"siglip2": 8, | |
"synchformer": 25 | |
} | |
# Model paths (can be overridden by environment variables) | |
DEFAULT_MODEL_PATH = "./pretrained_models/" | |
DEFAULT_CONFIG_PATH = "configs/hunyuanvideo-foley-xxl.yaml" | |
# Inference parameters | |
DEFAULT_GUIDANCE_SCALE = 4.5 | |
DEFAULT_NUM_INFERENCE_STEPS = 50 | |
MIN_GUIDANCE_SCALE = 1.0 | |
MAX_GUIDANCE_SCALE = 10.0 | |
MIN_INFERENCE_STEPS = 10 | |
MAX_INFERENCE_STEPS = 100 | |
# Text processing | |
MAX_TEXT_LENGTH = 100 | |
DEFAULT_NEGATIVE_PROMPT = "noisy, harsh" | |
# File extensions | |
SUPPORTED_VIDEO_EXTENSIONS: List[str] = [".mp4", ".avi", ".mov", ".mkv", ".webm"] | |
SUPPORTED_AUDIO_EXTENSIONS: List[str] = [".wav", ".mp3", ".flac", ".aac"] | |
# Quality settings | |
AUDIO_QUALITY_SETTINGS: Dict[str, List[str]] = { | |
"high": ["-b:a", "192k"], | |
"medium": ["-b:a", "128k"], | |
"low": ["-b:a", "96k"] | |
} | |
# Error messages | |
ERROR_MESSAGES: Dict[str, str] = { | |
"model_not_loaded": "Model is not loaded. Please load the model first.", | |
"invalid_video_format": "Unsupported video format. Supported formats: {formats}", | |
"video_too_long": f"Video duration exceeds maximum of {MAX_VIDEO_DURATION_SECONDS} seconds", | |
"ffmpeg_not_found": "ffmpeg not found. Please install ffmpeg: https://ffmpeg.org/download.html" | |
} |