|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
from typing import Any, List |
|
|
|
import attrs |
|
|
|
from cosmos_transfer1.diffusion.config.transfer.model import CtrlModelConfig |
|
from cosmos_transfer1.diffusion.config.transfer.registry import register_configs |
|
from cosmos_transfer1.diffusion.model.model_ctrl import VideoDiffusionModelWithCtrl |
|
from cosmos_transfer1.utils import config |
|
from cosmos_transfer1.utils.config_helper import import_all_modules_from_package |
|
from cosmos_transfer1.utils.lazy_config import PLACEHOLDER |
|
from cosmos_transfer1.utils.lazy_config import LazyCall as L |
|
from cosmos_transfer1.utils.lazy_config import LazyDict |
|
|
|
|
|
def _default_config_groups() -> List[Any]:
    """Build a fresh copy of the default override list used by ``Config.defaults``.

    A new list (and new inner dicts) is created on every call, so mutating the
    list held by one ``Config`` instance does not affect another.
    """
    # "_self_" comes first, followed by one single-key mapping per config group.
    # NOTE(review): this looks like a Hydra-style defaults list — confirm
    # against how config.Config consumes ``defaults``.
    return [
        "_self_",
        {"net": None},
        {"net_ctrl": None},
        {"hint_key": "control_input_edge"},
        {"conditioner": "ctrlnet_add_fps_image_size_padding_mask"},
        {"tokenizer": "vae1"},
        {"experiment": None},
    ]


@attrs.define(slots=False)
class Config(config.Config):
    """Configuration for the control-conditioned video diffusion model.

    Extends ``config.Config`` with a ``defaults`` list of config-group
    selections and a lazily constructed ``VideoDiffusionModelWithCtrl``.
    """

    # Per-instance list produced by the factory; groups mapped to None have no
    # selection here (presumably filled in by an experiment/override — verify).
    defaults: List[Any] = attrs.field(factory=_default_config_groups)

    # Lazy call description for the model; ``config`` is left as PLACEHOLDER
    # rather than a concrete value at class-definition time.
    model_obj: LazyDict = L(VideoDiffusionModelWithCtrl)(config=PLACEHOLDER)
|
|
|
|
|
def make_config():
    """Create the root ``Config`` and load the inference config modules.

    Steps, in order:
      1. Instantiate ``Config`` with a default ``CtrlModelConfig`` as ``model``.
      2. Call ``register_configs()``.
      3. Import every module under ``cosmos_transfer1.diffusion.config.inference``.

    Returns:
        The ``Config`` instance built in step 1.
    """
    model_config = CtrlModelConfig()
    root_config = Config(model=model_config)

    # Order is kept as in the original: registration first, then the package
    # import. NOTE(review): presumably the imported modules rely on the
    # registrations made by register_configs() — confirm before reordering.
    register_configs()
    import_all_modules_from_package("cosmos_transfer1.diffusion.config.inference")

    return root_config
|
|