Spaces:
Runtime error
Runtime error
Update config/models/ace_0.6b_1024.yaml
Browse files
- config/models/ace_0.6b_1024.yaml +1 -153
config/models/ace_0.6b_1024.yaml
CHANGED
|
@@ -129,156 +129,4 @@ MODEL:
|
|
| 129 |
T5_DTYPE: bfloat16
|
| 130 |
ADDED_IDENTIFIER: [ '{image}', '{caption}', '{mask}', '{ref_image}', '{image1}', '{image2}', '{image3}', '{image4}', '{image5}', '{image6}', '{image7}', '{image8}', '{image9}' ]
|
| 131 |
CLEAN: whitespace
|
| 132 |
-
USE_GRAD: False
|
| 133 |
-
|
| 134 |
-
ACE_PROMPT: [
|
| 135 |
-
"A cute cartoon rabbit holding a whiteboard that says 'ACE Refiner', standing in a sunny meadow filled with flowers, with a big smile and bright colors.",
|
| 136 |
-
"A beautiful young woman with long flowing hair, wearing a summer dress, holding a whiteboard that reads 'ACE Refiner' while sitting on a park bench surrounded by cherry blossoms.",
|
| 137 |
-
"An adorable cartoon cat wearing oversized glasses, holding a whiteboard that says 'ACE Refiner', perched on a stack of colorful books in a cozy library setting.",
|
| 138 |
-
"A charming girl with pigtails, wearing a cute school uniform, enthusiastically holding a whiteboard that has 'ACE Refiner' written on it, in a bright and cheerful classroom full of educational posters.",
|
| 139 |
-
"A friendly cartoon dog with floppy ears, sitting in front of a doghouse, proudly holding a whiteboard that says 'ACE Refiner', with a playful expression and a blue sky in the background.",
|
| 140 |
-
"A cute anime girl with big expressive eyes, dressed in a colorful outfit, holding a whiteboard that reads 'ACE Refiner' in a fantastical landscape filled with mythical creatures.",
|
| 141 |
-
"A vibrant cartoon fox holding a whiteboard that says 'ACE Refiner', standing on a rock by a sparkling stream, surrounded by lush greenery and butterflies.",
|
| 142 |
-
"A stylish young woman in a business outfit, smiling as she holds a whiteboard written with 'ACE Refiner', in a modern office filled with plants and natural light.",
|
| 143 |
-
"A cute cartoon unicorn holding a sparkling whiteboard that says 'ACE Refiner', frolicking in a magical forest, with rainbows and stars in the background.",
|
| 144 |
-
"A happy family, consisting of a cute little girl and her playful puppy, holding a whiteboard that says 'ACE Refiner', together in their backyard on a sunny day."
|
| 145 |
-
]
|
| 146 |
-
REFINER_MODEL:
|
| 147 |
-
NAME: ""
|
| 148 |
-
IS_DEFAULT: False
|
| 149 |
-
DEFAULT_PARAS:
|
| 150 |
-
PARAS:
|
| 151 |
-
RESOLUTIONS: [ [ 1024, 1024 ] ]
|
| 152 |
-
INPUT:
|
| 153 |
-
INPUT_IMAGE:
|
| 154 |
-
INPUT_MASK:
|
| 155 |
-
TASK:
|
| 156 |
-
PROMPT: ""
|
| 157 |
-
NEGATIVE_PROMPT: ""
|
| 158 |
-
OUTPUT_HEIGHT: 1024
|
| 159 |
-
OUTPUT_WIDTH: 1024
|
| 160 |
-
SAMPLER: flow_euler
|
| 161 |
-
SAMPLE_STEPS: 30
|
| 162 |
-
GUIDE_SCALE: 3.5
|
| 163 |
-
GUIDE_RESCALE:
|
| 164 |
-
OUTPUT:
|
| 165 |
-
LATENT:
|
| 166 |
-
IMAGES:
|
| 167 |
-
SEED:
|
| 168 |
-
MODULES_PARAS:
|
| 169 |
-
FIRST_STAGE_MODEL:
|
| 170 |
-
FUNCTION:
|
| 171 |
-
- NAME: encode
|
| 172 |
-
DTYPE: bfloat16
|
| 173 |
-
INPUT: [ "IMAGE" ]
|
| 174 |
-
- NAME: decode
|
| 175 |
-
DTYPE: bfloat16
|
| 176 |
-
INPUT: [ "LATENT" ]
|
| 177 |
-
PARAS:
|
| 178 |
-
SCALE_FACTOR: 1.5305
|
| 179 |
-
SHIFT_FACTOR: 0.0609
|
| 180 |
-
SIZE_FACTOR: 8
|
| 181 |
-
DIFFUSION_MODEL:
|
| 182 |
-
FUNCTION:
|
| 183 |
-
- NAME: forward
|
| 184 |
-
DTYPE: bfloat16
|
| 185 |
-
INPUT: [ "SAMPLE_STEPS", "SAMPLE", "GUIDE_SCALE" ]
|
| 186 |
-
COND_STAGE_MODEL:
|
| 187 |
-
FUNCTION:
|
| 188 |
-
- NAME: encode
|
| 189 |
-
DTYPE: bfloat16
|
| 190 |
-
INPUT: [ "PROMPT" ]
|
| 191 |
-
|
| 192 |
-
MODEL:
|
| 193 |
-
DIFFUSION:
|
| 194 |
-
NAME: DiffusionFluxRF
|
| 195 |
-
PREDICTION_TYPE: raw
|
| 196 |
-
NOISE_SCHEDULER:
|
| 197 |
-
NAME: FlowMatchSigmaScheduler
|
| 198 |
-
WEIGHTING_SCHEME: logit_normal
|
| 199 |
-
SHIFT: 3.0
|
| 200 |
-
LOGIT_MEAN: 0.0
|
| 201 |
-
LOGIT_STD: 1.0
|
| 202 |
-
MODE_SCALE: 1.29
|
| 203 |
-
DIFFUSION_MODEL:
|
| 204 |
-
NAME: FluxMR
|
| 205 |
-
PRETRAINED_MODEL: ms://AI-ModelScope/FLUX.1-dev@flux1-dev.safetensors
|
| 206 |
-
IN_CHANNELS: 64
|
| 207 |
-
OUT_CHANNELS: 64
|
| 208 |
-
HIDDEN_SIZE: 3072
|
| 209 |
-
NUM_HEADS: 24
|
| 210 |
-
AXES_DIM: [ 16, 56, 56 ]
|
| 211 |
-
THETA: 10000
|
| 212 |
-
VEC_IN_DIM: 768
|
| 213 |
-
GUIDANCE_EMBED: True
|
| 214 |
-
CONTEXT_IN_DIM: 4096
|
| 215 |
-
MLP_RATIO: 4.0
|
| 216 |
-
QKV_BIAS: True
|
| 217 |
-
DEPTH: 19
|
| 218 |
-
DEPTH_SINGLE_BLOCKS: 38
|
| 219 |
-
USE_GRAD_CHECKPOINT: True
|
| 220 |
-
ATTN_BACKEND: flash_attn
|
| 221 |
-
#
|
| 222 |
-
FIRST_STAGE_MODEL:
|
| 223 |
-
NAME: AutoencoderKLFlux
|
| 224 |
-
EMBED_DIM: 16
|
| 225 |
-
PRETRAINED_MODEL: ms://AI-ModelScope/FLUX.1-dev@ae.safetensors
|
| 226 |
-
IGNORE_KEYS: [ ]
|
| 227 |
-
BATCH_SIZE: 8
|
| 228 |
-
USE_CONV: False
|
| 229 |
-
SCALE_FACTOR: 0.3611
|
| 230 |
-
SHIFT_FACTOR: 0.1159
|
| 231 |
-
#
|
| 232 |
-
ENCODER:
|
| 233 |
-
NAME: Encoder
|
| 234 |
-
USE_CHECKPOINT: False
|
| 235 |
-
CH: 128
|
| 236 |
-
OUT_CH: 3
|
| 237 |
-
NUM_RES_BLOCKS: 2
|
| 238 |
-
IN_CHANNELS: 3
|
| 239 |
-
ATTN_RESOLUTIONS: [ ]
|
| 240 |
-
CH_MULT: [ 1, 2, 4, 4 ]
|
| 241 |
-
Z_CHANNELS: 16
|
| 242 |
-
DOUBLE_Z: True
|
| 243 |
-
DROPOUT: 0.0
|
| 244 |
-
RESAMP_WITH_CONV: True
|
| 245 |
-
#
|
| 246 |
-
DECODER:
|
| 247 |
-
NAME: Decoder
|
| 248 |
-
USE_CHECKPOINT: False
|
| 249 |
-
CH: 128
|
| 250 |
-
OUT_CH: 3
|
| 251 |
-
NUM_RES_BLOCKS: 2
|
| 252 |
-
IN_CHANNELS: 3
|
| 253 |
-
ATTN_RESOLUTIONS: [ ]
|
| 254 |
-
CH_MULT: [ 1, 2, 4, 4 ]
|
| 255 |
-
Z_CHANNELS: 16
|
| 256 |
-
DROPOUT: 0.0
|
| 257 |
-
RESAMP_WITH_CONV: True
|
| 258 |
-
GIVE_PRE_END: False
|
| 259 |
-
TANH_OUT: False
|
| 260 |
-
#
|
| 261 |
-
COND_STAGE_MODEL:
|
| 262 |
-
NAME: T5PlusClipFluxEmbedder
|
| 263 |
-
T5_MODEL:
|
| 264 |
-
NAME: HFEmbedder
|
| 265 |
-
HF_MODEL_CLS: T5EncoderModel
|
| 266 |
-
MODEL_PATH: ms://AI-ModelScope/FLUX.1-dev@text_encoder_2/
|
| 267 |
-
HF_TOKENIZER_CLS: T5Tokenizer
|
| 268 |
-
TOKENIZER_PATH: ms://AI-ModelScope/FLUX.1-dev@tokenizer_2/
|
| 269 |
-
MAX_LENGTH: 512
|
| 270 |
-
OUTPUT_KEY: last_hidden_state
|
| 271 |
-
D_TYPE: bfloat16
|
| 272 |
-
BATCH_INFER: False
|
| 273 |
-
CLEAN: whitespace
|
| 274 |
-
CLIP_MODEL:
|
| 275 |
-
NAME: HFEmbedder
|
| 276 |
-
HF_MODEL_CLS: CLIPTextModel
|
| 277 |
-
MODEL_PATH: ms://AI-ModelScope/FLUX.1-dev@text_encoder/
|
| 278 |
-
HF_TOKENIZER_CLS: CLIPTokenizer
|
| 279 |
-
TOKENIZER_PATH: ms://AI-ModelScope/FLUX.1-dev@tokenizer/
|
| 280 |
-
MAX_LENGTH: 77
|
| 281 |
-
OUTPUT_KEY: pooler_output
|
| 282 |
-
D_TYPE: bfloat16
|
| 283 |
-
BATCH_INFER: True
|
| 284 |
-
CLEAN: whitespace
|
|
|
|
| 129 |
T5_DTYPE: bfloat16
|
| 130 |
ADDED_IDENTIFIER: [ '{image}', '{caption}', '{mask}', '{ref_image}', '{image1}', '{image2}', '{image3}', '{image4}', '{image5}', '{image6}', '{image7}', '{image8}', '{image9}' ]
|
| 131 |
CLEAN: whitespace
|
| 132 |
+
USE_GRAD: False
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|