Spaces:
Runtime error
Runtime error
| NAME: ACE_0.6B_512 | |
| IS_DEFAULT: False | |
| DEFAULT_PARAS: | |
| PARAS: | |
| # | |
| INPUT: | |
| INPUT_IMAGE: | |
| INPUT_MASK: | |
| TASK: | |
| PROMPT: "" | |
| NEGATIVE_PROMPT: "" | |
| OUTPUT_HEIGHT: 512 | |
| OUTPUT_WIDTH: 512 | |
| SAMPLER: ddim | |
| SAMPLE_STEPS: 20 | |
| GUIDE_SCALE: 4.5 | |
| GUIDE_RESCALE: 0.5 | |
| SEED: -1 | |
| TAR_INDEX: 0 | |
| OUTPUT: | |
| LATENT: | |
| IMAGES: | |
| SEED: | |
| MODULES_PARAS: | |
| FIRST_STAGE_MODEL: | |
| FUNCTION: | |
| - NAME: encode | |
| DTYPE: float16 | |
| INPUT: ["IMAGE"] | |
| - NAME: decode | |
| DTYPE: float16 | |
| INPUT: ["LATENT"] | |
| # | |
| DIFFUSION_MODEL: | |
| FUNCTION: | |
| - NAME: forward | |
| DTYPE: float16 | |
| INPUT: ["SAMPLE_STEPS", "SAMPLE", "GUIDE_SCALE"] | |
| # | |
| COND_STAGE_MODEL: | |
| FUNCTION: | |
| - NAME: encode_list | |
| DTYPE: bfloat16 | |
| INPUT: ["PROMPT"] | |
| # | |
| MODEL: | |
| NAME: LdmACE | |
| PRETRAINED_MODEL: | |
| IGNORE_KEYS: [ ] | |
| SCALE_FACTOR: 0.18215 | |
| SIZE_FACTOR: 8 | |
| DECODER_BIAS: 0.5 | |
| DEFAULT_N_PROMPT: "" | |
| TEXT_IDENTIFIER: [ '{image}', '{image1}', '{image2}', '{image3}', '{image4}', '{image5}', '{image6}', '{image7}', '{image8}', '{image9}' ] | |
| USE_TEXT_POS_EMBEDDINGS: True | |
| # | |
| DIFFUSION: | |
| NAME: ACEDiffusion | |
| PREDICTION_TYPE: eps | |
| MIN_SNR_GAMMA: | |
| NOISE_SCHEDULER: | |
| NAME: LinearScheduler | |
| NUM_TIMESTEPS: 1000 | |
| BETA_MIN: 0.0001 | |
| BETA_MAX: 0.02 | |
| # | |
| DIFFUSION_MODEL: | |
| NAME: DiTACE | |
| PRETRAINED_MODEL: hf://scepter-studio/ACE-0.6B-512px@models/dit/ace_0.6b_512px.pth | |
| IGNORE_KEYS: [ ] | |
| PATCH_SIZE: 2 | |
| IN_CHANNELS: 4 | |
| HIDDEN_SIZE: 1152 | |
| DEPTH: 28 | |
| NUM_HEADS: 16 | |
| MLP_RATIO: 4.0 | |
| PRED_SIGMA: True | |
| DROP_PATH: 0.0 | |
| WINDOW_DIZE: 0 | |
| Y_CHANNELS: 4096 | |
| MAX_SEQ_LEN: 1024 | |
| QK_NORM: True | |
| USE_GRAD_CHECKPOINT: True | |
| ATTENTION_BACKEND: flash_attn | |
| # | |
| FIRST_STAGE_MODEL: | |
| NAME: AutoencoderKL | |
| EMBED_DIM: 4 | |
| PRETRAINED_MODEL: hf://scepter-studio/ACE-0.6B-512px@models/vae/vae.bin | |
| IGNORE_KEYS: [] | |
| # | |
| ENCODER: | |
| NAME: Encoder | |
| CH: 128 | |
| OUT_CH: 3 | |
| NUM_RES_BLOCKS: 2 | |
| IN_CHANNELS: 3 | |
| ATTN_RESOLUTIONS: [ ] | |
| CH_MULT: [ 1, 2, 4, 4 ] | |
| Z_CHANNELS: 4 | |
| DOUBLE_Z: True | |
| DROPOUT: 0.0 | |
| RESAMP_WITH_CONV: True | |
| # | |
| DECODER: | |
| NAME: Decoder | |
| CH: 128 | |
| OUT_CH: 3 | |
| NUM_RES_BLOCKS: 2 | |
| IN_CHANNELS: 3 | |
| ATTN_RESOLUTIONS: [ ] | |
| CH_MULT: [ 1, 2, 4, 4 ] | |
| Z_CHANNELS: 4 | |
| DROPOUT: 0.0 | |
| RESAMP_WITH_CONV: True | |
| GIVE_PRE_END: False | |
| TANH_OUT: False | |
| # | |
| COND_STAGE_MODEL: | |
| NAME: ACETextEmbedder | |
| PRETRAINED_MODEL: hf://scepter-studio/ACE-0.6B-512px@models/text_encoder/t5-v1_1-xxl/ | |
| TOKENIZER_PATH: hf://scepter-studio/ACE-0.6B-512px@models/tokenizer/t5-v1_1-xxl | |
| LENGTH: 120 | |
| T5_DTYPE: bfloat16 | |
| ADDED_IDENTIFIER: [ '{image}', '{caption}', '{mask}', '{ref_image}', '{image1}', '{image2}', '{image3}', '{image4}', '{image5}', '{image6}', '{image7}', '{image8}', '{image9}' ] | |
| CLEAN: whitespace | |
| USE_GRAD: False | |