Spaces:
Running
on
Zero
Running
on
Zero
Update config/models/ace_0.6b_1024.yaml
Browse files- config/models/ace_0.6b_1024.yaml +1 -153
config/models/ace_0.6b_1024.yaml
CHANGED
@@ -129,156 +129,4 @@ MODEL:
|
|
129 |
T5_DTYPE: bfloat16
|
130 |
ADDED_IDENTIFIER: [ '{image}', '{caption}', '{mask}', '{ref_image}', '{image1}', '{image2}', '{image3}', '{image4}', '{image5}', '{image6}', '{image7}', '{image8}', '{image9}' ]
|
131 |
CLEAN: whitespace
|
132 |
-
USE_GRAD: False
|
133 |
-
|
134 |
-
ACE_PROMPT: [
|
135 |
-
"A cute cartoon rabbit holding a whiteboard that says 'ACE Refiner', standing in a sunny meadow filled with flowers, with a big smile and bright colors.",
|
136 |
-
"A beautiful young woman with long flowing hair, wearing a summer dress, holding a whiteboard that reads 'ACE Refiner' while sitting on a park bench surrounded by cherry blossoms.",
|
137 |
-
"An adorable cartoon cat wearing oversized glasses, holding a whiteboard that says 'ACE Refiner', perched on a stack of colorful books in a cozy library setting.",
|
138 |
-
"A charming girl with pigtails, wearing a cute school uniform, enthusiastically holding a whiteboard that has 'ACE Refiner' written on it, in a bright and cheerful classroom full of educational posters.",
|
139 |
-
"A friendly cartoon dog with floppy ears, sitting in front of a doghouse, proudly holding a whiteboard that says 'ACE Refiner', with a playful expression and a blue sky in the background.",
|
140 |
-
"A cute anime girl with big expressive eyes, dressed in a colorful outfit, holding a whiteboard that reads 'ACE Refiner' in a fantastical landscape filled with mythical creatures.",
|
141 |
-
"A vibrant cartoon fox holding a whiteboard that says 'ACE Refiner', standing on a rock by a sparkling stream, surrounded by lush greenery and butterflies.",
|
142 |
-
"A stylish young woman in a business outfit, smiling as she holds a whiteboard written with 'ACE Refiner', in a modern office filled with plants and natural light.",
|
143 |
-
"A cute cartoon unicorn holding a sparkling whiteboard that says 'ACE Refiner', frolicking in a magical forest, with rainbows and stars in the background.",
|
144 |
-
"A happy family, consisting of a cute little girl and her playful puppy, holding a whiteboard that says 'ACE Refiner', together in their backyard on a sunny day."
|
145 |
-
]
|
146 |
-
REFINER_MODEL:
|
147 |
-
NAME: ""
|
148 |
-
IS_DEFAULT: False
|
149 |
-
DEFAULT_PARAS:
|
150 |
-
PARAS:
|
151 |
-
RESOLUTIONS: [ [ 1024, 1024 ] ]
|
152 |
-
INPUT:
|
153 |
-
INPUT_IMAGE:
|
154 |
-
INPUT_MASK:
|
155 |
-
TASK:
|
156 |
-
PROMPT: ""
|
157 |
-
NEGATIVE_PROMPT: ""
|
158 |
-
OUTPUT_HEIGHT: 1024
|
159 |
-
OUTPUT_WIDTH: 1024
|
160 |
-
SAMPLER: flow_euler
|
161 |
-
SAMPLE_STEPS: 30
|
162 |
-
GUIDE_SCALE: 3.5
|
163 |
-
GUIDE_RESCALE:
|
164 |
-
OUTPUT:
|
165 |
-
LATENT:
|
166 |
-
IMAGES:
|
167 |
-
SEED:
|
168 |
-
MODULES_PARAS:
|
169 |
-
FIRST_STAGE_MODEL:
|
170 |
-
FUNCTION:
|
171 |
-
- NAME: encode
|
172 |
-
DTYPE: bfloat16
|
173 |
-
INPUT: [ "IMAGE" ]
|
174 |
-
- NAME: decode
|
175 |
-
DTYPE: bfloat16
|
176 |
-
INPUT: [ "LATENT" ]
|
177 |
-
PARAS:
|
178 |
-
SCALE_FACTOR: 1.5305
|
179 |
-
SHIFT_FACTOR: 0.0609
|
180 |
-
SIZE_FACTOR: 8
|
181 |
-
DIFFUSION_MODEL:
|
182 |
-
FUNCTION:
|
183 |
-
- NAME: forward
|
184 |
-
DTYPE: bfloat16
|
185 |
-
INPUT: [ "SAMPLE_STEPS", "SAMPLE", "GUIDE_SCALE" ]
|
186 |
-
COND_STAGE_MODEL:
|
187 |
-
FUNCTION:
|
188 |
-
- NAME: encode
|
189 |
-
DTYPE: bfloat16
|
190 |
-
INPUT: [ "PROMPT" ]
|
191 |
-
|
192 |
-
MODEL:
|
193 |
-
DIFFUSION:
|
194 |
-
NAME: DiffusionFluxRF
|
195 |
-
PREDICTION_TYPE: raw
|
196 |
-
NOISE_SCHEDULER:
|
197 |
-
NAME: FlowMatchSigmaScheduler
|
198 |
-
WEIGHTING_SCHEME: logit_normal
|
199 |
-
SHIFT: 3.0
|
200 |
-
LOGIT_MEAN: 0.0
|
201 |
-
LOGIT_STD: 1.0
|
202 |
-
MODE_SCALE: 1.29
|
203 |
-
DIFFUSION_MODEL:
|
204 |
-
NAME: FluxMR
|
205 |
-
PRETRAINED_MODEL: ms://AI-ModelScope/FLUX.1-dev@flux1-dev.safetensors
|
206 |
-
IN_CHANNELS: 64
|
207 |
-
OUT_CHANNELS: 64
|
208 |
-
HIDDEN_SIZE: 3072
|
209 |
-
NUM_HEADS: 24
|
210 |
-
AXES_DIM: [ 16, 56, 56 ]
|
211 |
-
THETA: 10000
|
212 |
-
VEC_IN_DIM: 768
|
213 |
-
GUIDANCE_EMBED: True
|
214 |
-
CONTEXT_IN_DIM: 4096
|
215 |
-
MLP_RATIO: 4.0
|
216 |
-
QKV_BIAS: True
|
217 |
-
DEPTH: 19
|
218 |
-
DEPTH_SINGLE_BLOCKS: 38
|
219 |
-
USE_GRAD_CHECKPOINT: True
|
220 |
-
ATTN_BACKEND: flash_attn
|
221 |
-
#
|
222 |
-
FIRST_STAGE_MODEL:
|
223 |
-
NAME: AutoencoderKLFlux
|
224 |
-
EMBED_DIM: 16
|
225 |
-
PRETRAINED_MODEL: ms://AI-ModelScope/FLUX.1-dev@ae.safetensors
|
226 |
-
IGNORE_KEYS: [ ]
|
227 |
-
BATCH_SIZE: 8
|
228 |
-
USE_CONV: False
|
229 |
-
SCALE_FACTOR: 0.3611
|
230 |
-
SHIFT_FACTOR: 0.1159
|
231 |
-
#
|
232 |
-
ENCODER:
|
233 |
-
NAME: Encoder
|
234 |
-
USE_CHECKPOINT: False
|
235 |
-
CH: 128
|
236 |
-
OUT_CH: 3
|
237 |
-
NUM_RES_BLOCKS: 2
|
238 |
-
IN_CHANNELS: 3
|
239 |
-
ATTN_RESOLUTIONS: [ ]
|
240 |
-
CH_MULT: [ 1, 2, 4, 4 ]
|
241 |
-
Z_CHANNELS: 16
|
242 |
-
DOUBLE_Z: True
|
243 |
-
DROPOUT: 0.0
|
244 |
-
RESAMP_WITH_CONV: True
|
245 |
-
#
|
246 |
-
DECODER:
|
247 |
-
NAME: Decoder
|
248 |
-
USE_CHECKPOINT: False
|
249 |
-
CH: 128
|
250 |
-
OUT_CH: 3
|
251 |
-
NUM_RES_BLOCKS: 2
|
252 |
-
IN_CHANNELS: 3
|
253 |
-
ATTN_RESOLUTIONS: [ ]
|
254 |
-
CH_MULT: [ 1, 2, 4, 4 ]
|
255 |
-
Z_CHANNELS: 16
|
256 |
-
DROPOUT: 0.0
|
257 |
-
RESAMP_WITH_CONV: True
|
258 |
-
GIVE_PRE_END: False
|
259 |
-
TANH_OUT: False
|
260 |
-
#
|
261 |
-
COND_STAGE_MODEL:
|
262 |
-
NAME: T5PlusClipFluxEmbedder
|
263 |
-
T5_MODEL:
|
264 |
-
NAME: HFEmbedder
|
265 |
-
HF_MODEL_CLS: T5EncoderModel
|
266 |
-
MODEL_PATH: ms://AI-ModelScope/FLUX.1-dev@text_encoder_2/
|
267 |
-
HF_TOKENIZER_CLS: T5Tokenizer
|
268 |
-
TOKENIZER_PATH: ms://AI-ModelScope/FLUX.1-dev@tokenizer_2/
|
269 |
-
MAX_LENGTH: 512
|
270 |
-
OUTPUT_KEY: last_hidden_state
|
271 |
-
D_TYPE: bfloat16
|
272 |
-
BATCH_INFER: False
|
273 |
-
CLEAN: whitespace
|
274 |
-
CLIP_MODEL:
|
275 |
-
NAME: HFEmbedder
|
276 |
-
HF_MODEL_CLS: CLIPTextModel
|
277 |
-
MODEL_PATH: ms://AI-ModelScope/FLUX.1-dev@text_encoder/
|
278 |
-
HF_TOKENIZER_CLS: CLIPTokenizer
|
279 |
-
TOKENIZER_PATH: ms://AI-ModelScope/FLUX.1-dev@tokenizer/
|
280 |
-
MAX_LENGTH: 77
|
281 |
-
OUTPUT_KEY: pooler_output
|
282 |
-
D_TYPE: bfloat16
|
283 |
-
BATCH_INFER: True
|
284 |
-
CLEAN: whitespace
|
|
|
129 |
T5_DTYPE: bfloat16
|
130 |
ADDED_IDENTIFIER: [ '{image}', '{caption}', '{mask}', '{ref_image}', '{image1}', '{image2}', '{image3}', '{image4}', '{image5}', '{image6}', '{image7}', '{image8}', '{image9}' ]
|
131 |
CLEAN: whitespace
|
132 |
+
USE_GRAD: False
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|