| job: extension | |
| config: | |
| name: kontext_diaosu | |
| process: | |
| - type: sd_trainer | |
| training_folder: output | |
| device: cuda:0 | |
| network: | |
| type: lora | |
| linear: 16 | |
| linear_alpha: 16 | |
| save: | |
| dtype: float16 | |
| save_every: 250 | |
| max_step_saves_to_keep: 4 | |
| push_to_hub: false | |
| datasets: | |
| - folder_path: datasets/diaosu_training/images | |
| control_path: datasets/diaosu_training/controls | |
| caption_ext: txt | |
| caption_dropout_rate: 0.05 | |
| shuffle_tokens: false | |
| cache_latents_to_disk: true | |
| resolution: | |
| - 512 | |
| - 768 | |
| - 1024 | |
| train: | |
| batch_size: 1 | |
| steps: 4000 | |
| gradient_accumulation_steps: 1 | |
| train_unet: true | |
| train_text_encoder: false | |
| gradient_checkpointing: true | |
| noise_scheduler: flowmatch | |
| optimizer: adamw8bit | |
| lr: 0.0001 | |
| timestep_type: weighted | |
| dtype: bf16 | |
| model: | |
| name_or_path: black-forest-labs/FLUX.1-Kontext-dev | |
| arch: flux_kontext | |
| quantize: true | |
| sample: | |
| sampler: flowmatch | |
| sample_every: 250 | |
| width: 1024 | |
| height: 1024 | |
| prompts: | |
| - turn the image into the miniature scene, sculptors are carving giant sculptures | |
| of Q-version characters uploaded from pictures,3D cartoon Q version scene | |
| illustration. --ctrl_img datasets/diaosu_training/controls/object_01.png | |
| neg: '' | |
| seed: 42 | |
| walk_seed: true | |
| guidance_scale: 4 | |
| sample_steps: 20 | |
| meta: | |
| name: kontext_diaosu | |
| version: '1.0' | |