| { | |
| "job": "extension", | |
| "config": { | |
| "name": "qwen_image_sethos_lora_v1", | |
| "process": [ | |
| { | |
| "type": "ui_trainer", | |
| "training_folder": "/home/featurize/ai-toolkit/output", | |
| "sqlite_db_path": "/home/featurize/ai-toolkit/aitk_db.db", | |
| "device": "cuda", | |
| "trigger_word": null, | |
| "performance_log_every": 10, | |
| "network": { | |
| "type": "lora", | |
| "linear": 16, | |
| "linear_alpha": 16, | |
| "conv": 16, | |
| "conv_alpha": 16, | |
| "lokr_full_rank": true, | |
| "lokr_factor": -1, | |
| "network_kwargs": { | |
| "ignore_if_contains": [] | |
| } | |
| }, | |
| "save": { | |
| "dtype": "bf16", | |
| "save_every": 250, | |
| "max_step_saves_to_keep": 4000, | |
| "save_format": "diffusers", | |
| "push_to_hub": false | |
| }, | |
| "datasets": [ | |
| { | |
| "folder_path": "/home/featurize/ai-toolkit/datasets/Sethos_Images_Captioned", | |
| "control_path": null, | |
| "mask_path": null, | |
| "mask_min_value": 0.1, | |
| "default_caption": "", | |
| "caption_ext": "txt", | |
| "caption_dropout_rate": 0.05, | |
| "cache_latents_to_disk": false, | |
| "is_reg": false, | |
| "network_weight": 1, | |
| "resolution": [ | |
| 512, | |
| 768, | |
| 1024 | |
| ], | |
| "controls": [], | |
| "shrink_video_to_frames": true, | |
| "num_frames": 1, | |
| "do_i2v": true | |
| } | |
| ], | |
| "train": { | |
| "batch_size": 1, | |
| "bypass_guidance_embedding": false, | |
| "steps": 30000, | |
| "gradient_accumulation": 1, | |
| "train_unet": true, | |
| "train_text_encoder": false, | |
| "gradient_checkpointing": true, | |
| "noise_scheduler": "flowmatch", | |
| "optimizer": "adamw8bit", | |
| "timestep_type": "weighted", | |
| "content_or_style": "balanced", | |
| "optimizer_params": { | |
| "weight_decay": 0.0001 | |
| }, | |
| "unload_text_encoder": false, | |
| "cache_text_embeddings": true, | |
| "lr": 0.0001, | |
| "ema_config": { | |
| "use_ema": false, | |
| "ema_decay": 0.99 | |
| }, | |
| "skip_first_sample": false, | |
| "disable_sampling": false, | |
| "dtype": "bf16", | |
| "diff_output_preservation": false, | |
| "diff_output_preservation_multiplier": 1, | |
| "diff_output_preservation_class": "person" | |
| }, | |
| "model": { | |
| "name_or_path": "Qwen/Qwen-Image", | |
| "quantize": true, | |
| "qtype": "uint3|ostris/accuracy_recovery_adapters/qwen_image_torchao_uint3.safetensors", | |
| "quantize_te": true, | |
| "qtype_te": "qfloat8", | |
| "arch": "qwen_image", | |
| "low_vram": true, | |
| "model_kwargs": {} | |
| }, | |
| "sample": { | |
| "sampler": "flowmatch", | |
| "sample_every": 250, | |
| "width": 768, | |
| "height": 768, | |
| "samples": [ | |
| { | |
| "prompt": "In the style of Sethos, This is a digital anime-style illustration featuring a young man with long, flowing black hair with green highlights and bright green eyes. He is dressed in a white and gold ornate outfit with purple accents and a yellow scarf. He is eating ice cream." | |
| } | |
| ], | |
| "neg": "", | |
| "seed": 42, | |
| "walk_seed": true, | |
| "guidance_scale": 4, | |
| "sample_steps": 25, | |
| "num_frames": 1, | |
| "fps": 1 | |
| } | |
| } | |
| ] | |
| }, | |
| "meta": { | |
| "name": "[name]", | |
| "version": "1.0" | |
| } | |
| } |