| { | |
| "job": "extension", | |
| "config": { | |
| "name": "Flux_Xiang_lora", | |
| "process": [ | |
| { | |
| "type": "ui_trainer", | |
| "training_folder": "/home/featurize/ai-toolkit/output", | |
| "sqlite_db_path": "/home/featurize/ai-toolkit/aitk_db.db", | |
| "device": "cuda", | |
| "trigger_word": null, | |
| "performance_log_every": 10, | |
| "network": { | |
| "type": "lora", | |
| "linear": 32, | |
| "linear_alpha": 32, | |
| "conv": 16, | |
| "conv_alpha": 16, | |
| "lokr_full_rank": true, | |
| "lokr_factor": -1, | |
| "network_kwargs": { | |
| "ignore_if_contains": [] | |
| } | |
| }, | |
| "save": { | |
| "dtype": "bf16", | |
| "save_every": 250, | |
| "max_step_saves_to_keep": 4000, | |
| "save_format": "diffusers", | |
| "push_to_hub": false | |
| }, | |
| "datasets": [ | |
| { | |
| "folder_path": "/home/featurize/ai-toolkit/datasets/Xiang_Handsome_Flux_SRPO_Keye_EN_Captioned", | |
| "control_path": null, | |
| "mask_path": null, | |
| "mask_min_value": 0.1, | |
| "default_caption": "", | |
| "caption_ext": "txt", | |
| "caption_dropout_rate": 0.05, | |
| "cache_latents_to_disk": false, | |
| "is_reg": false, | |
| "network_weight": 1, | |
| "resolution": [ | |
| 512, | |
| 768, | |
| 1024 | |
| ], | |
| "controls": [], | |
| "shrink_video_to_frames": true, | |
| "num_frames": 1, | |
| "do_i2v": true, | |
| "flip_x": false, | |
| "flip_y": false | |
| } | |
| ], | |
| "train": { | |
| "batch_size": 1, | |
| "bypass_guidance_embedding": false, | |
| "steps": 30000, | |
| "gradient_accumulation": 1, | |
| "train_unet": true, | |
| "train_text_encoder": false, | |
| "gradient_checkpointing": true, | |
| "noise_scheduler": "flowmatch", | |
| "optimizer": "adamw8bit", | |
| "timestep_type": "sigmoid", | |
| "content_or_style": "balanced", | |
| "optimizer_params": { | |
| "weight_decay": 0.0001 | |
| }, | |
| "unload_text_encoder": false, | |
| "cache_text_embeddings": false, | |
| "lr": 0.0001, | |
| "ema_config": { | |
| "use_ema": false, | |
| "ema_decay": 0.99 | |
| }, | |
| "skip_first_sample": false, | |
| "force_first_sample": false, | |
| "disable_sampling": false, | |
| "dtype": "bf16", | |
| "diff_output_preservation": false, | |
| "diff_output_preservation_multiplier": 1, | |
| "diff_output_preservation_class": "person", | |
| "switch_boundary_every": 1 | |
| }, | |
| "model": { | |
| "name_or_path": "black-forest-labs/FLUX.1-dev", | |
| "quantize": true, | |
| "qtype": "qfloat8", | |
| "quantize_te": true, | |
| "qtype_te": "qfloat8", | |
| "arch": "flux", | |
| "low_vram": false, | |
| "model_kwargs": {} | |
| }, | |
| "sample": { | |
| "sampler": "flowmatch", | |
| "sample_every": 250, | |
| "width": 1024, | |
| "height": 1024, | |
| "samples": [ | |
| { | |
| "prompt": "Wang Xiang , Photograph of a young Asian male with fair skin and black, slightly tousled hair. He has a slender build and is wearing a dark blue hooded sweatshirt with large white letters \"KE\" on the chest. His hands are crossed and resting on a white horizontal bar in front of him. He has a soft, neutral expression with slightly parted lips and dark brown eyes. The background is a bright, overexposed window, creating a stark contrast with his dark clothing. The image has a soft, natural light and a slightly grainy texture." | |
| } | |
| ], | |
| "neg": "", | |
| "seed": 42, | |
| "walk_seed": true, | |
| "guidance_scale": 4, | |
| "sample_steps": 25, | |
| "num_frames": 1, | |
| "fps": 1 | |
| } | |
| } | |
| ] | |
| }, | |
| "meta": { | |
| "name": "[name]", | |
| "version": "1.0" | |
| } | |
| } |