Upload 5 files
Browse files- config.yaml +124 -0
- hardbody.safetensors +3 -0
- job_config.json +150 -0
- log.txt +0 -0
- pid.txt +1 -0
config.yaml
ADDED
|
@@ -0,0 +1,124 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
job: extension
|
| 2 |
+
config:
|
| 3 |
+
name: hardbody
|
| 4 |
+
process:
|
| 5 |
+
- type: diffusion_trainer
|
| 6 |
+
training_folder: /data/app/output
|
| 7 |
+
sqlite_db_path: /data/app/aitk_db.db
|
| 8 |
+
device: cuda
|
| 9 |
+
trigger_word: null
|
| 10 |
+
performance_log_every: 10
|
| 11 |
+
network:
|
| 12 |
+
type: lora
|
| 13 |
+
linear: 32
|
| 14 |
+
linear_alpha: 32
|
| 15 |
+
conv: 16
|
| 16 |
+
conv_alpha: 16
|
| 17 |
+
lokr_full_rank: true
|
| 18 |
+
lokr_factor: -1
|
| 19 |
+
network_kwargs:
|
| 20 |
+
ignore_if_contains: []
|
| 21 |
+
save:
|
| 22 |
+
dtype: bf16
|
| 23 |
+
save_every: 500
|
| 24 |
+
max_step_saves_to_keep: 4
|
| 25 |
+
save_format: diffusers
|
| 26 |
+
push_to_hub: false
|
| 27 |
+
datasets:
|
| 28 |
+
- folder_path: /data/app/datasets/body_v01
|
| 29 |
+
mask_path: null
|
| 30 |
+
mask_min_value: 0.1
|
| 31 |
+
default_caption: curvy female body
|
| 32 |
+
caption_ext: txt
|
| 33 |
+
caption_dropout_rate: 0.05
|
| 34 |
+
cache_latents_to_disk: false
|
| 35 |
+
is_reg: false
|
| 36 |
+
network_weight: 1
|
| 37 |
+
resolution:
|
| 38 |
+
- 512
|
| 39 |
+
- 768
|
| 40 |
+
- 1024
|
| 41 |
+
controls: []
|
| 42 |
+
shrink_video_to_frames: true
|
| 43 |
+
num_frames: 1
|
| 44 |
+
do_i2v: true
|
| 45 |
+
flip_x: false
|
| 46 |
+
flip_y: false
|
| 47 |
+
train:
|
| 48 |
+
batch_size: 1
|
| 49 |
+
bypass_guidance_embedding: false
|
| 50 |
+
steps: 3000
|
| 51 |
+
gradient_accumulation: 1
|
| 52 |
+
train_unet: true
|
| 53 |
+
train_text_encoder: false
|
| 54 |
+
gradient_checkpointing: true
|
| 55 |
+
noise_scheduler: flowmatch
|
| 56 |
+
optimizer: adamw8bit
|
| 57 |
+
timestep_type: weighted
|
| 58 |
+
content_or_style: balanced
|
| 59 |
+
optimizer_params:
|
| 60 |
+
weight_decay: 0.0001
|
| 61 |
+
unload_text_encoder: false
|
| 62 |
+
cache_text_embeddings: false
|
| 63 |
+
lr: 0.0001
|
| 64 |
+
ema_config:
|
| 65 |
+
use_ema: false
|
| 66 |
+
ema_decay: 0.99
|
| 67 |
+
skip_first_sample: false
|
| 68 |
+
force_first_sample: false
|
| 69 |
+
disable_sampling: false
|
| 70 |
+
dtype: bf16
|
| 71 |
+
diff_output_preservation: false
|
| 72 |
+
diff_output_preservation_multiplier: 1
|
| 73 |
+
diff_output_preservation_class: person
|
| 74 |
+
switch_boundary_every: 1
|
| 75 |
+
loss_type: mse
|
| 76 |
+
do_differential_guidance: true
|
| 77 |
+
differential_guidance_scale: 3
|
| 78 |
+
model:
|
| 79 |
+
name_or_path: Tongyi-MAI/Z-Image-Turbo
|
| 80 |
+
quantize: true
|
| 81 |
+
qtype: qfloat8
|
| 82 |
+
quantize_te: true
|
| 83 |
+
qtype_te: qfloat8
|
| 84 |
+
arch: zimage:turbo
|
| 85 |
+
low_vram: false
|
| 86 |
+
model_kwargs: {}
|
| 87 |
+
layer_offloading: false
|
| 88 |
+
layer_offloading_text_encoder_percent: 1
|
| 89 |
+
layer_offloading_transformer_percent: 1
|
| 90 |
+
assistant_lora_path: ostris/zimage_turbo_training_adapter/zimage_turbo_training_adapter_v2.safetensors
|
| 91 |
+
sample:
|
| 92 |
+
sampler: flowmatch
|
| 93 |
+
sample_every: 500
|
| 94 |
+
width: 512
|
| 95 |
+
height: 512
|
| 96 |
+
samples:
|
| 97 |
+
- prompt: a woman holding a coffee cup, in a beanie, sitting at a cafe, shorts
|
| 98 |
+
and tight tanktop
|
| 99 |
+
- prompt: woman playing the guitar, on stage, singing a song, laser lights,
|
| 100 |
+
punk rocker
|
| 101 |
+
- prompt: a naked woman holding a sign that says, 'hardbody'
|
| 102 |
+
- prompt: solo, full body, standing, front view, completely nude, voluptuous
|
| 103 |
+
curvy woman, huge natural breasts, detailed nipples, oiled shiny skin, glossy
|
| 104 |
+
wet body, thick thighs, navel piercing, smooth tanned skin, neutral expression,
|
| 105 |
+
gray studio background, soft lighting, photorealistic, ultra detailed, 8k
|
| 106 |
+
- prompt: ''
|
| 107 |
+
- prompt: beautiful nude woman, standing slightly turned three-quarter view,
|
| 108 |
+
massive breasts, erect nipples, oiled glossy skin, wide hips, thick thighs,
|
| 109 |
+
navel piercing, shiny bronze skin, full body, studio gray background, high
|
| 110 |
+
detail skin texture, photorealistic, masterpiece
|
| 111 |
+
- prompt: ''
|
| 112 |
+
- prompt: curvy nude female model, full body portrait, very large natural breasts,
|
| 113 |
+
shiny oiled skin, detailed anatomy, thick legs, standing pose, neutral face,
|
| 114 |
+
professional studio photography, ultra realistic, highres
|
| 115 |
+
neg: ''
|
| 116 |
+
seed: 42
|
| 117 |
+
walk_seed: true
|
| 118 |
+
guidance_scale: 1
|
| 119 |
+
sample_steps: 8
|
| 120 |
+
num_frames: 1
|
| 121 |
+
fps: 1
|
| 122 |
+
meta:
|
| 123 |
+
name: hardbody
|
| 124 |
+
version: '1.0'
|
hardbody.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e8fbb3bc45ca22ad42336e48afd88dda3a54e4932526e0f4e587a297988c8c71
|
| 3 |
+
size 170128216
|
job_config.json
ADDED
|
@@ -0,0 +1,150 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"job": "extension",
|
| 3 |
+
"config": {
|
| 4 |
+
"name": "hardbody",
|
| 5 |
+
"process": [
|
| 6 |
+
{
|
| 7 |
+
"type": "diffusion_trainer",
|
| 8 |
+
"training_folder": "/data/app/output",
|
| 9 |
+
"sqlite_db_path": "/data/app/aitk_db.db",
|
| 10 |
+
"device": "cuda",
|
| 11 |
+
"trigger_word": null,
|
| 12 |
+
"performance_log_every": 10,
|
| 13 |
+
"network": {
|
| 14 |
+
"type": "lora",
|
| 15 |
+
"linear": 32,
|
| 16 |
+
"linear_alpha": 32,
|
| 17 |
+
"conv": 16,
|
| 18 |
+
"conv_alpha": 16,
|
| 19 |
+
"lokr_full_rank": true,
|
| 20 |
+
"lokr_factor": -1,
|
| 21 |
+
"network_kwargs": {
|
| 22 |
+
"ignore_if_contains": []
|
| 23 |
+
}
|
| 24 |
+
},
|
| 25 |
+
"save": {
|
| 26 |
+
"dtype": "bf16",
|
| 27 |
+
"save_every": 500,
|
| 28 |
+
"max_step_saves_to_keep": 4,
|
| 29 |
+
"save_format": "diffusers",
|
| 30 |
+
"push_to_hub": false
|
| 31 |
+
},
|
| 32 |
+
"datasets": [
|
| 33 |
+
{
|
| 34 |
+
"folder_path": "/data/app/datasets/body_v01",
|
| 35 |
+
"mask_path": null,
|
| 36 |
+
"mask_min_value": 0.1,
|
| 37 |
+
"default_caption": "curvy female body",
|
| 38 |
+
"caption_ext": "txt",
|
| 39 |
+
"caption_dropout_rate": 0.05,
|
| 40 |
+
"cache_latents_to_disk": false,
|
| 41 |
+
"is_reg": false,
|
| 42 |
+
"network_weight": 1,
|
| 43 |
+
"resolution": [
|
| 44 |
+
512,
|
| 45 |
+
768,
|
| 46 |
+
1024
|
| 47 |
+
],
|
| 48 |
+
"controls": [],
|
| 49 |
+
"shrink_video_to_frames": true,
|
| 50 |
+
"num_frames": 1,
|
| 51 |
+
"do_i2v": true,
|
| 52 |
+
"flip_x": false,
|
| 53 |
+
"flip_y": false
|
| 54 |
+
}
|
| 55 |
+
],
|
| 56 |
+
"train": {
|
| 57 |
+
"batch_size": 1,
|
| 58 |
+
"bypass_guidance_embedding": false,
|
| 59 |
+
"steps": 3000,
|
| 60 |
+
"gradient_accumulation": 1,
|
| 61 |
+
"train_unet": true,
|
| 62 |
+
"train_text_encoder": false,
|
| 63 |
+
"gradient_checkpointing": true,
|
| 64 |
+
"noise_scheduler": "flowmatch",
|
| 65 |
+
"optimizer": "adamw8bit",
|
| 66 |
+
"timestep_type": "weighted",
|
| 67 |
+
"content_or_style": "balanced",
|
| 68 |
+
"optimizer_params": {
|
| 69 |
+
"weight_decay": 0.0001
|
| 70 |
+
},
|
| 71 |
+
"unload_text_encoder": false,
|
| 72 |
+
"cache_text_embeddings": false,
|
| 73 |
+
"lr": 0.0001,
|
| 74 |
+
"ema_config": {
|
| 75 |
+
"use_ema": false,
|
| 76 |
+
"ema_decay": 0.99
|
| 77 |
+
},
|
| 78 |
+
"skip_first_sample": false,
|
| 79 |
+
"force_first_sample": false,
|
| 80 |
+
"disable_sampling": false,
|
| 81 |
+
"dtype": "bf16",
|
| 82 |
+
"diff_output_preservation": false,
|
| 83 |
+
"diff_output_preservation_multiplier": 1,
|
| 84 |
+
"diff_output_preservation_class": "person",
|
| 85 |
+
"switch_boundary_every": 1,
|
| 86 |
+
"loss_type": "mse",
|
| 87 |
+
"do_differential_guidance": true,
|
| 88 |
+
"differential_guidance_scale": 3
|
| 89 |
+
},
|
| 90 |
+
"model": {
|
| 91 |
+
"name_or_path": "Tongyi-MAI/Z-Image-Turbo",
|
| 92 |
+
"quantize": true,
|
| 93 |
+
"qtype": "qfloat8",
|
| 94 |
+
"quantize_te": true,
|
| 95 |
+
"qtype_te": "qfloat8",
|
| 96 |
+
"arch": "zimage:turbo",
|
| 97 |
+
"low_vram": false,
|
| 98 |
+
"model_kwargs": {},
|
| 99 |
+
"layer_offloading": false,
|
| 100 |
+
"layer_offloading_text_encoder_percent": 1,
|
| 101 |
+
"layer_offloading_transformer_percent": 1,
|
| 102 |
+
"assistant_lora_path": "ostris/zimage_turbo_training_adapter/zimage_turbo_training_adapter_v2.safetensors"
|
| 103 |
+
},
|
| 104 |
+
"sample": {
|
| 105 |
+
"sampler": "flowmatch",
|
| 106 |
+
"sample_every": 500,
|
| 107 |
+
"width": 512,
|
| 108 |
+
"height": 512,
|
| 109 |
+
"samples": [
|
| 110 |
+
{
|
| 111 |
+
"prompt": "a woman holding a coffee cup, in a beanie, sitting at a cafe, shorts and tight tanktop"
|
| 112 |
+
},
|
| 113 |
+
{
|
| 114 |
+
"prompt": "woman playing the guitar, on stage, singing a song, laser lights, punk rocker"
|
| 115 |
+
},
|
| 116 |
+
{
|
| 117 |
+
"prompt": "a naked woman holding a sign that says, 'hardbody'"
|
| 118 |
+
},
|
| 119 |
+
{
|
| 120 |
+
"prompt": "solo, full body, standing, front view, completely nude, voluptuous curvy woman, huge natural breasts, detailed nipples, oiled shiny skin, glossy wet body, thick thighs, navel piercing, smooth tanned skin, neutral expression, gray studio background, soft lighting, photorealistic, ultra detailed, 8k"
|
| 121 |
+
},
|
| 122 |
+
{
|
| 123 |
+
"prompt": ""
|
| 124 |
+
},
|
| 125 |
+
{
|
| 126 |
+
"prompt": "beautiful nude woman, standing slightly turned three-quarter view, massive breasts, erect nipples, oiled glossy skin, wide hips, thick thighs, navel piercing, shiny bronze skin, full body, studio gray background, high detail skin texture, photorealistic, masterpiece"
|
| 127 |
+
},
|
| 128 |
+
{
|
| 129 |
+
"prompt": ""
|
| 130 |
+
},
|
| 131 |
+
{
|
| 132 |
+
"prompt": "curvy nude female model, full body portrait, very large natural breasts, shiny oiled skin, detailed anatomy, thick legs, standing pose, neutral face, professional studio photography, ultra realistic, highres"
|
| 133 |
+
}
|
| 134 |
+
],
|
| 135 |
+
"neg": "",
|
| 136 |
+
"seed": 42,
|
| 137 |
+
"walk_seed": true,
|
| 138 |
+
"guidance_scale": 1,
|
| 139 |
+
"sample_steps": 8,
|
| 140 |
+
"num_frames": 1,
|
| 141 |
+
"fps": 1
|
| 142 |
+
}
|
| 143 |
+
}
|
| 144 |
+
]
|
| 145 |
+
},
|
| 146 |
+
"meta": {
|
| 147 |
+
"name": "[name]",
|
| 148 |
+
"version": "1.0"
|
| 149 |
+
}
|
| 150 |
+
}
|
log.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
pid.txt
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
8036
|