qwip-test2 / trainer_state.json
e-n-v-y's picture
Upload folder using huggingface_hub
fea966d verified
{
"global_step": 10000,
"epoch": 0,
"args": {
"sdxl_model": "/home/envy/sd_xl_base_1.0.safetensors",
"llm_model": "Qwen/Qwen1.5-7B-Chat",
"output_path": "/home/envy/qwip-10layers-pooled",
"resume_from_checkpoint": null,
"prompts_dir": "/home/envy/promptgen",
"train_layers": 10,
"epochs": 1,
"batch_size": 4,
"lr": 1e-05,
"scheduler_type": "cosine",
"cosine_num_cycles": 1,
"warmup_ratio": 0.1,
"loss_type": "mse",
"precision": "bf16",
"max_llm_length": 128,
"save_every_n_steps": 5000,
"seed": 42,
"gradient_accumulation_steps": 1,
"use_flash_attention_2": true,
"gradient_checkpointing": false,
"dataloader_num_workers": 4
}
}