---
# Flat mapping of training hyperparameters: one plain scalar per key, keys kept
# in alphabetical order so diffs between runs stay small.
# NOTE(review): the key names and values (output_dir, tracker_name, beta_dpo,
# rank) suggest a Diffusion-DPO LoRA fine-tuning run; confirm against the
# script that consumes this file.
adam_beta1: 0.9
adam_beta2: 0.999
adam_epsilon: 1.0e-08
adam_weight_decay: 0.01
allow_tf32: false
beta_dpo: 2500
cache_dir: null
checkpointing_steps: 2000
checkpoints_total_limit: null
dataloader_num_workers: 0
dataset_name: kashif/pickascore
# NOTE(review): the split used here is named "validation"; confirm that this is
# the intended split for this run.
dataset_split_name: validation
enable_xformers_memory_efficient_attention: false
gradient_accumulation_steps: 1
gradient_checkpointing: true
hub_model_id: null
hub_token: null
learning_rate: 1.0e-05
local_rank: -1
logging_dir: logs
loss_type: sigmoid
lr_num_cycles: 1
lr_power: 1.0
lr_scheduler: constant
lr_warmup_steps: 0
max_grad_norm: 1.0
max_train_samples: null
# NOTE(review): max_train_steps and num_train_epochs are both set; verify which
# one the consumer honours when they disagree.
max_train_steps: 10000
mixed_precision: fp16
no_hflip: false
num_train_epochs: 20
output_dir: diffusion-dpo
pretrained_model_name_or_path: runwayml/stable-diffusion-v1-5
prior_generation_precision: null
# NOTE(review): push_to_hub is true while hub_model_id and hub_token are null;
# presumably the consumer falls back to defaults/cached credentials. Confirm.
push_to_hub: true
random_crop: false
rank: 8
report_to: tensorboard
resolution: 512
resume_from_checkpoint: null
revision: null
run_validation: true
scale_lr: false
seed: 0
tracker_name: diffusion-dpo-lora
train_batch_size: 1
use_8bit_adam: true
vae_encode_batch_size: 8
validation_steps: 200
variant: null