---
# Training-run configuration: a single flat mapping of settings.
# Each key must sit on its own line; with several "key: value" pairs on one
# line the document is not a valid YAML mapping and cannot be loaded.
# NOTE(review): group headings below are inferred from the key names only;
# confirm exact semantics against the code that consumes this file.

# --- Run identity / model selection ---
experiment_id: sotediffusion-wr3_3b-stage_b
model_version: 3B
dtype: float32
use_fsdp: false

# --- Batch / schedule ---
batch_size: 8
grad_accum_steps: 4
updates: 1024000
backup_every: 2048
save_every: 1024
warmup_updates: 128

# --- Optimisation ---
# Keep both the decimal point and the signed exponent: YAML 1.1 parsers
# (e.g. PyYAML) only resolve this form as a float rather than a string.
lr: 8.0e-6
optimizer_type: AdamW
adaptive_loss_weight: false
stochastic_rounding: false

# --- Image / sampling settings ---
image_size: 1024
# The entries are plain scalars, so a YAML parser yields strings such as
# "1/2", not numbers. Presumably the consumer converts them - verify.
multi_aspect_ratio: [1/1, 1/2, 1/3, 2/3, 3/4, 1/5, 2/5, 3/5, 4/5, 1/6, 5/6, 9/16]
shift: 4

# --- Filesystem locations (all absolute, under /home/ubuntu) ---
# checkpoint_path and output_path point at the same directory.
checkpoint_path: /home/ubuntu/out/
output_path: /home/ubuntu/out/
# Quoted because the value contains a colon.
webdataset_path: 'file:/home/ubuntu/newest_best.tar'
effnet_checkpoint_path: /home/ubuntu/models/wuerstchen3/effnet_encoder.safetensors
stage_a_checkpoint_path: /home/ubuntu/models/wuerstchen3/stage_a.safetensors
generator_checkpoint_path: /home/ubuntu/models/wuerstchen3/generator-020480.safetensors