#!/bin/sh
#
# Launches a Stable Cascade stage C training run
# (stable_cascade_train_stage_c.py) through `accelerate launch`, loading the
# model checkpoints written by an earlier run.
#
# All locations are hard-coded absolute paths under /home/ubuntu; edit the
# variables and arguments below to target a different run or machine.
#
# NOTE(review): the original script carried the bare line
#   /home/ubuntu/dataset/combined/newest-best
# at this position, which the shell would have tried to execute as a command.
# It is preserved here as a comment. It looks like a dataset location, but the
# command below reads /home/ubuntu/dataset/newest-best -- confirm which path
# is intended.

# Abort on the first failing command and on any unset variable.
set -eu

# Identify the earlier run to load checkpoints from: the command below reads
# them from "${OUT_PATH}-${PAST}/${PAST_SUB}/".
PAST=3
PAST_SUB=1

# Path prefix shared by the earlier runs' output directories.
OUT_PATH="/home/ubuntu/out/sotediffusion-wr3_3b"
# File handed to --sample_prompts.
PROMPT_PATH="/home/ubuntu/sotediffusion-prompt.txt"
# Directory containing effnet_encoder.safetensors and previewer.safetensors.
WUER_PATH="/home/ubuntu/models"

# The whole invocation is ONE command joined by trailing backslashes: nothing
# (not even a space or a comment) may follow a backslash, and no blank line
# may appear between the continued lines.
#
# --mixed_precision occurs twice: before the script name it is an option of
# `accelerate launch`; after the script name it is an argument of the
# training script itself.
#
# Every variable expansion is double-quoted so that a path containing
# whitespace or glob characters is still passed as a single argument.
accelerate launch --mixed_precision bf16 --multi_gpu stable_cascade_train_stage_c.py \
  --mixed_precision bf16 \
  --save_precision fp16 \
  --sdpa \
  --ddp_static_graph \
  --resolution "1024,1024" \
  --train_batch_size 16 \
  --gradient_checkpointing \
  --learning_rate 4e-6 \
  --learning_rate_te1 0 \
  --lr_scheduler constant_with_warmup \
  --lr_warmup_steps 100 \
  --optimizer_type adafactor \
  --optimizer_args "scale_parameter=False" "relative_step=False" "warmup_init=False" \
  --token_warmup_min 1 \
  --token_warmup_step 0 \
  --shuffle_caption \
  --caption_separator ", " \
  --caption_dropout_rate 0 \
  --caption_tag_dropout_rate 0 \
  --caption_dropout_every_n_epochs 0 \
  --dataset_repeats 1 \
  --save_state \
  --save_every_n_steps 1024 \
  --sample_every_n_steps 512 \
  --max_token_length 225 \
  --max_train_epochs 16 \
  --caption_extension ".txt" \
  --max_data_loader_n_workers 16 \
  --persistent_data_loader_workers \
  --enable_bucket \
  --min_bucket_reso 256 \
  --max_bucket_reso 4096 \
  --bucket_reso_steps 64 \
  --bucket_no_upscale \
  --log_with tensorboard \
  --output_name sotediffusion-wr3_3b \
  --train_data_dir /home/ubuntu/dataset/newest-best \
  --in_json /home/ubuntu/dataset/newest-best.json \
  --output_dir /home/ubuntu/out/final \
  --logging_dir /home/ubuntu/out/final/logs \
  --stage_c_checkpoint_path "${OUT_PATH}-${PAST}/${PAST_SUB}/sotediffusion-wr3_3b.safetensors" \
  --text_model_checkpoint_path "${OUT_PATH}-${PAST}/${PAST_SUB}/sotediffusion-wr3_3b_text_model.safetensors" \
  --effnet_checkpoint_path "${WUER_PATH}/effnet_encoder.safetensors" \
  --previewer_checkpoint_path "${WUER_PATH}/previewer.safetensors" \
  --sample_prompts "${PROMPT_PATH}"