egrpo / scripts /finetune /finetune_g2rpo_hps_clip.sh
studyOverflow's picture
Add files using upload-large-folder tool
45d12c1 verified
export NNODES=${NODE_COUNT:-2}
export PROC_PER_NODE=${PROC_PER_NODE:-8}
export MASTER_ADDR=${MASTER_ADDR}
export NODE_RANK=${NODE_RANK}
export MASTER_PORT=29533
torchrun --nnodes=2 --nproc_per_node=$PROC_PER_NODE --node_rank $NODE_RANK --master_addr $MASTER_ADDR --master_port $MASTER_PORT \
fastvideo/train_g2rpo_hps_clip_merge.py \
--seed 42 \
--pretrained_model_name_or_path ckpt/flux \
--hps_path ckpt/hps/HPS_v2.1_compressed.pt \
--hps_clip_path ckpt/CLIP-ViT-H-14-laion2B-s32B-b79K/open_clip_pytorch_model.bin \
--clip_score_path ckpt/clip_score \
--data_json_path data/rl_embeddings/videos2caption.json \
--gradient_checkpointing \
--train_batch_size 1 \
--num_latent_t 1 \
--sp_size 1 \
--train_sp_batch_size 1 \
--dataloader_num_workers 4 \
--max_train_steps 301 \
--learning_rate 2e-6 \
--mixed_precision bf16 \
--checkpointing_steps 50 \
--cfg 0.0 \
--output_dir save_exp/hps_clip \
--h 720 \
--w 720 \
--t 1 \
--sampling_steps 16 \
--eta 0.7 \
--lr_warmup_steps 0 \
--sampler_seed 1223627 \
--max_grad_norm 1.0 \
--weight_decay 0.0001 \
--num_generations 12 \
--shift 3 \
--init_same_noise \
--clip_range 1e-4 \
--adv_clip_max 5.0 \
--eta_step_list 0 1 2 3 4 5 6 7 8 9 10 11 12 13 14 \
--granular_list 1 \