lykeven
/

uptest

Model card Files Files and versions

Metrics Training metrics Community

uptest / ptuning /train.sh

lykeven's picture

first model commit

54abf22 almost 3 years ago

history blame contribute delete

766 Bytes

	# Launch main.py in training mode (--do_train) on the AdvertiseGen
	# train/dev JSON files, restricted to GPU 0 via CUDA_VISIBLE_DEVICES.
	#
	# Tunables:
	#   PRE_SEQ_LEN - value passed to --pre_seq_len; also part of the output dir name.
	#   LR          - value passed to --learning_rate; also part of the output dir name.
	#   MODEL_PATH  - value passed to --model_name_or_path. May be supplied through
	#                 the environment; falls back to the path originally hard-coded
	#                 in this script so existing usage keeps working.
	#
	# Run from the directory containing main.py and the AdvertiseGen/ folder,
	# since both are referenced by relative path.
	PRE_SEQ_LEN=128
	LR=2e-2
	MODEL_PATH="${MODEL_PATH:-/home/wangyan/project/hft/uptest}"

	# Expansions are quoted so an edited value containing whitespace or glob
	# characters cannot be split into extra arguments.
	CUDA_VISIBLE_DEVICES=0 python3 main.py \
	--do_train \
	--train_file AdvertiseGen/train.json \
	--validation_file AdvertiseGen/dev.json \
	--prompt_column content \
	--response_column summary \
	--overwrite_cache \
	--model_name_or_path "$MODEL_PATH" \
	--output_dir "output/adgen-chatglm-6b-pt-${PRE_SEQ_LEN}-${LR}" \
	--overwrite_output_dir \
	--max_source_length 64 \
	--max_target_length 64 \
	--per_device_train_batch_size 1 \
	--per_device_eval_batch_size 1 \
	--gradient_accumulation_steps 16 \
	--predict_with_generate \
	--max_steps 100 \
	--logging_steps 10 \
	--save_steps 50 \
	--learning_rate "$LR" \
	--pre_seq_len "$PRE_SEQ_LEN" \
	--quantization_bit 4