REM Page metadata captured with this file (not part of the script):
REM   uploader: tassadar667; commit 6672870 ("Upload 64 files"); size: 716 Bytes
REM Launch main.py in training mode (--do_train) using the AdvertiseGen
REM train/dev JSON files and write results under output/adgen-chatglm-6b-pt.
REM
REM The first line used to be the POSIX form "VAR=value command". cmd.exe does
REM not support that form: it tries to run "CUDA_VISIBLE_DEVICES=0" as a program
REM and the variable is never set. The variable is now assigned with SET, and
REM SETLOCAL keeps the assignment from leaking into the calling console after
REM this script finishes.
REM
REM NOTE(review): --model_name_or_path is an absolute path on one machine;
REM adjust it to the local checkout before running.
REM NOTE(review): the meaning of each option is defined by main.py, which is not
REM visible here; confirm values such as pre_seq_len and quantization_bit there.
REM
REM Every line of the command except the last ends with a caret as its final
REM character; a trailing space after the caret would break the continuation.
setlocal
set "CUDA_VISIBLE_DEVICES=0"
python main.py ^
--do_train ^
--train_file AdvertiseGen/train.json ^
--validation_file AdvertiseGen/dev.json ^
--prompt_column content ^
--response_column summary ^
--overwrite_cache ^
--model_name_or_path G:/CODE/Python/ChatGLM-6B-main ^
--output_dir output/adgen-chatglm-6b-pt ^
--overwrite_output_dir ^
--max_source_length 64 ^
--max_target_length 64 ^
--per_device_train_batch_size 1 ^
--per_device_eval_batch_size 1 ^
--gradient_accumulation_steps 16 ^
--predict_with_generate ^
--max_steps 3000 ^
--logging_steps 10 ^
--save_steps 1000 ^
--learning_rate 2e-2 ^
--pre_seq_len 512 ^
--quantization_bit 4