sentiment140-word-gap/roberta_with_year_from_scratch/2_run.sh
2021-11-11 10:49:15 +01:00

23 lines
750 B
Bash

#!/usr/bin/env bash
#
# Launches run_mlm.py (masked-language-model training + evaluation) starting
# from the `roberta-base` checkpoint with the tokenizer stored in
# ./tokenizer_model, reading ./train_in.csv and ./dev-0_in.csv, and writing
# checkpoints to ./robertamodel.  Standard output of the run is appended to
# logs_regular.txt (stderr is not piped and still goes to the terminal).
#
# Requires bash (uses `pipefail` and arrays).
#
# NOTE(review): the directory name says "from_scratch" but the run loads
# `roberta-base` via --model_name_or_path -- confirm this is intended.

# Without pipefail the exit status of the pipeline below would be tee's, so a
# crashed training run would still make this script exit 0.
set -o pipefail

# Optional guard, intentionally left disabled: refuse to start when no GPU
# selection has been exported.
#if [ -z "${CUDA_VISIBLE_DEVICES+x}" ]; then echo "CUDA_VISIBLE_DEVICES NOT SET"; exit 1 ; else echo "using cuda devices '$CUDA_VISIBLE_DEVICES'"; fi

train_args=(
  # Model, tokenizer and data.
  --model_name_or_path roberta-base
  --tokenizer_name tokenizer_model
  --max_seq_length 64
  --train_file ./train_in.csv
  --validation_file ./dev-0_in.csv
  --output_dir ./robertamodel

  # Run both the training and the evaluation phase.
  --do_train
  --do_eval

  # Batching / precision.
  --per_device_train_batch_size=256
  --per_device_eval_batch_size=256
  --gradient_accumulation_steps=1
  --fp16 False

  # Schedule: checkpoint, evaluate and log on the same 1000-step cadence.
  --num_train_epochs 40
  --warmup_steps 1000
  --evaluation_strategy steps
  --save_steps 1000
  --eval_steps 1000
  --logging_steps 1000
)

# Last command of the script: with pipefail its status (and therefore the
# script's exit status) is non-zero whenever python or tee fails.
python run_mlm.py "${train_args[@]}" \
  | tee --append logs_regular.txt