-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathscript.txt
37 lines (33 loc) · 1.63 KB
/
script.txt
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
# Working script
# Runs prepare_data.py for the t5 model type with --task multi and the
# highlight_qg_format, reading from ./data/squad_multitask.
# --train_file_name / --valid_file_name are presumably the names of the files
# it produces -- confirm against prepare_data.py.
python prepare_data.py \
  --task multi --valid_for_qg_only \
  --model_type t5 \
  --dataset_path ./data/squad_multitask \
  --qg_format highlight_qg_format \
  --max_source_length 512 --max_target_length 32 \
  --train_file_name train_data_qa_qg_hl_t5.pt \
  --valid_file_name valid_data_qg_hl_t5.pt
# Runs run_qg.py on t5-small with --do_train, --do_eval and
# --evaluate_during_training, using --output_dir t5-small-qg-hl.
# NOTE(review): --train_file_path points at data/train_data_qg_hl_t5.pt, while
# the prepare_data.py call above passes
# --train_file_name train_data_qa_qg_hl_t5.pt (note the extra "qa_").
# Confirm which file is intended.
python run_qg.py \
  --model_name_or_path t5-small --model_type t5 \
  --tokenizer_name_or_path t5_qg_tokenizer \
  --output_dir t5-small-qg-hl \
  --train_file_path data/train_data_qg_hl_t5.pt \
  --valid_file_path data/valid_data_qg_hl_t5.pt \
  --per_device_train_batch_size 32 --per_device_eval_batch_size 32 \
  --gradient_accumulation_steps 8 \
  --learning_rate 1e-4 --num_train_epochs 10 --seed 42 \
  --do_train --do_eval --evaluate_during_training \
  --logging_steps 100
# Testing script
# prepare_data.py variant that passes --load_local together with the
# train-v2.0.json / dev-v2.0.json files and --dataset_path ./data/squad2/.
# The remaining flags match the working-script invocation.
python prepare_data.py \
  --task multi --valid_for_qg_only \
  --model_type t5 \
  --load_local \
  --dataset_path ./data/squad2/ \
  --train_file train-v2.0.json --valid_file dev-v2.0.json \
  --qg_format highlight_qg_format \
  --max_source_length 512 --max_target_length 32 \
  --train_file_name train_data_qa_qg_hl_t5.pt \
  --valid_file_name valid_data_qg_hl_t5.pt
# Runs run_qg.py on t5-base with --do_train and --do_eval.
# NOTE(review): --output_dir is t5-small-qg-hl even though the model is
# t5-base, and it is the same directory the t5-small run uses. Confirm this is
# intended.
# NOTE(review): --train_file_path is data/train_data_qg_hl_t5.pt, whereas the
# prepare_data.py call passes --train_file_name train_data_qa_qg_hl_t5.pt.
# Verify the file name.
# NOTE(review): --evaluate_during_training is not passed here, unlike the
# t5-small run.
python run_qg.py \
  --model_name_or_path t5-base --model_type t5 \
  --tokenizer_name_or_path t5_qg_tokenizer \
  --output_dir t5-small-qg-hl \
  --train_file_path data/train_data_qg_hl_t5.pt \
  --valid_file_path data/valid_data_qg_hl_t5.pt \
  --per_device_train_batch_size 32 --per_device_eval_batch_size 32 \
  --gradient_accumulation_steps 8 \
  --learning_rate 1e-4 --num_train_epochs 10 --seed 42 \
  --do_train --do_eval \
  --logging_steps 100