[examples] fixes arguments for summarization finetune scripts (#5157)
Authored-by: i.boytsov <i.boytsov@MAC867.local>
This commit is contained in:
@@ -1,7 +1,3 @@
|
|||||||
export OUTPUT_DIR=bart_cnn_finetune
|
|
||||||
|
|
||||||
# Make output directory if it doesn't exist
|
|
||||||
mkdir -p $OUTPUT_DIR
|
|
||||||
|
|
||||||
# Add parent directory to python path to access lightning_base.py
|
# Add parent directory to python path to access lightning_base.py
|
||||||
export PYTHONPATH="../":"${PYTHONPATH}"
|
export PYTHONPATH="../":"${PYTHONPATH}"
|
||||||
@@ -9,6 +5,7 @@ export PYTHONPATH="../":"${PYTHONPATH}"
|
|||||||
|
|
||||||
# --model_name_or_path=t5-base for t5
|
# --model_name_or_path=t5-base for t5
|
||||||
|
|
||||||
|
# the proper usage is documented in the README
|
||||||
python finetune.py \
|
python finetune.py \
|
||||||
--model_name_or_path=facebook/bart-large \
|
--model_name_or_path=facebook/bart-large \
|
||||||
--learning_rate=3e-5 \
|
--learning_rate=3e-5 \
|
||||||
|
|||||||
@@ -16,14 +16,13 @@ mkdir -p $OUTPUT_DIR
|
|||||||
export PYTHONPATH="../":"${PYTHONPATH}"
|
export PYTHONPATH="../":"${PYTHONPATH}"
|
||||||
python finetune.py \
|
python finetune.py \
|
||||||
--data_dir=cnn_tiny/ \
|
--data_dir=cnn_tiny/ \
|
||||||
--model_type=bart \
|
|
||||||
--model_name_or_path=sshleifer/bart-tiny-random \
|
--model_name_or_path=sshleifer/bart-tiny-random \
|
||||||
--learning_rate=3e-5 \
|
--learning_rate=3e-5 \
|
||||||
--train_batch_size=2 \
|
--train_batch_size=2 \
|
||||||
--eval_batch_size=2 \
|
--eval_batch_size=2 \
|
||||||
--output_dir=$OUTPUT_DIR \
|
--output_dir=$OUTPUT_DIR \
|
||||||
--num_train_epochs=1 \
|
--num_train_epochs=1 \
|
||||||
--n_gpu=0 \
|
--gpus=0 \
|
||||||
--do_train $@
|
--do_train $@
|
||||||
|
|
||||||
rm -rf cnn_tiny
|
rm -rf cnn_tiny
|
||||||
|
|||||||
@@ -11,7 +11,6 @@ export PYTHONPATH="../":"${PYTHONPATH}"
|
|||||||
python finetune.py \
|
python finetune.py \
|
||||||
--data_dir=./cnn-dailymail/cnn_dm \
|
--data_dir=./cnn-dailymail/cnn_dm \
|
||||||
--model_name_or_path=t5-large \
|
--model_name_or_path=t5-large \
|
||||||
--model_type=t5
|
|
||||||
--learning_rate=3e-5 \
|
--learning_rate=3e-5 \
|
||||||
--train_batch_size=4 \
|
--train_batch_size=4 \
|
||||||
--eval_batch_size=4 \
|
--eval_batch_size=4 \
|
||||||
|
|||||||
Reference in New Issue
Block a user