[s2s/distill] remove run_distiller.sh, fix xsum script (#8412)
This commit is contained in:
@@ -1,10 +0,0 @@
|
|||||||
# Add parent directory to python path to access lightning_base.py
|
|
||||||
export PYTHONPATH="../":"${PYTHONPATH}"
|
|
||||||
|
|
||||||
python distillation.py \
|
|
||||||
--learning_rate=3e-4 \
|
|
||||||
--do_train \
|
|
||||||
--do_predict \
|
|
||||||
--fp16 \
|
|
||||||
--val_check_interval 0.1 \
|
|
||||||
"$@"
|
|
||||||
@@ -2,6 +2,7 @@
|
|||||||
export PYTHONPATH="../":"${PYTHONPATH}"
|
export PYTHONPATH="../":"${PYTHONPATH}"
|
||||||
python distillation.py \
|
python distillation.py \
|
||||||
--teacher facebook/bart-large-xsum --data_dir xsum \
|
--teacher facebook/bart-large-xsum --data_dir xsum \
|
||||||
|
--tokenizer_name facebook/bart-large-xsum \
|
||||||
--student_decoder_layers 6 --student_encoder_layers 12 \
|
--student_decoder_layers 6 --student_encoder_layers 12 \
|
||||||
--freeze_encoder --freeze_embeds \
|
--freeze_encoder --freeze_embeds \
|
||||||
--learning_rate=3e-4 \
|
--learning_rate=3e-4 \
|
||||||
|
|||||||
Reference in New Issue
Block a user