From 15550ce0d18457e1b62634d0803c4cce835da417 Mon Sep 17 00:00:00 2001 From: Julien Chaumond Date: Fri, 15 May 2020 17:08:38 -0400 Subject: [PATCH] [skip ci] remove local rank --- .../language-modeling/run_language_modeling.py | 14 +++----------- src/transformers/configuration_roberta.py | 2 +- 2 files changed, 4 insertions(+), 12 deletions(-) diff --git a/examples/language-modeling/run_language_modeling.py b/examples/language-modeling/run_language_modeling.py index 822c0c948b..483d98fad9 100644 --- a/examples/language-modeling/run_language_modeling.py +++ b/examples/language-modeling/run_language_modeling.py @@ -115,7 +115,7 @@ class DataTrainingArguments: ) -def get_dataset(args: DataTrainingArguments, tokenizer: PreTrainedTokenizer, evaluate=False, local_rank=-1): +def get_dataset(args: DataTrainingArguments, tokenizer: PreTrainedTokenizer, evaluate=False): file_path = args.eval_data_file if evaluate else args.train_data_file if args.line_by_line: return LineByLineTextDataset(tokenizer=tokenizer, file_path=file_path, block_size=args.block_size) @@ -216,16 +216,8 @@ def main(): data_args.block_size = min(data_args.block_size, tokenizer.max_len) # Get datasets - train_dataset = ( - get_dataset(data_args, tokenizer=tokenizer, local_rank=training_args.local_rank) - if training_args.do_train - else None - ) - eval_dataset = ( - get_dataset(data_args, tokenizer=tokenizer, local_rank=training_args.local_rank, evaluate=True) - if training_args.do_eval - else None - ) + train_dataset = get_dataset(data_args, tokenizer=tokenizer) if training_args.do_train else None + eval_dataset = get_dataset(data_args, tokenizer=tokenizer, evaluate=True) if training_args.do_eval else None data_collator = DataCollatorForLanguageModeling( tokenizer=tokenizer, mlm=data_args.mlm, mlm_probability=data_args.mlm_probability ) diff --git a/src/transformers/configuration_roberta.py b/src/transformers/configuration_roberta.py index 03bdfe3031..80bb34e77b 100644 --- a/src/transformers/configuration_roberta.py +++ b/src/transformers/configuration_roberta.py @@ -68,6 +68,6 @@ class RobertaConfig(BertConfig): model_type = "roberta" def __init__(self, pad_token_id=1, bos_token_id=0, eos_token_id=2, **kwargs): - """Constructs FlaubertConfig. + """Constructs RobertaConfig. """ super().__init__(pad_token_id=pad_token_id, bos_token_id=bos_token_id, eos_token_id=eos_token_id, **kwargs)