Merge pull request #570 from MottoX/fix-1

Create optimizer only when args.do_train is True
This commit is contained in:
Thomas Wolf
2019-05-08 16:07:50 +02:00
committed by GitHub
5 changed files with 130 additions and 125 deletions

View File

@@ -534,6 +534,7 @@ def main():
model = torch.nn.DataParallel(model)
# Prepare optimizer
if args.do_train:
param_optimizer = list(model.named_parameters())
no_decay = ['bias', 'LayerNorm.bias', 'LayerNorm.weight']
optimizer_grouped_parameters = [

View File

@@ -763,6 +763,7 @@ def main():
model = torch.nn.DataParallel(model)
# Prepare optimizer
if args.do_train:
param_optimizer = list(model.named_parameters())
no_decay = ['bias', 'LayerNorm.bias', 'LayerNorm.weight']
optimizer_grouped_parameters = [

View File

@@ -183,6 +183,7 @@ def main():
eval_dataloader = DataLoader(eval_data, sampler=eval_sampler, batch_size=args.eval_batch_size)
# Prepare optimizer
if args.do_train:
param_optimizer = list(model.named_parameters())
no_decay = ['bias', 'LayerNorm.bias', 'LayerNorm.weight']
optimizer_grouped_parameters = [

View File

@@ -922,6 +922,7 @@ def main():
model = torch.nn.DataParallel(model)
# Prepare optimizer
if args.do_train:
param_optimizer = list(model.named_parameters())
# hack to remove pooler, which is not used

View File

@@ -385,6 +385,7 @@ def main():
model = torch.nn.DataParallel(model)
# Prepare optimizer
if args.do_train:
param_optimizer = list(model.named_parameters())
# hack to remove pooler, which is not used