diff --git a/examples/run_squad.py b/examples/run_squad.py index 08306bb50e..18a5a1c23f 100644 --- a/examples/run_squad.py +++ b/examples/run_squad.py @@ -388,7 +388,7 @@ def evaluate(args, model, tokenizer, prefix=""): predictions = compute_predictions_logits(examples, features, all_results, args.n_best_size, args.max_answer_length, args.do_lower_case, output_prediction_file, output_nbest_file, output_null_log_odds_file, args.verbose_logging, - args.version_2_with_negative, args.null_score_diff_threshold) + args.version_2_with_negative, args.null_score_diff_threshold, tokenizer) # Compute the F1 and exact scores. results = squad_evaluate(examples, predictions)