From 834b485b2e74e00697bfc51f8a97a5ba60d23b5d Mon Sep 17 00:00:00 2001
From: thomwolf <thomwolf@gmail.com>
Date: Sun, 4 Nov 2018 12:07:38 +0100
Subject: [PATCH] logging + update copyright

---
 convert_tf_checkpoint_to_pytorch.py | 13 ++++++++++++
 extract_features.py                 |  4 ++--
 modeling.py                         |  4 ++--
 optimization.py                     | 16 ++++++++++++++
 run_classifier.py                   |  2 +-
 run_squad.py                        | 33 +++--------------------------
 tokenization.py                     |  2 +-
 7 files changed, 38 insertions(+), 36 deletions(-)

diff --git a/convert_tf_checkpoint_to_pytorch.py b/convert_tf_checkpoint_to_pytorch.py
index c35ab1d248..dfcdbee42d 100644
--- a/convert_tf_checkpoint_to_pytorch.py
+++ b/convert_tf_checkpoint_to_pytorch.py
@@ -1,4 +1,17 @@
 # coding=utf-8
+# Copyright 2018 The HugginFace Inc. team.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
 """Convert BERT checkpoint."""
 
 from __future__ import absolute_import
diff --git a/extract_features.py b/extract_features.py
index 4f2f0b5d67..b9625c266d 100644
--- a/extract_features.py
+++ b/extract_features.py
@@ -1,5 +1,5 @@
 # coding=utf-8
-# Copyright 2018 The Google AI Language Team Authors.
+# Copyright 2018 The Google AI Language Team Authors and The HugginFace Inc. team.
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
@@ -12,7 +12,7 @@
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
-"""Extract pre-computed feature vectors from BERT."""
+"""Extract pre-computed feature vectors from a PyTorch BERT model."""
 
 from __future__ import absolute_import
 from __future__ import division
diff --git a/modeling.py b/modeling.py
index db9ca6e0d8..a240474d96 100644
--- a/modeling.py
+++ b/modeling.py
@@ -1,5 +1,5 @@
 # coding=utf-8
-# Copyright 2018 The Google AI Language Team Authors.
+# Copyright 2018 The Google AI Language Team Authors and The HugginFace Inc. team.
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
@@ -12,7 +12,7 @@
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
-"""Common utility functions related to TensorFlow."""
+"""PyTorch BERT model."""
 
 from __future__ import absolute_import
 from __future__ import division
diff --git a/optimization.py b/optimization.py
index 6ff62a7609..91701e4255 100644
--- a/optimization.py
+++ b/optimization.py
@@ -1,3 +1,19 @@
+# coding=utf-8
+# Copyright 2018 The Google AI Language Team Authors and The HugginFace Inc. team.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+"""PyTorch optimization for BERT model."""
+
 import math
 import torch
 from torch.optim import Optimizer
diff --git a/run_classifier.py b/run_classifier.py
index 367b0c5221..c4a2e7ee61 100644
--- a/run_classifier.py
+++ b/run_classifier.py
@@ -1,5 +1,5 @@
 # coding=utf-8
-# Copyright 2018 The Google AI Language Team Authors.
+# Copyright 2018 The Google AI Language Team Authors and The HugginFace Inc. team.
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
diff --git a/run_squad.py b/run_squad.py
index 4529fc6ffc..51a5ad5963 100644
--- a/run_squad.py
+++ b/run_squad.py
@@ -1,5 +1,5 @@
 # coding=utf-8
-# Copyright 2018 The Google AI Language Team Authors.
+# Copyright 2018 The Google AI Language Team Authors and The HugginFace Inc. team.
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
@@ -720,22 +720,6 @@ def main():
                         help="The maximum length of an answer that can be generated. This is needed because the start "
                              "and end predictions are not conditioned on one another.")
 
-    ### BEGIN - TO DELETE EVENTUALLY --> NO SENSE IN PYTORCH ###
-    # parser.add_argument("--use_tpu", default=False, action='store_true', help="Whether to use TPU or GPU/CPU.")
-    # parser.add_argument("--tpu_name", default=None, type=str,
-    #                     help="The Cloud TPU to use for training. This should be either the name used when creating the "
-    #                          "Cloud TPU, or a grpc://ip.address.of.tpu:8470 url.")
-    # parser.add_argument("--tpu_zone", default=None, type=str,
-    #                     help="[Optional] GCE zone where the Cloud TPU is located in. If not specified, we will attempt "
-    #                          "to automatically detect the GCE project from metadata.")
-    # parser.add_argument("--gcp_project", default=None, type=str,
-    #                     help="[Optional] Project name for the Cloud TPU-enabled project. If not specified, we will attempt "
-    #                          "to automatically detect the GCE project from metadata.")
-    # parser.add_argument("--master", default=None, type=str, help="[Optional] TensorFlow master URL.")
-    # parser.add_argument("--num_tpu_cores", default=8, type=int, help="Only used if `use_tpu` is True. "
-    #                                                                  "Total number of TPU cores to use.")
-    ### END - TO DELETE EVENTUALLY --> NO SENSE IN PYTORCH ###
-
     parser.add_argument("--verbose_logging", default=False, action='store_true',
                         help="If true, all of the warnings related to data processing will be printed. "
                              "A number of warnings are expected for a normal SQuAD evaluation.")
@@ -859,10 +843,10 @@ def main():
                 segment_ids = segment_ids.to(device)
                 start_positions = start_positions.to(device)
                 end_positions = start_positions.to(device)
-                
+
                 start_positions = start_positions.view(-1, 1)
                 end_positions = end_positions.view(-1, 1)
-                
+
                 loss, _ = model(input_ids, segment_ids, input_mask, start_positions, end_positions)
                 if n_gpu > 1:
                     loss = loss.mean() # mean() to average on multi-gpu.
@@ -871,7 +855,6 @@ def main():
                 loss.backward()
                 optimizer.step()
                 global_step += 1
-                logger.info("Done %s steps", global_step)
 
     if args.do_predict:
         eval_examples = read_squad_examples(
@@ -892,10 +875,8 @@ def main():
         all_input_ids = torch.tensor([f.input_ids for f in eval_features], dtype=torch.long)
         all_input_mask = torch.tensor([f.input_mask for f in eval_features], dtype=torch.long)
         all_segment_ids = torch.tensor([f.segment_ids for f in eval_features], dtype=torch.long)
-        #all_label_ids = torch.tensor([f.label_id for f in eval_features], dtype=torch.long)
         all_example_index = torch.arange(all_input_ids.size(0), dtype=torch.long)
 
-        #eval_data = TensorDataset(all_input_ids, all_input_mask, all_segment_ids, all_label_ids, all_example_index)
         eval_data = TensorDataset(all_input_ids, all_input_mask, all_segment_ids, all_example_index)
         if args.local_rank == -1:
             eval_sampler = SequentialSampler(eval_data)
@@ -906,7 +887,6 @@ def main():
         model.eval()
         all_results = []
         logger.info("Start evaluating")
-        #for input_ids, input_mask, segment_ids, label_ids, example_index in eval_dataloader:
         for input_ids, input_mask, segment_ids, example_index in tqdm(eval_dataloader, descr="Evaluating"):
             if len(all_results) % 1000 == 0:
                 logger.info("Processing example: %d" % (len(all_results)))
@@ -918,9 +898,7 @@ def main():
             start_logits, end_logits = model(input_ids, segment_ids, input_mask)
 
             unique_id = [int(eval_features[e.item()].unique_id) for e in example_index]
-            #start_logits = [x.item() for x in start_logits]
             start_logits = [x.view(-1).detach().cpu().numpy() for x in start_logits]
-            #end_logits = [x.item() for x in end_logits]
             end_logits = [x.view(-1).detach().cpu().numpy() for x in end_logits]
             for idx, i in enumerate(unique_id):
                 s = [float(x) for x in start_logits[idx]]
@@ -932,11 +910,6 @@ def main():
                         end_logits=e
                     )
                 )
-            # all_results.append(
-            #     RawResult(
-            #         unique_id=unique_id,
-            #         start_logits=start_logits,
-            #         end_logits=end_logits))
 
         output_prediction_file = os.path.join(args.output_dir, "predictions.json")
         output_nbest_file = os.path.join(args.output_dir, "nbest_predictions.json")
diff --git a/tokenization.py b/tokenization.py
index cb0c78c0bd..83bc86e444 100644
--- a/tokenization.py
+++ b/tokenization.py
@@ -1,5 +1,5 @@
 # coding=utf-8
-# Copyright 2018 The Google AI Language Team Authors.
+# Copyright 2018 The Google AI Language Team Authors and The HugginFace Inc. team.
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.