add initialization for everybody

2019-09-26 10:06:20 +02:00
parent f2a337b3ed
commit 5705333441
9 changed files with 195 additions and 99 deletions
--- a/examples/run_tf_glue.py
+++ b/examples/run_tf_glue.py
@@ -1,37 +1,48 @@
 import tensorflow as tf
 import tensorflow_datasets
-from transformers import *
+from pytorch_transformers import *

 # Load dataset, tokenizer, model from pretrained model/vocabulary
 tokenizer = BertTokenizer.from_pretrained('bert-base-cased')
-dataset = tensorflow_datasets.load('glue/mrpc')
 model = TFBertForSequenceClassification.from_pretrained('bert-base-cased')
+data = tensorflow_datasets.load('glue/mrpc')

 # Prepare dataset for GLUE as a tf.data.Dataset instance
-train_dataset = glue_convert_examples_to_features(dataset['train'], tokenizer, task='mrpc')
-valid_dataset = glue_convert_examples_to_features(dataset['validation'], tokenizer, task='mrpc')
-train_dataset = train_dataset.shuffle(100).batch(32).repeat(3)
+train_dataset = glue_convert_examples_to_features(data['train'], tokenizer, 128, 'mrpc')
+valid_dataset = glue_convert_examples_to_features(data['validation'], tokenizer, 128, 'mrpc')
+train_dataset = train_dataset.shuffle(100).batch(32).repeat(2)
 valid_dataset = valid_dataset.batch(64)

 # Prepare training: Compile tf.keras model with optimizer, loss and learning rate schedule 
-learning_rate = tf.keras.optimizers.schedules.PolynomialDecay(2e-5, 345, end_learning_rate=0)
-optimizer = tf.keras.optimizers.Adam(learning_rate=learning_rate, epsilon=1e-08, clipnorm=1.0)
+optimizer = tf.keras.optimizers.Adam(learning_rate=3e-5, epsilon=1e-08, clipnorm=1.0)
 loss = tf.keras.losses.SparseCategoricalCrossentropy(from_logits=True)
-
-model.compile(optimizer=optimizer, loss=loss, metrics=['sparse_categorical_accuracy'])
+metric = tf.keras.metrics.SparseCategoricalAccuracy('accuracy')
+model.compile(optimizer=optimizer, loss=loss, metrics=[metric])

 # Train and evaluate using tf.keras.Model.fit()
-model.fit(train_dataset, epochs=3, steps_per_epoch=115,
-          validation_data=valid_dataset, validation_steps=7)
+history = model.fit(train_dataset, epochs=2, steps_per_epoch=115,
+                    validation_data=valid_dataset, validation_steps=7)

-# Save the TensorFlow model and load it in PyTorch
+# >>> Train for 115 steps, validate for 7 steps
+# >>> Epoch 1/2
+# >>> 115/115 [==============================] - 53s 459ms/step - loss: 0.6033 - accuracy: 0.6712 - val_loss: 0.4964 - val_accuracy: 0.7647
+# >>> Epoch 2/2
+# >>> 115/115 [==============================] - 33s 289ms/step - loss: 0.4141 - accuracy: 0.8160 - val_loss: 0.3914 - val_accuracy: 0.8382
+
+# Load the TensorFlow model in PyTorch for inspection
 model.save_pretrained('./save/')
 pytorch_model = BertForSequenceClassification.from_pretrained('./save/', from_tf=True)

-# Quickly inspect a few predictions - MRPC is a paraphrasing task
-inputs = tokenizer.encode_plus("The company is doing great",
-                               "The company has good results",
-                               add_special_tokens=True,
-                               return_tensors='pt')
-pred = pytorch_model(**inputs)
-print("Paraphrase" if pred.argmax().item() == 0 else "Not paraphrase")
+# Quickly test a few predictions - MRPC is a paraphrasing task, let's see if our model learned the task
+sentence_0 = "This research was consistent with his findings."
+sentence_1 = "His findings were compatible with this research."
+sentence_2 = "His findings were not compatible with this research."
+inputs_1 = tokenizer.encode_plus(sentence_0, sentence_1, add_special_tokens=True, return_tensors='pt')
+inputs_2 = tokenizer.encode_plus(sentence_0, sentence_2, add_special_tokens=True, return_tensors='pt')
+
+pred_1 = pytorch_model(**inputs_1)[0].argmax().item()
+pred_2 = pytorch_model(**inputs_2)[0].argmax().item()
+print("sentence_1 is", "a paraphrase" if pred_1 else "not a paraphrase", "of sentence_0")
+print("sentence_2 is", "a paraphrase" if pred_2 else "not a paraphrase", "of sentence_0")
+# >>> sentence_1 is a paraphrase of sentence_0
+# >>> sentence_2 is not a paraphrase of sentence_0