Remove my unhelpful comments :)

2019-03-27 10:45:11 -07:00
parent fda2f62395
commit 01520d5412
2 changed files with 2 additions and 6 deletions
--- a/pytorch_pretrained_bert/modeling_gpt2.py
+++ b/pytorch_pretrained_bert/modeling_gpt2.py
@@ -621,9 +621,7 @@ class GPT2LMHeadModel(GPT2PreTrainedModel):
            shift_logits = lm_logits[:, :-1].contiguous()
            shift_labels = lm_labels[:, 1:].contiguous()
-            # In tensorflow, it's [batch, d_0, d_1, ..., d_{r-1}, num_classes]
+            # Flatten the tokens
-            # in pytorch, it's [batch, num_classes, d_0, d_1, ..., d_{r-1}]
-            # We just flatten the tokens out this way.
            loss_fct = CrossEntropyLoss(ignore_index=-1)
            loss = loss_fct(shift_logits.view(-1, shift_logits.size(-1)),
                            shift_labels.view(-1))
--- a/pytorch_pretrained_bert/modeling_openai.py
+++ b/pytorch_pretrained_bert/modeling_openai.py
@@ -720,9 +720,7 @@ class OpenAIGPTLMHeadModel(OpenAIGPTPreTrainedModel):
            shift_logits = lm_logits[:, :-1].contiguous()
            shift_labels = lm_labels[:, 1:].contiguous()
-            # In tensorflow, it's [batch, d_0, d_1, ..., d_{r-1}, num_classes]
+            # Flatten the tokens
-            # in pytorch, it's [batch, num_classes, d_0, d_1, ..., d_{r-1}]
-            # We just flatten the tokens out this way.
            loss_fct = CrossEntropyLoss(ignore_index=-1)
            loss = loss_fct(shift_logits.view(-1, shift_logits.size(-1)),
                            shift_labels.view(-1))