[marian] Automate Tatoeba-Challenge conversion (#7709)

This commit is contained in:
Sam Shleifer
2020-10-12 12:24:25 -04:00
committed by GitHub
parent aacac8f708
commit 9c2b2db2cd
5 changed files with 1347 additions and 165 deletions

View File

@@ -0,0 +1,22 @@
import tempfile
import unittest
from transformers.convert_marian_tatoeba_to_pytorch import TatoebaConverter
from transformers.file_utils import cached_property
from transformers.testing_utils import slow
class TatoebaConversionTester(unittest.TestCase):
    """Slow tests that drive ``TatoebaConverter`` against the ``heb-eng`` pair."""

    @cached_property
    def resolver(self):
        """Return a ``TatoebaConverter`` whose ``save_dir`` is a fresh temp directory.

        The directory is removed when the test finishes, so nothing written
        under ``save_dir`` is left behind on the machine running the tests.
        """
        tmp_dir = tempfile.TemporaryDirectory()
        # Register cleanup on the test case itself so the directory is deleted
        # whether the test passes or fails.
        self.addCleanup(tmp_dir.cleanup)
        return TatoebaConverter(save_dir=tmp_dir.name)

    @slow
    def test_resolver(self):
        """Convert the ``heb-eng`` model; the test passes if no exception is raised."""
        self.resolver.convert_models(["heb-eng"])

    @slow
    def test_model_card(self):
        """Check that the metadata returned for ``opus-mt-he-en`` names the long pair."""
        # write_model_card returns a 2-tuple; only the metadata mapping is checked.
        # NOTE(review): dry_run=True presumably skips writing the card to disk -- confirm.
        _, mmeta = self.resolver.write_model_card("opus-mt-he-en", dry_run=True)
        self.assertEqual(mmeta["long_pair"], "heb-eng")