feat: allow prefix for any generative model (#5885)

* feat: allow padding_text for any generative model

* docs(pipelines.py): correct typo

* Update src/transformers/pipelines.py

Co-authored-by: Sam Shleifer <sshleifer@gmail.com>

* feat: rename padding_text to prefix

* fix: cannot tokenize empty text

* fix: pass prefix arg to pipeline

* test: add prefix to text-generation pipeline

* style: fix style

* style: clean code and make variable names more explicit

* set arg docstring to optional

Co-authored-by: Sylvain Gugger <35901082+sgugger@users.noreply.github.com>

Co-authored-by: Sam Shleifer <sshleifer@gmail.com>
Co-authored-by: Sylvain Gugger <35901082+sgugger@users.noreply.github.com>
This commit is contained in:
Boris Dayma
2020-09-07 02:03:45 -05:00
committed by GitHub
parent ce37be9d94
commit 995a958dd1
3 changed files with 38 additions and 24 deletions

View File

@@ -424,12 +424,14 @@ class MonoColumnInputTestCase(unittest.TestCase):
for model_name in TEXT_GENERATION_FINETUNED_MODELS:
nlp = pipeline(task="text-generation", model=model_name, tokenizer=model_name, framework="pt")
self._test_mono_column_pipeline(nlp, VALID_INPUTS, {})
self._test_mono_column_pipeline(nlp, VALID_INPUTS, {}, prefix="This is ")
# Exercise the "text-generation" pipeline with framework="tf" for the model
# names listed in TEXT_GENERATION_FINETUNED_MODELS.
# NOTE(review): leading indentation is not preserved in this view; both
# _test_mono_column_pipeline calls presumably sit inside the for loop — confirm
# against the real file.
@require_tf
def test_tf_text_generation(self):
for model_name in TEXT_GENERATION_FINETUNED_MODELS:
# The same model name is passed as both the model and the tokenizer.
nlp = pipeline(task="text-generation", model=model_name, tokenizer=model_name, framework="tf")
# First check: VALID_INPUTS with an empty dict and no prefix argument.
self._test_mono_column_pipeline(nlp, VALID_INPUTS, {})
# Second check: same inputs, additionally passing prefix="This is ".
self._test_mono_column_pipeline(nlp, VALID_INPUTS, {}, prefix="This is ")
@slow
@require_torch