Patch recursive import (#11812)

This commit is contained in:
Lysandre Debut
2021-05-21 12:50:01 +02:00
committed by GitHub
parent bd9871657b
commit 1b652295c5
2 changed files with 8 additions and 2 deletions

View File

@@ -25,7 +25,6 @@ from tokenizers import Regex, Tokenizer, decoders, normalizers, pre_tokenizers,
from tokenizers.models import BPE, Unigram, WordPiece from tokenizers.models import BPE, Unigram, WordPiece
from .file_utils import requires_backends from .file_utils import requires_backends
from .models.roformer.tokenization_utils import JiebaPreTokenizer
class SentencePieceExtractor: class SentencePieceExtractor:
@@ -299,6 +298,8 @@ class RobertaConverter(Converter):
class RoFormerConverter(Converter): class RoFormerConverter(Converter):
def converted(self) -> Tokenizer: def converted(self) -> Tokenizer:
from .models.roformer.tokenization_utils import JiebaPreTokenizer
vocab = self.original_tokenizer.vocab vocab = self.original_tokenizer.vocab
tokenizer = Tokenizer(WordPiece(vocab, unk_token=str(self.original_tokenizer.unk_token))) tokenizer = Tokenizer(WordPiece(vocab, unk_token=str(self.original_tokenizer.unk_token)))

View File

@@ -12,6 +12,9 @@
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and # See the License for the specific language governing permissions and
# limitations under the License. # limitations under the License.
"""
isort:skip_file
"""
import os import os
import pickle import pickle
import tempfile import tempfile
@@ -20,12 +23,14 @@ from typing import Callable, Optional
import numpy as np import numpy as np
# Ensure there are no circular imports when importing the parent class
from transformers import PreTrainedTokenizerFast
from transformers import ( from transformers import (
BatchEncoding, BatchEncoding,
BertTokenizer, BertTokenizer,
BertTokenizerFast, BertTokenizerFast,
PreTrainedTokenizer, PreTrainedTokenizer,
PreTrainedTokenizerFast,
TensorType, TensorType,
TokenSpan, TokenSpan,
is_tokenizers_available, is_tokenizers_available,