Remove-auth-token (#27060)
* don't use `use_auth_token`internally * let's use token everywhere * fixup
This commit is contained in:
@@ -99,7 +99,7 @@ Define a `model_init` function and pass it to the [`Trainer`], as an example:
|
|||||||
... config=config,
|
... config=config,
|
||||||
... cache_dir=model_args.cache_dir,
|
... cache_dir=model_args.cache_dir,
|
||||||
... revision=model_args.model_revision,
|
... revision=model_args.model_revision,
|
||||||
... use_auth_token=True if model_args.use_auth_token else None,
|
... token=True if model_args.use_auth_token else None,
|
||||||
... )
|
... )
|
||||||
```
|
```
|
||||||
|
|
||||||
|
|||||||
@@ -118,9 +118,9 @@ See example below for a translation from romanian to german:
|
|||||||
>>> from transformers import AutoModelForSeq2SeqLM, AutoTokenizer
|
>>> from transformers import AutoModelForSeq2SeqLM, AutoTokenizer
|
||||||
|
|
||||||
>>> tokenizer = AutoTokenizer.from_pretrained(
|
>>> tokenizer = AutoTokenizer.from_pretrained(
|
||||||
... "facebook/nllb-200-distilled-600M", use_auth_token=True, src_lang="ron_Latn"
|
... "facebook/nllb-200-distilled-600M", token=True, src_lang="ron_Latn"
|
||||||
... )
|
... )
|
||||||
>>> model = AutoModelForSeq2SeqLM.from_pretrained("facebook/nllb-200-distilled-600M", use_auth_token=True)
|
>>> model = AutoModelForSeq2SeqLM.from_pretrained("facebook/nllb-200-distilled-600M", token=True)
|
||||||
|
|
||||||
>>> article = "Şeful ONU spune că nu există o soluţie militară în Siria"
|
>>> article = "Şeful ONU spune că nu există o soluţie militară în Siria"
|
||||||
>>> inputs = tokenizer(article, return_tensors="pt")
|
>>> inputs = tokenizer(article, return_tensors="pt")
|
||||||
|
|||||||
@@ -105,7 +105,7 @@ Wandbについては、[object_parameter](https://docs.wandb.ai/guides/sweeps/co
|
|||||||
... config=config,
|
... config=config,
|
||||||
... cache_dir=model_args.cache_dir,
|
... cache_dir=model_args.cache_dir,
|
||||||
... revision=model_args.model_revision,
|
... revision=model_args.model_revision,
|
||||||
... use_auth_token=True if model_args.use_auth_token else None,
|
... token=True if model_args.use_auth_token else None,
|
||||||
... )
|
... )
|
||||||
```
|
```
|
||||||
|
|
||||||
|
|||||||
@@ -87,7 +87,7 @@ wandb의 경우, 해당 [object_parameter](https://docs.wandb.ai/guides/sweeps/c
|
|||||||
... config=config,
|
... config=config,
|
||||||
... cache_dir=model_args.cache_dir,
|
... cache_dir=model_args.cache_dir,
|
||||||
... revision=model_args.model_revision,
|
... revision=model_args.model_revision,
|
||||||
... use_auth_token=True if model_args.use_auth_token else None,
|
... token=True if model_args.use_auth_token else None,
|
||||||
... )
|
... )
|
||||||
```
|
```
|
||||||
|
|
||||||
|
|||||||
@@ -1117,7 +1117,7 @@ params = model.init(key2, x)
|
|||||||
|
|
||||||
bytes_output = serialization.to_bytes(params)
|
bytes_output = serialization.to_bytes(params)
|
||||||
|
|
||||||
repo = Repository("flax-model", clone_from="flax-community/flax-model-dummy", use_auth_token=True)
|
repo = Repository("flax-model", clone_from="flax-community/flax-model-dummy", token=True)
|
||||||
with repo.commit("My cool Flax model :)"):
|
with repo.commit("My cool Flax model :)"):
|
||||||
with open("flax_model.msgpack", "wb") as f:
|
with open("flax_model.msgpack", "wb") as f:
|
||||||
f.write(bytes_output)
|
f.write(bytes_output)
|
||||||
|
|||||||
@@ -250,7 +250,7 @@ def main():
|
|||||||
"nielsr/funsd-layoutlmv3",
|
"nielsr/funsd-layoutlmv3",
|
||||||
data_args.dataset_config_name,
|
data_args.dataset_config_name,
|
||||||
cache_dir=model_args.cache_dir,
|
cache_dir=model_args.cache_dir,
|
||||||
use_auth_token=True if model_args.use_auth_token else None,
|
token=True if model_args.use_auth_token else None,
|
||||||
)
|
)
|
||||||
elif data_args.dataset_name == "cord":
|
elif data_args.dataset_name == "cord":
|
||||||
# Downloading and loading a dataset from the hub.
|
# Downloading and loading a dataset from the hub.
|
||||||
@@ -258,7 +258,7 @@ def main():
|
|||||||
"nielsr/cord-layoutlmv3",
|
"nielsr/cord-layoutlmv3",
|
||||||
data_args.dataset_config_name,
|
data_args.dataset_config_name,
|
||||||
cache_dir=model_args.cache_dir,
|
cache_dir=model_args.cache_dir,
|
||||||
use_auth_token=True if model_args.use_auth_token else None,
|
token=True if model_args.use_auth_token else None,
|
||||||
)
|
)
|
||||||
else:
|
else:
|
||||||
raise ValueError("This script only supports either FUNSD or CORD out-of-the-box.")
|
raise ValueError("This script only supports either FUNSD or CORD out-of-the-box.")
|
||||||
@@ -313,7 +313,7 @@ def main():
|
|||||||
finetuning_task=data_args.task_name,
|
finetuning_task=data_args.task_name,
|
||||||
cache_dir=model_args.cache_dir,
|
cache_dir=model_args.cache_dir,
|
||||||
revision=model_args.model_revision,
|
revision=model_args.model_revision,
|
||||||
use_auth_token=True if model_args.use_auth_token else None,
|
token=True if model_args.use_auth_token else None,
|
||||||
)
|
)
|
||||||
|
|
||||||
processor = AutoProcessor.from_pretrained(
|
processor = AutoProcessor.from_pretrained(
|
||||||
@@ -321,7 +321,7 @@ def main():
|
|||||||
cache_dir=model_args.cache_dir,
|
cache_dir=model_args.cache_dir,
|
||||||
use_fast=True,
|
use_fast=True,
|
||||||
revision=model_args.model_revision,
|
revision=model_args.model_revision,
|
||||||
use_auth_token=True if model_args.use_auth_token else None,
|
token=True if model_args.use_auth_token else None,
|
||||||
add_prefix_space=True,
|
add_prefix_space=True,
|
||||||
apply_ocr=False,
|
apply_ocr=False,
|
||||||
)
|
)
|
||||||
@@ -332,7 +332,7 @@ def main():
|
|||||||
config=config,
|
config=config,
|
||||||
cache_dir=model_args.cache_dir,
|
cache_dir=model_args.cache_dir,
|
||||||
revision=model_args.model_revision,
|
revision=model_args.model_revision,
|
||||||
use_auth_token=True if model_args.use_auth_token else None,
|
token=True if model_args.use_auth_token else None,
|
||||||
)
|
)
|
||||||
|
|
||||||
# Set the correspondences label/ID inside the model config
|
# Set the correspondences label/ID inside the model config
|
||||||
|
|||||||
@@ -325,7 +325,7 @@ def main():
|
|||||||
config=config,
|
config=config,
|
||||||
cache_dir=model_args.cache_dir,
|
cache_dir=model_args.cache_dir,
|
||||||
revision=model_args.model_revision,
|
revision=model_args.model_revision,
|
||||||
use_auth_token=True if model_args.use_auth_token else None,
|
token=True if model_args.use_auth_token else None,
|
||||||
)
|
)
|
||||||
else:
|
else:
|
||||||
logger.info("Training new model from scratch")
|
logger.info("Training new model from scratch")
|
||||||
|
|||||||
@@ -322,14 +322,14 @@ def main():
|
|||||||
model_args.config_name if model_args.config_name else model_args.model_name_or_path,
|
model_args.config_name if model_args.config_name else model_args.model_name_or_path,
|
||||||
cache_dir=model_args.cache_dir,
|
cache_dir=model_args.cache_dir,
|
||||||
revision=model_args.model_revision,
|
revision=model_args.model_revision,
|
||||||
use_auth_token=True if model_args.use_auth_token else None,
|
token=True if model_args.use_auth_token else None,
|
||||||
)
|
)
|
||||||
tokenizer = AutoTokenizer.from_pretrained(
|
tokenizer = AutoTokenizer.from_pretrained(
|
||||||
model_args.tokenizer_name if model_args.tokenizer_name else model_args.model_name_or_path,
|
model_args.tokenizer_name if model_args.tokenizer_name else model_args.model_name_or_path,
|
||||||
cache_dir=model_args.cache_dir,
|
cache_dir=model_args.cache_dir,
|
||||||
use_fast=True,
|
use_fast=True,
|
||||||
revision=model_args.model_revision,
|
revision=model_args.model_revision,
|
||||||
use_auth_token=True if model_args.use_auth_token else None,
|
token=True if model_args.use_auth_token else None,
|
||||||
)
|
)
|
||||||
model = QDQBertForQuestionAnswering.from_pretrained(
|
model = QDQBertForQuestionAnswering.from_pretrained(
|
||||||
model_args.model_name_or_path,
|
model_args.model_name_or_path,
|
||||||
@@ -337,7 +337,7 @@ def main():
|
|||||||
config=config,
|
config=config,
|
||||||
cache_dir=model_args.cache_dir,
|
cache_dir=model_args.cache_dir,
|
||||||
revision=model_args.model_revision,
|
revision=model_args.model_revision,
|
||||||
use_auth_token=True if model_args.use_auth_token else None,
|
token=True if model_args.use_auth_token else None,
|
||||||
)
|
)
|
||||||
|
|
||||||
# Tokenizer check: this script requires a fast tokenizer.
|
# Tokenizer check: this script requires a fast tokenizer.
|
||||||
|
|||||||
@@ -65,7 +65,7 @@ def normalize_text(text: str) -> str:
|
|||||||
|
|
||||||
def main(args):
|
def main(args):
|
||||||
# load dataset
|
# load dataset
|
||||||
dataset = load_dataset(args.dataset, args.config, split=args.split, use_auth_token=True)
|
dataset = load_dataset(args.dataset, args.config, split=args.split, token=True)
|
||||||
|
|
||||||
# for testing: only process the first two examples as a test
|
# for testing: only process the first two examples as a test
|
||||||
# dataset = dataset.select(range(10))
|
# dataset = dataset.select(range(10))
|
||||||
|
|||||||
@@ -418,7 +418,7 @@ def main():
|
|||||||
data_args.dataset_name,
|
data_args.dataset_name,
|
||||||
data_args.dataset_config_name,
|
data_args.dataset_config_name,
|
||||||
split=data_args.train_split_name,
|
split=data_args.train_split_name,
|
||||||
use_auth_token=data_args.use_auth_token,
|
token=data_args.use_auth_token,
|
||||||
)
|
)
|
||||||
|
|
||||||
if data_args.audio_column_name not in raw_datasets["train"].column_names:
|
if data_args.audio_column_name not in raw_datasets["train"].column_names:
|
||||||
@@ -443,7 +443,7 @@ def main():
|
|||||||
data_args.dataset_name,
|
data_args.dataset_name,
|
||||||
data_args.dataset_config_name,
|
data_args.dataset_config_name,
|
||||||
split=data_args.eval_split_name,
|
split=data_args.eval_split_name,
|
||||||
use_auth_token=data_args.use_auth_token,
|
token=data_args.use_auth_token,
|
||||||
)
|
)
|
||||||
|
|
||||||
if data_args.max_eval_samples is not None:
|
if data_args.max_eval_samples is not None:
|
||||||
@@ -481,7 +481,7 @@ def main():
|
|||||||
# the tokenizer
|
# the tokenizer
|
||||||
# load config
|
# load config
|
||||||
config = AutoConfig.from_pretrained(
|
config = AutoConfig.from_pretrained(
|
||||||
model_args.model_name_or_path, cache_dir=model_args.cache_dir, use_auth_token=data_args.use_auth_token
|
model_args.model_name_or_path, cache_dir=model_args.cache_dir, token=data_args.use_auth_token
|
||||||
)
|
)
|
||||||
|
|
||||||
# 4. Next, if no tokenizer file is defined,
|
# 4. Next, if no tokenizer file is defined,
|
||||||
@@ -532,11 +532,11 @@ def main():
|
|||||||
# load feature_extractor and tokenizer
|
# load feature_extractor and tokenizer
|
||||||
tokenizer = AutoTokenizer.from_pretrained(
|
tokenizer = AutoTokenizer.from_pretrained(
|
||||||
tokenizer_name_or_path,
|
tokenizer_name_or_path,
|
||||||
use_auth_token=data_args.use_auth_token,
|
token=data_args.use_auth_token,
|
||||||
**tokenizer_kwargs,
|
**tokenizer_kwargs,
|
||||||
)
|
)
|
||||||
feature_extractor = AutoFeatureExtractor.from_pretrained(
|
feature_extractor = AutoFeatureExtractor.from_pretrained(
|
||||||
model_args.model_name_or_path, cache_dir=model_args.cache_dir, use_auth_token=data_args.use_auth_token
|
model_args.model_name_or_path, cache_dir=model_args.cache_dir, token=data_args.use_auth_token
|
||||||
)
|
)
|
||||||
|
|
||||||
# adapt config
|
# adapt config
|
||||||
@@ -564,7 +564,7 @@ def main():
|
|||||||
model_args.model_name_or_path,
|
model_args.model_name_or_path,
|
||||||
cache_dir=model_args.cache_dir,
|
cache_dir=model_args.cache_dir,
|
||||||
config=config,
|
config=config,
|
||||||
use_auth_token=data_args.use_auth_token,
|
token=data_args.use_auth_token,
|
||||||
)
|
)
|
||||||
|
|
||||||
# freeze encoder
|
# freeze encoder
|
||||||
|
|||||||
@@ -395,7 +395,7 @@ def main():
|
|||||||
# so we just need to set the correct target sampling rate and normalize the input
|
# so we just need to set the correct target sampling rate and normalize the input
|
||||||
# via the `feature_extractor`
|
# via the `feature_extractor`
|
||||||
feature_extractor = AutoFeatureExtractor.from_pretrained(
|
feature_extractor = AutoFeatureExtractor.from_pretrained(
|
||||||
model_args.model_name_or_path, cache_dir=model_args.cache_dir, use_auth_token=data_args.use_auth_token
|
model_args.model_name_or_path, cache_dir=model_args.cache_dir, token=data_args.use_auth_token
|
||||||
)
|
)
|
||||||
|
|
||||||
if training_args.do_train:
|
if training_args.do_train:
|
||||||
@@ -403,7 +403,7 @@ def main():
|
|||||||
path=data_args.dataset_name,
|
path=data_args.dataset_name,
|
||||||
name=data_args.dataset_config_name,
|
name=data_args.dataset_config_name,
|
||||||
split=data_args.train_split_name,
|
split=data_args.train_split_name,
|
||||||
use_auth_token=data_args.use_auth_token,
|
token=data_args.use_auth_token,
|
||||||
streaming=True,
|
streaming=True,
|
||||||
sampling_rate=feature_extractor.sampling_rate,
|
sampling_rate=feature_extractor.sampling_rate,
|
||||||
)
|
)
|
||||||
@@ -431,7 +431,7 @@ def main():
|
|||||||
path=data_args.dataset_name,
|
path=data_args.dataset_name,
|
||||||
name=data_args.dataset_config_name,
|
name=data_args.dataset_config_name,
|
||||||
split=data_args.eval_split_name,
|
split=data_args.eval_split_name,
|
||||||
use_auth_token=data_args.use_auth_token,
|
token=data_args.use_auth_token,
|
||||||
streaming=True,
|
streaming=True,
|
||||||
sampling_rate=feature_extractor.sampling_rate,
|
sampling_rate=feature_extractor.sampling_rate,
|
||||||
)
|
)
|
||||||
@@ -465,7 +465,7 @@ def main():
|
|||||||
# 3. Next, let's load the config as we might need it to create
|
# 3. Next, let's load the config as we might need it to create
|
||||||
# the tokenizer
|
# the tokenizer
|
||||||
config = AutoConfig.from_pretrained(
|
config = AutoConfig.from_pretrained(
|
||||||
model_args.model_name_or_path, cache_dir=model_args.cache_dir, use_auth_token=data_args.use_auth_token
|
model_args.model_name_or_path, cache_dir=model_args.cache_dir, token=data_args.use_auth_token
|
||||||
)
|
)
|
||||||
|
|
||||||
# 4. Now we can instantiate the tokenizer and model
|
# 4. Now we can instantiate the tokenizer and model
|
||||||
@@ -481,7 +481,7 @@ def main():
|
|||||||
tokenizer = AutoTokenizer.from_pretrained(
|
tokenizer = AutoTokenizer.from_pretrained(
|
||||||
tokenizer_name_or_path,
|
tokenizer_name_or_path,
|
||||||
config=config,
|
config=config,
|
||||||
use_auth_token=data_args.use_auth_token,
|
token=data_args.use_auth_token,
|
||||||
)
|
)
|
||||||
|
|
||||||
# adapt config
|
# adapt config
|
||||||
@@ -509,7 +509,7 @@ def main():
|
|||||||
model_args.model_name_or_path,
|
model_args.model_name_or_path,
|
||||||
cache_dir=model_args.cache_dir,
|
cache_dir=model_args.cache_dir,
|
||||||
config=config,
|
config=config,
|
||||||
use_auth_token=data_args.use_auth_token,
|
token=data_args.use_auth_token,
|
||||||
)
|
)
|
||||||
|
|
||||||
# freeze encoder
|
# freeze encoder
|
||||||
|
|||||||
@@ -292,7 +292,7 @@ def main():
|
|||||||
num_labels=num_labels,
|
num_labels=num_labels,
|
||||||
cache_dir=model_args.cache_dir,
|
cache_dir=model_args.cache_dir,
|
||||||
revision=model_args.model_revision,
|
revision=model_args.model_revision,
|
||||||
use_auth_token=True if model_args.use_auth_token else None,
|
token=True if model_args.use_auth_token else None,
|
||||||
)
|
)
|
||||||
# load tapex tokenizer
|
# load tapex tokenizer
|
||||||
tokenizer = TapexTokenizer.from_pretrained(
|
tokenizer = TapexTokenizer.from_pretrained(
|
||||||
@@ -300,7 +300,7 @@ def main():
|
|||||||
cache_dir=model_args.cache_dir,
|
cache_dir=model_args.cache_dir,
|
||||||
use_fast=model_args.use_fast_tokenizer,
|
use_fast=model_args.use_fast_tokenizer,
|
||||||
revision=model_args.model_revision,
|
revision=model_args.model_revision,
|
||||||
use_auth_token=True if model_args.use_auth_token else None,
|
token=True if model_args.use_auth_token else None,
|
||||||
add_prefix_space=True,
|
add_prefix_space=True,
|
||||||
)
|
)
|
||||||
model = BartForSequenceClassification.from_pretrained(
|
model = BartForSequenceClassification.from_pretrained(
|
||||||
@@ -309,7 +309,7 @@ def main():
|
|||||||
config=config,
|
config=config,
|
||||||
cache_dir=model_args.cache_dir,
|
cache_dir=model_args.cache_dir,
|
||||||
revision=model_args.model_revision,
|
revision=model_args.model_revision,
|
||||||
use_auth_token=True if model_args.use_auth_token else None,
|
token=True if model_args.use_auth_token else None,
|
||||||
)
|
)
|
||||||
|
|
||||||
# Padding strategy
|
# Padding strategy
|
||||||
|
|||||||
@@ -329,7 +329,7 @@ def main():
|
|||||||
model_args.config_name if model_args.config_name else model_args.model_name_or_path,
|
model_args.config_name if model_args.config_name else model_args.model_name_or_path,
|
||||||
cache_dir=model_args.cache_dir,
|
cache_dir=model_args.cache_dir,
|
||||||
revision=model_args.model_revision,
|
revision=model_args.model_revision,
|
||||||
use_auth_token=True if model_args.use_auth_token else None,
|
token=True if model_args.use_auth_token else None,
|
||||||
)
|
)
|
||||||
|
|
||||||
# IMPORTANT: the initial BART model's decoding is penalized by no_repeat_ngram_size, and thus
|
# IMPORTANT: the initial BART model's decoding is penalized by no_repeat_ngram_size, and thus
|
||||||
@@ -344,7 +344,7 @@ def main():
|
|||||||
cache_dir=model_args.cache_dir,
|
cache_dir=model_args.cache_dir,
|
||||||
use_fast=model_args.use_fast_tokenizer,
|
use_fast=model_args.use_fast_tokenizer,
|
||||||
revision=model_args.model_revision,
|
revision=model_args.model_revision,
|
||||||
use_auth_token=True if model_args.use_auth_token else None,
|
token=True if model_args.use_auth_token else None,
|
||||||
add_prefix_space=True,
|
add_prefix_space=True,
|
||||||
)
|
)
|
||||||
|
|
||||||
@@ -355,7 +355,7 @@ def main():
|
|||||||
config=config,
|
config=config,
|
||||||
cache_dir=model_args.cache_dir,
|
cache_dir=model_args.cache_dir,
|
||||||
revision=model_args.model_revision,
|
revision=model_args.model_revision,
|
||||||
use_auth_token=True if model_args.use_auth_token else None,
|
token=True if model_args.use_auth_token else None,
|
||||||
)
|
)
|
||||||
|
|
||||||
if model.config.decoder_start_token_id is None:
|
if model.config.decoder_start_token_id is None:
|
||||||
|
|||||||
@@ -327,7 +327,7 @@ def main():
|
|||||||
model_args.config_name if model_args.config_name else model_args.model_name_or_path,
|
model_args.config_name if model_args.config_name else model_args.model_name_or_path,
|
||||||
cache_dir=model_args.cache_dir,
|
cache_dir=model_args.cache_dir,
|
||||||
revision=model_args.model_revision,
|
revision=model_args.model_revision,
|
||||||
use_auth_token=True if model_args.use_auth_token else None,
|
token=True if model_args.use_auth_token else None,
|
||||||
)
|
)
|
||||||
|
|
||||||
# IMPORTANT: the initial BART model's decoding is penalized by no_repeat_ngram_size, and thus
|
# IMPORTANT: the initial BART model's decoding is penalized by no_repeat_ngram_size, and thus
|
||||||
@@ -342,7 +342,7 @@ def main():
|
|||||||
cache_dir=model_args.cache_dir,
|
cache_dir=model_args.cache_dir,
|
||||||
use_fast=model_args.use_fast_tokenizer,
|
use_fast=model_args.use_fast_tokenizer,
|
||||||
revision=model_args.model_revision,
|
revision=model_args.model_revision,
|
||||||
use_auth_token=True if model_args.use_auth_token else None,
|
token=True if model_args.use_auth_token else None,
|
||||||
add_prefix_space=True,
|
add_prefix_space=True,
|
||||||
)
|
)
|
||||||
|
|
||||||
@@ -353,7 +353,7 @@ def main():
|
|||||||
config=config,
|
config=config,
|
||||||
cache_dir=model_args.cache_dir,
|
cache_dir=model_args.cache_dir,
|
||||||
revision=model_args.model_revision,
|
revision=model_args.model_revision,
|
||||||
use_auth_token=True if model_args.use_auth_token else None,
|
token=True if model_args.use_auth_token else None,
|
||||||
)
|
)
|
||||||
|
|
||||||
if model.config.decoder_start_token_id is None:
|
if model.config.decoder_start_token_id is None:
|
||||||
|
|||||||
@@ -502,7 +502,7 @@ def main():
|
|||||||
data_args.dataset_name,
|
data_args.dataset_name,
|
||||||
config_name,
|
config_name,
|
||||||
split=data_args.train_split_name,
|
split=data_args.train_split_name,
|
||||||
use_auth_token=data_args.use_auth_token,
|
token=data_args.use_auth_token,
|
||||||
cache_dir=model_args.cache_dir,
|
cache_dir=model_args.cache_dir,
|
||||||
)
|
)
|
||||||
|
|
||||||
@@ -528,7 +528,7 @@ def main():
|
|||||||
data_args.dataset_name,
|
data_args.dataset_name,
|
||||||
config_name,
|
config_name,
|
||||||
split=data_args.eval_split_name,
|
split=data_args.eval_split_name,
|
||||||
use_auth_token=data_args.use_auth_token,
|
token=data_args.use_auth_token,
|
||||||
cache_dir=model_args.cache_dir,
|
cache_dir=model_args.cache_dir,
|
||||||
)
|
)
|
||||||
|
|
||||||
@@ -540,7 +540,7 @@ def main():
|
|||||||
data_args.dataset_name,
|
data_args.dataset_name,
|
||||||
config_name,
|
config_name,
|
||||||
split=data_args.predict_split_name,
|
split=data_args.predict_split_name,
|
||||||
use_auth_token=data_args.use_auth_token,
|
token=data_args.use_auth_token,
|
||||||
cache_dir=model_args.cache_dir,
|
cache_dir=model_args.cache_dir,
|
||||||
)
|
)
|
||||||
|
|
||||||
@@ -595,7 +595,7 @@ def main():
|
|||||||
# 3. Next, let's load the config as we might need it to create
|
# 3. Next, let's load the config as we might need it to create
|
||||||
# the tokenizer
|
# the tokenizer
|
||||||
config = AutoConfig.from_pretrained(
|
config = AutoConfig.from_pretrained(
|
||||||
model_args.model_name_or_path, cache_dir=model_args.cache_dir, use_auth_token=data_args.use_auth_token
|
model_args.model_name_or_path, cache_dir=model_args.cache_dir, token=data_args.use_auth_token
|
||||||
)
|
)
|
||||||
|
|
||||||
if is_text_target:
|
if is_text_target:
|
||||||
@@ -651,11 +651,11 @@ def main():
|
|||||||
if is_text_target:
|
if is_text_target:
|
||||||
tokenizer = AutoTokenizer.from_pretrained(
|
tokenizer = AutoTokenizer.from_pretrained(
|
||||||
tokenizer_name_or_path,
|
tokenizer_name_or_path,
|
||||||
use_auth_token=data_args.use_auth_token,
|
token=data_args.use_auth_token,
|
||||||
**tokenizer_kwargs,
|
**tokenizer_kwargs,
|
||||||
)
|
)
|
||||||
feature_extractor = AutoFeatureExtractor.from_pretrained(
|
feature_extractor = AutoFeatureExtractor.from_pretrained(
|
||||||
model_args.model_name_or_path, cache_dir=model_args.cache_dir, use_auth_token=data_args.use_auth_token
|
model_args.model_name_or_path, cache_dir=model_args.cache_dir, token=data_args.use_auth_token
|
||||||
)
|
)
|
||||||
|
|
||||||
# adapt config
|
# adapt config
|
||||||
@@ -694,14 +694,14 @@ def main():
|
|||||||
model_args.model_name_or_path,
|
model_args.model_name_or_path,
|
||||||
cache_dir=model_args.cache_dir,
|
cache_dir=model_args.cache_dir,
|
||||||
config=config,
|
config=config,
|
||||||
use_auth_token=data_args.use_auth_token,
|
token=data_args.use_auth_token,
|
||||||
)
|
)
|
||||||
elif config.is_encoder_decoder:
|
elif config.is_encoder_decoder:
|
||||||
model = AutoModelForSpeechSeq2Seq.from_pretrained(
|
model = AutoModelForSpeechSeq2Seq.from_pretrained(
|
||||||
model_args.model_name_or_path,
|
model_args.model_name_or_path,
|
||||||
cache_dir=model_args.cache_dir,
|
cache_dir=model_args.cache_dir,
|
||||||
config=config,
|
config=config,
|
||||||
use_auth_token=data_args.use_auth_token,
|
token=data_args.use_auth_token,
|
||||||
)
|
)
|
||||||
if model.config.decoder_start_token_id is None:
|
if model.config.decoder_start_token_id is None:
|
||||||
raise ValueError("Make sure that `config.decoder_start_token_id` is correctly defined")
|
raise ValueError("Make sure that `config.decoder_start_token_id` is correctly defined")
|
||||||
@@ -710,7 +710,7 @@ def main():
|
|||||||
model_args.model_name_or_path,
|
model_args.model_name_or_path,
|
||||||
cache_dir=model_args.cache_dir,
|
cache_dir=model_args.cache_dir,
|
||||||
config=config,
|
config=config,
|
||||||
use_auth_token=data_args.use_auth_token,
|
token=data_args.use_auth_token,
|
||||||
)
|
)
|
||||||
|
|
||||||
# freeze encoder
|
# freeze encoder
|
||||||
|
|||||||
@@ -716,7 +716,7 @@ class GenerationConfig(PushToHubMixin):
|
|||||||
proxies=proxies,
|
proxies=proxies,
|
||||||
resume_download=resume_download,
|
resume_download=resume_download,
|
||||||
local_files_only=local_files_only,
|
local_files_only=local_files_only,
|
||||||
use_auth_token=token,
|
token=token,
|
||||||
user_agent=user_agent,
|
user_agent=user_agent,
|
||||||
revision=revision,
|
revision=revision,
|
||||||
subfolder=subfolder,
|
subfolder=subfolder,
|
||||||
|
|||||||
@@ -179,7 +179,7 @@ class PeftAdapterMixin:
|
|||||||
|
|
||||||
peft_config = PeftConfig.from_pretrained(
|
peft_config = PeftConfig.from_pretrained(
|
||||||
peft_model_id,
|
peft_model_id,
|
||||||
use_auth_token=token,
|
token=token,
|
||||||
**adapter_kwargs,
|
**adapter_kwargs,
|
||||||
)
|
)
|
||||||
|
|
||||||
@@ -190,7 +190,7 @@ class PeftAdapterMixin:
|
|||||||
self._hf_peft_config_loaded = True
|
self._hf_peft_config_loaded = True
|
||||||
|
|
||||||
if peft_model_id is not None:
|
if peft_model_id is not None:
|
||||||
adapter_state_dict = load_peft_weights(peft_model_id, use_auth_token=token, **adapter_kwargs)
|
adapter_state_dict = load_peft_weights(peft_model_id, token=token, **adapter_kwargs)
|
||||||
|
|
||||||
# We need to pre-process the state dict to remove unneeded prefixes - for backward compatibility
|
# We need to pre-process the state dict to remove unneeded prefixes - for backward compatibility
|
||||||
processed_adapter_state_dict = {}
|
processed_adapter_state_dict = {}
|
||||||
|
|||||||
@@ -94,7 +94,7 @@ class BarkProcessor(ProcessorMixin):
|
|||||||
proxies=kwargs.pop("proxies", None),
|
proxies=kwargs.pop("proxies", None),
|
||||||
resume_download=kwargs.pop("resume_download", False),
|
resume_download=kwargs.pop("resume_download", False),
|
||||||
local_files_only=kwargs.pop("local_files_only", False),
|
local_files_only=kwargs.pop("local_files_only", False),
|
||||||
use_auth_token=kwargs.pop("use_auth_token", None),
|
token=kwargs.pop("use_auth_token", None),
|
||||||
revision=kwargs.pop("revision", None),
|
revision=kwargs.pop("revision", None),
|
||||||
)
|
)
|
||||||
if speaker_embeddings_path is None:
|
if speaker_embeddings_path is None:
|
||||||
@@ -190,7 +190,7 @@ class BarkProcessor(ProcessorMixin):
|
|||||||
proxies=kwargs.pop("proxies", None),
|
proxies=kwargs.pop("proxies", None),
|
||||||
resume_download=kwargs.pop("resume_download", False),
|
resume_download=kwargs.pop("resume_download", False),
|
||||||
local_files_only=kwargs.pop("local_files_only", False),
|
local_files_only=kwargs.pop("local_files_only", False),
|
||||||
use_auth_token=kwargs.pop("use_auth_token", None),
|
token=kwargs.pop("use_auth_token", None),
|
||||||
revision=kwargs.pop("revision", None),
|
revision=kwargs.pop("revision", None),
|
||||||
)
|
)
|
||||||
if path is None:
|
if path is None:
|
||||||
|
|||||||
@@ -226,7 +226,7 @@ class Tool:
|
|||||||
resolved_config_file = cached_file(
|
resolved_config_file = cached_file(
|
||||||
repo_id,
|
repo_id,
|
||||||
TOOL_CONFIG_FILE,
|
TOOL_CONFIG_FILE,
|
||||||
use_auth_token=token,
|
token=token,
|
||||||
**hub_kwargs,
|
**hub_kwargs,
|
||||||
_raise_exceptions_for_missing_entries=False,
|
_raise_exceptions_for_missing_entries=False,
|
||||||
_raise_exceptions_for_connection_errors=False,
|
_raise_exceptions_for_connection_errors=False,
|
||||||
@@ -236,7 +236,7 @@ class Tool:
|
|||||||
resolved_config_file = cached_file(
|
resolved_config_file = cached_file(
|
||||||
repo_id,
|
repo_id,
|
||||||
CONFIG_NAME,
|
CONFIG_NAME,
|
||||||
use_auth_token=token,
|
token=token,
|
||||||
**hub_kwargs,
|
**hub_kwargs,
|
||||||
_raise_exceptions_for_missing_entries=False,
|
_raise_exceptions_for_missing_entries=False,
|
||||||
_raise_exceptions_for_connection_errors=False,
|
_raise_exceptions_for_connection_errors=False,
|
||||||
@@ -259,7 +259,7 @@ class Tool:
|
|||||||
custom_tool = config
|
custom_tool = config
|
||||||
|
|
||||||
tool_class = custom_tool["tool_class"]
|
tool_class = custom_tool["tool_class"]
|
||||||
tool_class = get_class_from_dynamic_module(tool_class, repo_id, use_auth_token=token, **hub_kwargs)
|
tool_class = get_class_from_dynamic_module(tool_class, repo_id, token=token, **hub_kwargs)
|
||||||
|
|
||||||
if len(tool_class.name) == 0:
|
if len(tool_class.name) == 0:
|
||||||
tool_class.name = custom_tool["name"]
|
tool_class.name = custom_tool["name"]
|
||||||
|
|||||||
@@ -308,9 +308,7 @@ class ProcessorPushToHubTester(unittest.TestCase):
|
|||||||
def test_push_to_hub(self):
|
def test_push_to_hub(self):
|
||||||
processor = Wav2Vec2Processor.from_pretrained(SAMPLE_PROCESSOR_CONFIG_DIR)
|
processor = Wav2Vec2Processor.from_pretrained(SAMPLE_PROCESSOR_CONFIG_DIR)
|
||||||
with tempfile.TemporaryDirectory() as tmp_dir:
|
with tempfile.TemporaryDirectory() as tmp_dir:
|
||||||
processor.save_pretrained(
|
processor.save_pretrained(os.path.join(tmp_dir, "test-processor"), push_to_hub=True, token=self._token)
|
||||||
os.path.join(tmp_dir, "test-processor"), push_to_hub=True, use_auth_token=self._token
|
|
||||||
)
|
|
||||||
|
|
||||||
new_processor = Wav2Vec2Processor.from_pretrained(f"{USER}/test-processor")
|
new_processor = Wav2Vec2Processor.from_pretrained(f"{USER}/test-processor")
|
||||||
for k, v in processor.feature_extractor.__dict__.items():
|
for k, v in processor.feature_extractor.__dict__.items():
|
||||||
@@ -324,7 +322,7 @@ class ProcessorPushToHubTester(unittest.TestCase):
|
|||||||
processor.save_pretrained(
|
processor.save_pretrained(
|
||||||
os.path.join(tmp_dir, "test-processor-org"),
|
os.path.join(tmp_dir, "test-processor-org"),
|
||||||
push_to_hub=True,
|
push_to_hub=True,
|
||||||
use_auth_token=self._token,
|
token=self._token,
|
||||||
organization="valid_org",
|
organization="valid_org",
|
||||||
)
|
)
|
||||||
|
|
||||||
|
|||||||
@@ -314,14 +314,14 @@ def main():
|
|||||||
finetuning_task=data_args.task_name,
|
finetuning_task=data_args.task_name,
|
||||||
cache_dir=model_args.cache_dir,
|
cache_dir=model_args.cache_dir,
|
||||||
revision=model_args.model_revision,
|
revision=model_args.model_revision,
|
||||||
use_auth_token=True if model_args.use_auth_token else None,
|
token=True if model_args.use_auth_token else None,
|
||||||
)
|
)
|
||||||
tokenizer = AutoTokenizer.from_pretrained(
|
tokenizer = AutoTokenizer.from_pretrained(
|
||||||
model_args.tokenizer_name if model_args.tokenizer_name else model_args.model_name_or_path,
|
model_args.tokenizer_name if model_args.tokenizer_name else model_args.model_name_or_path,
|
||||||
cache_dir=model_args.cache_dir,
|
cache_dir=model_args.cache_dir,
|
||||||
use_fast=model_args.use_fast_tokenizer,
|
use_fast=model_args.use_fast_tokenizer,
|
||||||
revision=model_args.model_revision,
|
revision=model_args.model_revision,
|
||||||
use_auth_token=True if model_args.use_auth_token else None,
|
token=True if model_args.use_auth_token else None,
|
||||||
)
|
)
|
||||||
model = AutoModelForSequenceClassification.from_pretrained(
|
model = AutoModelForSequenceClassification.from_pretrained(
|
||||||
model_args.model_name_or_path,
|
model_args.model_name_or_path,
|
||||||
@@ -329,7 +329,7 @@ def main():
|
|||||||
config=config,
|
config=config,
|
||||||
cache_dir=model_args.cache_dir,
|
cache_dir=model_args.cache_dir,
|
||||||
revision=model_args.model_revision,
|
revision=model_args.model_revision,
|
||||||
use_auth_token=True if model_args.use_auth_token else None,
|
token=True if model_args.use_auth_token else None,
|
||||||
)
|
)
|
||||||
|
|
||||||
# Preprocessing the datasets
|
# Preprocessing the datasets
|
||||||
|
|||||||
@@ -142,7 +142,7 @@ class ConfigPushToHubTester(unittest.TestCase):
|
|||||||
config = BertConfig(
|
config = BertConfig(
|
||||||
vocab_size=99, hidden_size=32, num_hidden_layers=5, num_attention_heads=4, intermediate_size=37
|
vocab_size=99, hidden_size=32, num_hidden_layers=5, num_attention_heads=4, intermediate_size=37
|
||||||
)
|
)
|
||||||
config.push_to_hub("valid_org/test-config-org", use_auth_token=self._token)
|
config.push_to_hub("valid_org/test-config-org", token=self._token)
|
||||||
|
|
||||||
new_config = BertConfig.from_pretrained("valid_org/test-config-org")
|
new_config = BertConfig.from_pretrained("valid_org/test-config-org")
|
||||||
for k, v in config.to_dict().items():
|
for k, v in config.to_dict().items():
|
||||||
@@ -154,9 +154,7 @@ class ConfigPushToHubTester(unittest.TestCase):
|
|||||||
|
|
||||||
# Push to hub via save_pretrained
|
# Push to hub via save_pretrained
|
||||||
with tempfile.TemporaryDirectory() as tmp_dir:
|
with tempfile.TemporaryDirectory() as tmp_dir:
|
||||||
config.save_pretrained(
|
config.save_pretrained(tmp_dir, repo_id="valid_org/test-config-org", push_to_hub=True, token=self._token)
|
||||||
tmp_dir, repo_id="valid_org/test-config-org", push_to_hub=True, use_auth_token=self._token
|
|
||||||
)
|
|
||||||
|
|
||||||
new_config = BertConfig.from_pretrained("valid_org/test-config-org")
|
new_config = BertConfig.from_pretrained("valid_org/test-config-org")
|
||||||
for k, v in config.to_dict().items():
|
for k, v in config.to_dict().items():
|
||||||
@@ -167,7 +165,7 @@ class ConfigPushToHubTester(unittest.TestCase):
|
|||||||
CustomConfig.register_for_auto_class()
|
CustomConfig.register_for_auto_class()
|
||||||
config = CustomConfig(attribute=42)
|
config = CustomConfig(attribute=42)
|
||||||
|
|
||||||
config.push_to_hub("test-dynamic-config", use_auth_token=self._token)
|
config.push_to_hub("test-dynamic-config", token=self._token)
|
||||||
|
|
||||||
# This has added the proper auto_map field to the config
|
# This has added the proper auto_map field to the config
|
||||||
self.assertDictEqual(config.auto_map, {"AutoConfig": "custom_configuration.CustomConfig"})
|
self.assertDictEqual(config.auto_map, {"AutoConfig": "custom_configuration.CustomConfig"})
|
||||||
|
|||||||
@@ -85,7 +85,7 @@ class FeatureExtractorPushToHubTester(unittest.TestCase):
|
|||||||
|
|
||||||
def test_push_to_hub(self):
|
def test_push_to_hub(self):
|
||||||
feature_extractor = Wav2Vec2FeatureExtractor.from_pretrained(SAMPLE_FEATURE_EXTRACTION_CONFIG_DIR)
|
feature_extractor = Wav2Vec2FeatureExtractor.from_pretrained(SAMPLE_FEATURE_EXTRACTION_CONFIG_DIR)
|
||||||
feature_extractor.push_to_hub("test-feature-extractor", use_auth_token=self._token)
|
feature_extractor.push_to_hub("test-feature-extractor", token=self._token)
|
||||||
|
|
||||||
new_feature_extractor = Wav2Vec2FeatureExtractor.from_pretrained(f"{USER}/test-feature-extractor")
|
new_feature_extractor = Wav2Vec2FeatureExtractor.from_pretrained(f"{USER}/test-feature-extractor")
|
||||||
for k, v in feature_extractor.__dict__.items():
|
for k, v in feature_extractor.__dict__.items():
|
||||||
@@ -97,7 +97,7 @@ class FeatureExtractorPushToHubTester(unittest.TestCase):
|
|||||||
# Push to hub via save_pretrained
|
# Push to hub via save_pretrained
|
||||||
with tempfile.TemporaryDirectory() as tmp_dir:
|
with tempfile.TemporaryDirectory() as tmp_dir:
|
||||||
feature_extractor.save_pretrained(
|
feature_extractor.save_pretrained(
|
||||||
tmp_dir, repo_id="test-feature-extractor", push_to_hub=True, use_auth_token=self._token
|
tmp_dir, repo_id="test-feature-extractor", push_to_hub=True, token=self._token
|
||||||
)
|
)
|
||||||
|
|
||||||
new_feature_extractor = Wav2Vec2FeatureExtractor.from_pretrained(f"{USER}/test-feature-extractor")
|
new_feature_extractor = Wav2Vec2FeatureExtractor.from_pretrained(f"{USER}/test-feature-extractor")
|
||||||
@@ -106,7 +106,7 @@ class FeatureExtractorPushToHubTester(unittest.TestCase):
|
|||||||
|
|
||||||
def test_push_to_hub_in_organization(self):
|
def test_push_to_hub_in_organization(self):
|
||||||
feature_extractor = Wav2Vec2FeatureExtractor.from_pretrained(SAMPLE_FEATURE_EXTRACTION_CONFIG_DIR)
|
feature_extractor = Wav2Vec2FeatureExtractor.from_pretrained(SAMPLE_FEATURE_EXTRACTION_CONFIG_DIR)
|
||||||
feature_extractor.push_to_hub("valid_org/test-feature-extractor", use_auth_token=self._token)
|
feature_extractor.push_to_hub("valid_org/test-feature-extractor", token=self._token)
|
||||||
|
|
||||||
new_feature_extractor = Wav2Vec2FeatureExtractor.from_pretrained("valid_org/test-feature-extractor")
|
new_feature_extractor = Wav2Vec2FeatureExtractor.from_pretrained("valid_org/test-feature-extractor")
|
||||||
for k, v in feature_extractor.__dict__.items():
|
for k, v in feature_extractor.__dict__.items():
|
||||||
@@ -118,7 +118,7 @@ class FeatureExtractorPushToHubTester(unittest.TestCase):
|
|||||||
# Push to hub via save_pretrained
|
# Push to hub via save_pretrained
|
||||||
with tempfile.TemporaryDirectory() as tmp_dir:
|
with tempfile.TemporaryDirectory() as tmp_dir:
|
||||||
feature_extractor.save_pretrained(
|
feature_extractor.save_pretrained(
|
||||||
tmp_dir, repo_id="valid_org/test-feature-extractor-org", push_to_hub=True, use_auth_token=self._token
|
tmp_dir, repo_id="valid_org/test-feature-extractor-org", push_to_hub=True, token=self._token
|
||||||
)
|
)
|
||||||
|
|
||||||
new_feature_extractor = Wav2Vec2FeatureExtractor.from_pretrained("valid_org/test-feature-extractor-org")
|
new_feature_extractor = Wav2Vec2FeatureExtractor.from_pretrained("valid_org/test-feature-extractor-org")
|
||||||
@@ -129,7 +129,7 @@ class FeatureExtractorPushToHubTester(unittest.TestCase):
|
|||||||
CustomFeatureExtractor.register_for_auto_class()
|
CustomFeatureExtractor.register_for_auto_class()
|
||||||
feature_extractor = CustomFeatureExtractor.from_pretrained(SAMPLE_FEATURE_EXTRACTION_CONFIG_DIR)
|
feature_extractor = CustomFeatureExtractor.from_pretrained(SAMPLE_FEATURE_EXTRACTION_CONFIG_DIR)
|
||||||
|
|
||||||
feature_extractor.push_to_hub("test-dynamic-feature-extractor", use_auth_token=self._token)
|
feature_extractor.push_to_hub("test-dynamic-feature-extractor", token=self._token)
|
||||||
|
|
||||||
# This has added the proper auto_map field to the config
|
# This has added the proper auto_map field to the config
|
||||||
self.assertDictEqual(
|
self.assertDictEqual(
|
||||||
|
|||||||
@@ -95,7 +95,7 @@ class ImageProcessorPushToHubTester(unittest.TestCase):
|
|||||||
|
|
||||||
def test_push_to_hub(self):
|
def test_push_to_hub(self):
|
||||||
image_processor = ViTImageProcessor.from_pretrained(SAMPLE_IMAGE_PROCESSING_CONFIG_DIR)
|
image_processor = ViTImageProcessor.from_pretrained(SAMPLE_IMAGE_PROCESSING_CONFIG_DIR)
|
||||||
image_processor.push_to_hub("test-image-processor", use_auth_token=self._token)
|
image_processor.push_to_hub("test-image-processor", token=self._token)
|
||||||
|
|
||||||
new_image_processor = ViTImageProcessor.from_pretrained(f"{USER}/test-image-processor")
|
new_image_processor = ViTImageProcessor.from_pretrained(f"{USER}/test-image-processor")
|
||||||
for k, v in image_processor.__dict__.items():
|
for k, v in image_processor.__dict__.items():
|
||||||
@@ -107,7 +107,7 @@ class ImageProcessorPushToHubTester(unittest.TestCase):
|
|||||||
# Push to hub via save_pretrained
|
# Push to hub via save_pretrained
|
||||||
with tempfile.TemporaryDirectory() as tmp_dir:
|
with tempfile.TemporaryDirectory() as tmp_dir:
|
||||||
image_processor.save_pretrained(
|
image_processor.save_pretrained(
|
||||||
tmp_dir, repo_id="test-image-processor", push_to_hub=True, use_auth_token=self._token
|
tmp_dir, repo_id="test-image-processor", push_to_hub=True, token=self._token
|
||||||
)
|
)
|
||||||
|
|
||||||
new_image_processor = ViTImageProcessor.from_pretrained(f"{USER}/test-image-processor")
|
new_image_processor = ViTImageProcessor.from_pretrained(f"{USER}/test-image-processor")
|
||||||
@@ -116,7 +116,7 @@ class ImageProcessorPushToHubTester(unittest.TestCase):
|
|||||||
|
|
||||||
def test_push_to_hub_in_organization(self):
|
def test_push_to_hub_in_organization(self):
|
||||||
image_processor = ViTImageProcessor.from_pretrained(SAMPLE_IMAGE_PROCESSING_CONFIG_DIR)
|
image_processor = ViTImageProcessor.from_pretrained(SAMPLE_IMAGE_PROCESSING_CONFIG_DIR)
|
||||||
image_processor.push_to_hub("valid_org/test-image-processor", use_auth_token=self._token)
|
image_processor.push_to_hub("valid_org/test-image-processor", token=self._token)
|
||||||
|
|
||||||
new_image_processor = ViTImageProcessor.from_pretrained("valid_org/test-image-processor")
|
new_image_processor = ViTImageProcessor.from_pretrained("valid_org/test-image-processor")
|
||||||
for k, v in image_processor.__dict__.items():
|
for k, v in image_processor.__dict__.items():
|
||||||
@@ -128,7 +128,7 @@ class ImageProcessorPushToHubTester(unittest.TestCase):
|
|||||||
# Push to hub via save_pretrained
|
# Push to hub via save_pretrained
|
||||||
with tempfile.TemporaryDirectory() as tmp_dir:
|
with tempfile.TemporaryDirectory() as tmp_dir:
|
||||||
image_processor.save_pretrained(
|
image_processor.save_pretrained(
|
||||||
tmp_dir, repo_id="valid_org/test-image-processor-org", push_to_hub=True, use_auth_token=self._token
|
tmp_dir, repo_id="valid_org/test-image-processor-org", push_to_hub=True, token=self._token
|
||||||
)
|
)
|
||||||
|
|
||||||
new_image_processor = ViTImageProcessor.from_pretrained("valid_org/test-image-processor-org")
|
new_image_processor = ViTImageProcessor.from_pretrained("valid_org/test-image-processor-org")
|
||||||
@@ -139,7 +139,7 @@ class ImageProcessorPushToHubTester(unittest.TestCase):
|
|||||||
CustomImageProcessor.register_for_auto_class()
|
CustomImageProcessor.register_for_auto_class()
|
||||||
image_processor = CustomImageProcessor.from_pretrained(SAMPLE_IMAGE_PROCESSING_CONFIG_DIR)
|
image_processor = CustomImageProcessor.from_pretrained(SAMPLE_IMAGE_PROCESSING_CONFIG_DIR)
|
||||||
|
|
||||||
image_processor.push_to_hub("test-dynamic-image-processor", use_auth_token=self._token)
|
image_processor.push_to_hub("test-dynamic-image-processor", token=self._token)
|
||||||
|
|
||||||
# This has added the proper auto_map field to the config
|
# This has added the proper auto_map field to the config
|
||||||
self.assertDictEqual(
|
self.assertDictEqual(
|
||||||
|
|||||||
@@ -60,7 +60,7 @@ class FlaxModelPushToHubTester(unittest.TestCase):
|
|||||||
vocab_size=99, hidden_size=32, num_hidden_layers=5, num_attention_heads=4, intermediate_size=37
|
vocab_size=99, hidden_size=32, num_hidden_layers=5, num_attention_heads=4, intermediate_size=37
|
||||||
)
|
)
|
||||||
model = FlaxBertModel(config)
|
model = FlaxBertModel(config)
|
||||||
model.push_to_hub("test-model-flax", use_auth_token=self._token)
|
model.push_to_hub("test-model-flax", token=self._token)
|
||||||
|
|
||||||
new_model = FlaxBertModel.from_pretrained(f"{USER}/test-model-flax")
|
new_model = FlaxBertModel.from_pretrained(f"{USER}/test-model-flax")
|
||||||
|
|
||||||
@@ -76,7 +76,7 @@ class FlaxModelPushToHubTester(unittest.TestCase):
|
|||||||
|
|
||||||
# Push to hub via save_pretrained
|
# Push to hub via save_pretrained
|
||||||
with tempfile.TemporaryDirectory() as tmp_dir:
|
with tempfile.TemporaryDirectory() as tmp_dir:
|
||||||
model.save_pretrained(tmp_dir, repo_id="test-model-flax", push_to_hub=True, use_auth_token=self._token)
|
model.save_pretrained(tmp_dir, repo_id="test-model-flax", push_to_hub=True, token=self._token)
|
||||||
|
|
||||||
new_model = FlaxBertModel.from_pretrained(f"{USER}/test-model-flax")
|
new_model = FlaxBertModel.from_pretrained(f"{USER}/test-model-flax")
|
||||||
|
|
||||||
@@ -92,7 +92,7 @@ class FlaxModelPushToHubTester(unittest.TestCase):
|
|||||||
vocab_size=99, hidden_size=32, num_hidden_layers=5, num_attention_heads=4, intermediate_size=37
|
vocab_size=99, hidden_size=32, num_hidden_layers=5, num_attention_heads=4, intermediate_size=37
|
||||||
)
|
)
|
||||||
model = FlaxBertModel(config)
|
model = FlaxBertModel(config)
|
||||||
model.push_to_hub("valid_org/test-model-flax-org", use_auth_token=self._token)
|
model.push_to_hub("valid_org/test-model-flax-org", token=self._token)
|
||||||
|
|
||||||
new_model = FlaxBertModel.from_pretrained("valid_org/test-model-flax-org")
|
new_model = FlaxBertModel.from_pretrained("valid_org/test-model-flax-org")
|
||||||
|
|
||||||
@@ -109,7 +109,7 @@ class FlaxModelPushToHubTester(unittest.TestCase):
|
|||||||
# Push to hub via save_pretrained
|
# Push to hub via save_pretrained
|
||||||
with tempfile.TemporaryDirectory() as tmp_dir:
|
with tempfile.TemporaryDirectory() as tmp_dir:
|
||||||
model.save_pretrained(
|
model.save_pretrained(
|
||||||
tmp_dir, repo_id="valid_org/test-model-flax-org", push_to_hub=True, use_auth_token=self._token
|
tmp_dir, repo_id="valid_org/test-model-flax-org", push_to_hub=True, token=self._token
|
||||||
)
|
)
|
||||||
|
|
||||||
new_model = FlaxBertModel.from_pretrained("valid_org/test-model-flax-org")
|
new_model = FlaxBertModel.from_pretrained("valid_org/test-model-flax-org")
|
||||||
|
|||||||
@@ -572,7 +572,7 @@ class TFModelPushToHubTester(unittest.TestCase):
|
|||||||
logging.set_verbosity_info()
|
logging.set_verbosity_info()
|
||||||
logger = logging.get_logger("transformers.utils.hub")
|
logger = logging.get_logger("transformers.utils.hub")
|
||||||
with CaptureLogger(logger) as cl:
|
with CaptureLogger(logger) as cl:
|
||||||
model.push_to_hub("test-model-tf", use_auth_token=self._token)
|
model.push_to_hub("test-model-tf", token=self._token)
|
||||||
logging.set_verbosity_warning()
|
logging.set_verbosity_warning()
|
||||||
# Check the model card was created and uploaded.
|
# Check the model card was created and uploaded.
|
||||||
self.assertIn("Uploading the following files to __DUMMY_TRANSFORMERS_USER__/test-model-tf", cl.out)
|
self.assertIn("Uploading the following files to __DUMMY_TRANSFORMERS_USER__/test-model-tf", cl.out)
|
||||||
@@ -590,7 +590,7 @@ class TFModelPushToHubTester(unittest.TestCase):
|
|||||||
|
|
||||||
# Push to hub via save_pretrained
|
# Push to hub via save_pretrained
|
||||||
with tempfile.TemporaryDirectory() as tmp_dir:
|
with tempfile.TemporaryDirectory() as tmp_dir:
|
||||||
model.save_pretrained(tmp_dir, repo_id="test-model-tf", push_to_hub=True, use_auth_token=self._token)
|
model.save_pretrained(tmp_dir, repo_id="test-model-tf", push_to_hub=True, token=self._token)
|
||||||
|
|
||||||
new_model = TFBertModel.from_pretrained(f"{USER}/test-model-tf")
|
new_model = TFBertModel.from_pretrained(f"{USER}/test-model-tf")
|
||||||
models_equal = True
|
models_equal = True
|
||||||
@@ -638,7 +638,7 @@ class TFModelPushToHubTester(unittest.TestCase):
|
|||||||
# Make sure model is properly initialized
|
# Make sure model is properly initialized
|
||||||
model.build()
|
model.build()
|
||||||
|
|
||||||
model.push_to_hub("valid_org/test-model-tf-org", use_auth_token=self._token)
|
model.push_to_hub("valid_org/test-model-tf-org", token=self._token)
|
||||||
|
|
||||||
new_model = TFBertModel.from_pretrained("valid_org/test-model-tf-org")
|
new_model = TFBertModel.from_pretrained("valid_org/test-model-tf-org")
|
||||||
models_equal = True
|
models_equal = True
|
||||||
@@ -653,9 +653,7 @@ class TFModelPushToHubTester(unittest.TestCase):
|
|||||||
|
|
||||||
# Push to hub via save_pretrained
|
# Push to hub via save_pretrained
|
||||||
with tempfile.TemporaryDirectory() as tmp_dir:
|
with tempfile.TemporaryDirectory() as tmp_dir:
|
||||||
model.save_pretrained(
|
model.save_pretrained(tmp_dir, push_to_hub=True, token=self._token, repo_id="valid_org/test-model-tf-org")
|
||||||
tmp_dir, push_to_hub=True, use_auth_token=self._token, repo_id="valid_org/test-model-tf-org"
|
|
||||||
)
|
|
||||||
|
|
||||||
new_model = TFBertModel.from_pretrained("valid_org/test-model-tf-org")
|
new_model = TFBertModel.from_pretrained("valid_org/test-model-tf-org")
|
||||||
models_equal = True
|
models_equal = True
|
||||||
|
|||||||
@@ -1162,7 +1162,7 @@ class ModelPushToHubTester(unittest.TestCase):
|
|||||||
vocab_size=99, hidden_size=32, num_hidden_layers=5, num_attention_heads=4, intermediate_size=37
|
vocab_size=99, hidden_size=32, num_hidden_layers=5, num_attention_heads=4, intermediate_size=37
|
||||||
)
|
)
|
||||||
model = BertModel(config)
|
model = BertModel(config)
|
||||||
model.push_to_hub("test-model", use_auth_token=self._token)
|
model.push_to_hub("test-model", token=self._token)
|
||||||
|
|
||||||
new_model = BertModel.from_pretrained(f"{USER}/test-model")
|
new_model = BertModel.from_pretrained(f"{USER}/test-model")
|
||||||
for p1, p2 in zip(model.parameters(), new_model.parameters()):
|
for p1, p2 in zip(model.parameters(), new_model.parameters()):
|
||||||
@@ -1173,7 +1173,7 @@ class ModelPushToHubTester(unittest.TestCase):
|
|||||||
|
|
||||||
# Push to hub via save_pretrained
|
# Push to hub via save_pretrained
|
||||||
with tempfile.TemporaryDirectory() as tmp_dir:
|
with tempfile.TemporaryDirectory() as tmp_dir:
|
||||||
model.save_pretrained(tmp_dir, repo_id="test-model", push_to_hub=True, use_auth_token=self._token)
|
model.save_pretrained(tmp_dir, repo_id="test-model", push_to_hub=True, token=self._token)
|
||||||
|
|
||||||
new_model = BertModel.from_pretrained(f"{USER}/test-model")
|
new_model = BertModel.from_pretrained(f"{USER}/test-model")
|
||||||
for p1, p2 in zip(model.parameters(), new_model.parameters()):
|
for p1, p2 in zip(model.parameters(), new_model.parameters()):
|
||||||
@@ -1202,7 +1202,7 @@ The commit description supports markdown synthax see:
|
|||||||
vocab_size=99, hidden_size=32, num_hidden_layers=5, num_attention_heads=4, intermediate_size=37
|
vocab_size=99, hidden_size=32, num_hidden_layers=5, num_attention_heads=4, intermediate_size=37
|
||||||
)
|
)
|
||||||
model = BertModel(config)
|
model = BertModel(config)
|
||||||
model.push_to_hub("valid_org/test-model-org", use_auth_token=self._token)
|
model.push_to_hub("valid_org/test-model-org", token=self._token)
|
||||||
|
|
||||||
new_model = BertModel.from_pretrained("valid_org/test-model-org")
|
new_model = BertModel.from_pretrained("valid_org/test-model-org")
|
||||||
for p1, p2 in zip(model.parameters(), new_model.parameters()):
|
for p1, p2 in zip(model.parameters(), new_model.parameters()):
|
||||||
@@ -1213,9 +1213,7 @@ The commit description supports markdown synthax see:
|
|||||||
|
|
||||||
# Push to hub via save_pretrained
|
# Push to hub via save_pretrained
|
||||||
with tempfile.TemporaryDirectory() as tmp_dir:
|
with tempfile.TemporaryDirectory() as tmp_dir:
|
||||||
model.save_pretrained(
|
model.save_pretrained(tmp_dir, push_to_hub=True, token=self._token, repo_id="valid_org/test-model-org")
|
||||||
tmp_dir, push_to_hub=True, use_auth_token=self._token, repo_id="valid_org/test-model-org"
|
|
||||||
)
|
|
||||||
|
|
||||||
new_model = BertModel.from_pretrained("valid_org/test-model-org")
|
new_model = BertModel.from_pretrained("valid_org/test-model-org")
|
||||||
for p1, p2 in zip(model.parameters(), new_model.parameters()):
|
for p1, p2 in zip(model.parameters(), new_model.parameters()):
|
||||||
@@ -1228,7 +1226,7 @@ The commit description supports markdown synthax see:
|
|||||||
config = CustomConfig(hidden_size=32)
|
config = CustomConfig(hidden_size=32)
|
||||||
model = CustomModel(config)
|
model = CustomModel(config)
|
||||||
|
|
||||||
model.push_to_hub("test-dynamic-model", use_auth_token=self._token)
|
model.push_to_hub("test-dynamic-model", token=self._token)
|
||||||
# checks
|
# checks
|
||||||
self.assertDictEqual(
|
self.assertDictEqual(
|
||||||
config.auto_map,
|
config.auto_map,
|
||||||
|
|||||||
@@ -146,7 +146,7 @@ class TokenizerPushToHubTester(unittest.TestCase):
|
|||||||
vocab_writer.write("".join([x + "\n" for x in self.vocab_tokens]))
|
vocab_writer.write("".join([x + "\n" for x in self.vocab_tokens]))
|
||||||
tokenizer = BertTokenizer(vocab_file)
|
tokenizer = BertTokenizer(vocab_file)
|
||||||
|
|
||||||
tokenizer.push_to_hub("test-tokenizer", use_auth_token=self._token)
|
tokenizer.push_to_hub("test-tokenizer", token=self._token)
|
||||||
new_tokenizer = BertTokenizer.from_pretrained(f"{USER}/test-tokenizer")
|
new_tokenizer = BertTokenizer.from_pretrained(f"{USER}/test-tokenizer")
|
||||||
self.assertDictEqual(new_tokenizer.vocab, tokenizer.vocab)
|
self.assertDictEqual(new_tokenizer.vocab, tokenizer.vocab)
|
||||||
|
|
||||||
@@ -155,7 +155,7 @@ class TokenizerPushToHubTester(unittest.TestCase):
|
|||||||
|
|
||||||
# Push to hub via save_pretrained
|
# Push to hub via save_pretrained
|
||||||
with tempfile.TemporaryDirectory() as tmp_dir:
|
with tempfile.TemporaryDirectory() as tmp_dir:
|
||||||
tokenizer.save_pretrained(tmp_dir, repo_id="test-tokenizer", push_to_hub=True, use_auth_token=self._token)
|
tokenizer.save_pretrained(tmp_dir, repo_id="test-tokenizer", push_to_hub=True, token=self._token)
|
||||||
|
|
||||||
new_tokenizer = BertTokenizer.from_pretrained(f"{USER}/test-tokenizer")
|
new_tokenizer = BertTokenizer.from_pretrained(f"{USER}/test-tokenizer")
|
||||||
self.assertDictEqual(new_tokenizer.vocab, tokenizer.vocab)
|
self.assertDictEqual(new_tokenizer.vocab, tokenizer.vocab)
|
||||||
@@ -167,7 +167,7 @@ class TokenizerPushToHubTester(unittest.TestCase):
|
|||||||
vocab_writer.write("".join([x + "\n" for x in self.vocab_tokens]))
|
vocab_writer.write("".join([x + "\n" for x in self.vocab_tokens]))
|
||||||
tokenizer = BertTokenizer(vocab_file)
|
tokenizer = BertTokenizer(vocab_file)
|
||||||
|
|
||||||
tokenizer.push_to_hub("valid_org/test-tokenizer-org", use_auth_token=self._token)
|
tokenizer.push_to_hub("valid_org/test-tokenizer-org", token=self._token)
|
||||||
new_tokenizer = BertTokenizer.from_pretrained("valid_org/test-tokenizer-org")
|
new_tokenizer = BertTokenizer.from_pretrained("valid_org/test-tokenizer-org")
|
||||||
self.assertDictEqual(new_tokenizer.vocab, tokenizer.vocab)
|
self.assertDictEqual(new_tokenizer.vocab, tokenizer.vocab)
|
||||||
|
|
||||||
@@ -177,7 +177,7 @@ class TokenizerPushToHubTester(unittest.TestCase):
|
|||||||
# Push to hub via save_pretrained
|
# Push to hub via save_pretrained
|
||||||
with tempfile.TemporaryDirectory() as tmp_dir:
|
with tempfile.TemporaryDirectory() as tmp_dir:
|
||||||
tokenizer.save_pretrained(
|
tokenizer.save_pretrained(
|
||||||
tmp_dir, repo_id="valid_org/test-tokenizer-org", push_to_hub=True, use_auth_token=self._token
|
tmp_dir, repo_id="valid_org/test-tokenizer-org", push_to_hub=True, token=self._token
|
||||||
)
|
)
|
||||||
|
|
||||||
new_tokenizer = BertTokenizer.from_pretrained("valid_org/test-tokenizer-org")
|
new_tokenizer = BertTokenizer.from_pretrained("valid_org/test-tokenizer-org")
|
||||||
@@ -193,7 +193,7 @@ class TokenizerPushToHubTester(unittest.TestCase):
|
|||||||
tokenizer = CustomTokenizer(vocab_file)
|
tokenizer = CustomTokenizer(vocab_file)
|
||||||
|
|
||||||
# No fast custom tokenizer
|
# No fast custom tokenizer
|
||||||
tokenizer.push_to_hub("test-dynamic-tokenizer", use_auth_token=self._token)
|
tokenizer.push_to_hub("test-dynamic-tokenizer", token=self._token)
|
||||||
|
|
||||||
tokenizer = AutoTokenizer.from_pretrained(f"{USER}/test-dynamic-tokenizer", trust_remote_code=True)
|
tokenizer = AutoTokenizer.from_pretrained(f"{USER}/test-dynamic-tokenizer", trust_remote_code=True)
|
||||||
# Can't make an isinstance check because the new_model.config is from the CustomTokenizer class of a dynamic module
|
# Can't make an isinstance check because the new_model.config is from the CustomTokenizer class of a dynamic module
|
||||||
@@ -210,7 +210,7 @@ class TokenizerPushToHubTester(unittest.TestCase):
|
|||||||
bert_tokenizer.save_pretrained(tmp_dir)
|
bert_tokenizer.save_pretrained(tmp_dir)
|
||||||
tokenizer = CustomTokenizerFast.from_pretrained(tmp_dir)
|
tokenizer = CustomTokenizerFast.from_pretrained(tmp_dir)
|
||||||
|
|
||||||
tokenizer.push_to_hub("test-dynamic-tokenizer", use_auth_token=self._token)
|
tokenizer.push_to_hub("test-dynamic-tokenizer", token=self._token)
|
||||||
|
|
||||||
tokenizer = AutoTokenizer.from_pretrained(f"{USER}/test-dynamic-tokenizer", trust_remote_code=True)
|
tokenizer = AutoTokenizer.from_pretrained(f"{USER}/test-dynamic-tokenizer", trust_remote_code=True)
|
||||||
# Can't make an isinstance check because the new_model.config is from the FakeConfig class of a dynamic module
|
# Can't make an isinstance check because the new_model.config is from the FakeConfig class of a dynamic module
|
||||||
|
|||||||
@@ -132,10 +132,10 @@ class GetFromCacheTests(unittest.TestCase):
|
|||||||
"""Test download file from a gated repo fails with correct message when not authenticated."""
|
"""Test download file from a gated repo fails with correct message when not authenticated."""
|
||||||
with self.assertRaisesRegex(EnvironmentError, "You are trying to access a gated repo."):
|
with self.assertRaisesRegex(EnvironmentError, "You are trying to access a gated repo."):
|
||||||
# All files except README.md are protected on a gated repo.
|
# All files except README.md are protected on a gated repo.
|
||||||
cached_file(GATED_REPO, "gated_file.txt", use_auth_token=False)
|
cached_file(GATED_REPO, "gated_file.txt", token=False)
|
||||||
|
|
||||||
def test_has_file_gated_repo(self):
|
def test_has_file_gated_repo(self):
|
||||||
"""Test check file existence from a gated repo fails with correct message when not authenticated."""
|
"""Test check file existence from a gated repo fails with correct message when not authenticated."""
|
||||||
with self.assertRaisesRegex(EnvironmentError, "is a gated repository"):
|
with self.assertRaisesRegex(EnvironmentError, "is a gated repository"):
|
||||||
# All files except README.md are protected on a gated repo.
|
# All files except README.md are protected on a gated repo.
|
||||||
has_file(GATED_REPO, "gated_file.txt", use_auth_token=False)
|
has_file(GATED_REPO, "gated_file.txt", token=False)
|
||||||
|
|||||||
Reference in New Issue
Block a user