Update README.md

cc @patil-suraj
This commit is contained in:
Patrick von Platen
2021-07-20 13:51:15 +02:00
committed by GitHub
parent 66197adc98
commit 13fefdf340

View File

@@ -114,7 +114,7 @@ from transformers import RobertaConfig
model_dir = "./norwegian-roberta-base" # ${MODEL_DIR} model_dir = "./norwegian-roberta-base" # ${MODEL_DIR}
config = RobertaConfig.from_pretrained("roberta-base") config = RobertaConfig.from_pretrained("roberta-base", vocab_size=tokenizer.vocab_size)
config.save_pretrained(model_dir) config.save_pretrained(model_dir)
``` ```
@@ -211,7 +211,7 @@ from transformers import GPT2Config
model_dir = "./norwegian-gpt2" # ${MODEL_DIR} model_dir = "./norwegian-gpt2" # ${MODEL_DIR}
config = GPT2Config.from_pretrained("gpt2", resid_pdrop=0.0, embd_pdrop=0.0, attn_pdrop=0.0) config = GPT2Config.from_pretrained("gpt2", resid_pdrop=0.0, embd_pdrop=0.0, attn_pdrop=0.0, vocab_size=tokenizer.vocab_size)
config.save_pretrained(model_dir) config.save_pretrained(model_dir)
``` ```
@@ -349,7 +349,7 @@ from transformers import T5Config
model_dir = "./norwegian-t5-base" # ${MODEL_DIR} model_dir = "./norwegian-t5-base" # ${MODEL_DIR}
config = T5Config.from_pretrained("google/t5-v1_1-base") config = T5Config.from_pretrained("google/t5-v1_1-base", vocab_size=tokenizer.vocab_size)
config.save_pretrained(model_dir) config.save_pretrained(model_dir)
``` ```