Add checkpoint links in a few config classes (#19910)
* For CLIP * Others * update Co-authored-by: ydshieh <ydshieh@users.noreply.github.com>
This commit is contained in:
@@ -254,7 +254,9 @@ class CLIPVisionConfig(PretrainedConfig):
|
||||
class CLIPConfig(PretrainedConfig):
|
||||
r"""
|
||||
[`CLIPConfig`] is the configuration class to store the configuration of a [`CLIPModel`]. It is used to instantiate
|
||||
CLIP model according to the specified arguments, defining the text model and vision model configs.
|
||||
CLIP model according to the specified arguments, defining the text model and vision model configs. Instantiating a
|
||||
configuration with the defaults will yield a similar configuration to that of the CLIP
|
||||
[openai/clip-vit-base-patch32](https://huggingface.co/openai/clip-vit-base-patch32) architecture.
|
||||
|
||||
Configuration objects inherit from [`PretrainedConfig`] and can be used to control the model outputs. Read the
|
||||
documentation from [`PretrainedConfig`] for more information.
|
||||
|
||||
@@ -273,7 +273,8 @@ class GroupViTConfig(PretrainedConfig):
|
||||
r"""
|
||||
[`GroupViTConfig`] is the configuration class to store the configuration of a [`GroupViTModel`]. It is used to
|
||||
instantiate a GroupViT model according to the specified arguments, defining the text model and vision model
|
||||
configs.
|
||||
configs. Instantiating a configuration with the defaults will yield a similar configuration to that of the GroupViT
|
||||
[nvidia/groupvit-gcc-yfcc](https://huggingface.co/nvidia/groupvit-gcc-yfcc) architecture.
|
||||
|
||||
Configuration objects inherit from [`PretrainedConfig`] and can be used to control the model outputs. Read the
|
||||
documentation from [`PretrainedConfig`] for more information.
|
||||
|
||||
@@ -253,7 +253,8 @@ class OwlViTConfig(PretrainedConfig):
|
||||
r"""
|
||||
[`OwlViTConfig`] is the configuration class to store the configuration of an [`OwlViTModel`]. It is used to
|
||||
instantiate an OWL-ViT model according to the specified arguments, defining the text model and vision model
|
||||
configs.
|
||||
configs. Instantiating a configuration with the defaults will yield a similar configuration to that of the OWL-ViT
|
||||
[google/owlvit-base-patch32](https://huggingface.co/google/owlvit-base-patch32) architecture.
|
||||
|
||||
Configuration objects inherit from [`PretrainedConfig`] and can be used to control the model outputs. Read the
|
||||
documentation from [`PretrainedConfig`] for more information.
|
||||
|
||||
@@ -272,6 +272,8 @@ class XCLIPConfig(PretrainedConfig):
|
||||
r"""
|
||||
[`XCLIPConfig`] is the configuration class to store the configuration of a [`XCLIPModel`]. It is used to
|
||||
instantiate X-CLIP model according to the specified arguments, defining the text model and vision model configs.
|
||||
Instantiating a configuration with the defaults will yield a similar configuration to that of the X-CLIP
|
||||
[microsoft/xclip-base-patch32](https://huggingface.co/microsoft/xclip-base-patch32) architecture.
|
||||
|
||||
Configuration objects inherit from [`PretrainedConfig`] and can be used to control the model outputs. Read the
|
||||
documentation from [`PretrainedConfig`] for more information.
|
||||
|
||||
@@ -40,16 +40,12 @@ _re_checkpoint = re.compile("\[(.+?)\]\((https://huggingface\.co/.+?)\)")
|
||||
|
||||
|
||||
CONFIG_CLASSES_TO_IGNORE_FOR_DOCSTRING_CHECKPOINT_CHECK = {
|
||||
"CLIPConfig",
|
||||
"OwlViTConfig",
|
||||
"GroupViTConfig",
|
||||
"DecisionTransformerConfig",
|
||||
"EncoderDecoderConfig",
|
||||
"RagConfig",
|
||||
"SpeechEncoderDecoderConfig",
|
||||
"VisionEncoderDecoderConfig",
|
||||
"VisionTextDualEncoderConfig",
|
||||
"XCLIPConfig",
|
||||
}
|
||||
|
||||
|
||||
|
||||
Reference in New Issue
Block a user