🔴 [VLM] Add base model without head (#37033)
* i guess reverted all CdGen classes * style * llava onevision * fix copies * fix some tests * some more tests * dump * skip these * nevermind, i am dumb * revert fix not needed * fixup * fixup * another fixup * more fixup to make ci finally happy * fixup after rebasing * fix qwen tests * add internVL + typos here and there * image token index -> id * style * fix init weights * revert blip-2 not supported * address comments * fix copies * revert blip2 test file as well * as discussed internally, revert back CdGen models * fix some tests * fix more tests for compile * CI red * fix copies * enumerate explicitly allowed models * address comments * fix tests * fixup * style again * add tests for new model class * another fixup ( x _ x ) * [fixup] unused attributes can be removed post-deprecation
This commit is contained in:
committed by
GitHub
parent
3fa8d9c20e
commit
17742bd9c8
@@ -3494,8 +3494,8 @@ class ModelTesterMixin:
|
||||
vision_model_name = [name for name in vision_model_names if hasattr(model_sdpa, name)][0]
|
||||
language_model_name = [name for name in language_model_names if hasattr(model_sdpa, name)][0]
|
||||
|
||||
vision_model_sdpa = getattr(model, vision_model_name)
|
||||
language_model_sdpa = getattr(model, language_model_name)
|
||||
vision_model_sdpa = getattr(model_sdpa, vision_model_name)
|
||||
language_model_sdpa = getattr(model_sdpa, language_model_name)
|
||||
text_attn = "sdpa" if language_model_sdpa._supports_sdpa else "eager"
|
||||
vision_attn = "sdpa" if vision_model_sdpa._supports_sdpa else "eager"
|
||||
|
||||
@@ -4489,7 +4489,8 @@ class ModelTesterMixin:
|
||||
@require_torch_gpu
|
||||
def test_flex_attention_with_grads(self):
|
||||
for model_class in self.all_model_classes:
|
||||
if not model_class._supports_flex_attn:
|
||||
# TODO: raushan, fix for composite models after making VLMs support new attn API
|
||||
if not model_class._supports_flex_attn or self._is_composite:
|
||||
self.skipTest(reason="This model does not support flex attention")
|
||||
config, inputs_dict = self.model_tester.prepare_config_and_inputs_for_common()
|
||||
config._attn_implementation = "flex_attention"
|
||||
|
||||
Reference in New Issue
Block a user