[VLM] Separate text-only and vision variants of the same model architecture (#13157)
This commit is contained in:
@@ -18,8 +18,7 @@ def test_can_initialize(model_arch):
|
||||
|
||||
# Avoid OOM
|
||||
def hf_overrides(hf_config: PretrainedConfig) -> PretrainedConfig:
|
||||
if hf_config.model_type == "deepseek_vl_v2":
|
||||
hf_config.update({"architectures": ["DeepseekVLV2ForCausalLM"]})
|
||||
hf_config.update(model_info.hf_overrides)
|
||||
|
||||
if hasattr(hf_config, "text_config"):
|
||||
text_config: PretrainedConfig = hf_config.text_config
|
||||
|
||||
Reference in New Issue
Block a user