[Misc] Update config loading for Qwen2-VL and remove Granite (#8837)

This commit is contained in:
Roger Wang
2024-09-26 07:45:30 -07:00
committed by GitHub
parent 7193774b1f
commit 4bb98f2190
7 changed files with 144 additions and 224 deletions

View File

@@ -25,6 +25,7 @@ from typing import Any, Dict, Iterable, List, Optional, Tuple, Union
import torch
from torch import nn
from transformers import GraniteConfig
from vllm.attention import Attention, AttentionMetadata
from vllm.config import CacheConfig, LoRAConfig
@@ -48,7 +49,6 @@ from vllm.model_executor.model_loader.weight_utils import (
default_weight_loader, kv_cache_scales_loader, maybe_remap_kv_scale_name)
from vllm.model_executor.sampling_metadata import SamplingMetadata
from vllm.sequence import IntermediateTensors
from vllm.transformers_utils.configs.granite import GraniteConfig
from vllm.utils import is_hip
from .interfaces import SupportsLoRA