[Model] Use merge_by_field_config for MM models (M-N) (#26710)
Signed-off-by: DarkLight1337 <tlleungac@connect.ust.hk>
This commit is contained in:
@@ -631,8 +631,11 @@ class InternS1ForConditionalGeneration(
|
||||
)
|
||||
|
||||
image_token_id = kwargs["image_token_id"]
|
||||
assert isinstance(image_token_id, torch.Tensor)
|
||||
self.img_context_token_id = image_token_id.flatten().unique().item()
|
||||
if isinstance(image_token_id, torch.Tensor):
|
||||
image_token_id = image_token_id.flatten().unique().item()
|
||||
|
||||
assert isinstance(image_token_id, int)
|
||||
self.img_context_token_id = image_token_id
|
||||
|
||||
if pixel_values is not None:
|
||||
h, w = self.config.vision_config.image_size
|
||||
@@ -665,8 +668,11 @@ class InternS1ForConditionalGeneration(
|
||||
)
|
||||
|
||||
video_token_id = kwargs["video_token_id"]
|
||||
assert isinstance(video_token_id, torch.Tensor)
|
||||
self.video_context_token_id = video_token_id.flatten().unique().item()
|
||||
if isinstance(video_token_id, torch.Tensor):
|
||||
video_token_id = video_token_id.flatten().unique().item()
|
||||
|
||||
assert isinstance(video_token_id, int)
|
||||
self.video_context_token_id = video_token_id
|
||||
|
||||
if pixel_values_flat_video is not None:
|
||||
h, w = self.config.vision_config.image_size
|
||||
|
||||
Reference in New Issue
Block a user