MERaLiON
/

MERaLiON-AudioLLM-Whisper-SEA-LION

@@ -1,18 +1,4 @@
-# coding=utf-8
-# Copyright 2024 the HuggingFace Inc. team. All rights reserved.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-"""PyTorch MERaLiON model."""
 import math
 from dataclasses import dataclass
@@ -1161,37 +1147,6 @@ class MERaLiONForConditionalGeneration(MERaLiONPreTrainedModel, GenerationMixin)
         self.vocab_size = model_embeds.num_embeddings
         return model_embeds
-    def _get_multimodal_input_embeds(
-        self,
-        input_ids_left,
-        input_ids_right,
-        attention_mask_left,
-        attention_mask_right,
-        speech_audio_contexts_embeds,
-        speech_audio_contexts_atts,
-    ):
-        input_embeds_left = self.text_decoder.base_model.embed_tokens(input_ids_left)
-        input_embeds_right = self.text_decoder.base_model.embed_tokens(input_ids_right)
-        multimodal_embeds = torch.cat(
-            [
-                input_embeds_left,
-                speech_audio_contexts_embeds,
-                input_embeds_right,
-            ],
-            dim=1,
-        )
-        multimodal_attention_mask = torch.cat(
-            [
-                attention_mask_left,
-                speech_audio_contexts_atts,
-                attention_mask_right,
-            ],
-            dim=1,
-        )
-        return multimodal_embeds, multimodal_attention_mask
     @add_start_docstrings_to_model_forward(MERALION_INPUTS_DOCSTRING)
     @replace_return_docstrings(output_type=MERaLiONOutputWithPast, config_class=_CONFIG_FOR_DOC)
     def forward(

+"""PyTorch MERaLiON AudioLLM model."""
 import math
 from dataclasses import dataclass
         self.vocab_size = model_embeds.num_embeddings
         return model_embeds
     @add_start_docstrings_to_model_forward(MERALION_INPUTS_DOCSTRING)
     @replace_return_docstrings(output_type=MERaLiONOutputWithPast, config_class=_CONFIG_FOR_DOC)
     def forward(