AlexHung29629
/

test_mllama_v12

Feature Extraction

Model card Files Files and versions Community

alex-ht committed on Nov 25, 2024

Commit

7b01696

·

1 Parent(s): f767f82

update

Files changed (1) hide show

ultravox_processing.py +2 -1

ultravox_processing.py CHANGED Viewed

@@ -171,6 +171,7 @@ class UltravoxProcessor(transformers.ProcessorMixin):
                 text, list
             ), "Text must be a list."
             processed_text = []
             for t in text:
                 if self.audio_placeholder in t:
                     if "audio_token_len" not in data:
@@ -184,7 +185,7 @@ class UltravoxProcessor(transformers.ProcessorMixin):
                             add_special_tokens=False,
                         )
                     )
-                    data["audio_token_start_idx"] = [start_idx]
                     # Replace the audio placeholder with the audio token.
                     #   e.g. "Transcribe\n<|audio|>" -> "Transcribe </s></s></s></s></s></s></s></s>"

                 text, list
             ), "Text must be a list."
             processed_text = []
+            data["audio_token_start_idx"] = []
             for t in text:
                 if self.audio_placeholder in t:
                     if "audio_token_len" not in data:
                             add_special_tokens=False,
                         )
                     )
+                    data["audio_token_start_idx"].append(start_idx)
                     # Replace the audio placeholder with the audio token.
                     #   e.g. "Transcribe\n<|audio|>" -> "Transcribe </s></s></s></s></s></s></s></s>"