AlexHung29629
/

test_mllama_v12

Feature Extraction

Model card Files Files and versions Community

AlexHung29629 committed on Nov 26, 2024

Commit

8769079

·

verified ·

1 Parent(s): c1a531e

Update ultravox_processing.py

Files changed (1) hide show

ultravox_processing.py +2 -2

ultravox_processing.py CHANGED Viewed

@@ -171,14 +171,14 @@ class UltravoxProcessor(transformers.ProcessorMixin):
                     start_idx = len(
                         self.tokenizer.encode(
-                            t[: t.index(self.audio_placeholder)],
                             add_special_tokens=False,
                         )
                     )
                     data["audio_token_start_idx"].append(start_idx)
                     # Replace the audio placeholder with the audio token.
-                    #   e.g. "Transcribe\n<|audio|>" -> "Transcribe </s></s></s></s></s></s></s></s>"
                     #        where the number of </s> is the number of audio frames.
                     t = t.replace(
                         self.audio_placeholder,

                     start_idx = len(
                         self.tokenizer.encode(
+                            t.split(self.audio_placeholder)[0],
                             add_special_tokens=False,
                         )
                     )
                     data["audio_token_start_idx"].append(start_idx)
                     # Replace the audio placeholder with the audio token.
+                    #   e.g. "Transcribe <|audio|>" -> "Transcribe </s></s></s></s></s></s></s></s>"
                     #        where the number of </s> is the number of audio frames.
                     t = t.replace(
                         self.audio_placeholder,