Skip to content

Commit 4a0bcc8

Browse files
Isotr0py authored and rjgleaton committed
Fix missing fast tokenizer/image_processor in whisper/qwen2.5-omni processor (huggingface#39244)
* fix missing fast tokenizer in whisper processor

  Signed-off-by: Isotr0py <[email protected]>

* fix processor test

  Signed-off-by: Isotr0py <[email protected]>

* fix qwen2.5 omni processor

  Signed-off-by: Isotr0py <[email protected]>

---------

Signed-off-by: Isotr0py <[email protected]>
1 parent 13dfb22 commit 4a0bcc8

File tree

3 files changed

+6
-6
lines changed

3 files changed

+6
-6
lines changed

src/transformers/models/qwen2_5_omni/processing_qwen2_5_omni.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -93,8 +93,8 @@ class Qwen2_5OmniProcessor(ProcessorMixin):
9393
"""
9494

9595
attributes = ["image_processor", "video_processor", "feature_extractor", "tokenizer"]
96-
image_processor_class = "Qwen2VLImageProcessor"
97-
video_processor_class = "Qwen2VLVideoProcessor"
96+
image_processor_class = "AutoImageProcessor"
97+
video_processor_class = "AutoVideoProcessor"
9898
feature_extractor_class = "WhisperFeatureExtractor"
9999
tokenizer_class = ("Qwen2Tokenizer", "Qwen2TokenizerFast")
100100

src/transformers/models/whisper/processing_whisper.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -35,7 +35,7 @@ class WhisperProcessor(ProcessorMixin):
3535
"""
3636

3737
feature_extractor_class = "WhisperFeatureExtractor"
38-
tokenizer_class = "WhisperTokenizer"
38+
tokenizer_class = ("WhisperTokenizer", "WhisperTokenizerFast")
3939

4040
def __init__(self, feature_extractor, tokenizer):
4141
super().__init__(feature_extractor, tokenizer)

tests/models/whisper/test_processor_whisper.py

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -19,7 +19,7 @@
1919
import numpy as np
2020
import pytest
2121

22-
from transformers import WhisperTokenizer, is_speech_available
22+
from transformers import WhisperTokenizer, WhisperTokenizerFast, is_speech_available
2323
from transformers.testing_utils import require_sentencepiece, require_torch, require_torchaudio
2424

2525
from .test_feature_extraction_whisper import floats_list
@@ -60,7 +60,7 @@ def test_save_load_pretrained_default(self):
6060
processor = WhisperProcessor.from_pretrained(self.tmpdirname)
6161

6262
self.assertEqual(processor.tokenizer.get_vocab(), tokenizer.get_vocab())
63-
self.assertIsInstance(processor.tokenizer, WhisperTokenizer)
63+
self.assertIsInstance(processor.tokenizer, WhisperTokenizerFast)
6464

6565
self.assertEqual(processor.feature_extractor.to_json_string(), feature_extractor.to_json_string())
6666
self.assertIsInstance(processor.feature_extractor, WhisperFeatureExtractor)
@@ -77,7 +77,7 @@ def test_save_load_pretrained_additional_features(self):
7777
)
7878

7979
self.assertEqual(processor.tokenizer.get_vocab(), tokenizer_add_kwargs.get_vocab())
80-
self.assertIsInstance(processor.tokenizer, WhisperTokenizer)
80+
self.assertIsInstance(processor.tokenizer, WhisperTokenizerFast)
8181

8282
self.assertEqual(processor.feature_extractor.to_json_string(), feature_extractor_add_kwargs.to_json_string())
8383
self.assertIsInstance(processor.feature_extractor, WhisperFeatureExtractor)

0 commit comments

Comments
 (0)