".circleci/git@developer.sourcefind.cn:OpenDAS/torchaudio.git" did not exist on "3cf7f264f427f10b8b33ad1b8a4450aedf92693c"
Unverified Commit 3c15fd19 authored by Sanchit Gandhi, committed by GitHub
Browse files

[Seamless v2] Add FE to auto mapping (#27829)

parent 1d63b0ec
...@@ -78,6 +78,7 @@ FEATURE_EXTRACTOR_MAPPING_NAMES = OrderedDict( ...@@ -78,6 +78,7 @@ FEATURE_EXTRACTOR_MAPPING_NAMES = OrderedDict(
("regnet", "ConvNextFeatureExtractor"), ("regnet", "ConvNextFeatureExtractor"),
("resnet", "ConvNextFeatureExtractor"), ("resnet", "ConvNextFeatureExtractor"),
("seamless_m4t", "SeamlessM4TFeatureExtractor"), ("seamless_m4t", "SeamlessM4TFeatureExtractor"),
("seamless_m4t_v2", "SeamlessM4TFeatureExtractor"),
("segformer", "SegformerFeatureExtractor"), ("segformer", "SegformerFeatureExtractor"),
("sew", "Wav2Vec2FeatureExtractor"), ("sew", "Wav2Vec2FeatureExtractor"),
("sew-d", "Wav2Vec2FeatureExtractor"), ("sew-d", "Wav2Vec2FeatureExtractor"),
......
...@@ -1115,6 +1115,23 @@ class AutomaticSpeechRecognitionPipelineTests(unittest.TestCase): ...@@ -1115,6 +1115,23 @@ class AutomaticSpeechRecognitionPipelineTests(unittest.TestCase):
assert result == EXPECTED_RESULT assert result == EXPECTED_RESULT
@require_torch
@slow
def test_seamless_v2(self):
    """Check English transcription with the SeamlessM4T v2 checkpoint.

    Builds an ``automatic-speech-recognition`` pipeline from
    ``facebook/seamless-m4t-v2-large``, transcribes the first sample of the
    ``hf-internal-testing/librispeech_asr_dummy`` validation split with
    ``tgt_lang="eng"``, and compares the returned text with the expected
    transcription.
    """
    # Local import: the test is gated by ``@require_torch``, so torch is
    # expected to be importable whenever this body actually runs.
    import torch

    # ``@require_torch`` does not imply a GPU is present, so request CUDA only
    # when it is available instead of unconditionally using "cuda:0".
    device = "cuda:0" if torch.cuda.is_available() else "cpu"

    pipe = pipeline(
        "automatic-speech-recognition",
        model="facebook/seamless-m4t-v2-large",
        device=device,
    )

    dataset = load_dataset("hf-internal-testing/librispeech_asr_dummy", "clean", split="validation")
    sample = dataset[0]["audio"]

    # The target language is forwarded to generation through ``generate_kwargs``.
    result = pipe(sample, generate_kwargs={"tgt_lang": "eng"})

    EXPECTED_RESULT = "mister quilter is the apostle of the middle classes and we are glad to welcome his gospel"
    assert result["text"] == EXPECTED_RESULT
@require_torch @require_torch
@slow @slow
def test_chunking_and_timestamps(self): def test_chunking_and_timestamps(self):
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment