# Demo script: classify a local audio file with a Hugging Face pipeline and
# print the scored labels.
from transformers import pipeline

# No task is given explicitly; pipeline() is left to infer it from the model
# repository. NOTE(review): the model id and the sample labels below suggest
# keyword spotting (audio classification) -- confirm against the model card.
classifier = pipeline(model="superb/wav2vec2-base-superb-ks")

# Classify a local audio file; "1.flac" is resolved relative to the current
# working directory.
res = classifier("1.flac")
# Alternative kept from the original: pass a remote URL instead of a local path.
# res = classifier("https://huggingface.co/datasets/Narsil/asr_dummy/resolve/main/1.flac")

# print() already applies str() to its argument, so no explicit conversion is
# needed.
print(res)
# Example output recorded in the original script:
# [{'score': 0.997, 'label': '_unknown_'}, {'score': 0.002, 'label': 'left'}, {'score': 0.0, 'label': 'yes'}, {'score': 0.0, 'label': 'down'}, {'score': 0.0, 'label': 'stop'}]