File size: 490 Bytes
9de729b 8a965da 9de729b 973bb39 33d11d7 61fdbff d9a32db db75012 cea67c6 07a3709 1c3fdf6 68ed0e8 9de729b |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 |
# TEST MODEL
from transformers import pipeline
# Build a zero-shot audio classification pipeline from the Hub checkpoint.
# NOTE(review): the checkpoint name suggests a Whisper model fine-tuned on
# ESC-50, while the zero-shot audio pipeline is normally used with CLAP-style
# models -- confirm this checkpoint is compatible with the task.
classifier = pipeline(task="zero-shot-audio-classification", model="mskov/whisper-small-esc50")

# Audio clip to classify and the candidate labels it is scored against.
audio = "./candy-bar-chewing.wav"
labels = ["Sound of a dog", "Sound of vaccum cleaner", "chewing", "sneezing"]

# A single call scores every candidate label; the labels must be passed as
# `candidate_labels` (the pipeline has no `input_ids` argument), so there is
# no need to loop over the labels and re-run the same inference each time.
result = classifier(audio, candidate_labels=labels)

# The pipeline returns a list of {"score", "label"} dicts ordered from the
# highest score to the lowest, so the first entry is the predicted label.
predicted_label = result[0]["label"]
print(f"Predicted label: {predicted_label}")