File size: 490 Bytes
9de729b
8a965da
9de729b
973bb39
33d11d7
61fdbff
d9a32db
db75012
cea67c6
07a3709
1c3fdf6
 
 
68ed0e8
9de729b
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
# TEST MODEL

from transformers import pipeline


# Build the zero-shot audio classification pipeline from the hosted checkpoint.
# NOTE(review): the zero-shot-audio-classification task is documented for
# CLAP-style (audio/text contrastive) models; confirm that this Whisper
# checkpoint can actually be loaded for this task.
classifier = pipeline(task="zero-shot-audio-classification", model="mskov/whisper-small-esc50")
# classifier = pipeline(model="mskov/roberta-base-toxicity")

# Local audio clip to classify and the free-text labels to score it against.
audio = "./candy-bar-chewing.wav"
labels = ["Sound of a dog", "Sound of vaccum cleaner", "chewing", "sneezing"]

# A single call scores every candidate label; the labels must be passed as
# `candidate_labels` (not `input_ids`). The pipeline returns a list of
# {"score": ..., "label": ...} dicts, one per candidate label.
result = classifier(audio, candidate_labels=labels)

# Select the best-scoring label explicitly rather than relying on the
# ordering of the returned list.
predicted_label = max(result, key=lambda entry: entry["score"])["label"]
print(f"Predicted label: {predicted_label}")