|
from transformers import pipeline, Wav2Vec2Processor, Wav2Vec2ForSequenceClassification |
|
import gradio as gr |
|
|
|
model_id = "Tirath5504/distilhubert-finetuned-gtzan" |
|
processor = Wav2Vec2Processor.from_pretrained(model_id) |
|
model = Wav2Vec2ForSequenceClassification.from_pretrained(model_id) |
|
pipe = pipeline("audio-classification", model=model, processor=processor) |
|
|
|
def classify_audio(filepath): |
|
preds = pipe(filepath) |
|
outputs = {} |
|
for p in preds: |
|
outputs[p["label"]] = p["score"] |
|
return outputs |
|
|
|
demo = gr.Interface( |
|
fn=classify_audio, inputs=gr.Audio(type="filepath"), outputs=gr.outputs.Label() |
|
) |
|
demo.launch(debug=True) |