Spaces:

AescF
/

LanguageClass

Runtime error

App Files Files Community

LanguageClass / app.py

AescF

Update app.py

db14524 about 2 years ago

raw

history blame

2.61 kB

	import gradio as gr
	import librosa
	import numpy as np
	import torch
	from transformers import pipeline


	# Class index -> language name lookup (indices 0..44, in list order).
	# It is not referenced anywhere else in the visible part of this file.
	# NOTE(review): the "Ukranian" spelling is kept exactly as found; presumably it
	# mirrors an upstream label name -- confirm before correcting it.
	language_classes = dict(
	    enumerate(
	        (
	            "Arabic",
	            "Basque",
	            "Breton",
	            "Catalan",
	            "Chinese_China",
	            "Chinese_Hongkong",
	            "Chinese_Taiwan",
	            "Chuvash",
	            "Czech",
	            "Dhivehi",
	            "Dutch",
	            "English",
	            "Esperanto",
	            "Estonian",
	            "French",
	            "Frisian",
	            "Georgian",
	            "German",
	            "Greek",
	            "Hakha_Chin",
	            "Indonesian",
	            "Interlingua",
	            "Italian",
	            "Japanese",
	            "Kabyle",
	            "Kinyarwanda",
	            "Kyrgyz",
	            "Latvian",
	            "Maltese",
	            "Mongolian",
	            "Persian",
	            "Polish",
	            "Portuguese",
	            "Romanian",
	            "Romansh_Sursilvan",
	            "Russian",
	            "Sakha",
	            "Slovenian",
	            "Spanish",
	            "Swedish",
	            "Tamil",
	            "Tatar",
	            "Turkish",
	            "Ukranian",
	            "Welsh",
	        )
	    )
	)




	# Account name placeholder; not read anywhere else in the visible file.
	username = "AescF"
	# Hub model id handed to the audio-classification pipeline below.
	model_id = "AescF/hubert-base-ls960-finetuned-common_language"

	# Run on the first CUDA device when torch reports one, otherwise on the CPU.
	if torch.cuda.is_available():
	    device = "cuda:0"
	else:
	    device = "cpu"

	# Built once at import time; classify_audio reuses this module-level object.
	pipe = pipeline(task="audio-classification", model=model_id, device=device)

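	# Disabled alternative to calling `pipe(filepath)` directly: it runs the
	# pipeline stages by hand so the input can be padded/truncated to a
	# max_length of 16_000 * 30 samples (presumably 30 s at 16 kHz) first.
	# def predict_trunc(filepath):
	#     preprocessed = pipe.preprocess(filepath)
	#     truncated = pipe.feature_extractor.pad(preprocessed, truncation=True, max_length=16_000 * 30)
	#     model_outputs = pipe.forward(truncated)
	#     outputs = pipe.postprocess(model_outputs)
	#
	#     return outputs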


	def classify_audio(filepath):
	    """Classify the language spoken in an audio file.

	    Args:
	        filepath: Path to the audio file to classify, as delivered by the
	            ``gr.Audio(type="filepath")`` input. May be ``None`` or empty
	            when the form is submitted without audio.

	    Returns:
	        dict: Maps each prediction's ``"label"`` to its ``"score"``, one
	        entry per item returned by the module-level ``pipe``.

	    Raises:
	        gr.Error: If no audio file was provided.
	    """
	    if not filepath:
	        # Show a readable message in the UI instead of letting the pipeline
	        # fail on a missing input.
	        raise gr.Error("Please upload or record an audio clip first.")

	    # Alternative (currently disabled): preds = predict_trunc(filepath)
	    preds = pipe(filepath)
	    return {pred["label"]: pred["score"] for pred in preds}


	# Heading shown at the top of the demo page.
	title = "Language Classification Model"

	# Pieces of the description text; each piece carries its own trailing
	# newline, so they are joined with an empty separator.
	_description_parts = (
	    "This model has been fine-tuned on a dataset containing various languages\n",
	    "including Arabic, Basque, Catalan, Chinese, English, French, German, Japanese, Russian, and more.\n",
	    "It is designed for audio classification, allowing it to predict the language spoken in a given audio clip.\n",
	    "Try it out by uploading an audio sample and see how accurately it can identify the language being spoken!\n",
	    "For more info, check out [GITHUB](https://github.com/AEscF)",
	)
	description = "".join(_description_parts)
	# Example clips offered in the UI: one single-element row per file, each
	# path written relative to the current directory.
	filenames = [
	    [f"./{clip_name}"]
	    for clip_name in ("EN_0049.wav", "FR_0098.wav", "JP_0222.wav")
	]
	# The audio input hands classify_audio a file path; results go to a label widget.
	audio_input = gr.Audio(type="filepath")
	prediction_output = gr.Label(label="Predictions")

	# Wire the classifier, its input/output components, the page text and the
	# example clips into a single interface, then start serving it.
	demo = gr.Interface(
	    fn=classify_audio,
	    inputs=audio_input,
	    outputs=[prediction_output],
	    title=title,
	    description=description,
	    examples=filenames,
	)
	demo.launch()