Spaces:

jasspier
/

asr_arena

Runtime error

asr_arena / app.py

Update app.py

2aa2fbe verified over 1 year ago

1.09 kB

	import gradio as gr
	import torch
	import torchaudio
	from torchaudio.transforms import Resample

	# 定义模型路径
	model_path = "https://huggingface.co/Tele-AI/TeleSpeech-ASR1.0/resolve/main/large.pt"

	# 下载模型文件
	torch.hub.download_url_to_file(model_path, 'large.pt')

	# 加载模型
	model = torch.jit.load('large.pt')
	model.eval()

	# 定义处理函数
	def transcribe(audio):
	waveform, sample_rate = torchaudio.load(audio)
	resample = Resample(orig_freq=sample_rate, new_freq=16000)
	waveform = resample(waveform)

	input_values = waveform.unsqueeze(0)
	with torch.no_grad():
	logits = model(input_values)
	predicted_ids = torch.argmax(logits, dim=-1)
	transcription = tokenizer.decode(predicted_ids[0])
	return transcription

	# 创建 Gradio 界面
	iface = gr.Interface(
	fn=transcribe,
	inputs=gr.Audio(source="microphone", type="filepath"),
	outputs="text",
	title="TeleSpeech ASR",
	description="Upload an audio file or record your voice to transcribe speech to text using the TeleSpeech ASR model."
	)

	iface.launch()