Spaces:

Dougaya
/

Audio_Transcription

Sleeping

App Files Files Community

Audio_Transcription / app.py

Dougaya

Update app.py

7bc32a4 verified 4 months ago

raw

history blame contribute delete

3.69 kB

	# importer gradio
	import gradio as gr
	from transformers import pipeline
	# Importer nemo.collections.asr
	import nemo.collections.asr as nemo_asr
	# Instancier le modèle
	asr_canary = nemo_asr.models.ASRModel.from_pretrained("nvidia/canary-1b-flash")
	# Instanstier le modèle
	asr_whisper = pipeline("automatic-speech-recognition", model="openai/whisper-small")

	# Fonction de transcription whisper
	def transcrire1(fpath):
	output = asr_whisper(fpath)
	return output["text"]

	# Fonction de transcription canary-1b-flash
	def transcrire2(fpath, source_lang, target_lang):
	transcriptions = asr_canary.transcribe([fpath],
	source_lang = source_lang, target_lang = target_lang)
	text = transcriptions[0].text

	return text

	# Créer les blocs
	demo = gr.Blocks(theme='JohnSmith9982/small_and_pretty')
	# Créer un interface ASR whisper avec un microphone
	mic_transcrire = gr.Interface(
	fn=transcrire1,
	inputs=gr.Audio(sources="microphone",
	type="filepath"),
	cache_examples=True,
	outputs=gr.Textbox(label="Transcription",
	lines=3),
	title = 'Transcrire par microphone - Whisper',
	description="""Transcription audio en temps réel via microphone avec le modèle Whisper d’OpenAI.

	Parlez directement dans votre microphone pour obtenir une transcription instantanée du contenu sonore."""
	)

	# Créer un interface ASR whisper par audio
	fich_transcrire = gr.Interface(
	fn=transcrire1,
	inputs=gr.Audio(sources="upload",
	type="filepath"),
	outputs=gr.Textbox(label="Transcription",
	lines=3),
	title = 'Transcrire un fichier audio - Whisper',
	description="""Transcription automatique d’un fichier audio téléversé avec le modèle Whisper d’OpenAI.

	Téléversez un fichier audio (wav, mp3, etc.) pour obtenir une transcription textuelle précise."""
	)

	# Créer un interface ASR canary avec un microphone
	mic_transcrire1 = gr.Interface(
	fn=transcrire2,
	inputs=[gr.Audio(sources="microphone",type="filepath"),
	gr.Dropdown(choices = ['fr', 'en'], label ='Source languge'),
	gr.Dropdown(choices = ['fr', 'en'], label = 'Target language')],
	cache_examples=True,
	outputs=gr.Textbox(label="Transcription",
	lines=3),
	title = 'Transcrire par microphone - Canary',
	description="""Transcription et traduction multilingue en temps réel via microphone avec le modèle Canary (NVIDIA).

	Enregistrez via microphone, sélectionnez la langue source et cible, et obtenez la transcription ou traduction instantanément."""
	)

	# Créer un interface ASR canary par audio
	fich_transcrire1 = gr.Interface(
	fn=transcrire2,
	inputs=[gr.Audio(sources="upload",type="filepath"),
	gr.Dropdown(choices = ['fr', 'en'], label ='Source languge'),
	gr.Dropdown(choices = ['fr', 'en'], label ='Target language')],
	outputs=gr.Textbox(label="Transcription",
	lines=3),
	title= 'Transcrire un fichier audio - Canary',
	description="""Transcription et traduction multilingue à partir d’un fichier audio téléversé avec le modèle Canary (NVIDIA).

	Téléversez un fichier audio, choisissez les langues source et cible, puis recevez la transcription ou traduction correspondante."""
	)

	# Faire un tabbed des interfaces sur demo
	with demo:
	gr.TabbedInterface(
	[mic_transcrire,
	fich_transcrire,
	mic_transcrire1,
	fich_transcrire1],
	["Transcrire Microphone",
	"Transcrire Audio",
	"Transcrire Microphone",
	"Transcrire Audio"],
	)

	demo.launch()