Spaces:

dashakoryakovskaya
/

Bilingual_Text-based_Emotion_Recognition

Running

App Files Community

dashakoryakovskaya committed on Jun 11

Commit

f4dbd19

verified ·

1 Parent(s): 538dfc3

Update app.py

Browse files

Files changed (1) hide show

app.py +59 -18

app.py CHANGED Viewed

@@ -62,21 +62,35 @@ def plotly_plot_audio(audio_path):
             "⚠️ Processing Error"
         )
-def create_demo():
     with gr.Blocks(theme=gr.themes.Soft(), title="Emotion Detection") as demo:
         gr.Markdown("# Text-based bilingual emotion recognition")
         with gr.Row():
-            with gr.Column():
-                audio_input = gr.Audio(
-                    sources=["upload", "microphone"],
-                    type="filepath",
-                    label="Record or Upload Audio",
-                    format="wav",
-                    interactive=True
-                )
-            with gr.Column():
-                text_input = gr.Text(label="Write Text")
         with gr.Row():
             top_emotion = gr.Markdown("## 🏆 Dominant Emotion: Waiting for input ...",
@@ -85,24 +99,51 @@ def create_demo():
         with gr.Row():
             text_plot = gr.Plot(label="Text Analysis")
         transcription = gr.Textbox(
             label="📜 Transcription Results",
             placeholder="Transcribed text will appear here...",
             lines=3,
             max_lines=6
         )
-        if text_input is not None:
-            text_input.change(fn=plotly_plot_text, inputs=text_input, outputs=[text_plot, transcription, top_emotion])
-        elif audio_input:
-            audio_input.change(fn=plotly_plot_audio, inputs=audio_input, outputs=[text_plot, transcription, top_emotion])
     return demo
 if __name__ == "__main__":
-    device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
     model = Mamba(num_layers = 2, d_input = 1024, d_model = 512, num_classes=7, model_name='jina', pooling=None).to(device)
-    checkpoint = torch.load("Mamba_jina_checkpoint.pth", map_location=torch.device('cpu'))
     model.load_state_dict(checkpoint['model_state_dict'])
     demo = create_demo()
     demo.launch()

             "⚠️ Processing Error"
         )
+def plotly_plot_audio(audio_path):
+    data = pd.DataFrame()
+    data['Emotion'] = ['😠 anger', '🤢 disgust', '😨 fear', '😄 joy/happiness', '😐 neutral', '😢 sadness', '😲 surprise/enthusiasm']
+    try:
+        text = transcribe_audio(audio_path)
+        data['Probability'] = model.predict_proba([text])[0].tolist() if text.strip() else [0.0] * data.shape[0]
+        p = px.bar(data, x='Emotion', y='Probability', color="Probability")
+        return (
+            p,
+            f"🗣️ Transcription:\n{text}",
+            f"## 🏆 Dominant Emotion: {data['Emotion'].values[np.argmax(np.array(data['Probability']))]}"
+        )
+    except Exception as e:
+        logging.error(f"Processing failed: {e}")
+        data['Probability'] = [0] * data.shape[0]
+        p = px.bar(data, x='Emotion', y='Probability', color="Probability")
+        return (
+            p,
+            "❌ Error processing audio",
+            "⚠️ Processing Error"
+        )
+def create_demo_text():
     with gr.Blocks(theme=gr.themes.Soft(), title="Emotion Detection") as demo:
         gr.Markdown("# Text-based bilingual emotion recognition")
         with gr.Row():
+            text_input = gr.Textbox(label="Write Text")
         with gr.Row():
             top_emotion = gr.Markdown("## 🏆 Dominant Emotion: Waiting for input ...",
         with gr.Row():
             text_plot = gr.Plot(label="Text Analysis")
+        text_input.change(fn=plotly_plot_text, inputs=text_input, outputs=[text_plot, top_emotion])
+    return demo
+def create_demo_audio():
+    with gr.Blocks(theme=gr.themes.Soft(), title="Emotion Detection") as demo:
+        gr.Markdown("# Text-based bilingual emotion recognition")
+        with gr.Row():
+            audio_input = gr.Audio(
+                sources=["upload", "microphone"],
+                type="filepath",
+                label="Record or Upload Audio",
+                format="wav",
+                interactive=True
+            )
+        with gr.Row():
+            top_emotion = gr.Markdown("## 🏆 Dominant Emotion: Waiting for input ...",
+                                      elem_classes="dominant-emotion")
+        with gr.Row():
+            text_plot = gr.Plot(label="Text Analysis")
         transcription = gr.Textbox(
             label="📜 Transcription Results",
             placeholder="Transcribed text will appear here...",
             lines=3,
             max_lines=6
         )
+        audio_input.change(fn=plotly_plot_audio, inputs=audio_input, outputs=[text_plot, transcription, top_emotion])
     return demo
+def create_demo():
+    text = create_demo_text()
+    audio = create_demo_audio()
+    demo = gr.TabbedInterface(
+        [text, audio],
+        ["Text Prediction", "Transcribed Audio Prediction"],
+    )
+    return demo
 if __name__ == "__main__":
     model = Mamba(num_layers = 2, d_input = 1024, d_model = 512, num_classes=7, model_name='jina', pooling=None).to(device)
+    checkpoint = torch.load("models/Mamba_jina_checkpoint.pth", map_location=torch.device('cpu'))
     model.load_state_dict(checkpoint['model_state_dict'])
     demo = create_demo()
     demo.launch()