Spaces:

tenet
/

HRM

Runtime error

tenet committed on Aug 21

Commit

72165a4

verified ·

1 Parent(s): 4dcf554

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,6 +1,6 @@
 import gradio as gr
 from transformers import pipeline
 # ----------------
 # TEXT MODELS
 # ----------------
@@ -42,9 +42,11 @@ segmentation_pipeline = pipeline(
 def segment_image(image):
     results = segmentation_pipeline(image)
-    # Gradio AnnotatedImage expects (image, annotations)
-    ann = [(image, r["mask"]) for r in results]
-    return (image, ann)
 # ----------------
@@ -52,10 +54,13 @@ def segment_image(image):
 # ----------------
 asr_pipeline = pipeline("automatic-speech-recognition", model="openai/whisper-tiny")
-def transcribe(audio):
-    return asr_pipeline(audio)["text"]
 # ----------------
 # GRADIO APP
 # ----------------

 import gradio as gr
 from transformers import pipeline
+import librosa
 # ----------------
 # TEXT MODELS
 # ----------------
 def segment_image(image):
     results = segmentation_pipeline(image)
+    # Combine masks into a single image with labels
+    annotated = {}
+    for r in results:
+        annotated[r["label"]] = r["mask"]  # label → mask
+    return (image, annotated)
 # ----------------
 # ----------------
 asr_pipeline = pipeline("automatic-speech-recognition", model="openai/whisper-tiny")
+def transcribe(audio):
+    # Load with max 30s duration
+    speech, sr = librosa.load(audio, sr=16000, duration=30)
+    return asr_pipeline({"array": speech, "sampling_rate": sr}, return_timestamps=True)["text"]
 # ----------------
 # GRADIO APP
 # ----------------