Spaces:

DTabs
/

rephrase

Running

App Files Files Community

DTabs committed 30 days ago

Commit

eb939d7

verified ·

1 Parent(s): 834bfd1

Update app.py

Browse files

Files changed (1) hide show

app.py +77 -42

app.py CHANGED Viewed

@@ -3,15 +3,17 @@ from parrot import Parrot
 import nltk
 from nltk.tokenize import sent_tokenize, word_tokenize
 import re
 # -----------------------------
 # Setup
 # -----------------------------
-nltk.data.path.append("./nltk_data")  # Local punkt
 parrot = None  # Lazy-loaded global model
 def get_parrot():
     global parrot
     if parrot is None:
         print("⏳ Loading Parrot model for the first time...")
@@ -24,7 +26,7 @@ MAX_TOKENS = 150  # limit per chunk for stability
 # -----------------------------
-# Helper: Common utilities
 # -----------------------------
 def clean_sentence(sent):
     sent = sent.strip()
@@ -46,6 +48,22 @@ def split_long_sentence(sentence, max_tokens=MAX_TOKENS):
     return [" ".join(words[i:i + max_tokens]) for i in range(0, len(words), max_tokens)]
 # -----------------------------
 # 🔹 App 1: Full Paragraph Rephraser
 # -----------------------------
@@ -58,57 +76,47 @@ def rephrase(text):
         chunks = split_long_sentence(s)
         paraphrased_chunks = []
         for c in chunks:
-            try:
-                p = model.augment(
-                    input_phrase=c,
-                    do_diverse=True,
-                    adequacy_threshold=0.85,
-                    fluency_threshold=0.9,
-                )
-                paraphrased_chunks.append(p[0][0] if p else c)
-            except Exception:
                 paraphrased_chunks.append(c)
         rephrased.append(" ".join(paraphrased_chunks))
     return clean_sentences(rephrased)
-rephrase_iface = gr.Interface(
-    fn=rephrase,
-    inputs=gr.Textbox(lines=10, placeholder="Paste your text here..."),
-    outputs="text",
-    title="Parrot Rephraser (Long Text)",
-    description="Paraphrases long text while maintaining punctuation and capitalization.",
-)
 # -----------------------------
 # 🔹 App 2: Sentence-wise Multiple Paraphrases
 # -----------------------------
 def generate_unique_paraphrases(sentence, N_OPTIONS=3):
     model = get_parrot()
-    try:
-        paraphrases = model.augment(
-            input_phrase=sentence,
-            do_diverse=True,
-            adequacy_threshold=0.85,
-            fluency_threshold=0.9,
-        )
-    except Exception:
-        paraphrases = []
-    if paraphrases:
-        texts = [p[0] for p in paraphrases]
-        unique = []
-        for t in texts:
-            if t not in unique:
-                unique.append(t)
-            if len(unique) == N_OPTIONS:
-                break
-        return unique
-    else:
         return [sentence]
 def rephrase_sentencewise_unique(text, N_OPTIONS=3):
     sentences = sent_tokenize(text.strip())
@@ -123,6 +131,34 @@ def rephrase_sentencewise_unique(text, N_OPTIONS=3):
     return "\n".join(results)
 sentencewise_iface = gr.Interface(
     fn=rephrase_sentencewise_unique,
     inputs=gr.Textbox(lines=10, placeholder="Paste text here..."),
@@ -131,7 +167,6 @@ sentencewise_iface = gr.Interface(
     description="Generates top 3 unique paraphrases per sentence. Optimized for HF free-tier.",
 )
 # -----------------------------
 # 🔹 Combine both interfaces into Tabs
 # -----------------------------
@@ -140,4 +175,4 @@ demo = gr.TabbedInterface(
     ["Full Text Rephraser", "Sentence-wise Paraphrases"],
 )
-demo.launch()

 import nltk
 from nltk.tokenize import sent_tokenize, word_tokenize
 import re
+import time
 # -----------------------------
 # Setup
 # -----------------------------
+nltk.data.path.append("./nltk_data")  # Local punkt (no downloading)
 parrot = None  # Lazy-loaded global model
 def get_parrot():
+    """Load the Parrot model lazily"""
     global parrot
     if parrot is None:
         print("⏳ Loading Parrot model for the first time...")
 # -----------------------------
+# Helper functions
 # -----------------------------
 def clean_sentence(sent):
     sent = sent.strip()
     return [" ".join(words[i:i + max_tokens]) for i in range(0, len(words), max_tokens)]
+# -----------------------------
+# 🔹 Retry Wrapper
+# -----------------------------
+def with_retry(func, *args, retries=1, delay=3, **kwargs):
+    """Call ``func(*args, **kwargs)``, retrying when it raises.
+
+    Makes up to ``retries + 1`` attempts (two with the default), sleeping
+    ``delay`` seconds between attempts. Every failure is printed.
+
+    Returns the result of the first attempt that does not raise, or ``None``
+    if every attempt raised. A ``None`` returned by ``func`` itself is passed
+    through unchanged, so callers cannot tell it apart from total failure.
+    """
+    for attempt in range(retries + 1):
+        try:
+            return func(*args, **kwargs)
+        except Exception as e:
+            print(f"⚠️ Attempt {attempt + 1} failed: {e}")
+            # Only wait when another attempt will actually follow.
+            if attempt < retries:
+                print("🔁 Retrying...")
+                time.sleep(delay)
+    # All attempts raised: signal failure with None instead of re-raising.
+    return None
 # -----------------------------
 # 🔹 App 1: Full Paragraph Rephraser
 # -----------------------------
         chunks = split_long_sentence(s)
         paraphrased_chunks = []
         for c in chunks:
+            p = with_retry(
+                model.augment,
+                input_phrase=c,
+                do_diverse=True,
+                adequacy_threshold=0.85,
+                fluency_threshold=0.9,
+            )
+            if p:
+                paraphrased_chunks.append(p[0][0])
+            else:
                 paraphrased_chunks.append(c)
         rephrased.append(" ".join(paraphrased_chunks))
     return clean_sentences(rephrased)
 # -----------------------------
 # 🔹 App 2: Sentence-wise Multiple Paraphrases
 # -----------------------------
 def generate_unique_paraphrases(sentence, N_OPTIONS=3):
+    """Return up to ``N_OPTIONS`` distinct paraphrases of ``sentence``.
+
+    Falls back to ``[sentence]`` when the retried ``model.augment`` call
+    yields nothing (``None`` or an empty result).
+    """
     model = get_parrot()
+    paraphrases = with_retry(
+        model.augment,
+        input_phrase=sentence,
+        do_diverse=True,
+        adequacy_threshold=0.85,
+        fluency_threshold=0.9,
+    )
+    if not paraphrases:
         return [sentence]
+    # NOTE(review): presumably each result is a (text, score) pair, so p[0]
+    # is the paraphrase text; confirm against the Parrot API.
+    texts = [p[0] for p in paraphrases]
+    unique = []
+    for t in texts:
+        # Keep first occurrences only, in the order augment returned them.
+        if t not in unique:
+            unique.append(t)
+        # Stop as soon as the requested number of options is collected.
+        if len(unique) == N_OPTIONS:
+            break
+    return unique
 def rephrase_sentencewise_unique(text, N_OPTIONS=3):
     sentences = sent_tokenize(text.strip())
     return "\n".join(results)
+# -----------------------------
+# 🔹 Warm-up on startup
+# -----------------------------
+def warmup():
+    """Load the Parrot model and run one throwaway paraphrase.
+
+    Intended to prevent a timeout on the first request by triggering the
+    lazy model load ahead of time. Best-effort: any exception is printed
+    and swallowed rather than propagated to the caller.
+    """
+    print("🔥 Warming up Parrot model...")
+    try:
+        model = get_parrot()
+        # The result is discarded; the call only exercises the model once.
+        _ = model.augment(input_phrase="hello world", do_diverse=False)
+        print("✅ Warmup complete.")
+    except Exception as e:
+        print(f"⚠️ Warmup skipped: {e}")
+warmup()
+# -----------------------------
+# 🔹 Gradio Interfaces
+# -----------------------------
+rephrase_iface = gr.Interface(
+    fn=rephrase,
+    inputs=gr.Textbox(lines=10, placeholder="Paste your text here..."),
+    outputs="text",
+    title="Parrot Rephraser (Long Text)",
+    description="Paraphrases long text while maintaining punctuation and capitalization.",
+)
 sentencewise_iface = gr.Interface(
     fn=rephrase_sentencewise_unique,
     inputs=gr.Textbox(lines=10, placeholder="Paste text here..."),
     description="Generates top 3 unique paraphrases per sentence. Optimized for HF free-tier.",
 )
 # -----------------------------
 # 🔹 Combine both interfaces into Tabs
 # -----------------------------
     ["Full Text Rephraser", "Sentence-wise Paraphrases"],
 )
+demo.launch(server_port=7860, server_name="0.0.0.0", show_error=True)