Spaces:

Mustafa-albakkar
/

AnalizerAgent

Sleeping

App Files Files Community

Mustafa-albakkar committed 15 days ago

Commit

d993f05

verified ·

1 Parent(s): 4be75eb

Update app.py

Browse files

Files changed (1) hide show

app.py +90 -60

app.py CHANGED Viewed

@@ -1,5 +1,5 @@
 # ============================================================
-# analyzer_agent_gradio/app.py — Telegram Analyzer Agent (Webhook & Gradio)
 # Mamba + GGUF LLM + python-telegram-bot + Gradio
 # ============================================================
@@ -22,9 +22,10 @@ from transformers import AutoTokenizer, AutoModelForCausalLM
 import telegram
 from telegram.error import TelegramError, BadRequest
 # استيرادات Webhook/Handlers
-from telegram.ext import Application, CommandHandler, MessageHandler, filters, CallbackContext # <<< إضافة هامة للـ Handlers
 from llama_cpp import Llama
 from huggingface_hub import hf_hub_download
 # ---------------- Logging ----------------
@@ -35,26 +36,27 @@ log = logging.getLogger("analyzer")
 # ---------------- Env & config ----------------
 TG_BOT_TOKEN = os.getenv("TG_BOT_TOKEN")
 TG_CHANNEL = os.getenv("TG_CHANNEL")
 LOG_PATH = os.getenv("ANALYZER_LOG", "analyzer_log.json")
 POSTS_LIMIT = int(os.getenv("ANALYZER_LIMIT", "80"))
 MAMBA_MODEL_PATH = os.getenv("MAMBA_MODEL_PATH", "state-spaces/mamba-1.4b-hf")
 # ---------------- Webhook Config ----------------
-# يجب تحديد هذا المتغير في بيئة التشغيل للعمل بوضع Webhook
-# مثال: https://your-domain.com/telegram_webhook_path
 WEBHOOK_URL = os.getenv("WEBHOOK_URL")
-WEBHOOK_PORT = int(os.getenv("WEBHOOK_PORT", "8443")) # المنفذ الذي سيستمع عليه الخادم
 LISTEN_ADDRESS = os.getenv("LISTEN_ADDRESS", "0.0.0.0")
 # ---------------- Initialization Check ----------------
-if not all([TG_BOT_TOKEN, TG_CHANNEL]):
-    log.error("Telegram Bot Token or Channel ID are missing in environment variables.")
     IS_SERVICE_READY = False
-    STATUS_MESSAGE = "❌ النظام غير جاهز: بيانات اعتماد البوت أو معرف القناة مفقودة."
 else:
     IS_SERVICE_READY = True
-    STATUS_MESSAGE = "✅ النظام جاهز للتحليل (Bot API)."
 # ---------------- Helpers for Non-Async Blocking Operations ----------------
 def async_wrap_blocking(func):
@@ -100,7 +102,7 @@ try:
         model_path=LLM_LOCAL_PATH,
         n_ctx=4096,
         n_threads=4,
-        n_gpu_layers=0  # إذا لديك GPU ضع قيمة أكبر
     )
     log.info("GGUF model loaded successfully.")
 except Exception as e:
@@ -109,18 +111,17 @@ except Exception as e:
     STATUS_MESSAGE = "❌ فشل تحميل نموذج GGUF."
-# ---------------- Telegram Bot Client ----------------
-# تعريف البوت
 if IS_SERVICE_READY:
     try:
-        # إنشاء كائن البوت (هذا أصبح يتم عبر Application الآن)
-        bot_client = telegram.Bot(token=TG_BOT_TOKEN)
     except Exception as e:
         log.error(f"Failed to initialize Telegram Bot: {e}")
         IS_SERVICE_READY = False
         STATUS_MESSAGE = "❌ فشل تهيئة كائن البوت."
-else:
-    bot_client = None
 # ---------------- Core Helpers ----------------
 def save_log(entry: Dict[str, Any]):
@@ -190,50 +191,83 @@ def interpret_with_llm(mamba_output: str) -> str:
     return res["choices"][0]["text"].strip()
-# ---------------- Fetch Telegram Stats (Bot API) ----------------
 async def fetch_telegram_stats(limit: int = POSTS_LIMIT) -> List[Dict[str, Any]]:
-    """Fetches general channel statistics from Telegram asynchronously using Bot API."""
-    # نستخدم bot_client لضمان وجود الكائن، أو Context.bot في الـ Handlers
-    if not IS_SERVICE_READY or bot_client is None:
         raise RuntimeError(STATUS_MESSAGE)
-    try:
-        log.info("Attempting to fetch channel info and administrators...")
-        # 1. جلب معلومات القناة الأساسية
-        chat_info = await bot_client.get_chat(chat_id=TG_CHANNEL)
-        # 2. جلب المشرفين
-        admins = await bot_client.get_chat_administrators(chat_id=TG_CHANNEL)
-        admins_count = len(admins)
-        # تحويل البيانات إلى تنسيق موحد للتحليل
-        stats = {
-            "chat_id": chat_info.id,
-            "title": chat_info.title,
-            "members": chat_info.members_count,
-            "admins_count": admins_count,
-            "description": chat_info.description,
-            "date": datetime.utcnow().isoformat(),
-        }
-        log.info(f"Successfully fetched stats for channel {stats['title']} with {stats['members']} members.")
-        return [stats]
-    except BadRequest as e:
-        error_msg = str(e).lower()
-        if 'unauthorized' in error_msg or 'forbidden' in error_msg:
-            log.error("Telegram Auth Error: The Bot Token is invalid or Bot is not a member.")
-            raise RuntimeError("فشل مصادقة Telegram: تأكد من صحة TG_BOT_TOKEN وأن البوت عضو في القناة.")
-        else:
-             log.error(f"Telegram Bot API Error: {e}")
-             raise RuntimeError(f"قناة Telegram غير صالحة: {TG_CHANNEL}. التفاصيل: {e}.")
-    except TelegramError as e:
-        log.error(f"An unexpected Telegram error occurred: {e}")
-        raise RuntimeError(f"خطأ غير متوقع في Telegram: {e}")
-    except Exception as e:
-        log.error(f"An unexpected error occurred during Telegram fetch: {e}")
-        raise RuntimeError(f"خطأ غير متوقع في جلب البيانات: {e}")
 # ---------------- Main Analysis Pipeline ----------------
@@ -362,7 +396,6 @@ def daily_job_wrapper():
     """Synchronous wrapper to run the async job in the scheduler."""
     log.info("Running scheduled analysis job via Gradio wrapper...")
     try:
-        # تشغيل الدالة async في حلقة الحدث الخاصة بها
         result = asyncio.run(run_analysis_pipeline())
         log.info(f"Scheduled job completed. Status: {result.get('status')}")
     except Exception as e:
@@ -376,6 +409,7 @@ with gr.Blocks(title="Telegram Channel Analyzer Agent") as demo:
     gr.Markdown("# 🤖 وكيل تحليل قناة Telegram (Webhook/Scheduled)")
     gr.Markdown(f"**حالة الخدمة:** {STATUS_MESSAGE}")
     gr.Markdown(f"**القناة المستهدفة:** `{TG_CHANNEL}`")
     gr.Markdown("---")
     with gr.Tab("تشغيل التحليل يدوياً"):
@@ -448,19 +482,15 @@ if __name__ == "__main__":
         # وضع Webhook
         log.info(f"Setting Webhook URL to: {WEBHOOK_URL}")
         try:
-            # يجب تعيين الـ URL بالكامل لـ Telegram
             application.bot.set_webhook(url=WEBHOOK_URL)
             log.info(f"Starting Webhook server on {LISTEN_ADDRESS}:{WEBHOOK_PORT}...")
-            # المسار الذي سيستمع عليه الخادم (يجب أن يتطابق مع الجزء الأخير من WEBHOOK_URL)
             url_path = WEBHOOK_URL.split('/')[-1] if WEBHOOK_URL.count('/') > 2 else ""
-            # تشغيل خادم Webhook
             application.run_webhook(
                 listen=LISTEN_ADDRESS,
                 port=WEBHOOK_PORT,
                 url_path=url_path,
-                # Note: يجب استخدام HTTPS وشهادة SSL/TLS في بيئة الإنتاج
             )
         except Exception as e:
             log.error(f"Failed to start Webhook: {e}")

 # ============================================================
+# analyzer_agent_gradio/app.py — Telegram Analyzer Agent (Via Replit Proxy)
 # Mamba + GGUF LLM + python-telegram-bot + Gradio
 # ============================================================
 import telegram
 from telegram.error import TelegramError, BadRequest
 # استيرادات Webhook/Handlers
+from telegram.ext import Application, CommandHandler, MessageHandler, filters, CallbackContext
 from llama_cpp import Llama
 from huggingface_hub import hf_hub_download
+import requests # <<< إضافة هامة للاتصال بالجسر
 # ---------------- Logging ----------------
 # ---------------- Env & config ----------------
 TG_BOT_TOKEN = os.getenv("TG_BOT_TOKEN")
 TG_CHANNEL = os.getenv("TG_CHANNEL")
+# المتغير الجديد: رابط تطبيق الجسر على Replit
+REPLIT_PROXY_URL = os.getenv("REPLIT_PROXY_URL")
 LOG_PATH = os.getenv("ANALYZER_LOG", "analyzer_log.json")
 POSTS_LIMIT = int(os.getenv("ANALYZER_LIMIT", "80"))
 MAMBA_MODEL_PATH = os.getenv("MAMBA_MODEL_PATH", "state-spaces/mamba-1.4b-hf")
 # ---------------- Webhook Config ----------------
 WEBHOOK_URL = os.getenv("WEBHOOK_URL")
+WEBHOOK_PORT = int(os.getenv("WEBHOOK_PORT", "8443"))
 LISTEN_ADDRESS = os.getenv("LISTEN_ADDRESS", "0.0.0.0")
 # ---------------- Initialization Check ----------------
+if not all([TG_BOT_TOKEN, TG_CHANNEL, REPLIT_PROXY_URL]): # <<< تعديل التحقق
+    log.error("Telegram Bot Token, Channel ID, or Replit Proxy URL are missing in environment variables.")
     IS_SERVICE_READY = False
+    STATUS_MESSAGE = "❌ النظام غير جاهز: بيانات اعتماد البوت، معرف القناة، أو رابط الجسر مفقودة."
 else:
     IS_SERVICE_READY = True
+    STATUS_MESSAGE = "✅ النظام جاهز للتحليل (Bot API via Replit Proxy)."
 # ---------------- Helpers for Non-Async Blocking Operations ----------------
 def async_wrap_blocking(func):
         model_path=LLM_LOCAL_PATH,
         n_ctx=4096,
         n_threads=4,
+        n_gpu_layers=0
     )
     log.info("GGUF model loaded successfully.")
 except Exception as e:
     STATUS_MESSAGE = "❌ فشل تحميل نموذج GGUF."
+# ---------------- Telegram Bot Client (for Webhook handlers) ----------------
+# لا يزال هذا الكائن ضرورياً لـ python-telegram-bot لاستقبال الأوامر والرد
 if IS_SERVICE_READY:
     try:
+        # لا نحتاج لـ bot_client لكن نحتاج للتحقق من التوكن لـ Application.builder
+        pass
     except Exception as e:
         log.error(f"Failed to initialize Telegram Bot: {e}")
         IS_SERVICE_READY = False
         STATUS_MESSAGE = "❌ فشل تهيئة كائن البوت."
 # ---------------- Core Helpers ----------------
 def save_log(entry: Dict[str, Any]):
     return res["choices"][0]["text"].strip()
+# ---------------- FETCH TELEGRAM STATS (VIA REPLIT PROXY) ----------------
 async def fetch_telegram_stats(limit: int = POSTS_LIMIT) -> List[Dict[str, Any]]:
     """
     Fetch general channel statistics by routing Bot API calls through the Replit proxy.

     Three Bot API methods are requested via ``{REPLIT_PROXY_URL}/route_telegram/<method>``:
     ``getChat`` (id, title, description), ``getChatAdministrators`` (admin count)
     and ``getChatMemberCount`` (member count). The member count is best-effort:
     if that call fails, ``members`` falls back to ``'N/A'``.

     Args:
         limit: Currently unused by this function; kept so existing callers
             that pass it keep working.

     Returns:
         A single-element list holding a dict with the keys ``chat_id``,
         ``title``, ``members``, ``admins_count``, ``description`` and ``date``
         (naive UTC timestamp in ISO format).

     Raises:
         RuntimeError: If the service is not ready / the proxy URL is not set,
             or if the ``getChat`` / ``getChatAdministrators`` request fails.
     """
     if not IS_SERVICE_READY or not REPLIT_PROXY_URL:
         raise RuntimeError(STATUS_MESSAGE)

     # Tolerate a trailing slash in the configured URL so we never build "//route_telegram".
     proxy_base = REPLIT_PROXY_URL.rstrip("/")

     async def fetch_via_proxy(method: str, data: Optional[Dict[str, Any]] = None) -> Any:
         """Send one Bot API call to the proxy and return the ``result`` field of the reply."""
         url = f"{proxy_base}/route_telegram/{method}"
         try:
             # requests is blocking, so run it in a worker thread to keep the event loop free.
             response = await asyncio.to_thread(
                 requests.post,
                 url,
                 json=data if data is not None else {},
                 timeout=30
             )
             response.raise_for_status()
             json_response = response.json()
             if not json_response.get('ok'):
                 # Surface a negative Telegram reply through the same HTTPError path as a bad status.
                 error_description = json_response.get('description', 'Unknown API Error')
                 raise requests.exceptions.HTTPError(
                     f"Telegram API Error via Proxy: {error_description}",
                     response=response
                 )
             return json_response['result']
         except requests.exceptions.HTTPError as e:
             error_details = str(e)
             log.error(f"Proxy/Telegram HTTP Error during {method}: {error_details}")
             try:
                 error_msg = str(e.response.json().get("description", error_details))
             except (ValueError, AttributeError):
                 # Body is not JSON, is not a JSON object, or there is no response attached.
                 error_msg = error_details
             lowered = error_msg.lower()
             if 'unauthorized' in lowered or 'forbidden' in lowered:
                 raise RuntimeError(f"فشل مصادقة Telegram (عبر الجسر): {error_msg}. تأكد من صحة TG_BOT_TOKEN في الجسر.") from e
             raise RuntimeError(f"خطأ في جلب البيانات عبر الجسر ({method}): {error_msg}.") from e
         except Exception as e:
             log.error(f"An unexpected error occurred during proxy fetch: {e}")
             raise RuntimeError(f"خطأ غير متوقع في الاتصال بالجسر: {e}.") from e

     # --- 1. Basic channel information (getChat) ---
     chat_info_data = await fetch_via_proxy(
         "getChat",
         data={"chat_id": TG_CHANNEL}
     )

     # --- 2. Administrators (getChatAdministrators) ---
     admins_list = await fetch_via_proxy(
         "getChatAdministrators",
         data={"chat_id": TG_CHANNEL}
     )
     admins_count = len(admins_list)

     # --- 3. Member count (getChatMemberCount) ---
     # The getChat result has no documented member-count field, so reading
     # 'members_count' from it always produced 'N/A'. Ask for the count explicitly,
     # but do not fail the whole fetch if the proxy cannot serve this method.
     try:
         members = await fetch_via_proxy(
             "getChatMemberCount",
             data={"chat_id": TG_CHANNEL}
         )
     except RuntimeError as e:
         log.warning(f"Could not fetch member count via proxy: {e}")
         members = chat_info_data.get('members_count', 'N/A')

     # Normalise everything into the flat record shape used by the analysis step.
     stats = {
         "chat_id": chat_info_data.get('id'),
         "title": chat_info_data.get('title'),
         "members": members,
         "admins_count": admins_count,
         "description": chat_info_data.get('description'),
         "date": datetime.utcnow().isoformat(),
     }
     log.info(f"Successfully fetched stats (via proxy) for channel {stats['title']} with {stats['members']} members.")
     return [stats]
 # ---------------- Main Analysis Pipeline ----------------
     """Synchronous wrapper to run the async job in the scheduler."""
     log.info("Running scheduled analysis job via Gradio wrapper...")
     try:
         result = asyncio.run(run_analysis_pipeline())
         log.info(f"Scheduled job completed. Status: {result.get('status')}")
     except Exception as e:
     gr.Markdown("# 🤖 وكيل تحليل قناة Telegram (Webhook/Scheduled)")
     gr.Markdown(f"**حالة الخدمة:** {STATUS_MESSAGE}")
     gr.Markdown(f"**القناة المستهدفة:** `{TG_CHANNEL}`")
+    gr.Markdown(f"**جسر Replit:** `{REPLIT_PROXY_URL}`")
     gr.Markdown("---")
     with gr.Tab("تشغيل التحليل يدوياً"):
         # Webhook mode
         log.info(f"Setting Webhook URL to: {WEBHOOK_URL}")
         try:
             # NOTE: Bot.set_webhook is a coroutine in python-telegram-bot v20+ (the version
             # implied by the Application/filters imports); calling it without await never
             # registers anything. Passing webhook_url to run_webhook lets the library
             # register the public URL itself during start-up.
             log.info(f"Starting Webhook server on {LISTEN_ADDRESS}:{WEBHOOK_PORT}...")
             # Local path the server listens on: the last path segment of WEBHOOK_URL,
             # or the root when the URL has no path component.
             url_path = WEBHOOK_URL.split('/')[-1] if WEBHOOK_URL.count('/') > 2 else ""
             application.run_webhook(
                 listen=LISTEN_ADDRESS,
                 port=WEBHOOK_PORT,
                 url_path=url_path,
                 webhook_url=WEBHOOK_URL,
             )
         except Exception as e:
             log.error(f"Failed to start Webhook: {e}")