Spaces:

infinityonline
/

dz

Running

App Files Community

infinityonline committed on 2 days ago

Commit

86a6197

verified ·

1 Parent(s): c73fb17

Update main.py

Browse files

Files changed (1) hide show

main.py +31 -20

main.py CHANGED Viewed

@@ -6,8 +6,9 @@ import asyncio
 import threading
 import json
 import re
 from fastapi import FastAPI, Request
-from fastapi.responses import JSONResponse
 # ====================================================================
 # Configuration
@@ -15,7 +16,7 @@ from fastapi.responses import JSONResponse
 API_SECRET_KEY = os.getenv("API_SECRET_KEY", "change-me-secret")
 POOL_SIZE      = int(os.getenv("POOL_SIZE", "5"))
 MAX_REQUESTS   = int(os.getenv("MAX_REQUESTS", "30"))
-QUEUE_TIMEOUT  = int(os.getenv("QUEUE_TIMEOUT", "300"))  # ثواني انتظار Queue
 DUCK_MODELS = {
     "gpt-5-mini":       "GPT-5 mini",
@@ -136,10 +137,8 @@ class BrowserWorker:
                 self.busy = False
     async def _do_chat(self, model_label: str, prompt: str) -> str:
-        # تأخير عشوائي لتبدو الطلبات طبيعية
         await asyncio.sleep(random.uniform(0.5, 2.0))
-        # تجديد context دورياً
         self._request_count += 1
         self._total_count   += 1
         if self._request_count >= MAX_REQUESTS:
@@ -324,7 +323,7 @@ class BrowserPool:
         self._thread         = threading.Thread(target=self._run, daemon=True)
         self._queue: asyncio.Queue | None = None
         self._total_requests = 0
-        self._rejected       = 0   # عدد الطلبات المرفوضة بسبب timeout
     def start(self):
         self._thread.start()
@@ -350,8 +349,6 @@ class BrowserPool:
     async def _process(self, model_label: str, prompt: str) -> str:
         self._total_requests += 1
-        # انتظر worker حر — بحد أقصى QUEUE_TIMEOUT ثانية
         try:
             worker: BrowserWorker = await asyncio.wait_for(
                 self._queue.get(), timeout=QUEUE_TIMEOUT
@@ -365,8 +362,7 @@ class BrowserPool:
                 f"Please retry in a moment. (rejected total: {self._rejected})"
             )
-        print(f"[POOL] Assigned W{worker.id} "
-              f"(total req: {self._total_requests}) ✓")
         try:
             return await worker.chat(model_label, prompt)
         finally:
@@ -598,27 +594,42 @@ async def health():
     busy  = sum(1 for w in pool.workers if w.busy)
     stats = [
         {
-            "id":                    w.id,
-            "busy":                  w.busy,
-            "total_requests":        w._total_count,
             "requests_until_rotation": MAX_REQUESTS - w._request_count,
         }
         for w in pool.workers
     ]
     return {
-        "status":           "running",
-        "message":          "Duck.ai API Pool Server is active!",
-        "models":           ALL_MODELS,
-        "pool_size":        POOL_SIZE,
-        "workers_busy":     busy,
-        "workers_free":     POOL_SIZE - busy,
-        "total_requests":   pool._total_requests,
         "rejected_requests": pool._rejected,
         "queue_timeout_sec": QUEUE_TIMEOUT,
-        "workers":          stats,
     }
 if __name__ == "__main__":
     import uvicorn
     uvicorn.run(app, host="0.0.0.0", port=7860)

 import threading
 import json
 import re
+import psutil
 from fastapi import FastAPI, Request
+from fastapi.responses import JSONResponse, HTMLResponse
 # ====================================================================
 # Configuration
 API_SECRET_KEY = os.getenv("API_SECRET_KEY", "change-me-secret")
 POOL_SIZE      = int(os.getenv("POOL_SIZE", "5"))
 MAX_REQUESTS   = int(os.getenv("MAX_REQUESTS", "30"))
+QUEUE_TIMEOUT  = int(os.getenv("QUEUE_TIMEOUT", "300"))
 DUCK_MODELS = {
     "gpt-5-mini":       "GPT-5 mini",
                 self.busy = False
     async def _do_chat(self, model_label: str, prompt: str) -> str:
         await asyncio.sleep(random.uniform(0.5, 2.0))
         self._request_count += 1
         self._total_count   += 1
         if self._request_count >= MAX_REQUESTS:
         self._thread         = threading.Thread(target=self._run, daemon=True)
         self._queue: asyncio.Queue | None = None
         self._total_requests = 0
+        self._rejected       = 0
     def start(self):
         self._thread.start()
     async def _process(self, model_label: str, prompt: str) -> str:
         self._total_requests += 1
         try:
             worker: BrowserWorker = await asyncio.wait_for(
                 self._queue.get(), timeout=QUEUE_TIMEOUT
                 f"Please retry in a moment. (rejected total: {self._rejected})"
             )
+        print(f"[POOL] Assigned W{worker.id} (total req: {self._total_requests}) ✓")
         try:
             return await worker.chat(model_label, prompt)
         finally:
     busy  = sum(1 for w in pool.workers if w.busy)
     stats = [
         {
+            "id":                      w.id,
+            "busy":                    w.busy,
+            "total_requests":          w._total_count,
             "requests_until_rotation": MAX_REQUESTS - w._request_count,
         }
         for w in pool.workers
     ]
+    mem = psutil.virtual_memory()
     return {
+        "status":            "running",
+        "message":           "Duck.ai API Pool Server is active!",
+        "models":            ALL_MODELS,
+        "pool_size":         POOL_SIZE,
+        "workers_busy":      busy,
+        "workers_free":      POOL_SIZE - busy,
+        "total_requests":    pool._total_requests,
         "rejected_requests": pool._rejected,
         "queue_timeout_sec": QUEUE_TIMEOUT,
+        "workers":           stats,
+        "ram": {
+            "used_gb":  round(mem.used  / 1024**3, 2),
+            "total_gb": round(mem.total / 1024**3, 2),
+            "percent":  mem.percent,
+        },
+        "cpu": psutil.cpu_percent(interval=None),
     }
+@app.get("/dashboard", response_class=HTMLResponse)
+async def dashboard(request: Request):
+    if not _auth(request):
+        return HTMLResponse("<h1>401 Unauthorized</h1>", status_code=401)
+    with open("dashboard.html", "r", encoding="utf-8") as f:
+        return HTMLResponse(f.read())
 if __name__ == "__main__":
     import uvicorn
     uvicorn.run(app, host="0.0.0.0", port=7860)