Elysiadev11 commited on
Commit
503d0e3
·
verified ·
1 Parent(s): 6d91b7c

Upload proxy_cf.py

Browse files
Files changed (1) hide show
  1. proxy_cf.py +563 -0
proxy_cf.py ADDED
@@ -0,0 +1,563 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
import os
import json
import time
import uuid
import asyncio
import httpx

from fastapi import FastAPI, Request
from fastapi.responses import JSONResponse, Response, StreamingResponse
from starlette.requests import ClientDisconnect

app = FastAPI()

# =====================================================
# CONFIG
# =====================================================
# Shared bearer token every client must present (see auth_ok); defaults to "olla".
MASTER_API_KEY = os.getenv("MASTER_API_KEY", "olla")

# Default CF Workers AI model (can override via request body)
DEFAULT_CF_MODEL = os.getenv("DEFAULT_CF_MODEL", "@cf/meta/llama-3.3-70b-instruct-fp8-fast")

# =====================================================
# LOAD CF CREDENTIALS
# Format env: CF_1=account_id,api_key
# =====================================================
CF_ACCOUNTS = []  # list of {"account_id": ..., "api_key": ...}

# Scan CF_1 .. CF_100; missing slots are skipped, so numbering need not be contiguous.
for i in range(1, 101):
    raw = os.getenv(f"CF_{i}")
    if not raw:
        continue
    # Split on the first comma only, so API keys containing commas survive intact.
    parts = raw.split(",", 1)
    if len(parts) != 2:
        print(f"[WARN] CF_{i} format invalid, expected 'account_id,api_key' — skipped")
        continue
    account_id, api_key = parts[0].strip(), parts[1].strip()
    if account_id and api_key:
        CF_ACCOUNTS.append({"account_id": account_id, "api_key": api_key})

if not CF_ACCOUNTS:
    # Keep the app bootable with a placeholder; upstream calls will fail until real creds exist.
    print("[WARN] No CF credentials found, inserting dummy")
    CF_ACCOUNTS.append({"account_id": "dummy", "api_key": "dummy"})

# =====================================================
# KEY STATUS
# =====================================================
# Per-account health/usage bookkeeping, keyed by account_id.
# NOTE(review): duplicate account_ids across CF_* entries would collide in this
# dict and confuse the busy/fail accounting — confirm ids are unique.
key_status = {}
for idx, acc in enumerate(CF_ACCOUNTS, 1):
    kid = acc["account_id"]
    key_status[kid] = {
        "index": idx,      # 1-based position in CF_ACCOUNTS
        "healthy": True,   # never set to False anywhere in this file
        "busy": False,     # held while an in-flight request uses this account
        "success": 0,
        "fail": 0,
    }

rr_index = 0                 # round-robin cursor into CF_ACCOUNTS
_key_lock = asyncio.Lock()   # guards rr_index and all key_status mutations
60
+
61
+
62
+ # =====================================================
63
+ # HELPERS
64
+ # =====================================================
65
def log(x):
    """Print *x* prefixed with an HH:MM:SS timestamp, flushing immediately."""
    stamp = time.strftime('%H:%M:%S')
    print(f"[{stamp}] {x}", flush=True)
67
+
68
+
69
def sse(obj):
    """Serialize *obj* as a single server-sent-events data frame."""
    payload = json.dumps(obj, ensure_ascii=False)
    return f"data: {payload}\n\n"
71
+
72
+
73
def auth_ok(req: Request):
    """Return True when the request's bearer token matches MASTER_API_KEY."""
    header = req.headers.get("Authorization", "")
    token = header.replace("Bearer ", "")
    return token == MASTER_API_KEY
76
+
77
+
78
# Template for Cloudflare's OpenAI-compatible Workers AI base URL, per account.
CF_AI_BASE = "https://api.cloudflare.com/client/v4/accounts/{account_id}/ai/v1"


def cf_base(account_id: str) -> str:
    """Return the OpenAI-compatible Workers AI base URL for *account_id*."""
    return CF_AI_BASE.format(account_id=account_id)
82
+
83
def cf_url(account_id: str, model: str) -> str:
    """Build the legacy /ai/run URL for *model* (kept for fallback)."""
    prefix = f"https://api.cloudflare.com/client/v4/accounts/{account_id}/ai/run/"
    return prefix + model
86
+
87
+
88
async def get_key(exclude=None):
    """Pick the next free, healthy account round-robin and mark it busy.

    Accounts whose ids appear in *exclude* are skipped. Returns the account
    dict ({"account_id": ..., "api_key": ...}) or None when nothing is free.
    """
    global rr_index
    skip = exclude if exclude is not None else set()

    async with _key_lock:
        # At most one full sweep over the account list per call.
        for _ in range(len(CF_ACCOUNTS)):
            rr_index = (rr_index + 1) % len(CF_ACCOUNTS)
            candidate = CF_ACCOUNTS[rr_index]
            state = key_status[candidate["account_id"]]
            if not state["healthy"] or state["busy"]:
                continue
            if candidate["account_id"] in skip:
                continue
            state["busy"] = True
            return candidate

    return None
105
+
106
+
107
async def release_key(acc):
    """Clear the busy flag on *acc* so it can be handed out again."""
    async with _key_lock:
        state = key_status.get(acc["account_id"])
        if state is not None:
            state["busy"] = False
112
+
113
+
114
async def mark_fail(acc):
    """Record one more consecutive failure for *acc*."""
    async with _key_lock:
        state = key_status.get(acc["account_id"])
        if state is not None:
            state["fail"] += 1
119
+
120
+
121
async def mark_ok(acc):
    """Record a success for *acc* and reset its consecutive-failure count."""
    async with _key_lock:
        state = key_status.get(acc["account_id"])
        if state is not None:
            state["success"] += 1
            state["fail"] = 0
127
+
128
+
129
async def wait_for_free_key(exclude=None, max_wait=30.0, interval=0.3):
    """Poll get_key() until an account frees up or *max_wait* seconds elapse.

    Fix: the previous version accumulated only the sleep intervals, so time
    spent awaiting the key lock inside get_key() was never counted and the
    real wall-clock wait could overshoot max_wait. A monotonic deadline now
    bounds the total time.

    Returns the acquired account dict, or None on timeout.
    """
    deadline = time.monotonic() + max_wait
    while True:
        acc = await get_key(exclude)
        if acc:
            return acc
        if time.monotonic() >= deadline:
            return None
        await asyncio.sleep(interval)
138
+
139
+
140
def is_rate_limited(status_code: int, text: str) -> bool:
    """Heuristic: does this status code / body indicate a CF rate limit?"""
    if status_code == 429:
        return True
    lowered = text.lower()
    markers = ("rate limit", "too many requests", "usage limit")
    return any(marker in lowered for marker in markers)
143
+
144
+
145
+ # =====================================================
146
+ # ROOT
147
+ # =====================================================
148
+ @app.get("/")
149
+ async def root():
150
+ async with _key_lock:
151
+ safe = {}
152
+ for kid, v in key_status.items():
153
+ masked = kid[:6] + "****" + kid[-4:]
154
+ safe[masked] = {
155
+ "index": v["index"],
156
+ "healthy": v["healthy"],
157
+ "busy": v["busy"],
158
+ "success": v["success"],
159
+ "fail": v["fail"],
160
+ }
161
+
162
+ return {
163
+ "status": "ok",
164
+ "accounts": len(CF_ACCOUNTS),
165
+ "default_model": DEFAULT_CF_MODEL,
166
+ "detail": safe
167
+ }
168
+
169
+
170
+ # =====================================================
171
+ # /v1/models — live proxy langsung ke CF
172
+ # =====================================================
173
+ @app.get("/v1/models")
174
+ async def models(req: Request):
175
+ if not auth_ok(req):
176
+ return JSONResponse({"error": "Unauthorized"}, status_code=401)
177
+
178
+ # Pakai account pertama yang healthy, tidak perlu mark busy
179
+ acc = None
180
+ async with _key_lock:
181
+ for a in CF_ACCOUNTS:
182
+ if key_status[a["account_id"]]["healthy"]:
183
+ acc = a
184
+ break
185
+
186
+ if not acc:
187
+ return JSONResponse({"error": "No healthy accounts"}, status_code=503)
188
+
189
+ try:
190
+ async with httpx.AsyncClient(timeout=30) as client:
191
+ r = await client.get(
192
+ f"{cf_base(acc['account_id'])}/models",
193
+ headers={"Authorization": f"Bearer {acc['api_key']}"}
194
+ )
195
+
196
+ if r.status_code != 200:
197
+ return JSONResponse({"error": f"CF returned {r.status_code}: {r.text}"}, status_code=r.status_code)
198
+
199
+ # CF sudah return OpenAI-compatible format, langsung forward
200
+ return Response(content=r.content, media_type="application/json")
201
+
202
+ except Exception as e:
203
+ log(f"[/v1/models] exception: {e}")
204
+ return JSONResponse({"error": str(e)}, status_code=500)
205
+
206
+
207
+ # =====================================================
208
+ # /v1/chat/completions — OpenAI-compatible endpoint
209
+ # =====================================================
210
+ @app.post("/v1/chat/completions")
211
+ async def chat(req: Request):
212
+ if not auth_ok(req):
213
+ return JSONResponse({"error": "Unauthorized"}, status_code=401)
214
+
215
+ try:
216
+ body = await req.json()
217
+ except Exception:
218
+ return JSONResponse({"error": "Bad JSON"}, status_code=400)
219
+
220
+ is_stream = body.get("stream", False)
221
+ model = body.get("model", DEFAULT_CF_MODEL)
222
+
223
+ # Pass body as-is ke CF — CF OpenAI-compatible endpoint terima format sama persis
224
+ cf_body = {**body, "model": model}
225
+
226
+ # -----------------------------------------
227
+ # NON STREAM — forward response langsung
228
+ # -----------------------------------------
229
+ if not is_stream:
230
+ tried = set()
231
+
232
+ for _ in range(len(CF_ACCOUNTS)):
233
+ acc = await wait_for_free_key(exclude=tried)
234
+ if not acc:
235
+ break
236
+
237
+ tried.add(acc["account_id"])
238
+
239
+ try:
240
+ async with httpx.AsyncClient(timeout=180) as client:
241
+ r = await client.post(
242
+ f"{cf_base(acc['account_id'])}/chat/completions",
243
+ json=cf_body,
244
+ headers={
245
+ "Authorization": f"Bearer {acc['api_key']}",
246
+ "Content-Type": "application/json",
247
+ }
248
+ )
249
+
250
+ if is_rate_limited(r.status_code, r.text):
251
+ log(f"Account {acc['account_id'][:8]}... rate limited (non-stream), trying next")
252
+ await mark_fail(acc)
253
+ continue
254
+
255
+ if r.status_code != 200:
256
+ log(f"Account {acc['account_id'][:8]}... HTTP {r.status_code}, trying next")
257
+ await mark_fail(acc)
258
+ continue
259
+
260
+ await mark_ok(acc)
261
+ # CF OpenAI-compatible → langsung forward, tidak perlu konversi
262
+ return Response(content=r.content, media_type="application/json")
263
+
264
+ except Exception as e:
265
+ log(f"Account {acc['account_id'][:8]}... exception: {e}")
266
+ await mark_fail(acc)
267
+
268
+ finally:
269
+ await release_key(acc)
270
+
271
+ return JSONResponse({"error": "All accounts failed"}, status_code=500)
272
+
273
+ # -----------------------------------------
274
+ # STREAM — CF kirim SSE OpenAI-format, langsung pipe ke client
275
+ # -----------------------------------------
276
+ async def gen():
277
+ tried = set()
278
+
279
+ for _ in range(len(CF_ACCOUNTS)):
280
+ acc = await wait_for_free_key(exclude=tried)
281
+ if not acc:
282
+ break
283
+
284
+ tried.add(acc["account_id"])
285
+
286
+ try:
287
+ async with httpx.AsyncClient(timeout=None) as client:
288
+ async with client.stream(
289
+ "POST",
290
+ f"{cf_base(acc['account_id'])}/chat/completions",
291
+ json=cf_body,
292
+ headers={
293
+ "Authorization": f"Bearer {acc['api_key']}",
294
+ "Content-Type": "application/json",
295
+ }
296
+ ) as r:
297
+
298
+ if is_rate_limited(r.status_code, ""):
299
+ log(f"Account {acc['account_id'][:8]}... rate limited (stream), trying next")
300
+ await mark_fail(acc)
301
+ continue
302
+
303
+ if r.status_code != 200:
304
+ log(f"Account {acc['account_id'][:8]}... HTTP {r.status_code} (stream), trying next")
305
+ await mark_fail(acc)
306
+ continue
307
+
308
+ hit_limit = False
309
+
310
+ async for line in r.aiter_lines():
311
+ if not line:
312
+ continue
313
+
314
+ if line.strip() == "data: [DONE]":
315
+ break
316
+
317
+ # Detect mid-stream rate limit dalam payload
318
+ raw = line[6:] if line.startswith("data: ") else line
319
+ if is_rate_limited(0, raw):
320
+ log(f"Account {acc['account_id'][:8]}... mid-stream limit, switching key")
321
+ hit_limit = True
322
+ break
323
+
324
+ # CF OpenAI-compatible SSE → pipe langsung ke client
325
+ yield line + "\n\n"
326
+
327
+ if hit_limit:
328
+ await mark_fail(acc)
329
+ continue
330
+
331
+ yield "data: [DONE]\n\n"
332
+ await mark_ok(acc)
333
+ return
334
+
335
+ except Exception as e:
336
+ log(f"Account {acc['account_id'][:8]}... stream exception: {e}")
337
+ await mark_fail(acc)
338
+
339
+ finally:
340
+ await release_key(acc)
341
+
342
+ yield sse({"error": "All accounts failed"})
343
+ yield "data: [DONE]\n\n"
344
+
345
+ return StreamingResponse(gen(), media_type="text/event-stream")
346
+
347
+
348
+ # =====================================================
349
+ # /v1/messages — Anthropic-compatible endpoint
350
+ # Konversi Anthropic format → CF OpenAI-compatible
351
+ # =====================================================
352
+ @app.post("/v1/messages")
353
+ async def anthropic(req: Request):
354
+ if not auth_ok(req):
355
+ return JSONResponse({"error": "Unauthorized"}, status_code=401)
356
+
357
+ try:
358
+ body = await req.json()
359
+ except ClientDisconnect:
360
+ return Response(status_code=499)
361
+ except Exception:
362
+ return JSONResponse({"error": "Bad JSON"}, status_code=400)
363
+
364
+ stream = body.get("stream", False)
365
+ model = body.get("model", DEFAULT_CF_MODEL)
366
+ max_tokens = body.get("max_tokens", 2048)
367
+
368
+ # Konversi Anthropic messages → OpenAI format
369
+ messages = []
370
+
371
+ if body.get("system"):
372
+ messages.append({"role": "system", "content": body["system"]})
373
+
374
+ for m in body.get("messages", []):
375
+ content = m.get("content", "")
376
+ if isinstance(content, list):
377
+ txt = "".join(x.get("text", "") for x in content if x.get("type") == "text")
378
+ content = txt
379
+ messages.append({"role": m["role"], "content": content})
380
+
381
+ cf_body = {
382
+ "model": model,
383
+ "messages": messages,
384
+ "max_tokens": max_tokens,
385
+ "stream": stream,
386
+ }
387
+
388
+ # -----------------------------------------
389
+ # NON STREAM
390
+ # -----------------------------------------
391
+ if not stream:
392
+ tried = set()
393
+
394
+ for _ in range(len(CF_ACCOUNTS)):
395
+ acc = await wait_for_free_key(exclude=tried)
396
+ if not acc:
397
+ break
398
+
399
+ tried.add(acc["account_id"])
400
+
401
+ try:
402
+ async with httpx.AsyncClient(timeout=180) as client:
403
+ r = await client.post(
404
+ f"{cf_base(acc['account_id'])}/chat/completions",
405
+ json=cf_body,
406
+ headers={
407
+ "Authorization": f"Bearer {acc['api_key']}",
408
+ "Content-Type": "application/json",
409
+ }
410
+ )
411
+
412
+ if is_rate_limited(r.status_code, r.text):
413
+ log(f"Account {acc['account_id'][:8]}... rate limited (anthropic non-stream), trying next")
414
+ await mark_fail(acc)
415
+ continue
416
+
417
+ if r.status_code != 200:
418
+ log(f"Account {acc['account_id'][:8]}... HTTP {r.status_code}, trying next")
419
+ await mark_fail(acc)
420
+ continue
421
+
422
+ data = r.json()
423
+ # CF OpenAI-compatible response → konversi ke Anthropic format
424
+ content_text = data["choices"][0]["message"]["content"]
425
+ usage = data.get("usage", {})
426
+
427
+ out = {
428
+ "id": "msg_" + uuid.uuid4().hex[:10],
429
+ "type": "message",
430
+ "role": "assistant",
431
+ "model": model,
432
+ "content": [{"type": "text", "text": content_text}],
433
+ "stop_reason": "end_turn",
434
+ "stop_sequence": None,
435
+ "usage": {
436
+ "input_tokens": usage.get("prompt_tokens", 0),
437
+ "output_tokens": usage.get("completion_tokens", 0),
438
+ }
439
+ }
440
+
441
+ await mark_ok(acc)
442
+ return JSONResponse(out)
443
+
444
+ except Exception as e:
445
+ log(f"Account {acc['account_id'][:8]}... exception: {e}")
446
+ await mark_fail(acc)
447
+
448
+ finally:
449
+ await release_key(acc)
450
+
451
+ return JSONResponse({"error": "All accounts failed"}, status_code=500)
452
+
453
+ # -----------------------------------------
454
+ # STREAM — CF kirim OpenAI SSE, kita konversi ke Anthropic SSE
455
+ # -----------------------------------------
456
+ async def agen():
457
+ tried = set()
458
+ msg_id = "msg_" + uuid.uuid4().hex[:10]
459
+ sent_any_delta = False
460
+
461
+ for _ in range(len(CF_ACCOUNTS)):
462
+ acc = await wait_for_free_key(exclude=tried)
463
+ if not acc:
464
+ break
465
+
466
+ tried.add(acc["account_id"])
467
+
468
+ try:
469
+ async with httpx.AsyncClient(timeout=None) as client:
470
+ async with client.stream(
471
+ "POST",
472
+ f"{cf_base(acc['account_id'])}/chat/completions",
473
+ json=cf_body,
474
+ headers={
475
+ "Authorization": f"Bearer {acc['api_key']}",
476
+ "Content-Type": "application/json",
477
+ }
478
+ ) as r:
479
+
480
+ if is_rate_limited(r.status_code, ""):
481
+ log(f"Account {acc['account_id'][:8]}... rate limited (anthropic stream), trying next")
482
+ await mark_fail(acc)
483
+ continue
484
+
485
+ if r.status_code != 200:
486
+ log(f"Account {acc['account_id'][:8]}... HTTP {r.status_code} (anthropic stream), trying next")
487
+ await mark_fail(acc)
488
+ continue
489
+
490
+ # Emit Anthropic envelope sekali saja saat key pertama berhasil
491
+ if not sent_any_delta:
492
+ yield sse({
493
+ "type": "message_start",
494
+ "message": {
495
+ "id": msg_id,
496
+ "type": "message",
497
+ "role": "assistant",
498
+ "model": model,
499
+ "content": [],
500
+ "stop_reason": None,
501
+ "stop_sequence": None,
502
+ "usage": {"input_tokens": 0, "output_tokens": 0}
503
+ }
504
+ })
505
+ yield sse({
506
+ "type": "content_block_start",
507
+ "index": 0,
508
+ "content_block": {"type": "text"}
509
+ })
510
+
511
+ hit_limit = False
512
+
513
+ async for line in r.aiter_lines():
514
+ if not line:
515
+ continue
516
+ if line.strip() == "data: [DONE]":
517
+ break
518
+
519
+ raw = line[6:] if line.startswith("data: ") else line
520
+
521
+ if is_rate_limited(0, raw):
522
+ log(f"Account {acc['account_id'][:8]}... mid-stream limit (anthropic), switching key")
523
+ hit_limit = True
524
+ break
525
+
526
+ try:
527
+ j = json.loads(raw)
528
+ token = j["choices"][0]["delta"].get("content", "")
529
+ except Exception:
530
+ continue
531
+
532
+ if token:
533
+ sent_any_delta = True
534
+ yield sse({
535
+ "type": "content_block_delta",
536
+ "index": 0,
537
+ "delta": {"type": "text_delta", "text": token}
538
+ })
539
+
540
+ if hit_limit:
541
+ await mark_fail(acc)
542
+ continue
543
+
544
+ await mark_ok(acc)
545
+ break
546
+
547
+ except Exception as e:
548
+ log(f"Account {acc['account_id'][:8]}... agen exception: {e}")
549
+ await mark_fail(acc)
550
+
551
+ finally:
552
+ await release_key(acc)
553
+
554
+ # Tutup Anthropic SSE envelope
555
+ yield sse({"type": "content_block_stop", "index": 0})
556
+ yield sse({
557
+ "type": "message_delta",
558
+ "delta": {"stop_reason": "end_turn", "stop_sequence": None},
559
+ "usage": {"output_tokens": 0}
560
+ })
561
+ yield sse({"type": "message_stop"})
562
+
563
+ return StreamingResponse(agen(), media_type="text/event-stream")