Spaces:

bahi-bh
/

Gf4test

Sleeping

App Files Files Community

bahi-bh committed 8 days ago

Commit

17aa345

verified ·

1 Parent(s): f535544

Update main.py

Browse files

Files changed (1) hide show

main.py +251 -255

main.py CHANGED Viewed

@@ -1,9 +1,9 @@
 import os
 import json
 import time
-import logging
 import asyncio
-import g4f
 from fastapi import FastAPI, HTTPException, Header
 from fastapi.responses import StreamingResponse
@@ -11,449 +11,445 @@ from fastapi.middleware.cors import CORSMiddleware
 from pydantic import BaseModel
 from typing import List, Optional
-# ================= Logging =================
-logging.basicConfig(
-    level=logging.INFO,
-    format="%(asctime)s %(levelname)s %(message)s"
-)
 logger=logging.getLogger(__name__)
-# ================= App =================
 app=FastAPI(
-    title="G4F Smart Gateway",
     version="2.0"
 )
 app.add_middleware(
     CORSMiddleware,
     allow_origins=["*"],
-    allow_credentials=False,
     allow_methods=["*"],
     allow_headers=["*"]
 )
 API_KEY=os.getenv(
     "API_KEY",
-    "your_fallback_secret"
 )
-# ================= Models =================
-class ChatMessage(BaseModel):
     role:str
     content:str
 class ChatRequest(BaseModel):
-    model:str="gpt-4o-mini"
-    messages:List[ChatMessage]
     stream:bool=False
     provider:Optional[str]=None
-    temperature:Optional[float]=0.7
-    max_tokens:Optional[int]=2048
-# ================= Auth =================
-def verify_key(auth:str):
     if not auth:
-        raise HTTPException(
-            status_code=401,
-            detail="Missing Authorization"
-        )
-    parts=auth.split()
-    if len(parts)!=2:
         raise HTTPException(
             status_code=401,
-            detail="Malformed Authorization"
         )
-    if parts[0]!="Bearer":
-        raise HTTPException(
-            status_code=401,
-            detail="Invalid Authorization"
-        )
-    if parts[1]!=API_KEY:
         raise HTTPException(
             status_code=401,
-            detail="Invalid API Key"
         )
-# ================= Provider Selection =================
-def choose_provider(model:str):
-    model=model.lower()
-    try:
-        if "qwen" in model:
-            return getattr(
-                g4f.Provider,
-                "DeepInfra",
-                None
-            )
-        elif "perplexity" in model:
-            return getattr(
-                g4f.Provider,
-                "PerplexityLabs",
-                None
-            )
-        elif "llama" in model:
-            return getattr(
-                g4f.Provider,
-                "DeepInfra",
-                None
-            )
-        elif "claude" in model:
-            return getattr(
-                g4f.Provider,
-                "OpenaiChat",
-                None
-            )
-        elif "gemini" in model:
-            return getattr(
-                g4f.Provider,
-                "OpenaiChat",
-                None
-            )
-        elif "gpt" in model:
-            return getattr(
-                g4f.Provider,
-                "OpenaiChat",
-                None
             )
-    except:
-        pass
-    return None
-# ================= Health =================
 @app.get("/")
 async def root():
     return {
-        "status":"online"
     }
-# ================= Models =================
 @app.get("/v1/models")
 async def models(
-    authorization:str=Header(None)
 ):
-    verify_key(
-        authorization
-    )
     try:
-        found=[]
-        if hasattr(
-            g4f.models,
-            "ModelUtils"
-        ):
-            found=list(
-                g4f.models.ModelUtils.convert.keys()
-            )
-        found=sorted(
-            list(set(found))
-        )
-        if not found:
-            found=[
-                "gpt-4o-mini",
-                "gpt-4",
-                "gpt-3.5-turbo",
-                "qwen-2.5-72b",
-                "llama-3-70b",
-                "perplexity"
-            ]
-        return {
-            "object":"list",
-            "data":[
-                {
                     "id":m,
                     "object":"model",
-                    "owned_by":"g4f"
-                }
-                for m in found
-            ]
-        }
     except Exception as e:
-        logger.exception(e)
-        return {
-            "object":"list",
-            "data":[
-                {
-                    "id":"gpt-4o-mini",
-                    "object":"model"
-                }
-            ]
-        }
-# ================= Chat =================
 @app.post("/v1/chat/completions")
 async def chat(
-    body:ChatRequest,
-    authorization:str=Header(None)
 ):
-    verify_key(
         authorization
     )
-    try:
-        messages=[
-            {
-                "role":m.role,
-                "content":m.content
-            }
-            for m in body.messages
-        ]
-        provider=None
-        if body.provider:
-            provider=getattr(
-                g4f.Provider,
-                body.provider,
-                None
-            )
-        else:
-            provider=choose_provider(
-                body.model
-            )
-        logger.info(
-            f"Model={body.model} Provider={provider}"
-        )
-        # ========= STREAM =========
-        if body.stream:
-            def generate():
-                try:
-                    response=g4f.ChatCompletion.create(
-                        model=body.model,
-                        messages=messages,
-                        provider=provider,
-                        stream=True
-                    )
-                    for chunk in response:
                         payload={
                             "id":"chatcmpl",
-                            "object":
-                            "chat.completion.chunk",
-                            "created":
-                            int(time.time()),
-                            "model":
-                            body.model,
-                            "choices":[
-                                {
-                                    "delta":{
-                                        "content":
-                                        str(chunk)
-                                    },
-                                    "index":0
-                                }
-                            ]
-                        }
-                        yield (
-                            f"data: {json.dumps(payload)}\n\n"
-                        )
-                    yield "data: [DONE]\n\n"
-                except Exception as e:
-                    logger.exception(e)
-                    yield (
-                        f"data:{json.dumps({'error':str(e)})}\n\n"
-                    )
-            return StreamingResponse(
-                generate(),
-                media_type="text/event-stream"
-            )
-        # ========= NORMAL =========
-        response=await asyncio.to_thread(
-            g4f.ChatCompletion.create,
-            model=body.model,
-            messages=messages,
-            provider=provider
-        )
-        return {
-            "id":"chatcmpl",
-            "object":"chat.completion",
-            "created":
-            int(time.time()),
-            "model":
-            body.model,
-            "choices":[
-                {
-                    "index":0,
-                    "message":{
-                        "role":
-                        "assistant",
-                        "content":
-                        str(response)
-                    },
-                    "finish_reason":
-                    "stop"
-                }
-            ]
-        }
-    except Exception as e:
-        logger.exception(e)
-        raise HTTPException(
-            status_code=500,
-            detail=str(e)
         )
-# ================= Test =================
-@app.get("/test/{model}")
-async def test_model(
-    model:str
-):
-    try:
-        provider=choose_provider(
-            model
         )
-        result=await asyncio.to_thread(
             g4f.ChatCompletion.create,
-            model=model,
-            provider=provider,
-            messages=[
-                {
-                    "role":"user",
-                    "content":"hello"
-                }
-            ]
-        )
-        return {
-            "model":model,
-            "provider":str(provider),
-            "working":True
-        }
-    except Exception as e:
-        return {
-            "model":model,
-            "working":False,
-            "error":str(e)
-        }

 import os
 import json
 import time
 import asyncio
+import logging
+import inspect
 from fastapi import FastAPI, HTTPException, Header
 from fastapi.responses import StreamingResponse
 from pydantic import BaseModel
 from typing import List, Optional
+import g4f
+import g4f.Provider as Provider
+import litellm
+# ----------------------------
+# Logging
+# ----------------------------
+# Configure the root logger once at INFO; this module logs through its own named logger.
+logging.basicConfig(level=logging.INFO)
 logger=logging.getLogger(__name__)
+# ----------------------------
+# App
+# ----------------------------
+app=FastAPI(title="AI Gateway",version="2.0")
+# CORS is fully open: every origin, method and header is accepted.
+app.add_middleware(
+    CORSMiddleware,
+    allow_headers=["*"],
+    allow_methods=["*"],
+    allow_origins=["*"]
+)
+# Bearer token the auth check compares against; "your_secret" is used when
+# the API_KEY environment variable is unset.
+API_KEY=os.environ.get("API_KEY","your_secret")
+# Model id used when a request body does not name one.
+DEFAULT_MODEL=os.environ.get("DEFAULT_MODEL","groq/llama-3.3-70b-versatile")
+# ----------------------------
+# Models
+# ----------------------------
+class Message(BaseModel):
+    """One chat turn: the speaker's ``role`` and the text ``content``."""
+    role: str
+    content: str
 class ChatRequest(BaseModel):
+    """Request body accepted by the chat completions endpoint."""
+    # Model identifier; falls back to DEFAULT_MODEL when omitted.
+    model: str = DEFAULT_MODEL
+    # Conversation turns, in the order supplied by the client.
+    messages: List[Message]
+    # When true the endpoint answers with a server-sent event stream.
+    stream: bool = False
+    # Optional provider name supplied by the client.
+    provider: Optional[str] = None
+# ----------------------------
+# Auth
+# ----------------------------
+def verify(auth):
+    """Validate an ``Authorization`` header value against ``API_KEY``.
+
+    Args:
+        auth: Raw header value, or ``None``/empty when the header is absent.
+
+    Raises:
+        HTTPException: 401 "Missing token" when ``auth`` is falsy;
+            401 "Unauthorized" when it is not exactly ``Bearer <API_KEY>``.
+    """
+    # Function-scope import keeps this block self-contained.
+    import hmac
     if not auth:
         raise HTTPException(
             status_code=401,
+            detail="Missing token"
         )
+    expected=f"Bearer {API_KEY}"
+    # Constant-time comparison so response timing does not reveal how much
+    # of the key matched. Bytes are compared because the str form of
+    # compare_digest only accepts ASCII input.
+    if not hmac.compare_digest(
+        auth.encode("utf-8"),
+        expected.encode("utf-8")
+    ):
         raise HTTPException(
             status_code=401,
+            detail="Unauthorized"
         )
+# ----------------------------
+# g4f provider discovery
+# ----------------------------
+# Names exported by the g4f Provider module that the model listing skips.
+SKIP={"AsyncProvider","BaseProvider","RetryProvider"}
+def collect_models(cls):
+    """Return the model names a provider class advertises.
+
+    Reads the ``default_model``, ``models`` and ``model`` attributes of
+    ``cls``, in that order. A string contributes itself; a list or tuple
+    contributes ``str()`` of each item. Missing, falsy, or differently
+    typed attributes are ignored.
+
+    Args:
+        cls: Any object (normally a provider class) to inspect.
+
+    Returns:
+        A list of unique names in first-seen order, so the result is the
+        same on every run (a plain ``set`` would reorder strings between
+        processes because of hash randomisation).
+    """
+    # A dict is used as an insertion-ordered set.
+    seen={}
+    for attr in ("default_model","models","model"):
+        v=getattr(cls,attr,None)
+        if not v:
+            continue
+        if isinstance(v,str):
+            seen.setdefault(v)
+        elif isinstance(v,(list,tuple)):
+            for x in v:
+                seen.setdefault(str(x))
+    return list(seen)
+# ----------------------------
+# health
+# ----------------------------
 @app.get("/")
 async def root():
+    """Health check: report that the service is up and name the default model."""
+    info={"status":"online"}
+    info["default"]=DEFAULT_MODEL
+    return info
+# ----------------------------
+# models
+# ----------------------------
 @app.get("/v1/models")
 async def models(
+    authorization:str=Header(None)
 ):
+    """List the model ids this gateway advertises, OpenAI-style.
+
+    The list starts with a fixed set of LiteLLM model ids, followed by
+    whatever each class exported by the g4f ``Provider`` module reports
+    through ``collect_models``.
+
+    Args:
+        authorization: ``Authorization`` header, checked by ``verify``.
+
+    Returns:
+        ``{"object": "list", "data": [...]}`` where each entry has ``id``,
+        ``object`` and ``owned_by`` ("litellm" or the provider class name).
+
+    Raises:
+        HTTPException: 401 from ``verify`` on a missing or wrong token.
+    """
+    verify(authorization)
+    ll_models=(
+        "groq/llama-3.3-70b-versatile",
+        "groq/llama-3.1-8b-instant",
+        "openrouter/qwen/qwen-2.5-72b-instruct",
+        "huggingface/Qwen/Qwen2.5-72B-Instruct",
+        "openrouter/deepseek/deepseek-chat",
+        "openai/gpt-4o",
+        "openai/gpt-4o-mini"
+    )
+    data=[
+        {"id":m,"object":"model","owned_by":"litellm"}
+        for m in ll_models
+    ]
+    # g4f dynamic providers
+    for name in dir(Provider):
+        if name.startswith("_") or name in SKIP:
+            continue
+        # Guard each provider separately: one that fails to resolve must
+        # not hide every provider that comes after it.
+        try:
+            cls=getattr(Provider,name)
+            if not inspect.isclass(cls):
+                continue
+            found=collect_models(cls)
+        except Exception:
+            logger.exception("Skipping g4f provider %s",name)
+            continue
+        data.extend(
+            {"id":m,"object":"model","owned_by":name}
+            for m in found
+        )
+    return {
+        "object":"list",
+        "data":data
+    }
+# ----------------------------
+# Chat
+# ----------------------------
 @app.post("/v1/chat/completions")
 async def chat(
+    body:ChatRequest,
+    authorization:str=Header(None)
 ):
+    """OpenAI-style chat completion: LiteLLM first, g4f as fallback.
+
+    Args:
+        body: Parsed request (model, messages, stream flag, provider).
+        authorization: ``Authorization`` header, checked by ``verify``.
+
+    Returns:
+        A ``StreamingResponse`` of server-sent events when ``body.stream``
+        is true, otherwise a ``chat.completion`` dict.
+
+    Raises:
+        HTTPException: 401 from ``verify``; 500 when both LiteLLM and the
+            g4f fallback fail on the non-streaming path.
+    """
+    verify(authorization)
+    messages=[
+        {"role":m.role,"content":m.content}
+        for m in body.messages
+    ]
+    # NOTE(review): body.provider is accepted but never used below --
+    # confirm whether the g4f fallback is meant to honour it.
+
+    def chunk_event(content):
+        """Format one SSE ``data:`` event carrying a completion chunk."""
+        payload={
+            "id":"chatcmpl",
+            "object":"chat.completion.chunk",
+            "created":int(time.time()),
+            "model":body.model,
+            "choices":[{
+                "delta":{
+                    "content":content
+                },
+                "index":0
+            }]
+        }
+        return f"data:{json.dumps(payload)}\n\n"
+
+    # =====================
+    # Streaming
+    # =====================
+    if body.stream:
+        # Deliberately a plain generator: both client libraries stream
+        # through blocking iterators, and StreamingResponse runs sync
+        # generators in a worker thread, keeping the event loop free.
+        def generate():
+            sent=False
+            try:
+                try:
+                    # LiteLLM first
+                    response=litellm.completion(
+                        model=body.model,
+                        messages=messages,
+                        stream=True
+                    )
+                    for chunk in response:
+                        try:
+                            content=chunk.choices[0].delta.content
+                        except (AttributeError,IndexError,TypeError):
+                            content=None
+                        if content:
+                            sent=True
+                            yield chunk_event(content)
+                # `Exception`, not a bare except: GeneratorExit (client
+                # went away) must pass through instead of starting g4f.
+                except Exception:
+                    if sent:
+                        # Part of the answer is already with the client;
+                        # restarting through g4f would duplicate it.
+                        raise
+                    logger.warning("Fallback g4f",exc_info=True)
+                    response=g4f.ChatCompletion.create(
+                        model=body.model,
+                        messages=messages,
+                        stream=True
+                    )
+                    for chunk in response:
+                        yield chunk_event(str(chunk))
+            except Exception as e:
+                # Headers are already sent, so report the failure in-band.
+                logger.exception("Streaming failed")
+                yield f"data:{json.dumps({'error':str(e)})}\n\n"
+                return
+            yield "data:[DONE]\n\n"
+        return StreamingResponse(
+            generate(),
+            media_type="text/event-stream"
+        )
+    # =====================
+    # Normal
+    # =====================
+    try:
+        response=await asyncio.to_thread(
+            litellm.completion,
+            model=body.model,
+            messages=messages
+        )
+        content=response.choices[0].message.content
+    except Exception:
+        logger.warning("Using g4f fallback",exc_info=True)
+        try:
+            content=await asyncio.to_thread(
+                g4f.ChatCompletion.create,
+                model=body.model,
+                messages=messages
+            )
+        except Exception as e:
+            logger.exception("g4f fallback failed")
+            raise HTTPException(
+                status_code=500,
+                detail=str(e)
+            ) from e
+    return {
+        "id":"chatcmpl",
+        "object":"chat.completion",
+        "created":int(time.time()),
+        "model":body.model,
+        "choices":[
+            {
+                "index":0,
+                "message":{
+                    "role":"assistant",
+                    # A missing reply becomes "" rather than the text "None".
+                    "content":"" if content is None else str(content)
+                },
+                "finish_reason":"stop"
+            }
+        ]
+    }