Spaces:

MINZO4546
/

minzo-api

Build error

MINZO4546 committed 14 days ago

Commit

27cf60a

verified ·

1 Parent(s): d76d7d1

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -6,7 +6,7 @@ import torch
 main = FastAPI()
-# CORS සක්‍රීය කිරීම - ඕනෑම තැනක සිට සම්බන්ධ වීමට
 main.add_middleware(
     CORSMiddleware,
     allow_origins=["*"],
@@ -15,14 +15,14 @@ main.add_middleware(
 )
 MODEL_ID = "tencent/Hy-MT1.5-1.8B-2bit"
-print(f"🔱 Specialist, Loading {MODEL_ID} (Public Mode)...")
-# Pipeline initialization
 pipe = pipeline(
     "text-generation",
     model=MODEL_ID,
     device_map="cpu",
-    model_kwargs={"trust_remote_code": True}
 )
 class ChatRequest(BaseModel):
@@ -32,10 +32,10 @@ class ChatRequest(BaseModel):
 async def chat(request_data: ChatRequest):
     user_query = request_data.message.strip()
-    # Prompt Setup
     prompt = f"User: {user_query}\nAssistant:"
-    # Text Generation
     results = pipe(
         prompt,
         max_new_tokens=150,
@@ -46,13 +46,14 @@ async def chat(request_data: ChatRequest):
     # Result Cleaning
     generated_text = results[0]['generated_text']
-    reply = generated_text.split("Assistant:")[-1].strip()
-    if not reply:
-        reply = "I am here, MINZO-PRIME. Systems are nominal."
     return {"reply": reply}
 @main.get("/")
 def health():
-    return {"status": "Public Inachi-Lite Online"}

 main = FastAPI()
+# CORS සක්‍රීය කිරීම
 main.add_middleware(
     CORSMiddleware,
     allow_origins=["*"],
 )
 MODEL_ID = "tencent/Hy-MT1.5-1.8B-2bit"
+print(f"🔱 Specialist, Loading {MODEL_ID} on CPU...")
+# 🔱 Pipeline එක නිවැරදිව load කිරීම
 pipe = pipeline(
     "text-generation",
     model=MODEL_ID,
     device_map="cpu",
+    trust_remote_code=True # කෙලින්ම මෙතනට පමණක් ලබා දෙන්න
 )
 class ChatRequest(BaseModel):
 async def chat(request_data: ChatRequest):
     user_query = request_data.message.strip()
+    # Simple Prompt
     prompt = f"User: {user_query}\nAssistant:"
+    # Response Generation
     results = pipe(
         prompt,
         max_new_tokens=150,
     # Result Cleaning
     generated_text = results[0]['generated_text']
+    # Assistant: කියන කොටසෙන් පස්සේ තියෙන ටික විතරක් ගැනීම
+    if "Assistant:" in generated_text:
+        reply = generated_text.split("Assistant:")[-1].strip()
+    else:
+        reply = generated_text.replace(prompt, "").strip()
     return {"reply": reply}
 @main.get("/")
 def health():
+    return {"status": "Inachi-Lite Online", "model": MODEL_ID}