Spaces:

gijl
/

hj

Running

App Files Community

gijl committed 5 days ago

Commit

024a042

verified ·

1 Parent(s): 4ce8159

Update app.py

Browse files

Files changed (1) hide show

app.py +31 -34

app.py CHANGED Viewed

@@ -1,55 +1,52 @@
 import gradio as gr
-from transformers import pipeline
 import torch
-# تحديد الجهاز (GPU إذا توفر، وإلا CPU)
-device = 0 if torch.cuda.is_available() else -1
-# تحميل النموذج
 model_id = "gijl/Medical-Master-1.5B"
-try:
-    pipe = pipeline(
-        "text-generation",
-        model=model_id,
-        device=device,
-        # استخدام float32 لتجنب مشاكل التوافق على CPU المساحات المجانية
-        model_kwargs={"torch_dtype": torch.float32}
-    )
-except Exception as e:
-    print(f"Error loading model: {e}")
-    pipe = None
 def medical_chat(message, history):
-    if pipe is None:
-        return "النموذج لا يزال قيد التحميل أو هناك مشكلة في الذاكرة."
     prompt = f"Question: {message}\nAnswer:"
-    # تقليل عدد التوكنز لتسريع الاستجابة وتجنب المهلة الزمنية (Timeout)
     results = pipe(
         prompt,
-        max_new_tokens=200,
         do_sample=True,
-        temperature=0.7,
-        top_p=0.9
     )
-    generated_text = results[0]['generated_text']
-    # استخراج الإجابة فقط
-    if "Answer:" in generated_text:
-        answer = generated_text.split("Answer:")[-1].strip()
-    else:
-        answer = generated_text
-    return answer
-# بناء الواجهة بدون وسيط theme لتجنب الخطأ
 demo = gr.ChatInterface(
     fn=medical_chat,
-    title="Medical Master 1.5B",
-    description="مساعد طبي ذكي - للاستخدام التعليمي فقط",
-    examples=["What are the symptoms of diabetes?", "كيف أحافظ على صحة القلب؟"],
 )
 if __name__ == "__main__":

 import gradio as gr
+from transformers import pipeline, AutoModelForCausalLM, AutoTokenizer
 import torch
 model_id = "gijl/Medical-Master-1.5B"
+# 1. تحميل التوكنايزر والنموذج بشكل منفصل لضمان الدقة
+tokenizer = AutoTokenizer.from_pretrained(model_id)
+model = AutoModelForCausalLM.from_pretrained(
+    model_id,
+    torch_dtype=torch.float32,
+    low_cpu_mem_usage=True,
+    trust_remote_code=True # مهم إذا كان هناك كود مخصص للنموذج
+)
+# 2. إعداد الـ Pipeline مع إيقاف التكرار
+pipe = pipeline(
+    "text-generation",
+    model=model,
+    tokenizer=tokenizer,
+    device=-1 # استخدام CPU للمساحات المجانية
+)
 def medical_chat(message, history):
+    # تجربة برومبت بسيط جداً بدون تعقيد
     prompt = f"Question: {message}\nAnswer:"
     results = pipe(
         prompt,
+        max_new_tokens=100,
         do_sample=True,
+        temperature=0.8,
+        top_p=0.9,
+        repetition_penalty=1.2, # لمنع التكرار أو الفراغ
+        return_full_text=False   # لكي يعطينا الإجابة فقط بدون السؤال
     )
+    response = results[0]['generated_text'].strip()
+    # إذا كان الرد لا يزال فارغاً، سنعيد رسالة توضيحية
+    if not response:
+        return "النموذج لم يولد أي نص. تأكد من أن ملف pytorch_model.bin متوافق مع config.json في مستودع النموذج."
+    return response
 demo = gr.ChatInterface(
     fn=medical_chat,
+    title="Medical Master Testing Mode",
+    description="اختبار المخرجات الخام للنموذج"
 )
 if __name__ == "__main__":