Spaces:

gijl
/

hj

Sleeping

App Files Files Community

gijl committed 14 days ago

Commit

e878f2c

verified ·

1 Parent(s): 6868e14

Update app.py

Browse files

Files changed (1) hide show

app.py +11 -36

app.py CHANGED Viewed

@@ -2,100 +2,75 @@ import gradio as gr
 import torch
 import json
 import torch.nn.functional as F
-from huggingface_hub import hf_hub_download # استيراد أداة التحميل
-from model import MedicalMasterAI # استيراد المعمارية الخاصة بك
-# تحديد الجهاز
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
-# 1. تحميل التوكنايزر المخصص الخاص بك
-# نفترض أن هذا الملف موجود محلياً في المساحة
 with open("tokenizer_config.json", "r", encoding="utf-8") as f:
     vocab = json.load(f)
 stoi = vocab["stoi"]
 itos = vocab["itos"]
-# دوال التشفير وفك التشفير
 def encode(text):
     return [stoi.get(c, 0) for c in text]
 def decode(ids):
     return "".join([itos.get(str(i), "") for i in ids])
-# 2. بناء وتحميل النموذج
 try:
-    # تهيئة النموذج بنفس الأبعاد الموجودة في كودك
     model = MedicalMasterAI(vocab_size=115, n_layer=48, n_head=8, n_embd=768)
-    print("جاري سحب ملف الأوزان من المستودع... قد يستغرق هذا بعض الوقت.")
-    # سحب الملف الضخم من مستودعك مباشرة
-    # تأكد أن "gijl/Medical-Master-1.5B" هو المسار الصحيح لمستودعك
     model_path = hf_hub_download(repo_id="gijl/Medical-Master-1.5B", filename="pytorch_model.bin")
     print("تم التحميل بنجاح. جاري قراءة الأوزان...")
-    # تحميل الأوزان باستخدام المسار الذي أرجعته دالة التحميل
     state_dict = torch.load(model_path, map_location=device, weights_only=True)
-    model.load_state_dict(state_dict)
     model.to(device)
-    model.eval() # وضع التقييم
     model_loaded = True
     print("النموذج جاهز للعمل!")
 except Exception as e:
     print(f"Error loading model: {e}")
     model_loaded = False
-# 3. دالة المحادثة (التوليد التلقائي)
 def medical_chat(message, history):
     if not model_loaded:
-        return "حدث خطأ أثناء تحميل أوزان النموذج. يرجى مراجعة سجلات الأخطاء (Logs)."
     prompt = f"Question: {message} Answer:"
-    # تحويل النص إلى أرقام (Tensors)
     idx = torch.tensor([encode(prompt)], dtype=torch.long).to(device)
-    # عدد الأحرف التي سيولدها النموذج
     max_new_chars = 200
     generated_ids = []
     with torch.no_grad():
         for _ in range(max_new_chars):
-            # قص السياق إذا تجاوز 1024
-            idx_cond = idx[:, -1024:]
-            # تمرير البيانات للنموذج
             logits = model(idx_cond)
-            # التركيز على الحرف الأخير فقط
             logits = logits[:, -1, :]
-            # تطبيق الحرارة (Temperature)
             temperature = 0.8
             logits = logits / temperature
-            # تحويل القيم إلى احتمالات
             probs = F.softmax(logits, dim=-1)
-            # اختيار الحرف التالي
             idx_next = torch.multinomial(probs, num_samples=1)
-            # إضافة الحرف الجديد للسياق
             idx = torch.cat((idx, idx_next), dim=1)
             generated_ids.append(idx_next.item())
-    # فك تشفير الأحرف المولدة فقط
     answer = decode(generated_ids)
     return answer
-# 4. بناء واجهة Gradio
 demo = gr.ChatInterface(
     fn=medical_chat,
     title="Medical Master (Custom PyTorch AI)",
-    description="نموذج مبني من الصفر (Character-Level) للإجابة على الاستفسارات.",
 )
 if __name__ == "__main__":

 import torch
 import json
 import torch.nn.functional as F
+from huggingface_hub import hf_hub_download
+from model import MedicalMasterAI
 # Run on the GPU when CUDA is available; otherwise fall back to the CPU.
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 # Load the tokenizer vocabulary from a JSON file resolved relative to the
 # current working directory.
 with open("tokenizer_config.json", "r", encoding="utf-8") as f:
     vocab = json.load(f)
 # stoi is queried by character in encode(); itos is queried by str(id) in
 # decode().
 stoi = vocab["stoi"]
 itos = vocab["itos"]
 def encode(text):
     # Look up every character of text in stoi and return the ids as a list;
     # a character that is not in stoi is mapped to id 0.
     return [stoi.get(c, 0) for c in text]
 def decode(ids):
     # Look up every id in itos by its string form (str(i)) and concatenate
     # the results; an id with no entry contributes an empty string.
     return "".join([itos.get(str(i), "") for i in ids])
 try:
     model = MedicalMasterAI(vocab_size=115, n_layer=48, n_head=8, n_embd=768)
+    print("جاري سحب ملف الأوزان من المستودع...")
     model_path = hf_hub_download(repo_id="gijl/Medical-Master-1.5B", filename="pytorch_model.bin")
     print("تم التحميل بنجاح. جاري قراءة الأوزان...")
     state_dict = torch.load(model_path, map_location=device, weights_only=True)
+    # إضافة strict=False لتجاهل طبقات الصور (image_projection) بأمان
+    model.load_state_dict(state_dict, strict=False)
     model.to(device)
+    model.eval()
     model_loaded = True
     print("النموذج جاهز للعمل!")
 except Exception as e:
     print(f"Error loading model: {e}")
     model_loaded = False
 def medical_chat(message, history):
     if not model_loaded:
+        return "حدث خطأ أثناء تحميل أوزان النموذج. يرجى مراجعة السجلات."
     prompt = f"Question: {message} Answer:"
     idx = torch.tensor([encode(prompt)], dtype=torch.long).to(device)
     max_new_chars = 200
     generated_ids = []
     with torch.no_grad():
         for _ in range(max_new_chars):
+            # تغيير 1024 إلى 256 ليتطابق مع حجم أوزان التدريب
+            idx_cond = idx[:, -256:]
             logits = model(idx_cond)
             logits = logits[:, -1, :]
             temperature = 0.8
             logits = logits / temperature
             probs = F.softmax(logits, dim=-1)
             idx_next = torch.multinomial(probs, num_samples=1)
             idx = torch.cat((idx, idx_next), dim=1)
             generated_ids.append(idx_next.item())
     answer = decode(generated_ids)
     return answer
 demo = gr.ChatInterface(
     fn=medical_chat,
     title="Medical Master (Custom PyTorch AI)",
+    description="نموذج مبني من الصفر للإجابة على الاستفسارات (يعمل بالوضع النصي حالياً).",
 )
 if __name__ == "__main__":