Spaces:

gijl
/

hj

Sleeping

App Files Community

gijl committed 15 days ago

Commit

a5f0014

verified ·

1 Parent(s): cde5e54

Update app.py

Browse files

Files changed (1) hide show

app.py +15 -9

app.py CHANGED Viewed

@@ -2,12 +2,14 @@ import gradio as gr
 import torch
 import json
 import torch.nn.functional as F
 from model import MedicalMasterAI # استيراد المعمارية الخاصة بك
 # تحديد الجهاز
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 # 1. تحميل التوكنايزر المخصص الخاص بك
 with open("tokenizer_config.json", "r", encoding="utf-8") as f:
     vocab = json.load(f)
@@ -16,7 +18,6 @@ itos = vocab["itos"]
 # دوال التشفير وفك التشفير
 def encode(text):
-    # إذا لم يجد الحرف، يستبدله بمسافة (0)
     return [stoi.get(c, 0) for c in text]
 def decode(ids):
@@ -27,14 +28,20 @@ try:
     # تهيئة النموذج بنفس الأبعاد الموجودة في كودك
     model = MedicalMasterAI(vocab_size=115, n_layer=48, n_head=8, n_embd=768)
-    # تحميل الأوزان (تأكد من أن اسم الملف في المساحة هو pytorch_model.bin)
-    # استخدام weights_only=True لدواعي أمنية ولمنع التحذيرات
-    state_dict = torch.load("pytorch_model.bin", map_location=device, weights_only=True)
     model.load_state_dict(state_dict)
     model.to(device)
     model.eval() # وضع التقييم
     model_loaded = True
 except Exception as e:
     print(f"Error loading model: {e}")
     model_loaded = False
@@ -42,22 +49,21 @@ except Exception as e:
 # 3. دالة المحادثة (التوليد التلقائي)
 def medical_chat(message, history):
     if not model_loaded:
-        return "حدث خطأ أثناء تحميل أوزان النموذج. تأكد من وجود ملف pytorch_model.bin"
-    # ملاحظة: تم إزالة \n لأنها غير موجودة في قاموسك (stoi)
     prompt = f"Question: {message} Answer:"
     # تحويل النص إلى أرقام (Tensors)
     idx = torch.tensor([encode(prompt)], dtype=torch.long).to(device)
-    # عدد الأحرف التي سيولدها النموذج (بما أنه Character-level)
     max_new_chars = 200
     generated_ids = []
     with torch.no_grad():
         for _ in range(max_new_chars):
-            # قص السياق إذا تجاوز 1024 (الحد الأقصى للـ Position Embedding في كودك)
             idx_cond = idx[:, -1024:]
             # تمرير البيانات للنموذج
@@ -66,7 +72,7 @@ def medical_chat(message, history):
             # التركيز على الحرف الأخير فقط
             logits = logits[:, -1, :]
-            # تطبيق الحرارة (Temperature) لتنويع الإجابات
             temperature = 0.8
             logits = logits / temperature

 import torch
 import json
 import torch.nn.functional as F
+from huggingface_hub import hf_hub_download # استيراد أداة التحميل
 from model import MedicalMasterAI # استيراد المعمارية الخاصة بك
 # تحديد الجهاز
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 # 1. تحميل التوكنايزر المخصص الخاص بك
+# نفترض أن هذا الملف موجود محلياً في المساحة
 with open("tokenizer_config.json", "r", encoding="utf-8") as f:
     vocab = json.load(f)
 # دوال التشفير وفك التشفير
 def encode(text):
     """Convert text into a list of integer ids, one per character.

     Each character is looked up in the module-level ``stoi`` mapping;
     characters missing from the mapping are encoded as 0.
     """
     ids = []
     for ch in text:
         ids.append(stoi.get(ch, 0))
     return ids
 def decode(ids):
     # تهيئة النموذج بنفس الأبعاد الموجودة في كودك
     model = MedicalMasterAI(vocab_size=115, n_layer=48, n_head=8, n_embd=768)
+    print("جاري سحب ملف الأوزان من المستودع... قد يستغرق هذا بعض الوقت.")
+    # سحب الملف الضخم من مستودعك مباشرة
+    # تأكد أن "gijl/Medical-Master-1.5B" هو المسار الصحيح لمستودعك
+    model_path = hf_hub_download(repo_id="gijl/Medical-Master-1.5B", filename="pytorch_model.bin")
+    print("تم التحميل بنجاح. جاري قراءة الأوزان...")
+    # تحميل الأوزان باستخدام المسار الذي أرجعته دالة التحميل
+    state_dict = torch.load(model_path, map_location=device, weights_only=True)
     model.load_state_dict(state_dict)
     model.to(device)
     model.eval() # وضع التقييم
     model_loaded = True
+    print("النموذج جاهز للعمل!")
 except Exception as e:
     print(f"Error loading model: {e}")
     model_loaded = False
 # 3. دالة المحادثة (التوليد التلقائي)
 def medical_chat(message, history):
     if not model_loaded:
+        return "حدث خطأ أثناء تحميل أوزان النموذج. يرجى مراجعة سجلات الأخطاء (Logs)."
     prompt = f"Question: {message} Answer:"
     # تحويل النص إلى أرقام (Tensors)
     idx = torch.tensor([encode(prompt)], dtype=torch.long).to(device)
+    # عدد الأحرف التي سيولدها النموذج
     max_new_chars = 200
     generated_ids = []
     with torch.no_grad():
         for _ in range(max_new_chars):
+            # قص السياق إذا تجاوز 1024
             idx_cond = idx[:, -1024:]
             # تمرير البيانات للنموذج
             # التركيز على الحرف الأخير فقط
             logits = logits[:, -1, :]
+            # تطبيق الحرارة (Temperature)
             temperature = 0.8
             logits = logits / temperature