Spaces:

gijl
/

hj

Running

App Files Files Community

gijl committed 5 days ago

Commit

6382a0d

verified ·

1 Parent(s): 024a042

Update app.py

Browse files

Files changed (1) hide show

app.py +82 -39

app.py CHANGED Viewed

@@ -1,52 +1,95 @@
 import gradio as gr
-from transformers import pipeline, AutoModelForCausalLM, AutoTokenizer
 import torch
-model_id = "gijl/Medical-Master-1.5B"
-# 1. Load the tokenizer and the model separately to ensure accuracy
-tokenizer = AutoTokenizer.from_pretrained(model_id)
-model = AutoModelForCausalLM.from_pretrained(
-    model_id,
-    torch_dtype=torch.float32,
-    low_cpu_mem_usage=True,
-    trust_remote_code=True # important if the model ships custom code
-)
-# 2. Set up the pipeline (original note: with repetition turned off)
-pipe = pipeline(
-    "text-generation",
-    model=model,
-    tokenizer=tokenizer,
-    device=-1 # use the CPU, for free Spaces
-)
 def medical_chat(message, history):
-    """Return one sampled completion for *message* from the text-generation pipeline.
-
-    Args:
-        message: The user's question; it is wrapped in a minimal
-            "Question: ... Answer:" prompt.
-        history: Accepted for the chat-callback signature; not used here.
-
-    Returns:
-        The stripped generated text, or a fixed explanatory message when the
-        pipeline produced only whitespace.
-    """
-    generation_options = {
-        "max_new_tokens": 100,
-        "do_sample": True,
-        "temperature": 0.8,
-        "top_p": 0.9,
-        # discourages repetition / empty output
-        "repetition_penalty": 1.2,
-        # return only the answer, without echoing the prompt
-        "return_full_text": False,
-    }
-    # Deliberately a very simple prompt, with no extra structure
-    outputs = pipe(f"Question: {message}\nAnswer:", **generation_options)
-    answer = outputs[0]['generated_text'].strip()
-    if answer:
-        return answer
-    # Still empty: hand back an explanatory message instead
-    return "النموذج لم يولد أي نص. تأكد من أن ملف pytorch_model.bin متوافق مع config.json في مستودع النموذج."
 # Gradio chat interface that routes each user message to medical_chat
 demo = gr.ChatInterface(
     fn=medical_chat,
-    title="Medical Master Testing Mode",
-    description="اختبار المخرجات الخام للنموذج"
 )
 if __name__ == "__main__":

 import gradio as gr
 import torch
+import json
+import torch.nn.functional as F
+from model import MedicalMasterAI # استيراد المعمارية الخاصة بك
+# Select the compute device: CUDA when available, otherwise the CPU
+device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
+# 1. Load the custom tokenizer vocabulary from tokenizer_config.json
+with open("tokenizer_config.json", "r", encoding="utf-8") as f:
+    vocab = json.load(f)
+# presumably stoi maps character -> integer id and itos maps str(id) -> character
+# (inferred from how encode/decode index them) — confirm against the JSON file
+stoi = vocab["stoi"]
+itos = vocab["itos"]
+# Character-level encoding and decoding helpers
+def encode(text):
+    """Return the list of integer ids for the characters of *text*.
+
+    Each character is looked up in the module-level ``stoi`` table. A
+    character that is not in the table becomes id 0 (the original note says
+    id 0 is the space character; not verifiable from this file alone).
+    """
+    lookup = stoi.get
+    return [lookup(ch, 0) for ch in text]
+def decode(ids):
+    """Return the string spelled by *ids*.
+
+    Each id is converted to its string form and looked up in the module-level
+    ``itos`` table; ids with no entry contribute nothing to the result.
+    """
+    pieces = (itos.get(str(token_id), "") for token_id in ids)
+    return "".join(pieces)
+# 2. Build the model and load its weights
+try:
+    # Instantiate the network with the same dimensions as the model code
+    # (per the original author's note)
+    model = MedicalMasterAI(vocab_size=115, n_layer=48, n_head=8, n_embd=768)
+    # Load the weights; the checkpoint in the Space must be named
+    # pytorch_model.bin. weights_only=True is used for security reasons and
+    # to avoid warnings.
+    state_dict = torch.load(
+        "pytorch_model.bin",
+        map_location=device,
+        weights_only=True,
+    )
+    model.load_state_dict(state_dict)
+    model.to(device)
+    model.eval()  # evaluation mode
+except Exception as exc:
+    # Any failure is reported and recorded in the flag; medical_chat checks
+    # the flag before generating.
+    print(f"Error loading model: {exc}")
+    model_loaded = False
+else:
+    model_loaded = True
+# 3. Chat function (autoregressive generation)
 def medical_chat(message, history):
+    """Generate a character-level reply to *message* by sampling from the model.
+
+    Args:
+        message: The user's text; it is embedded in a
+            "Question: ... Answer:" prompt.
+        history: Accepted for the chat-callback signature; not used here.
+
+    Returns:
+        The decoded text of the 200 sampled ids, or a fixed error message
+        when the model failed to load.
+    """
+    if not model_loaded:
+        return "حدث خطأ أثناء تحميل أوزان النموذج. تأكد من وجود ملف pytorch_model.bin"
+
+    # Number of characters to sample (the model is character-level, per the
+    # original note)
+    max_new_chars = 200
+    # Context is cropped to the last 1024 positions (per the original note,
+    # the position-embedding maximum of the model code)
+    context_window = 1024
+    # Temperature applied to the logits to diversify the answers
+    temperature = 0.8
+
+    # The prompt has no "\n": per the original note it is missing from stoi
+    prompt_ids = encode(f"Question: {message} Answer:")
+    # Turn the prompt ids into a tensor with a leading batch dimension of 1
+    idx = torch.tensor([prompt_ids], dtype=torch.long).to(device)
+
+    sampled_ids = []
+    with torch.no_grad():
+        for _step in range(max_new_chars):
+            window = idx[:, -context_window:]
+            # Keep only the logits of the last position
+            last_logits = model(window)[:, -1, :]
+            # Scale by the temperature, then convert to probabilities
+            probs = F.softmax(last_logits / temperature, dim=-1)
+            # Sample the next character id
+            next_id = torch.multinomial(probs, num_samples=1)
+            sampled_ids.append(next_id.item())
+            # Extend the running context with the new id
+            idx = torch.cat((idx, next_id), dim=1)
+
+    # Decode only the newly generated ids, not the prompt
+    return decode(sampled_ids)
+# 4. Build the Gradio chat interface around medical_chat
 demo = gr.ChatInterface(
     fn=medical_chat,
+    title="Medical Master (Custom PyTorch AI)",
+    description="نموذج مبني من الصفر (Character-Level) للإجابة على الاستفسارات.",
 )
 if __name__ == "__main__":