Update app.py
app.py CHANGED
@@ -9,7 +9,7 @@ model = Llama.from_pretrained(
     repo_id="unsloth/Qwen3.5-35B-A3B-GGUF",
     filename="Qwen3.5-35B-A3B-UD-IQ4_XS.gguf",
     n_ctx=2048,
-    n_threads=
+    n_threads=8,
 )
 
 def get_stats():
@@ -22,9 +22,6 @@ def get_stats():
 
 def chat(message, history):
     messages = [{"role": "system", "content": "Reply directly without any reasoning or thinking process."}]
-    for user, assistant in history:
-        messages.append({"role": "user", "content": user})
-        messages.append({"role": "assistant", "content": assistant})
     messages.append({"role": "user", "content": message})
 
     output = ""
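In effect, the commit completes the previously dangling `n_threads=` argument and stops replaying prior conversation turns into the prompt. Below is a minimal sketch of how the touched code reads after this commit, assuming llama-cpp-python; the `from llama_cpp import Llama` import and the streaming loop after `output = ""` do not appear in the diff and are assumptions here.

```python
from llama_cpp import Llama  # assumed import; not shown in the diff

model = Llama.from_pretrained(
    repo_id="unsloth/Qwen3.5-35B-A3B-GGUF",
    filename="Qwen3.5-35B-A3B-UD-IQ4_XS.gguf",
    n_ctx=2048,
    n_threads=8,  # was left dangling as `n_threads=` before this commit
)

def chat(message, history):
    # The commit drops the loop that replayed `history` into the prompt,
    # so each turn is now answered without prior conversation context.
    messages = [{"role": "system", "content": "Reply directly without any reasoning or thinking process."}]
    messages.append({"role": "user", "content": message})

    output = ""
    # Assumed continuation: the diff ends at `output = ""`, so the streaming
    # loop below is a sketch based on llama-cpp-python's chat-completion API.
    for chunk in model.create_chat_completion(messages=messages, stream=True):
        delta = chunk["choices"][0]["delta"]
        if "content" in delta:
            output += delta["content"]
            yield output
```

Dropping the history replay trades multi-turn memory for a prompt that stays comfortably inside the 2048-token `n_ctx` window.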