# File size: 392 Bytes
import gradio as gr
from llama_cpp import Llama
# Module-level model handle shared by every chat request: the Q4_K_M
# quantized TinyLlama GGUF file, identified by repo id and file name.
llm = Llama.from_pretrained(
    filename="tinyllama-1.1b.Q4_K_M.gguf",
    repo_id="TheBloke/TinyLlama-1.1B-GGUF",
)
def _history_to_messages(history):
    """Convert Gradio chat history into role/content message dicts.

    Two history layouts are accepted: a list of
    ``{"role": ..., "content": ...}`` dicts, or a list of
    ``(user_text, assistant_text)`` pairs. Entries of any other shape, and
    entries whose content is not a non-empty string, are skipped.

    Args:
        history: The prior turns, or ``None``/empty for a new conversation.

    Returns:
        A list of ``{"role": str, "content": str}`` dicts, oldest first.
    """
    messages = []
    for turn in history or []:
        if isinstance(turn, dict):
            pairs = [(turn.get("role"), turn.get("content"))]
        elif isinstance(turn, (list, tuple)) and len(turn) == 2:
            pairs = [("user", turn[0]), ("assistant", turn[1])]
        else:
            # Unknown entry shape: ignore it rather than fail the request.
            continue
        for role, content in pairs:
            # Forward plain text only; None placeholders and non-text
            # payloads are left out of the prompt.
            if role and isinstance(content, str) and content:
                messages.append({"role": role, "content": content})
    return messages


def chat(message, history):
    """Return the model's reply to ``message``, given the earlier turns.

    Args:
        message: The newest user message.
        history: Earlier turns of the conversation, in either layout
            accepted by ``_history_to_messages``. May be ``None`` or empty.

    Returns:
        The ``content`` of the first choice in the completion response.

    Raises:
        ValueError: Re-raised from the completion call when there is no
            history to drop, or when the retry without history also fails.
    """
    latest = {"role": "user", "content": message}
    context = _history_to_messages(history)
    try:
        response = llm.create_chat_completion(messages=[*context, latest])
    except ValueError:
        # NOTE(review): llama-cpp-python is expected to raise ValueError when
        # the prompt exceeds the context window -- confirm. Falling back to
        # the latest message alone keeps long conversations answering
        # instead of erroring out.
        if not context:
            raise
        response = llm.create_chat_completion(messages=[latest])
    return response["choices"][0]["message"]["content"]
# Build the chat UI around `chat` and start serving it.
demo = gr.ChatInterface(fn=chat)
demo.launch()
|