Ken Sang Tang committed on
Commit
7b2cec5
·
verified ·
1 Parent(s): d0cc061

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +14 -6
app.py CHANGED
@@ -1,16 +1,24 @@
1
  from transformers import AutoTokenizer, AutoModelForCausalLM
2
  import gradio as gr
 
3
 
4
- # Load a suitable LLM model (replace with the chosen model name)
5
- model_name = "databricks/dolly-v2-3b" # Example: you can replace with a financial model
 
6
  tokenizer = AutoTokenizer.from_pretrained(model_name)
7
  model = AutoModelForCausalLM.from_pretrained(model_name)
8
 
 
 
9
  def generate_response(prompt):
10
- inputs = tokenizer(prompt, return_tensors="pt")
11
- outputs = model.generate(**inputs, max_length=100)
12
- response = tokenizer.decode(outputs[0], skip_special_tokens=True)
13
- return response
 
 
 
 
14
 
15
  # Set up Gradio interface
16
  gr.Interface(fn=generate_response, inputs="text", outputs="text").launch()
 
1
  from transformers import AutoTokenizer, AutoModelForCausalLM
2
  import gradio as gr
3
+ import torch
4
 
5
+
6
+ # Load the Dolly model and tokenizer
7
+ model_name = "databricks/dolly-v2-3b"
8
  tokenizer = AutoTokenizer.from_pretrained(model_name)
9
  model = AutoModelForCausalLM.from_pretrained(model_name)
10
 
11
+
12
+ # Function to generate model response
13
  def generate_response(prompt):
14
+ try:
15
+ inputs = tokenizer(prompt, return_tensors="pt")
16
+ outputs = model.generate(**inputs, max_length=200, num_return_sequences=1)
17
+ response = tokenizer.decode(outputs[0], skip_special_tokens=True)
18
+ return response
19
+ except Exception as e:
20
+ return f"An error occurred: {e}"
21
+
22
 
23
  # Set up Gradio interface
24
  gr.Interface(fn=generate_response, inputs="text", outputs="text").launch()