ysharma HF Staff commited on
Commit
ffc2dd6
·
verified ·
1 Parent(s): b8511f6

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -17,11 +17,11 @@ model = AutoModelForCausalLM.from_pretrained(MODEL_ID, torch_dtype=torch.bfloat1
17
  def _generate(text: str):
18
  inputs = tok.apply_chat_template(
19
  [{"role": "user", "content": f"Summarize in 3 bullets:\n\n{text}"}],
20
- return_tensors="pt", add_generation_prompt=True,
21
  ).to("cuda")
22
  streamer = TextIteratorStreamer(tok, skip_prompt=True, skip_special_tokens=True)
23
  Thread(target=model.generate, kwargs=dict(
24
- inputs=inputs, streamer=streamer, max_new_tokens=300, do_sample=False,
25
  )).start()
26
  return streamer
27
 
 
17
  def _generate(text: str):
18
  inputs = tok.apply_chat_template(
19
  [{"role": "user", "content": f"Summarize in 3 bullets:\n\n{text}"}],
20
+ return_tensors="pt", return_dict=True, add_generation_prompt=True,
21
  ).to("cuda")
22
  streamer = TextIteratorStreamer(tok, skip_prompt=True, skip_special_tokens=True)
23
  Thread(target=model.generate, kwargs=dict(
24
+ **inputs, streamer=streamer, max_new_tokens=300, do_sample=False,
25
  )).start()
26
  return streamer
27