vishesh-t27 commited on
Commit
a2fa178
·
verified ·
1 Parent(s): 9457222

Updated readme.md

Browse files
Files changed (1) hide show
  1. README.md +24 -14
README.md CHANGED
@@ -100,12 +100,17 @@ Human-Eval, IfEval & GSM8K have been evaluated using Greedy-decoding for now for
100
  ```python
101
  !pip install transformers=='5.4.0'
102
 
103
- from transformers import AutoModelForCausalLM, AutoTokenizer
 
104
 
105
-
106
- model_name = "Rta-AILabs/Nandi-mini-150M-Instruct"
107
 
108
  tokenizer = AutoTokenizer.from_pretrained(model_name, trust_remote_code=True)
 
 
 
 
 
109
 
110
  model = AutoModelForCausalLM.from_pretrained(
111
  model_name,
@@ -113,14 +118,18 @@ model = AutoModelForCausalLM.from_pretrained(
113
  device_map="auto",
114
  ).eval()
115
 
116
- prompt = """
117
- Explain Newton's second Law of Motion
118
- """
119
- model_inputs = tokenizer([prompt], return_tensors="pt").to(model.device)
120
 
121
- outputs = model.generate(
122
- **model_inputs,
123
- max_new_tokens=50,
 
 
 
 
 
 
 
124
  do_sample=True,
125
  temperature=0.3,
126
  top_k=20,
@@ -128,10 +137,11 @@ outputs = model.generate(
128
  top_p=0.95
129
  )
130
 
131
- response = tokenizer.decode(
132
- outputs[0],
133
- skip_special_tokens=True,
134
- )
 
135
 
136
  print(response)
137
  ```
 
100
  ```python
101
  !pip install transformers=='5.4.0'
102
 
103
+ from transformers import AutoTokenizer, AutoModelForCausalLM
104
+ import torch
105
 
106
+ model_name = "Rta-AILabs/Nandi-Mini-150M-Instruct"
 
107
 
108
  tokenizer = AutoTokenizer.from_pretrained(model_name, trust_remote_code=True)
109
+ model = AutoModelForCausalLM.from_pretrained(
110
+ model_name,
111
+ trust_remote_code=True,
112
+ dtype=torch.bfloat16
113
+ ).cuda()
114
 
115
  model = AutoModelForCausalLM.from_pretrained(
116
  model_name,
 
118
  device_map="auto",
119
  ).eval()
120
 
121
+ prompt = "Explain newton's second law of motion"
 
 
 
122
 
123
+ messages = [
124
+ {"role": "user", "content": prompt}
125
+ ]
126
+
127
+ prompt = tokenizer.apply_chat_template(messages, tokenize=False)
128
+ inputs = tokenizer(prompt, return_tensors="pt").to(model.device)
129
+
130
+ generated_ids = model.generate(
131
+ **inputs,
132
+ max_new_tokens=500,
133
  do_sample=True,
134
  temperature=0.3,
135
  top_k=20,
 
137
  top_p=0.95
138
  )
139
 
140
+ generated_ids = [
141
+ output_ids[len(input_ids):] for input_ids, output_ids in zip(inputs.input_ids, generated_ids)
142
+ ]
143
+
144
+ response = tokenizer.batch_decode(generated_ids, skip_special_tokens=True)[0]
145
 
146
  print(response)
147
  ```