Hugging Face Space — status: Sleeping

Commit 6538c21 (parent: 3247744) — "Fix for Transformers v5"

Files changed:
- app.py (+3 −2)
- solution.py (+4 −2)
app.py — CHANGED

@@ -66,9 +66,10 @@ def compute_mean_logprob(prompt_text, generated_text):

Before (old lines 66–74 — the text of the two removed lines was lost in
extraction; judging from the surrounding context they were presumably a
direct `prompt_ids = tokenizer.apply_chat_template(` call whose result was
chained straight into `.to(model.device)` — verify against the repository):

    # Always use chat template: the model is an instruct model, so
    # logprobs are meaningful only in the chat context.
    message = [{"role": "user", "content": prompt_text}]
-   <removed line — content not preserved in extraction>
        message, add_generation_prompt=True, return_tensors="pt"
-   <removed line — content not preserved in extraction, ended with `)`>
    gen_ids = tokenizer.encode(
        generated_text, add_special_tokens=False, return_tensors="pt"
    ).to(model.device)

After (new lines 66–75):

    # Always use chat template: the model is an instruct model, so
    # logprobs are meaningful only in the chat context.
    message = [{"role": "user", "content": prompt_text}]
+   encoded = tokenizer.apply_chat_template(
        message, add_generation_prompt=True, return_tensors="pt"
+   )
+   prompt_ids = (encoded if isinstance(encoded, torch.Tensor) else encoded["input_ids"]).to(model.device)
    gen_ids = tokenizer.encode(
        generated_text, add_special_tokens=False, return_tensors="pt"
    ).to(model.device)
solution.py — CHANGED

@@ -29,7 +29,8 @@ class LaDisparition:

Before (old lines 29–35 — the removed line's text was lost in extraction;
presumably a one-line `apply_chat_template(...)` call assigned to
`input_ids` — verify against the repository):

    def __call__(self, prompt, max_tokens=20, beam_width=5):
        # Option 2: we use self.tokenizer.apply_chat_template to tokenize the prompt
        message = [{"role": "user", "content": prompt}]
-       <removed line — content not preserved in extraction>
        prompt_len = input_ids.shape[1]

        # Beam search: maintain multiple hypotheses

After (new lines 29–36):

    def __call__(self, prompt, max_tokens=20, beam_width=5):
        # Option 2: we use self.tokenizer.apply_chat_template to tokenize the prompt
        message = [{"role": "user", "content": prompt}]
+       encoded = self.tokenizer.apply_chat_template(message, add_generation_prompt=True, return_tensors="pt")
+       input_ids = (encoded if isinstance(encoded, torch.Tensor) else encoded["input_ids"]).to(self.model.device)
        prompt_len = input_ids.shape[1]

        # Beam search: maintain multiple hypotheses

@@ -155,7 +156,8 @@ class ToulouseSequence:

Before (old lines 155–161 — the removed line's text was lost in extraction;
presumably the equivalent one-line `apply_chat_template(...)` call assigned
to `inputs` — verify against the repository):

    def __call__(self, prompt, max_tokens=20):
        # Option 2: we use self.tokenizer.apply_chat_template to tokenize the prompt
        message = [{"role": "user", "content": prompt}]
-       <removed line — content not preserved in extraction>
        prompt_length = inputs.shape[1]

        # Generate tokens one by one

After (new lines 156–163):

    def __call__(self, prompt, max_tokens=20):
        # Option 2: we use self.tokenizer.apply_chat_template to tokenize the prompt
        message = [{"role": "user", "content": prompt}]
+       encoded = self.tokenizer.apply_chat_template(message, add_generation_prompt=True, return_tensors="pt")
+       inputs = (encoded if isinstance(encoded, torch.Tensor) else encoded["input_ids"]).to(self.model.device)
        prompt_length = inputs.shape[1]

        # Generate tokens one by one