HemanthSai7 committed on
Commit
bf277cf
·
verified ·
1 Parent(s): feaca64

Update tokenization_nandi.py

Browse files
Files changed (1) hide show
  1. tokenization_nandi.py +1 -1
tokenization_nandi.py CHANGED
@@ -106,7 +106,7 @@ class NandiTokenizer(TokenizersBackend):
106
  ):
107
  if isinstance(text, str):
108
  # This is a temporary fix to match the behaviour of the training pipeline
109
- text = "<|im_start|> " + text
110
  return super().encode(
111
  text,
112
  text_pair=text_pair,
 
106
  ):
107
  if isinstance(text, str):
108
  # This is a temporary fix to match the behaviour of the training pipeline
109
+ text = "<|im_start|>" + " " + text
110
  return super().encode(
111
  text,
112
  text_pair=text_pair,