Spaces:
Running on Zero
Running on Zero
Switch to LLM2Vec 3.1 pair to fix Space 401 on gated Llama 3.0
Browse files
kimodo/model/llm2vec/llm2vec.py
CHANGED
|
@@ -173,7 +173,10 @@ class LLM2Vec(nn.Module):
|
|
| 173 |
return cls(model=model, tokenizer=tokenizer, **config)
|
| 174 |
|
| 175 |
def prepare_for_tokenization(self, text):
|
| 176 |
-
if self.model.config._name_or_path == "meta-llama/Meta-Llama-3-8B-Instruct":
|
|
|
|
|
|
|
|
|
|
| 177 |
text = "<|start_header_id|>user<|end_header_id|>\n\n" + text.strip() + "<|eot_id|>"
|
| 178 |
return text
|
| 179 |
if self.model.config._name_or_path in [
|
|
|
|
| 173 |
return cls(model=model, tokenizer=tokenizer, **config)
|
| 174 |
|
| 175 |
def prepare_for_tokenization(self, text):
|
| 176 |
+
if self.model.config._name_or_path in [
|
| 177 |
+
"meta-llama/Meta-Llama-3-8B-Instruct",
|
| 178 |
+
"meta-llama/Meta-Llama-3.1-8B-Instruct",
|
| 179 |
+
]:
|
| 180 |
text = "<|start_header_id|>user<|end_header_id|>\n\n" + text.strip() + "<|eot_id|>"
|
| 181 |
return text
|
| 182 |
if self.model.config._name_or_path in [
|
kimodo/model/load_model.py
CHANGED
|
@@ -30,8 +30,8 @@ TEXT_ENCODER_PRESETS = {
|
|
| 30 |
"llm2vec": {
|
| 31 |
"target": "kimodo.model.LLM2VecEncoder",
|
| 32 |
"kwargs": {
|
| 33 |
-
"base_model_name_or_path": "McGill-NLP/LLM2Vec-Meta-Llama-3-8B-Instruct-mntp",
|
| 34 |
-
"peft_model_name_or_path": "McGill-NLP/LLM2Vec-Meta-Llama-3-8B-Instruct-mntp-supervised",
|
| 35 |
"dtype": "bfloat16",
|
| 36 |
"llm_dim": 4096,
|
| 37 |
},
|
|
|
|
| 30 |
"llm2vec": {
|
| 31 |
"target": "kimodo.model.LLM2VecEncoder",
|
| 32 |
"kwargs": {
|
| 33 |
+
"base_model_name_or_path": "McGill-NLP/LLM2Vec-Meta-Llama-31-8B-Instruct-mntp",
|
| 34 |
+
"peft_model_name_or_path": "McGill-NLP/LLM2Vec-Meta-Llama-31-8B-Instruct-mntp-supervised",
|
| 35 |
"dtype": "bfloat16",
|
| 36 |
"llm_dim": 4096,
|
| 37 |
},
|
kimodo/scripts/run_text_encoder_server.py
CHANGED
|
@@ -22,8 +22,8 @@ TEXT_ENCODER_PRESETS = {
|
|
| 22 |
"llm2vec": {
|
| 23 |
"target": "kimodo.model.LLM2VecEncoder",
|
| 24 |
"kwargs": {
|
| 25 |
-
"base_model_name_or_path": "McGill-NLP/LLM2Vec-Meta-Llama-3-8B-Instruct-mntp",
|
| 26 |
-
"peft_model_name_or_path": "McGill-NLP/LLM2Vec-Meta-Llama-3-8B-Instruct-mntp-supervised",
|
| 27 |
"dtype": "bfloat16",
|
| 28 |
"llm_dim": 4096,
|
| 29 |
},
|
|
|
|
| 22 |
"llm2vec": {
|
| 23 |
"target": "kimodo.model.LLM2VecEncoder",
|
| 24 |
"kwargs": {
|
| 25 |
+
"base_model_name_or_path": "McGill-NLP/LLM2Vec-Meta-Llama-31-8B-Instruct-mntp",
|
| 26 |
+
"peft_model_name_or_path": "McGill-NLP/LLM2Vec-Meta-Llama-31-8B-Instruct-mntp-supervised",
|
| 27 |
"dtype": "bfloat16",
|
| 28 |
"llm_dim": 4096,
|
| 29 |
},
|
kimodo/scripts/text_encoder_health.py
CHANGED
|
@@ -12,8 +12,8 @@ from transformers import AutoConfig
|
|
| 12 |
|
| 13 |
TEXT_ENCODER_PRESETS = {
|
| 14 |
"llm2vec": {
|
| 15 |
-
"base_model_name_or_path": "McGill-NLP/LLM2Vec-Meta-Llama-3-8B-Instruct-mntp",
|
| 16 |
-
"peft_model_name_or_path": "McGill-NLP/LLM2Vec-Meta-Llama-3-8B-Instruct-mntp-supervised",
|
| 17 |
}
|
| 18 |
}
|
| 19 |
|
|
|
|
| 12 |
|
| 13 |
TEXT_ENCODER_PRESETS = {
|
| 14 |
"llm2vec": {
|
| 15 |
+
"base_model_name_or_path": "McGill-NLP/LLM2Vec-Meta-Llama-31-8B-Instruct-mntp",
|
| 16 |
+
"peft_model_name_or_path": "McGill-NLP/LLM2Vec-Meta-Llama-31-8B-Instruct-mntp-supervised",
|
| 17 |
}
|
| 18 |
}
|
| 19 |
|