Add files using upload-large-folder tool
Browse files
- README.md +31 -0
- config.json +0 -0
- generation_config.json +9 -0
- model-00002-of-00185.safetensors +3 -0
- model-00006-of-00185.safetensors +3 -0
- model-00032-of-00185.safetensors +3 -0
- model-00063-of-00185.safetensors +3 -0
- model-00072-of-00185.safetensors +3 -0
- model-00084-of-00185.safetensors +3 -0
- model-00093-of-00185.safetensors +3 -0
- model-00095-of-00185.safetensors +3 -0
- model-00101-of-00185.safetensors +3 -0
- model-00107-of-00185.safetensors +3 -0
- model-00108-of-00185.safetensors +3 -0
- model-00111-of-00185.safetensors +3 -0
- model-00120-of-00185.safetensors +3 -0
- model-00132-of-00185.safetensors +3 -0
- model.safetensors.index.json +0 -0
- tokenizer.json +0 -0
- tokenizer_config.json +14 -0
README.md
ADDED
|
@@ -0,0 +1,31 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
---
|
| 2 |
+
language: en
|
| 3 |
+
tags:
|
| 4 |
+
- mlx
|
| 5 |
+
pipeline_tag: text-generation
|
| 6 |
+
library_name: mlx
|
| 7 |
+
---
|
| 8 |
+
|
| 9 |
+
# mlx-community/DeepSeek-V4-Pro-8bit
|
| 10 |
+
|
| 11 |
+
## Use with mlx
|
| 12 |
+
|
| 13 |
+
```bash
|
| 14 |
+
pip install mlx-lm
|
| 15 |
+
```
|
| 16 |
+
|
| 17 |
+
```python
|
| 18 |
+
from mlx_lm import load, generate
|
| 19 |
+
|
| 20 |
+
model, tokenizer = load("mlx-community/DeepSeek-V4-Pro-8bit")
|
| 21 |
+
|
| 22 |
+
prompt = "hello"
|
| 23 |
+
|
| 24 |
+
if tokenizer.chat_template is not None:
|
| 25 |
+
    messages = [{"role": "user", "content": prompt}]
|
| 26 |
+
    prompt = tokenizer.apply_chat_template(
|
| 27 |
+
        messages, add_generation_prompt=True, return_dict=False,
|
| 28 |
+
    )
|
| 29 |
+
|
| 30 |
+
response = generate(model, tokenizer, prompt=prompt, verbose=True)
|
| 31 |
+
```
|
config.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
generation_config.json
ADDED
|
@@ -0,0 +1,9 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_from_model_config": true,
|
| 3 |
+
"bos_token_id": 0,
|
| 4 |
+
"eos_token_id": 1,
|
| 5 |
+
"do_sample": true,
|
| 6 |
+
"temperature": 1.0,
|
| 7 |
+
"top_p": 1.0,
|
| 8 |
+
"transformers_version": "4.46.3"
|
| 9 |
+
}
|
model-00002-of-00185.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4192daf82fc47c5922bf83acb9c06cb1aba4f7708a10c06359933300db3a90f1
|
| 3 |
+
size 4492099867
|
model-00006-of-00185.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:80962f49af725a1571ba4632cd5c8c51b162fcd5001cac3d5b353cf7b8a43f92
|
| 3 |
+
size 4492099863
|
model-00032-of-00185.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b4ab7a0727609326effa7e951e54246cefe7b6944e705ae8930805e9124f7830
|
| 3 |
+
size 4492099869
|
model-00063-of-00185.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d3fb510d6a5722a7a32578609f7fd83a83b5a856b6eb1eef8b5f3bd3d814ae27
|
| 3 |
+
size 4492099865
|
model-00072-of-00185.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4c901730c0aaec347e31d62de859ab9ef1d7c953d9c197662df548e9f51ac094
|
| 3 |
+
size 4492099865
|
model-00084-of-00185.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a02515370fc132666a4505daeef5439e6407dcf2701564ddf879ed69b2c4aadc
|
| 3 |
+
size 4492099865
|
model-00093-of-00185.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9e02f27b69e4fa1917ae301562d42f17e7672922b91df2f3afc695084b3e59d2
|
| 3 |
+
size 4492099865
|
model-00095-of-00185.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1da9d4b06c5906071120147b01a57d08c28b647e14a00eaac5650d0caea0ecd9
|
| 3 |
+
size 4492099869
|
model-00101-of-00185.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2e814b4b707d9f23b36e453bda13c33fcba584225f84d37ae43e7c915adec488
|
| 3 |
+
size 4492099869
|
model-00107-of-00185.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b5353d64ceab4bec393d4382c150151f37a24fde5a2ad3b918ea1b05174d759b
|
| 3 |
+
size 4492099869
|
model-00108-of-00185.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4c208a5189f287e5905818645069c177a4dec4abc32607336b1e176476fedf5f
|
| 3 |
+
size 4492099865
|
model-00111-of-00185.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:adef5d61483bb84480ce245c2f03ff3611e3b7b765d22106f09a30283af48fd8
|
| 3 |
+
size 4492099865
|
model-00120-of-00185.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:688b3cc2cb17ab9127150575315e050d961a571d68140ea80ea62f32d1c80272
|
| 3 |
+
size 4492099865
|
model-00132-of-00185.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f08a8b185921c827ab4f633e48c76ce891e24842766e49d73d00e0b8c504c2e5
|
| 3 |
+
size 4492099865
|
model.safetensors.index.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
tokenizer.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
tokenizer_config.json
ADDED
|
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"backend": "tokenizers",
|
| 3 |
+
"bos_token": "<|begin▁of▁sentence|>",
|
| 4 |
+
"clean_up_tokenization_spaces": false,
|
| 5 |
+
"eos_token": "<|end▁of▁sentence|>",
|
| 6 |
+
"is_local": true,
|
| 7 |
+
"legacy": true,
|
| 8 |
+
"local_files_only": false,
|
| 9 |
+
"model_max_length": 1048576,
|
| 10 |
+
"pad_token": "<|end▁of▁sentence|>",
|
| 11 |
+
"sp_model_kwargs": {},
|
| 12 |
+
"tokenizer_class": "TokenizersBackend",
|
| 13 |
+
"unk_token": null
|
| 14 |
+
}
|