Upload folder using huggingface_hub
Browse files- .gitattributes +10 -0
- checkpoint-100000/config.json +23 -0
- checkpoint-100000/model.safetensors +3 -0
- checkpoint-100000/optimizer.pt +3 -0
- checkpoint-100000/rng_state.pth +0 -0
- checkpoint-100000/scheduler.pt +0 -0
- checkpoint-100000/trainer_state.json +3 -0
- checkpoint-100000/training_args.bin +0 -0
- checkpoint-98000/config.json +23 -0
- checkpoint-98000/model.safetensors +3 -0
- checkpoint-98000/optimizer.pt +3 -0
- checkpoint-98000/rng_state.pth +0 -0
- checkpoint-98000/scheduler.pt +0 -0
- checkpoint-98000/trainer_state.json +3 -0
- checkpoint-98000/training_args.bin +0 -0
- checkpoint-99000/config.json +23 -0
- checkpoint-99000/model.safetensors +3 -0
- checkpoint-99000/optimizer.pt +3 -0
- checkpoint-99000/rng_state.pth +0 -0
- checkpoint-99000/scheduler.pt +0 -0
- checkpoint-99000/trainer_state.json +3 -0
- checkpoint-99000/training_args.bin +0 -0
- final/config.json +23 -0
- final/model.safetensors +3 -0
- final/training_args.bin +0 -0
.gitattributes
ADDED
|
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
checkpoint-100000/model.safetensors filter=lfs diff=lfs merge=lfs -text
|
| 2 |
+
checkpoint-100000/optimizer.pt filter=lfs diff=lfs merge=lfs -text
|
| 3 |
+
checkpoint-100000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
| 4 |
+
checkpoint-98000/model.safetensors filter=lfs diff=lfs merge=lfs -text
|
| 5 |
+
checkpoint-98000/optimizer.pt filter=lfs diff=lfs merge=lfs -text
|
| 6 |
+
checkpoint-98000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
| 7 |
+
checkpoint-99000/model.safetensors filter=lfs diff=lfs merge=lfs -text
|
| 8 |
+
checkpoint-99000/optimizer.pt filter=lfs diff=lfs merge=lfs -text
|
| 9 |
+
checkpoint-99000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
| 10 |
+
final/model.safetensors filter=lfs diff=lfs merge=lfs -text
|
checkpoint-100000/config.json
ADDED
|
@@ -0,0 +1,23 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"architectures": [
|
| 3 |
+
"TokenSeparator"
|
| 4 |
+
],
|
| 5 |
+
"bos_token_id": 1024,
|
| 6 |
+
"codebook_decoder_layers": 4,
|
| 7 |
+
"codebook_size": 1024,
|
| 8 |
+
"d_model": 768,
|
| 9 |
+
"dim_feedforward": 3072,
|
| 10 |
+
"dropout": 0.1,
|
| 11 |
+
"dtype": "float32",
|
| 12 |
+
"latent_dim": 128,
|
| 13 |
+
"model_type": "token_separator",
|
| 14 |
+
"n_stems": 4,
|
| 15 |
+
"nhead": 8,
|
| 16 |
+
"num_layers": 8,
|
| 17 |
+
"predict_n_q": 16,
|
| 18 |
+
"rope_base": 10000.0,
|
| 19 |
+
"tie_codebook_embeddings": false,
|
| 20 |
+
"transformers_version": "5.2.0",
|
| 21 |
+
"use_cache": false,
|
| 22 |
+
"vocab_size": 1025
|
| 23 |
+
}
|
checkpoint-100000/model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7f53a7a99ddbd806ac277ba8f94e49e67b16e545f43dda58ddaad11ffdda64e7
|
| 3 |
+
size 869663248
|
checkpoint-100000/optimizer.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3feb28baf2bbfebebd75757f9e1aa20e3c32ab1fa36f1cd31ab08bebf804d919
|
| 3 |
+
size 1733303031
|
checkpoint-100000/rng_state.pth
ADDED
|
Binary file (14.6 kB). View file
|
|
|
checkpoint-100000/scheduler.pt
ADDED
|
Binary file (1.47 kB). View file
|
|
|
checkpoint-100000/trainer_state.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:61e4e8d08fb6f597dda054ef941c758dc2b1ab148ce2a804bd97ac7aabb96bd3
|
| 3 |
+
size 15930894
|
checkpoint-100000/training_args.bin
ADDED
|
Binary file (5.2 kB). View file
|
|
|
checkpoint-98000/config.json
ADDED
|
@@ -0,0 +1,23 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"architectures": [
|
| 3 |
+
"TokenSeparator"
|
| 4 |
+
],
|
| 5 |
+
"bos_token_id": 1024,
|
| 6 |
+
"codebook_decoder_layers": 4,
|
| 7 |
+
"codebook_size": 1024,
|
| 8 |
+
"d_model": 768,
|
| 9 |
+
"dim_feedforward": 3072,
|
| 10 |
+
"dropout": 0.1,
|
| 11 |
+
"dtype": "float32",
|
| 12 |
+
"latent_dim": 128,
|
| 13 |
+
"model_type": "token_separator",
|
| 14 |
+
"n_stems": 4,
|
| 15 |
+
"nhead": 8,
|
| 16 |
+
"num_layers": 8,
|
| 17 |
+
"predict_n_q": 16,
|
| 18 |
+
"rope_base": 10000.0,
|
| 19 |
+
"tie_codebook_embeddings": false,
|
| 20 |
+
"transformers_version": "5.2.0",
|
| 21 |
+
"use_cache": false,
|
| 22 |
+
"vocab_size": 1025
|
| 23 |
+
}
|
checkpoint-98000/model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:51626cc6522617ae017fa3e515db83050accaa3436b260fecba2fc6b1e7773aa
|
| 3 |
+
size 869663248
|
checkpoint-98000/optimizer.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:90de66e8cb2c29eb5246a2fac131f41fac7a809d1263817d010d28f22bb82c01
|
| 3 |
+
size 1733303031
|
checkpoint-98000/rng_state.pth
ADDED
|
Binary file (14.6 kB). View file
|
|
|
checkpoint-98000/scheduler.pt
ADDED
|
Binary file (1.47 kB). View file
|
|
|
checkpoint-98000/trainer_state.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5a9687d57682b34f76589421cc3601b01b9992c2e4d6800a62b6bc25312c13c2
|
| 3 |
+
size 15612171
|
checkpoint-98000/training_args.bin
ADDED
|
Binary file (5.2 kB). View file
|
|
|
checkpoint-99000/config.json
ADDED
|
@@ -0,0 +1,23 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"architectures": [
|
| 3 |
+
"TokenSeparator"
|
| 4 |
+
],
|
| 5 |
+
"bos_token_id": 1024,
|
| 6 |
+
"codebook_decoder_layers": 4,
|
| 7 |
+
"codebook_size": 1024,
|
| 8 |
+
"d_model": 768,
|
| 9 |
+
"dim_feedforward": 3072,
|
| 10 |
+
"dropout": 0.1,
|
| 11 |
+
"dtype": "float32",
|
| 12 |
+
"latent_dim": 128,
|
| 13 |
+
"model_type": "token_separator",
|
| 14 |
+
"n_stems": 4,
|
| 15 |
+
"nhead": 8,
|
| 16 |
+
"num_layers": 8,
|
| 17 |
+
"predict_n_q": 16,
|
| 18 |
+
"rope_base": 10000.0,
|
| 19 |
+
"tie_codebook_embeddings": false,
|
| 20 |
+
"transformers_version": "5.2.0",
|
| 21 |
+
"use_cache": false,
|
| 22 |
+
"vocab_size": 1025
|
| 23 |
+
}
|
checkpoint-99000/model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2f7ea9608a59c39021b2675e1295dd596eb9d31550d66024aebfc24eae2acfb6
|
| 3 |
+
size 869663248
|
checkpoint-99000/optimizer.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:43f8d3f3f2635fec669291d742d169d27359fdf2bc41c932974db1bb28f55259
|
| 3 |
+
size 1733303031
|
checkpoint-99000/rng_state.pth
ADDED
|
Binary file (14.6 kB). View file
|
|
|
checkpoint-99000/scheduler.pt
ADDED
|
Binary file (1.47 kB). View file
|
|
|
checkpoint-99000/trainer_state.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8b8c251c0a822ef1a2cb6c2b0780b766700409656adbdff4bf1a7388eeb0375e
|
| 3 |
+
size 15771582
|
checkpoint-99000/training_args.bin
ADDED
|
Binary file (5.2 kB). View file
|
|
|
final/config.json
ADDED
|
@@ -0,0 +1,23 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"architectures": [
|
| 3 |
+
"TokenSeparator"
|
| 4 |
+
],
|
| 5 |
+
"bos_token_id": 1024,
|
| 6 |
+
"codebook_decoder_layers": 4,
|
| 7 |
+
"codebook_size": 1024,
|
| 8 |
+
"d_model": 768,
|
| 9 |
+
"dim_feedforward": 3072,
|
| 10 |
+
"dropout": 0.1,
|
| 11 |
+
"dtype": "float32",
|
| 12 |
+
"latent_dim": 128,
|
| 13 |
+
"model_type": "token_separator",
|
| 14 |
+
"n_stems": 4,
|
| 15 |
+
"nhead": 8,
|
| 16 |
+
"num_layers": 8,
|
| 17 |
+
"predict_n_q": 16,
|
| 18 |
+
"rope_base": 10000.0,
|
| 19 |
+
"tie_codebook_embeddings": false,
|
| 20 |
+
"transformers_version": "5.2.0",
|
| 21 |
+
"use_cache": false,
|
| 22 |
+
"vocab_size": 1025
|
| 23 |
+
}
|
final/model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7f53a7a99ddbd806ac277ba8f94e49e67b16e545f43dda58ddaad11ffdda64e7
|
| 3 |
+
size 869663248
|
final/training_args.bin
ADDED
|
Binary file (5.2 kB). View file
|
|
|