Leon299 committed on
Commit
4b5d3f8
·
verified ·
1 Parent(s): 9bdba73

Upload folder using huggingface_hub

Browse files
.gitattributes ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ checkpoint-100000/model.safetensors filter=lfs diff=lfs merge=lfs -text
2
+ checkpoint-100000/optimizer.pt filter=lfs diff=lfs merge=lfs -text
3
+ checkpoint-100000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
4
+ checkpoint-98000/model.safetensors filter=lfs diff=lfs merge=lfs -text
5
+ checkpoint-98000/optimizer.pt filter=lfs diff=lfs merge=lfs -text
6
+ checkpoint-98000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
7
+ checkpoint-99000/model.safetensors filter=lfs diff=lfs merge=lfs -text
8
+ checkpoint-99000/optimizer.pt filter=lfs diff=lfs merge=lfs -text
9
+ checkpoint-99000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
10
+ final/model.safetensors filter=lfs diff=lfs merge=lfs -text
checkpoint-100000/config.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "TokenSeparator"
4
+ ],
5
+ "bos_token_id": 1024,
6
+ "codebook_decoder_layers": 4,
7
+ "codebook_size": 1024,
8
+ "d_model": 768,
9
+ "dim_feedforward": 3072,
10
+ "dropout": 0.1,
11
+ "dtype": "float32",
12
+ "latent_dim": 128,
13
+ "model_type": "token_separator",
14
+ "n_stems": 4,
15
+ "nhead": 8,
16
+ "num_layers": 8,
17
+ "predict_n_q": 16,
18
+ "rope_base": 10000.0,
19
+ "tie_codebook_embeddings": false,
20
+ "transformers_version": "5.2.0",
21
+ "use_cache": false,
22
+ "vocab_size": 1025
23
+ }
checkpoint-100000/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f53a7a99ddbd806ac277ba8f94e49e67b16e545f43dda58ddaad11ffdda64e7
3
+ size 869663248
checkpoint-100000/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3feb28baf2bbfebebd75757f9e1aa20e3c32ab1fa36f1cd31ab08bebf804d919
3
+ size 1733303031
checkpoint-100000/rng_state.pth ADDED
Binary file (14.6 kB). View file
 
checkpoint-100000/scheduler.pt ADDED
Binary file (1.47 kB). View file
 
checkpoint-100000/trainer_state.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61e4e8d08fb6f597dda054ef941c758dc2b1ab148ce2a804bd97ac7aabb96bd3
3
+ size 15930894
checkpoint-100000/training_args.bin ADDED
Binary file (5.2 kB). View file
 
checkpoint-98000/config.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "TokenSeparator"
4
+ ],
5
+ "bos_token_id": 1024,
6
+ "codebook_decoder_layers": 4,
7
+ "codebook_size": 1024,
8
+ "d_model": 768,
9
+ "dim_feedforward": 3072,
10
+ "dropout": 0.1,
11
+ "dtype": "float32",
12
+ "latent_dim": 128,
13
+ "model_type": "token_separator",
14
+ "n_stems": 4,
15
+ "nhead": 8,
16
+ "num_layers": 8,
17
+ "predict_n_q": 16,
18
+ "rope_base": 10000.0,
19
+ "tie_codebook_embeddings": false,
20
+ "transformers_version": "5.2.0",
21
+ "use_cache": false,
22
+ "vocab_size": 1025
23
+ }
checkpoint-98000/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51626cc6522617ae017fa3e515db83050accaa3436b260fecba2fc6b1e7773aa
3
+ size 869663248
checkpoint-98000/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90de66e8cb2c29eb5246a2fac131f41fac7a809d1263817d010d28f22bb82c01
3
+ size 1733303031
checkpoint-98000/rng_state.pth ADDED
Binary file (14.6 kB). View file
 
checkpoint-98000/scheduler.pt ADDED
Binary file (1.47 kB). View file
 
checkpoint-98000/trainer_state.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a9687d57682b34f76589421cc3601b01b9992c2e4d6800a62b6bc25312c13c2
3
+ size 15612171
checkpoint-98000/training_args.bin ADDED
Binary file (5.2 kB). View file
 
checkpoint-99000/config.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "TokenSeparator"
4
+ ],
5
+ "bos_token_id": 1024,
6
+ "codebook_decoder_layers": 4,
7
+ "codebook_size": 1024,
8
+ "d_model": 768,
9
+ "dim_feedforward": 3072,
10
+ "dropout": 0.1,
11
+ "dtype": "float32",
12
+ "latent_dim": 128,
13
+ "model_type": "token_separator",
14
+ "n_stems": 4,
15
+ "nhead": 8,
16
+ "num_layers": 8,
17
+ "predict_n_q": 16,
18
+ "rope_base": 10000.0,
19
+ "tie_codebook_embeddings": false,
20
+ "transformers_version": "5.2.0",
21
+ "use_cache": false,
22
+ "vocab_size": 1025
23
+ }
checkpoint-99000/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f7ea9608a59c39021b2675e1295dd596eb9d31550d66024aebfc24eae2acfb6
3
+ size 869663248
checkpoint-99000/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43f8d3f3f2635fec669291d742d169d27359fdf2bc41c932974db1bb28f55259
3
+ size 1733303031
checkpoint-99000/rng_state.pth ADDED
Binary file (14.6 kB). View file
 
checkpoint-99000/scheduler.pt ADDED
Binary file (1.47 kB). View file
 
checkpoint-99000/trainer_state.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b8c251c0a822ef1a2cb6c2b0780b766700409656adbdff4bf1a7388eeb0375e
3
+ size 15771582
checkpoint-99000/training_args.bin ADDED
Binary file (5.2 kB). View file
 
final/config.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "TokenSeparator"
4
+ ],
5
+ "bos_token_id": 1024,
6
+ "codebook_decoder_layers": 4,
7
+ "codebook_size": 1024,
8
+ "d_model": 768,
9
+ "dim_feedforward": 3072,
10
+ "dropout": 0.1,
11
+ "dtype": "float32",
12
+ "latent_dim": 128,
13
+ "model_type": "token_separator",
14
+ "n_stems": 4,
15
+ "nhead": 8,
16
+ "num_layers": 8,
17
+ "predict_n_q": 16,
18
+ "rope_base": 10000.0,
19
+ "tie_codebook_embeddings": false,
20
+ "transformers_version": "5.2.0",
21
+ "use_cache": false,
22
+ "vocab_size": 1025
23
+ }
final/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f53a7a99ddbd806ac277ba8f94e49e67b16e545f43dda58ddaad11ffdda64e7
3
+ size 869663248
final/training_args.bin ADDED
Binary file (5.2 kB). View file