cfei621 committed on
Commit
3988212
·
verified ·
1 Parent(s): ce0e22c

Training in progress, step 200

Browse files
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "/ibex/user/feic/pjs/open-r1-contradiction/checkpoints/GRPO_TAG_REWARD/checkpoint-1000",
3
  "architectures": [
4
  "LlamaForCausalLM"
5
  ],
 
1
  {
2
+ "_name_or_path": "/ibex/user/feic/pjs/model/DeepSeek-R1-Distill-Llama-8B",
3
  "architectures": [
4
  "LlamaForCausalLM"
5
  ],
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9691ef4705bf94b768c9d724342f9991a9272e041ee9ad1995c72bc6f6d7bc25
3
  size 4976698672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68fe9d253e5578dc4906bbc3dcee08790beab64d4ad9e2ecc5dfb8593d692594
3
  size 4976698672
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c9ded06ee83d6453337e0e24e1fa8bdbbc9058f1a67f6754e21b4df1c2f88508
3
  size 4999802720
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:767eefa4cf450a75e9219c81965bfc95edb87cf0525244a1a22f19d1fa5b92f6
3
  size 4999802720
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f7335aa7f385799571ad16e117cb3b61aef9177c7ae3af67fb991f527367287e
3
  size 4915916176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c09d7a08097b75a716505c2c2449eed83d1fbc55043c33a839bb19c13c4216e
3
  size 4915916176
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2cc1119ed4da032231c35db0e622782a76d8f5d4a4c5f47dcf95e96f583021ad
3
  size 1168138808
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2646d2d8ffab41b18573f0f0c6e3edc5d0cd0d41a7e831dfa4fee1b14097f87
3
  size 1168138808
tokenizer_config.json CHANGED
@@ -2058,12 +2058,8 @@
2058
  "eos_token": "<|end▁of▁sentence|>",
2059
  "extra_special_tokens": {},
2060
  "legacy": true,
2061
- "max_length": null,
2062
  "model_max_length": 16384,
2063
- "pad_to_multiple_of": null,
2064
  "pad_token": "<|end▁of▁sentence|>",
2065
- "pad_token_type_id": 0,
2066
- "padding_side": "left",
2067
  "sp_model_kwargs": {},
2068
  "tokenizer_class": "LlamaTokenizerFast",
2069
  "unk_token": null,
 
2058
  "eos_token": "<|end▁of▁sentence|>",
2059
  "extra_special_tokens": {},
2060
  "legacy": true,
 
2061
  "model_max_length": 16384,
 
2062
  "pad_token": "<|end▁of▁sentence|>",
 
 
2063
  "sp_model_kwargs": {},
2064
  "tokenizer_class": "LlamaTokenizerFast",
2065
  "unk_token": null,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2620dddb3d0da4771459207ee1239aad907614d798e8bcccddbfad25a9ab2ab8
3
- size 10296
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc32f04d2e66943f6d9563b1e5f851b71c2be337eb4b47bc28175b74ba13ab73
3
+ size 10360