cfei621 committed on
Commit
b00c9ad
·
verified ·
1 Parent(s): 835faae

Training in progress, step 800

Browse files
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "/ibex/user/feic/pjs/model/DeepSeek-R1-Distill-Llama-8B",
3
  "architectures": [
4
  "LlamaForCausalLM"
5
  ],
 
1
  {
2
+ "_name_or_path": "/ibex/user/feic/pjs/open-r1-contradiction/checkpoints/snli/DS-8B-GRPO_ACC_TAG_REWARD_long",
3
  "architectures": [
4
  "LlamaForCausalLM"
5
  ],
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aefef14d0fa0e535974078bf6bcb49d7c8df57a6e51ee5d75ca97b8a3d8109e2
3
  size 4976698672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31c9dd0555d30aedf359759e4aa4a06a05db8aa8a5fe5ca3bb2c3a0b90590d42
3
  size 4976698672
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c4e3bd4d81263468dbae202ea58905de4fc00db4f1b0c01b0917b153dfa77e67
3
  size 4999802720
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c9b68666116e1dc43aa39d452218a365e888899f734f81e64fe9c71de8aa0503
3
  size 4999802720
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0feb6e3fd440cd1b7db08ccf066c480172161987639690dda3ca7680c930f6ef
3
  size 4915916176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c0bfaeb2e0f5cd6f33c6171d2ae088b64a1d07d10f6c735e739c31a09d85fe61
3
  size 4915916176
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:646ec58c6e3cd775c7ec73fa0c632e2d155fb68dadb8ec308cd29d06f7567d9a
3
  size 1168138808
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:594804758e5dc5ba1575cd4a6e406a209e24e44e9e5718b8e554b06176065cda
3
  size 1168138808
tokenizer_config.json CHANGED
@@ -2058,8 +2058,12 @@
2058
  "eos_token": "<|end▁of▁sentence|>",
2059
  "extra_special_tokens": {},
2060
  "legacy": true,
 
2061
  "model_max_length": 16384,
 
2062
  "pad_token": "<|end▁of▁sentence|>",
 
 
2063
  "sp_model_kwargs": {},
2064
  "tokenizer_class": "LlamaTokenizerFast",
2065
  "unk_token": null,
 
2058
  "eos_token": "<|end▁of▁sentence|>",
2059
  "extra_special_tokens": {},
2060
  "legacy": true,
2061
+ "max_length": null,
2062
  "model_max_length": 16384,
2063
+ "pad_to_multiple_of": null,
2064
  "pad_token": "<|end▁of▁sentence|>",
2065
+ "pad_token_type_id": 0,
2066
+ "padding_side": "left",
2067
  "sp_model_kwargs": {},
2068
  "tokenizer_class": "LlamaTokenizerFast",
2069
  "unk_token": null,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3d9630a15b0336db5b9d12d7dfd6aef2ed1a75cba61387c2640a6352bbc739d1
3
- size 10360
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d94a6951a2ceadb33aea5dca1c9a537d88932617cf6acf13bffed6c8bcec4831
3
+ size 10424