cfei621 committed on
Commit
5f997c6
·
verified ·
1 Parent(s): 945c518

Training in progress, step 200

Browse files
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "/ibex/user/feic/pjs/open-r1-contradiction/checkpoints/snli/DS-8B-GRPO_ACC_TAG_REWARD_long",
3
  "architectures": [
4
  "LlamaForCausalLM"
5
  ],
 
1
  {
2
+ "_name_or_path": "/ibex/user/feic/pjs/model/DeepSeek-R1-Distill-Llama-8B",
3
  "architectures": [
4
  "LlamaForCausalLM"
5
  ],
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5d0dc4bc5cdccc232e22b20e8f4fd1a96b27e12948b26ae13ac1079213d5aa0a
3
  size 4976698672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db0170971e7648b745a09975e59c75427283896da07a9fb451a1ca0ac9a5fb26
3
  size 4976698672
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ad6a34f1064c7d236a4e95f1af6ed6010bba8c75d6b243bddf31a6ae6d0c8ca0
3
  size 4999802720
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c9fe5499f077d6851eaeddb70a6879bf00e234f239df68f7cbf12ff98074b7b
3
  size 4999802720
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:556ef7530a36b9b5ef0db55269b97fc2779ef0dc4178a5061f69fff67ae047b4
3
  size 4915916176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:367f91d19895f8f06ad29d02b7dc86a0e48b13a8c3340865ff029e472d364e6b
3
  size 4915916176
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d9696b1bc6913503c344d4197cf5c133944c2b686df33d0e1472e7aa2468076a
3
  size 1168138808
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afd6655080b1ae85c743cf2e447a32c5913e2679ef1fee479bcd64de5852db1a
3
  size 1168138808
tokenizer_config.json CHANGED
@@ -2058,12 +2058,8 @@
2058
  "eos_token": "<|end▁of▁sentence|>",
2059
  "extra_special_tokens": {},
2060
  "legacy": true,
2061
- "max_length": null,
2062
  "model_max_length": 16384,
2063
- "pad_to_multiple_of": null,
2064
  "pad_token": "<|end▁of▁sentence|>",
2065
- "pad_token_type_id": 0,
2066
- "padding_side": "left",
2067
  "sp_model_kwargs": {},
2068
  "tokenizer_class": "LlamaTokenizerFast",
2069
  "unk_token": null,
 
2058
  "eos_token": "<|end▁of▁sentence|>",
2059
  "extra_special_tokens": {},
2060
  "legacy": true,
 
2061
  "model_max_length": 16384,
 
2062
  "pad_token": "<|end▁of▁sentence|>",
 
 
2063
  "sp_model_kwargs": {},
2064
  "tokenizer_class": "LlamaTokenizerFast",
2065
  "unk_token": null,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d94a6951a2ceadb33aea5dca1c9a537d88932617cf6acf13bffed6c8bcec4831
3
- size 10424
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63cb48269b127dca2213b74960c06311204596d2ba66413d3d9cbec01819a1f1
3
+ size 10360