ericmelz committed on
Commit
cd84f60
·
verified ·
1 Parent(s): 7b7a2ef

Training in progress, step 125

Browse files
Files changed (4) hide show
  1. README.md +4 -3
  2. model.safetensors +1 -1
  3. tokenizer.json +1 -6
  4. training_args.bin +2 -2
README.md CHANGED
@@ -4,8 +4,8 @@ library_name: transformers
4
  model_name: mistral-supervised
5
  tags:
6
  - generated_from_trainer
7
- - trl
8
  - sft
 
9
  licence: license
10
  ---
11
 
@@ -27,13 +27,14 @@ print(output["generated_text"])
27
 
28
  ## Training procedure
29
 
 
30
 
31
 
32
  This model was trained with SFT.
33
 
34
  ### Framework versions
35
 
36
- - TRL: 0.12.0
37
  - Transformers: 4.54.0
38
  - Pytorch: 2.7.1
39
  - Datasets: 4.0.0
@@ -48,7 +49,7 @@ Cite TRL as:
48
  ```bibtex
49
  @misc{vonwerra2022trl,
50
  title = {{TRL: Transformer Reinforcement Learning}},
51
- author = {Leandro von Werra and Younes Belkada and Lewis Tunstall and Edward Beeching and Tristan Thrush and Nathan Lambert and Shengyi Huang and Kashif Rasul and Quentin Gallouédec},
52
  year = 2020,
53
  journal = {GitHub repository},
54
  publisher = {GitHub},
 
4
  model_name: mistral-supervised
5
  tags:
6
  - generated_from_trainer
 
7
  - sft
8
+ - trl
9
  licence: license
10
  ---
11
 
 
27
 
28
  ## Training procedure
29
 
30
+
31
 
32
 
33
  This model was trained with SFT.
34
 
35
  ### Framework versions
36
 
37
+ - TRL: 0.20.0
38
  - Transformers: 4.54.0
39
  - Pytorch: 2.7.1
40
  - Datasets: 4.0.0
 
49
  ```bibtex
50
  @misc{vonwerra2022trl,
51
  title = {{TRL: Transformer Reinforcement Learning}},
52
+ author = {Leandro von Werra and Younes Belkada and Lewis Tunstall and Edward Beeching and Tristan Thrush and Nathan Lambert and Shengyi Huang and Kashif Rasul and Quentin Gallou{\'e}dec},
53
  year = 2020,
54
  journal = {GitHub repository},
55
  publisher = {GitHub},
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:98f5ae2aad1cdd22c6ee19f0df9ef9f79f4537e1d22d80056d9474550072f877
3
  size 338197712
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0299c3d0a1274718f7072c15573620fe605875f8d06e2c221d0bffe67685eb19
3
  size 338197712
tokenizer.json CHANGED
@@ -1,11 +1,6 @@
1
  {
2
  "version": "1.0",
3
- "truncation": {
4
- "direction": "Right",
5
- "max_length": 512,
6
- "strategy": "LongestFirst",
7
- "stride": 0
8
- },
9
  "padding": null,
10
  "added_tokens": [
11
  {
 
1
  {
2
  "version": "1.0",
3
+ "truncation": null,
 
 
 
 
 
4
  "padding": null,
5
  "added_tokens": [
6
  {
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b2229bae4bb325b571e23eafc16b133a7b62c79e3f9994ca8a140e5ed1efc65a
3
- size 5969
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a4cbc2c8f0f687165bfcbcc5879bac2fe8161afd799e83f593608ff9a333d41
3
+ size 6097