Thrillcrazyer committed on
Commit
a6045bb
·
verified ·
1 Parent(s): 2518de8

step 10000

Browse files
Files changed (3) hide show
  1. config.json +3 -0
  2. model.safetensors +2 -2
  3. tokenizer_config.json +1 -1
config.json CHANGED
@@ -87,6 +87,7 @@
87
  "vocab_size": 151936
88
  },
89
  "base_model_name_or_path": "Qwen/Qwen3-8B",
 
90
  "decoder_layer_indices": [
91
  35
92
  ],
@@ -100,8 +101,10 @@
100
  6,
101
  7
102
  ],
 
103
  "hidden_size": 4096,
104
  "model_type": "lds",
 
105
  "q_threshold": 0.9,
106
  "reasoning_layer_indices": [
107
  8,
 
87
  "vocab_size": 151936
88
  },
89
  "base_model_name_or_path": "Qwen/Qwen3-8B",
90
+ "convergence_epsilon": 0.01,
91
  "decoder_layer_indices": [
92
  35
93
  ],
 
101
  6,
102
  7
103
  ],
104
+ "halting_strategy": "threshold",
105
  "hidden_size": 4096,
106
  "model_type": "lds",
107
+ "q_eval_interval": 1,
108
  "q_threshold": 0.9,
109
  "reasoning_layer_indices": [
110
  8,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ac289ef85ce448872b34d79b622ed497a03cf8df6d6f06bdaacd9110f3be7bf2
3
- size 16389989668
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2713b65854a2625f702b4f5cdb74199cfca4cea544e1c6390bfa438f5e0b5f1b
3
+ size 16385754482
tokenizer_config.json CHANGED
@@ -20,7 +20,7 @@
20
  "<|image_pad|>",
21
  "<|video_pad|>"
22
  ],
23
- "is_local": false,
24
  "model_max_length": 131072,
25
  "pad_token": "<|endoftext|>",
26
  "split_special_tokens": false,
 
20
  "<|image_pad|>",
21
  "<|video_pad|>"
22
  ],
23
+ "is_local": true,
24
  "model_max_length": 131072,
25
  "pad_token": "<|endoftext|>",
26
  "split_special_tokens": false,