File size: 338 Bytes
0d86d1b
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
# Metadata for a prepared/tokenized dataset: sequence limit, tokenizer
# special-token assignments, and overall size figures.
# NOTE(review): the consumer of this file is not visible here; key meanings
# noted below are inferred from names unless stated otherwise — confirm.

# Maximum sequence length; presumably counted in tokens — TODO confirm.
max_seq_len: 4096
tokenizer_info:
  # Marker strings delimiting parts of a sample. Presumably boq/eoq =
  # begin/end of question and eoa = end of answer — verify against the loader.
  boq: <|im_start|>
  # Maps each of four condition names (cot, direct, noisy, synth) to a
  # distinct special-token string.
  # NOTE(review): these strings look like pre-existing tokenizer special
  # tokens repurposed as condition tags — confirm they are not also needed
  # for their original purpose.
  condition_mapping:
    cot: <|object_ref_end|>
    direct: <|object_ref_start|>
    noisy: <|quad_start|>
    synth: <|quad_end|>
  eoa: <|box_end|>
  eoq: <|im_end|>
  # Absolute, machine-specific path; it will not resolve on a host that
  # lacks this directory layout.
  tokenizer_path: /home/work/.data/hrm_text_prepared/sft_swe_glm_mix_v1
# Overall size of the prepared data; unit (tokens vs. bytes) is not stated
# here — TODO confirm.
total_length: 251170780
# 131072 = 2**17. Presumably the tokenizer/embedding vocabulary size.
vocab_size: 131072