File size: 531 Bytes
d17228e
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
# End-to-end pipeline: install dependencies, train the tokenizer and the
# model, run inference, then evaluate the final checkpoint with lm-eval.
#
# Abort on the first failing step (and on unset variables) so that later
# stages never run against missing or stale artifacts.
set -eu

readonly MODEL_DIR="Supra-Mini-0.1m-FINAL"
readonly CONFIG_JSON="${MODEL_DIR}/config.json"

# Rewrite the "max_position_embeddings" value in the checkpoint config.
# Arguments: $1 - value currently in the file, $2 - value to write.
# Note: `sed -i` without a suffix argument is the GNU form.
set_max_positions() {
  sed -i "s/\"max_position_embeddings\": $1/\"max_position_embeddings\": $2/" \
    "$CONFIG_JSON"
}

pip install -q transformers datasets sentencepiece accelerate
python3 train_tokenizer.py
python3 train_model.py
python3 inference.py

# The evaluation below is invoked with max_length=1024, so the config is
# temporarily patched from 256 to 1024 (presumably so the loaded model
# accepts that length -- confirm against train_model.py).
# The EXIT trap puts the original value back on every exit path: normal
# completion, a failing evaluation, or an interrupt (the signal trap turns
# the signal into a regular exit so the EXIT trap fires in any POSIX shell).
trap 'set_max_positions 1024 256' EXIT
trap 'exit 1' HUP INT TERM
set_max_positions 256 1024

pip install lm-eval
lm_eval --model hf \
  --model_args "pretrained=./${MODEL_DIR},max_length=1024" \
  --tasks arc_easy,wikitext,blimp \
  --device cuda \
  --batch_size 16