LH-Tech-AI's picture
Create run.sh
c592e63 verified
raw
history blame contribute delete
541 Bytes
# End-to-end pipeline: install dependencies, train the tokenizer and the model,
# run a sample inference, then evaluate the exported model with lm-eval.
#
# Usage: run from the directory containing train_tokenizer.py, train_model.py
# and inference.py. Takes no arguments. Written for POSIX sh so it works with
# both `sh run.sh` and `bash run.sh`.
#
# NOTE: `sed -i` without a suffix argument is GNU sed syntax; BSD/macOS sed
# needs `-i ''`.

# Stop at the first failing step (and on unset variables) so later stages never
# run against missing or stale artifacts.
set -eu

MODEL_DIR="Supra-Mini-v2-0.1m-FINAL"
CONFIG="${MODEL_DIR}/config.json"

# Rewrite the "max_position_embeddings" value in $CONFIG.
# Arguments: $1 - value currently in the file, $2 - value to write instead.
# A no-op if the file does not contain the $1 value.
set_max_positions() {
  sed -i "s/\"max_position_embeddings\": $1/\"max_position_embeddings\": $2/" "$CONFIG"
}

# Put the config back to the 256-position setting after evaluation.
restore_config() {
  set_max_positions 1024 256
}

pip install -q transformers datasets sentencepiece accelerate
python3 train_tokenizer.py
python3 train_model.py
python3 inference.py

# Install the evaluation harness before touching the config so the window in
# which config.json is modified stays as short as possible.
pip install lm-eval

if [ ! -f "$CONFIG" ]; then
  printf 'error: %s not found; did training produce the model directory?\n' "$CONFIG" >&2
  exit 1
fi

# The evaluation below is invoked with max_length=1024, so the config is
# temporarily raised from 256 to 1024 to match. The EXIT trap guarantees the
# value is restored even when lm_eval fails; the signal traps turn an
# interrupt into a normal exit so the EXIT trap also fires in shells that do
# not run it on signals.
trap restore_config EXIT
trap 'exit 130' INT
trap 'exit 143' TERM
set_max_positions 256 1024

lm_eval --model hf \
  --model_args "pretrained=./${MODEL_DIR},max_length=1024" \
  --tasks arc_easy,wikitext,blimp \
  --device cuda \
  --batch_size 16