Move Llama-2-7b-chat-hf checkpoints under model folder
Browse files. This view is limited to 50 files because it contains too many changes. · See raw diff
- .gitattributes +3 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/DynamicPO/adapter_config.json +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/DynamicPO/adapter_model.safetensors +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/DynamicPO/eval.log +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/DynamicPO/optimizer.pt +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/DynamicPO/rng_state_0.pth +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/DynamicPO/rng_state_1.pth +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/DynamicPO/rng_state_2.pth +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/DynamicPO/rng_state_3.pth +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/DynamicPO/scheduler.pt +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/DynamicPO/special_tokens_map.json +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/DynamicPO/tokenizer.json +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/DynamicPO/tokenizer.model +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/DynamicPO/tokenizer_config.json +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/DynamicPO/trainer_state.json +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/DynamicPO/training_args.bin +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/Vanilla/adapter_config.json +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/Vanilla/adapter_model.safetensors +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/Vanilla/eval.log +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/Vanilla/optimizer.pt +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/Vanilla/rng_state_0.pth +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/Vanilla/rng_state_1.pth +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/Vanilla/rng_state_2.pth +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/Vanilla/rng_state_3.pth +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/Vanilla/scheduler.pt +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/Vanilla/special_tokens_map.json +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/Vanilla/tokenizer.json +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/Vanilla/tokenizer.model +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/Vanilla/tokenizer_config.json +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/Vanilla/trainer_state.json +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/Vanilla/training_args.bin +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/MPPO/DynamicPO/adapter_config.json +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/MPPO/DynamicPO/adapter_model.safetensors +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/MPPO/DynamicPO/eval.log +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/MPPO/DynamicPO/optimizer.pt +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/MPPO/DynamicPO/rng_state_0.pth +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/MPPO/DynamicPO/rng_state_1.pth +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/MPPO/DynamicPO/rng_state_2.pth +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/MPPO/DynamicPO/rng_state_3.pth +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/MPPO/DynamicPO/scheduler.pt +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/MPPO/DynamicPO/special_tokens_map.json +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/MPPO/DynamicPO/tokenizer.json +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/MPPO/DynamicPO/tokenizer.model +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/MPPO/DynamicPO/tokenizer_config.json +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/MPPO/DynamicPO/trainer_state.json +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/MPPO/DynamicPO/training_args.bin +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/MPPO/Vanilla/adapter_config.json +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/MPPO/Vanilla/adapter_model.safetensors +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/MPPO/Vanilla/eval.log +0 -0
- {PO → Llama-2-7b-chat-hf/PO}/LastFM/MPPO/Vanilla/optimizer.pt +0 -0
.gitattributes
CHANGED
|
@@ -39,3 +39,6 @@ PO/LastFM/DynamicPO_SDPO/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
|
| 39 |
PO/LastFM/DMPO/DynamicPO/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
| 40 |
PO/LastFM/MPPO/DynamicPO/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
| 41 |
PO/LastFM/SDPO/DynamicPO/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
| 39 |
PO/LastFM/DMPO/DynamicPO/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
| 40 |
PO/LastFM/MPPO/DynamicPO/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
| 41 |
PO/LastFM/SDPO/DynamicPO/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
| 42 |
+
Llama-2-7b-chat-hf/PO/LastFM/DMPO/DynamicPO/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
| 43 |
+
Llama-2-7b-chat-hf/PO/LastFM/MPPO/DynamicPO/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
| 44 |
+
Llama-2-7b-chat-hf/PO/LastFM/SDPO/DynamicPO/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/DynamicPO/adapter_config.json
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/DynamicPO/adapter_model.safetensors
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/DynamicPO/eval.log
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/DynamicPO/optimizer.pt
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/DynamicPO/rng_state_0.pth
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/DynamicPO/rng_state_1.pth
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/DynamicPO/rng_state_2.pth
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/DynamicPO/rng_state_3.pth
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/DynamicPO/scheduler.pt
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/DynamicPO/special_tokens_map.json
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/DynamicPO/tokenizer.json
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/DynamicPO/tokenizer.model
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/DynamicPO/tokenizer_config.json
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/DynamicPO/trainer_state.json
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/DynamicPO/training_args.bin
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/Vanilla/adapter_config.json
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/Vanilla/adapter_model.safetensors
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/Vanilla/eval.log
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/Vanilla/optimizer.pt
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/Vanilla/rng_state_0.pth
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/Vanilla/rng_state_1.pth
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/Vanilla/rng_state_2.pth
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/Vanilla/rng_state_3.pth
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/Vanilla/scheduler.pt
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/Vanilla/special_tokens_map.json
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/Vanilla/tokenizer.json
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/Vanilla/tokenizer.model
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/Vanilla/tokenizer_config.json
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/Vanilla/trainer_state.json
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/DMPO/Vanilla/training_args.bin
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/MPPO/DynamicPO/adapter_config.json
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/MPPO/DynamicPO/adapter_model.safetensors
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/MPPO/DynamicPO/eval.log
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/MPPO/DynamicPO/optimizer.pt
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/MPPO/DynamicPO/rng_state_0.pth
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/MPPO/DynamicPO/rng_state_1.pth
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/MPPO/DynamicPO/rng_state_2.pth
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/MPPO/DynamicPO/rng_state_3.pth
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/MPPO/DynamicPO/scheduler.pt
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/MPPO/DynamicPO/special_tokens_map.json
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/MPPO/DynamicPO/tokenizer.json
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/MPPO/DynamicPO/tokenizer.model
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/MPPO/DynamicPO/tokenizer_config.json
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/MPPO/DynamicPO/trainer_state.json
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/MPPO/DynamicPO/training_args.bin
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/MPPO/Vanilla/adapter_config.json
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/MPPO/Vanilla/adapter_model.safetensors
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/MPPO/Vanilla/eval.log
RENAMED
|
File without changes
|
{PO → Llama-2-7b-chat-hf/PO}/LastFM/MPPO/Vanilla/optimizer.pt
RENAMED
|
File without changes
|