diff --git a/.gitattributes b/.gitattributes index 99ea07d5f8f943f08d3cf2ca9a5accd7d1febe91..dcae67507c21a17788f088f2f33ba4a0c3f3dd8a 100644 --- a/.gitattributes +++ b/.gitattributes @@ -36,3 +36,6 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text PO/LastFM/DynamicPO_DMPO/trainer_state.json filter=lfs diff=lfs merge=lfs -text PO/LastFM/DynamicPO_MPPO/trainer_state.json filter=lfs diff=lfs merge=lfs -text PO/LastFM/DynamicPO_SDPO/trainer_state.json filter=lfs diff=lfs merge=lfs -text +PO/LastFM/DMPO/DynamicPO/trainer_state.json filter=lfs diff=lfs merge=lfs -text +PO/LastFM/MPPO/DynamicPO/trainer_state.json filter=lfs diff=lfs merge=lfs -text +PO/LastFM/SDPO/DynamicPO/trainer_state.json filter=lfs diff=lfs merge=lfs -text diff --git a/PO/LastFM/DynamicPO_DMPO/adapter_config.json b/PO/LastFM/DMPO/DynamicPO/adapter_config.json similarity index 100% rename from PO/LastFM/DynamicPO_DMPO/adapter_config.json rename to PO/LastFM/DMPO/DynamicPO/adapter_config.json diff --git a/PO/LastFM/DynamicPO_DMPO/adapter_model.safetensors b/PO/LastFM/DMPO/DynamicPO/adapter_model.safetensors similarity index 100% rename from PO/LastFM/DynamicPO_DMPO/adapter_model.safetensors rename to PO/LastFM/DMPO/DynamicPO/adapter_model.safetensors diff --git a/PO/LastFM/DynamicPO_DMPO/eval.log b/PO/LastFM/DMPO/DynamicPO/eval.log similarity index 100% rename from PO/LastFM/DynamicPO_DMPO/eval.log rename to PO/LastFM/DMPO/DynamicPO/eval.log diff --git a/PO/LastFM/DynamicPO_DMPO/optimizer.pt b/PO/LastFM/DMPO/DynamicPO/optimizer.pt similarity index 100% rename from PO/LastFM/DynamicPO_DMPO/optimizer.pt rename to PO/LastFM/DMPO/DynamicPO/optimizer.pt diff --git a/PO/LastFM/DynamicPO_DMPO/rng_state_0.pth b/PO/LastFM/DMPO/DynamicPO/rng_state_0.pth similarity index 100% rename from PO/LastFM/DynamicPO_DMPO/rng_state_0.pth rename to PO/LastFM/DMPO/DynamicPO/rng_state_0.pth diff --git a/PO/LastFM/DynamicPO_DMPO/rng_state_1.pth b/PO/LastFM/DMPO/DynamicPO/rng_state_1.pth similarity index 100% rename from PO/LastFM/DynamicPO_DMPO/rng_state_1.pth rename to PO/LastFM/DMPO/DynamicPO/rng_state_1.pth diff --git a/PO/LastFM/DynamicPO_DMPO/rng_state_2.pth b/PO/LastFM/DMPO/DynamicPO/rng_state_2.pth similarity index 100% rename from PO/LastFM/DynamicPO_DMPO/rng_state_2.pth rename to PO/LastFM/DMPO/DynamicPO/rng_state_2.pth diff --git a/PO/LastFM/DynamicPO_DMPO/rng_state_3.pth b/PO/LastFM/DMPO/DynamicPO/rng_state_3.pth similarity index 100% rename from PO/LastFM/DynamicPO_DMPO/rng_state_3.pth rename to PO/LastFM/DMPO/DynamicPO/rng_state_3.pth diff --git a/PO/LastFM/DynamicPO_DMPO/scheduler.pt b/PO/LastFM/DMPO/DynamicPO/scheduler.pt similarity index 100% rename from PO/LastFM/DynamicPO_DMPO/scheduler.pt rename to PO/LastFM/DMPO/DynamicPO/scheduler.pt diff --git a/PO/LastFM/DMPO/special_tokens_map.json b/PO/LastFM/DMPO/DynamicPO/special_tokens_map.json similarity index 100% rename from PO/LastFM/DMPO/special_tokens_map.json rename to PO/LastFM/DMPO/DynamicPO/special_tokens_map.json diff --git a/PO/LastFM/DMPO/tokenizer.json b/PO/LastFM/DMPO/DynamicPO/tokenizer.json similarity index 100% rename from PO/LastFM/DMPO/tokenizer.json rename to PO/LastFM/DMPO/DynamicPO/tokenizer.json diff --git a/PO/LastFM/DMPO/tokenizer.model b/PO/LastFM/DMPO/DynamicPO/tokenizer.model similarity index 100% rename from PO/LastFM/DMPO/tokenizer.model rename to PO/LastFM/DMPO/DynamicPO/tokenizer.model diff --git a/PO/LastFM/DMPO/tokenizer_config.json b/PO/LastFM/DMPO/DynamicPO/tokenizer_config.json similarity index 100% rename from PO/LastFM/DMPO/tokenizer_config.json rename to PO/LastFM/DMPO/DynamicPO/tokenizer_config.json diff --git a/PO/LastFM/DynamicPO_DMPO/trainer_state.json b/PO/LastFM/DMPO/DynamicPO/trainer_state.json similarity index 100% rename from PO/LastFM/DynamicPO_DMPO/trainer_state.json rename to PO/LastFM/DMPO/DynamicPO/trainer_state.json diff --git a/PO/LastFM/DynamicPO_DMPO/training_args.bin b/PO/LastFM/DMPO/DynamicPO/training_args.bin similarity index 100% rename from PO/LastFM/DynamicPO_DMPO/training_args.bin rename to PO/LastFM/DMPO/DynamicPO/training_args.bin diff --git a/PO/LastFM/DMPO/adapter_config.json b/PO/LastFM/DMPO/Vanilla/adapter_config.json similarity index 100% rename from PO/LastFM/DMPO/adapter_config.json rename to PO/LastFM/DMPO/Vanilla/adapter_config.json diff --git a/PO/LastFM/DMPO/adapter_model.safetensors b/PO/LastFM/DMPO/Vanilla/adapter_model.safetensors similarity index 100% rename from PO/LastFM/DMPO/adapter_model.safetensors rename to PO/LastFM/DMPO/Vanilla/adapter_model.safetensors diff --git a/PO/LastFM/DMPO/eval.log b/PO/LastFM/DMPO/Vanilla/eval.log similarity index 100% rename from PO/LastFM/DMPO/eval.log rename to PO/LastFM/DMPO/Vanilla/eval.log diff --git a/PO/LastFM/DMPO/optimizer.pt b/PO/LastFM/DMPO/Vanilla/optimizer.pt similarity index 100% rename from PO/LastFM/DMPO/optimizer.pt rename to PO/LastFM/DMPO/Vanilla/optimizer.pt diff --git a/PO/LastFM/DMPO/rng_state_0.pth b/PO/LastFM/DMPO/Vanilla/rng_state_0.pth similarity index 100% rename from PO/LastFM/DMPO/rng_state_0.pth rename to PO/LastFM/DMPO/Vanilla/rng_state_0.pth diff --git a/PO/LastFM/DMPO/rng_state_1.pth b/PO/LastFM/DMPO/Vanilla/rng_state_1.pth similarity index 100% rename from PO/LastFM/DMPO/rng_state_1.pth rename to PO/LastFM/DMPO/Vanilla/rng_state_1.pth diff --git a/PO/LastFM/DMPO/rng_state_2.pth b/PO/LastFM/DMPO/Vanilla/rng_state_2.pth similarity index 100% rename from PO/LastFM/DMPO/rng_state_2.pth rename to PO/LastFM/DMPO/Vanilla/rng_state_2.pth diff --git a/PO/LastFM/DMPO/rng_state_3.pth b/PO/LastFM/DMPO/Vanilla/rng_state_3.pth similarity index 100% rename from PO/LastFM/DMPO/rng_state_3.pth rename to PO/LastFM/DMPO/Vanilla/rng_state_3.pth diff --git a/PO/LastFM/DMPO/scheduler.pt b/PO/LastFM/DMPO/Vanilla/scheduler.pt similarity index 100% rename from PO/LastFM/DMPO/scheduler.pt rename to PO/LastFM/DMPO/Vanilla/scheduler.pt diff --git a/PO/LastFM/DynamicPO_DMPO/special_tokens_map.json b/PO/LastFM/DMPO/Vanilla/special_tokens_map.json similarity index 100% rename from PO/LastFM/DynamicPO_DMPO/special_tokens_map.json rename to PO/LastFM/DMPO/Vanilla/special_tokens_map.json diff --git a/PO/LastFM/DynamicPO_DMPO/tokenizer.json b/PO/LastFM/DMPO/Vanilla/tokenizer.json similarity index 100% rename from PO/LastFM/DynamicPO_DMPO/tokenizer.json rename to PO/LastFM/DMPO/Vanilla/tokenizer.json diff --git a/PO/LastFM/DynamicPO_DMPO/tokenizer.model b/PO/LastFM/DMPO/Vanilla/tokenizer.model similarity index 100% rename from PO/LastFM/DynamicPO_DMPO/tokenizer.model rename to PO/LastFM/DMPO/Vanilla/tokenizer.model diff --git a/PO/LastFM/DynamicPO_DMPO/tokenizer_config.json b/PO/LastFM/DMPO/Vanilla/tokenizer_config.json similarity index 100% rename from PO/LastFM/DynamicPO_DMPO/tokenizer_config.json rename to PO/LastFM/DMPO/Vanilla/tokenizer_config.json diff --git a/PO/LastFM/DMPO/trainer_state.json b/PO/LastFM/DMPO/Vanilla/trainer_state.json similarity index 100% rename from PO/LastFM/DMPO/trainer_state.json rename to PO/LastFM/DMPO/Vanilla/trainer_state.json diff --git a/PO/LastFM/DMPO/training_args.bin b/PO/LastFM/DMPO/Vanilla/training_args.bin similarity index 100% rename from PO/LastFM/DMPO/training_args.bin rename to PO/LastFM/DMPO/Vanilla/training_args.bin diff --git a/PO/LastFM/DynamicPO_MPPO/adapter_config.json b/PO/LastFM/MPPO/DynamicPO/adapter_config.json similarity index 100% rename from PO/LastFM/DynamicPO_MPPO/adapter_config.json rename to PO/LastFM/MPPO/DynamicPO/adapter_config.json diff --git a/PO/LastFM/DynamicPO_MPPO/adapter_model.safetensors b/PO/LastFM/MPPO/DynamicPO/adapter_model.safetensors similarity index 100% rename from PO/LastFM/DynamicPO_MPPO/adapter_model.safetensors rename to PO/LastFM/MPPO/DynamicPO/adapter_model.safetensors diff --git a/PO/LastFM/DynamicPO_MPPO/eval.log b/PO/LastFM/MPPO/DynamicPO/eval.log similarity index 100% rename from PO/LastFM/DynamicPO_MPPO/eval.log rename to PO/LastFM/MPPO/DynamicPO/eval.log diff --git a/PO/LastFM/DynamicPO_MPPO/optimizer.pt b/PO/LastFM/MPPO/DynamicPO/optimizer.pt similarity index 100% rename from PO/LastFM/DynamicPO_MPPO/optimizer.pt rename to PO/LastFM/MPPO/DynamicPO/optimizer.pt diff --git a/PO/LastFM/DynamicPO_MPPO/rng_state_0.pth b/PO/LastFM/MPPO/DynamicPO/rng_state_0.pth similarity index 100% rename from PO/LastFM/DynamicPO_MPPO/rng_state_0.pth rename to PO/LastFM/MPPO/DynamicPO/rng_state_0.pth diff --git a/PO/LastFM/DynamicPO_MPPO/rng_state_1.pth b/PO/LastFM/MPPO/DynamicPO/rng_state_1.pth similarity index 100% rename from PO/LastFM/DynamicPO_MPPO/rng_state_1.pth rename to PO/LastFM/MPPO/DynamicPO/rng_state_1.pth diff --git a/PO/LastFM/DynamicPO_MPPO/rng_state_2.pth b/PO/LastFM/MPPO/DynamicPO/rng_state_2.pth similarity index 100% rename from PO/LastFM/DynamicPO_MPPO/rng_state_2.pth rename to PO/LastFM/MPPO/DynamicPO/rng_state_2.pth diff --git a/PO/LastFM/DynamicPO_MPPO/rng_state_3.pth b/PO/LastFM/MPPO/DynamicPO/rng_state_3.pth similarity index 100% rename from PO/LastFM/DynamicPO_MPPO/rng_state_3.pth rename to PO/LastFM/MPPO/DynamicPO/rng_state_3.pth diff --git a/PO/LastFM/DynamicPO_MPPO/scheduler.pt b/PO/LastFM/MPPO/DynamicPO/scheduler.pt similarity index 100% rename from PO/LastFM/DynamicPO_MPPO/scheduler.pt rename to PO/LastFM/MPPO/DynamicPO/scheduler.pt diff --git a/PO/LastFM/DynamicPO_MPPO/special_tokens_map.json b/PO/LastFM/MPPO/DynamicPO/special_tokens_map.json similarity index 100% rename from PO/LastFM/DynamicPO_MPPO/special_tokens_map.json rename to PO/LastFM/MPPO/DynamicPO/special_tokens_map.json diff --git a/PO/LastFM/DynamicPO_MPPO/tokenizer.json b/PO/LastFM/MPPO/DynamicPO/tokenizer.json similarity index 100% rename from PO/LastFM/DynamicPO_MPPO/tokenizer.json rename to PO/LastFM/MPPO/DynamicPO/tokenizer.json diff --git a/PO/LastFM/DynamicPO_MPPO/tokenizer.model b/PO/LastFM/MPPO/DynamicPO/tokenizer.model similarity index 100% rename from PO/LastFM/DynamicPO_MPPO/tokenizer.model rename to PO/LastFM/MPPO/DynamicPO/tokenizer.model diff --git a/PO/LastFM/DynamicPO_MPPO/tokenizer_config.json b/PO/LastFM/MPPO/DynamicPO/tokenizer_config.json similarity index 100% rename from PO/LastFM/DynamicPO_MPPO/tokenizer_config.json rename to PO/LastFM/MPPO/DynamicPO/tokenizer_config.json diff --git a/PO/LastFM/DynamicPO_MPPO/trainer_state.json b/PO/LastFM/MPPO/DynamicPO/trainer_state.json similarity index 100% rename from PO/LastFM/DynamicPO_MPPO/trainer_state.json rename to PO/LastFM/MPPO/DynamicPO/trainer_state.json diff --git a/PO/LastFM/DynamicPO_MPPO/training_args.bin b/PO/LastFM/MPPO/DynamicPO/training_args.bin similarity index 100% rename from PO/LastFM/DynamicPO_MPPO/training_args.bin rename to PO/LastFM/MPPO/DynamicPO/training_args.bin diff --git a/PO/LastFM/MPPO/adapter_config.json b/PO/LastFM/MPPO/Vanilla/adapter_config.json similarity index 100% rename from PO/LastFM/MPPO/adapter_config.json rename to PO/LastFM/MPPO/Vanilla/adapter_config.json diff --git a/PO/LastFM/MPPO/adapter_model.safetensors b/PO/LastFM/MPPO/Vanilla/adapter_model.safetensors similarity index 100% rename from PO/LastFM/MPPO/adapter_model.safetensors rename to PO/LastFM/MPPO/Vanilla/adapter_model.safetensors diff --git a/PO/LastFM/MPPO/eval.log b/PO/LastFM/MPPO/Vanilla/eval.log similarity index 100% rename from PO/LastFM/MPPO/eval.log rename to PO/LastFM/MPPO/Vanilla/eval.log diff --git a/PO/LastFM/MPPO/optimizer.pt b/PO/LastFM/MPPO/Vanilla/optimizer.pt similarity index 100% rename from PO/LastFM/MPPO/optimizer.pt rename to PO/LastFM/MPPO/Vanilla/optimizer.pt diff --git a/PO/LastFM/MPPO/rng_state_0.pth b/PO/LastFM/MPPO/Vanilla/rng_state_0.pth similarity index 100% rename from PO/LastFM/MPPO/rng_state_0.pth rename to PO/LastFM/MPPO/Vanilla/rng_state_0.pth diff --git a/PO/LastFM/MPPO/rng_state_1.pth b/PO/LastFM/MPPO/Vanilla/rng_state_1.pth similarity index 100% rename from PO/LastFM/MPPO/rng_state_1.pth rename to PO/LastFM/MPPO/Vanilla/rng_state_1.pth diff --git a/PO/LastFM/MPPO/rng_state_2.pth b/PO/LastFM/MPPO/Vanilla/rng_state_2.pth similarity index 100% rename from PO/LastFM/MPPO/rng_state_2.pth rename to PO/LastFM/MPPO/Vanilla/rng_state_2.pth diff --git a/PO/LastFM/MPPO/rng_state_3.pth b/PO/LastFM/MPPO/Vanilla/rng_state_3.pth similarity index 100% rename from PO/LastFM/MPPO/rng_state_3.pth rename to PO/LastFM/MPPO/Vanilla/rng_state_3.pth diff --git a/PO/LastFM/DynamicPO_SDPO/scheduler.pt b/PO/LastFM/MPPO/Vanilla/scheduler.pt similarity index 100% rename from PO/LastFM/DynamicPO_SDPO/scheduler.pt rename to PO/LastFM/MPPO/Vanilla/scheduler.pt diff --git a/PO/LastFM/DynamicPO_SDPO/special_tokens_map.json b/PO/LastFM/MPPO/Vanilla/special_tokens_map.json similarity index 100% rename from PO/LastFM/DynamicPO_SDPO/special_tokens_map.json rename to PO/LastFM/MPPO/Vanilla/special_tokens_map.json diff --git a/PO/LastFM/DynamicPO_SDPO/tokenizer.json b/PO/LastFM/MPPO/Vanilla/tokenizer.json similarity index 100% rename from PO/LastFM/DynamicPO_SDPO/tokenizer.json rename to PO/LastFM/MPPO/Vanilla/tokenizer.json diff --git a/PO/LastFM/DynamicPO_SDPO/tokenizer.model b/PO/LastFM/MPPO/Vanilla/tokenizer.model similarity index 100% rename from PO/LastFM/DynamicPO_SDPO/tokenizer.model rename to PO/LastFM/MPPO/Vanilla/tokenizer.model diff --git a/PO/LastFM/DynamicPO_SDPO/tokenizer_config.json b/PO/LastFM/MPPO/Vanilla/tokenizer_config.json similarity index 100% rename from PO/LastFM/DynamicPO_SDPO/tokenizer_config.json rename to PO/LastFM/MPPO/Vanilla/tokenizer_config.json diff --git a/PO/LastFM/MPPO/trainer_state.json b/PO/LastFM/MPPO/Vanilla/trainer_state.json similarity index 100% rename from PO/LastFM/MPPO/trainer_state.json rename to PO/LastFM/MPPO/Vanilla/trainer_state.json diff --git a/PO/LastFM/MPPO/training_args.bin b/PO/LastFM/MPPO/Vanilla/training_args.bin similarity index 100% rename from PO/LastFM/MPPO/training_args.bin rename to PO/LastFM/MPPO/Vanilla/training_args.bin diff --git a/PO/LastFM/DynamicPO_SDPO/adapter_config.json b/PO/LastFM/SDPO/DynamicPO/adapter_config.json similarity index 100% rename from PO/LastFM/DynamicPO_SDPO/adapter_config.json rename to PO/LastFM/SDPO/DynamicPO/adapter_config.json diff --git a/PO/LastFM/DynamicPO_SDPO/adapter_model.safetensors b/PO/LastFM/SDPO/DynamicPO/adapter_model.safetensors similarity index 100% rename from PO/LastFM/DynamicPO_SDPO/adapter_model.safetensors rename to PO/LastFM/SDPO/DynamicPO/adapter_model.safetensors diff --git a/PO/LastFM/DynamicPO_SDPO/eval.log b/PO/LastFM/SDPO/DynamicPO/eval.log similarity index 100% rename from PO/LastFM/DynamicPO_SDPO/eval.log rename to PO/LastFM/SDPO/DynamicPO/eval.log diff --git a/PO/LastFM/DynamicPO_SDPO/optimizer.pt b/PO/LastFM/SDPO/DynamicPO/optimizer.pt similarity index 100% rename from PO/LastFM/DynamicPO_SDPO/optimizer.pt rename to PO/LastFM/SDPO/DynamicPO/optimizer.pt diff --git a/PO/LastFM/DynamicPO_SDPO/rng_state_0.pth b/PO/LastFM/SDPO/DynamicPO/rng_state_0.pth similarity index 100% rename from PO/LastFM/DynamicPO_SDPO/rng_state_0.pth rename to PO/LastFM/SDPO/DynamicPO/rng_state_0.pth diff --git a/PO/LastFM/DynamicPO_SDPO/rng_state_1.pth b/PO/LastFM/SDPO/DynamicPO/rng_state_1.pth similarity index 100% rename from PO/LastFM/DynamicPO_SDPO/rng_state_1.pth rename to PO/LastFM/SDPO/DynamicPO/rng_state_1.pth diff --git a/PO/LastFM/DynamicPO_SDPO/rng_state_2.pth b/PO/LastFM/SDPO/DynamicPO/rng_state_2.pth similarity index 100% rename from PO/LastFM/DynamicPO_SDPO/rng_state_2.pth rename to PO/LastFM/SDPO/DynamicPO/rng_state_2.pth diff --git a/PO/LastFM/DynamicPO_SDPO/rng_state_3.pth b/PO/LastFM/SDPO/DynamicPO/rng_state_3.pth similarity index 100% rename from PO/LastFM/DynamicPO_SDPO/rng_state_3.pth rename to PO/LastFM/SDPO/DynamicPO/rng_state_3.pth diff --git a/PO/LastFM/MPPO/scheduler.pt b/PO/LastFM/SDPO/DynamicPO/scheduler.pt similarity index 100% rename from PO/LastFM/MPPO/scheduler.pt rename to PO/LastFM/SDPO/DynamicPO/scheduler.pt diff --git a/PO/LastFM/MPPO/special_tokens_map.json b/PO/LastFM/SDPO/DynamicPO/special_tokens_map.json similarity index 100% rename from PO/LastFM/MPPO/special_tokens_map.json rename to PO/LastFM/SDPO/DynamicPO/special_tokens_map.json diff --git a/PO/LastFM/MPPO/tokenizer.json b/PO/LastFM/SDPO/DynamicPO/tokenizer.json similarity index 100% rename from PO/LastFM/MPPO/tokenizer.json rename to PO/LastFM/SDPO/DynamicPO/tokenizer.json diff --git a/PO/LastFM/MPPO/tokenizer.model b/PO/LastFM/SDPO/DynamicPO/tokenizer.model similarity index 100% rename from PO/LastFM/MPPO/tokenizer.model rename to PO/LastFM/SDPO/DynamicPO/tokenizer.model diff --git a/PO/LastFM/MPPO/tokenizer_config.json b/PO/LastFM/SDPO/DynamicPO/tokenizer_config.json similarity index 100% rename from PO/LastFM/MPPO/tokenizer_config.json rename to PO/LastFM/SDPO/DynamicPO/tokenizer_config.json diff --git a/PO/LastFM/DynamicPO_SDPO/trainer_state.json b/PO/LastFM/SDPO/DynamicPO/trainer_state.json similarity index 100% rename from PO/LastFM/DynamicPO_SDPO/trainer_state.json rename to PO/LastFM/SDPO/DynamicPO/trainer_state.json diff --git a/PO/LastFM/DynamicPO_SDPO/training_args.bin b/PO/LastFM/SDPO/DynamicPO/training_args.bin similarity index 100% rename from PO/LastFM/DynamicPO_SDPO/training_args.bin rename to PO/LastFM/SDPO/DynamicPO/training_args.bin diff --git a/PO/LastFM/SDPO/adapter_config.json b/PO/LastFM/SDPO/Vanilla/adapter_config.json similarity index 100% rename from PO/LastFM/SDPO/adapter_config.json rename to PO/LastFM/SDPO/Vanilla/adapter_config.json diff --git a/PO/LastFM/SDPO/adapter_model.safetensors b/PO/LastFM/SDPO/Vanilla/adapter_model.safetensors similarity index 100% rename from PO/LastFM/SDPO/adapter_model.safetensors rename to PO/LastFM/SDPO/Vanilla/adapter_model.safetensors diff --git a/PO/LastFM/SDPO/eval.log b/PO/LastFM/SDPO/Vanilla/eval.log similarity index 100% rename from PO/LastFM/SDPO/eval.log rename to PO/LastFM/SDPO/Vanilla/eval.log diff --git a/PO/LastFM/SDPO/optimizer.pt b/PO/LastFM/SDPO/Vanilla/optimizer.pt similarity index 100% rename from PO/LastFM/SDPO/optimizer.pt rename to PO/LastFM/SDPO/Vanilla/optimizer.pt diff --git a/PO/LastFM/SDPO/rng_state_0.pth b/PO/LastFM/SDPO/Vanilla/rng_state_0.pth similarity index 100% rename from PO/LastFM/SDPO/rng_state_0.pth rename to PO/LastFM/SDPO/Vanilla/rng_state_0.pth diff --git a/PO/LastFM/SDPO/rng_state_1.pth b/PO/LastFM/SDPO/Vanilla/rng_state_1.pth similarity index 100% rename from PO/LastFM/SDPO/rng_state_1.pth rename to PO/LastFM/SDPO/Vanilla/rng_state_1.pth diff --git a/PO/LastFM/SDPO/rng_state_2.pth b/PO/LastFM/SDPO/Vanilla/rng_state_2.pth similarity index 100% rename from PO/LastFM/SDPO/rng_state_2.pth rename to PO/LastFM/SDPO/Vanilla/rng_state_2.pth diff --git a/PO/LastFM/SDPO/rng_state_3.pth b/PO/LastFM/SDPO/Vanilla/rng_state_3.pth similarity index 100% rename from PO/LastFM/SDPO/rng_state_3.pth rename to PO/LastFM/SDPO/Vanilla/rng_state_3.pth diff --git a/PO/LastFM/SDPO/scheduler.pt b/PO/LastFM/SDPO/Vanilla/scheduler.pt similarity index 100% rename from PO/LastFM/SDPO/scheduler.pt rename to PO/LastFM/SDPO/Vanilla/scheduler.pt diff --git a/PO/LastFM/SDPO/special_tokens_map.json b/PO/LastFM/SDPO/Vanilla/special_tokens_map.json similarity index 100% rename from PO/LastFM/SDPO/special_tokens_map.json rename to PO/LastFM/SDPO/Vanilla/special_tokens_map.json diff --git a/PO/LastFM/SDPO/tokenizer.json b/PO/LastFM/SDPO/Vanilla/tokenizer.json similarity index 100% rename from PO/LastFM/SDPO/tokenizer.json rename to PO/LastFM/SDPO/Vanilla/tokenizer.json diff --git a/PO/LastFM/SDPO/tokenizer.model b/PO/LastFM/SDPO/Vanilla/tokenizer.model similarity index 100% rename from PO/LastFM/SDPO/tokenizer.model rename to PO/LastFM/SDPO/Vanilla/tokenizer.model diff --git a/PO/LastFM/SDPO/tokenizer_config.json b/PO/LastFM/SDPO/Vanilla/tokenizer_config.json similarity index 100% rename from PO/LastFM/SDPO/tokenizer_config.json rename to PO/LastFM/SDPO/Vanilla/tokenizer_config.json diff --git a/PO/LastFM/SDPO/trainer_state.json b/PO/LastFM/SDPO/Vanilla/trainer_state.json similarity index 100% rename from PO/LastFM/SDPO/trainer_state.json rename to PO/LastFM/SDPO/Vanilla/trainer_state.json diff --git a/PO/LastFM/SDPO/training_args.bin b/PO/LastFM/SDPO/Vanilla/training_args.bin similarity index 100% rename from PO/LastFM/SDPO/training_args.bin rename to PO/LastFM/SDPO/Vanilla/training_args.bin