run_name: bert-tiny-stage2-sbert model_name: QuangDuy/bert-tiny-stage2-hf output_dir: outputs/bert-tiny-stage2-sbert train_dataset: - batmangiaicuuthegioi/zalo-legal-triplets - QuangDuy/mmarco-vi-hard-negatives train_split: train eval_dataset: another-symato/VMTEB-Zalo-legel-retrieval-wseg eval_corpus_config: corpus eval_queries_config: queries eval_labels_config: data_ir eval_split: train seed: 42 max_seq_length: 512 pooling: mean normalize_embeddings: true include_hard_negatives: true num_train_epochs: 5 train_batch_size: 64 learning_rate: 2.0e-05 warmup_ratio: 0.1 weight_decay: 0.01 precision: bf16 use_amp: true use_cached_mnrl: false validation_size: 0.05 validation_subset: null evaluation_steps: 2000 checkpoint_save_steps: 2000 checkpoint_save_total_limit: 5 early_stopping_patience: 4 hf_repo_id: QuangDuy/bert-tiny-stage2-sbert hf_private: false hf_push_on_save: true run_retrieval_eval_after_train: true retrieval_eval_limit_queries: null retrieval_eval_extra_corpus_docs: null matryoshka_dims: - 384 - 256 - 128 - 64 truncate_dims: - 384 - 256 - 128 - 64 top_k: - 1 - 3 - 5 - 10 map_at_k: 100 eval_batch_size: 128