---
# Mixed SFT data configuration (sampled version)
# Auto-generated by sample_sft_data.py
#   Image: 738,590 samples
#   Video: 800,001 samples
#   Total: 1,538,591 samples

# Each entry points at one JSON annotation file and states how it is sampled.
# NOTE(review): "all" presumably means every record in the file is used;
# confirm against the loader that consumes this config.
datasets:
  # ===== Image =====
  - json_path: /mnt/bn/strategy-mllm-train/common/datasets/image_sft_full_v800k.json
    sampling_strategy: all

  # ===== Video =====
  - json_path: /mnt/bn/strategy-mllm-train/common/datasets/video_sft_full_v800k.json
    sampling_strategy: all