| *.7z filter=lfs diff=lfs merge=lfs -text |
| *.arrow filter=lfs diff=lfs merge=lfs -text |
| *.bin filter=lfs diff=lfs merge=lfs -text |
| *.bz2 filter=lfs diff=lfs merge=lfs -text |
| *.ckpt filter=lfs diff=lfs merge=lfs -text |
| *.ftz filter=lfs diff=lfs merge=lfs -text |
| *.gz filter=lfs diff=lfs merge=lfs -text |
| *.h5 filter=lfs diff=lfs merge=lfs -text |
| *.joblib filter=lfs diff=lfs merge=lfs -text |
| *.lfs.* filter=lfs diff=lfs merge=lfs -text |
| *.mlmodel filter=lfs diff=lfs merge=lfs -text |
| *.model filter=lfs diff=lfs merge=lfs -text |
| *.msgpack filter=lfs diff=lfs merge=lfs -text |
| *.npy filter=lfs diff=lfs merge=lfs -text |
| *.npz filter=lfs diff=lfs merge=lfs -text |
| *.onnx filter=lfs diff=lfs merge=lfs -text |
| *.ot filter=lfs diff=lfs merge=lfs -text |
| *.parquet filter=lfs diff=lfs merge=lfs -text |
| *.pb filter=lfs diff=lfs merge=lfs -text |
| *.pickle filter=lfs diff=lfs merge=lfs -text |
| *.pkl filter=lfs diff=lfs merge=lfs -text |
| *.pt filter=lfs diff=lfs merge=lfs -text |
| *.pth filter=lfs diff=lfs merge=lfs -text |
| *.rar filter=lfs diff=lfs merge=lfs -text |
| *.safetensors filter=lfs diff=lfs merge=lfs -text |
| saved_model/**/* filter=lfs diff=lfs merge=lfs -text |
| *.tar.* filter=lfs diff=lfs merge=lfs -text |
| *.tar filter=lfs diff=lfs merge=lfs -text |
| *.tflite filter=lfs diff=lfs merge=lfs -text |
| *.tgz filter=lfs diff=lfs merge=lfs -text |
| *.wasm filter=lfs diff=lfs merge=lfs -text |
| *.xz filter=lfs diff=lfs merge=lfs -text |
| *.zip filter=lfs diff=lfs merge=lfs -text |
| *.zst filter=lfs diff=lfs merge=lfs -text |
| *tfevents* filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/infer_07-17-04:25_cfg_scale_3.5_ddim_200_n_cand_3/Y0000004114.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/infer_07-17-04:25_cfg_scale_3.5_ddim_200_n_cand_3/Y0000001650.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/infer_07-17-04:25_cfg_scale_3.5_ddim_200_n_cand_3/Y0000003265.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/infer_07-17-04:25_cfg_scale_3.5_ddim_200_n_cand_3/Y0000000033.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/infer_07-17-04:25_cfg_scale_3.5_ddim_200_n_cand_3/Y0000000401.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/infer_07-17-04:25_cfg_scale_3.5_ddim_200_n_cand_3/Y0000000290.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/infer_07-17-04:25_cfg_scale_3.5_ddim_200_n_cand_3/Y0000001684.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/infer_07-17-04:25_cfg_scale_3.5_ddim_200_n_cand_3/Y0000004221.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-05:57_cfg_scale_3.5_ddim_200_n_cand_3/Y0000004114.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-05:57_cfg_scale_3.5_ddim_200_n_cand_3/Y0000001650.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-05:57_cfg_scale_3.5_ddim_200_n_cand_3/Y0000003265.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-05:57_cfg_scale_3.5_ddim_200_n_cand_3/Y0000000033.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-05:57_cfg_scale_3.5_ddim_200_n_cand_3/Y0000000401.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-05:57_cfg_scale_3.5_ddim_200_n_cand_3/Y0000000290.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-05:57_cfg_scale_3.5_ddim_200_n_cand_3/Y0000001684.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-05:57_cfg_scale_3.5_ddim_200_n_cand_3/Y0000004221.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000001477.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000004074.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000005162.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000003872.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000001788.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000002642.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000002347.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000004387.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000000925.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000001397.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000001485.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000004345.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000004904.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000001197.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000000418.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000003135.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000002707.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000005188.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000004404.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000004114.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000003931.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000003235.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000001650.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000000230.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000001483.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000003265.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000000008.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000003403.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000003204.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000002972.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000005324.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000000033.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000004693.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000005004.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000002651.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000000401.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000001075.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000003919.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000005177.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000001934.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000004877.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000004213.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000003844.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000000290.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000001684.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000000734.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000004446.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000003699.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000005136.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000005239.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000003921.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000000810.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000004221.wav filter=lfs diff=lfs merge=lfs -text |
| latent_diffusion/2023_08_23_reproduce_audioldm/audioldm_original/val_12585_07-17-06:29_cfg_scale_3.5_ddim_200_n_cand_3/Y0000001090.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000001477.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000004074.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000005162.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000003872.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000001788.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000002642.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000002347.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000004387.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000000925.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000001397.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000004345.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000001485.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000004904.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000001197.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000000418.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000003135.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000002707.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000005188.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000004404.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000004114.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000003931.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000003235.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000001650.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000000230.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000003265.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000001483.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000000008.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000003403.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000003204.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000002972.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000000033.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000005324.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000005004.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000004693.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000002651.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000000401.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000001075.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000005177.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000003919.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000001934.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000004877.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000004213.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000003844.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000000290.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000001684.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000000734.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000004446.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000003699.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000005136.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000005239.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000003921.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000000810.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000004221.wav filter=lfs diff=lfs merge=lfs -text |
| testset_data/audiocaps/Y0000001090.wav filter=lfs diff=lfs merge=lfs -text |
|
|