| { |
| "architectures": [ |
| "PeAudioVideoModel" |
| ], |
| "audio_video_config": { |
| "attention_bias": false, |
| "attention_dropout": 0.0, |
| "audio_config": { |
| "_name_or_path": "", |
| "add_cross_attention": false, |
| "architectures": null, |
| "attention_bias": false, |
| "attention_dropout": 0.0, |
| "bos_token_id": null, |
| "chunk_size_feed_forward": 0, |
| "cross_attention_hidden_size": null, |
| "dac_config": { |
| "_name_or_path": "", |
| "add_cross_attention": false, |
| "architectures": null, |
| "bos_token_id": null, |
| "chunk_size_feed_forward": 0, |
| "codebook_dim": 128, |
| "codebook_loss_weight": 1.0, |
| "codebook_size": 1024, |
| "commitment_loss_weight": 0.25, |
| "cross_attention_hidden_size": null, |
| "decoder_hidden_size": 1536, |
| "decoder_start_token_id": null, |
| "downsampling_ratios": [ |
| 2, |
| 8, |
| 10, |
| 12 |
| ], |
| "dtype": null, |
| "encoder_hidden_size": 64, |
| "eos_token_id": null, |
| "finetuning_task": null, |
| "hidden_size": 1024, |
| "hop_length": 1920, |
| "id2label": { |
| "0": "LABEL_0", |
| "1": "LABEL_1" |
| }, |
| "is_decoder": false, |
| "is_encoder_decoder": false, |
| "label2id": { |
| "LABEL_0": 0, |
| "LABEL_1": 1 |
| }, |
| "model_type": "dac", |
| "n_codebooks": 16, |
| "output_attentions": false, |
| "output_hidden_states": false, |
| "pad_token_id": null, |
| "prefix": null, |
| "problem_type": null, |
| "quantizer_dropout": 0, |
| "return_dict": true, |
| "sampling_rate": 48000, |
| "sep_token_id": null, |
| "task_specific_params": null, |
| "tie_encoder_decoder": false, |
| "tie_word_embeddings": true, |
| "tokenizer_class": null, |
| "upsampling_ratios": [ |
| 12, |
| 10, |
| 8, |
| 2 |
| ] |
| }, |
| "decoder_start_token_id": null, |
| "dtype": null, |
| "eos_token_id": null, |
| "finetuning_task": null, |
| "head_dim": 128, |
| "hidden_act": "silu", |
| "hidden_size": 1024, |
| "id2label": { |
| "0": "LABEL_0", |
| "1": "LABEL_1" |
| }, |
| "initializer_range": 0.02, |
| "intermediate_size": 2752, |
| "is_decoder": false, |
| "is_encoder_decoder": false, |
| "label2id": { |
| "LABEL_0": 0, |
| "LABEL_1": 1 |
| }, |
| "max_position_embeddings": 10000, |
| "model_type": "pe_audio_encoder", |
| "num_attention_heads": 8, |
| "num_hidden_layers": 16, |
| "num_key_value_heads": 8, |
| "output_attentions": false, |
| "output_hidden_states": false, |
| "pad_token_id": null, |
| "prefix": null, |
| "problem_type": null, |
| "return_dict": true, |
| "rms_norm_eps": 1e-05, |
| "rope_parameters": { |
| "rope_theta": 20000, |
| "rope_type": "default" |
| }, |
| "sep_token_id": null, |
| "task_specific_params": null, |
| "tie_encoder_decoder": false, |
| "tie_word_embeddings": true, |
| "tokenizer_class": null |
| }, |
| "dtype": "float32", |
| "head_dim": 128, |
| "hidden_act": "silu", |
| "hidden_size": 1024, |
| "initializer_range": 0.02, |
| "intermediate_size": 2752, |
| "max_position_embeddings": 10000, |
| "model_type": "pe_audio_video_encoder", |
| "num_attention_heads": 8, |
| "num_hidden_layers": 6, |
| "num_key_value_heads": 8, |
| "rms_norm_eps": 1e-05, |
| "rope_parameters": { |
| "rope_theta": 20000, |
| "rope_type": "default" |
| }, |
| "video_config": { |
| "_name_or_path": "", |
| "add_cross_attention": false, |
| "architectures": null, |
| "attention_bias": false, |
| "attention_dropout": 0.0, |
| "bos_token_id": null, |
| "chunk_size_feed_forward": 0, |
| "cross_attention_hidden_size": null, |
| "decoder_start_token_id": null, |
| "dtype": null, |
| "eos_token_id": null, |
| "finetuning_task": null, |
| "head_dim": 128, |
| "hidden_act": "silu", |
| "hidden_size": 1024, |
| "id2label": { |
| "0": "LABEL_0", |
| "1": "LABEL_1" |
| }, |
| "initializer_range": 0.02, |
| "intermediate_size": 2752, |
| "is_decoder": false, |
| "is_encoder_decoder": false, |
| "label2id": { |
| "LABEL_0": 0, |
| "LABEL_1": 1 |
| }, |
| "max_position_embeddings": 10000, |
| "model_type": "pe_video_encoder", |
| "num_attention_heads": 8, |
| "num_hidden_layers": 4, |
| "num_key_value_heads": 8, |
| "output_attentions": false, |
| "output_hidden_states": false, |
| "pad_token_id": null, |
| "prefix": null, |
| "problem_type": null, |
| "return_dict": true, |
| "rms_norm_eps": 1e-05, |
| "rope_parameters": { |
| "rope_theta": 20000, |
| "rope_type": "default" |
| }, |
| "sep_token_id": null, |
| "task_specific_params": null, |
| "tie_encoder_decoder": false, |
| "tie_word_embeddings": true, |
| "tokenizer_class": null, |
| "vision_config": { |
| "_name_or_path": "", |
| "add_cross_attention": false, |
| "architecture": "vit_pe_core_large_patch14_336", |
| "architectures": null, |
| "bos_token_id": null, |
| "chunk_size_feed_forward": 0, |
| "cross_attention_hidden_size": null, |
| "decoder_start_token_id": null, |
| "do_pooling": true, |
| "dtype": null, |
| "eos_token_id": null, |
| "finetuning_task": null, |
| "global_pool": "map", |
| "initializer_range": 0.02, |
| "is_decoder": false, |
| "is_encoder_decoder": false, |
| "label_names": [ |
| "LABEL_0", |
| "LABEL_1", |
| "LABEL_2", |
| "LABEL_3", |
| "LABEL_4", |
| "LABEL_5", |
| "LABEL_6", |
| "LABEL_7", |
| "LABEL_8", |
| "LABEL_9", |
| "LABEL_10", |
| "LABEL_11", |
| "LABEL_12", |
| "LABEL_13", |
| "LABEL_14", |
| "LABEL_15", |
| "LABEL_16", |
| "LABEL_17", |
| "LABEL_18", |
| "LABEL_19", |
| "LABEL_20", |
| "LABEL_21", |
| "LABEL_22", |
| "LABEL_23", |
| "LABEL_24", |
| "LABEL_25", |
| "LABEL_26", |
| "LABEL_27", |
| "LABEL_28", |
| "LABEL_29", |
| "LABEL_30", |
| "LABEL_31", |
| "LABEL_32", |
| "LABEL_33", |
| "LABEL_34", |
| "LABEL_35", |
| "LABEL_36", |
| "LABEL_37", |
| "LABEL_38", |
| "LABEL_39", |
| "LABEL_40", |
| "LABEL_41", |
| "LABEL_42", |
| "LABEL_43", |
| "LABEL_44", |
| "LABEL_45", |
| "LABEL_46", |
| "LABEL_47", |
| "LABEL_48", |
| "LABEL_49", |
| "LABEL_50", |
| "LABEL_51", |
| "LABEL_52", |
| "LABEL_53", |
| "LABEL_54", |
| "LABEL_55", |
| "LABEL_56", |
| "LABEL_57", |
| "LABEL_58", |
| "LABEL_59", |
| "LABEL_60", |
| "LABEL_61", |
| "LABEL_62", |
| "LABEL_63", |
| "LABEL_64", |
| "LABEL_65", |
| "LABEL_66", |
| "LABEL_67", |
| "LABEL_68", |
| "LABEL_69", |
| "LABEL_70", |
| "LABEL_71", |
| "LABEL_72", |
| "LABEL_73", |
| "LABEL_74", |
| "LABEL_75", |
| "LABEL_76", |
| "LABEL_77", |
| "LABEL_78", |
| "LABEL_79", |
| "LABEL_80", |
| "LABEL_81", |
| "LABEL_82", |
| "LABEL_83", |
| "LABEL_84", |
| "LABEL_85", |
| "LABEL_86", |
| "LABEL_87", |
| "LABEL_88", |
| "LABEL_89", |
| "LABEL_90", |
| "LABEL_91", |
| "LABEL_92", |
| "LABEL_93", |
| "LABEL_94", |
| "LABEL_95", |
| "LABEL_96", |
| "LABEL_97", |
| "LABEL_98", |
| "LABEL_99", |
| "LABEL_100", |
| "LABEL_101", |
| "LABEL_102", |
| "LABEL_103", |
| "LABEL_104", |
| "LABEL_105", |
| "LABEL_106", |
| "LABEL_107", |
| "LABEL_108", |
| "LABEL_109", |
| "LABEL_110", |
| "LABEL_111", |
| "LABEL_112", |
| "LABEL_113", |
| "LABEL_114", |
| "LABEL_115", |
| "LABEL_116", |
| "LABEL_117", |
| "LABEL_118", |
| "LABEL_119", |
| "LABEL_120", |
| "LABEL_121", |
| "LABEL_122", |
| "LABEL_123", |
| "LABEL_124", |
| "LABEL_125", |
| "LABEL_126", |
| "LABEL_127", |
| "LABEL_128", |
| "LABEL_129", |
| "LABEL_130", |
| "LABEL_131", |
| "LABEL_132", |
| "LABEL_133", |
| "LABEL_134", |
| "LABEL_135", |
| "LABEL_136", |
| "LABEL_137", |
| "LABEL_138", |
| "LABEL_139", |
| "LABEL_140", |
| "LABEL_141", |
| "LABEL_142", |
| "LABEL_143", |
| "LABEL_144", |
| "LABEL_145", |
| "LABEL_146", |
| "LABEL_147", |
| "LABEL_148", |
| "LABEL_149", |
| "LABEL_150", |
| "LABEL_151", |
| "LABEL_152", |
| "LABEL_153", |
| "LABEL_154", |
| "LABEL_155", |
| "LABEL_156", |
| "LABEL_157", |
| "LABEL_158", |
| "LABEL_159", |
| "LABEL_160", |
| "LABEL_161", |
| "LABEL_162", |
| "LABEL_163", |
| "LABEL_164", |
| "LABEL_165", |
| "LABEL_166", |
| "LABEL_167", |
| "LABEL_168", |
| "LABEL_169", |
| "LABEL_170", |
| "LABEL_171", |
| "LABEL_172", |
| "LABEL_173", |
| "LABEL_174", |
| "LABEL_175", |
| "LABEL_176", |
| "LABEL_177", |
| "LABEL_178", |
| "LABEL_179", |
| "LABEL_180", |
| "LABEL_181", |
| "LABEL_182", |
| "LABEL_183", |
| "LABEL_184", |
| "LABEL_185", |
| "LABEL_186", |
| "LABEL_187", |
| "LABEL_188", |
| "LABEL_189", |
| "LABEL_190", |
| "LABEL_191", |
| "LABEL_192", |
| "LABEL_193", |
| "LABEL_194", |
| "LABEL_195", |
| "LABEL_196", |
| "LABEL_197", |
| "LABEL_198", |
| "LABEL_199", |
| "LABEL_200", |
| "LABEL_201", |
| "LABEL_202", |
| "LABEL_203", |
| "LABEL_204", |
| "LABEL_205", |
| "LABEL_206", |
| "LABEL_207", |
| "LABEL_208", |
| "LABEL_209", |
| "LABEL_210", |
| "LABEL_211", |
| "LABEL_212", |
| "LABEL_213", |
| "LABEL_214", |
| "LABEL_215", |
| "LABEL_216", |
| "LABEL_217", |
| "LABEL_218", |
| "LABEL_219", |
| "LABEL_220", |
| "LABEL_221", |
| "LABEL_222", |
| "LABEL_223", |
| "LABEL_224", |
| "LABEL_225", |
| "LABEL_226", |
| "LABEL_227", |
| "LABEL_228", |
| "LABEL_229", |
| "LABEL_230", |
| "LABEL_231", |
| "LABEL_232", |
| "LABEL_233", |
| "LABEL_234", |
| "LABEL_235", |
| "LABEL_236", |
| "LABEL_237", |
| "LABEL_238", |
| "LABEL_239", |
| "LABEL_240", |
| "LABEL_241", |
| "LABEL_242", |
| "LABEL_243", |
| "LABEL_244", |
| "LABEL_245", |
| "LABEL_246", |
| "LABEL_247", |
| "LABEL_248", |
| "LABEL_249", |
| "LABEL_250", |
| "LABEL_251", |
| "LABEL_252", |
| "LABEL_253", |
| "LABEL_254", |
| "LABEL_255", |
| "LABEL_256", |
| "LABEL_257", |
| "LABEL_258", |
| "LABEL_259", |
| "LABEL_260", |
| "LABEL_261", |
| "LABEL_262", |
| "LABEL_263", |
| "LABEL_264", |
| "LABEL_265", |
| "LABEL_266", |
| "LABEL_267", |
| "LABEL_268", |
| "LABEL_269", |
| "LABEL_270", |
| "LABEL_271", |
| "LABEL_272", |
| "LABEL_273", |
| "LABEL_274", |
| "LABEL_275", |
| "LABEL_276", |
| "LABEL_277", |
| "LABEL_278", |
| "LABEL_279", |
| "LABEL_280", |
| "LABEL_281", |
| "LABEL_282", |
| "LABEL_283", |
| "LABEL_284", |
| "LABEL_285", |
| "LABEL_286", |
| "LABEL_287", |
| "LABEL_288", |
| "LABEL_289", |
| "LABEL_290", |
| "LABEL_291", |
| "LABEL_292", |
| "LABEL_293", |
| "LABEL_294", |
| "LABEL_295", |
| "LABEL_296", |
| "LABEL_297", |
| "LABEL_298", |
| "LABEL_299", |
| "LABEL_300", |
| "LABEL_301", |
| "LABEL_302", |
| "LABEL_303", |
| "LABEL_304", |
| "LABEL_305", |
| "LABEL_306", |
| "LABEL_307", |
| "LABEL_308", |
| "LABEL_309", |
| "LABEL_310", |
| "LABEL_311", |
| "LABEL_312", |
| "LABEL_313", |
| "LABEL_314", |
| "LABEL_315", |
| "LABEL_316", |
| "LABEL_317", |
| "LABEL_318", |
| "LABEL_319", |
| "LABEL_320", |
| "LABEL_321", |
| "LABEL_322", |
| "LABEL_323", |
| "LABEL_324", |
| "LABEL_325", |
| "LABEL_326", |
| "LABEL_327", |
| "LABEL_328", |
| "LABEL_329", |
| "LABEL_330", |
| "LABEL_331", |
| "LABEL_332", |
| "LABEL_333", |
| "LABEL_334", |
| "LABEL_335", |
| "LABEL_336", |
| "LABEL_337", |
| "LABEL_338", |
| "LABEL_339", |
| "LABEL_340", |
| "LABEL_341", |
| "LABEL_342", |
| "LABEL_343", |
| "LABEL_344", |
| "LABEL_345", |
| "LABEL_346", |
| "LABEL_347", |
| "LABEL_348", |
| "LABEL_349", |
| "LABEL_350", |
| "LABEL_351", |
| "LABEL_352", |
| "LABEL_353", |
| "LABEL_354", |
| "LABEL_355", |
| "LABEL_356", |
| "LABEL_357", |
| "LABEL_358", |
| "LABEL_359", |
| "LABEL_360", |
| "LABEL_361", |
| "LABEL_362", |
| "LABEL_363", |
| "LABEL_364", |
| "LABEL_365", |
| "LABEL_366", |
| "LABEL_367", |
| "LABEL_368", |
| "LABEL_369", |
| "LABEL_370", |
| "LABEL_371", |
| "LABEL_372", |
| "LABEL_373", |
| "LABEL_374", |
| "LABEL_375", |
| "LABEL_376", |
| "LABEL_377", |
| "LABEL_378", |
| "LABEL_379", |
| "LABEL_380", |
| "LABEL_381", |
| "LABEL_382", |
| "LABEL_383", |
| "LABEL_384", |
| "LABEL_385", |
| "LABEL_386", |
| "LABEL_387", |
| "LABEL_388", |
| "LABEL_389", |
| "LABEL_390", |
| "LABEL_391", |
| "LABEL_392", |
| "LABEL_393", |
| "LABEL_394", |
| "LABEL_395", |
| "LABEL_396", |
| "LABEL_397", |
| "LABEL_398", |
| "LABEL_399", |
| "LABEL_400", |
| "LABEL_401", |
| "LABEL_402", |
| "LABEL_403", |
| "LABEL_404", |
| "LABEL_405", |
| "LABEL_406", |
| "LABEL_407", |
| "LABEL_408", |
| "LABEL_409", |
| "LABEL_410", |
| "LABEL_411", |
| "LABEL_412", |
| "LABEL_413", |
| "LABEL_414", |
| "LABEL_415", |
| "LABEL_416", |
| "LABEL_417", |
| "LABEL_418", |
| "LABEL_419", |
| "LABEL_420", |
| "LABEL_421", |
| "LABEL_422", |
| "LABEL_423", |
| "LABEL_424", |
| "LABEL_425", |
| "LABEL_426", |
| "LABEL_427", |
| "LABEL_428", |
| "LABEL_429", |
| "LABEL_430", |
| "LABEL_431", |
| "LABEL_432", |
| "LABEL_433", |
| "LABEL_434", |
| "LABEL_435", |
| "LABEL_436", |
| "LABEL_437", |
| "LABEL_438", |
| "LABEL_439", |
| "LABEL_440", |
| "LABEL_441", |
| "LABEL_442", |
| "LABEL_443", |
| "LABEL_444", |
| "LABEL_445", |
| "LABEL_446", |
| "LABEL_447", |
| "LABEL_448", |
| "LABEL_449", |
| "LABEL_450", |
| "LABEL_451", |
| "LABEL_452", |
| "LABEL_453", |
| "LABEL_454", |
| "LABEL_455", |
| "LABEL_456", |
| "LABEL_457", |
| "LABEL_458", |
| "LABEL_459", |
| "LABEL_460", |
| "LABEL_461", |
| "LABEL_462", |
| "LABEL_463", |
| "LABEL_464", |
| "LABEL_465", |
| "LABEL_466", |
| "LABEL_467", |
| "LABEL_468", |
| "LABEL_469", |
| "LABEL_470", |
| "LABEL_471", |
| "LABEL_472", |
| "LABEL_473", |
| "LABEL_474", |
| "LABEL_475", |
| "LABEL_476", |
| "LABEL_477", |
| "LABEL_478", |
| "LABEL_479", |
| "LABEL_480", |
| "LABEL_481", |
| "LABEL_482", |
| "LABEL_483", |
| "LABEL_484", |
| "LABEL_485", |
| "LABEL_486", |
| "LABEL_487", |
| "LABEL_488", |
| "LABEL_489", |
| "LABEL_490", |
| "LABEL_491", |
| "LABEL_492", |
| "LABEL_493", |
| "LABEL_494", |
| "LABEL_495", |
| "LABEL_496", |
| "LABEL_497", |
| "LABEL_498", |
| "LABEL_499", |
| "LABEL_500", |
| "LABEL_501", |
| "LABEL_502", |
| "LABEL_503", |
| "LABEL_504", |
| "LABEL_505", |
| "LABEL_506", |
| "LABEL_507", |
| "LABEL_508", |
| "LABEL_509", |
| "LABEL_510", |
| "LABEL_511", |
| "LABEL_512", |
| "LABEL_513", |
| "LABEL_514", |
| "LABEL_515", |
| "LABEL_516", |
| "LABEL_517", |
| "LABEL_518", |
| "LABEL_519", |
| "LABEL_520", |
| "LABEL_521", |
| "LABEL_522", |
| "LABEL_523", |
| "LABEL_524", |
| "LABEL_525", |
| "LABEL_526", |
| "LABEL_527", |
| "LABEL_528", |
| "LABEL_529", |
| "LABEL_530", |
| "LABEL_531", |
| "LABEL_532", |
| "LABEL_533", |
| "LABEL_534", |
| "LABEL_535", |
| "LABEL_536", |
| "LABEL_537", |
| "LABEL_538", |
| "LABEL_539", |
| "LABEL_540", |
| "LABEL_541", |
| "LABEL_542", |
| "LABEL_543", |
| "LABEL_544", |
| "LABEL_545", |
| "LABEL_546", |
| "LABEL_547", |
| "LABEL_548", |
| "LABEL_549", |
| "LABEL_550", |
| "LABEL_551", |
| "LABEL_552", |
| "LABEL_553", |
| "LABEL_554", |
| "LABEL_555", |
| "LABEL_556", |
| "LABEL_557", |
| "LABEL_558", |
| "LABEL_559", |
| "LABEL_560", |
| "LABEL_561", |
| "LABEL_562", |
| "LABEL_563", |
| "LABEL_564", |
| "LABEL_565", |
| "LABEL_566", |
| "LABEL_567", |
| "LABEL_568", |
| "LABEL_569", |
| "LABEL_570", |
| "LABEL_571", |
| "LABEL_572", |
| "LABEL_573", |
| "LABEL_574", |
| "LABEL_575", |
| "LABEL_576", |
| "LABEL_577", |
| "LABEL_578", |
| "LABEL_579", |
| "LABEL_580", |
| "LABEL_581", |
| "LABEL_582", |
| "LABEL_583", |
| "LABEL_584", |
| "LABEL_585", |
| "LABEL_586", |
| "LABEL_587", |
| "LABEL_588", |
| "LABEL_589", |
| "LABEL_590", |
| "LABEL_591", |
| "LABEL_592", |
| "LABEL_593", |
| "LABEL_594", |
| "LABEL_595", |
| "LABEL_596", |
| "LABEL_597", |
| "LABEL_598", |
| "LABEL_599", |
| "LABEL_600", |
| "LABEL_601", |
| "LABEL_602", |
| "LABEL_603", |
| "LABEL_604", |
| "LABEL_605", |
| "LABEL_606", |
| "LABEL_607", |
| "LABEL_608", |
| "LABEL_609", |
| "LABEL_610", |
| "LABEL_611", |
| "LABEL_612", |
| "LABEL_613", |
| "LABEL_614", |
| "LABEL_615", |
| "LABEL_616", |
| "LABEL_617", |
| "LABEL_618", |
| "LABEL_619", |
| "LABEL_620", |
| "LABEL_621", |
| "LABEL_622", |
| "LABEL_623", |
| "LABEL_624", |
| "LABEL_625", |
| "LABEL_626", |
| "LABEL_627", |
| "LABEL_628", |
| "LABEL_629", |
| "LABEL_630", |
| "LABEL_631", |
| "LABEL_632", |
| "LABEL_633", |
| "LABEL_634", |
| "LABEL_635", |
| "LABEL_636", |
| "LABEL_637", |
| "LABEL_638", |
| "LABEL_639", |
| "LABEL_640", |
| "LABEL_641", |
| "LABEL_642", |
| "LABEL_643", |
| "LABEL_644", |
| "LABEL_645", |
| "LABEL_646", |
| "LABEL_647", |
| "LABEL_648", |
| "LABEL_649", |
| "LABEL_650", |
| "LABEL_651", |
| "LABEL_652", |
| "LABEL_653", |
| "LABEL_654", |
| "LABEL_655", |
| "LABEL_656", |
| "LABEL_657", |
| "LABEL_658", |
| "LABEL_659", |
| "LABEL_660", |
| "LABEL_661", |
| "LABEL_662", |
| "LABEL_663", |
| "LABEL_664", |
| "LABEL_665", |
| "LABEL_666", |
| "LABEL_667", |
| "LABEL_668", |
| "LABEL_669", |
| "LABEL_670", |
| "LABEL_671", |
| "LABEL_672", |
| "LABEL_673", |
| "LABEL_674", |
| "LABEL_675", |
| "LABEL_676", |
| "LABEL_677", |
| "LABEL_678", |
| "LABEL_679", |
| "LABEL_680", |
| "LABEL_681", |
| "LABEL_682", |
| "LABEL_683", |
| "LABEL_684", |
| "LABEL_685", |
| "LABEL_686", |
| "LABEL_687", |
| "LABEL_688", |
| "LABEL_689", |
| "LABEL_690", |
| "LABEL_691", |
| "LABEL_692", |
| "LABEL_693", |
| "LABEL_694", |
| "LABEL_695", |
| "LABEL_696", |
| "LABEL_697", |
| "LABEL_698", |
| "LABEL_699", |
| "LABEL_700", |
| "LABEL_701", |
| "LABEL_702", |
| "LABEL_703", |
| "LABEL_704", |
| "LABEL_705", |
| "LABEL_706", |
| "LABEL_707", |
| "LABEL_708", |
| "LABEL_709", |
| "LABEL_710", |
| "LABEL_711", |
| "LABEL_712", |
| "LABEL_713", |
| "LABEL_714", |
| "LABEL_715", |
| "LABEL_716", |
| "LABEL_717", |
| "LABEL_718", |
| "LABEL_719", |
| "LABEL_720", |
| "LABEL_721", |
| "LABEL_722", |
| "LABEL_723", |
| "LABEL_724", |
| "LABEL_725", |
| "LABEL_726", |
| "LABEL_727", |
| "LABEL_728", |
| "LABEL_729", |
| "LABEL_730", |
| "LABEL_731", |
| "LABEL_732", |
| "LABEL_733", |
| "LABEL_734", |
| "LABEL_735", |
| "LABEL_736", |
| "LABEL_737", |
| "LABEL_738", |
| "LABEL_739", |
| "LABEL_740", |
| "LABEL_741", |
| "LABEL_742", |
| "LABEL_743", |
| "LABEL_744", |
| "LABEL_745", |
| "LABEL_746", |
| "LABEL_747", |
| "LABEL_748", |
| "LABEL_749", |
| "LABEL_750", |
| "LABEL_751", |
| "LABEL_752", |
| "LABEL_753", |
| "LABEL_754", |
| "LABEL_755", |
| "LABEL_756", |
| "LABEL_757", |
| "LABEL_758", |
| "LABEL_759", |
| "LABEL_760", |
| "LABEL_761", |
| "LABEL_762", |
| "LABEL_763", |
| "LABEL_764", |
| "LABEL_765", |
| "LABEL_766", |
| "LABEL_767", |
| "LABEL_768", |
| "LABEL_769", |
| "LABEL_770", |
| "LABEL_771", |
| "LABEL_772", |
| "LABEL_773", |
| "LABEL_774", |
| "LABEL_775", |
| "LABEL_776", |
| "LABEL_777", |
| "LABEL_778", |
| "LABEL_779", |
| "LABEL_780", |
| "LABEL_781", |
| "LABEL_782", |
| "LABEL_783", |
| "LABEL_784", |
| "LABEL_785", |
| "LABEL_786", |
| "LABEL_787", |
| "LABEL_788", |
| "LABEL_789", |
| "LABEL_790", |
| "LABEL_791", |
| "LABEL_792", |
| "LABEL_793", |
| "LABEL_794", |
| "LABEL_795", |
| "LABEL_796", |
| "LABEL_797", |
| "LABEL_798", |
| "LABEL_799", |
| "LABEL_800", |
| "LABEL_801", |
| "LABEL_802", |
| "LABEL_803", |
| "LABEL_804", |
| "LABEL_805", |
| "LABEL_806", |
| "LABEL_807", |
| "LABEL_808", |
| "LABEL_809", |
| "LABEL_810", |
| "LABEL_811", |
| "LABEL_812", |
| "LABEL_813", |
| "LABEL_814", |
| "LABEL_815", |
| "LABEL_816", |
| "LABEL_817", |
| "LABEL_818", |
| "LABEL_819", |
| "LABEL_820", |
| "LABEL_821", |
| "LABEL_822", |
| "LABEL_823", |
| "LABEL_824", |
| "LABEL_825", |
| "LABEL_826", |
| "LABEL_827", |
| "LABEL_828", |
| "LABEL_829", |
| "LABEL_830", |
| "LABEL_831", |
| "LABEL_832", |
| "LABEL_833", |
| "LABEL_834", |
| "LABEL_835", |
| "LABEL_836", |
| "LABEL_837", |
| "LABEL_838", |
| "LABEL_839", |
| "LABEL_840", |
| "LABEL_841", |
| "LABEL_842", |
| "LABEL_843", |
| "LABEL_844", |
| "LABEL_845", |
| "LABEL_846", |
| "LABEL_847", |
| "LABEL_848", |
| "LABEL_849", |
| "LABEL_850", |
| "LABEL_851", |
| "LABEL_852", |
| "LABEL_853", |
| "LABEL_854", |
| "LABEL_855", |
| "LABEL_856", |
| "LABEL_857", |
| "LABEL_858", |
| "LABEL_859", |
| "LABEL_860", |
| "LABEL_861", |
| "LABEL_862", |
| "LABEL_863", |
| "LABEL_864", |
| "LABEL_865", |
| "LABEL_866", |
| "LABEL_867", |
| "LABEL_868", |
| "LABEL_869", |
| "LABEL_870", |
| "LABEL_871", |
| "LABEL_872", |
| "LABEL_873", |
| "LABEL_874", |
| "LABEL_875", |
| "LABEL_876", |
| "LABEL_877", |
| "LABEL_878", |
| "LABEL_879", |
| "LABEL_880", |
| "LABEL_881", |
| "LABEL_882", |
| "LABEL_883", |
| "LABEL_884", |
| "LABEL_885", |
| "LABEL_886", |
| "LABEL_887", |
| "LABEL_888", |
| "LABEL_889", |
| "LABEL_890", |
| "LABEL_891", |
| "LABEL_892", |
| "LABEL_893", |
| "LABEL_894", |
| "LABEL_895", |
| "LABEL_896", |
| "LABEL_897", |
| "LABEL_898", |
| "LABEL_899", |
| "LABEL_900", |
| "LABEL_901", |
| "LABEL_902", |
| "LABEL_903", |
| "LABEL_904", |
| "LABEL_905", |
| "LABEL_906", |
| "LABEL_907", |
| "LABEL_908", |
| "LABEL_909", |
| "LABEL_910", |
| "LABEL_911", |
| "LABEL_912", |
| "LABEL_913", |
| "LABEL_914", |
| "LABEL_915", |
| "LABEL_916", |
| "LABEL_917", |
| "LABEL_918", |
| "LABEL_919", |
| "LABEL_920", |
| "LABEL_921", |
| "LABEL_922", |
| "LABEL_923", |
| "LABEL_924", |
| "LABEL_925", |
| "LABEL_926", |
| "LABEL_927", |
| "LABEL_928", |
| "LABEL_929", |
| "LABEL_930", |
| "LABEL_931", |
| "LABEL_932", |
| "LABEL_933", |
| "LABEL_934", |
| "LABEL_935", |
| "LABEL_936", |
| "LABEL_937", |
| "LABEL_938", |
| "LABEL_939", |
| "LABEL_940", |
| "LABEL_941", |
| "LABEL_942", |
| "LABEL_943", |
| "LABEL_944", |
| "LABEL_945", |
| "LABEL_946", |
| "LABEL_947", |
| "LABEL_948", |
| "LABEL_949", |
| "LABEL_950", |
| "LABEL_951", |
| "LABEL_952", |
| "LABEL_953", |
| "LABEL_954", |
| "LABEL_955", |
| "LABEL_956", |
| "LABEL_957", |
| "LABEL_958", |
| "LABEL_959", |
| "LABEL_960", |
| "LABEL_961", |
| "LABEL_962", |
| "LABEL_963", |
| "LABEL_964", |
| "LABEL_965", |
| "LABEL_966", |
| "LABEL_967", |
| "LABEL_968", |
| "LABEL_969", |
| "LABEL_970", |
| "LABEL_971", |
| "LABEL_972", |
| "LABEL_973", |
| "LABEL_974", |
| "LABEL_975", |
| "LABEL_976", |
| "LABEL_977", |
| "LABEL_978", |
| "LABEL_979", |
| "LABEL_980", |
| "LABEL_981", |
| "LABEL_982", |
| "LABEL_983", |
| "LABEL_984", |
| "LABEL_985", |
| "LABEL_986", |
| "LABEL_987", |
| "LABEL_988", |
| "LABEL_989", |
| "LABEL_990", |
| "LABEL_991", |
| "LABEL_992", |
| "LABEL_993", |
| "LABEL_994", |
| "LABEL_995", |
| "LABEL_996", |
| "LABEL_997", |
| "LABEL_998", |
| "LABEL_999", |
| "LABEL_1000", |
| "LABEL_1001", |
| "LABEL_1002", |
| "LABEL_1003", |
| "LABEL_1004", |
| "LABEL_1005", |
| "LABEL_1006", |
| "LABEL_1007", |
| "LABEL_1008", |
| "LABEL_1009", |
| "LABEL_1010", |
| "LABEL_1011", |
| "LABEL_1012", |
| "LABEL_1013", |
| "LABEL_1014", |
| "LABEL_1015", |
| "LABEL_1016", |
| "LABEL_1017", |
| "LABEL_1018", |
| "LABEL_1019", |
| "LABEL_1020", |
| "LABEL_1021", |
| "LABEL_1022", |
| "LABEL_1023" |
| ], |
| "model_args": {}, |
| "model_type": "timm_wrapper", |
| "num_classes": 1024, |
| "output_attentions": false, |
| "output_hidden_states": false, |
| "pad_token_id": null, |
| "prefix": null, |
| "problem_type": null, |
| "return_dict": true, |
| "sep_token_id": null, |
| "task_specific_params": null, |
| "tie_encoder_decoder": false, |
| "tie_word_embeddings": true, |
| "tokenizer_class": null |
| } |
| } |
| }, |
| "dtype": "float32", |
| "model_type": "pe_audio_video", |
| "text_config": { |
| "attention_bias": false, |
| "attention_dropout": 0.0, |
| "bos_token_id": 50281, |
| "classifier_activation": "gelu", |
| "classifier_bias": false, |
| "classifier_dropout": 0.0, |
| "classifier_pooling": "cls", |
| "cls_token_id": 50281, |
| "decoder_bias": true, |
| "deterministic_flash_attn": false, |
| "dtype": "float32", |
| "embedding_dropout": 0.0, |
| "eos_token_id": 50282, |
| "global_attn_every_n_layers": 3, |
| "hidden_activation": "gelu", |
| "hidden_size": 1024, |
| "initializer_cutoff_factor": 2.0, |
| "initializer_range": 0.02, |
| "intermediate_size": 2624, |
| "layer_types": [ |
| "full_attention", |
| "sliding_attention", |
| "sliding_attention", |
| "full_attention", |
| "sliding_attention", |
| "sliding_attention", |
| "full_attention", |
| "sliding_attention", |
| "sliding_attention", |
| "full_attention", |
| "sliding_attention", |
| "sliding_attention", |
| "full_attention", |
| "sliding_attention", |
| "sliding_attention", |
| "full_attention", |
| "sliding_attention", |
| "sliding_attention", |
| "full_attention", |
| "sliding_attention", |
| "sliding_attention", |
| "full_attention" |
| ], |
| "local_attention": 128, |
| "max_position_embeddings": 8192, |
| "mlp_bias": false, |
| "mlp_dropout": 0.0, |
| "model_type": "modernbert", |
| "norm_bias": false, |
| "norm_eps": 1e-05, |
| "num_attention_heads": 16, |
| "num_hidden_layers": 22, |
| "pad_token_id": 50283, |
| "repad_logits_with_grad": false, |
| "rope_parameters": { |
| "full_attention": { |
| "rope_theta": 160000.0, |
| "rope_type": "default" |
| }, |
| "sliding_attention": { |
| "rope_theta": 10000.0, |
| "rope_type": "default" |
| } |
| }, |
| "sep_token_id": 50282, |
| "sparse_pred_ignore_index": -100, |
| "sparse_prediction": false, |
| "tie_word_embeddings": true, |
| "vocab_size": 50368 |
| }, |
| "tie_word_embeddings": true, |
| "transformers_version": "5.0.1.dev0" |
| } |
|
|