domain-labeler / config.json
davidmezzetti's picture
Add model
6f6a301
{
"architectures": [
"ModernBertForSequenceClassification"
],
"attention_bias": false,
"attention_dropout": 0.0,
"bos_token_id": null,
"causal_mask": false,
"classifier_activation": "gelu",
"classifier_bias": false,
"classifier_dropout": 0.0,
"classifier_pooling": "mean",
"cls_token_id": 50281,
"decoder_bias": true,
"deterministic_flash_attn": false,
"dtype": "float32",
"embedding_dropout": 0.0,
"eos_token_id": null,
"global_attn_every_n_layers": 3,
"global_rope_theta": 160000.0,
"gradient_checkpointing": false,
"hidden_activation": "gelu",
"hidden_size": 384,
"id2label": {
"0": "aerospace",
"1": "agronomy",
"2": "artistic",
"3": "astronomy",
"4": "atmospheric_science",
"5": "automotive",
"6": "beauty",
"7": "biology",
"8": "celebrity",
"9": "chemistry",
"10": "civil_engineering",
"11": "communication_engineering",
"12": "computer_science_and_technology",
"13": "design",
"14": "drama_and_film",
"15": "economics",
"16": "electronic_science",
"17": "entertainment",
"18": "environmental_science",
"19": "fashion",
"20": "finance",
"21": "food",
"22": "gamble",
"23": "game",
"24": "geography",
"25": "health",
"26": "history",
"27": "hobby",
"28": "hydraulic_engineering",
"29": "instrument_science",
"30": "journalism_and_media_communication",
"31": "landscape_architecture",
"32": "law",
"33": "library",
"34": "literature",
"35": "materials_science",
"36": "mathematics",
"37": "mechanical_engineering",
"38": "medical",
"39": "mining_engineering",
"40": "movie",
"41": "music_and_dance",
"42": "news",
"43": "nuclear_science",
"44": "ocean_science",
"45": "optical_engineering",
"46": "painting",
"47": "pet",
"48": "petroleum_and_natural_gas_engineering",
"49": "philosophy",
"50": "photo",
"51": "physics",
"52": "politics",
"53": "psychology",
"54": "public_administration",
"55": "relationship",
"56": "religion",
"57": "sociology",
"58": "sports",
"59": "statistics",
"60": "systems_science",
"61": "textile_science",
"62": "topicality",
"63": "transportation_engineering",
"64": "travel",
"65": "urban_planning",
"66": "vulgar_language"
},
"initializer_cutoff_factor": 2.0,
"initializer_range": 0.02,
"intermediate_size": 576,
"is_causal": false,
"label2id": {
"aerospace": 0,
"agronomy": 1,
"artistic": 2,
"astronomy": 3,
"atmospheric_science": 4,
"automotive": 5,
"beauty": 6,
"biology": 7,
"celebrity": 8,
"chemistry": 9,
"civil_engineering": 10,
"communication_engineering": 11,
"computer_science_and_technology": 12,
"design": 13,
"drama_and_film": 14,
"economics": 15,
"electronic_science": 16,
"entertainment": 17,
"environmental_science": 18,
"fashion": 19,
"finance": 20,
"food": 21,
"gamble": 22,
"game": 23,
"geography": 24,
"health": 25,
"history": 26,
"hobby": 27,
"hydraulic_engineering": 28,
"instrument_science": 29,
"journalism_and_media_communication": 30,
"landscape_architecture": 31,
"law": 32,
"library": 33,
"literature": 34,
"materials_science": 35,
"mathematics": 36,
"mechanical_engineering": 37,
"medical": 38,
"mining_engineering": 39,
"movie": 40,
"music_and_dance": 41,
"news": 42,
"nuclear_science": 43,
"ocean_science": 44,
"optical_engineering": 45,
"painting": 46,
"pet": 47,
"petroleum_and_natural_gas_engineering": 48,
"philosophy": 49,
"photo": 50,
"physics": 51,
"politics": 52,
"psychology": 53,
"public_administration": 54,
"relationship": 55,
"religion": 56,
"sociology": 57,
"sports": 58,
"statistics": 59,
"systems_science": 60,
"textile_science": 61,
"topicality": 62,
"transportation_engineering": 63,
"travel": 64,
"urban_planning": 65,
"vulgar_language": 66
},
"layer_norm_eps": 1e-05,
"local_attention": 128,
"local_rope_theta": 160000.0,
"max_position_embeddings": 7999,
"mlp_bias": false,
"mlp_dropout": 0.0,
"model_type": "modernbert",
"norm_bias": false,
"norm_eps": 1e-05,
"num_attention_heads": 6,
"num_hidden_layers": 10,
"pad_token_id": 50283,
"position_embedding_type": "sans_pos",
"problem_type": "single_label_classification",
"repad_logits_with_grad": false,
"sep_token_id": 50282,
"sparse_pred_ignore_index": -100,
"sparse_prediction": false,
"transformers_version": "4.57.6",
"vocab_size": 50368
}