{ "architectures": [ "ModernBertForSequenceClassification" ], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 50281, "classifier_activation": "gelu", "classifier_bias": false, "classifier_dropout": 0.0, "classifier_pooling": "mean", "cls_token_id": 50281, "decoder_bias": true, "deterministic_flash_attn": false, "embedding_dropout": 0.0, "eos_token_id": 50282, "global_attn_every_n_layers": 3, "global_rope_theta": 160000.0, "gradient_checkpointing": false, "hidden_activation": "gelu", "hidden_size": 768, "num_labels": 24, "id2label": { "0": "Adult", "1": "Art & Design", "10": "Food & Dining", "11": "Games", "12": "Health", "13": "History", "14": "Home & Hobbies", "15": "Industrial", "16": "Literature", "17": "Politics", "18": "Religion", "19": "Science & Tech.", "2": "Software Dev.", "20": "Software", "21": "Sports & Fitness", "22": "Transportation", "23": "Travel", "3": "Crime & Law", "4": "Education & Jobs", "5": "Hardware", "6": "Entertainment", "7": "Social Life", "8": "Fashion & Beauty", "9": "Finance & Business" }, "initializer_cutoff_factor": 2.0, "initializer_range": 0.02, "intermediate_size": 1152, "label2id": { "Adult": 0, "Art & Design": 1, "Crime & Law": 3, "Education & Jobs": 4, "Entertainment": 6, "Fashion & Beauty": 8, "Finance & Business": 9, "Food & Dining": 10, "Games": 11, "Hardware": 5, "Health": 12, "History": 13, "Home & Hobbies": 14, "Industrial": 15, "Literature": 16, "Politics": 17, "Religion": 18, "Science & Tech.": 19, "Social Life": 7, "Software": 20, "Software Dev.": 2, "Sports & Fitness": 21, "Transportation": 22, "Travel": 23 }, "layer_norm_eps": 1e-05, "local_attention": 128, "local_rope_theta": 10000.0, "max_position_embeddings": 8192, "mlp_bias": false, "mlp_dropout": 0.0, "model_type": "modernbert", "norm_bias": false, "norm_eps": 1e-05, "num_attention_heads": 12, "num_hidden_layers": 22, "pad_token_id": 50283, "position_embedding_type": "absolute", "reference_compile": true, "repad_logits_with_grad": false, "sep_token_id": 50282, "sparse_pred_ignore_index": -100, "sparse_prediction": false, "torch_dtype": "bfloat16", "transformers_version": "4.50.0", "vocab_size": 50368 }