HeathStar's picture
Training in progress, step 10670
15fd76c verified
{
"_name_or_path": "dslim/distilbert-NER",
"activation": "gelu",
"architectures": [
"DistilBertForTokenClassification"
],
"attention_dropout": 0.1,
"dim": 768,
"dropout": 0.1,
"hidden_dim": 3072,
"id2label": {
"0": "O",
"1": "B-ALGEBRA",
"2": "E-ALGEBRA",
"3": "S-ALGEBRA",
"4": "I-ALGEBRA",
"5": "B-APPLIED-MATHEMATICS",
"6": "E-APPLIED-MATHEMATICS",
"7": "S-APPLIED-MATHEMATICS",
"8": "I-APPLIED-MATHEMATICS",
"9": "B-CALCULUS-AND-ANALYSIS",
"10": "I-CALCULUS-AND-ANALYSIS",
"11": "E-CALCULUS-AND-ANALYSIS",
"12": "S-CALCULUS-AND-ANALYSIS",
"13": "S-DETERMINANTS",
"14": "B-DETERMINANTS",
"15": "E-DETERMINANTS",
"16": "I-DETERMINANTS",
"17": "S-DISCRETE-MATHEMATICS",
"18": "B-DISCRETE-MATHEMATICS",
"19": "I-DISCRETE-MATHEMATICS",
"20": "E-DISCRETE-MATHEMATICS",
"21": "S-FOUNDATIONS-OF-MATHEMATICS",
"22": "B-FOUNDATIONS-OF-MATHEMATICS",
"23": "E-FOUNDATIONS-OF-MATHEMATICS",
"24": "I-FOUNDATIONS-OF-MATHEMATICS",
"25": "S-GEOMETRY",
"26": "B-GEOMETRY",
"27": "E-GEOMETRY",
"28": "I-GEOMETRY",
"29": "B-LIE-ALGEBRA",
"30": "E-LIE-ALGEBRA",
"31": "S-LIE-ALGEBRA",
"32": "I-LIE-ALGEBRA",
"33": "B-LINEAR-ALGEBRA",
"34": "E-LINEAR-ALGEBRA",
"35": "I-LINEAR-ALGEBRA",
"36": "S-LINEAR-ALGEBRA",
"37": "S-LINEAR-INDEPENDENCE",
"38": "B-LINEAR-SYSTEMS-OF-EQUATIONS",
"39": "E-LINEAR-SYSTEMS-OF-EQUATIONS",
"40": "I-LINEAR-SYSTEMS-OF-EQUATIONS",
"41": "B-LOC",
"42": "I-LOC",
"43": "S-MATRICES",
"44": "B-MATRICES",
"45": "E-MATRICES",
"46": "I-MATRICES",
"47": "S-NUMBER-THEORY",
"48": "B-NUMBER-THEORY",
"49": "E-NUMBER-THEORY",
"50": "I-NUMBER-THEORY",
"51": "B-ORG",
"52": "I-ORG",
"53": "S-PERMANENTS",
"54": "S-PROBABILITY-AND-STATISTICS",
"55": "B-PROBABILITY-AND-STATISTICS",
"56": "E-PROBABILITY-AND-STATISTICS",
"57": "I-PROBABILITY-AND-STATISTICS",
"58": "S-RECREATIONAL-MATHEMATICS",
"59": "B-RECREATIONAL-MATHEMATICS",
"60": "E-RECREATIONAL-MATHEMATICS",
"61": "I-RECREATIONAL-MATHEMATICS",
"62": "S-TOPOLOGY",
"63": "B-TOPOLOGY",
"64": "I-TOPOLOGY",
"65": "E-TOPOLOGY"
},
"initializer_range": 0.02,
"label2id": {
"B-ALGEBRA": 1,
"B-APPLIED-MATHEMATICS": 5,
"B-CALCULUS-AND-ANALYSIS": 9,
"B-DETERMINANTS": 14,
"B-DISCRETE-MATHEMATICS": 18,
"B-FOUNDATIONS-OF-MATHEMATICS": 22,
"B-GEOMETRY": 26,
"B-LIE-ALGEBRA": 29,
"B-LINEAR-ALGEBRA": 33,
"B-LINEAR-SYSTEMS-OF-EQUATIONS": 38,
"B-LOC": 41,
"B-MATRICES": 44,
"B-NUMBER-THEORY": 48,
"B-ORG": 51,
"B-PROBABILITY-AND-STATISTICS": 55,
"B-RECREATIONAL-MATHEMATICS": 59,
"B-TOPOLOGY": 63,
"E-ALGEBRA": 2,
"E-APPLIED-MATHEMATICS": 6,
"E-CALCULUS-AND-ANALYSIS": 11,
"E-DETERMINANTS": 15,
"E-DISCRETE-MATHEMATICS": 20,
"E-FOUNDATIONS-OF-MATHEMATICS": 23,
"E-GEOMETRY": 27,
"E-LIE-ALGEBRA": 30,
"E-LINEAR-ALGEBRA": 34,
"E-LINEAR-SYSTEMS-OF-EQUATIONS": 39,
"E-MATRICES": 45,
"E-NUMBER-THEORY": 49,
"E-PROBABILITY-AND-STATISTICS": 56,
"E-RECREATIONAL-MATHEMATICS": 60,
"E-TOPOLOGY": 65,
"I-ALGEBRA": 4,
"I-APPLIED-MATHEMATICS": 8,
"I-CALCULUS-AND-ANALYSIS": 10,
"I-DETERMINANTS": 16,
"I-DISCRETE-MATHEMATICS": 19,
"I-FOUNDATIONS-OF-MATHEMATICS": 24,
"I-GEOMETRY": 28,
"I-LIE-ALGEBRA": 32,
"I-LINEAR-ALGEBRA": 35,
"I-LINEAR-SYSTEMS-OF-EQUATIONS": 40,
"I-LOC": 42,
"I-MATRICES": 46,
"I-NUMBER-THEORY": 50,
"I-ORG": 52,
"I-PROBABILITY-AND-STATISTICS": 57,
"I-RECREATIONAL-MATHEMATICS": 61,
"I-TOPOLOGY": 64,
"O": 0,
"S-ALGEBRA": 3,
"S-APPLIED-MATHEMATICS": 7,
"S-CALCULUS-AND-ANALYSIS": 12,
"S-DETERMINANTS": 13,
"S-DISCRETE-MATHEMATICS": 17,
"S-FOUNDATIONS-OF-MATHEMATICS": 21,
"S-GEOMETRY": 25,
"S-LIE-ALGEBRA": 31,
"S-LINEAR-ALGEBRA": 36,
"S-LINEAR-INDEPENDENCE": 37,
"S-MATRICES": 43,
"S-NUMBER-THEORY": 47,
"S-PERMANENTS": 53,
"S-PROBABILITY-AND-STATISTICS": 54,
"S-RECREATIONAL-MATHEMATICS": 58,
"S-TOPOLOGY": 62
},
"max_position_embeddings": 512,
"model_type": "distilbert",
"n_heads": 12,
"n_layers": 6,
"output_past": true,
"pad_token_id": 0,
"qa_dropout": 0.1,
"seq_classif_dropout": 0.2,
"sinusoidal_pos_embds": false,
"tie_weights_": true,
"torch_dtype": "float32",
"transformers_version": "4.47.1",
"vocab_size": 28996
}