roberta-arxiv-tags / config.json
waleko's picture
waleko/roberta-arxiv-tags
20c0384 verified
{
"_name_or_path": "FacebookAI/roberta-base",
"architectures": [
"RobertaForSequenceClassification"
],
"attention_probs_dropout_prob": 0.1,
"bos_token_id": 0,
"classifier_dropout": null,
"eos_token_id": 2,
"hidden_act": "gelu",
"hidden_dropout_prob": 0.1,
"hidden_size": 768,
"id2label": {
"0": "cs.AI",
"1": "cs.CL",
"2": "cs.CV",
"3": "cs.NE",
"4": "stat.ML",
"5": "cs.LG",
"6": "68T45",
"7": "physics.soc-ph",
"8": "68Txx",
"9": "I.2.4",
"10": "68T50",
"11": "I.2.6; I.2.7",
"12": "stat.AP",
"13": "cs.RO",
"14": "cs.SE",
"15": "cs.MA",
"16": "math.OC",
"17": "cs.IR",
"18": "cond-mat.dis-nn",
"19": "68",
"20": "stat.ME",
"21": "physics.chem-ph",
"22": "cs.DC",
"23": "stat.CO",
"24": "q-bio.NC",
"25": "cs.GT",
"26": "cs.MM",
"27": "cs.CG",
"28": "cs.CR",
"29": "cs.HC",
"30": "eess.AS",
"31": "cs.SD",
"32": "math.DS",
"33": "cs.GR",
"34": "math.NA",
"35": "cs.CY",
"36": "physics.data-an",
"37": "math.ST",
"38": "stat.TH",
"39": "cs.IT",
"40": "math.IT",
"41": "quant-ph",
"42": "astro-ph.IM",
"43": "cs.SI",
"44": "cs.DB",
"45": "I.2.7",
"46": "68T05",
"47": "I.2.7; I.2.6",
"48": "I.2.6",
"49": "cs.LO",
"50": "nlin.AO",
"51": "cs.PF",
"52": "cs.ET",
"53": "eess.IV",
"54": "68U10",
"55": "I.2",
"56": "cs.AR",
"57": "cs.SY",
"58": "I.2.6; I.5.1",
"59": "cs.CC",
"60": "q-bio.BM",
"61": "q-bio.QM",
"62": "cs.NI",
"63": "cs.DS",
"64": "cond-mat.stat-mech",
"65": "cs.NA",
"66": "cs.DM",
"67": "eess.SP",
"68": "cs.MS",
"69": "physics.med-ph",
"70": "68T01",
"71": "H.3.3",
"72": "physics.optics",
"73": "cs.FL",
"74": "cs.SC",
"75": "math.PR",
"76": "nlin.CD",
"77": "cs.CE",
"78": "physics.ao-ph",
"79": "68T20",
"80": "cs.PL",
"81": "math.FA",
"82": "I.5.4",
"83": "68T10",
"84": "F.2.2",
"85": "62H30",
"86": "physics.comp-ph",
"87": "cs.DL",
"88": "math.CO",
"89": "G.1.6",
"90": "I.2.8",
"91": "I.2.0",
"92": "F.4.1",
"93": "I.4; I.5",
"94": "J.3",
"95": "I.2.1",
"96": "H.2.8",
"97": "I.2.3",
"98": "68T30",
"99": "G.3",
"100": "q-fin.ST",
"101": "q-bio.GN",
"102": "nlin.CG",
"103": "math.LO",
"104": "math.CT",
"105": "H.3.3; I.2.7",
"106": "q-bio.PE",
"107": "physics.bio-ph",
"108": "math.AG",
"109": "cmp-lg",
"110": "math.DG",
"111": "I.2.4; F.4.1",
"112": "q-bio.MN",
"113": "I.2.3; I.2.4",
"114": "I.2.11",
"115": "I.4.8",
"116": "I.4.6"
},
"initializer_range": 0.02,
"intermediate_size": 3072,
"label2id": {
"62H30": 85,
"68": 19,
"68T01": 70,
"68T05": 46,
"68T10": 83,
"68T20": 79,
"68T30": 98,
"68T45": 6,
"68T50": 10,
"68Txx": 8,
"68U10": 54,
"F.2.2": 84,
"F.4.1": 92,
"G.1.6": 89,
"G.3": 99,
"H.2.8": 96,
"H.3.3": 71,
"H.3.3; I.2.7": 105,
"I.2": 55,
"I.2.0": 91,
"I.2.1": 95,
"I.2.11": 114,
"I.2.3": 97,
"I.2.3; I.2.4": 113,
"I.2.4": 9,
"I.2.4; F.4.1": 111,
"I.2.6": 48,
"I.2.6; I.2.7": 11,
"I.2.6; I.5.1": 58,
"I.2.7": 45,
"I.2.7; I.2.6": 47,
"I.2.8": 90,
"I.4.6": 116,
"I.4.8": 115,
"I.4; I.5": 93,
"I.5.4": 82,
"J.3": 94,
"astro-ph.IM": 42,
"cmp-lg": 109,
"cond-mat.dis-nn": 18,
"cond-mat.stat-mech": 64,
"cs.AI": 0,
"cs.AR": 56,
"cs.CC": 59,
"cs.CE": 77,
"cs.CG": 27,
"cs.CL": 1,
"cs.CR": 28,
"cs.CV": 2,
"cs.CY": 35,
"cs.DB": 44,
"cs.DC": 22,
"cs.DL": 87,
"cs.DM": 66,
"cs.DS": 63,
"cs.ET": 52,
"cs.FL": 73,
"cs.GR": 33,
"cs.GT": 25,
"cs.HC": 29,
"cs.IR": 17,
"cs.IT": 39,
"cs.LG": 5,
"cs.LO": 49,
"cs.MA": 15,
"cs.MM": 26,
"cs.MS": 68,
"cs.NA": 65,
"cs.NE": 3,
"cs.NI": 62,
"cs.PF": 51,
"cs.PL": 80,
"cs.RO": 13,
"cs.SC": 74,
"cs.SD": 31,
"cs.SE": 14,
"cs.SI": 43,
"cs.SY": 57,
"eess.AS": 30,
"eess.IV": 53,
"eess.SP": 67,
"math.AG": 108,
"math.CO": 88,
"math.CT": 104,
"math.DG": 110,
"math.DS": 32,
"math.FA": 81,
"math.IT": 40,
"math.LO": 103,
"math.NA": 34,
"math.OC": 16,
"math.PR": 75,
"math.ST": 37,
"nlin.AO": 50,
"nlin.CD": 76,
"nlin.CG": 102,
"physics.ao-ph": 78,
"physics.bio-ph": 107,
"physics.chem-ph": 21,
"physics.comp-ph": 86,
"physics.data-an": 36,
"physics.med-ph": 69,
"physics.optics": 72,
"physics.soc-ph": 7,
"q-bio.BM": 60,
"q-bio.GN": 101,
"q-bio.MN": 112,
"q-bio.NC": 24,
"q-bio.PE": 106,
"q-bio.QM": 61,
"q-fin.ST": 100,
"quant-ph": 41,
"stat.AP": 12,
"stat.CO": 23,
"stat.ME": 20,
"stat.ML": 4,
"stat.TH": 38
},
"layer_norm_eps": 1e-05,
"max_position_embeddings": 514,
"model_type": "roberta",
"num_attention_heads": 12,
"num_hidden_layers": 12,
"pad_token_id": 1,
"position_embedding_type": "absolute",
"problem_type": "multi_label_classification",
"torch_dtype": "float32",
"transformers_version": "4.49.0",
"type_vocab_size": 1,
"use_cache": true,
"vocab_size": 50265
}