{ "_name_or_path": "microsoft/deberta-v3-base", "architectures": [ "DebertaV2ForSequenceClassification" ], "attention_probs_dropout_prob": 0.1, "hidden_act": "gelu", "hidden_dropout_prob": 0.1, "hidden_size": 768, "id2label": { "0": "cs.AI", "1": "cs.AR", "2": "cs.CC", "3": "cs.CE", "4": "cs.CG", "5": "cs.CL", "6": "cs.CR", "7": "cs.CV", "8": "cs.CY", "9": "cs.DB", "10": "cs.DC", "11": "cs.DL", "12": "cs.DM", "13": "cs.DS", "14": "cs.ET", "15": "cs.FL", "16": "cs.GL", "17": "cs.GR", "18": "cs.GT", "19": "cs.HC", "20": "cs.IR", "21": "cs.IT", "22": "cs.LG", "23": "cs.LO", "24": "cs.MA", "25": "cs.MM", "26": "cs.MS", "27": "cs.NA", "28": "cs.NE", "29": "cs.NI", "30": "cs.OH", "31": "cs.OS", "32": "cs.PF", "33": "cs.PL", "34": "cs.RO", "35": "cs.SC", "36": "cs.SD", "37": "cs.SE", "38": "cs.SI", "39": "cs.SY", "40": "econ.EM", "41": "econ.GN", "42": "econ.TH", "43": "eess.AS", "44": "eess.IV", "45": "eess.SP", "46": "eess.SY", "47": "math.AC", "48": "math.AG", "49": "math.AP", "50": "math.AT", "51": "math.CA", "52": "math.CO", "53": "math.CT", "54": "math.CV", "55": "math.DG", "56": "math.DS", "57": "math.FA", "58": "math.GM", "59": "math.GN", "60": "math.GR", "61": "math.GT", "62": "math.HO", "63": "math.IT", "64": "math.KT", "65": "math.LO", "66": "math.MG", "67": "math.MP", "68": "math.NA", "69": "math.NT", "70": "math.OA", "71": "math.OC", "72": "math.PR", "73": "math.QA", "74": "math.RA", "75": "math.RT", "76": "math.SG", "77": "math.SP", "78": "math.ST", "79": "astro-ph.CO", "80": "astro-ph.EP", "81": "astro-ph.GA", "82": "astro-ph.HE", "83": "astro-ph.IM", "84": "astro-ph.SR", "85": "cond-mat.dis-nn", "86": "cond-mat.mes-hall", "87": "cond-mat.mtrl-sci", "88": "cond-mat.other", "89": "cond-mat.quant-gas", "90": "cond-mat.soft", "91": "cond-mat.stat-mech", "92": "cond-mat.str-el", "93": "cond-mat.supr-con", "94": "gr-qc", "95": "hep-ex", "96": "hep-lat", "97": "hep-ph", "98": "hep-th", "99": "math-ph", "100": "nlin.AO", "101": "nlin.CD", "102": "nlin.CG", "103": "nlin.PS", "104": "nlin.SI", "105": "nucl-ex", "106": "nucl-th", "107": "physics.acc-ph", "108": "physics.ao-ph", "109": "physics.app-ph", "110": "physics.atm-clus", "111": "physics.atom-ph", "112": "physics.bio-ph", "113": "physics.chem-ph", "114": "physics.class-ph", "115": "physics.comp-ph", "116": "physics.data-an", "117": "physics.ed-ph", "118": "physics.flu-dyn", "119": "physics.gen-ph", "120": "physics.geo-ph", "121": "physics.hist-ph", "122": "physics.ins-det", "123": "physics.med-ph", "124": "physics.optics", "125": "physics.plasm-ph", "126": "physics.pop-ph", "127": "physics.soc-ph", "128": "physics.space-ph", "129": "quant-ph", "130": "q-bio.BM", "131": "q-bio.CB", "132": "q-bio.GN", "133": "q-bio.MN", "134": "q-bio.NC", "135": "q-bio.OT", "136": "q-bio.PE", "137": "q-bio.QM", "138": "q-bio.SC", "139": "q-bio.TO", "140": "q-fin.CP", "141": "q-fin.EC", "142": "q-fin.GN", "143": "q-fin.MF", "144": "q-fin.PM", "145": "q-fin.PR", "146": "q-fin.RM", "147": "q-fin.ST", "148": "q-fin.TR", "149": "stat.AP", "150": "stat.CO", "151": "stat.ME", "152": "stat.ML", "153": "stat.OT", "154": "stat.TH" }, "initializer_range": 0.02, "intermediate_size": 3072, "label2id": { "astro-ph.CO": 79, "astro-ph.EP": 80, "astro-ph.GA": 81, "astro-ph.HE": 82, "astro-ph.IM": 83, "astro-ph.SR": 84, "cond-mat.dis-nn": 85, "cond-mat.mes-hall": 86, "cond-mat.mtrl-sci": 87, "cond-mat.other": 88, "cond-mat.quant-gas": 89, "cond-mat.soft": 90, "cond-mat.stat-mech": 91, "cond-mat.str-el": 92, "cond-mat.supr-con": 93, "cs.AI": 0, "cs.AR": 1, "cs.CC": 2, "cs.CE": 3, "cs.CG": 4, "cs.CL": 5, "cs.CR": 6, "cs.CV": 7, "cs.CY": 8, "cs.DB": 9, "cs.DC": 10, "cs.DL": 11, "cs.DM": 12, "cs.DS": 13, "cs.ET": 14, "cs.FL": 15, "cs.GL": 16, "cs.GR": 17, "cs.GT": 18, "cs.HC": 19, "cs.IR": 20, "cs.IT": 21, "cs.LG": 22, "cs.LO": 23, "cs.MA": 24, "cs.MM": 25, "cs.MS": 26, "cs.NA": 27, "cs.NE": 28, "cs.NI": 29, "cs.OH": 30, "cs.OS": 31, "cs.PF": 32, "cs.PL": 33, "cs.RO": 34, "cs.SC": 35, "cs.SD": 36, "cs.SE": 37, "cs.SI": 38, "cs.SY": 39, "econ.EM": 40, "econ.GN": 41, "econ.TH": 42, "eess.AS": 43, "eess.IV": 44, "eess.SP": 45, "eess.SY": 46, "gr-qc": 94, "hep-ex": 95, "hep-lat": 96, "hep-ph": 97, "hep-th": 98, "math-ph": 99, "math.AC": 47, "math.AG": 48, "math.AP": 49, "math.AT": 50, "math.CA": 51, "math.CO": 52, "math.CT": 53, "math.CV": 54, "math.DG": 55, "math.DS": 56, "math.FA": 57, "math.GM": 58, "math.GN": 59, "math.GR": 60, "math.GT": 61, "math.HO": 62, "math.IT": 63, "math.KT": 64, "math.LO": 65, "math.MG": 66, "math.MP": 67, "math.NA": 68, "math.NT": 69, "math.OA": 70, "math.OC": 71, "math.PR": 72, "math.QA": 73, "math.RA": 74, "math.RT": 75, "math.SG": 76, "math.SP": 77, "math.ST": 78, "nlin.AO": 100, "nlin.CD": 101, "nlin.CG": 102, "nlin.PS": 103, "nlin.SI": 104, "nucl-ex": 105, "nucl-th": 106, "physics.acc-ph": 107, "physics.ao-ph": 108, "physics.app-ph": 109, "physics.atm-clus": 110, "physics.atom-ph": 111, "physics.bio-ph": 112, "physics.chem-ph": 113, "physics.class-ph": 114, "physics.comp-ph": 115, "physics.data-an": 116, "physics.ed-ph": 117, "physics.flu-dyn": 118, "physics.gen-ph": 119, "physics.geo-ph": 120, "physics.hist-ph": 121, "physics.ins-det": 122, "physics.med-ph": 123, "physics.optics": 124, "physics.plasm-ph": 125, "physics.pop-ph": 126, "physics.soc-ph": 127, "physics.space-ph": 128, "q-bio.BM": 130, "q-bio.CB": 131, "q-bio.GN": 132, "q-bio.MN": 133, "q-bio.NC": 134, "q-bio.OT": 135, "q-bio.PE": 136, "q-bio.QM": 137, "q-bio.SC": 138, "q-bio.TO": 139, "q-fin.CP": 140, "q-fin.EC": 141, "q-fin.GN": 142, "q-fin.MF": 143, "q-fin.PM": 144, "q-fin.PR": 145, "q-fin.RM": 146, "q-fin.ST": 147, "q-fin.TR": 148, "quant-ph": 129, "stat.AP": 149, "stat.CO": 150, "stat.ME": 151, "stat.ML": 152, "stat.OT": 153, "stat.TH": 154 }, "layer_norm_eps": 1e-07, "max_position_embeddings": 512, "max_relative_positions": -1, "model_type": "deberta-v2", "norm_rel_ebd": "layer_norm", "num_attention_heads": 12, "num_hidden_layers": 12, "pad_token_id": 0, "pooler_dropout": 0, "pooler_hidden_act": "gelu", "pooler_hidden_size": 768, "pos_att_type": [ "p2c", "c2p" ], "position_biased_input": false, "position_buckets": 256, "relative_attention": true, "share_att_key": true, "torch_dtype": "float32", "transformers_version": "4.26.0", "type_vocab_size": 0, "vocab_size": 128100 }