{
"_name_or_path": "Yozhikoff/arxiv-topics-distilbert-base-cased",
"activation": "gelu",
"architectures": [
"DistilBertForSequenceClassification"
],
"attention_dropout": 0.1,
"dim": 768,
"dropout": 0.1,
"hidden_dim": 3072,
"id2label": {
"0": "Computer Vision and Pattern Recognition",
"1": "Machine Learning",
"2": "Artificial Intelligence",
"3": "Machine Learning",
"4": "Computation and Language",
"5": "Neural and Evolutionary Computing",
"6": "Information Retrieval",
"7": "Optimization and Control",
"8": "Robotics",
"9": "Logic in Computer Science",
"10": "Social and Information Networks",
"11": "Data Structures and Algorithms",
"12": "Information Theory",
"13": "Information Theory",
"14": "Quantitative Biology - Neurons and Cognition",
"15": "Methodology",
"16": "Human-Computer Interaction",
"17": "Cryptography and Security",
"18": "Distributed, Parallel, and Cluster Computing",
"19": "Sound",
"20": "Computers and Society",
"21": "Applications",
"22": "Multimedia",
"23": "Statistics Theory",
"24": "Statistics Theory",
"25": "Databases",
"26": "Computer Science and Game Theory",
"27": "Natural Language Processing",
"28": "Physics and Society",
"29": "Computational Engineering, Finance, and Science",
"30": "Systems and Control",
"31": "Multiagent Systems",
"32": "Combinatorics",
"33": "Numerical Analysis",
"34": "Quantitative Biology - Quantitative Methods",
"35": "Graphics",
"36": "Computational Complexity",
"37": "Data Analysis, Statistics and Probability",
"38": "Software Engineering",
"39": "Numerical Analysis",
"40": "Probability",
"41": "Quantum Physics",
"42": "Digital Libraries",
"43": "Networking and Internet Architecture",
"44": "Learning",
"45": "Programming Languages",
"46": "Disordered Systems and Neural Networks",
"47": "Adaptation and Self-Organizing Systems",
"48": "Computation and Language",
"49": "Discrete Mathematics"
},
"initializer_range": 0.02,
"label2id": {
"LABEL_0": 0,
"LABEL_1": 1,
"LABEL_10": 10,
"LABEL_11": 11,
"LABEL_12": 12,
"LABEL_13": 13,
"LABEL_14": 14,
"LABEL_15": 15,
"LABEL_16": 16,
"LABEL_17": 17,
"LABEL_18": 18,
"LABEL_19": 19,
"LABEL_2": 2,
"LABEL_20": 20,
"LABEL_21": 21,
"LABEL_22": 22,
"LABEL_23": 23,
"LABEL_24": 24,
"LABEL_25": 25,
"LABEL_26": 26,
"LABEL_27": 27,
"LABEL_28": 28,
"LABEL_29": 29,
"LABEL_3": 3,
"LABEL_30": 30,
"LABEL_31": 31,
"LABEL_32": 32,
"LABEL_33": 33,
"LABEL_34": 34,
"LABEL_35": 35,
"LABEL_36": 36,
"LABEL_37": 37,
"LABEL_38": 38,
"LABEL_39": 39,
"LABEL_4": 4,
"LABEL_40": 40,
"LABEL_41": 41,
"LABEL_42": 42,
"LABEL_43": 43,
"LABEL_44": 44,
"LABEL_45": 45,
"LABEL_46": 46,
"LABEL_47": 47,
"LABEL_48": 48,
"LABEL_49": 49,
"LABEL_5": 5,
"LABEL_6": 6,
"LABEL_7": 7,
"LABEL_8": 8,
"LABEL_9": 9
},
"max_position_embeddings": 512,
"model_type": "distilbert",
"n_heads": 12,
"n_layers": 6,
"output_past": true,
"pad_token_id": 0,
"problem_type": "multi_label_classification",
"qa_dropout": 0.1,
"seq_classif_dropout": 0.2,
"sinusoidal_pos_embds": false,
"tie_weights_": true,
"torch_dtype": "float32",
"transformers_version": "4.27.4",
"vocab_size": 28996
}