{
"_name_or_path": "Yozhikoff/arxiv-topics-distilbert-base-cased",
"activation": "gelu",
"architectures": [
"DistilBertForSequenceClassification"
],
"attention_dropout": 0.1,
"dim": 768,
"dropout": 0.1,
"hidden_dim": 3072,
"id2label": {
"0": "Computer Vision and Pattern Recognition",
"1": "Machine Learning",
"2": "Artificial Intelligence",
"3": "Machine Learning",
"4": "Computation and Language",
"5": "Neural and Evolutionary Computing",
"6": "Information Retrieval",
"7": "Optimization and Control",
"8": "Robotics",
"9": "Logic in Computer Science",
"10": "Social and Information Networks",
"11": "Data Structures and Algorithms",
"12": "Information Theory",
"13": "Information Theory",
"14": "Quantitative Biology - Neurons and Cognition",
"15": "Methodology",
"16": "Human-Computer Interaction",
"17": "Cryptography and Security",
"18": "Distributed, Parallel, and Cluster Computing",
"19": "Sound",
"20": "Computers and Society",
"21": "Applications",
"22": "Multimedia",
"23": "Statistics Theory",
"24": "Statistics Theory",
"25": "Databases",
"26": "Computer Science and Game Theory",
"27": "Natural Language Processing",
"28": "Physics and Society",
"29": "Computational Engineering, Finance, and Science",
"30": "Systems and Control",
"31": "Multiagent Systems",
"32": "Combinatorics",
"33": "Numerical Analysis",
"34": "Quantitative Biology - Quantitative Methods",
"35": "Graphics",
"36": "Computational Complexity",
"37": "Data Analysis, Statistics and Probability",
"38": "Software Engineering",
"39": "Numerical Analysis",
"40": "Probability",
"41": "Quantum Physics",
"42": "Digital Libraries",
"43": "Networking and Internet Architecture",
"44": "Learning",
"45": "Programming Languages",
"46": "Disordered Systems and Neural Networks",
"47": "Adaptation and Self-Organizing Systems",
"48": "Computation and Language",
"49": "Discrete Mathematics"
},
"initializer_range": 0.02,
"label2id": {
"LABEL_0": 0,
"LABEL_1": 1,
"LABEL_10": 10,
"LABEL_11": 11,
"LABEL_12": 12,
"LABEL_13": 13,
"LABEL_14": 14,
"LABEL_15": 15,
"LABEL_16": 16,
"LABEL_17": 17,
"LABEL_18": 18,
"LABEL_19": 19,
"LABEL_2": 2,
"LABEL_20": 20,
"LABEL_21": 21,
"LABEL_22": 22,
"LABEL_23": 23,
"LABEL_24": 24,
"LABEL_25": 25,
"LABEL_26": 26,
"LABEL_27": 27,
"LABEL_28": 28,
"LABEL_29": 29,
"LABEL_3": 3,
"LABEL_30": 30,
"LABEL_31": 31,
"LABEL_32": 32,
"LABEL_33": 33,
"LABEL_34": 34,
"LABEL_35": 35,
"LABEL_36": 36,
"LABEL_37": 37,
"LABEL_38": 38,
"LABEL_39": 39,
"LABEL_4": 4,
"LABEL_40": 40,
"LABEL_41": 41,
"LABEL_42": 42,
"LABEL_43": 43,
"LABEL_44": 44,
"LABEL_45": 45,
"LABEL_46": 46,
"LABEL_47": 47,
"LABEL_48": 48,
"LABEL_49": 49,
"LABEL_5": 5,
"LABEL_6": 6,
"LABEL_7": 7,
"LABEL_8": 8,
"LABEL_9": 9
},
"max_position_embeddings": 512,
"model_type": "distilbert",
"n_heads": 12,
"n_layers": 6,
"output_past": true,
"pad_token_id": 0,
"problem_type": "multi_label_classification",
"qa_dropout": 0.1,
"seq_classif_dropout": 0.2,
"sinusoidal_pos_embds": false,
"tie_weights_": true,
"torch_dtype": "float32",
"transformers_version": "4.27.4",
"vocab_size": 28996
}