{
  "_name_or_path": "Yozhikoff/arxiv-topics-distilbert-base-cased",
  "activation": "gelu",
  "architectures": [
    "DistilBertForSequenceClassification"
  ],
  "attention_dropout": 0.1,
  "dim": 768,
  "dropout": 0.1,
  "hidden_dim": 3072,
  "id2label": {
    "0": "Computer Vision and Pattern Recognition",
    "1": "Machine Learning",
    "2": "Artificial Intelligence",
    "3": "Machine Learning",
    "4": "Computation and Language",
    "5": "Neural and Evolutionary Computing",
    "6": "Information Retrieval",
    "7": "Optimization and Control",
    "8": "Robotics",
    "9": "Logic in Computer Science",
    "10": "Social and Information Networks",
    "11": "Data Structures and Algorithms",
    "12": "Information Theory",
    "13": "Information Theory",
    "14": "Quantitative Biology - Neurons and Cognition",
    "15": "Methodology",
    "16": "Human-Computer Interaction",
    "17": "Cryptography and Security",
    "18": "Distributed, Parallel, and Cluster Computing",
    "19": "Sound",
    "20": "Computers and Society",
    "21": "Applications",
    "22": "Multimedia",
    "23": "Statistics Theory",
    "24": "Statistics Theory",
    "25": "Databases",
    "26": "Computer Science and Game Theory",
    "27": "Natural Language Processing",
    "28": "Physics and Society",
    "29": "Computational Engineering, Finance, and Science",
    "30": "Systems and Control",
    "31": "Multiagent Systems",
    "32": "Combinatorics",
    "33": "Numerical Analysis",
    "34": "Quantitative Biology - Quantitative Methods",
    "35": "Graphics",
    "36": "Computational Complexity",
    "37": "Data Analysis, Statistics and Probability",
    "38": "Software Engineering",
    "39": "Numerical Analysis",
    "40": "Probability",
    "41": "Quantum Physics",
    "42": "Digital Libraries",
    "43": "Networking and Internet Architecture",
    "44": "Learning",
    "45": "Programming Languages",
    "46": "Disordered Systems and Neural Networks",
    "47": "Adaptation and Self-Organizing Systems",
    "48": "Computation and Language",
    "49": "Discrete Mathematics"
  },
  "initializer_range": 0.02,
  "label2id": {
    "LABEL_0": 0,
    "LABEL_1": 1,
    "LABEL_10": 10,
    "LABEL_11": 11,
    "LABEL_12": 12,
    "LABEL_13": 13,
    "LABEL_14": 14,
    "LABEL_15": 15,
    "LABEL_16": 16,
    "LABEL_17": 17,
    "LABEL_18": 18,
    "LABEL_19": 19,
    "LABEL_2": 2,
    "LABEL_20": 20,
    "LABEL_21": 21,
    "LABEL_22": 22,
    "LABEL_23": 23,
    "LABEL_24": 24,
    "LABEL_25": 25,
    "LABEL_26": 26,
    "LABEL_27": 27,
    "LABEL_28": 28,
    "LABEL_29": 29,
    "LABEL_3": 3,
    "LABEL_30": 30,
    "LABEL_31": 31,
    "LABEL_32": 32,
    "LABEL_33": 33,
    "LABEL_34": 34,
    "LABEL_35": 35,
    "LABEL_36": 36,
    "LABEL_37": 37,
    "LABEL_38": 38,
    "LABEL_39": 39,
    "LABEL_4": 4,
    "LABEL_40": 40,
    "LABEL_41": 41,
    "LABEL_42": 42,
    "LABEL_43": 43,
    "LABEL_44": 44,
    "LABEL_45": 45,
    "LABEL_46": 46,
    "LABEL_47": 47,
    "LABEL_48": 48,
    "LABEL_49": 49,
    "LABEL_5": 5,
    "LABEL_6": 6,
    "LABEL_7": 7,
    "LABEL_8": 8,
    "LABEL_9": 9
  },
  "max_position_embeddings": 512,
  "model_type": "distilbert",
  "n_heads": 12,
  "n_layers": 6,
  "output_past": true,
  "pad_token_id": 0,
  "problem_type": "multi_label_classification",
  "qa_dropout": 0.1,
  "seq_classif_dropout": 0.2,
  "sinusoidal_pos_embds": false,
  "tie_weights_": true,
  "torch_dtype": "float32",
  "transformers_version": "4.27.4",
  "vocab_size": 28996
}