lt-historicjapan-supcon / LT_training_config.json
96abhishekarora's picture
Updated the model with improved training and evaluation. Test and validation data are included as pickle files. Older legacy files were removed to avoid confusion.
6aa6cec
raw
history blame
1.09 kB
{
"model_save_dir": "models",
"model_save_name": "lt-historicjapanesecompanies-comp-prod-ind_supcon_full",
"opt_model_description": "This model was trained on a dataset of historic Japanese companies, products, industry, addresses, and shareholders. Take a look at our paper for more details. The task is to link indices of japanese companies",
"opt_model_lang": "ja",
"train_batch_size": 64,
"num_epochs": 50,
"warm_up_perc": 1,
"learning_rate": 2e-05,
"loss_type": "supcon",
"val_perc": 0.2,
"wandb_names": {
"id": "econabhishek",
"run": "lt-historicjapanesecompanies-comp-prod-ind_supcon_full",
"project": "linkage",
"entity": "econabhishek"
},
"add_pooling_layer": false,
"large_val": true,
"eval_steps_perc": 0.5,
"test_at_end": true,
"save_val_test_pickles": true,
"val_query_prop": 0.5,
"loss_params": {},
"eval_type": "classification",
"training_dataset": "dataframe",
"base_model_path": "oshizo/sbert-jsnli-luke-japanese-base-lite",
"best_model_path": "models/lt-historicjapanesecompanies-comp-prod-ind_supcon_full"
}