lt-historicjapan-onlinecontrastive / LT_training_config.json
96abhishekarora's picture
Updated model with better training and evaluation. Test and val data included as pickle files. Older legacy files were removed to avoid confusion.
2999c7f
{
"model_save_dir": "models",
"model_save_name": "lt-historicjapanesecompanies-comp-prod-ind_onlinecontrastive_full",
"opt_model_description": "This model was trained on a dataset of historic Japanese companies, products, industry, addresses, and shareholders. Take a look at our paper for more details. The task is to link indices of Japanese companies.",
"opt_model_lang": "ja",
"train_batch_size": 64,
"num_epochs": 50,
"warm_up_perc": 1,
"learning_rate": 2e-05,
"loss_type": "onlinecontrastive",
"val_perc": 0.2,
"wandb_names": {
"id": "econabhishek",
"run": "lt-historicjapanesecompanies-comp-prod-ind_onlinecontrastive_full",
"project": "linkage",
"entity": "econabhishek"
},
"add_pooling_layer": false,
"large_val": true,
"eval_steps_perc": 0.5,
"test_at_end": true,
"save_val_test_pickles": true,
"val_query_prop": 0.5,
"loss_params": {},
"eval_type": "classification",
"training_dataset": "dataframe",
"base_model_path": "oshizo/sbert-jsnli-luke-japanese-base-lite",
"best_model_path": "models/lt-historicjapanesecompanies-comp-prod-ind_onlinecontrastive_full"
}