Updated the model with better training and evaluation. Test and validation data are included as pickle files. Older legacy files were removed to avoid confusion.
2999c7f
{ | |
"model_save_dir": "models", | |
"model_save_name": "lt-historicjapanesecompanies-comp-prod-ind_onlinecontrastive_full", | |
"opt_model_description": "This model was trained on a dataset of historic Japanese companies, products, industry, addresses, and shareholders. Take a look at our paper for more details. The task is to link indices of Japanese companies.", | |
"opt_model_lang": "ja", | |
"train_batch_size": 64, | |
"num_epochs": 50, | |
"warm_up_perc": 1, | |
"learning_rate": 2e-05, | |
"loss_type": "onlinecontrastive", | |
"val_perc": 0.2, | |
"wandb_names": { | |
"id": "econabhishek", | |
"run": "lt-historicjapanesecompanies-comp-prod-ind_onlinecontrastive_full", | |
"project": "linkage", | |
"entity": "econabhishek" | |
}, | |
"add_pooling_layer": false, | |
"large_val": true, | |
"eval_steps_perc": 0.5, | |
"test_at_end": true, | |
"save_val_test_pickles": true, | |
"val_query_prop": 0.5, | |
"loss_params": {}, | |
"eval_type": "classification", | |
"training_dataset": "dataframe", | |
"base_model_path": "oshizo/sbert-jsnli-luke-japanese-base-lite", | |
"best_model_path": "models/lt-historicjapanesecompanies-comp-prod-ind_onlinecontrastive_full" | |
} |