meghanaraok / HiLAT_50

Inference Endpoints

Model card | Files and versions | Community

HiLAT_50 / config.json

meghanaraok's picture

Upload 2 files

0640e01 verified 9 months ago

history blame contribute delete

1.75 kB

	{
	"model_name_or_path": "pretrained/ClinicalplusXLNet/",
	"tokenizer_name": "xlnet-base-cased",
	"output_dir": "../model/",
	"overwrite_output_dir": true,

	"task_name": "mimic3-50",
	"max_seq_length": 512,
	"train_file": "../data/mimic3/50/train_data_50_level_1_new.csv",
	"validation_file": "../data/mimic3/50/dev_data_50_level_1_new.csv",
	"test_file": "../data/mimic3/50/test_data_50_level_1_new.csv",
	"label_dictionary_file": "../data/mimic3/50/labels_dictionary_50_level_1.csv",
	"ignore_keys_for_eval": ["preds", "label_attention_weights", "chunk_attention_weights"],
	"use_cached_datasets": true,
	"data_segmented": false,
	"lazy_loading": false,

	"d_model": 768,
	"dropout": 0.1,
	"dropout_att": 0.1,
	"num_chunks_per_document": 10,
	"transformer_layer_update_strategy": "all",
	"use_code_representation": false,
	"multi_head_attention": false,
	"chunk_attention": true,
	"multi_head_chunk_attention": false,
	"linear_init_mean": 0.0,
	"linear_init_std": 0.03,
	"document_pooling_strategy": "mean",

	"do_train": true,
	"do_eval": true,
	"do_predict": true,
	"evaluation_strategy": "steps",
	"per_device_train_batch_size": 4,
	"per_device_eval_batch_size": 4,
	"gradient_accumulation_steps": 1,
	"learning_rate": 5e-5,
	"weight_decay": 0.1,
	"num_train_epochs": 100,
	"max_steps": 10000,
	"warmup_steps": 500,
	"log_level": "error",
	"logging_strategy": "steps",
	"logging_steps": 500,
	"save_strategy": "steps",
	"save_steps": 500,
	"seed": 2022,
	"dataloader_drop_last": false,
	"disable_tqdm": false,
	"label_names": ["targets"],
	"load_best_model_at_end": false,
	"metric_for_best_model": "micro_f1",
	"greater_is_better": true,
	"remove_unused_columns": false,
	"report_to": "none"
	}