{
  "_CHeeSEArguments": "CHeeSEArguments",
  "model_name_or_path": "LennartKeller/nystromformer-gottbert-base-8192",
  "dataset_path": "./dataset.py",
  "metric_path": "./metric.py",
  "task": "stance_detection",
  "first_sentence_inputs": [
    "question"
  ],
  "second_sentence_inputs": [
    "title",
    "snippet",
    "paragraphs"
  ],
  "labels_to_predict": [
    "stance"
  ],
  "_CHeeSETrainingArguments": "CHeeSETrainingArguments",
  "do_train": true,
  "do_eval": true,
  "do_predict": true,
  "do_cross_validation": false,
  "output_dir": "/netscratch/schnitzler/nystromformer-8",
  "logging_dir": "/netscratch/schnitzler/nystromformer-8",
  "save_total_limit": 3,
  "log_to_file": true,
  "logging_strategy": "steps",
  "logging_steps": 50,
  "cross_validation_folds": 5,
  "save_steps": 1000,
  "evaluation_strategy": "steps",
  "eval_steps": 500,
  "seed": 121,
  "num_train_epochs": 4,
  "per_device_train_batch_size": 8,
  "per_device_eval_batch_size": 8,
  "learning_rate": 3e-05,
  "prediction_csv_kwargs": {
    "index": false
  },
  "prediction_columns_to_include": [
    "title",
    "snippet",
    "paragraphs",
    "question",
    "labels",
    "stance"
  ],
  "overwrite_output_dir": true
}