Image-to-Text
Transformers
PyTorch
donut
vision
Eval Results
hmarzan's picture
First version of Donut DR Matriculas
4d03da9
raw
history blame contribute delete
720 Bytes
# Checkpoint, output, and base-model locations.
# `null` marks "no value". The Python-style word `None` is not a YAML null:
# it loads as the 4-character string "None", which a consumer would treat
# as a literal path.
resume_from_checkpoint_path: null
# Output location — presumably resolved relative to the launch directory;
# confirm against the training script.
result_path: 'trainer/result'
# Model name or path to start from (NOTE(review): looks like a model-hub
# repository id — confirm).
pretrained_model_name_or_path: 'marzanconsulting/donut-dr-matriculas-ocr'
# Dataset sources and per-dataset settings. Each list below holds exactly
# one entry; presumably the lists are matched up by position — confirm
# before adding a second dataset.
dataset_name_or_paths:
- 'trainer/dataset'
# Start token(s) for the task, kept as quoted literal strings.
task_start_tokens:
- '<s_matricula>'
# Canonical lowercase boolean (same value as the former `False`).
sort_json_key: false
train_batch_sizes:
- 5
val_batch_sizes:
- 1
# Input geometry and sequence-length limits.
# Two-element size; NOTE(review): axis order (height/width) is not stated
# here — confirm against the consumer before changing.
input_size:
- 960
- 1280
# The two limits below are set to the same value in this file.
max_length: 868
max_position_embeddings: 868
# Canonical lowercase boolean (same value as the former `False`).
align_long_axis: false
# Trainer / optimisation settings.
num_nodes: 1
seed: 2022
# Written with an explicit decimal point so that YAML 1.1 resolvers
# (e.g. PyYAML) also load it as a float; the dot-less form `3e-05` is read
# as a string there. The numeric value is unchanged.
lr: 3.0e-05
warmup_steps: 300
num_training_samples_per_epoch: 800
max_epochs: 50
# NOTE(review): -1 presumably means "no step limit" — confirm.
max_steps: -1
num_workers: 12
val_check_interval: 1.0
check_val_every_n_epoch: 3
gradient_clip_val: 1.0
# Canonical lowercase boolean (same value as the former `True`).
verbose: true
# Output directories and experiment identity.
# The two entries below are explicitly empty strings.
model_dir: ''
tensorboard_dir: ''
# Explicit null: a bare `checkpoint_dir:` parses to null as well, but reads
# as if a value were forgotten. NOTE(review): if an empty string was
# intended (as for the two keys above), use '' instead.
checkpoint_dir: null
exp_name: 'train_cord_matriculas'
exp_version: 'mmc_v1'