# Layer dimensions
mlp_input: 1024
mlp_tag_hidden: 16
mlp_arc_hidden: 512
mlp_lab_hidden: 128

# Lexers: one list entry per input representation; each entry has a unique
# `name` and a `type` selecting the kind of lexer.
lexers:
  - name: word_embeddings
    type: words
    embedding_size: 256
    word_dropout: 0.5
  - name: char_level_embeddings
    type: chars_rnn
    embedding_size: 64
    lstm_output_size: 128
  - name: fasttext
    type: fasttext
  - name: camembertav2_base_p2_17k_last_layer
    type: bert
    # NOTE(review): absolute path on a machine-local /scratch filesystem; this
    # config is not portable as-is. Confirm the checkpoint exists where it runs.
    model: /scratch/camembertv2/runs/models/camembertav2-base-bf16/post/ckpt-p2-17000/pt/discriminator/
    # Presumably index 11 is the last layer of a 12-layer base model (the entry
    # name says "last_layer"). TODO confirm against the checkpoint.
    layers: [11]
    subwords_reduction: "mean"

# Training hyperparameters
encoder_dropout: 0.5
mlp_dropout: 0.5
batch_size: 8
epochs: 64
lr:
  base: 0.00003
  schedule:
    shape: linear
    warmup_steps: 100