File size: 713 Bytes
2428af1 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 |
# Parser training configuration: layer sizes, input lexers and
# optimisation hyperparameters.

# Layer dimensions
# Sizes of the MLP input and of the hidden layers for the tag, arc and
# label components (presumably tagger / arc scorer / label scorer —
# confirm against the consuming tool).
mlp_input: 1024
mlp_tag_hidden: 16
mlp_arc_hidden: 512
mlp_lab_hidden: 128

# Lexers
# One list entry per lexer. Every entry carries a `name` and a `type`;
# the remaining keys are settings specific to that lexer type.
lexers:
  - name: word_embeddings
    type: words
    embedding_size: 256
    word_dropout: 0.5
  - name: char_level_embeddings
    type: chars_rnn
    embedding_size: 64
    lstm_output_size: 128
  - name: fasttext
    type: fasttext
  - name: camembertav2_base_p2_17k_last_layer
    type: bert
    # NOTE(review): absolute, machine-specific checkpoint path; this config
    # only works where that directory exists.
    model: /scratch/camembertv2/runs/models/camembertav2-base-bf16/post/ckpt-p2-17000/pt/discriminator/
    # Single layer selected; the lexer name suggests this is the last
    # layer of the model — TODO confirm the indexing convention.
    layers: [11]
    subwords_reduction: "mean"

# Training hyperparameters
encoder_dropout: 0.5
mlp_dropout: 0.5
batch_size: 8
epochs: 64
# Learning rate: a base value plus a schedule description.
lr:
  base: 0.00003
  schedule:
    shape: linear
    warmup_steps: 100
|