File size: 475 Bytes
3bcee60 d957b41 b1ad6b7 d957b41 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 |
# Model configuration for the entry named `t5_text_generation`.
# NOTE(review): the key names below look like Hugging Face `T5Config`
# fields; the consumer is not visible from this file — confirm before
# relying on that library's defaults or semantics.
name: t5_text_generation
config_type: model

# Vocabulary and layer dimensions.
# NOTE(review): vocab_size presumably has to match the tokenizer that is
# paired with this model — verify against the tokenizer config.
vocab_size: 32103
# num_heads * d_kv (12 * 64) equals d_model (768) with these values.
d_model: 768
d_kv: 64
d_ff: 2048
# Both layer counts are set to 12.
# NOTE(review): presumably num_layers is the encoder depth and
# num_decoder_layers the decoder depth — confirm with the consumer.
num_layers: 12
num_decoder_layers: 12
num_heads: 12

# Relative-attention bucketing parameters.
relative_attention_num_buckets: 32
relative_attention_max_distance: 128

# Regularization, normalization and initialization.
dropout_rate: 0.1
# Keep the decimal point and the signed exponent: some YAML 1.1 loaders
# resolve shorter spellings such as `1e-6` as a string instead of a float.
layer_norm_epsilon: 1.0e-06
initializer_factor: 1.0

# Feed-forward variant selector; the value is a plain string.
feed_forward_proj: gated-gelu

# Boolean switches, written as canonical lowercase YAML booleans.
is_encoder_decoder: true
tie_word_embeddings: false
use_cache: true

# Special token ids. pad_token_id and decoder_start_token_id are both 0.
pad_token_id: 0
decoder_start_token_id: 0
eos_token_id: 1

# Length bounds.
# NOTE(review): presumably applied to generated sequences, counted in
# tokens — confirm against the generation code.
min_length: 0
max_length: 100
|