boris committed on
Commit
79557f9
1 Parent(s): 3d64598

feat: update configs

Browse files
tools/train/config/medium/config.json CHANGED
@@ -4,17 +4,17 @@
4
  "attention_dropout": 0.0,
5
  "bos_token_id": 16385,
6
  "classifier_dropout": 0.0,
7
- "d_model": 1536,
8
  "decoder_attention_heads": 16,
9
  "decoder_ffn_dim": 4096,
10
  "decoder_layerdrop": 0.0,
11
- "decoder_layers": 18,
12
  "decoder_start_token_id": 16384,
13
- "dropout": 0.1,
14
  "encoder_attention_heads": 16,
15
  "encoder_ffn_dim": 4096,
16
  "encoder_layerdrop": 0.0,
17
- "encoder_layers": 18,
18
  "encoder_vocab_size": 50264,
19
  "eos_token_id": 16385,
20
  "gradient_checkpointing": false,
 
4
  "attention_dropout": 0.0,
5
  "bos_token_id": 16385,
6
  "classifier_dropout": 0.0,
7
+ "d_model": 1408,
8
  "decoder_attention_heads": 16,
9
  "decoder_ffn_dim": 4096,
10
  "decoder_layerdrop": 0.0,
11
+ "decoder_layers": 14,
12
  "decoder_start_token_id": 16384,
13
+ "dropout": 0.0,
14
  "encoder_attention_heads": 16,
15
  "encoder_ffn_dim": 4096,
16
  "encoder_layerdrop": 0.0,
17
+ "encoder_layers": 14,
18
  "encoder_vocab_size": 50264,
19
  "eos_token_id": 16385,
20
  "gradient_checkpointing": false,
tools/train/config/micro/config.json CHANGED
@@ -8,13 +8,13 @@
8
  "decoder_attention_heads": 16,
9
  "decoder_ffn_dim": 2048,
10
  "decoder_layerdrop": 0.0,
11
- "decoder_layers": 6,
12
  "decoder_start_token_id": 16384,
13
- "dropout": 0.1,
14
  "encoder_attention_heads": 16,
15
  "encoder_ffn_dim": 2048,
16
  "encoder_layerdrop": 0.0,
17
- "encoder_layers": 6,
18
  "encoder_vocab_size": 50264,
19
  "eos_token_id": 16385,
20
  "gradient_checkpointing": false,
 
8
  "decoder_attention_heads": 16,
9
  "decoder_ffn_dim": 2048,
10
  "decoder_layerdrop": 0.0,
11
+ "decoder_layers": 2,
12
  "decoder_start_token_id": 16384,
13
+ "dropout": 0.0,
14
  "encoder_attention_heads": 16,
15
  "encoder_ffn_dim": 2048,
16
  "encoder_layerdrop": 0.0,
17
+ "encoder_layers": 2,
18
  "encoder_vocab_size": 50264,
19
  "eos_token_id": 16385,
20
  "gradient_checkpointing": false,
tools/train/config/mini/config.json CHANGED
@@ -10,7 +10,7 @@
10
  "decoder_layerdrop": 0.0,
11
  "decoder_layers": 12,
12
  "decoder_start_token_id": 16384,
13
- "dropout": 0.1,
14
  "encoder_attention_heads": 16,
15
  "encoder_ffn_dim": 4096,
16
  "encoder_layerdrop": 0.0,
 
10
  "decoder_layerdrop": 0.0,
11
  "decoder_layers": 12,
12
  "decoder_start_token_id": 16384,
13
+ "dropout": 0.0,
14
  "encoder_attention_heads": 16,
15
  "encoder_ffn_dim": 4096,
16
  "encoder_layerdrop": 0.0,