andrespm committed on
Commit
93f59bf
1 Parent(s): 3165be8

Update config.json

Browse files
Files changed (1) hide show
  1. config.json +51 -20
config.json CHANGED
@@ -1,12 +1,18 @@
1
  {
2
- "_name_or_path": "facebook/wav2vec2-large-xlsr-53",
3
- "activation_dropout": 0.0,
 
 
 
4
  "apply_spec_augment": true,
5
  "architectures": [
6
  "Wav2Vec2ForCTC"
7
  ],
8
- "attention_dropout": 0.1,
9
  "bos_token_id": 1,
 
 
 
10
  "conv_bias": true,
11
  "conv_dim": [
12
  512,
@@ -37,40 +43,65 @@
37
  ],
38
  "ctc_loss_reduction": "mean",
39
  "ctc_zero_infinity": false,
 
40
  "do_stable_layer_norm": true,
41
  "eos_token_id": 2,
42
  "feat_extract_activation": "gelu",
43
  "feat_extract_dropout": 0.0,
44
  "feat_extract_norm": "layer",
45
- "feat_proj_dropout": 0.0,
 
46
  "final_dropout": 0.0,
47
- "gradient_checkpointing": true,
48
  "hidden_act": "gelu",
49
- "hidden_dropout": 0.1,
50
  "hidden_size": 1024,
51
  "initializer_range": 0.02,
52
  "intermediate_size": 4096,
53
  "layer_norm_eps": 1e-05,
54
- "layerdrop": 0.1,
55
- "mask_channel_length": 10,
56
- "mask_channel_min_space": 1,
57
- "mask_channel_other": 0.0,
58
- "mask_channel_prob": 0.0,
59
- "mask_channel_selection": "static",
60
  "mask_feature_length": 10,
 
61
  "mask_feature_prob": 0.0,
62
  "mask_time_length": 10,
63
- "mask_time_min_space": 1,
64
- "mask_time_other": 0.0,
65
- "mask_time_prob": 0.05,
66
- "mask_time_selection": "static",
67
  "model_type": "wav2vec2",
 
68
  "num_attention_heads": 16,
 
 
69
  "num_conv_pos_embedding_groups": 16,
70
  "num_conv_pos_embeddings": 128,
71
  "num_feat_extract_layers": 7,
72
  "num_hidden_layers": 24,
73
- "pad_token_id": 34,
74
- "transformers_version": "4.4.0",
75
- "vocab_size": 35
76
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  {
2
+ "_name_or_path": "facebook/wav2vec2-xls-r-300m",
3
+ "activation_dropout": 0.04,
4
+ "adapter_kernel_size": 3,
5
+ "adapter_stride": 2,
6
+ "add_adapter": false,
7
  "apply_spec_augment": true,
8
  "architectures": [
9
  "Wav2Vec2ForCTC"
10
  ],
11
+ "attention_dropout": 0.01,
12
  "bos_token_id": 1,
13
+ "classifier_proj_size": 256,
14
+ "codevector_dim": 768,
15
+ "contrastive_logits_temperature": 0.1,
16
  "conv_bias": true,
17
  "conv_dim": [
18
  512,
 
43
  ],
44
  "ctc_loss_reduction": "mean",
45
  "ctc_zero_infinity": false,
46
+ "diversity_loss_weight": 0.1,
47
  "do_stable_layer_norm": true,
48
  "eos_token_id": 2,
49
  "feat_extract_activation": "gelu",
50
  "feat_extract_dropout": 0.0,
51
  "feat_extract_norm": "layer",
52
+ "feat_proj_dropout": 0.04,
53
+ "feat_quantizer_dropout": 0.0,
54
  "final_dropout": 0.0,
 
55
  "hidden_act": "gelu",
56
+ "hidden_dropout": 0.04,
57
  "hidden_size": 1024,
58
  "initializer_range": 0.02,
59
  "intermediate_size": 4096,
60
  "layer_norm_eps": 1e-05,
61
+ "layerdrop": 0.04,
 
 
 
 
 
62
  "mask_feature_length": 10,
63
+ "mask_feature_min_masks": 0,
64
  "mask_feature_prob": 0.0,
65
  "mask_time_length": 10,
66
+ "mask_time_min_masks": 2,
67
+ "mask_time_prob": 0.04,
 
 
68
  "model_type": "wav2vec2",
69
+ "num_adapter_layers": 3,
70
  "num_attention_heads": 16,
71
+ "num_codevector_groups": 2,
72
+ "num_codevectors_per_group": 320,
73
  "num_conv_pos_embedding_groups": 16,
74
  "num_conv_pos_embeddings": 128,
75
  "num_feat_extract_layers": 7,
76
  "num_hidden_layers": 24,
77
+ "num_negatives": 100,
78
+ "output_hidden_size": 1024,
79
+ "pad_token_id": 38,
80
+ "proj_codevector_dim": 768,
81
+ "tdnn_dilation": [
82
+ 1,
83
+ 2,
84
+ 3,
85
+ 1,
86
+ 1
87
+ ],
88
+ "tdnn_dim": [
89
+ 512,
90
+ 512,
91
+ 512,
92
+ 512,
93
+ 1500
94
+ ],
95
+ "tdnn_kernel": [
96
+ 5,
97
+ 3,
98
+ 3,
99
+ 1,
100
+ 1
101
+ ],
102
+ "torch_dtype": "float32",
103
+ "transformers_version": "4.16.1",
104
+ "use_weighted_layer_sum": false,
105
+ "vocab_size": 39,
106
+ "xvector_output_dim": 512
107
+ }