{ "add_postnet": true, "architectures": [ "FastSpeech2Model" ], "attention_dropout": 0, "decoder_attention_heads": 2, "decoder_embed_dim": 256, "decoder_layers": 4, "encoder_attention_heads": 2, "encoder_embed_dim": 256, "encoder_layers": 4, "energy_max": 5.646703243255615, "energy_min": -3.548804759979248, "fft_dropout": 0.2, "fft_hidden_dim": 1024, "fft_kernel_size": 9, "initializer_range": 0.0625, "max_source_positions": 1024, "model_type": "fastspeech2", "num_speakers": 200, "pad_token_id": 1, "pitch_max": 5.164862652912731, "pitch_min": -2.5049682966705484, "postnet_conv_dim": 512, "postnet_conv_kernel_size": 5, "postnet_dropout": 0.5, "postnet_layers": 5, "speaker_embed_dim": 64, "torch_dtype": "float32", "transformers_version": "4.19.0.dev0", "use_mean": true, "use_standard_deviation": true, "var_pred_dropout": 0.5, "var_pred_hidden_dim": 256, "var_pred_kernel_size": 3, "vocab_size": 74 }