{ "_name_or_path": "oza75/bambara-vqvae", "act_fn": "relu", "architectures": [ "BMSpeechVQVAE" ], "in_channels": 1, "initial_filters": 64, "input_shape": null, "kernel_size": 4, "latent_channels": 512, "model_type": "bm_speech_vq_vae", "norm_num_groups": 32, "norm_type": "group", "num_layers": 4, "num_vq_embeddings": 512, "out_channels": 1, "padding": 1, "sample_size": 32, "scaling_factor": 0.18215, "speaker_embed_dim": 512, "stride": 2, "torch_dtype": "float32", "transformers_version": "4.41.1", "vq_embed_dim": 64 }