Fill-Mask
Transformers
Safetensors
English
mdlm
custom_code
subbham's picture
Upload MDLM
19f029e verified
raw
history blame contribute delete
509 Bytes
{
"_name_or_path": "kuleshov-group/mdlm-no_flashattn-fp32-owt",
"architectures": [
"MDLM"
],
"auto_map": {
"AutoConfig": "configuration_mdlm.MDLMConfig",
"AutoModelForMaskedLM": "modeling_mdlm_2.MDLM"
},
"cond_dim": 128,
"dropout": 0.1,
"hidden_dim": 768,
"model_length": 1024,
"model_type": "mdlm",
"n_blocks": 12,
"n_heads": 12,
"return_dict": false,
"time_conditioning": false,
"torch_dtype": "float32",
"transformers_version": "4.38.2",
"vocab_size": 50258
}