{ "architectures": [ "NanoGPT" ], "bias": true, "block_size": 256, "dropout": 0.0, "model_type": "nanogpt", "n_embd": 384, "n_head": 6, "n_layer": 6, "nonlinearity": "RELU", "torch_dtype": "float32", "transformers_version": "4.46.0", "use_NoPE": true, "use_layernorm": true, "vocab_size": 14 }