Gael Le Lan
Initial commit
9d0d223
raw
history blame
97 Bytes
# @package _global_
# Model scale: 300M parameters.
# Size settings for the `transformer_lm` mapping. The three keys below must be
# nested under it: at column 0 they parse as unrelated top-level keys and
# leave `transformer_lm` with a null value.
# NOTE(review): presumably `dim` is the model width shared across `num_heads`
# attention heads (1024 / 16 = 64 per head) and `num_layers` is the layer
# count; confirm against the code that consumes this config.
transformer_lm:
  dim: 1024
  num_heads: 16
  num_layers: 24