# Usage: singularity exec --nv nemo2302 bash convert_nemo_to_hf.sh
#### Convert a model pretrained from scratch in NeMo Megatron to HuggingFace format
# Arguments for convert_nemo_ul2_checkpoint.py are collected in an array rather
# than a backslash-continued command line: an optional flag can then be enabled
# or disabled by (un)commenting a single line, with no risk of a continuation
# backslash being swallowed by a comment or by trailing characters.
convert_args=(
  # The checkpoint file name contains '=' characters; quoted to keep it one literal word.
  --nemo_model_path='nemo_checkpoints/megatron_ul2--val_loss=2.54-step=7000-consumed_samples=14557920.0.ckpt'
  --hf_config_path=config_ul2_base_nl36.json
  --output_path=ul2-base-nl36-swedish
  --hidden_size=768
  # Optional flags, currently disabled (uncomment to pass them to the converter):
  # --num_heads=12
  # --kv_dim=64
  # --checkpoint_version=2.0
  # --fix_qkv
  # --hf_model_path=ul2_base_nl36
)

# Run the conversion; the script's exit status is that of the converter.
python convert_nemo_ul2_checkpoint.py "${convert_args[@]}"