{
  "dataset_name": "data/packaged_pretrain_dataset.parquet",
  "num_proc": 1,
  "max_seq_length": 32,
  "seed": 0,
  "optim": "adamw_torch",
  "max_steps": 60,
  "per_device_train_batch_size": 2,
  "learning_rate": 1e-05,
  "weight_decay": 0,
  "warmup_steps": 10,
  "lr_scheduler_type": "linear",
  "gradient_checkpointing": true,
  "dataloader_num_workers": 2,
  "bf16": true,
  "gradient_accumulation_steps": 1,
  "logging_steps": 3,
  "report_to": [],
  "save_strategy": "steps",
  "save_steps": 3,
  "save_total_limit": 1,
  "push_to_hub": true,
  "hub_model_id": "hienbm/psychology-llama3.1-8B"
}