test-public-space / finetuning.py
phuong-d-h-nguyen's picture
Upload folder using huggingface_hub
0dcea97 verified
raw
history blame
838 Bytes
from trl import SFTTrainer
from transformers import TrainingArguments
import json
import torch
with open("finetuning_set_v1.0.json") as f:
dataset = json.load(f)
# torch.cuda.empty_cache()
# torch.cuda.set_per_process_memory_fraction(0.9)
args = TrainingArguments(
per_device_train_batch_size=1,
per_device_eval_batch_size=1,
output_dir="Salesforce-codegen2-1B-text-to-neurapy",
gradient_accumulation_steps=1,
num_train_epochs=8
)
trainer = SFTTrainer(
"Salesforce/codegen2-1B",
train_dataset=dataset,
dataset_text_field="completion",
max_seq_length=1024,
args=args,
model_init_kwargs={
"torch_dtype": torch.bfloat16,
},
packing=True
)
trainer.train()
# testing without saving uncomment for actual training
# trainer.save_model("Salesforce-codegen2-1B-text-to-neurapy")