metadata
license: apache-2.0
Hyperparameters: learning_rate: 2e-5, weight_decay: 0.01, per_device_train_batch_size: 8, per_device_eval_batch_size: 8, gradient_accumulation_steps: 1, eval_steps: 6000, max_length: 512, num_epochs: 2
Dataset version: "craffel/tasky_or_not", "10xp3_10xc4", "15f88c8"