{ "base_model_name": "mpasila_gpt3-finnish-8B-gptq-4bit", "base_model_class": "BloomForCausalLM", "base_loaded_in_4bit": false, "base_loaded_in_8bit": false, "projections": "query_key_value", "loss": 2.3115, "grad_norm": 0.10131204128265381, "learning_rate": 3.1034482758620685e-05, "epoch": 2.98, "current_steps": 1051, "train_runtime": 4886.022, "train_samples_per_second": 0.869, "train_steps_per_second": 0.007, "total_flos": 112306365136896.0, "train_loss": 2.4886908531188965 }