File size: 1,946 Bytes
7b01340
 
 
ef79740
7b01340
ef79740
7b01340
 
 
 
 
 
c8bebbb
ef79740
7b01340
 
 
fcb4856
ef79740
 
 
 
fcb4856
7b01340
 
ef79740
fcb4856
ef79740
fcb4856
ba9d9d0
 
ef79740
 
 
 
 
fcb4856
ba9d9d0
 
ef79740
fcb4856
ef79740
fcb4856
 
 
ef79740
 
 
 
 
fcb4856
 
 
ef79740
fcb4856
ef79740
fcb4856
 
 
ef79740
 
 
 
 
 
ba9d9d0
 
ef79740
 
 
 
 
 
 
7b01340
 
 
c8bebbb
 
7b01340
ef79740
7b01340
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
{
  "best_metric": null,
  "best_model_checkpoint": null,
  "epoch": 3.3086838534599727,
  "eval_steps": 500,
  "global_step": 16,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 0.09,
      "learning_rate": 1.9974521146102535e-05,
      "loss": 1.3794,
      "step": 1
    },
    {
      "epoch": 0.35,
      "eval_loss": 1.3587424755096436,
      "eval_runtime": 21.5907,
      "eval_samples_per_second": 13.617,
      "eval_steps_per_second": 1.714,
      "step": 4
    },
    {
      "epoch": 1.07,
      "learning_rate": 1.936949724999762e-05,
      "loss": 1.3642,
      "step": 5
    },
    {
      "epoch": 1.33,
      "eval_loss": 1.3150031566619873,
      "eval_runtime": 21.6398,
      "eval_samples_per_second": 13.586,
      "eval_steps_per_second": 1.71,
      "step": 8
    },
    {
      "epoch": 2.15,
      "learning_rate": 1.7557495743542586e-05,
      "loss": 1.3179,
      "step": 10
    },
    {
      "epoch": 2.32,
      "eval_loss": 1.2843962907791138,
      "eval_runtime": 21.6342,
      "eval_samples_per_second": 13.59,
      "eval_steps_per_second": 1.71,
      "step": 12
    },
    {
      "epoch": 3.22,
      "learning_rate": 1.479248986720057e-05,
      "loss": 1.2789,
      "step": 15
    },
    {
      "epoch": 3.31,
      "eval_loss": 1.2639315128326416,
      "eval_runtime": 21.5826,
      "eval_samples_per_second": 13.622,
      "eval_steps_per_second": 1.714,
      "step": 16
    },
    {
      "epoch": 3.31,
      "step": 16,
      "total_flos": 7.473328135392461e+17,
      "train_loss": 1.3643869757652283,
      "train_runtime": 5803.8585,
      "train_samples_per_second": 4.063,
      "train_steps_per_second": 0.008
    }
  ],
  "logging_steps": 5,
  "max_steps": 44,
  "num_train_epochs": 4,
  "save_steps": 500,
  "total_flos": 7.473328135392461e+17,
  "trial_name": null,
  "trial_params": null
}