File size: 2,392 Bytes
91a7f19
7a49ddf
91a7f19
eb7cd01
91a7f19
 
 
 
 
 
 
eb7cd01
7a49ddf
eb7cd01
 
91a7f19
 
 
eb7cd01
7a49ddf
 
 
 
91a7f19
 
 
eb7cd01
7a49ddf
eb7cd01
7a49ddf
91a7f19
 
 
eb7cd01
7a49ddf
 
 
 
91a7f19
 
 
eb7cd01
7a49ddf
eb7cd01
7a49ddf
91a7f19
 
 
eb7cd01
7a49ddf
 
 
 
91a7f19
 
 
eb7cd01
7a49ddf
eb7cd01
7a49ddf
91a7f19
 
 
eb7cd01
7a49ddf
 
 
 
91a7f19
 
 
 
eb7cd01
91a7f19
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
{
  "best_metric": 1.239119052886963,
  "best_model_checkpoint": "./output/clip-finetuned-csu-p14-336-e4l58-l/checkpoint-2000",
  "epoch": 0.36845983787767134,
  "eval_steps": 500,
  "global_step": 2000,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 0.09211495946941783,
      "grad_norm": 20.04043960571289,
      "learning_rate": 4.8848563006632274e-08,
      "loss": 0.3758,
      "step": 500
    },
    {
      "epoch": 0.09211495946941783,
      "eval_loss": 1.4184927940368652,
      "eval_runtime": 74.3562,
      "eval_samples_per_second": 16.233,
      "eval_steps_per_second": 2.031,
      "step": 500
    },
    {
      "epoch": 0.18422991893883567,
      "grad_norm": 74.25025939941406,
      "learning_rate": 4.7697126013264556e-08,
      "loss": 0.4103,
      "step": 1000
    },
    {
      "epoch": 0.18422991893883567,
      "eval_loss": 1.3500770330429077,
      "eval_runtime": 75.7013,
      "eval_samples_per_second": 15.944,
      "eval_steps_per_second": 1.995,
      "step": 1000
    },
    {
      "epoch": 0.2763448784082535,
      "grad_norm": 0.5102410912513733,
      "learning_rate": 4.6545689019896826e-08,
      "loss": 0.433,
      "step": 1500
    },
    {
      "epoch": 0.2763448784082535,
      "eval_loss": 1.2885024547576904,
      "eval_runtime": 75.197,
      "eval_samples_per_second": 16.051,
      "eval_steps_per_second": 2.008,
      "step": 1500
    },
    {
      "epoch": 0.36845983787767134,
      "grad_norm": 0.1667678952217102,
      "learning_rate": 4.539425202652911e-08,
      "loss": 0.3424,
      "step": 2000
    },
    {
      "epoch": 0.36845983787767134,
      "eval_loss": 1.239119052886963,
      "eval_runtime": 75.387,
      "eval_samples_per_second": 16.011,
      "eval_steps_per_second": 2.003,
      "step": 2000
    }
  ],
  "logging_steps": 500,
  "max_steps": 21712,
  "num_input_tokens_seen": 0,
  "num_train_epochs": 4,
  "save_steps": 500,
  "stateful_callbacks": {
    "TrainerControl": {
      "args": {
        "should_epoch_stop": false,
        "should_evaluate": false,
        "should_log": false,
        "should_save": true,
        "should_training_stop": false
      },
      "attributes": {}
    }
  },
  "total_flos": 720236219222520.0,
  "train_batch_size": 2,
  "trial_name": null,
  "trial_params": null
}