cwaud committed on
Commit
77fbfcf
1 Parent(s): 2914ac0

Training in progress, step 2, checkpoint

Browse files
last-checkpoint/adapter_config.json CHANGED
@@ -20,13 +20,13 @@
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
- "k_proj",
24
  "q_proj",
25
  "o_proj",
26
  "gate_proj",
27
- "up_proj",
28
- "down_proj",
29
- "v_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
 
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
+ "down_proj",
24
  "q_proj",
25
  "o_proj",
26
  "gate_proj",
27
+ "v_proj",
28
+ "k_proj",
29
+ "up_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f4f4bd8173a488493bfc135b0b00d218b60f7ca3127442bac3ee332b279de308
3
  size 1770585648
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7aadff02eb8558c9740beadd5a8515e6a692bec62185c57715dc74eb516e3e8
3
  size 1770585648
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f6e45df8c72375b9124c1cf915cc824a784b313fcc071cd79625c91d75d52e7a
3
  size 99235764
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f22fda284fe8c75934d03ac77ff1560b4a2fcc4bc20b3580a6483453cc4bcdf
3
  size 99235764
last-checkpoint/trainer_state.json CHANGED
@@ -10,32 +10,32 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.8,
13
- "grad_norm": 4.495707988739014,
14
  "learning_rate": 2e-05,
15
- "loss": 5.4988,
16
  "step": 1
17
  },
18
  {
19
  "epoch": 0.8,
20
- "eval_loss": 5.075080871582031,
21
- "eval_runtime": 0.3898,
22
- "eval_samples_per_second": 2.566,
23
- "eval_steps_per_second": 2.566,
24
  "step": 1
25
  },
26
  {
27
  "epoch": 1.6,
28
- "grad_norm": 4.435665607452393,
29
  "learning_rate": 4e-05,
30
- "loss": 5.2725,
31
  "step": 2
32
  },
33
  {
34
  "epoch": 1.6,
35
- "eval_loss": 5.068875789642334,
36
- "eval_runtime": 0.3873,
37
- "eval_samples_per_second": 2.582,
38
- "eval_steps_per_second": 2.582,
39
  "step": 2
40
  }
41
  ],
 
10
  "log_history": [
11
  {
12
  "epoch": 0.8,
13
+ "grad_norm": 11.588508605957031,
14
  "learning_rate": 2e-05,
15
+ "loss": 13.3042,
16
  "step": 1
17
  },
18
  {
19
  "epoch": 0.8,
20
+ "eval_loss": 11.52426815032959,
21
+ "eval_runtime": 0.39,
22
+ "eval_samples_per_second": 2.564,
23
+ "eval_steps_per_second": 2.564,
24
  "step": 1
25
  },
26
  {
27
  "epoch": 1.6,
28
+ "grad_norm": 11.549392700195312,
29
  "learning_rate": 4e-05,
30
+ "loss": 13.1934,
31
  "step": 2
32
  },
33
  {
34
  "epoch": 1.6,
35
+ "eval_loss": 11.268893241882324,
36
+ "eval_runtime": 0.3904,
37
+ "eval_samples_per_second": 2.562,
38
+ "eval_steps_per_second": 2.562,
39
  "step": 2
40
  }
41
  ],
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:44748d1dcddc20382d94692c82fe6f19df00bbe11e18d390697f5a775b282d62
3
  size 6136
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af853a67b3854fa26b67dfae731715dfd1e79725227c471b95b403f47394d08e
3
  size 6136