mnoukhov committed on
Commit
0554a3b
·
verified ·
1 Parent(s): a4258e9

Training in progress, step 63, checkpoint

Browse files
checkpoint-63/adapter_config.json CHANGED
@@ -20,10 +20,10 @@
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
 
23
  "dense_4h_to_h",
24
  "query_key_value",
25
- "dense",
26
- "dense_h_to_4h"
27
  ],
28
  "task_type": "CAUSAL_LM",
29
  "use_dora": false,
 
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
+ "dense_h_to_4h",
24
  "dense_4h_to_h",
25
  "query_key_value",
26
+ "dense"
 
27
  ],
28
  "task_type": "CAUSAL_LM",
29
  "use_dora": false,
checkpoint-63/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2c04e4a5ee03ad4fdf0d8ba26bcb9a845b52e0ffbd4c951d39c70c454d130bb6
3
  size 25192592
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84870ad2b082f3826b0ed2ce8fa97fce56a8ddda28564330d270419cf4c14948
3
  size 25192592
checkpoint-63/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9e56c92dea78ac4f66ad3020662353b8a735395a7deb986154bc80bca931863c
3
  size 50493050
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0229abefac5f451a6b28b1746d32d13ea09db4f682456b6847c5b44e6ed18c8f
3
  size 50493050
checkpoint-63/trainer_state.json CHANGED
@@ -10,18 +10,18 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.2016,
13
- "eval_logps/chosen": -106.34315490722656,
14
  "eval_logps/ref_chosen": -70.265625,
15
  "eval_logps/ref_rejected": -63.51186752319336,
16
- "eval_logps/rejected": -106.34315490722656,
17
- "eval_loss": 0.6557361483573914,
18
- "eval_rewards/accuracies": 0.6162024772678456,
19
- "eval_rewards/chosen": -1.8038759231567383,
20
- "eval_rewards/margins": 0.1433669477701187,
21
- "eval_rewards/rejected": -1.9472428560256958,
22
- "eval_runtime": 2599.3441,
23
- "eval_samples_per_second": 32.24,
24
- "eval_steps_per_second": 4.03,
25
  "step": 63
26
  }
27
  ],
 
10
  "log_history": [
11
  {
12
  "epoch": 0.2016,
13
+ "eval_logps/chosen": -70.4515609741211,
14
  "eval_logps/ref_chosen": -70.265625,
15
  "eval_logps/ref_rejected": -63.51186752319336,
16
+ "eval_logps/rejected": -70.4515609741211,
17
+ "eval_loss": 0.700020968914032,
18
+ "eval_rewards/accuracies": 0.5043316388630343,
19
+ "eval_rewards/chosen": -0.009296582080423832,
20
+ "eval_rewards/margins": -0.0003258216893300414,
21
+ "eval_rewards/rejected": -0.00897076167166233,
22
+ "eval_runtime": 2598.2788,
23
+ "eval_samples_per_second": 32.253,
24
+ "eval_steps_per_second": 4.032,
25
  "step": 63
26
  }
27
  ],
checkpoint-63/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:46ff4287a15bff07546a9b59f8721b8272bf4ace050683003790d085d41bfcd5
3
  size 5176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6686dc40b6db461a3b988241b5bc24010b480d0524615f6ccf956bf69c70fdf
3
  size 5176