devamanyu committed on
Commit
34964e3
1 Parent(s): de737e5

End of training

Browse files
README.md CHANGED
@@ -4,6 +4,7 @@ library_name: transformers
4
  model_name: zephyr-7b-dpo-full
5
  tags:
6
  - generated_from_trainer
 
7
  - trl
8
  - dpo
9
  licence: license
 
4
  model_name: zephyr-7b-dpo-full
5
  tags:
6
  - generated_from_trainer
7
+ - alignment-handbook
8
  - trl
9
  - dpo
10
  licence: license
all_results.json CHANGED
@@ -9,10 +9,10 @@
9
  "eval_rewards/chosen": -0.9375,
10
  "eval_rewards/margins": 1.0078125,
11
  "eval_rewards/rejected": -1.9375,
12
- "eval_runtime": 39.9906,
13
  "eval_samples": 2000,
14
- "eval_samples_per_second": 50.012,
15
- "eval_steps_per_second": 0.8,
16
  "total_flos": 0.0,
17
  "train_loss": 0.0,
18
  "train_runtime": 1.4031,
 
9
  "eval_rewards/chosen": -0.9375,
10
  "eval_rewards/margins": 1.0078125,
11
  "eval_rewards/rejected": -1.9375,
12
+ "eval_runtime": 40.2538,
13
  "eval_samples": 2000,
14
+ "eval_samples_per_second": 49.685,
15
+ "eval_steps_per_second": 0.795,
16
  "total_flos": 0.0,
17
  "train_loss": 0.0,
18
  "train_runtime": 1.4031,
config.json CHANGED
@@ -22,6 +22,6 @@
22
  "tie_word_embeddings": false,
23
  "torch_dtype": "bfloat16",
24
  "transformers_version": "4.46.1",
25
- "use_cache": false,
26
  "vocab_size": 32000
27
  }
 
22
  "tie_word_embeddings": false,
23
  "torch_dtype": "bfloat16",
24
  "transformers_version": "4.46.1",
25
+ "use_cache": true,
26
  "vocab_size": 32000
27
  }
eval_results.json CHANGED
@@ -9,8 +9,8 @@
9
  "eval_rewards/chosen": -0.9375,
10
  "eval_rewards/margins": 1.0078125,
11
  "eval_rewards/rejected": -1.9375,
12
- "eval_runtime": 39.9906,
13
  "eval_samples": 2000,
14
- "eval_samples_per_second": 50.012,
15
- "eval_steps_per_second": 0.8
16
  }
 
9
  "eval_rewards/chosen": -0.9375,
10
  "eval_rewards/margins": 1.0078125,
11
  "eval_rewards/rejected": -1.9375,
12
+ "eval_runtime": 40.2538,
13
  "eval_samples": 2000,
14
+ "eval_samples_per_second": 49.685,
15
+ "eval_steps_per_second": 0.795
16
  }
runs/Nov22_21-24-16_dvhaz-sleeper-cmh-gpu/events.out.tfevents.1732310866.dvhaz-sleeper-cmh-gpu.11516.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ddd7dd3ef6c4afdd9247ec552c913b8b1cdabd965425e50e7dd922167725e05e
3
+ size 828