“pharaouk” committed on
Commit
0f63f40
1 Parent(s): a548bca
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +21 -0
  2. added_tokens.json +3 -0
  3. checkpoint-250/config.json +3 -0
  4. checkpoint-250/generation_config.json +3 -0
  5. checkpoint-250/global_step250/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
  6. checkpoint-250/global_step250/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
  7. checkpoint-250/global_step250/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
  8. checkpoint-250/global_step250/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
  9. checkpoint-250/global_step250/mp_rank_00_model_states.pt +3 -0
  10. checkpoint-250/latest +3 -0
  11. checkpoint-250/pytorch_model-00001-of-00002.bin +3 -0
  12. checkpoint-250/pytorch_model-00002-of-00002.bin +3 -0
  13. checkpoint-250/pytorch_model.bin.index.json +3 -0
  14. checkpoint-250/rng_state_0.pth +3 -0
  15. checkpoint-250/rng_state_1.pth +3 -0
  16. checkpoint-250/rng_state_2.pth +3 -0
  17. checkpoint-250/rng_state_3.pth +3 -0
  18. checkpoint-250/trainer_state.json +3 -0
  19. checkpoint-250/training_args.bin +3 -0
  20. checkpoint-250/zero_to_fp32.py +3 -0
  21. checkpoint-500/config.json +3 -0
  22. checkpoint-500/generation_config.json +3 -0
  23. checkpoint-500/global_step500/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
  24. checkpoint-500/global_step500/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
  25. checkpoint-500/global_step500/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
  26. checkpoint-500/global_step500/mp_rank_00_model_states.pt +3 -0
  27. checkpoint-500/pytorch_model-00001-of-00002.bin +3 -0
  28. checkpoint-500/pytorch_model-00002-of-00002.bin +3 -0
  29. checkpoint-500/pytorch_model.bin.index.json +3 -0
  30. checkpoint-500/training_args.bin +3 -0
  31. checkpoint-750/config.json +3 -0
  32. checkpoint-750/generation_config.json +3 -0
  33. checkpoint-750/global_step750/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
  34. checkpoint-750/global_step750/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
  35. checkpoint-750/global_step750/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
  36. checkpoint-750/global_step750/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
  37. checkpoint-750/global_step750/mp_rank_00_model_states.pt +3 -0
  38. checkpoint-750/latest +3 -0
  39. checkpoint-750/pytorch_model-00001-of-00002.bin +3 -0
  40. checkpoint-750/pytorch_model-00002-of-00002.bin +3 -0
  41. checkpoint-750/pytorch_model.bin.index.json +3 -0
  42. checkpoint-750/rng_state_0.pth +3 -0
  43. checkpoint-750/rng_state_1.pth +3 -0
  44. checkpoint-750/rng_state_2.pth +3 -0
  45. checkpoint-750/rng_state_3.pth +3 -0
  46. checkpoint-750/trainer_state.json +3 -0
  47. checkpoint-750/training_args.bin +3 -0
  48. checkpoint-750/zero_to_fp32.py +3 -0
  49. config.json +3 -0
  50. generation_config.json +3 -0
.gitattributes CHANGED
@@ -33,3 +33,24 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ checkpoint-250 filter=lfs diff=lfs merge=lfs -text
37
+ checkpoint-750 filter=lfs diff=lfs merge=lfs -text
38
+ generation_config.json filter=lfs diff=lfs merge=lfs -text
39
+ latest filter=lfs diff=lfs merge=lfs -text
40
+ pytorch_model-00002-of-00002.bin filter=lfs diff=lfs merge=lfs -text
41
+ rng_state_0.pth filter=lfs diff=lfs merge=lfs -text
42
+ zero_to_fp32.py filter=lfs diff=lfs merge=lfs -text
43
+ checkpoint-500 filter=lfs diff=lfs merge=lfs -text
44
+ special_tokens_map.json filter=lfs diff=lfs merge=lfs -text
45
+ tokenizer_config.json filter=lfs diff=lfs merge=lfs -text
46
+ added_tokens.json filter=lfs diff=lfs merge=lfs -text
47
+ config.json filter=lfs diff=lfs merge=lfs -text
48
+ global_step500 filter=lfs diff=lfs merge=lfs -text
49
+ rng_state_1.pth filter=lfs diff=lfs merge=lfs -text
50
+ rng_state_2.pth filter=lfs diff=lfs merge=lfs -text
51
+ tokenizer.model filter=lfs diff=lfs merge=lfs -text
52
+ pytorch_model-00001-of-00002.bin filter=lfs diff=lfs merge=lfs -text
53
+ pytorch_model.bin.index.json filter=lfs diff=lfs merge=lfs -text
54
+ rng_state_3.pth filter=lfs diff=lfs merge=lfs -text
55
+ trainer_state.json filter=lfs diff=lfs merge=lfs -text
56
+ training_args.bin filter=lfs diff=lfs merge=lfs -text
added_tokens.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1137d58ae316b03a36d7162631e491319c75a223ee366beddc447e77ccb42832
3
+ size 90
checkpoint-250/config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38040ecb6dd98fcbe9a29765b4c1db8e79c6677a63acc41919af2d7337454654
3
+ size 620
checkpoint-250/generation_config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afcf2a1da583dbeb66bb367a759713901e23ce19ed83ed8f5a21b0e877addd5b
3
+ size 116
checkpoint-250/global_step250/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73a26c1e6ac191c92f45e6dbd0b292942d37c1bd7bff9ca2ed3841d131452760
3
+ size 21725254007
checkpoint-250/global_step250/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65bfe89cbcb1ea530a018536901c8ba9f9e6b347bf24fc63eba685e0588f47de
3
+ size 21725254583
checkpoint-250/global_step250/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76dda73ab480f23c26df27d9ed2c5cb3489b81a49ddec4bfc73e14d3acc2afd7
3
+ size 21725254647
checkpoint-250/global_step250/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02f54ef909fe921bd1e2cbba6ef7694f322308450f6c9209e33348adad518fb5
3
+ size 21725254007
checkpoint-250/global_step250/mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0bef3c4a04e356bf2842db3aa0d1133a3546c9ff3b3eb05d64852e0b19f03ab6
3
+ size 14483584899
checkpoint-250/latest ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:074d211701b75761ea28e8611c3d9a4db5b233e788456ff08f2111426855cd5e
3
+ size 14
checkpoint-250/pytorch_model-00001-of-00002.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a13b9de24d37a71843b49556c3202c9d8e1a1a368187a88c1bb980c0cee50c6
3
+ size 9943044428
checkpoint-250/pytorch_model-00002-of-00002.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21ffcff369d4c1b2b91d1286dfea5bbd27607098bbf21d851b6ba8e45dcf2152
3
+ size 4540552031
checkpoint-250/pytorch_model.bin.index.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72e0f44b64f8e8d5241ee3c393f6339e05f2e844134c75c524d87dc89a7257e9
3
+ size 23950
checkpoint-250/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1eafe3d5e0585dde8c5033613de99a5d4f23df4284a488f4007b3944580c0b97
3
+ size 17655
checkpoint-250/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e34eb456d2d003a2839f2daa9425e99bdd79ed7e24a1de9fc7d5738476bfb4b
3
+ size 17655
checkpoint-250/rng_state_2.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b374af4a2765d8771cee7a72921d3c2e438b9bee34f0b2d098ce6071afeb65e4
3
+ size 17655
checkpoint-250/rng_state_3.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5df75d8477fcc69c7abb03025313915ebfe3ac18c54a7c57aaa455c0099e13e5
3
+ size 17655
checkpoint-250/trainer_state.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef4b6d519251155a8dc355dd61a9cf5ee8a3c9020795f2603f2f146b47ebb0d5
3
+ size 31155
checkpoint-250/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9dbeb8071fbe7ebd575391d62f8bcd4599760ab21bbc612b111647e2a2bf508e
3
+ size 6011
checkpoint-250/zero_to_fp32.py ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68f965505cd086b7582e9821f8a6bc9b5b80c43450671c1139f734d1c7678a2c
3
+ size 24177
checkpoint-500/config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38040ecb6dd98fcbe9a29765b4c1db8e79c6677a63acc41919af2d7337454654
3
+ size 620
checkpoint-500/generation_config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afcf2a1da583dbeb66bb367a759713901e23ce19ed83ed8f5a21b0e877addd5b
3
+ size 116
checkpoint-500/global_step500/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dcd98e2885c8add0e9ce02232ebb7d57637bcc73be93433f13d0b3d7297b5f2c
3
+ size 21725254007
checkpoint-500/global_step500/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a1c1b1d036ffe97cb0873f0c3382e1077aedec0d27c8c6303a7396a8bd1eb7b
3
+ size 7946108928
checkpoint-500/global_step500/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f25bd7cace2d38e9d43f48d2bed436add1ed610ca8ca893200ff18c8d14fa96
3
+ size 21725254007
checkpoint-500/global_step500/mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7114b83cd3d93111db5d75975628ae8730ccbf2ea2aa15ae1a6ff626bd57c3ec
3
+ size 14483584899
checkpoint-500/pytorch_model-00001-of-00002.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea284a24a4d42047bc5b0a99840420497496eff7d9af6c76b8020c9aac3b3ac4
3
+ size 9943044428
checkpoint-500/pytorch_model-00002-of-00002.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff85db3904cf639607677c3b225fc6a687ae4b4c72cae68063ae86c28dac7115
3
+ size 4540552031
checkpoint-500/pytorch_model.bin.index.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72e0f44b64f8e8d5241ee3c393f6339e05f2e844134c75c524d87dc89a7257e9
3
+ size 23950
checkpoint-500/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9dbeb8071fbe7ebd575391d62f8bcd4599760ab21bbc612b111647e2a2bf508e
3
+ size 6011
checkpoint-750/config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38040ecb6dd98fcbe9a29765b4c1db8e79c6677a63acc41919af2d7337454654
3
+ size 620
checkpoint-750/generation_config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afcf2a1da583dbeb66bb367a759713901e23ce19ed83ed8f5a21b0e877addd5b
3
+ size 116
checkpoint-750/global_step750/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4db949e8907e6f83bd6f3dbb0dc0682d0d15d7a444fe6555d5112976151b3463
3
+ size 21725254007
checkpoint-750/global_step750/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c1fb6c7b67b75d1eb10f43f19195600f62e671558efbb8907e44e310994896e
3
+ size 21725254583
checkpoint-750/global_step750/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:27808edd997a0d40385887613c8bbf3f6835869eab1eac81bab04b685ad0d9de
3
+ size 21725254647
checkpoint-750/global_step750/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99be19c541989a9156b434863500a24848be3fce5b60ba44fa82c281f87a7454
3
+ size 21725254007
checkpoint-750/global_step750/mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d2b2ec5cf5d538d34f84f5f633ff7ae85c8db0d1eb7599958a97684d19baf70
3
+ size 14483584899
checkpoint-750/latest ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0bd3153661a24859b6a2748f64ccf12ea6ba4772d09ef03886b14d37541114d8
3
+ size 14
checkpoint-750/pytorch_model-00001-of-00002.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24a0c772c0633cfedd7d31fce0f8d8348d9ba982ab49fb18dd38a353319fadb4
3
+ size 9943044428
checkpoint-750/pytorch_model-00002-of-00002.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a590331b0e3ce8b4ce22b509ab95f5a1c637b82da880aa4c9bcaa18ead8904b
3
+ size 4540552031
checkpoint-750/pytorch_model.bin.index.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72e0f44b64f8e8d5241ee3c393f6339e05f2e844134c75c524d87dc89a7257e9
3
+ size 23950
checkpoint-750/rng_state_0.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c5775c11ec2fe6a5d58d1857fa436bb0da77027386858b2a4e7ea3eff9c2ab66
3
+ size 17655
checkpoint-750/rng_state_1.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca1a0e79990b2325280b0f88b8b2e25a4c5d61927bfa5e5c178ffe1321125ca9
3
+ size 17655
checkpoint-750/rng_state_2.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0aebaa297ea8d8fd38ae9b49e17f26565783e27c56a220dc278f70f6593bccda
3
+ size 17655
checkpoint-750/rng_state_3.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f537c78a9ca12294baa835f33188b772f2cbf238559c0f36ab3505e19304755
3
+ size 17655
checkpoint-750/trainer_state.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56866d2dfe74e8ad06e88fd187ab8dc61429dc2abdf7b1ff2826fe63ed7e5750
3
+ size 93002
checkpoint-750/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9dbeb8071fbe7ebd575391d62f8bcd4599760ab21bbc612b111647e2a2bf508e
3
+ size 6011
checkpoint-750/zero_to_fp32.py ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68f965505cd086b7582e9821f8a6bc9b5b80c43450671c1139f734d1c7678a2c
3
+ size 24177
config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38040ecb6dd98fcbe9a29765b4c1db8e79c6677a63acc41919af2d7337454654
3
+ size 620
generation_config.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afcf2a1da583dbeb66bb367a759713901e23ce19ed83ed8f5a21b0e877addd5b
3
+ size 116