Commit
·
0beffd4
1
Parent(s):
c02ede4
Training in progress, step 100000
Browse files- last-checkpoint/optimizer.pt +1 -1
- last-checkpoint/pytorch_model.bin +1 -1
- last-checkpoint/rng_state_0.pth +1 -1
- last-checkpoint/rng_state_1.pth +1 -1
- last-checkpoint/rng_state_2.pth +1 -1
- last-checkpoint/rng_state_3.pth +1 -1
- last-checkpoint/rng_state_4.pth +1 -1
- last-checkpoint/rng_state_5.pth +1 -1
- last-checkpoint/rng_state_6.pth +1 -1
- last-checkpoint/rng_state_7.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +14 -322
- last-checkpoint/training_args.bin +1 -1
- pytorch_model.bin +1 -1
- runs/Feb17_16-44-06_t1v-n-7a44a9fa-w-0/events.out.tfevents.1676652777.t1v-n-7a44a9fa-w-0.1006877.0 +2 -2
- runs/Feb24_00-19-02_t1v-n-7a44a9fa-w-0/1677197978.0466611/events.out.tfevents.1677197978.t1v-n-7a44a9fa-w-0.3980329.1 +3 -0
- runs/Feb24_00-19-02_t1v-n-7a44a9fa-w-0/events.out.tfevents.1677197978.t1v-n-7a44a9fa-w-0.3980329.0 +3 -0
- runs/Feb24_02-54-45_t1v-n-7a44a9fa-w-0/1677207316.2172732/events.out.tfevents.1677207316.t1v-n-7a44a9fa-w-0.4014800.1 +3 -0
- runs/Feb24_02-54-45_t1v-n-7a44a9fa-w-0/events.out.tfevents.1677207316.t1v-n-7a44a9fa-w-0.4014800.0 +3 -0
- runs/Feb24_03-42-21_t1v-n-7a44a9fa-w-0/1677210177.3730767/events.out.tfevents.1677210177.t1v-n-7a44a9fa-w-0.4043690.1 +3 -0
- runs/Feb24_03-42-21_t1v-n-7a44a9fa-w-0/events.out.tfevents.1677210177.t1v-n-7a44a9fa-w-0.4043690.0 +3 -0
- runs/Feb25_19-27-01_t1v-n-7a44a9fa-w-0/1677353255.835489/events.out.tfevents.1677353255.t1v-n-7a44a9fa-w-0.33944.1 +3 -0
- runs/Feb25_19-27-01_t1v-n-7a44a9fa-w-0/events.out.tfevents.1677353255.t1v-n-7a44a9fa-w-0.33944.0 +3 -0
- training_args.bin +1 -1
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 2693742553
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:904b75985efc40c0457e36867bea59373e9bfdfcfd6faed477a21a85c4bd560e
|
3 |
size 2693742553
|
last-checkpoint/pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1346893675
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:47992429487d016109373d5a83150b8f5e4877618c7785bb61465cd39529dc23
|
3 |
size 1346893675
|
last-checkpoint/rng_state_0.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 13611
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a766705dfa06584b04e13adde061e144056ae2a8ef43bca4589db57242d9e2e
|
3 |
size 13611
|
last-checkpoint/rng_state_1.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 13611
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a766705dfa06584b04e13adde061e144056ae2a8ef43bca4589db57242d9e2e
|
3 |
size 13611
|
last-checkpoint/rng_state_2.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 13611
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a766705dfa06584b04e13adde061e144056ae2a8ef43bca4589db57242d9e2e
|
3 |
size 13611
|
last-checkpoint/rng_state_3.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 13611
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a766705dfa06584b04e13adde061e144056ae2a8ef43bca4589db57242d9e2e
|
3 |
size 13611
|
last-checkpoint/rng_state_4.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 13611
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a766705dfa06584b04e13adde061e144056ae2a8ef43bca4589db57242d9e2e
|
3 |
size 13611
|
last-checkpoint/rng_state_5.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 13611
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a766705dfa06584b04e13adde061e144056ae2a8ef43bca4589db57242d9e2e
|
3 |
size 13611
|
last-checkpoint/rng_state_6.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 13611
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a766705dfa06584b04e13adde061e144056ae2a8ef43bca4589db57242d9e2e
|
3 |
size 13611
|
last-checkpoint/rng_state_7.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 13611
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a766705dfa06584b04e13adde061e144056ae2a8ef43bca4589db57242d9e2e
|
3 |
size 13611
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 623
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:647800033a1fe4aa55a6bc8c002ddb2326a52950bde89b878eccf8a697eacefa
|
3 |
size 623
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch": 1
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -576,365 +576,57 @@
|
|
576 |
{
|
577 |
"epoch": 0.09,
|
578 |
"learning_rate": 9.94716380576598e-05,
|
579 |
-
"loss": 0.
|
580 |
"step": 94000
|
581 |
},
|
582 |
{
|
583 |
"epoch": 0.1,
|
584 |
"learning_rate": 9.944739353007344e-05,
|
585 |
-
"loss": 0.
|
586 |
"step": 95000
|
587 |
},
|
588 |
{
|
589 |
"epoch": 0.1,
|
590 |
"learning_rate": 9.942260825371358e-05,
|
591 |
-
"loss": 0.
|
592 |
"step": 96000
|
593 |
},
|
594 |
{
|
595 |
"epoch": 0.1,
|
596 |
"learning_rate": 9.939728249962807e-05,
|
597 |
-
"loss": 0.
|
598 |
"step": 97000
|
599 |
},
|
600 |
{
|
601 |
"epoch": 0.1,
|
602 |
"learning_rate": 9.937141654477528e-05,
|
603 |
-
"loss": 0.
|
604 |
"step": 98000
|
605 |
},
|
606 |
{
|
607 |
"epoch": 0.1,
|
608 |
"learning_rate": 9.934501067202117e-05,
|
609 |
-
"loss": 0.
|
610 |
"step": 99000
|
611 |
},
|
612 |
{
|
613 |
"epoch": 0.1,
|
614 |
"learning_rate": 9.931806517013612e-05,
|
615 |
-
"loss": 0.
|
616 |
"step": 100000
|
617 |
},
|
618 |
{
|
619 |
"epoch": 0.1,
|
620 |
-
"eval_loss": 0.
|
621 |
-
"eval_runtime":
|
622 |
-
"eval_samples_per_second":
|
623 |
-
"eval_steps_per_second": 2.
|
624 |
"step": 100000
|
625 |
-
},
|
626 |
-
{
|
627 |
-
"epoch": 0.1,
|
628 |
-
"learning_rate": 9.929058033379181e-05,
|
629 |
-
"loss": 0.7337,
|
630 |
-
"step": 101000
|
631 |
-
},
|
632 |
-
{
|
633 |
-
"epoch": 0.1,
|
634 |
-
"learning_rate": 9.926255646355804e-05,
|
635 |
-
"loss": 0.7325,
|
636 |
-
"step": 102000
|
637 |
-
},
|
638 |
-
{
|
639 |
-
"epoch": 0.1,
|
640 |
-
"learning_rate": 9.923399386589933e-05,
|
641 |
-
"loss": 0.7289,
|
642 |
-
"step": 103000
|
643 |
-
},
|
644 |
-
{
|
645 |
-
"epoch": 0.1,
|
646 |
-
"learning_rate": 9.92048928531717e-05,
|
647 |
-
"loss": 0.7278,
|
648 |
-
"step": 104000
|
649 |
-
},
|
650 |
-
{
|
651 |
-
"epoch": 0.1,
|
652 |
-
"learning_rate": 9.917525374361912e-05,
|
653 |
-
"loss": 0.7314,
|
654 |
-
"step": 105000
|
655 |
-
},
|
656 |
-
{
|
657 |
-
"epoch": 0.11,
|
658 |
-
"learning_rate": 9.914507686137019e-05,
|
659 |
-
"loss": 0.7412,
|
660 |
-
"step": 106000
|
661 |
-
},
|
662 |
-
{
|
663 |
-
"epoch": 0.11,
|
664 |
-
"learning_rate": 9.911436253643445e-05,
|
665 |
-
"loss": 0.7378,
|
666 |
-
"step": 107000
|
667 |
-
},
|
668 |
-
{
|
669 |
-
"epoch": 0.11,
|
670 |
-
"learning_rate": 9.90831111046988e-05,
|
671 |
-
"loss": 0.7349,
|
672 |
-
"step": 108000
|
673 |
-
},
|
674 |
-
{
|
675 |
-
"epoch": 0.11,
|
676 |
-
"learning_rate": 9.905132290792394e-05,
|
677 |
-
"loss": 0.7401,
|
678 |
-
"step": 109000
|
679 |
-
},
|
680 |
-
{
|
681 |
-
"epoch": 0.11,
|
682 |
-
"learning_rate": 9.901899829374047e-05,
|
683 |
-
"loss": 0.7345,
|
684 |
-
"step": 110000
|
685 |
-
},
|
686 |
-
{
|
687 |
-
"epoch": 0.11,
|
688 |
-
"learning_rate": 9.89861376156452e-05,
|
689 |
-
"loss": 0.7241,
|
690 |
-
"step": 111000
|
691 |
-
},
|
692 |
-
{
|
693 |
-
"epoch": 0.11,
|
694 |
-
"learning_rate": 9.895274123299723e-05,
|
695 |
-
"loss": 0.7212,
|
696 |
-
"step": 112000
|
697 |
-
},
|
698 |
-
{
|
699 |
-
"epoch": 0.11,
|
700 |
-
"learning_rate": 9.891880951101407e-05,
|
701 |
-
"loss": 0.7148,
|
702 |
-
"step": 113000
|
703 |
-
},
|
704 |
-
{
|
705 |
-
"epoch": 0.11,
|
706 |
-
"learning_rate": 9.888434282076758e-05,
|
707 |
-
"loss": 0.7159,
|
708 |
-
"step": 114000
|
709 |
-
},
|
710 |
-
{
|
711 |
-
"epoch": 0.12,
|
712 |
-
"learning_rate": 9.884934153917997e-05,
|
713 |
-
"loss": 0.7219,
|
714 |
-
"step": 115000
|
715 |
-
},
|
716 |
-
{
|
717 |
-
"epoch": 0.12,
|
718 |
-
"learning_rate": 9.881380604901964e-05,
|
719 |
-
"loss": 0.7249,
|
720 |
-
"step": 116000
|
721 |
-
},
|
722 |
-
{
|
723 |
-
"epoch": 0.12,
|
724 |
-
"learning_rate": 9.877773673889701e-05,
|
725 |
-
"loss": 0.7261,
|
726 |
-
"step": 117000
|
727 |
-
},
|
728 |
-
{
|
729 |
-
"epoch": 0.12,
|
730 |
-
"learning_rate": 9.87411340032603e-05,
|
731 |
-
"loss": 0.7197,
|
732 |
-
"step": 118000
|
733 |
-
},
|
734 |
-
{
|
735 |
-
"epoch": 0.12,
|
736 |
-
"learning_rate": 9.870399824239117e-05,
|
737 |
-
"loss": 0.7315,
|
738 |
-
"step": 119000
|
739 |
-
},
|
740 |
-
{
|
741 |
-
"epoch": 0.12,
|
742 |
-
"learning_rate": 9.86663298624003e-05,
|
743 |
-
"loss": 0.7219,
|
744 |
-
"step": 120000
|
745 |
-
},
|
746 |
-
{
|
747 |
-
"epoch": 0.12,
|
748 |
-
"learning_rate": 9.862812927522309e-05,
|
749 |
-
"loss": 0.7117,
|
750 |
-
"step": 121000
|
751 |
-
},
|
752 |
-
{
|
753 |
-
"epoch": 0.12,
|
754 |
-
"learning_rate": 9.858939689861506e-05,
|
755 |
-
"loss": 0.7075,
|
756 |
-
"step": 122000
|
757 |
-
},
|
758 |
-
{
|
759 |
-
"epoch": 0.12,
|
760 |
-
"learning_rate": 9.855013315614725e-05,
|
761 |
-
"loss": 0.7033,
|
762 |
-
"step": 123000
|
763 |
-
},
|
764 |
-
{
|
765 |
-
"epoch": 0.12,
|
766 |
-
"learning_rate": 9.851033847720166e-05,
|
767 |
-
"loss": 0.7049,
|
768 |
-
"step": 124000
|
769 |
-
},
|
770 |
-
{
|
771 |
-
"epoch": 0.12,
|
772 |
-
"learning_rate": 9.847001329696653e-05,
|
773 |
-
"loss": 0.7129,
|
774 |
-
"step": 125000
|
775 |
-
},
|
776 |
-
{
|
777 |
-
"epoch": 0.13,
|
778 |
-
"learning_rate": 9.842915805643155e-05,
|
779 |
-
"loss": 0.7153,
|
780 |
-
"step": 126000
|
781 |
-
},
|
782 |
-
{
|
783 |
-
"epoch": 0.13,
|
784 |
-
"learning_rate": 9.838777320238312e-05,
|
785 |
-
"loss": 0.7145,
|
786 |
-
"step": 127000
|
787 |
-
},
|
788 |
-
{
|
789 |
-
"epoch": 0.13,
|
790 |
-
"learning_rate": 9.834585918739936e-05,
|
791 |
-
"loss": 0.711,
|
792 |
-
"step": 128000
|
793 |
-
},
|
794 |
-
{
|
795 |
-
"epoch": 0.13,
|
796 |
-
"learning_rate": 9.830341646984521e-05,
|
797 |
-
"loss": 0.7197,
|
798 |
-
"step": 129000
|
799 |
-
},
|
800 |
-
{
|
801 |
-
"epoch": 0.13,
|
802 |
-
"learning_rate": 9.826044551386744e-05,
|
803 |
-
"loss": 0.7135,
|
804 |
-
"step": 130000
|
805 |
-
},
|
806 |
-
{
|
807 |
-
"epoch": 0.13,
|
808 |
-
"learning_rate": 9.821694678938953e-05,
|
809 |
-
"loss": 0.698,
|
810 |
-
"step": 131000
|
811 |
-
},
|
812 |
-
{
|
813 |
-
"epoch": 0.13,
|
814 |
-
"learning_rate": 9.817292077210659e-05,
|
815 |
-
"loss": 0.6971,
|
816 |
-
"step": 132000
|
817 |
-
},
|
818 |
-
{
|
819 |
-
"epoch": 0.13,
|
820 |
-
"learning_rate": 9.812836794348004e-05,
|
821 |
-
"loss": 0.6936,
|
822 |
-
"step": 133000
|
823 |
-
},
|
824 |
-
{
|
825 |
-
"epoch": 0.13,
|
826 |
-
"learning_rate": 9.808328879073251e-05,
|
827 |
-
"loss": 0.6987,
|
828 |
-
"step": 134000
|
829 |
-
},
|
830 |
-
{
|
831 |
-
"epoch": 0.14,
|
832 |
-
"learning_rate": 9.803768380684242e-05,
|
833 |
-
"loss": 0.7058,
|
834 |
-
"step": 135000
|
835 |
-
},
|
836 |
-
{
|
837 |
-
"epoch": 0.14,
|
838 |
-
"learning_rate": 9.799155349053851e-05,
|
839 |
-
"loss": 0.7077,
|
840 |
-
"step": 136000
|
841 |
-
},
|
842 |
-
{
|
843 |
-
"epoch": 0.14,
|
844 |
-
"learning_rate": 9.794489834629455e-05,
|
845 |
-
"loss": 0.7078,
|
846 |
-
"step": 137000
|
847 |
-
},
|
848 |
-
{
|
849 |
-
"epoch": 0.14,
|
850 |
-
"learning_rate": 9.789771888432375e-05,
|
851 |
-
"loss": 0.7044,
|
852 |
-
"step": 138000
|
853 |
-
},
|
854 |
-
{
|
855 |
-
"epoch": 0.14,
|
856 |
-
"learning_rate": 9.785001562057309e-05,
|
857 |
-
"loss": 0.7119,
|
858 |
-
"step": 139000
|
859 |
-
},
|
860 |
-
{
|
861 |
-
"epoch": 0.14,
|
862 |
-
"learning_rate": 9.780178907671789e-05,
|
863 |
-
"loss": 0.7045,
|
864 |
-
"step": 140000
|
865 |
-
},
|
866 |
-
{
|
867 |
-
"epoch": 0.14,
|
868 |
-
"learning_rate": 9.775303978015585e-05,
|
869 |
-
"loss": 0.6908,
|
870 |
-
"step": 141000
|
871 |
-
},
|
872 |
-
{
|
873 |
-
"epoch": 0.14,
|
874 |
-
"learning_rate": 9.77037682640015e-05,
|
875 |
-
"loss": 0.6906,
|
876 |
-
"step": 142000
|
877 |
-
},
|
878 |
-
{
|
879 |
-
"epoch": 0.14,
|
880 |
-
"learning_rate": 9.765397506708023e-05,
|
881 |
-
"loss": 0.6852,
|
882 |
-
"step": 143000
|
883 |
-
},
|
884 |
-
{
|
885 |
-
"epoch": 0.14,
|
886 |
-
"learning_rate": 9.760366073392246e-05,
|
887 |
-
"loss": 0.6872,
|
888 |
-
"step": 144000
|
889 |
-
},
|
890 |
-
{
|
891 |
-
"epoch": 1.0,
|
892 |
-
"learning_rate": 9.755282581475769e-05,
|
893 |
-
"loss": 0.6902,
|
894 |
-
"step": 145000
|
895 |
-
},
|
896 |
-
{
|
897 |
-
"epoch": 1.0,
|
898 |
-
"learning_rate": 9.750147086550844e-05,
|
899 |
-
"loss": 0.6877,
|
900 |
-
"step": 146000
|
901 |
-
},
|
902 |
-
{
|
903 |
-
"epoch": 1.0,
|
904 |
-
"learning_rate": 9.744959644778422e-05,
|
905 |
-
"loss": 0.6953,
|
906 |
-
"step": 147000
|
907 |
-
},
|
908 |
-
{
|
909 |
-
"epoch": 1.0,
|
910 |
-
"learning_rate": 9.739720312887535e-05,
|
911 |
-
"loss": 0.6949,
|
912 |
-
"step": 148000
|
913 |
-
},
|
914 |
-
{
|
915 |
-
"epoch": 1.0,
|
916 |
-
"learning_rate": 9.734429148174675e-05,
|
917 |
-
"loss": 0.6974,
|
918 |
-
"step": 149000
|
919 |
-
},
|
920 |
-
{
|
921 |
-
"epoch": 1.01,
|
922 |
-
"learning_rate": 9.729086208503174e-05,
|
923 |
-
"loss": 0.6974,
|
924 |
-
"step": 150000
|
925 |
-
},
|
926 |
-
{
|
927 |
-
"epoch": 1.01,
|
928 |
-
"eval_loss": 0.35331928730010986,
|
929 |
-
"eval_runtime": 24.1868,
|
930 |
-
"eval_samples_per_second": 206.724,
|
931 |
-
"eval_steps_per_second": 3.266,
|
932 |
-
"step": 150000
|
933 |
}
|
934 |
],
|
935 |
"max_steps": 1000000,
|
936 |
"num_train_epochs": 9223372036854775807,
|
937 |
-
"total_flos":
|
938 |
"trial_name": null,
|
939 |
"trial_params": null
|
940 |
}
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 0.1,
|
5 |
+
"global_step": 100000,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
576 |
{
|
577 |
"epoch": 0.09,
|
578 |
"learning_rate": 9.94716380576598e-05,
|
579 |
+
"loss": 0.7419,
|
580 |
"step": 94000
|
581 |
},
|
582 |
{
|
583 |
"epoch": 0.1,
|
584 |
"learning_rate": 9.944739353007344e-05,
|
585 |
+
"loss": 0.7442,
|
586 |
"step": 95000
|
587 |
},
|
588 |
{
|
589 |
"epoch": 0.1,
|
590 |
"learning_rate": 9.942260825371358e-05,
|
591 |
+
"loss": 0.7534,
|
592 |
"step": 96000
|
593 |
},
|
594 |
{
|
595 |
"epoch": 0.1,
|
596 |
"learning_rate": 9.939728249962807e-05,
|
597 |
+
"loss": 0.7503,
|
598 |
"step": 97000
|
599 |
},
|
600 |
{
|
601 |
"epoch": 0.1,
|
602 |
"learning_rate": 9.937141654477528e-05,
|
603 |
+
"loss": 0.7482,
|
604 |
"step": 98000
|
605 |
},
|
606 |
{
|
607 |
"epoch": 0.1,
|
608 |
"learning_rate": 9.934501067202117e-05,
|
609 |
+
"loss": 0.7546,
|
610 |
"step": 99000
|
611 |
},
|
612 |
{
|
613 |
"epoch": 0.1,
|
614 |
"learning_rate": 9.931806517013612e-05,
|
615 |
+
"loss": 0.7459,
|
616 |
"step": 100000
|
617 |
},
|
618 |
{
|
619 |
"epoch": 0.1,
|
620 |
+
"eval_loss": 0.3987598419189453,
|
621 |
+
"eval_runtime": 34.6601,
|
622 |
+
"eval_samples_per_second": 144.258,
|
623 |
+
"eval_steps_per_second": 2.279,
|
624 |
"step": 100000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
625 |
}
|
626 |
],
|
627 |
"max_steps": 1000000,
|
628 |
"num_train_epochs": 9223372036854775807,
|
629 |
+
"total_flos": 5.9649898315776e+18,
|
630 |
"trial_name": null,
|
631 |
"trial_params": null
|
632 |
}
|
last-checkpoint/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3503
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0444fe16bf9b06a68fd5e817595cfc6c792710fbf61e20d4bbac3d798ec5d5a1
|
3 |
size 3503
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1346893675
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:47992429487d016109373d5a83150b8f5e4877618c7785bb61465cd39529dc23
|
3 |
size 1346893675
|
runs/Feb17_16-44-06_t1v-n-7a44a9fa-w-0/events.out.tfevents.1676652777.t1v-n-7a44a9fa-w-0.1006877.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3eb0de50730ded5ac6628dd35ac7d8f855e7114015809c0ea8d904e516303642
|
3 |
+
size 26348
|
runs/Feb24_00-19-02_t1v-n-7a44a9fa-w-0/1677197978.0466611/events.out.tfevents.1677197978.t1v-n-7a44a9fa-w-0.3980329.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:99a9b42ce553315c5ae0f62a8ef2bb4f9e4988d63ef2db77139558b4448d137c
|
3 |
+
size 5499
|
runs/Feb24_00-19-02_t1v-n-7a44a9fa-w-0/events.out.tfevents.1677197978.t1v-n-7a44a9fa-w-0.3980329.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e7f4ad62b8d375bec25c7f7865cb2e942e23f3c8a97fe87a416a403fffcf2a32
|
3 |
+
size 4196
|
runs/Feb24_02-54-45_t1v-n-7a44a9fa-w-0/1677207316.2172732/events.out.tfevents.1677207316.t1v-n-7a44a9fa-w-0.4014800.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e1043b6df313538f909cc57ea7fb5034def016a1f244203823cba9400afbff1
|
3 |
+
size 5499
|
runs/Feb24_02-54-45_t1v-n-7a44a9fa-w-0/events.out.tfevents.1677207316.t1v-n-7a44a9fa-w-0.4014800.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:72df6f83ff4681aef8d4f8a07929eb5259beb82227cc8032760fbe37d6f2f5bd
|
3 |
+
size 4196
|
runs/Feb24_03-42-21_t1v-n-7a44a9fa-w-0/1677210177.3730767/events.out.tfevents.1677210177.t1v-n-7a44a9fa-w-0.4043690.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:97b30d40948a8434ba8d7568418e73eff3f78cd3787650f2001e60a36ac16d41
|
3 |
+
size 5499
|
runs/Feb24_03-42-21_t1v-n-7a44a9fa-w-0/events.out.tfevents.1677210177.t1v-n-7a44a9fa-w-0.4043690.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f2e0c8f61288e5437e4a721d20ed4ca5cae02634083bce843341d43b7d6d54b5
|
3 |
+
size 4196
|
runs/Feb25_19-27-01_t1v-n-7a44a9fa-w-0/1677353255.835489/events.out.tfevents.1677353255.t1v-n-7a44a9fa-w-0.33944.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:94591a885a43cf4cc1b330b7aab942b6333f26fd1a8c93b95e944abec60cf5ea
|
3 |
+
size 5499
|
runs/Feb25_19-27-01_t1v-n-7a44a9fa-w-0/events.out.tfevents.1677353255.t1v-n-7a44a9fa-w-0.33944.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:14eb0c602f55affbf1d46b9db6d589f6bc0300da3c89a85d4dda61c28acb12e8
|
3 |
+
size 12112
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3503
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0444fe16bf9b06a68fd5e817595cfc6c792710fbf61e20d4bbac3d798ec5d5a1
|
3 |
size 3503
|