huggingartists

Files changed (9) hide show

README.md CHANGED Viewed

@@ -45,15 +45,15 @@ from datasets import load_dataset
 dataset = load_dataset("huggingartists/eminem")
 ```
-[Explore the data](https://wandb.ai/huggingartists/huggingartists/runs/w7y07ejq/artifacts), which is tracked with [W&B artifacts](https://docs.wandb.com/artifacts) at every step of the pipeline.
 ## Training procedure
 The model is based on a pre-trained [GPT-2](https://huggingface.co/gpt2) which is fine-tuned on Eminem's lyrics.
-Hyperparameters and metrics are recorded in the [W&B training run](https://wandb.ai/huggingartists/huggingartists/runs/1j6e92ir) for full transparency and reproducibility.
-At the end of training, [the final model](https://wandb.ai/huggingartists/huggingartists/runs/1j6e92ir/artifacts) is logged and versioned.
 ## How to use

 dataset = load_dataset("huggingartists/eminem")
 ```
+[Explore the data](https://wandb.ai/huggingartists/huggingartists/runs/3j11lytq/artifacts), which is tracked with [W&B artifacts](https://docs.wandb.com/artifacts) at every step of the pipeline.
 ## Training procedure
 The model is based on a pre-trained [GPT-2](https://huggingface.co/gpt2) which is fine-tuned on Eminem's lyrics.
+Hyperparameters and metrics are recorded in the [W&B training run](https://wandb.ai/huggingartists/huggingartists/runs/1zieygbg) for full transparency and reproducibility.
+At the end of training, [the final model](https://wandb.ai/huggingartists/huggingartists/runs/1zieygbg/artifacts) is logged and versioned.
 ## How to use

evaluation.txt CHANGED Viewed

	@@ -1 +1 @@
1	- {"eval_loss": 2.026026487350464, "eval_runtime": 32.1272, "eval_samples_per_second": 20.699, "eval_steps_per_second": 2.615, "epoch": 5.0}


1	+ {"eval_loss": 1.8596649169921875, "eval_runtime": 29.521, "eval_samples_per_second": 21.138, "eval_steps_per_second": 2.642, "epoch": 2.0}

flax_model.msgpack CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:464d4e7e6e4c6382358d88fef714b72f5deae64e28bfb5b9bf00f9ff6030918b
 size 497764120

 version https://git-lfs.github.com/spec/v1
+oid sha256:b135877e250da289f866a54700c125f37a80174dcc1e12dfb1f5dbd2249cdec2
 size 497764120

optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9f578f796fe425b739c57c93d4870307639bdede01ade17192cbfd7dade1337c
 size 995604017

 version https://git-lfs.github.com/spec/v1
+oid sha256:eecd9ef518643711b9927ae1f9897be18a83cabb4c9d4cb783637ffd91b94e92
 size 995604017

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5744d9da42094b4502ba2c2c52176dfb839e8656df36cf0783b4832a5444d42b
 size 510403817

 version https://git-lfs.github.com/spec/v1
+oid sha256:d63665b8addacc515cc738fbaa06e7fafcd26d90f9625949551144aaa6f57495
 size 510403817

rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1bd5d70a0d7170f2240ff3effc84cd6446ab98ec4b12f17cec590991fb7f5f94
-size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:2c4cd04e3d531ff616086aabe0842d017287cb7d6aa18753bc57ea83f5c6ec09
+size 14567

scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5606edb00c1d85c79a7e6e65c60470a6b50e72dc1246597e70873019f5c126ed
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:6cde66d2336c18c91f6044376f78eeeea90a1182517e78de002b9f811e407360
 size 623

trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
-  "best_metric": 2.026026487350464,
-  "best_model_checkpoint": "output/eminem/checkpoint-452",
   "epoch": 1.0,
-  "global_step": 452,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -554,11 +554,25 @@
       "eval_samples_per_second": 20.779,
       "eval_steps_per_second": 2.625,
       "step": 452
     }
   ],
-  "max_steps": 2260,
-  "num_train_epochs": 5,
-  "total_flos": 472024055808000.0,
   "trial_name": null,
   "trial_params": null
 }

 {
+  "best_metric": 1.8596649169921875,
+  "best_model_checkpoint": "output/eminem/checkpoint-457",
   "epoch": 1.0,
+  "global_step": 457,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 20.779,
       "eval_steps_per_second": 2.625,
       "step": 452
+    },
+    {
+      "epoch": 1.0,
+      "learning_rate": 1.757624254440622e-06,
+      "loss": 2.2171,
+      "step": 455
+    },
+    {
+      "epoch": 1.0,
+      "eval_loss": 1.8596649169921875,
+      "eval_runtime": 29.8564,
+      "eval_samples_per_second": 20.9,
+      "eval_steps_per_second": 2.613,
+      "step": 457
     }
   ],
+  "max_steps": 914,
+  "num_train_epochs": 2,
+  "total_flos": 476857958400000.0,
   "trial_name": null,
   "trial_params": null
 }

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:42cd89b75d7c0f3fe6da69fe6e477354496b002c63ce374ba6ee57264a045ed7
 size 2671

 version https://git-lfs.github.com/spec/v1
+oid sha256:a79cbab9dd97447de0d3db9f15d21e846aff0e011af608b06d64e13678d93e8a
 size 2671