Tech-oriented committed on Mar 3, 2024

Commit

c6bdb57

verified ·

1 Parent(s): 7a5942d

Training in progress, epoch 1

Browse files

Files changed (37) hide show

model.safetensors +1 -1
run-10/checkpoint-211/config.json +27 -0
run-10/checkpoint-211/model.safetensors +3 -0
run-10/checkpoint-211/optimizer.pt +3 -0
run-10/checkpoint-211/rng_state.pth +3 -0
run-10/checkpoint-211/scheduler.pt +3 -0
run-10/checkpoint-211/special_tokens_map.json +7 -0
run-10/checkpoint-211/tokenizer.json +0 -0
run-10/checkpoint-211/tokenizer_config.json +55 -0
run-10/checkpoint-211/trainer_state.json +35 -0
run-10/checkpoint-211/training_args.bin +3 -0
run-10/checkpoint-211/vocab.txt +0 -0
run-10/checkpoint-422/config.json +27 -0
run-10/checkpoint-422/model.safetensors +3 -0
run-10/checkpoint-422/optimizer.pt +3 -0
run-10/checkpoint-422/rng_state.pth +3 -0
run-10/checkpoint-422/scheduler.pt +3 -0
run-10/checkpoint-422/special_tokens_map.json +7 -0
run-10/checkpoint-422/tokenizer.json +0 -0
run-10/checkpoint-422/tokenizer_config.json +55 -0
run-10/checkpoint-422/trainer_state.json +44 -0
run-10/checkpoint-422/training_args.bin +3 -0
run-10/checkpoint-422/vocab.txt +0 -0
run-11/checkpoint-211/config.json +27 -0
run-11/checkpoint-211/model.safetensors +3 -0
run-11/checkpoint-211/optimizer.pt +3 -0
run-11/checkpoint-211/rng_state.pth +3 -0
run-11/checkpoint-211/scheduler.pt +3 -0
run-11/checkpoint-211/special_tokens_map.json +7 -0
run-11/checkpoint-211/tokenizer.json +0 -0
run-11/checkpoint-211/tokenizer_config.json +55 -0
run-11/checkpoint-211/trainer_state.json +35 -0
run-11/checkpoint-211/training_args.bin +3 -0
run-11/checkpoint-211/vocab.txt +0 -0
runs/Mar03_17-42-01_90708aaa767a/events.out.tfevents.1709499337.90708aaa767a.21824.28 +3 -0
runs/Mar03_17-42-01_90708aaa767a/events.out.tfevents.1709499505.90708aaa767a.21824.29 +3 -0
training_args.bin +1 -1

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d201f460d7bdd8145286af8f5c723f35f0050e28c4afafc6d56d06ce2595b40d
+oid sha256:4fbe36943eedb3184229a1a5974bcc08a70bed558ba6f4453cecbfadb1f62b89
 size 437958648

run-10/checkpoint-211/config.json ADDED Viewed

	@@ -0,0 +1,27 @@

+{
+  "_name_or_path": "bert-base-uncased",
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.2",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 30522
+}

run-10/checkpoint-211/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:70ab8ef25bf1e4159772370368c1515778946b06823ea30f59d96b4dbf60213c
+size 437958648

run-10/checkpoint-211/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:308f8d713e5a87239b411e0ade5ae8dc05aed0770e0b57f3f09c41b8d055f12a
+size 876038394

run-10/checkpoint-211/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7dd536778dff8e09a3adf2e1ada791b7834e50ce1a519297f5a7325f25e66d5b
+size 14244

run-10/checkpoint-211/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f76f8626a957a82c8b8b309f0323ac0593df8a5f9f62ab64e2d64b3818d25ab1
+size 1064

run-10/checkpoint-211/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-10/checkpoint-211/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-10/checkpoint-211/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
+  "unk_token": "[UNK]"
+}

run-10/checkpoint-211/trainer_state.json ADDED Viewed

	@@ -0,0 +1,35 @@

+{
+  "best_metric": 0.9071100917431193,
+  "best_model_checkpoint": "bert-base-uncased-finetuned-sst2/run-10/checkpoint-211",
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 211,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.9071100917431193,
+      "eval_loss": 0.21861808001995087,
+      "eval_runtime": 2.4313,
+      "eval_samples_per_second": 358.662,
+      "eval_steps_per_second": 22.622,
+      "step": 211
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 844,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 4,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 32,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 5.8551043262104743e-05,
+    "num_train_epochs": 4,
+    "per_device_train_batch_size": 32,
+    "seed": 4
+  }
+}

run-10/checkpoint-211/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:867a6a56564c0c496d5770014cefc137b8c04861a257894a96083bcaf8e241ae
+size 4920

run-10/checkpoint-211/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-10/checkpoint-422/config.json ADDED Viewed

	@@ -0,0 +1,27 @@

+{
+  "_name_or_path": "bert-base-uncased",
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.2",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 30522
+}

run-10/checkpoint-422/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3feffa37f54807c648accec23430c7d34012c75d23a02861bd0496d35e00fbd8
+size 437958648

run-10/checkpoint-422/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ba411534c4f32acd29630e6f8991f051ab26c199b740b913c7d98aef00c633a5
+size 876038394

run-10/checkpoint-422/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a552a367005c08fc935fba6db0178fd612c11143da54160857b415e72c8168bd
+size 14244

run-10/checkpoint-422/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:03ff796904ee2f8f12ba22ca3390052f8969ceb72b1756ffb73164188028de83
+size 1064

run-10/checkpoint-422/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-10/checkpoint-422/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-10/checkpoint-422/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
+  "unk_token": "[UNK]"
+}

run-10/checkpoint-422/trainer_state.json ADDED Viewed

	@@ -0,0 +1,44 @@

+{
+  "best_metric": 0.9094036697247706,
+  "best_model_checkpoint": "bert-base-uncased-finetuned-sst2/run-10/checkpoint-422",
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 422,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.9071100917431193,
+      "eval_loss": 0.21861808001995087,
+      "eval_runtime": 2.4313,
+      "eval_samples_per_second": 358.662,
+      "eval_steps_per_second": 22.622,
+      "step": 211
+    },
+    {
+      "epoch": 2.0,
+      "eval_accuracy": 0.9094036697247706,
+      "eval_loss": 0.26571977138519287,
+      "eval_runtime": 2.4292,
+      "eval_samples_per_second": 358.961,
+      "eval_steps_per_second": 22.641,
+      "step": 422
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 844,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 4,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 32,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 5.8551043262104743e-05,
+    "num_train_epochs": 4,
+    "per_device_train_batch_size": 32,
+    "seed": 4
+  }
+}

run-10/checkpoint-422/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:867a6a56564c0c496d5770014cefc137b8c04861a257894a96083bcaf8e241ae
+size 4920

run-10/checkpoint-422/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-11/checkpoint-211/config.json ADDED Viewed

	@@ -0,0 +1,27 @@

+{
+  "_name_or_path": "bert-base-uncased",
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.2",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 30522
+}

run-11/checkpoint-211/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4fbe36943eedb3184229a1a5974bcc08a70bed558ba6f4453cecbfadb1f62b89
+size 437958648

run-11/checkpoint-211/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1398939f877b65a1ab4cf8011c8123eef46c668392356e3ad3a34eafcf0961e2
+size 876038394

run-11/checkpoint-211/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bacf6ed581f22ac50e4e426230d241f2f0a079241fe3ec5f490f2ba20a6c4ab2
+size 14244

run-11/checkpoint-211/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9a82ddf5ad45740190831e7e00ffc66b55f0e1d0b0a8bc15e7969ac2d93687d2
+size 1064

run-11/checkpoint-211/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-11/checkpoint-211/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-11/checkpoint-211/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
+  "unk_token": "[UNK]"
+}

run-11/checkpoint-211/trainer_state.json ADDED Viewed

	@@ -0,0 +1,35 @@

+{
+  "best_metric": 0.9036697247706422,
+  "best_model_checkpoint": "bert-base-uncased-finetuned-sst2/run-11/checkpoint-211",
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 211,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.9036697247706422,
+      "eval_loss": 0.22603479027748108,
+      "eval_runtime": 2.4304,
+      "eval_samples_per_second": 358.785,
+      "eval_steps_per_second": 22.63,
+      "step": 211
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 844,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 4,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 32,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 5.0602619122090524e-05,
+    "num_train_epochs": 4,
+    "per_device_train_batch_size": 32,
+    "seed": 5
+  }
+}

run-11/checkpoint-211/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c20f491bcd258cb2b04ee82e11e2d99e0be3d52fceef83399f1e08b07b63e13c
+size 4920

run-11/checkpoint-211/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

runs/Mar03_17-42-01_90708aaa767a/events.out.tfevents.1709499337.90708aaa767a.21824.28 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:95c34637a63a1e425374d8544c1e731612f83d6c0bc106c0930334eb85df4380
+size 5804

runs/Mar03_17-42-01_90708aaa767a/events.out.tfevents.1709499505.90708aaa767a.21824.29 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:68570fdff007113f9997eecc4e0e72053f5f3ca333b515dd7ec50b80515dd00a
+size 5804

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6ff0ded7f1550b2b2938d781c01cca247a57f943b1522ab0d31f9711c61ea56d
+oid sha256:c20f491bcd258cb2b04ee82e11e2d99e0be3d52fceef83399f1e08b07b63e13c
 size 4920