medium_test

Browse files

Files changed (13) hide show

.gitignore +1 -0
all_results.json +28 -0
config.json +57 -0
eval_results.json +13 -0
generated_predictions.txt +7 -0
predict_results.json +12 -0
pytorch_model.bin +3 -0
special_tokens_map.json +1 -0
spiece.model +3 -0
tokenizer.json +0 -0
tokenizer_config.json +1 -0
train_results.json +8 -0
training_args.bin +3 -0

.gitignore ADDED Viewed

	@@ -0,0 +1 @@


1	+ checkpoint-*/

all_results.json ADDED Viewed

	@@ -0,0 +1,28 @@

+{
+    "epoch": 2.95,
+    "eval_gen_len": 33.1429,
+    "eval_loss": 0.4828817844390869,
+    "eval_rouge1": 80.6131,
+    "eval_rouge2": 73.305,
+    "eval_rougeL": 79.6954,
+    "eval_rougeLsum": 79.6954,
+    "eval_runtime": 2.536,
+    "eval_samples": 7,
+    "eval_samples_per_second": 2.76,
+    "eval_steps_per_second": 0.789,
+    "predict_gen_len": 33.1429,
+    "predict_loss": 0.4828817844390869,
+    "predict_rouge1": 80.6131,
+    "predict_rouge2": 73.305,
+    "predict_rougeL": 79.6954,
+    "predict_rougeLsum": 79.6954,
+    "predict_runtime": 2.541,
+    "predict_samples": 7,
+    "predict_samples_per_second": 2.755,
+    "predict_steps_per_second": 0.787,
+    "train_loss": 0.7666861640082465,
+    "train_runtime": 31.051,
+    "train_samples": 252,
+    "train_samples_per_second": 24.347,
+    "train_steps_per_second": 1.449
+}

config.json ADDED Viewed

	@@ -0,0 +1,57 @@

+{
+  "_name_or_path": "Vamsi/T5_Paraphrase_Paws",
+  "architectures": [
+    "T5ForConditionalGeneration"
+  ],
+  "d_ff": 3072,
+  "d_kv": 64,
+  "d_model": 768,
+  "decoder_start_token_id": 0,
+  "dropout_rate": 0.1,
+  "eos_token_id": 1,
+  "feed_forward_proj": "relu",
+  "initializer_factor": 1.0,
+  "is_encoder_decoder": true,
+  "layer_norm_epsilon": 1e-06,
+  "model_type": "t5",
+  "n_positions": 512,
+  "num_decoder_layers": 12,
+  "num_heads": 12,
+  "num_layers": 12,
+  "output_past": true,
+  "pad_token_id": 0,
+  "relative_attention_num_buckets": 32,
+  "task_specific_params": {
+    "summarization": {
+      "early_stopping": true,
+      "length_penalty": 2.0,
+      "max_length": 200,
+      "min_length": 30,
+      "no_repeat_ngram_size": 3,
+      "num_beams": 4,
+      "prefix": "summarize: "
+    },
+    "translation_en_to_de": {
+      "early_stopping": true,
+      "max_length": 300,
+      "num_beams": 4,
+      "prefix": "translate English to German: "
+    },
+    "translation_en_to_fr": {
+      "early_stopping": true,
+      "max_length": 300,
+      "num_beams": 4,
+      "prefix": "translate English to French: "
+    },
+    "translation_en_to_ro": {
+      "early_stopping": true,
+      "max_length": 300,
+      "num_beams": 4,
+      "prefix": "translate English to Romanian: "
+    }
+  },
+  "torch_dtype": "float32",
+  "transformers_version": "4.15.0",
+  "use_cache": true,
+  "vocab_size": 32100
+}

eval_results.json ADDED Viewed

	@@ -0,0 +1,13 @@

+{
+    "epoch": 2.95,
+    "eval_gen_len": 33.1429,
+    "eval_loss": 0.4828817844390869,
+    "eval_rouge1": 80.6131,
+    "eval_rouge2": 73.305,
+    "eval_rougeL": 79.6954,
+    "eval_rougeLsum": 79.6954,
+    "eval_runtime": 2.536,
+    "eval_samples": 7,
+    "eval_samples_per_second": 2.76,
+    "eval_steps_per_second": 0.789
+}

generated_predictions.txt ADDED Viewed

	@@ -0,0 +1,7 @@

+Danny Bazil Riley started working as general manager at a commercial real estate firm at an annual base salary of #36;70,000. Soon after a financial planner stopped by his desk to drop off brochures about insurance benefits available through his employer. But at 32, "buying insurance was the furthest thing from my mind," Riley says.
+Short-sellers, Wall Street's dwindling band of ultra-cynics, are seeing green again ### END
+Soaring crude prices ### outlook for earnings are expected to hang over the stock market next ### END
+OPEC can do nothing to douse scorching oil prices when markets are already oversupplied by 2.8 million barrels per day (bpd) of crude ### END
+Non-OPEC oil exporters should consider increasing output to cool record crude prices ### END
+The auction for Google Inc.'s highly anticipated initial public offering got off to a rocky start on Friday ### END
+The dollar tumbled broadly on Friday ### END

predict_results.json ADDED Viewed

	@@ -0,0 +1,12 @@

+{
+    "predict_gen_len": 33.1429,
+    "predict_loss": 0.4828817844390869,
+    "predict_rouge1": 80.6131,
+    "predict_rouge2": 73.305,
+    "predict_rougeL": 79.6954,
+    "predict_rougeLsum": 79.6954,
+    "predict_runtime": 2.541,
+    "predict_samples": 7,
+    "predict_samples_per_second": 2.755,
+    "predict_steps_per_second": 0.787
+}

pytorch_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6bfd4f9feaf2691d94dc1e0bbb2677fb114aa0a1a4ed1f7370504cf292a19bdb
+size 891644863

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1 @@

+ {"eos_token": "</s>", "unk_token": "<unk>", "pad_token": "<pad>", "additional_special_tokens": ["<extra_id_0>", "<extra_id_1>", "<extra_id_2>", "<extra_id_3>", "<extra_id_4>", "<extra_id_5>", "<extra_id_6>", "<extra_id_7>", "<extra_id_8>", "<extra_id_9>", "<extra_id_10>", "<extra_id_11>", "<extra_id_12>", "<extra_id_13>", "<extra_id_14>", "<extra_id_15>", "<extra_id_16>", "<extra_id_17>", "<extra_id_18>", "<extra_id_19>", "<extra_id_20>", "<extra_id_21>", "<extra_id_22>", "<extra_id_23>", "<extra_id_24>", "<extra_id_25>", "<extra_id_26>", "<extra_id_27>", "<extra_id_28>", "<extra_id_29>", "<extra_id_30>", "<extra_id_31>", "<extra_id_32>", "<extra_id_33>", "<extra_id_34>", "<extra_id_35>", "<extra_id_36>", "<extra_id_37>", "<extra_id_38>", "<extra_id_39>", "<extra_id_40>", "<extra_id_41>", "<extra_id_42>", "<extra_id_43>", "<extra_id_44>", "<extra_id_45>", "<extra_id_46>", "<extra_id_47>", "<extra_id_48>", "<extra_id_49>", "<extra_id_50>", "<extra_id_51>", "<extra_id_52>", "<extra_id_53>", "<extra_id_54>", "<extra_id_55>", "<extra_id_56>", "<extra_id_57>", "<extra_id_58>", "<extra_id_59>", "<extra_id_60>", "<extra_id_61>", "<extra_id_62>", "<extra_id_63>", "<extra_id_64>", "<extra_id_65>", "<extra_id_66>", "<extra_id_67>", "<extra_id_68>", "<extra_id_69>", "<extra_id_70>", "<extra_id_71>", "<extra_id_72>", "<extra_id_73>", "<extra_id_74>", "<extra_id_75>", "<extra_id_76>", "<extra_id_77>", "<extra_id_78>", "<extra_id_79>", "<extra_id_80>", "<extra_id_81>", "<extra_id_82>", "<extra_id_83>", "<extra_id_84>", "<extra_id_85>", "<extra_id_86>", "<extra_id_87>", "<extra_id_88>", "<extra_id_89>", "<extra_id_90>", "<extra_id_91>", "<extra_id_92>", "<extra_id_93>", "<extra_id_94>", "<extra_id_95>", "<extra_id_96>", "<extra_id_97>", "<extra_id_98>", "<extra_id_99>"]}

spiece.model ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d60acb128cf7b7f2536e8f38a5b18a05535c9e14c7a355904270e15b0945ea86
+size 791656

tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1 @@

+ {"eos_token": "</s>", "unk_token": "<unk>", "pad_token": "<pad>", "extra_ids": 100, "additional_special_tokens": ["<extra_id_0>", "<extra_id_1>", "<extra_id_2>", "<extra_id_3>", "<extra_id_4>", "<extra_id_5>", "<extra_id_6>", "<extra_id_7>", "<extra_id_8>", "<extra_id_9>", "<extra_id_10>", "<extra_id_11>", "<extra_id_12>", "<extra_id_13>", "<extra_id_14>", "<extra_id_15>", "<extra_id_16>", "<extra_id_17>", "<extra_id_18>", "<extra_id_19>", "<extra_id_20>", "<extra_id_21>", "<extra_id_22>", "<extra_id_23>", "<extra_id_24>", "<extra_id_25>", "<extra_id_26>", "<extra_id_27>", "<extra_id_28>", "<extra_id_29>", "<extra_id_30>", "<extra_id_31>", "<extra_id_32>", "<extra_id_33>", "<extra_id_34>", "<extra_id_35>", "<extra_id_36>", "<extra_id_37>", "<extra_id_38>", "<extra_id_39>", "<extra_id_40>", "<extra_id_41>", "<extra_id_42>", "<extra_id_43>", "<extra_id_44>", "<extra_id_45>", "<extra_id_46>", "<extra_id_47>", "<extra_id_48>", "<extra_id_49>", "<extra_id_50>", "<extra_id_51>", "<extra_id_52>", "<extra_id_53>", "<extra_id_54>", "<extra_id_55>", "<extra_id_56>", "<extra_id_57>", "<extra_id_58>", "<extra_id_59>", "<extra_id_60>", "<extra_id_61>", "<extra_id_62>", "<extra_id_63>", "<extra_id_64>", "<extra_id_65>", "<extra_id_66>", "<extra_id_67>", "<extra_id_68>", "<extra_id_69>", "<extra_id_70>", "<extra_id_71>", "<extra_id_72>", "<extra_id_73>", "<extra_id_74>", "<extra_id_75>", "<extra_id_76>", "<extra_id_77>", "<extra_id_78>", "<extra_id_79>", "<extra_id_80>", "<extra_id_81>", "<extra_id_82>", "<extra_id_83>", "<extra_id_84>", "<extra_id_85>", "<extra_id_86>", "<extra_id_87>", "<extra_id_88>", "<extra_id_89>", "<extra_id_90>", "<extra_id_91>", "<extra_id_92>", "<extra_id_93>", "<extra_id_94>", "<extra_id_95>", "<extra_id_96>", "<extra_id_97>", "<extra_id_98>", "<extra_id_99>"], "model_max_length": 512, "special_tokens_map_file": "C:\\Users\\peter/.cache\\huggingface\\transformers\\ca670222dc28504dc97cb6136cadc777e4158e3b346f98b99064406f5ac6eac0.c94798918c92ded6aeef2d2f0e666d2cc4145eca1aa6e1336fde07f2e13e2f46", "name_or_path": "Vamsi/T5_Paraphrase_Paws", "sp_model_kwargs": {}, "tokenizer_class": "T5Tokenizer"}

train_results.json ADDED Viewed

	@@ -0,0 +1,8 @@

+{
+    "epoch": 2.95,
+    "train_loss": 0.7666861640082465,
+    "train_runtime": 31.051,
+    "train_samples": 252,
+    "train_samples_per_second": 24.347,
+    "train_steps_per_second": 1.449
+}

training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bf8d9c3c9936cb871cebcdaea9f4bf6dce8ca2eca8a689ec8e0471393131ba89
+size 3055