Spaces:

nicpopovic
/

ember_chat

Sleeping

App Files Community

nicpopovic committed on Oct 11, 2024

Commit

b244637

verified ·

1 Parent(s): 9979f92

Upload 8 files

Browse files

Files changed (8) hide show

data/meta-llama/Llama-3.2-1B-Instruct/STOKE_500_wikiqa/checkpoints/span_classifier/B7Ogkftne6/checkpoint.pt +3 -0
data/meta-llama/Llama-3.2-1B-Instruct/STOKE_500_wikiqa/checkpoints/span_classifier/B7Ogkftne6/config.json +29 -0
data/meta-llama/Llama-3.2-1B-Instruct/STOKE_500_wikiqa/checkpoints/span_classifier/B7Ogkftne6/config_train.json +53 -0
data/meta-llama/Llama-3.2-1B-Instruct/STOKE_500_wikiqa/checkpoints/token_classifier/ShBuzLjzh9/checkpoint.pt +3 -0
data/meta-llama/Llama-3.2-1B-Instruct/STOKE_500_wikiqa/checkpoints/token_classifier/ShBuzLjzh9/config.json +166 -0
data/meta-llama/Llama-3.2-1B-Instruct/STOKE_500_wikiqa/checkpoints/token_classifier/ShBuzLjzh9/config_train.json +53 -0
data/meta-llama/Llama-3.2-1B-Instruct/STOKE_500_wikiqa/config.json +8 -0
data/meta-llama/Llama-3.2-1B-Instruct/STOKE_500_wikiqa/stoke_config.json +10 -0

data/meta-llama/Llama-3.2-1B-Instruct/STOKE_500_wikiqa/checkpoints/span_classifier/B7Ogkftne6/checkpoint.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f8ed0c5f360111a0cf03c113e844eb99d5a25966859f2b746cdfecb0641c1b34
+size 8439912

data/meta-llama/Llama-3.2-1B-Instruct/STOKE_500_wikiqa/checkpoints/span_classifier/B7Ogkftne6/config.json ADDED Viewed

	@@ -0,0 +1,29 @@

+{
+ "model": "meta-llama/Llama-3.2-1B-Instruct",
+ "type": "span_classifier",
+ "label_map": [
+  "no_span",
+  "span"
+ ],
+ "learning_rate": 0.001,
+ "classifier_dim": 4096,
+ "loss_weights": [
+  1.0,
+  50.0
+ ],
+ "identifier": "B7Ogkftne6",
+ "best_f1_validation": 0.5553668737411499,
+ "best_f1_validation_classwise": {
+  "span": {
+   "p": 0.3978736698627472,
+   "r": 0.9192339777946472,
+   "f": 0.5553668737411499,
+   "s": 4804.0
+  },
+  "macro": {
+   "p": 0.3978736698627472,
+   "r": 0.9192339777946472,
+   "f": 0.5553668737411499
+  }
+ }
+}

data/meta-llama/Llama-3.2-1B-Instruct/STOKE_500_wikiqa/checkpoints/span_classifier/B7Ogkftne6/config_train.json ADDED Viewed

	@@ -0,0 +1,53 @@

+{
+ "path": "data/meta-llama/Llama-3.2-1B-Instruct/STOKE_500_wikiqa",
+ "splits": [
+  "train",
+  "validation"
+ ],
+ "layers": [
+  8,
+  9,
+  10,
+  11,
+  12
+ ],
+ "hfcache": "",
+ "classifier_dims": [
+  4096
+ ],
+ "learning_rates": [
+  0.0001,
+  5e-05,
+  0.0003,
+  0.0005,
+  0.001
+ ],
+ "cuda": true,
+ "n_steps_per_epoch": 500,
+ "n_epochs": 30,
+ "batch_size": 4,
+ "balance_loss": false,
+ "loss_weights_span": [
+  [
+   1.0,
+   1.0
+  ],
+  [
+   1.0,
+   50.0
+  ],
+  [
+   1.0,
+   100.0
+  ]
+ ],
+ "time": 1728553144.1331656,
+ "config_dataset": {
+  "generation_kwargs": {
+   "max_new_tokens": 500,
+   "repetition_penalty": 1.2
+  },
+  "model_id": "meta-llama/Llama-3.2-1B-Instruct",
+  "flair_model_name": "flair/ner-english-ontonotes-large"
+ }
+}

data/meta-llama/Llama-3.2-1B-Instruct/STOKE_500_wikiqa/checkpoints/token_classifier/ShBuzLjzh9/checkpoint.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:95f1f6318f661446e7ff38af3e31293ba1f0fc88ed94aee0a8c47ceaf6ec2b1c
+size 33884328

data/meta-llama/Llama-3.2-1B-Instruct/STOKE_500_wikiqa/checkpoints/token_classifier/ShBuzLjzh9/config.json ADDED Viewed

	@@ -0,0 +1,166 @@

+{
+ "layer": 10,
+ "model": "meta-llama/Llama-3.2-1B-Instruct",
+ "type": "token_classifier",
+ "label_map": [
+  "O",
+  "CARDINAL",
+  "DATE",
+  "EVENT",
+  "FAC",
+  "GPE",
+  "LANGUAGE",
+  "LAW",
+  "LOC",
+  "MONEY",
+  "NORP",
+  "ORDINAL",
+  "ORG",
+  "PERCENT",
+  "PERSON",
+  "PRODUCT",
+  "QUANTITY",
+  "TIME",
+  "WORK_OF_ART"
+ ],
+ "learning_rate": 0.001,
+ "classifier_dim": 4096,
+ "loss_weights": [
+  1.0,
+  1.0,
+  1.0,
+  1.0,
+  1.0,
+  1.0,
+  1.0,
+  1.0,
+  1.0,
+  1.0,
+  1.0,
+  1.0,
+  1.0,
+  1.0,
+  1.0,
+  1.0,
+  1.0,
+  1.0,
+  1.0
+ ],
+ "identifier": "ShBuzLjzh9",
+ "best_f1_validation": 0.8960928916931152,
+ "best_f1_validation_classwise": {
+  "CARDINAL": {
+   "p": 0.8828781247138977,
+   "r": 0.9042496085166931,
+   "f": 0.8934361338615417,
+   "s": 1859.0
+  },
+  "DATE": {
+   "p": 0.9753617644309998,
+   "r": 0.9696733951568604,
+   "f": 0.9725092649459839,
+   "s": 5144.0
+  },
+  "EVENT": {
+   "p": 0.8030303120613098,
+   "r": 0.7194570302963257,
+   "f": 0.758949875831604,
+   "s": 221.0
+  },
+  "FAC": {
+   "p": 0.7110481858253479,
+   "r": 0.7011173367500305,
+   "f": 0.7060478329658508,
+   "s": 358.0
+  },
+  "GPE": {
+   "p": 0.8975331783294678,
+   "r": 0.9113680124282837,
+   "f": 0.9043976664543152,
+   "s": 1038.0
+  },
+  "LANGUAGE": {
+   "p": 0.9354838728904724,
+   "r": 0.8787878751754761,
+   "f": 0.90625,
+   "s": 66.0
+  },
+  "LAW": {
+   "p": 0.8544303774833679,
+   "r": 0.7714285850524902,
+   "f": 0.8108107447624207,
+   "s": 175.0
+  },
+  "LOC": {
+   "p": 0.6557376980781555,
+   "r": 0.6425702571868896,
+   "f": 0.6490872502326965,
+   "s": 249.0
+  },
+  "MONEY": {
+   "p": 0.9277108311653137,
+   "r": 0.9277108311653137,
+   "f": 0.9277108311653137,
+   "s": 166.0
+  },
+  "NORP": {
+   "p": 0.8764045238494873,
+   "r": 0.7852349281311035,
+   "f": 0.8283185958862305,
+   "s": 298.0
+  },
+  "ORDINAL": {
+   "p": 0.8032786846160889,
+   "r": 0.8909090757369995,
+   "f": 0.8448275923728943,
+   "s": 55.0
+  },
+  "ORG": {
+   "p": 0.8269370198249817,
+   "r": 0.8305454254150391,
+   "f": 0.8287373185157776,
+   "s": 1375.0
+  },
+  "PERCENT": {
+   "p": 0.939130425453186,
+   "r": 0.7248322367668152,
+   "f": 0.8181818127632141,
+   "s": 149.0
+  },
+  "PERSON": {
+   "p": 0.9401294589042664,
+   "r": 0.9535011053085327,
+   "f": 0.9467681050300598,
+   "s": 1828.0
+  },
+  "PRODUCT": {
+   "p": 0.7434554696083069,
+   "r": 0.4610389471054077,
+   "f": 0.56913822889328,
+   "s": 308.0
+  },
+  "QUANTITY": {
+   "p": 0.8620689511299133,
+   "r": 0.8796296119689941,
+   "f": 0.8707607984542847,
+   "s": 540.0
+  },
+  "TIME": {
+   "p": 0.6315789222717285,
+   "r": 0.4285714328289032,
+   "f": 0.5106382369995117,
+   "s": 56.0
+  },
+  "WORK_OF_ART": {
+   "p": 0.8444194197654724,
+   "r": 0.8221734166145325,
+   "f": 0.8331480026245117,
+   "s": 911.0
+  },
+  "macro": {
+   "p": 0.8394787311553955,
+   "r": 0.7890443801879883,
+   "f": 0.8099843859672546
+  }
+ }
+}

data/meta-llama/Llama-3.2-1B-Instruct/STOKE_500_wikiqa/checkpoints/token_classifier/ShBuzLjzh9/config_train.json ADDED Viewed

	@@ -0,0 +1,53 @@

+{
+ "path": "data/meta-llama/Llama-3.2-1B-Instruct/STOKE_500_wikiqa",
+ "splits": [
+  "train",
+  "validation"
+ ],
+ "layers": [
+  8,
+  9,
+  10,
+  11,
+  12
+ ],
+ "hfcache": "",
+ "classifier_dims": [
+  4096
+ ],
+ "learning_rates": [
+  0.0001,
+  5e-05,
+  0.0003,
+  0.0005,
+  0.001
+ ],
+ "cuda": true,
+ "n_steps_per_epoch": 500,
+ "n_epochs": 30,
+ "batch_size": 4,
+ "balance_loss": false,
+ "loss_weights_span": [
+  [
+   1.0,
+   1.0
+  ],
+  [
+   1.0,
+   50.0
+  ],
+  [
+   1.0,
+   100.0
+  ]
+ ],
+ "time": 1728553144.1331656,
+ "config_dataset": {
+  "generation_kwargs": {
+   "max_new_tokens": 500,
+   "repetition_penalty": 1.2
+  },
+  "model_id": "meta-llama/Llama-3.2-1B-Instruct",
+  "flair_model_name": "flair/ner-english-ontonotes-large"
+ }
+}

data/meta-llama/Llama-3.2-1B-Instruct/STOKE_500_wikiqa/config.json ADDED Viewed

	@@ -0,0 +1,8 @@

+{
+    "generation_kwargs": {
+     "max_new_tokens": 500,
+     "repetition_penalty": 1.2
+    },
+    "model_id": "meta-llama/Llama-3.2-1B-Instruct",
+    "flair_model_name": "flair/ner-english-ontonotes-large"
+   }

data/meta-llama/Llama-3.2-1B-Instruct/STOKE_500_wikiqa/stoke_config.json ADDED Viewed

	@@ -0,0 +1,10 @@

+{
+    "default": {
+        "classifier_token": "data/meta-llama/Llama-3.2-1B-Instruct/STOKE_500_wikiqa/checkpoints/token_classifier/ShBuzLjzh9",
+        "classifier_span": "data/meta-llama/Llama-3.2-1B-Instruct/STOKE_500_wikiqa/checkpoints/span_classifier/B7Ogkftne6"
+    },
+    "basic": {
+        "classifier_token": "data/meta-llama/Llama-3.2-1B-Instruct/STOKE_500_wikiqa/checkpoints/token_classifier/ShBuzLjzh9",
+        "classifier_span": "data/meta-llama/Llama-3.2-1B-Instruct/STOKE_500_wikiqa/checkpoints/span_classifier/lx17UmlUbN"
+    }
+}