Publishing model

Browse files

Files changed (10) hide show

.gitattributes +5 -0
.gitignore +1 -0
README.md +101 -0
config.json +3 -51
pytorch_model.bin +2 -2
special_tokens_map.json +3 -0
tokenizer.json +3 -0
tokenizer_config.json +3 -0
train_results.json +3 -0
vocab.json +3 -0

.gitattributes CHANGED Viewed

@@ -1,3 +1,4 @@
 *.7z filter=lfs diff=lfs merge=lfs -text
 *.arrow filter=lfs diff=lfs merge=lfs -text
 *.bin filter=lfs diff=lfs merge=lfs -text
@@ -25,3 +26,7 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zstandard filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.7z filter=lfs diff=lfs merge=lfs -text
 *.arrow filter=lfs diff=lfs merge=lfs -text
 *.bin filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zstandard filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+*.bin filter=lfs diff=lfs merge=lfs -text
+*.json filter=lfs diff=lfs merge=lfs -text

.gitignore ADDED Viewed

	@@ -0,0 +1 @@


1	+ .DS_Store

README.md ADDED Viewed

	@@ -0,0 +1,101 @@

+---
+license: mit
+tags:
+- generated_from_trainer
+datasets:
+- ju-bezdek/conll2003-SK-NER
+metrics:
+- precision
+- recall
+- f1
+- accuracy
+model-index:
+- name: outputs
+  results:
+  - task:
+      name: Token Classification
+      type: token-classification
+    dataset:
+      name: ju-bezdek/conll2003-SK-NER
+      type: ju-bezdek/conll2003-SK-NER
+      args: conll2003-SK-NER
+    metrics:
+    - name: Precision
+      type: precision
+      value: 0.8189727994593682
+    - name: Recall
+      type: recall
+      value: 0.8389581169955002
+    - name: F1
+      type: f1
+      value: 0.8288450029922203
+    - name: Accuracy
+      type: accuracy
+      value: 0.9526157920337243
+---
+<!-- This model card has been generated automatically according to the information the Trainer had access to. You
+should probably proofread and complete it, then remove this comment. -->
+# outputs
+This model is a fine-tuned version of [gerulata/slovakbert](https://huggingface.co/gerulata/slovakbert) on the ju-bezdek/conll2003-SK-NER dataset.
+It achieves the following results on the evaluation (validation) set:
+- Loss: 0.1752
+- Precision: 0.8190
+- Recall: 0.8390
+- F1: 0.8288
+- Accuracy: 0.9526
+## Model description
+More information needed
+## Intended uses & limitations
+More information needed
+## Training and evaluation data
+More information needed
+## Training procedure
+### Training hyperparameters
+The following hyperparameters were used during training:
+- learning_rate: 0.0001
+- train_batch_size: 16
+- eval_batch_size: 16
+- seed: 42
+- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
+- lr_scheduler_type: linear
+- num_epochs: 15
+### Training results
+| Training Loss | Epoch | Step  | Validation Loss | Precision | Recall | F1     | Accuracy |
+|:-------------:|:-----:|:-----:|:---------------:|:---------:|:------:|:------:|:--------:|
+| 0.3237        | 1.0   | 878   | 0.2541          | 0.7125    | 0.8059 | 0.7563 | 0.9283   |
+| 0.1663        | 2.0   | 1756  | 0.2370          | 0.7775    | 0.8090 | 0.7929 | 0.9394   |
+| 0.1251        | 3.0   | 2634  | 0.2289          | 0.7732    | 0.8029 | 0.7878 | 0.9385   |
+| 0.0984        | 4.0   | 3512  | 0.2818          | 0.7294    | 0.8189 | 0.7715 | 0.9294   |
+| 0.0808        | 5.0   | 4390  | 0.3138          | 0.7615    | 0.7900 | 0.7755 | 0.9326   |
+| 0.0578        | 6.0   | 5268  | 0.3072          | 0.7548    | 0.8222 | 0.7871 | 0.9370   |
+| 0.0481        | 7.0   | 6146  | 0.2778          | 0.7897    | 0.8156 | 0.8025 | 0.9408   |
+| 0.0414        | 8.0   | 7024  | 0.3336          | 0.7695    | 0.8201 | 0.7940 | 0.9389   |
+| 0.0268        | 9.0   | 7902  | 0.3294          | 0.7868    | 0.8140 | 0.8002 | 0.9409   |
+| 0.0204        | 10.0  | 8780  | 0.3693          | 0.7657    | 0.8239 | 0.7938 | 0.9376   |
+| 0.0160        | 11.0  | 9658  | 0.3816          | 0.7932    | 0.8242 | 0.8084 | 0.9425   |
+| 0.0108        | 12.0  | 10536 | 0.3607          | 0.7929    | 0.8256 | 0.8089 | 0.9431   |
+| 0.0078        | 13.0  | 11414 | 0.3980          | 0.7915    | 0.8240 | 0.8074 | 0.9423   |
+| 0.0062        | 14.0  | 12292 | 0.4096          | 0.7995    | 0.8247 | 0.8119 | 0.9436   |
+| 0.0035        | 15.0  | 13170 | 0.4177          | 0.8006    | 0.8251 | 0.8127 | 0.9438   |
+### Framework versions
+- Transformers 4.15.0
+- Pytorch 1.10.1+cu102
+- Datasets 1.17.0
+- Tokenizers 0.10.3

config.json CHANGED Viewed

@@ -1,51 +1,3 @@
-{
-  "_name_or_path": "./outputs/result_model",
-  "architectures": [
-    "RobertaModel"
-  ],
-  "attention_probs_dropout_prob": 0.1,
-  "bos_token_id": 0,
-  "classifier_dropout": null,
-  "eos_token_id": 2,
-  "finetuning_task": "ner",
-  "gradient_checkpointing": false,
-  "hidden_act": "gelu",
-  "hidden_dropout_prob": 0.1,
-  "hidden_size": 768,
-  "id2label": {
-    "0": "O",
-    "1": "B-PER",
-    "2": "I-PER",
-    "3": "B-ORG",
-    "4": "I-ORG",
-    "5": "B-LOC",
-    "6": "I-LOC",
-    "7": "B-MISC",
-    "8": "I-MISC"
-  },
-  "initializer_range": 0.02,
-  "intermediate_size": 3072,
-  "label2id": {
-    "B-LOC": 5,
-    "B-MISC": 7,
-    "B-ORG": 3,
-    "B-PER": 1,
-    "I-LOC": 6,
-    "I-MISC": 8,
-    "I-ORG": 4,
-    "I-PER": 2,
-    "O": 0
-  },
-  "layer_norm_eps": 1e-05,
-  "max_position_embeddings": 514,
-  "model_type": "roberta",
-  "num_attention_heads": 12,
-  "num_hidden_layers": 12,
-  "pad_token_id": 1,
-  "position_embedding_type": "absolute",
-  "torch_dtype": "float32",
-  "transformers_version": "4.15.0",
-  "type_vocab_size": 1,
-  "use_cache": true,
-  "vocab_size": 50264
-}

+version https://git-lfs.github.com/spec/v1
+oid sha256:d35a1a372e23da813f2d4e9c7fcb07eaeb5022857617fa9c12fc0dbad20f04f2
+size 1256

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ad0846a9f729976dfd8c7c54203b9e2c858096b33f99fc17fc4a0990e6e5d806
-size 498658097

 version https://git-lfs.github.com/spec/v1
+oid sha256:767ca4c288d62426b9712fb70b230db7e78b77ae850d0f325198f0b361f5c13b
+size 271

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c611b1f7d416eb001ee4f293d903ea8c88e703463f1d403f1866a0352743fd00
+size 772

tokenizer.json ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:abef51df8e357559d0f1eb3213621a11c2984d640f65dce953e4aba1debcb77f
+size 1508651

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:34441ea75c71dec47663c8193a54891302b53560d20c68d62fdcd884279e501d
+size 1145

train_results.json ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:812a7c0a5fe27b04ac426c29086051e2a6e41a7ba548299468e77004af9c71aa
+size 197

vocab.json ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5a9d4ff71e32998a10570dadce36179053a7086a1638b402e65ae85a320242f9
+size 874618