VenkatManda committed on
Commit
0283e0f
1 Parent(s): 040f232

End of training

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ eval_nbest_predictions.json filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,50 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: mit
3
+ base_model: prajjwal1/bert-tiny
4
+ tags:
5
+ - generated_from_trainer
6
+ datasets:
7
+ - squad_v2
8
+ model-index:
9
+ - name: V1
10
+ results: []
11
+ ---
12
+
13
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
14
+ should probably proofread and complete it, then remove this comment. -->
15
+
16
+ # V1
17
+
18
+ This model is a fine-tuned version of [prajjwal1/bert-tiny](https://huggingface.co/prajjwal1/bert-tiny) on the squad_v2 dataset.
19
+
20
+ ## Model description
21
+
22
+ More information needed
23
+
24
+ ## Intended uses & limitations
25
+
26
+ More information needed
27
+
28
+ ## Training and evaluation data
29
+
30
+ More information needed
31
+
32
+ ## Training procedure
33
+
34
+ ### Training hyperparameters
35
+
36
+ The following hyperparameters were used during training:
37
+ - learning_rate: 5e-05
38
+ - train_batch_size: 96
39
+ - eval_batch_size: 12
40
+ - seed: 42
41
+ - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
42
+ - lr_scheduler_type: linear
43
+ - num_epochs: 3.0
44
+
45
+ ### Framework versions
46
+
47
+ - Transformers 4.37.0.dev0
48
+ - Pytorch 2.1.0+cu121
49
+ - Datasets 2.16.1
50
+ - Tokenizers 0.15.0
all_results.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "eval_HasAns_exact": 0.0,
3
+ "eval_HasAns_f1": 4.14210369723646,
4
+ "eval_HasAns_total": 5928,
5
+ "eval_NoAns_exact": 19.83179142136249,
6
+ "eval_NoAns_f1": 19.83179142136249,
7
+ "eval_NoAns_total": 5945,
8
+ "eval_best_exact": 50.07159100480081,
9
+ "eval_best_exact_thresh": 0.0,
10
+ "eval_best_f1": 50.081405424967926,
11
+ "eval_best_f1_thresh": 0.0,
12
+ "eval_exact": 9.9300934894298,
13
+ "eval_f1": 11.998179964391293,
14
+ "eval_runtime": 247.8052,
15
+ "eval_samples": 12134,
16
+ "eval_samples_per_second": 48.966,
17
+ "eval_steps_per_second": 4.084,
18
+ "eval_total": 11873
19
+ }
config.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
- "_name_or_path": "VenkatManda/V1",
3
  "architectures": [
4
  "BertForQuestionAnswering"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
  "classifier_dropout": null,
8
  "hidden_act": "gelu",
9
- "hidden_dropout_prob": 0.3,
10
  "hidden_size": 128,
11
  "initializer_range": 0.02,
12
  "intermediate_size": 512,
@@ -18,7 +18,7 @@
18
  "pad_token_id": 0,
19
  "position_embedding_type": "absolute",
20
  "torch_dtype": "float32",
21
- "transformers_version": "4.36.2",
22
  "type_vocab_size": 2,
23
  "use_cache": true,
24
  "vocab_size": 30522
 
1
  {
2
+ "_name_or_path": "prajjwal1/bert-tiny",
3
  "architectures": [
4
  "BertForQuestionAnswering"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
  "classifier_dropout": null,
8
  "hidden_act": "gelu",
9
+ "hidden_dropout_prob": 0.1,
10
  "hidden_size": 128,
11
  "initializer_range": 0.02,
12
  "intermediate_size": 512,
 
18
  "pad_token_id": 0,
19
  "position_embedding_type": "absolute",
20
  "torch_dtype": "float32",
21
+ "transformers_version": "4.37.0.dev0",
22
  "type_vocab_size": 2,
23
  "use_cache": true,
24
  "vocab_size": 30522
eval_nbest_predictions.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a986d1ec9e11c91463d2b63f2ea2ff33d6ec81fd6201faa4707ec5ce2168c8be
3
+ size 21812970
eval_null_odds.json ADDED
The diff for this file is too large to render. See raw diff
 
eval_predictions.json ADDED
The diff for this file is too large to render. See raw diff
 
eval_results.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "eval_HasAns_exact": 0.0,
3
+ "eval_HasAns_f1": 4.14210369723646,
4
+ "eval_HasAns_total": 5928,
5
+ "eval_NoAns_exact": 19.83179142136249,
6
+ "eval_NoAns_f1": 19.83179142136249,
7
+ "eval_NoAns_total": 5945,
8
+ "eval_best_exact": 50.07159100480081,
9
+ "eval_best_exact_thresh": 0.0,
10
+ "eval_best_f1": 50.081405424967926,
11
+ "eval_best_f1_thresh": 0.0,
12
+ "eval_exact": 9.9300934894298,
13
+ "eval_f1": 11.998179964391293,
14
+ "eval_runtime": 247.8052,
15
+ "eval_samples": 12134,
16
+ "eval_samples_per_second": 48.966,
17
+ "eval_steps_per_second": 4.084,
18
+ "eval_total": 11873
19
+ }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d52262c0b41bda521bbea4f8620ecf690586333a9955d6a4fa0f9389de9237d1
3
  size 17483080
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:532d2ec490653061f5bdf3eb184e58d2be566b8e96c010b6d76a3eb75bd7263f
3
  size 17483080
special_tokens_map.json CHANGED
@@ -1,37 +1,7 @@
1
  {
2
- "cls_token": {
3
- "content": "[CLS]",
4
- "lstrip": false,
5
- "normalized": false,
6
- "rstrip": false,
7
- "single_word": false
8
- },
9
- "mask_token": {
10
- "content": "[MASK]",
11
- "lstrip": false,
12
- "normalized": false,
13
- "rstrip": false,
14
- "single_word": false
15
- },
16
- "pad_token": {
17
- "content": "[PAD]",
18
- "lstrip": false,
19
- "normalized": false,
20
- "rstrip": false,
21
- "single_word": false
22
- },
23
- "sep_token": {
24
- "content": "[SEP]",
25
- "lstrip": false,
26
- "normalized": false,
27
- "rstrip": false,
28
- "single_word": false
29
- },
30
- "unk_token": {
31
- "content": "[UNK]",
32
- "lstrip": false,
33
- "normalized": false,
34
- "rstrip": false,
35
- "single_word": false
36
- }
37
  }
 
1
  {
2
+ "cls_token": "[CLS]",
3
+ "mask_token": "[MASK]",
4
+ "pad_token": "[PAD]",
5
+ "sep_token": "[SEP]",
6
+ "unk_token": "[UNK]"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7
  }
tokenizer.json CHANGED
@@ -1,7 +1,21 @@
1
  {
2
  "version": "1.0",
3
- "truncation": null,
4
- "padding": null,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5
  "added_tokens": [
6
  {
7
  "id": 0,
 
1
  {
2
  "version": "1.0",
3
+ "truncation": {
4
+ "direction": "Right",
5
+ "max_length": 384,
6
+ "strategy": "OnlySecond",
7
+ "stride": 128
8
+ },
9
+ "padding": {
10
+ "strategy": {
11
+ "Fixed": 384
12
+ },
13
+ "direction": "Right",
14
+ "pad_to_multiple_of": null,
15
+ "pad_id": 0,
16
+ "pad_type_id": 0,
17
+ "pad_token": "[PAD]"
18
+ },
19
  "added_tokens": [
20
  {
21
  "id": 0,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:437e0695fb8e79ab7fc2dc357b1a230b757ffb22d3a04433e16268de0466951d
3
- size 4728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5cdace9ec738f1bfc2f5d803c733ebd0a623e89b53e4c48b568d22841517a874
3
+ size 4664