dvssr committed on
Commit
7125685
1 Parent(s): 91eb0bb

Model save

Browse files
README.md CHANGED
@@ -3,8 +3,6 @@ license: apache-2.0
3
  base_model: mse30/bart-base-finetuned-pubmed
4
  tags:
5
  - generated_from_trainer
6
- metrics:
7
- - accuracy
8
  model-index:
9
  - name: unipelt
10
  results: []
@@ -16,9 +14,6 @@ should probably proofread and complete it, then remove this comment. -->
16
  # unipelt
17
 
18
  This model is a fine-tuned version of [mse30/bart-base-finetuned-pubmed](https://huggingface.co/mse30/bart-base-finetuned-pubmed) on an unknown dataset.
19
- It achieves the following results on the evaluation set:
20
- - Loss: 9.5453
21
- - Accuracy: 0.0169
22
 
23
  ## Model description
24
 
 
3
  base_model: mse30/bart-base-finetuned-pubmed
4
  tags:
5
  - generated_from_trainer
 
 
6
  model-index:
7
  - name: unipelt
8
  results: []
 
14
  # unipelt
15
 
16
  This model is a fine-tuned version of [mse30/bart-base-finetuned-pubmed](https://huggingface.co/mse30/bart-base-finetuned-pubmed) on an unknown dataset.
 
 
 
17
 
18
  ## Model description
19
 
config.json CHANGED
@@ -4,6 +4,9 @@
4
  "activation_function": "gelu",
5
  "adapters": {
6
  "adapters": {
 
 
 
7
  "unipelt": "0815dd75d5ff5808"
8
  },
9
  "config_map": {
@@ -73,10 +76,44 @@
73
  "use_gating": true
74
  }
75
  ]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
76
  }
77
  },
78
  "fusion_config_map": {},
79
- "fusions": {}
 
 
80
  },
81
  "add_bias_logits": false,
82
  "add_final_layer_norm": false,
 
4
  "activation_function": "gelu",
5
  "adapters": {
6
  "adapters": {
7
+ "adapter1": "847a59cd9f1cbf0e",
8
+ "adapter2": "847a59cd9f1cbf0e",
9
+ "adapter3": "847a59cd9f1cbf0e",
10
  "unipelt": "0815dd75d5ff5808"
11
  },
12
  "config_map": {
 
76
  "use_gating": true
77
  }
78
  ]
79
+ },
80
+ "847a59cd9f1cbf0e": {
81
+ "adapter_residual_before_ln": false,
82
+ "cross_adapter": false,
83
+ "factorized_phm_W": true,
84
+ "factorized_phm_rule": false,
85
+ "hypercomplex_nonlinearity": "glorot-uniform",
86
+ "init_weights": "bert",
87
+ "inv_adapter": null,
88
+ "inv_adapter_reduction_factor": null,
89
+ "is_parallel": false,
90
+ "learn_phm": true,
91
+ "leave_out": [],
92
+ "ln_after": false,
93
+ "ln_before": false,
94
+ "mh_adapter": false,
95
+ "non_linearity": "relu",
96
+ "original_ln_after": true,
97
+ "original_ln_before": true,
98
+ "output_adapter": true,
99
+ "phm_bias": true,
100
+ "phm_c_init": "normal",
101
+ "phm_dim": 4,
102
+ "phm_init_range": 0.0001,
103
+ "phm_layer": false,
104
+ "phm_rank": 1,
105
+ "reduction_factor": 16,
106
+ "residual_before_ln": true,
107
+ "scaling": 1.0,
108
+ "shared_W_phm": false,
109
+ "shared_phm_rule": true,
110
+ "use_gating": true
111
  }
112
  },
113
  "fusion_config_map": {},
114
+ "fusions": {
115
+ "adapter1,adapter2,adapter3": "dynamic"
116
+ }
117
  },
118
  "add_bias_logits": false,
119
  "add_final_layer_norm": false,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9929a3f9944a7877ee27cbf23be5300c743831eb9da6bf3f76f766d986216192
3
- size 625051084
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:428d82d0e717392b4332faa292284179e62945c99343ff104a1ce0c537c2a56c
3
+ size 720945604
runs/Mar16_04-20-55_13e96b604141/events.out.tfevents.1710562860.13e96b604141.387.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2432e785623752a934c7c7e7b7452d29b85f2e3ef1f001ea59164064b3c0f35f
3
+ size 5807
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:323920350a32a56049c4982458db48b80028ef6c3e17431e268a26cdb321f260
3
  size 4792
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5db3bd67f7ccb239064a38709e5c31c5d4433e4bc69c75ed56d21a45c9ec1cd7
3
  size 4792