Upload 11 files

Files changed (11) hide show

0_Transformer/config.json ADDED Viewed

+{
+  "architectures": [
+    "BertModel"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "directionality": "bidi",
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "output_past": true,
+  "pad_token_id": 0,
+  "pooler_fc_size": 768,
+  "pooler_num_attention_heads": 12,
+  "pooler_num_fc_layers": 3,
+  "pooler_size_per_head": 128,
+  "pooler_type": "first_token_transform",
+  "type_vocab_size": 2,
+  "vocab_size": 29794
+}

0_Transformer/pytorch_model.bin ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:0e96a670906ee64f42b0f60170251b9a3927c767527a51fa522640eb9496ba2c
+size 435771886

0_Transformer/sentence_bert_config.json ADDED Viewed

+{
+  "max_seq_length": 128
+}

0_Transformer/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1 @@


1	+ {"unk_token": "[UNK]", "sep_token": "[SEP]", "pad_token": "[PAD]", "cls_token": "[CLS]", "mask_token": "[MASK]"}

0_Transformer/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1 @@


1	+ {"special_tokens_map_file": null, "full_tokenizer_file": null}

0_Transformer/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

1_Pooling/config.json ADDED Viewed

+{
+  "word_embedding_dimension": 768,
+  "pooling_mode_cls_token": false,
+  "pooling_mode_mean_tokens": true,
+  "pooling_mode_max_tokens": false,
+  "pooling_mode_mean_sqrt_len_tokens": false
+}

config.json ADDED Viewed

+{
+  "__version__": "0.3.5.1"
+}

modules.json ADDED Viewed

+[
+  {
+    "idx": 0,
+    "name": "0",
+    "path": "0_Transformer",
+    "type": "sentence_transformers.models.Transformer"
+  },
+  {
+    "idx": 1,
+    "name": "1",
+    "path": "1_Pooling",
+    "type": "sentence_transformers.models.Pooling"
+  }
+]

similarity_evaluation_sts-dev_results.csv ADDED Viewed

+epoch,steps,cosine_pearson,cosine_spearman,euclidean_pearson,euclidean_spearman,manhattan_pearson,manhattan_spearman,dot_pearson,dot_spearman
+0,-1,0.8810313733021867,0.8765896223439993,0.8135243773981371,0.8113353724031187,0.8126467226589057,0.8097498613646772,0.7010983914810677,0.7105895269487511
+1,-1,0.894487538190678,0.8923645187262643,0.8322341727041636,0.8326890056594196,0.8309415317021186,0.8306906378427429,0.7367307981824308,0.7465082254406685
+2,-1,0.8987050017046159,0.8964115235151033,0.8370117962663568,0.8363835766923299,0.8361181815502218,0.8347883361768138,0.7530603478015696,0.7606953221158317
+3,-1,0.900684841476426,0.8985778995238289,0.8367507007687051,0.8352543394300794,0.8358523363238494,0.8336725972520378,0.7522138387815421,0.7609377870816812

similarity_evaluation_sts-test_results.csv ADDED Viewed


1	+ epoch,steps,cosine_pearson,cosine_spearman,euclidean_pearson,euclidean_spearman,manhattan_pearson,manhattan_spearman,dot_pearson,dot_spearman
2	+ -1,-1,0.8877026168264394,0.8743395104288838,0.8410158131915916,0.823468358864715,0.8403935866721796,0.8226021217264627,0.7406676806236411,0.731883081220538