Upload 13 files

Browse files

Files changed (6) hide show

README.md +57 -57
config.json +1 -1
config_sentence_transformers.json +1 -1
config_setfit.json +2 -2
model.safetensors +1 -1
model_head.pkl +1 -1

README.md CHANGED Viewed

@@ -9,12 +9,12 @@ base_model: intfloat/multilingual-e5-small
 metrics:
 - accuracy
 widget:
-- text: 'query: Sí, la próxima vez que vayas, cuenta conmigo. He querido salir y hacer
-    más actividades en la naturaleza.'
-- text: 'query: I''m man, I''m leaving now.'
-- text: 'query: Ja, forse possiamo fare un giro in bicicletta insieme.'
-- text: 'query: Mak saya suruh balik, jumpa lagi.'
-- text: 'query: İnanılmaz, bu harika! Bir ayı gördüğüne inanamıyorum!'
 pipeline_tag: text-classification
 inference: true
 ---
@@ -47,10 +47,10 @@ The model has been trained using an efficient few-shot learning technique that i
 - **Blogpost:** [SetFit: Efficient Few-Shot Learning Without Prompts](https://huggingface.co/blog/setfit)
 ### Model Labels
-| Label | Examples                                                                                                                                                                                                               |
-|:------|:-----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|
-| 1     | <ul><li>'query: Tja, måste dra nu, ses senare.'</li><li>'query: Ispričavam se, moram sada otići.'</li><li>'query: Przepraszam, muszę już iść.'</li></ul>                                                               |
-| 0     | <ul><li>'query: Sveiki, kā jums klājas?'</li><li>'query: அதிர்ச்சிகரமானது, அது மிகவும் அருமையாக இருக்கிறது! நீ கரடியை பார்த்தது எனக்கு நம்பிக்கையே வரவில்லை!'</li><li>'query: Ég hef það fínt, takk. Og þú?'</li></ul> |
 ## Uses
@@ -70,7 +70,7 @@ from setfit import SetFitModel
 # Download from the 🤗 Hub
 model = SetFitModel.from_pretrained("setfit_model_id")
 # Run inference
-preds = model("query: I'm man, I'm leaving now.")
 ```
 <!--
@@ -102,17 +102,17 @@ preds = model("query: I'm man, I'm leaving now.")
 ### Training Set Metrics
 | Training set | Min | Median | Max |
 |:-------------|:----|:-------|:----|
-| Word count   | 2   | 7.6965 | 31  |
 | Label | Training Sample Count |
 |:------|:----------------------|
-| 0     | 902                   |
-| 1     | 910                   |
 ### Training Hyperparameters
 - batch_size: (16, 2)
 - num_epochs: (1, 16)
-- max_steps: -1
 - sampling_strategy: undersampling
 - body_learning_rate: (1e-05, 1e-05)
 - head_learning_rate: 0.001
@@ -130,53 +130,53 @@ preds = model("query: I'm man, I'm leaving now.")
 ### Training Results
 | Epoch  | Step | Training Loss | Validation Loss |
 |:------:|:----:|:-------------:|:---------------:|
-| 0.0000 | 1    | 0.3613        | -               |
-| 0.0005 | 50   | 0.3577        | -               |
-| 0.0010 | 100  | 0.3511        | 0.3413          |
-| 0.0015 | 150  | 0.3372        | -               |
-| 0.0019 | 200  | 0.3447        | 0.3347          |
-| 0.0024 | 250  | 0.3349        | -               |
-| 0.0029 | 300  | 0.3326        | 0.3224          |
-| 0.0034 | 350  | 0.3372        | -               |
-| 0.0039 | 400  | 0.3185        | 0.3039          |
-| 0.0044 | 450  | 0.2828        | -               |
-| 0.0049 | 500  | 0.3055        | 0.2774          |
-| 0.0054 | 550  | 0.2594        | -               |
-| 0.0058 | 600  | 0.2779        | 0.2489          |
-| 0.0063 | 650  | 0.2486        | -               |
-| 0.0068 | 700  | 0.2321        | 0.22            |
-| 0.0073 | 750  | 0.1838        | -               |
-| 0.0078 | 800  | 0.1845        | 0.2075          |
-| 0.0083 | 850  | 0.1899        | -               |
-| 0.0088 | 900  | 0.2147        | 0.2025          |
-| 0.0093 | 950  | 0.1644        | -               |
-| 0.0097 | 1000 | 0.2019        | 0.1821          |
-| 0.0102 | 1050 | 0.2309        | -               |
-| 0.0107 | 1100 | 0.2084        | 0.1784          |
-| 0.0112 | 1150 | 0.1508        | -               |
-| 0.0117 | 1200 | 0.1064        | 0.1453          |
-| 0.0122 | 1250 | 0.1376        | -               |
-| 0.0127 | 1300 | 0.0828        | 0.121           |
-| 0.0132 | 1350 | 0.1628        | -               |
-| 0.0136 | 1400 | 0.1308        | 0.1018          |
-| 0.0141 | 1450 | 0.0566        | -               |
-| 0.0146 | 1500 | 0.0953        | 0.0767          |
-| 0.0151 | 1550 | 0.1607        | -               |
-| 0.0156 | 1600 | 0.1322        | 0.0625          |
-| 0.0161 | 1650 | 0.0861        | -               |
-| 0.0166 | 1700 | 0.0926        | 0.0423          |
-| 0.0171 | 1750 | 0.0338        | -               |
-| 0.0175 | 1800 | 0.1029        | 0.0344          |
-| 0.0180 | 1850 | 0.0442        | -               |
-| 0.0185 | 1900 | 0.019         | 0.0256          |
-| 0.0190 | 1950 | 0.0489        | -               |
-| 0.0195 | 2000 | 0.0675        | 0.0187          |
 ### Framework Versions
 - Python: 3.10.11
 - SetFit: 1.0.3
 - Sentence Transformers: 2.7.0
-- Transformers: 4.39.0
 - PyTorch: 2.4.0
 - Datasets: 2.20.0
 - Tokenizers: 0.15.2

 metrics:
 - accuracy
 widget:
+- text: 'query: Interessant. Hast du das schon mal ausprobiert?'
+- text: 'query: はい、持っていますよ。すぐにメールで送りますね。'
+- text: 'query: Va bene ci sentiamo dopo Marco buona giornata'
+- text: 'query: Ζητώ συγγνώμη, πρέπει να αποχωρήσω τώρα.'
+- text: 'query: Guten Morgen, Maria! Hast du die Präsentation für das Meeting heute
+    fertig?'
 pipeline_tag: text-classification
 inference: true
 ---
 - **Blogpost:** [SetFit: Efficient Few-Shot Learning Without Prompts](https://huggingface.co/blog/setfit)
 ### Model Labels
+| Label | Examples                                                                                                                                                                                            |
+|:------|:----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|
+| 0     | <ul><li>'query: สวัสดีค่ะ วันนี้เป็นอย่างไรบ้าง?'</li><li>'query: Jag förstår. Vad tycker du att vi ska göra nu?'</li><li>'query: Hej, wszystko w porządku. Właśnie dostałam nową pracę.'</li></ul> |
+| 1     | <ul><li>'query: Чудесно, доскоро!'</li><li>'query: Mama mă cheamă, trebuie să mă întorc acasă, pa.'</li><li>'query: Perdó, ja he de marxar.'</li></ul>                                              |
 ## Uses
 # Download from the 🤗 Hub
 model = SetFitModel.from_pretrained("setfit_model_id")
 # Run inference
+preds = model("query: はい、持っていますよ。すぐにメールで送りますね。")
 ```
 <!--
 ### Training Set Metrics
 | Training set | Min | Median | Max |
 |:-------------|:----|:-------|:----|
+| Word count   | 2   | 7.3663 | 21  |
 | Label | Training Sample Count |
 |:------|:----------------------|
+| 0     | 286                   |
+| 1     | 290                   |
 ### Training Hyperparameters
 - batch_size: (16, 2)
 - num_epochs: (1, 16)
+- max_steps: 2000
 - sampling_strategy: undersampling
 - body_learning_rate: (1e-05, 1e-05)
 - head_learning_rate: 0.001
 ### Training Results
 | Epoch  | Step | Training Loss | Validation Loss |
 |:------:|:----:|:-------------:|:---------------:|
+| 0.0002 | 1    | 0.3683        | -               |
+| 0.0125 | 50   | 0.3256        | -               |
+| 0.0250 | 100  | 0.211         | 0.1998          |
+| 0.0375 | 150  | 0.1668        | -               |
+| 0.0500 | 200  | 0.0788        | 0.0571          |
+| 0.0625 | 250  | 0.0644        | -               |
+| 0.0750 | 300  | 0.0232        | 0.0286          |
+| 0.0875 | 350  | 0.0024        | -               |
+| 0.1000 | 400  | 0.0014        | 0.0945          |
+| 0.1125 | 450  | 0.0007        | -               |
+| 0.1250 | 500  | 0.0008        | 0.1036          |
+| 0.1375 | 550  | 0.0005        | -               |
+| 0.1500 | 600  | 0.0005        | 0.098           |
+| 0.1625 | 650  | 0.0003        | -               |
+| 0.1750 | 700  | 0.0005        | 0.1056          |
+| 0.1875 | 750  | 0.0004        | -               |
+| 0.2000 | 800  | 0.0006        | 0.1044          |
+| 0.2124 | 850  | 0.0005        | -               |
+| 0.2249 | 900  | 0.0004        | 0.1072          |
+| 0.2374 | 950  | 0.0003        | -               |
+| 0.2499 | 1000 | 0.0001        | 0.0993          |
+| 0.2624 | 1050 | 0.0003        | -               |
+| 0.2749 | 1100 | 0.0003        | 0.1114          |
+| 0.2874 | 1150 | 0.0002        | -               |
+| 0.2999 | 1200 | 0.0002        | 0.1078          |
+| 0.3124 | 1250 | 0.0001        | -               |
+| 0.3249 | 1300 | 0.0002        | 0.0908          |
+| 0.3374 | 1350 | 0.0002        | -               |
+| 0.3499 | 1400 | 0.0002        | 0.1019          |
+| 0.3624 | 1450 | 0.0001        | -               |
+| 0.3749 | 1500 | 0.0002        | 0.11            |
+| 0.3874 | 1550 | 0.0002        | -               |
+| 0.3999 | 1600 | 0.0001        | 0.1031          |
+| 0.4124 | 1650 | 0.0001        | -               |
+| 0.4249 | 1700 | 0.0001        | 0.0996          |
+| 0.4374 | 1750 | 0.0002        | -               |
+| 0.4499 | 1800 | 0.0001        | 0.0903          |
+| 0.4624 | 1850 | 0.0002        | -               |
+| 0.4749 | 1900 | 0.0001        | 0.0901          |
+| 0.4874 | 1950 | 0.0002        | -               |
+| 0.4999 | 2000 | 0.0001        | 0.0854          |
 ### Framework Versions
 - Python: 3.10.11
 - SetFit: 1.0.3
 - Sentence Transformers: 2.7.0
+- Transformers: 4.39.3
 - PyTorch: 2.4.0
 - Datasets: 2.20.0
 - Tokenizers: 0.15.2

config.json CHANGED Viewed

@@ -19,7 +19,7 @@
   "position_embedding_type": "absolute",
   "tokenizer_class": "XLMRobertaTokenizer",
   "torch_dtype": "float32",
-  "transformers_version": "4.39.0",
   "type_vocab_size": 2,
   "use_cache": true,
   "vocab_size": 250037

   "position_embedding_type": "absolute",
   "tokenizer_class": "XLMRobertaTokenizer",
   "torch_dtype": "float32",
+  "transformers_version": "4.39.3",
   "type_vocab_size": 2,
   "use_cache": true,
   "vocab_size": 250037

config_sentence_transformers.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "__version__": {
     "sentence_transformers": "2.7.0",
-    "transformers": "4.39.0",
     "pytorch": "2.4.0"
   },
   "prompts": {},

 {
   "__version__": {
     "sentence_transformers": "2.7.0",
+    "transformers": "4.39.3",
     "pytorch": "2.4.0"
   },
   "prompts": {},

config_setfit.json CHANGED Viewed

@@ -1,4 +1,4 @@
 {
-  "labels": null,
-  "normalize_embeddings": false
 }

 {
+  "normalize_embeddings": false,
+  "labels": null
 }

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:61169cbb78c41b4aebadcaac92b29f7dd363dea2e868cf27f169ce0771888e6c
 size 470637416

 version https://git-lfs.github.com/spec/v1
+oid sha256:ecfce4dd8b2e3179e859bc278ca2390319e04a66f3179fbbeb1bf7b598a86307
 size 470637416

model_head.pkl CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:df178af3c19cf3bd160758f24dfedbf2133263527e90b572f5ff9c7107f6a5de
 size 4608

 version https://git-lfs.github.com/spec/v1
+oid sha256:492fb3b7da876887807a7f0eb94fda6a77e65bbb7f72311fb8caaf601a46407c
 size 4608