Push model using huggingface_hub.
Browse files
- 1_Pooling/config.json +7 -0
- README.md +372 -0
- config.json +31 -0
- config_sentence_transformers.json +7 -0
- config_setfit.json +4 -0
- model.safetensors +3 -0
- model_head.pkl +3 -0
- modules.json +20 -0
- sentence_bert_config.json +4 -0
- special_tokens_map.json +7 -0
- tokenizer.json +0 -0
- tokenizer_config.json +57 -0
- vocab.txt +0 -0
1_Pooling/config.json
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"word_embedding_dimension": 384,
|
3 |
+
"pooling_mode_cls_token": true,
|
4 |
+
"pooling_mode_mean_tokens": false,
|
5 |
+
"pooling_mode_max_tokens": false,
|
6 |
+
"pooling_mode_mean_sqrt_len_tokens": false
|
7 |
+
}
|
README.md
ADDED
@@ -0,0 +1,372 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
library_name: setfit
|
3 |
+
tags:
|
4 |
+
- setfit
|
5 |
+
- sentence-transformers
|
6 |
+
- text-classification
|
7 |
+
- generated_from_setfit_trainer
|
8 |
+
metrics:
|
9 |
+
- accuracy
|
10 |
+
widget:
|
11 |
+
- text: "Tax Invoice\nOriginal for Buyer/ Duplicate for Transporter/ Triplicate for\
|
12 |
+
\ Assessee\n\nSupplier Legal_Name: Mahaneadi Coalfields 4rea Code +MOO1\nLimited\
|
13 |
+
\ Area Description Jagannath\nSupplier Addresa . Jagriti Vihar, Buria Inv3ice\
|
14 |
+
\ Number -9100065259\nSambalpur 768020 Invoice Date :Dec 3, 2022\nSupplier City\
|
15 |
+
\ - Sambalpur Con=zact Reference: 3030007756\nSupplier State - Odisha Conzzact\
|
16 |
+
\ type ;Spot Auction\nSupplier Pincode : 768020 Salas Order 11240002677\nP.O -\
|
17 |
+
\ Jagriti Vihar, Burla Supplier GSTIN 2134ABCM5188P1Z3 Sale Order Date :Nov 10,\
|
18 |
+
\ 2022\n\nDistrict : Sambalpur - Supplier Email 7 Vode of Dispatch ;ROAD\n768020\
|
19 |
+
\ Odasha\n\n+91-663-2542461\n\n+91-663-2542770\nWWH .MAHANADICOAL. IN ae4a8clfeb29d373\
|
20 |
+
\ 2dedeaa25bd3 903 7eec4d£013a425b74bd5801750c2ab132\n\nReceiver (Billed To) Consignee\
|
21 |
+
\ (Shipped to) Details of Dispatch\nName »HINDALCO INDUSTRIES LIMITED Name :\n\
|
22 |
+
Party Code 2000000395 Party Code 12000000395 Grade ‘G12\nAddress _ HIRAKUD SAMBALPUR\
|
23 |
+
\ SAMBALPUR Addresa _Within Odisha acv + 3701-4000\n768016 Sire :-100 MM\n\nCity\
|
24 |
+
\ * SAMBALPUR City\nPincode - 768016 Pincode Dispatch date Dec 3, 2022\n\nState\
|
25 |
+
\ code Gdasha State code < Plant S046\nPhone number. 06632481365 Phone number\n\
|
26 |
+
GSTIN 21AAACH1201R122 GSTIN\n\nE-Mail ID aaurav panigrahi@adityabirla com E-Mail\
|
27 |
+
\ ID\n\nCompany Name\n\na\n\nPARTICULARS\n\nPricing Description i ih | Rate Per\
|
28 |
+
\ UOM (INR Amount (INR)\n\nSizing Charges Fi\nas\n\n \n\nDMF( 30% of Royalty}\
|
29 |
+
\ 18545.29\n\nCGST( 2 5% ) 122.29\n\n[es\n\nTotal Amount: $17597.31\n\nRemarks/Note/\
|
30 |
+
\ Declaration\n\nReverse Charge Applicable; No\n\nTotal Bill Value In words SIX\
|
31 |
+
\ LAKH SEVENTEEN THOUSAND PIVE HUNDRED NINETY SEV&N RUPEES THIRTY ONE PAISE\n\n\
|
32 |
+
Certified that the particulars givan above are true and correct and the amount\
|
33 |
+
\ indicated reprasents the price actually charged and that\n\nthera is no flow\
|
34 |
+
\ of additional consideration directly or indirectly from the buyer.\n\nArea :\
|
35 |
+
\ Jagannath\n— Rete ” Telephone . 6760269528\nLe Amount ° Fax Number : 6760269527\n\
|
36 |
+
\nAdviaing Bank Name _NA E-Mail Address . so-sales-jaga.mcl@coalindia, in\n\n\
|
37 |
+
This is digitally verified document hence manual/ physical signature 1s not required\n\
|
38 |
+
\nAuthorized Signatory\n\n \n\f"
|
39 |
+
- text: "Hirakud Administration\n\nFrom: Hirakud Administration\n\nSent: 18 December\
|
40 |
+
\ 2021 12:41 PM\n\nTo: sheela tower\n\nCe: Dusyant Dushkar; Sumit Kumar; Nagesh\
|
41 |
+
\ Pal; SANDEEP TIWARI; Raj Singh; Binay Dash\nSubject: RE: Room booking in hotel\n\
|
42 |
+
\nDear Sir,\n\nAs per trailing mail, kindly book 02 more rooms for our guest.\
|
43 |
+
\ Details as under:-\n\n1. Ms Alka Chaubey\n2. Mr Devguru Dash\n\nNote — Host\
|
44 |
+
\ will be Mr. Dusyant Dushkar. Check in date is 19.12.2021. Kindly correct the\
|
45 |
+
\ name of the guest\nin my previous mail, sl no 3 Mr.Subham Goel\n\nRegards\n\
|
46 |
+
~ Sandeep Kumar Ranbadia\n\nFrom: sheela tower [mailto:sheelatowers@gmail.com]\n\
|
47 |
+
Sent: 18 December 2021 12:22 PM\n\nTo: Hirakud Administration <hind-hkd.admin@adityabirla.com>\n\
|
48 |
+
\nCe: Dusyant Dushkar <dusyant.dushkar@adityabirla.com>; Sumit Kumar <sumit.skumar@adityabirla.com>;\
|
49 |
+
\ Nagesh Pal\n<nagesh.pal@adityabirla.com>; SANDEEP TIWARI <sandeep.tiwari@adityabirla.com>;\
|
50 |
+
\ Raj Singh\n\n<raj.kumarsingh @adityabirla.com>; Binay Dash <binaya.dash@adityabirla.com>\n\
|
51 |
+
\nSubject: Re: Room booking in hotel\n\n \n \n\nCAUTION: This email originated\
|
52 |
+
\ from outside of the organization. Do not click links or open attachments unless\
|
53 |
+
\ you recognize the\n‘sender and know the content is:safe.\n\nDear sir\nGreeting\
|
54 |
+
\ from sheelatowers!!!\n\nWe are confirm 04 business plus room for your guest.\n\
|
55 |
+
\nSra\n\nmcteCKotenat\n\na\n\na a\n\n \n\nRegards\nRanjt kumar sahoo\n9778403111\n\
|
56 |
+
\f"
|
57 |
+
- text: "Tax Invoice\nOriginal for Buyer/ Duplicate for Transporter/ Triplicate for\
|
58 |
+
\ Assessee\n\nan ¢\n6 , Mc Supplier Legal Nama, Mahanadi Coalfields Are2 Code\
|
59 |
+
\ .MOO1\n» ta . — i\n\nLimited area Description ;Jagannath 3% Lane a Metareriz\
|
60 |
+
\ ete!\nSupplier Address Jagriti Vihar, Bur-a |Invoice Number =. 9100067434 area\
|
61 |
+
\ isd Sooner at\nSambalpur 768020 Invoice Date :Dec 19, 2022 UA aarp LBL\n; Supplier\
|
62 |
+
\ City : Sambalpur Contract Reference:3030007756 :\n. L Supplier State : Odisha\
|
63 |
+
\ Contract type iSpot Auction\n+ Supplier Pincode : 7@8020 Sales Order 11240002677\n\
|
64 |
+
P.O. - Jagriti Vahar, Burla [Supplier GSTIN . 21 QAABCMS188P123 Sals Order Date\
|
65 |
+
\ «Nov 10, 2022\n\nDistrict : Sambalpur - Supplier Email Nod? of Dispatch .ROAD\n\
|
66 |
+
768020 Odasha\n\n+91-663-2542461\n\n*91-663+2542770\nWWW. MAHANADICOAL. IN IRN\
|
67 |
+
\ No: 21829066 2bd3486eef9a903185 74daciafc0«13744361e£93477eBd16aa0bast\n\nReceiver\
|
68 |
+
\ (Billed To} Conaignee (Shipred <a) Details of Dispatch\nName : HINDALCO INDUSTRIES\
|
69 |
+
\ LIMITED Name :\nParty Code ,2000000355 Party Code 7 20000003355 Grade » G12\n\
|
70 |
+
Address . FTRAKUD = SAMBALFUR SAMBALPUR Address : Within Odis.a cv - 3701-4000\n\
|
71 |
+
768016 Size .-100 MM\n\nCity sSAMBALPUR city Dispatch date :Dec 19, 2022\nPincode\
|
72 |
+
\ . 768016 Pincode\n\nState code .Cdisha State code i Plant 15046\nPhone number:\
|
73 |
+
\ 06632481365 Phone number :\nGSTIN + 21AKRACH1201R122 GSTIN\n\nE-Mail ID : Saurav.\
|
74 |
+
\ panigrahi@adityabirla.com B-Mail ID\n\nCompany Name;\n\nPricing Desoription\
|
75 |
+
\ 7\n\nEvac Facility Charge 60.00 68384.40\nPoyalty Charges ( 14% of Basic Price)\
|
76 |
+
\ $84.12\n\nNMET Charges( 2% of Royalty)\n\neC\n\nGross Bill Value 5536.61 6309612.40\n\
|
77 |
+
\n6309612.40\nRemarks/Note/ Declaration Total Amount:\n\nReverse Charge Applicable\
|
78 |
+
\ No\n\nTotal Bill Value In words SIXTY THREE LAKH NINE THOUSAND SIX HUNDRED TWELVE\
|
79 |
+
\ RJPBES FORTY PAISE\n\nCertified that the particulars given above are true and\
|
80 |
+
\ correct and the amount indicated represents the price actually charged and that\n\
|
81 |
+
\nthere 18 no flow of additional consideration directly or indirectly Erom tke\
|
82 |
+
\ bayer.\n\nLC Ref.No NA\nLC Date\n\nLe Amount 90\nAdvising Bank Name - NA\n\n\
|
83 |
+
Area : Jagannath\nTelephone + 6760269528\nFax Number : ©760269527\nR-Mail Addresa\
|
84 |
+
\ : so-sales-jaga.mcl@coalindia. in\n\nThis is digitally verified document hence\
|
85 |
+
\ manual/ physical signature is not required\n\nAuthorized Signatory\n\n \n\n\
|
86 |
+
\ \n\f"
|
87 |
+
- text: "UNITED MEDICAL STORE Patient Name: KASTURI uENA\n‘EW MARKET, C/O PRAFULLA\
|
88 |
+
\ KUMAR JENA\nHIRAKUD. SAMBALPUR. Dr. Name :\n\nMedicine Advice Slip: MA/2223/0668\
|
89 |
+
\ “\nPhone :0663-2431670 Prescription Indent:M/2223/06299\n\nDL No. :SAWZ 486\
|
90 |
+
\ R/487 RC Invoice No. ; 0002785 Date : 21/11/2022\n\nSe|__Qiy. [Pack [Product\
|
91 |
+
\ “Batch [Exp] HSN [ MRP | Table | Dis [5051] CO3i] Amount |\n\n1. 30 TAB] 30'S\
|
92 |
+
\ TELMA H TAB 11/24 | 30049099; 484.00! 432.14 0.001 6.00\nNEOPRIDE TOTAL CAP\
|
93 |
+
\ 7/24 30049099) 445.00) 0,00; 6.00\n\n \n\n \n\n \n\nSUB TOTAL :\n\nSGST\ner\
|
94 |
+
\ rH 2 ROFF :\n— ha GRAND TOTAL\n\nTe & Con itions For UNITED MEDICAL STORE R\
|
95 |
+
\ a ah\nBILL GRAND TOTAL IS CALCULATED ACCORDING TO 1D- 3306 Im- 1220\nMRP PRICE\
|
96 |
+
\ ( INCLUDING ALL GST TAXES ) Q _ 06 (ped)\n\n \n\f"
|
97 |
+
- text: "Original for Buyer/\n\nSupplier\n\nSupplier\n\nSupplier\nSupplier\nSupplier\n\
|
98 |
+
Supplier\nSupplier\n\nP.O. - Jagriti Vihar, Burla\n\nDistrict : Sambalpur -\n\n\
|
99 |
+
Legal _Name:\n\nAddress\n\nCity\nState\nPincode\nGSTIN\nEmail\n\nTax Invoice\n\
|
100 |
+
Duplicate for Transporter/ Triplicate for Assessea\n\nMahanadi Coalfields\nLimited\n\
|
101 |
+
\nJagriti Vihar, Burla\nSambalpur 768020\n\n: Sambalpur\n\n: Odisha\n\n: 768020\n\
|
102 |
+
\n: 21AABCM5186P123\n\nArea Code\n\nArea Description\nInvaice Number\nInvoice\
|
103 |
+
\ Date\n\n:MOO1\nJagannath K Ss pasts\n9100067646 Le\n\nEee yy\n-Dec 21, 2022\
|
104 |
+
\ 4 PSIG Nae\nca ee\n\npar\n\nContract Raference 3030007756\n\nContract typa\n\
|
105 |
+
Sales Order\n\nSale Order Date\nYods of Dispatch\n\n:Spot Auction\n11240002677\n\
|
106 |
+
:Nov 10, 2022\n:ROAD\n\n768020 Odisha\n+91-663-2542461\n+91-663-2542770\nWWW.\
|
107 |
+
\ MAHANADICOAL.IN\nReceiver (Billed To)\n-HINDALCO INDUSTRIES LIMITED\n: 2000000395\n\
|
108 |
+
HIRAKUD\n768016\n: SAMBALPUR\nPincoda : 768016\nState code Odisha\nPhone number.\
|
109 |
+
\ 06632481365\nGSTIN . 21AAACH1201R12Z\n\nE-Mail Ip\n\nIRN No. b£1b63c27ecdbbbeOedf{d3b343825\
|
110 |
+
\ £06861 d200cd310b3e3344c6c0de297£635\n\nConsignee (Shipred -o)\n\nDetails of\
|
111 |
+
\ Dispatch\n\nName\nParty Code\n\nAddress\n\nName\nParty Code\n\nAddress\n\n'Gl2\n\
|
112 |
+
: 3701-4000\n-100 MM\n\n'Dec 21,\n\nGrade\n@cv\nSize\n\nDispatch date\n\n: 2000000395\n\
|
113 |
+
\nSAMBALPUR SAMBALPUR Within Odisha\n\nCity city\n\nPincede\n\nState code\nPhone\
|
114 |
+
\ number :\nGSTIN\n\n2022\n\nPlant : 5046\n\n- Saurav.panigrahi@adityabirla.com\
|
115 |
+
\ E-Mail ID\n\nCompany Name.\n\n8001237358 42e00c0000 Bituminous Coal 27011200\
|
116 |
+
\ 1128.42\n\nPricing Description TW ate Pee WONT a ay\n\nSizing Charges 87.00\
|
117 |
+
\ $8172.54\n\nSTC Charges\n\n60.00 67705,20\n\nEvac Facility Charge\n\n$54.12\
|
118 |
+
\ 625280.909\n\nRoyalty Charges ( 14% of Basic Price)\n\n \n\n11.08 12505.$0\n\
|
119 |
+
\nNMET Charges{ 2% of Royalty)\n\n166.24 187584 .03\n\nDLMF({ 30% of Royalty)\n\
|
120 |
+
137989.92\n\n \n\nCGST( 2.56}\n\n122.28 137989.92\n\nSGST( 2.5% }\n\n400.00 451368.00\n\
|
121 |
+
\nGST Comp Cess\n\nGross Bill Value\n\nNet Value\n\nRemarks/Note/ Declaration\n\
|
122 |
+
\nTotal Bill Value In words\n\nLC Ref No NA\nLc Date\n\nLe Amount 6\n\nAdvising\
|
123 |
+
\ Bank Name_: NA\n\n \n\nReverse Charge Applicable: No\n\nSIMTY TWO LAKH FORTY\
|
124 |
+
\ SIX THOUSAND NINE HUNDRED FOPTY FOUR RUPEES SEVENTY SIX PAISE\n\nCertified that\
|
125 |
+
\ the particulars givan above are true and correct and tha amount indicated represents\
|
126 |
+
\ the price\nthere is no flow of additional consideration directly or indirectly\
|
127 |
+
\ from the buyer.\n\nArea . Jagannath\nTelephone - 6760269528\nFax Number : 6760269527\n\
|
128 |
+
\nE-Mail Address\n\nThie is digitally verified document hence manual/ physical\
|
129 |
+
\ signature 16 not requ.red\n\n5536.01\n\n$536.01 6246944.76\n\nTotal Amount:\
|
130 |
+
\ 6246944.76\n\nactually charged and that\n\n: g0-sales-jaga.mel@coalindia.in\n\
|
131 |
+
\nAuthorized Signatory\n\n \n\f"
|
132 |
+
pipeline_tag: text-classification
|
133 |
+
inference: true
|
134 |
+
base_model: BAAI/bge-small-en-v1.5
|
135 |
+
model-index:
|
136 |
+
- name: SetFit with BAAI/bge-small-en-v1.5
|
137 |
+
results:
|
138 |
+
- task:
|
139 |
+
type: text-classification
|
140 |
+
name: Text Classification
|
141 |
+
dataset:
|
142 |
+
name: Unknown
|
143 |
+
type: unknown
|
144 |
+
split: test
|
145 |
+
metrics:
|
146 |
+
- type: accuracy
|
147 |
+
value: 1.0
|
148 |
+
name: Accuracy
|
149 |
+
---
|
150 |
+
|
151 |
+
# SetFit with BAAI/bge-small-en-v1.5
|
152 |
+
|
153 |
+
This is a [SetFit](https://github.com/huggingface/setfit) model that can be used for Text Classification. This SetFit model uses [BAAI/bge-small-en-v1.5](https://huggingface.co/BAAI/bge-small-en-v1.5) as the Sentence Transformer embedding model. A [LogisticRegression](https://scikit-learn.org/stable/modules/generated/sklearn.linear_model.LogisticRegression.html) instance is used for classification.
|
154 |
+
|
155 |
+
The model has been trained using an efficient few-shot learning technique that involves:
|
156 |
+
|
157 |
+
1. Fine-tuning a [Sentence Transformer](https://www.sbert.net) with contrastive learning.
|
158 |
+
2. Training a classification head with features from the fine-tuned Sentence Transformer.
|
159 |
+
|
160 |
+
## Model Details
|
161 |
+
|
162 |
+
### Model Description
|
163 |
+
- **Model Type:** SetFit
|
164 |
+
- **Sentence Transformer body:** [BAAI/bge-small-en-v1.5](https://huggingface.co/BAAI/bge-small-en-v1.5)
|
165 |
+
- **Classification head:** a [LogisticRegression](https://scikit-learn.org/stable/modules/generated/sklearn.linear_model.LogisticRegression.html) instance
|
166 |
+
- **Maximum Sequence Length:** 512 tokens
|
167 |
+
- **Number of Classes:** 2 classes
|
168 |
+
<!-- - **Training Dataset:** [Unknown](https://huggingface.co/datasets/unknown) -->
|
169 |
+
<!-- - **Language:** Unknown -->
|
170 |
+
<!-- - **License:** Unknown -->
|
171 |
+
|
172 |
+
### Model Sources
|
173 |
+
|
174 |
+
- **Repository:** [SetFit on GitHub](https://github.com/huggingface/setfit)
|
175 |
+
- **Paper:** [Efficient Few-Shot Learning Without Prompts](https://arxiv.org/abs/2209.11055)
|
176 |
+
- **Blogpost:** [SetFit: Efficient Few-Shot Learning Without Prompts](https://huggingface.co/blog/setfit)
|
177 |
+
|
178 |
+
### Model Labels
|
179 |
+
| Label | Examples |
|
180 |
+
|:------|:---------|
|
181 |
+
| 0 | <ul><li>'. : Pt oh mM\nBaw iS\n\nWw tere\nPr pe 0 ok ji the\nFw: Pending Bills jer\n\n, Ronit Sarangi to: Vinit K Sinha i 22-01-2020 11:37\n| Ce: Shree Nath Mishra, Rajesh Kumar Gupta, Krishna Padhi\n\ntect |, UG\nDear Vinit, “ni Do\n\n24\nPlease find the corporate approval in your trailing mail. The excel sheet of details of pending bills A\nclearance is attached herewith for your kind perusal.\n\ni:\n\nBills Pending.xisx\n\nRegards,\nRonit Sarangi\nHirakud Legal\nooo-+ Forwarded by Fcnit Sarangi/Legal/Hirakud/Hindalco/ABG on 01/22/2020 11:29 -----\n\nFrom: Shankar V R <vr.shankar@adityabirla.com>\nT Kamadev Raulo <kamadev.raulo@adityabirla.com>\nRONIT SARANGI <ronit.sarangi@adityabirla.com>\n01/22/2020 11:04 AM\nRE: Pending Bills\nae: acne\n\nApproved.\n\nShankar VR\n\nFrom: Kamadev Raulo\n\nSent: Monday, January 20, 2020 5:09 PM\n\nTo: Shankar V R <vr.shankar@adityabirla.com>\n\nCc: RONIT SARANW <ronit.sarangi@adityabirla.com>\nSubject: Fw: Pending Bills\n\nDear Sir,\nNumber of bills of lawyers/ counsel yet to be cleared, a list thereof is attached in trailing mail.\n\nAs required by the Unit finance, corporate approval will be required for clearance of the bills.\n\nWe are collecting fee structure from the individual lawyers for one time approval from corporate which\nmay take some time.\n\nMeanwhile, please approve the pending bills as per the list attached for clearance. | have cross\nchecked the bills of the lawyers which are based on the rate the Unit has been paying during last 2-3\nyears.\n\nFurther, for FY 2019-20 legal budget was sanctioned for Rs.30.00 lacs only, wnicn is already over. We\nare taking up the issue with Finance Head, Sambalpur cluster for adjustment as we have unutilized\nbudget in hand of Rs.33.00 lacs sanctioned to Aditya.\n\x0c'</li><li>"eV\n\n QIGY Sgue aia cqaa sé\n\nOFFICE OF THE CHIEF LOAD DESPATCHER,SLDC\n\nODISHA POWER TRANSMISSION CORPORATION LIMITED\nGRIDCO Colony, P.O.-Mancheswar Rly. 
Colony, Bhubaneswar-751017, FAX-0674- 2748509\nCIN — U401020R2004SGC007553\n\n(2 )\nNo. CLD(OS)-160/2019/STOA (INTRA)- 33% Dated :> } 01/2020\nFrom: )\n\n \n\nChief Load Despateher.\nSLDC. OPTCL. Bhubaneswar\nTo:\nM/s Hindalco Industries Limited, Hirakud Smelter.\nHirakud, Dist. Sambalpur, Pin ; 768016\n\nSub: Approval for Intra-State Short Term Open Access for wheeling of 40MW RTC power from M/s\nAditya Aluminium, Hindalco Industries Limited, Lapanga .Sambalpur to M/s Hindalco Industries\nLimited, Hirakud Smelter, Hirakud, Sambalpur for the period from 01/02/2020 to 29/02/2020\n\nRef; Approval No. : SLDC/BBSR/2019-20/626/STOA Dated: 31.01.2020\n\nSir,\nAs per OERC (Terms and Conditions for Open Access) Regulation 2005, the STOA for transfer of 40\nMW of power on RTC basis from M/s Aditya Aluminium, Hindalco Industries Limited, Lapanga ,Sambalpur\nto M/s Hindalco Industries Limited, Hirakud Smelter, Hirakud. Sambalpur for a period from 01/02/2020 to\n29/02/2020 has been approved vide approval under reference. A copy of the approval order (Format —7) along\nwith requisite formats is as enclosed herewith for necessary action.\n\n‘Transmission loss, as approved by OERC shall be borne by the OA customer and Transmission\ncharges as approved by OERC has to be paid by the OA customer. M/s Aditya Aluminium, Hindalco\nIndustries Limited, Lapanga ,Sambalpur shall furnish 15 minutes block wise day-ahead injection schedule and\ndrawal schedule of M/s Hindalco Industries Limited, Hirakud Smelter, Hirakud, Sambalpur separately as per\nthe prescribed format to SLDC. A copy of the drawal schedule shall be furnished to WESCO.\n\nAs per Clause 2.4.2 of “Guidelines & Procedure fur Reservation of Transmission / Distribution\nCapacity for STOA Customers”, M/s Hindalco Industries Limited. 
Hirakud shall make payment to SLDC /\nOPTCL as per the scheduled payment latest by 11:00 hours of the working day, before beginning of the\ntransaction.\n\nAs per Clause 3.12.1, in case of payment default the customer shall be liable to pay the outstanding\npayment in full along with Delayed Payment Surcharge @ 0.1% per day.\n\nYours faithfully,\n\nEncl: As above fy v™\nq oN s\n_xChief Load Despatcher,\n' SLDC\nCC:\n\nlL. = =C,0.0., WESCO Utility for information.\n\n2. ABT Cell in Charge, WESCO Utility. Burla. He is requested to deduct the scheduled energy from the\nenergy consumed by M/s Hindalco Industries Limited, Hirakud Simelter, Hirakud, Sambalpur for the\nabove transaction from billing for the month of February-2020.\n\n3. CGM(O&M). OPTCL /CGM( Fin). OPTCI. / C.G.M.APP).Grideo / Sr.G.M. (RT&C), OPTCL/ Member\nSecretary. GCC\n\n4. EA to CMD, OPTCL for kind information of CMD\n\x0c"</li><li>'2s\na\n\n \n \n \n \n \n\n \n \n\n€ WR ORC Gale GaN! SateTa Gua!\n| oe i : z oa\n\noe Os!\n\naa one <= ae aponae\n\n(een T= oo ghevrIaa) ;\nCOHERA > Bo, cu Foo RCTS)\n(HORNA > 900,45 800 GRAA)\nCHM > Yoo Sisriaa) .\nEIR! QSOS > @ PO CAT .\n(NORM <= Coo GCAMIG)\n(HERA > Foo, c= Noo Ghe/eiay\nCARRA> Noe BReTee ;\n\n \n\nTas cea oI) :\n\n \n\nfeat OaSeIg ED GEM >= 99 Gead<eeoKee | OR\n\nPRICING Cloaks) ASG k * ¢\n\nace\n\nCad Gate (Ca) SACI < 99 Oa a\n\n \n\naoe Oo\n\nMAR oo\n\n \n \n \n\n \n\n \n\nPR6R efianem aes\n\n \n\n \n\nsgange gerne Gage ARLSTOT!\n\n \n\n \n \n\n \n\n \n\n \n\n \n \n \n \n \n \n \n\n \n \n\n \n \n \n\n \n\n; sf B Ea ¢ PEGt FSR\n[3 [rear RRC\n\n \n \n\nAER BRO HS FIO FLNee\nad 66a) Gue rides GA\n\n9. ossva aidk Socen 20 Aq 9 CERES Maa Gog GoM GER |\n\nGBeoegen. = _\n\n=\nsco\n\n \n \n\nBS QS! OS SA ARO GoKTAAIS EEE Bisa BIS GGA EDT .C.AN, 08 E09 OAD :\nSOG, GRE GA GOR ACA Bei oN RELAIS V 0G. OF Gale 5a, HEY FREA GOPISR GHORIA aqUe! 
AqHe, RASA 9.0% P/U TIDES Gas See 1-H Qiur Swad Gas Qe qe\n\n“ope aDeoTe |\n\nDIHGI-PNIDTR\n\n \n\nGe\n\nsig st norma sence anmerencecvsncnen PANN cls rx unas mina rien erie wegen\n\nHAUT). QM 7, Teoel GSA\nERR FAR, GOGATR OF 000 a\n\n: QUE SORT AEREND\npa 1 PRO Qs FOE 7:\n_ [Sa TS OTSA GFT TORR\nate GrSCAA GAs Tos\nGS 6 AST SCAR 6 Veen Ga Pers\n\nRYCETLCIOPRES\n\na\n\ncaon ol adres rea\n\n \n\n€\n\x0c'</li></ul> |
|
182 |
+
| 1 | <ul><li>'Tax Invoice\nOriginal for Buyer/ Duplicate for Transporter/ Triplicate for Assessee\n\nSupplier Legal Name; Mahanadi Coalfields Area Code :MO01\n7 Limited Area Description :Jagannath\nSupplier Address , Jagriti Vihar, Bur.a Invaice Number 19100066504\nSambalpur 768020 Involee Date :Dee 15, 2022\nSupplier City : Sambalpur Contract Reference: 3030007756\nSupplier State Odisha Contract type :Spot Auction\nSupplier Pincode : 768020 Salas Order 1240002677\n.P.O. - dJagriti vihar, Burla |Supplier GSTIN : 21AABCMS188P1Z23 Sala Order Data sNov 10, 2022\n\nDistrict : Sambalpur - Supplier Email : Mode of Dispatch :ROAD\n768020 Odisha\n\n+91-663-2542461\n+91-663-2542770\nWWW. MAHANADICOAL. IN b17b2c4d22fdc429d9£ 2220208 3dd713cf1C85200343d43eacl£7415af5d190a\n\nRaceiver (Billed To) Consignese (Shipced =o) Details of Dispatch\nName *HINDALCO INDUSTRIES LIMITED Name :\nParty Code :2000000335 Party Code : 2000000395 Grade - G12\nAddress ; HIRAKUD SAMBALPUR SAMBALPUR Address + Within Odisha acy + 3701-4000\n768016 Size : +100 MM\n\ncity - SAMBALPUR City\nPincode _ 768016 pincede Dispatch date :Dec 15, 2022\n\nState code :Odigha State code Plant 15046\nPhone number 06632481365 Phone number :\n\nGSTIN 21AAACH1201R1Z2Z GSTIN\n£-Mail ID Saurav. panigrahi@adityabirla.com E-Mail ID\n\nCompany Name-\n\n8001220502 4100000000 Bituminous coal 27011200 1289.37\n\nPARTICULARS\n\nPriaing Description ; : cif 1, Rete Per DOM(INR) Amount (INR)\n\nBasic Price 3958.00 5103326 .46\nSizing Charges 112175.19\nSTC Charges 70915.35\nfvac Facility Charge 77362 .20\n\nRoyalty Charges { 14% of Basic Price) 714465.70\n\n \n\nNMET Chargea({ 2% of Royalty)\n\nDMF( 30% of Royalty) 214339.71\nCGST( 2.5% ) 157671.85\nSGST( 2.5% ) P| 157671.85\nGST Comp Cess 515748 00\nGross Bill Value 7137965 .62\n\nNet Value 5536.01 7137965.62\n\n14289.31\n\nRemarks/Note/ Declaration Total Amount: 7137965.62\n\nReverse Charge Applicable. 
No\n\n \n\nTotal Bill Value In words SEVENTY ONE LAKH THIRTY SEVEN THOUSAND NINE HUNDRED SIXTY FIVE RUPEES SIXTY TWO PAISE\n\nCartified that the particulars given above are true and correct and the amount indicated represents the price actually charged and that\nthere is no flow of additional consideration directly or indirectly from the buyer,\n\nArea : Jagannath\n\n»No NA\ni bate Telephone : 6760269528\nLe Amount 0 Fax Number : 6760269527\n\nAdvising Bank Name_: NA E-Mail Address : so-sales-jaga.mcl@coalindia, in\n\nThis 18 digitally verified document hence manual/ physical signature 15 not required\n\nAuthorized Signatory\n\x0c'</li><li>' \n\nj Tax Invoice 0 Ms,\n. Original for Buyer/ Duplicate for Transporter/ Triplicate for Assessee \\\n\n \n\n \n \n \n \n \n \n \n \n\n \n \n \n\n \n \n\n \n \n\n \n \n \n\n \n \n \n\n \n\n \n\n \n\n \n \n \n \n \n \n \n \n \n\nSupplier Legal_Name: Mahanadi Coalfields Area Code :MO09\nLimited Area Description :Basundhara\nSupplier Address ; Jagriti Vihar, Burla Invoice Number 9180040556\nSambalpur 768020 Invoice Date :Dec’ 27, 2022\nSupplier City : Sambalpur Contract Reference:3030004571\nSupplier State : Odisha Contract type :FSA Linkage\nSupplier Pincode : 768020 Sales Order :1390001150\nP.O. 
+ J I Supplier GSTIN : 21AABCM5188P1Z3 Sale Order Date :Dec 14, 2022\nDistrict : Sambalpur - Supplier Email Mode of Dispatch :ROAD\n768020 Odisha\n+91- -2542\n+91- 3-2542770\nWWW .MAHANADICOAL.IN\n\n \n \n \n\nRece Consignee (Shipped to)\nName : HINDALCO INDUSTRIES LIMITED\nParty Code :20 J0395\n‘ RAKUD SAMBALPUR SAMBALPUR\n768016\n\nDetails of Dispatch\n\n \n \n \n \n \n \n\n \n \n\nName §\nParty Code : 2000000395\n\n \n\nGrade : G13\nGCV : 3401-3700\nSize : -100 MM\n\n \n \n\n \n \n\n \n\n \n \n\nAddress :Within Odisha\n\n \n\nDispatch date : Dec 27, 2022\n\n \n\nPlant 75026\n\n \n\nE-Mail\n\nMaterial Description HSN Code Unit of Measure Quantity\nseeeeeee ohwnsness _ o_\n\nID\n\n \n\n \n\nPARTICULARS\nPricing Description Rate Per UOM(INR) Amount (INR)\nBasic Price 1140.00 60522.60\n\n4618.83\n\n5627.54\n\n \n\nEvac Facility Charge | 60.00 3185.40\n\n8473.16\n\nmy\noy\n\\o\nib\nOV\n\n2541.95\n\n2128.47\n\n2128.47\n\n \n\nGST Comp Cess 400.00 21236.00\n\n \n \n\nGross Bill Value 2083.86 110631.88\n\n2083.86 110631.88\n\nTotal Amount: 110631.88\n\nReverse Charge Applicable: No\n\nTotal Bill Value In words ONE LAKH TEN THOUSAND SIX HUNDRED THIRTY ONE RUP\n\nArea : Basundhara\nTelephone : 6621286133\nFax Number : 6621286144\n:NA E-Mail Address : so-sales-basa.mcl@coalindia.in\n\nis digitally verified document hence manual/ physical signature is\n\nAuthorized Signatory\n\n \n\x0c'</li><li>'Tax Invoice\nOriginal for Buyer/ Duplicate for Transporter/ Triplicate for Assessee C\n\nMahanadi Coalfields Area Code :MO09\nLimited Area Description :Basundhara\nSupplier Address ‘ dJagriti Vihar, Burla Invoice Number 19180038258\nSambalpur 768020 Invoice Date :Nov 24, 2022\nSupplier City : Sambalpur Contract Reference: 3030007704\nSupplier State : Odisha Contract type :Spot Auction\nSupplier Pincode : 768020 Sales Order 71290001518\n- Jagriti Vihar, Burla |Supplier GSTIN : 21AABCM5188P1Z3 Sale Order Date :Nov 10, 2022\ni Sambalpur - Supplier Email : Mode of Dispatch 
:ROAD\n\nSupplier Legal_Name:\n\nso\n\n‘\n10 © 0)\n\n+\n\ndl2bd458édabaf99f542f210873b14beb2b9c1e012976832alelded20e19f6a0\n\nReceiver (Billed To) Consignee (Shipped to) Details of Dispatch\n: HINDALCO INDUSTRIES LIMITED Name :\nParty Code :2000000395 Party Code : 2000000395 Grade : G13\nKdavees , HIRAKUD SAMBALPUR SAMBALPUR nBaireseres : Within Odisha Gcv : 3401-3700\n768016 Size : -100 MM\nity : SAMBALPUR City\nincode : 768016 Pincode\ne code :Odisha State code z Plant : 5026\nPhone number: 06632481365 Phone number\nGSTIN : 21AAACH1201R12ZZ GSTIN\n\nDispatch date : Nov 24, 2022\n\nE-Mail ID : Saurav.panigrahi@adityabirla.com E\n\nCompany Name:\n\nSst Sees ae ~~\nKulda OC Mine 4100000000 Bituminous Coal 27011200 1691:.22\n\nPARTICULARS\n\nPricing Description : Rate Per UOM(INR) / Amount (INR) — é\n\n=\n\n6995.33 11829934.89\n\n: 11829934.89\nRemarks/Note/ Declaration Total Amount\n\nReverse Charge Applicable: No\n\nEIGHTEEN LAKH TWENTY NINE THOUSAND NINE HJNDRED THIRTY FOUR RUPEES EIGHTY NINE PAISE\n\nCertified that the particulars given above are true and correct and the amc indicated represents the price actually charged and that\nthere is no flow of additional consideration directly or indirectly from the jer.\n\nArea : Basundhara\n\nTelephone : 6621286133\n\nFax Number : 6621286144\n\nLe _ ‘ ‘ ‘\nE-Mail Address : so-sales-basa.mcl@coalindia.in\n\nAdvising Bank Name\n\nThis is digitally verified document hence manual/ physical signature is not required\n\nAuthorized Signatory\n\n \n\x0c'</li></ul> |
|
183 |
+
|
184 |
+
## Evaluation
|
185 |
+
|
186 |
+
### Metrics
|
187 |
+
| Label | Accuracy |
|
188 |
+
|:--------|:---------|
|
189 |
+
| **all** | 1.0 |
|
190 |
+
|
191 |
+
## Uses
|
192 |
+
|
193 |
+
### Direct Use for Inference
|
194 |
+
|
195 |
+
First install the SetFit library:
|
196 |
+
|
197 |
+
```bash
|
198 |
+
pip install setfit
|
199 |
+
```
|
200 |
+
|
201 |
+
Then you can load this model and run inference.
|
202 |
+
|
203 |
+
```python
|
204 |
+
from setfit import SetFitModel
|
205 |
+
|
206 |
+
# Download from the 🤗 Hub
|
207 |
+
model = SetFitModel.from_pretrained("Gopal2002/COAL_INVOICE_ZEON")
|
208 |
+
# Run inference
|
209 |
+
preds = model("""UNITED MEDICAL STORE Patient Name: KASTURI uENA
|
210 |
+
‘EW MARKET, C/O PRAFULLA KUMAR JENA
|
211 |
+
HIRAKUD. SAMBALPUR. Dr. Name :
|
212 |
+
|
213 |
+
Medicine Advice Slip: MA/2223/0668 “
|
214 |
+
Phone :0663-2431670 Prescription Indent:M/2223/06299
|
215 |
+
|
216 |
+
DL No. :SAWZ 486 R/487 RC Invoice No. ; 0002785 Date : 21/11/2022
|
217 |
+
|
218 |
+
Se|__Qiy. [Pack [Product “Batch [Exp] HSN [ MRP | Table | Dis [5051] CO3i] Amount |
|
219 |
+
|
220 |
+
1. 30 TAB] 30'S TELMA H TAB 11/24 | 30049099; 484.00! 432.14 0.001 6.00
|
221 |
+
NEOPRIDE TOTAL CAP 7/24 30049099) 445.00) 0,00; 6.00
|
222 |
+
|
223 |
+
|
224 |
+
|
225 |
+
|
226 |
+
|
227 |
+
|
228 |
+
|
229 |
+
SUB TOTAL :
|
230 |
+
|
231 |
+
SGST
|
232 |
+
er rH 2 ROFF :
|
233 |
+
— ha GRAND TOTAL
|
234 |
+
|
235 |
+
Te & Con itions For UNITED MEDICAL STORE R a ah
|
236 |
+
BILL GRAND TOTAL IS CALCULATED ACCORDING TO 1D- 3306 Im- 1220
|
237 |
+
MRP PRICE ( INCLUDING ALL GST TAXES ) Q _ 06 (ped)
|
238 |
+
|
239 |
+
|
240 |
+
""")
|
241 |
+
```
|
242 |
+
|
243 |
+
<!--
|
244 |
+
### Downstream Use
|
245 |
+
|
246 |
+
*List how someone could finetune this model on their own dataset.*
|
247 |
+
-->
|
248 |
+
|
249 |
+
<!--
|
250 |
+
### Out-of-Scope Use
|
251 |
+
|
252 |
+
*List how the model may foreseeably be misused and address what users ought not to do with the model.*
|
253 |
+
-->
|
254 |
+
|
255 |
+
<!--
|
256 |
+
## Bias, Risks and Limitations
|
257 |
+
|
258 |
+
*What are the known or foreseeable issues stemming from this model? You could also flag here known failure cases or weaknesses of the model.*
|
259 |
+
-->
|
260 |
+
|
261 |
+
<!--
|
262 |
+
### Recommendations
|
263 |
+
|
264 |
+
*What are recommendations with respect to the foreseeable issues? For example, filtering explicit content.*
|
265 |
+
-->
|
266 |
+
|
267 |
+
## Training Details
|
268 |
+
|
269 |
+
### Training Set Metrics
|
270 |
+
| Training set | Min | Median | Max |
|
271 |
+
|:-------------|:----|:---------|:-----|
|
272 |
+
| Word count | 1 | 270.5442 | 4241 |
|
273 |
+
|
274 |
+
| Label | Training Sample Count |
|
275 |
+
|:------|:----------------------|
|
276 |
+
| 0 | 130 |
|
277 |
+
| 1 | 85 |
|
278 |
+
|
279 |
+
### Training Hyperparameters
|
280 |
+
- batch_size: (32, 32)
|
281 |
+
- num_epochs: (2, 2)
|
282 |
+
- max_steps: -1
|
283 |
+
- sampling_strategy: oversampling
|
284 |
+
- body_learning_rate: (2e-05, 1e-05)
|
285 |
+
- head_learning_rate: 0.01
|
286 |
+
- loss: CosineSimilarityLoss
|
287 |
+
- distance_metric: cosine_distance
|
288 |
+
- margin: 0.25
|
289 |
+
- end_to_end: False
|
290 |
+
- use_amp: False
|
291 |
+
- warmup_proportion: 0.1
|
292 |
+
- seed: 42
|
293 |
+
- eval_max_steps: -1
|
294 |
+
- load_best_model_at_end: False
|
295 |
+
|
296 |
+
### Training Results
|
297 |
+
| Epoch | Step | Training Loss | Validation Loss |
|
298 |
+
|:------:|:----:|:-------------:|:---------------:|
|
299 |
+
| 0.0013 | 1 | 0.2394 | - |
|
300 |
+
| 0.0657 | 50 | 0.1203 | - |
|
301 |
+
| 0.1314 | 100 | 0.0095 | - |
|
302 |
+
| 0.1971 | 150 | 0.0029 | - |
|
303 |
+
| 0.2628 | 200 | 0.0014 | - |
|
304 |
+
| 0.3285 | 250 | 0.0014 | - |
|
305 |
+
| 0.3942 | 300 | 0.0011 | - |
|
306 |
+
| 0.4599 | 350 | 0.0009 | - |
|
307 |
+
| 0.5256 | 400 | 0.0008 | - |
|
308 |
+
| 0.5913 | 450 | 0.0007 | - |
|
309 |
+
| 0.6570 | 500 | 0.0008 | - |
|
310 |
+
| 0.7227 | 550 | 0.0008 | - |
|
311 |
+
| 0.7884 | 600 | 0.0006 | - |
|
312 |
+
| 0.8541 | 650 | 0.0005 | - |
|
313 |
+
| 0.9198 | 700 | 0.0004 | - |
|
314 |
+
| 0.9855 | 750 | 0.0005 | - |
|
315 |
+
| 1.0512 | 800 | 0.0004 | - |
|
316 |
+
| 1.1170 | 850 | 0.0005 | - |
|
317 |
+
| 1.1827 | 900 | 0.0004 | - |
|
318 |
+
| 1.2484 | 950 | 0.0004 | - |
|
319 |
+
| 1.3141 | 1000 | 0.0003 | - |
|
320 |
+
| 1.3798 | 1050 | 0.0004 | - |
|
321 |
+
| 1.4455 | 1100 | 0.0004 | - |
|
322 |
+
| 1.5112 | 1150 | 0.0004 | - |
|
323 |
+
| 1.5769 | 1200 | 0.0005 | - |
|
324 |
+
| 1.6426 | 1250 | 0.0004 | - |
|
325 |
+
| 1.7083 | 1300 | 0.0003 | - |
|
326 |
+
| 1.7740 | 1350 | 0.0004 | - |
|
327 |
+
| 1.8397 | 1400 | 0.0005 | - |
|
328 |
+
| 1.9054 | 1450 | 0.0004 | - |
|
329 |
+
| 1.9711 | 1500 | 0.0003 | - |
|
330 |
+
|
331 |
+
### Framework Versions
|
332 |
+
- Python: 3.10.12
|
333 |
+
- SetFit: 1.0.3
|
334 |
+
- Sentence Transformers: 2.2.2
|
335 |
+
- Transformers: 4.35.2
|
336 |
+
- PyTorch: 2.1.0+cu121
|
337 |
+
- Datasets: 2.16.1
|
338 |
+
- Tokenizers: 0.15.0
|
339 |
+
|
340 |
+
## Citation
|
341 |
+
|
342 |
+
### BibTeX
|
343 |
+
```bibtex
|
344 |
+
@article{https://doi.org/10.48550/arxiv.2209.11055,
|
345 |
+
doi = {10.48550/ARXIV.2209.11055},
|
346 |
+
url = {https://arxiv.org/abs/2209.11055},
|
347 |
+
author = {Tunstall, Lewis and Reimers, Nils and Jo, Unso Eun Seo and Bates, Luke and Korat, Daniel and Wasserblat, Moshe and Pereg, Oren},
|
348 |
+
keywords = {Computation and Language (cs.CL), FOS: Computer and information sciences},
|
349 |
+
title = {Efficient Few-Shot Learning Without Prompts},
|
350 |
+
publisher = {arXiv},
|
351 |
+
year = {2022},
|
352 |
+
copyright = {Creative Commons Attribution 4.0 International}
|
353 |
+
}
|
354 |
+
```
|
355 |
+
|
356 |
+
<!--
|
357 |
+
## Glossary
|
358 |
+
|
359 |
+
*Clearly define terms in order to be accessible across audiences.*
|
360 |
+
-->
|
361 |
+
|
362 |
+
<!--
|
363 |
+
## Model Card Authors
|
364 |
+
|
365 |
+
*Lists the people who create the model card, providing recognition and accountability for the detailed work that goes into its construction.*
|
366 |
+
-->
|
367 |
+
|
368 |
+
<!--
|
369 |
+
## Model Card Contact
|
370 |
+
|
371 |
+
*Provides a way for people who have updates to the Model Card, suggestions, or questions, to contact the Model Card authors.*
|
372 |
+
-->
|
config.json
ADDED
@@ -0,0 +1,31 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "/root/.cache/torch/sentence_transformers/BAAI_bge-small-en-v1.5/",
|
3 |
+
"architectures": [
|
4 |
+
"BertModel"
|
5 |
+
],
|
6 |
+
"attention_probs_dropout_prob": 0.1,
|
7 |
+
"classifier_dropout": null,
|
8 |
+
"hidden_act": "gelu",
|
9 |
+
"hidden_dropout_prob": 0.1,
|
10 |
+
"hidden_size": 384,
|
11 |
+
"id2label": {
|
12 |
+
"0": "LABEL_0"
|
13 |
+
},
|
14 |
+
"initializer_range": 0.02,
|
15 |
+
"intermediate_size": 1536,
|
16 |
+
"label2id": {
|
17 |
+
"LABEL_0": 0
|
18 |
+
},
|
19 |
+
"layer_norm_eps": 1e-12,
|
20 |
+
"max_position_embeddings": 512,
|
21 |
+
"model_type": "bert",
|
22 |
+
"num_attention_heads": 12,
|
23 |
+
"num_hidden_layers": 12,
|
24 |
+
"pad_token_id": 0,
|
25 |
+
"position_embedding_type": "absolute",
|
26 |
+
"torch_dtype": "float32",
|
27 |
+
"transformers_version": "4.35.2",
|
28 |
+
"type_vocab_size": 2,
|
29 |
+
"use_cache": true,
|
30 |
+
"vocab_size": 30522
|
31 |
+
}
|
config_sentence_transformers.json
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"__version__": {
|
3 |
+
"sentence_transformers": "2.2.2",
|
4 |
+
"transformers": "4.28.1",
|
5 |
+
"pytorch": "1.13.0+cu117"
|
6 |
+
}
|
7 |
+
}
|
config_setfit.json
ADDED
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"labels": null,
|
3 |
+
"normalize_embeddings": false
|
4 |
+
}
|
model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:98a187dd402733ebbaa859e78d0cce75b1a994e12fe579d4f5bac0efdb4d23b0
|
3 |
+
size 133462128
|
model_head.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5954cae7ab425103f9263d543d45ee1c48e4b11d4e256a7e53b2e8aba2d74811
|
3 |
+
size 3919
|
modules.json
ADDED
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"idx": 0,
|
4 |
+
"name": "0",
|
5 |
+
"path": "",
|
6 |
+
"type": "sentence_transformers.models.Transformer"
|
7 |
+
},
|
8 |
+
{
|
9 |
+
"idx": 1,
|
10 |
+
"name": "1",
|
11 |
+
"path": "1_Pooling",
|
12 |
+
"type": "sentence_transformers.models.Pooling"
|
13 |
+
},
|
14 |
+
{
|
15 |
+
"idx": 2,
|
16 |
+
"name": "2",
|
17 |
+
"path": "2_Normalize",
|
18 |
+
"type": "sentence_transformers.models.Normalize"
|
19 |
+
}
|
20 |
+
]
|
sentence_bert_config.json
ADDED
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"max_seq_length": 512,
|
3 |
+
"do_lower_case": true
|
4 |
+
}
|
special_tokens_map.json
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"cls_token": "[CLS]",
|
3 |
+
"mask_token": "[MASK]",
|
4 |
+
"pad_token": "[PAD]",
|
5 |
+
"sep_token": "[SEP]",
|
6 |
+
"unk_token": "[UNK]"
|
7 |
+
}
|
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer_config.json
ADDED
@@ -0,0 +1,57 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"added_tokens_decoder": {
|
3 |
+
"0": {
|
4 |
+
"content": "[PAD]",
|
5 |
+
"lstrip": false,
|
6 |
+
"normalized": false,
|
7 |
+
"rstrip": false,
|
8 |
+
"single_word": false,
|
9 |
+
"special": true
|
10 |
+
},
|
11 |
+
"100": {
|
12 |
+
"content": "[UNK]",
|
13 |
+
"lstrip": false,
|
14 |
+
"normalized": false,
|
15 |
+
"rstrip": false,
|
16 |
+
"single_word": false,
|
17 |
+
"special": true
|
18 |
+
},
|
19 |
+
"101": {
|
20 |
+
"content": "[CLS]",
|
21 |
+
"lstrip": false,
|
22 |
+
"normalized": false,
|
23 |
+
"rstrip": false,
|
24 |
+
"single_word": false,
|
25 |
+
"special": true
|
26 |
+
},
|
27 |
+
"102": {
|
28 |
+
"content": "[SEP]",
|
29 |
+
"lstrip": false,
|
30 |
+
"normalized": false,
|
31 |
+
"rstrip": false,
|
32 |
+
"single_word": false,
|
33 |
+
"special": true
|
34 |
+
},
|
35 |
+
"103": {
|
36 |
+
"content": "[MASK]",
|
37 |
+
"lstrip": false,
|
38 |
+
"normalized": false,
|
39 |
+
"rstrip": false,
|
40 |
+
"single_word": false,
|
41 |
+
"special": true
|
42 |
+
}
|
43 |
+
},
|
44 |
+
"clean_up_tokenization_spaces": true,
|
45 |
+
"cls_token": "[CLS]",
|
46 |
+
"do_basic_tokenize": true,
|
47 |
+
"do_lower_case": true,
|
48 |
+
"mask_token": "[MASK]",
|
49 |
+
"model_max_length": 512,
|
50 |
+
"never_split": null,
|
51 |
+
"pad_token": "[PAD]",
|
52 |
+
"sep_token": "[SEP]",
|
53 |
+
"strip_accents": null,
|
54 |
+
"tokenize_chinese_chars": true,
|
55 |
+
"tokenizer_class": "BertTokenizer",
|
56 |
+
"unk_token": "[UNK]"
|
57 |
+
}
|
vocab.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|