Push model using huggingface_hub.
Browse files
- 1_Pooling/config.json +7 -0
- README.md +271 -0
- config.json +31 -0
- config_sentence_transformers.json +7 -0
- config_setfit.json +4 -0
- model.safetensors +3 -0
- model_head.pkl +3 -0
- modules.json +20 -0
- sentence_bert_config.json +4 -0
- special_tokens_map.json +7 -0
- tokenizer.json +0 -0
- tokenizer_config.json +57 -0
- vocab.txt +0 -0
1_Pooling/config.json
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"word_embedding_dimension": 384,
|
3 |
+
"pooling_mode_cls_token": true,
|
4 |
+
"pooling_mode_mean_tokens": false,
|
5 |
+
"pooling_mode_max_tokens": false,
|
6 |
+
"pooling_mode_mean_sqrt_len_tokens": false
|
7 |
+
}
|
README.md
ADDED
@@ -0,0 +1,271 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
library_name: setfit
|
3 |
+
tags:
|
4 |
+
- setfit
|
5 |
+
- sentence-transformers
|
6 |
+
- text-classification
|
7 |
+
- generated_from_setfit_trainer
|
8 |
+
metrics:
|
9 |
+
- accuracy
|
10 |
+
widget:
|
11 |
+
- text: " \n \n \n\nHIRAKUD POWER / SMELTER\n\n@ - Payment Order\n\n( Address\
|
12 |
+
\ )\n\nEmp.No./S.Code No. Qhle\nby Cash/Cheque/D.D./Transfer the sumof ~ 35, +S0/—\n\
|
13 |
+
Rupees Thi ei ve therane Seven hun\nFi \\\nMail Id of Initiator: : OF)\n\n \n\n\
|
14 |
+
| Details of Payment\n\n;\n| AtMenclance, Cleritage ancl Otner\naa T\n\n|mise:\
|
15 |
+
\ Conveyances for ip eome No. |\n2x to 2-9, 3\\ 32 ano 34 of Qo| 2\n\nURL of payment:\n\
|
16 |
+
\nin . TotalRs.| 35, too /]- .\n\nPrepared by Recommended by Endorsed by Authorised\
|
17 |
+
\ By Approved by\n‘ A =\nPort Sara ee\nA ee EU (NY—\nDate 20/ 19 Plant Head Head-F\
|
18 |
+
\ &A Head - Sambalpur Cluster\n\n \n \n\nCharge\nAccount\n\n \n \
|
19 |
+
\ \n\nLeqa2\n\n~ Odisha cluoy\n\nOI) 202 Sefer (90\n\nONLINE PAYMENT\n\n \n\n\
|
20 |
+
\ \n\nCashier\nReceived Payment | Charge Account Checked by\n\nae eee _\n\n \n\
|
21 |
+
\nSignature\n\f"
|
22 |
+
- text: " \n\f"
|
23 |
+
- text: "Expenses during visit of morning for coal logistic.\n\nSl.no. _ Date Of Visit\
|
24 |
+
\ Particulars Amount Remarks\n1 21-Feb-16 Tea,Snax ager mis. - 105.00 Along with\
|
25 |
+
\ Mr N K Kar\n\n \n \n\n \n\n \n\n \n\nft eee ‘\n~# “Lunch. ° of AVS\
|
26 |
+
\ |\nee ou SATS i\n2 22-Feb-16); | “Fea soe mis, dee aot]\n; 3 . cng! a oa hoy\
|
27 |
+
\ ‘ “e i hs ye eo 1\n3 23-Feb-1600). Téa,Snax Andithis. I Along with Mr'N K Kar\
|
28 |
+
\ .\nee _ |) Lunch... a 00° oO 2 !\n4 24-Feb-16 Tea,Snax And mis. okt? |\nLinch\
|
29 |
+
\ ~ : egthedgtt £92 ox\n5 25-Feb-16\n\nmeted FES entre? i462\n\n- Teaisnax And\
|
30 |
+
\ mis. r AS Vi on\n) ie ihe oe » Lunch eres , Mo\n\n6 26-Feb-16 Tea, Snax And\
|
31 |
+
\ nis,\n\nyeahh! ct\n\nfeo, 7\n\n \n\n \n \n \n \n \n\n, 140.00; - Pend\
|
32 |
+
\ wih iM NK Kar\nlene . : -aaciog par rs :\n’ a7-Febalt Tea,Snax And itis” \"\
|
33 |
+
425.00 Along with Mr. K Kar\nLunch 280,00 es _— ,\n8 29-Feb-16 se Tea,Snax And\
|
34 |
+
\ oie Bh i af U5 5.00). \" pe. a!\n9 te Snax ‘And mis. ce n20. to & oe\n\n10\n\
|
35 |
+
\neee £50. Alone wit Mr N K Kar bye efort-\n\nevn, enews) :\nLaheue 325. 00 x\
|
36 |
+
\ Up £0 perenne os\neerie coer re ue\n\n \n\n,\n\n11\n\nHf figs bh.\n\n \n\n \
|
37 |
+
\ \n \n \n \n\n \n\n4\n‘\na\nvt wr 4 ‘\n“ane . mae t\nwha via ‘\n‘\n5\n12 {\n\
|
38 |
+
_ o |\n\" nay\ni\n¥\n4\n4\n_\ni\nTew. EN at Rbiew: Caen sere 4\ntA eS : f i :\n\
|
39 |
+
i — Eyl 3. 4\nes, j Lax > * awe 4\nwe be oy . “ tyne eel\ni ad\n: oe\nSeog) ayM.\
|
40 |
+
\ 44\nwr\na, obo ye eect ee —\n-\n\n \n\f"
|
41 |
+
- text: "HINDALCO INDUSTRIES LIMITED EMPLOYEES’ PROVIDENT FUND II\n\n| | B)REASON\
|
42 |
+
\ OF LEAVING SERVICE: RESIGNATION\n_ SERVICE TERMINATED ON\n\n \n \n \n \
|
43 |
+
\ \n \n \n \n \n\n \n\n|\n\n| | ACCOUNT OF (A) ILL\nHEALTH OF MEMBER\
|
44 |
+
\ (8)\nCONTRACTION /\n\nDISCONTINUATION — OF\nEMPLOYER'S BUSINESS OR\n\n(C) OTHER\
|
45 |
+
\ CAUSE BEYOND\n\nTHE CONTROL OF THE\n\n| EMBER\n|i PERSONAL REASON _\n\n__\n\n\
|
46 |
+
PAYMENT UCO BANK ,HIRAKUD SAMBALPUR ,ODISHA.\n(PLEASE ATTACH A COPY OF cmmntnnmeanisnnennenesennmaneeneisene\
|
47 |
+
\ nese\nCANCELLED CHEQUE/ATTESTED\n| COPY OF FIRST PAGE OF BANK PASS | IFS CODE\
|
48 |
+
\ ... UCBA0000285\n| BOOK _\nTa) FULL POSTAL ADDRESS WITH E- AT. GUNDRUPADA, PO-HIRAKUD,\
|
49 |
+
\ DIST- SAMBALPUR, ODISHA-.\n\n| 12 I BANK ACCOUNT DETAILS “FOR SAVING BANK ACCOUNT\
|
50 |
+
\ NO — 02850110044179\n!\n\nMAIL ID (IF ANY)\n\n \n\nPIN ...768016\n| E-MAIL ID\
|
51 |
+
\ :-\n\n- INCASE THE AMOUNT IS USED FOR ANY PURPOSE OTHER THAN STATED IN COLUMN\
|
52 |
+
\ (9) ABOVE, | AM\nLIABLE TO RETURN THE ENTIRE AMOUNT WITH PENAL INTEREST.\nTHE\
|
53 |
+
\ MEMBER HEREBY DECLARES THAT HE HAD NOT BEEN EMPLOYED FOR 2 MONTH (YES/NO)\n\n\
|
54 |
+
(APPLICABLE FOR PF SETTLEMENT ONLY)\nve SIG N41\n\nMEMBER SIGNATURE AND DATE\n\
|
55 |
+
\nCERTIFIED THAT THE APPLICATION HAS BEEN SIGNED BY THE MEMBER IN MY PRESENCE\
|
56 |
+
\ AFTER HE/SHE HAD\nREAD THE CONTENT / THE CONTENT HAD BEEN EXPLAINED TO HIM /\
|
57 |
+
\ HER BY ME AND THAT THE\nINFORMATION GIVEN IN THE APPLICATION FORM |S CORRECT\n\
|
58 |
+
\nDATE:- : yA\nye\"\nEMPLOYER'S SIGNATURE\n\nDESIGNATION & SEAL OF EMPLOYER\n\
|
59 |
+
(OPTIANAL FOR FINAL PF SETTLEMENT)\n\nENCLOSURES: WV SELF ATTESTED AADHAR CARD\
|
60 |
+
\ & PANCARD\n2 cory OF CANCELLED CHEQUE / SELF ATTESTED COPY OF 15° PAGE OF PASS\
|
61 |
+
\ BOOK.\n\f"
|
62 |
+
- text: " \n\nHINDALCO INDUSTRIES LIMITED\nHIRAKUD\n\nPAYMENT ORDER\n\nPayto Simanchal\
|
63 |
+
\ Khatai\nCash Vr.No.\n\n \n\nEmp.No/S.Code No. _ ~\nby Cash/Cheque/D.D./Transfer\
|
64 |
+
\ the sum of Rs.2,00,000.00 apvrno,lOlY% 3s\nRupees Two Lakh only\n\n \n\nDetails\
|
65 |
+
\ of Payment Amount (Rs)\n\n \n\nns . 2,00,000\n\n \n\n \n\n \n\n \n\n \n\n \n\
|
66 |
+
\n2,00,000.\nPrepared by Recommeded by Endorsed by Authorised By Approved by\n\
|
67 |
+
\n9 ’\nner (wy\nDate Dept. Head Plant Head -F&A Head - Sambalpur Cluster\nPayment\
|
68 |
+
\ made on Charge\noem ra\n\n(b) By Cheque ner 2] 2G ~ 2> 7 + DA SHO-KLB (321)\n\
|
69 |
+
\nState Bank of india, Burla\nState Bank of India, Hirakud\nPunjab National Bank,\
|
70 |
+
\ Sambalpur [PNB-1]\n\n \n\n \n\n \n\n \n\n \n\nUuCcO Hirakud\n\n \n\nUCO’Bank,\
|
71 |
+
\ Sambalpur\n{DBI , Sambalpur (IDBI -1)\nIDB! , Sambalpur (IDBI -2)\n\nReceived\
|
72 |
+
\ Payment Charge Account Checked by\nSignature\n\n \n\n \n\n \n\n \n\n \n\n \n\
|
73 |
+
\f"
|
74 |
+
pipeline_tag: text-classification
|
75 |
+
inference: true
|
76 |
+
base_model: BAAI/bge-small-en-v1.5
|
77 |
+
model-index:
|
78 |
+
- name: SetFit with BAAI/bge-small-en-v1.5
|
79 |
+
results:
|
80 |
+
- task:
|
81 |
+
type: text-classification
|
82 |
+
name: Text Classification
|
83 |
+
dataset:
|
84 |
+
name: Unknown
|
85 |
+
type: unknown
|
86 |
+
split: test
|
87 |
+
metrics:
|
88 |
+
- type: accuracy
|
89 |
+
value: 1.0
|
90 |
+
name: Accuracy
|
91 |
+
---
|
92 |
+
|
93 |
+
# SetFit with BAAI/bge-small-en-v1.5
|
94 |
+
|
95 |
+
This is a [SetFit](https://github.com/huggingface/setfit) model that can be used for Text Classification. This SetFit model uses [BAAI/bge-small-en-v1.5](https://huggingface.co/BAAI/bge-small-en-v1.5) as the Sentence Transformer embedding model. A [LogisticRegression](https://scikit-learn.org/stable/modules/generated/sklearn.linear_model.LogisticRegression.html) instance is used for classification.
|
96 |
+
|
97 |
+
The model has been trained using an efficient few-shot learning technique that involves:
|
98 |
+
|
99 |
+
1. Fine-tuning a [Sentence Transformer](https://www.sbert.net) with contrastive learning.
|
100 |
+
2. Training a classification head with features from the fine-tuned Sentence Transformer.
|
101 |
+
|
102 |
+
## Model Details
|
103 |
+
|
104 |
+
### Model Description
|
105 |
+
- **Model Type:** SetFit
|
106 |
+
- **Sentence Transformer body:** [BAAI/bge-small-en-v1.5](https://huggingface.co/BAAI/bge-small-en-v1.5)
|
107 |
+
- **Classification head:** a [LogisticRegression](https://scikit-learn.org/stable/modules/generated/sklearn.linear_model.LogisticRegression.html) instance
|
108 |
+
- **Maximum Sequence Length:** 512 tokens
|
109 |
+
- **Number of Classes:** 2 classes
|
110 |
+
<!-- - **Training Dataset:** [Unknown](https://huggingface.co/datasets/unknown) -->
|
111 |
+
<!-- - **Language:** Unknown -->
|
112 |
+
<!-- - **License:** Unknown -->
|
113 |
+
|
114 |
+
### Model Sources
|
115 |
+
|
116 |
+
- **Repository:** [SetFit on GitHub](https://github.com/huggingface/setfit)
|
117 |
+
- **Paper:** [Efficient Few-Shot Learning Without Prompts](https://arxiv.org/abs/2209.11055)
|
118 |
+
- **Blogpost:** [SetFit: Efficient Few-Shot Learning Without Prompts](https://huggingface.co/blog/setfit)
|
119 |
+
|
120 |
+
### Model Labels
|
121 |
+
| Label | Examples |
|
122 |
+
|:------|:----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|
|
123 |
+
| 0 | <ul><li>'GHt Sa [OI uco Bank\n\nvis Free Number: 180¢-193-9125 _\n\nDICGC INSURANCE UPTO 5 LAC\n\nBRANCH\n\nUCO Bank\nP NT\n(1) Consuitants are requested to note that all moneys\n\nremitted to the Bank should either be sent by Registered\nPost or handed over to the Cash Department, as no\n\n \n\nUco BANK\n\naq\n\nName\n\n"IFSC: uceaocotms\n\' dress\n\nKICK Code: 7428029504\n\nHIRAKUD\n-HIRAKED BRARCH HIRAKUS\nProae:\n\nindividual (s) outside. the Cash Department has/have JHARY EIST\nauthority to receive cash. KADAMPOLA\n(2) The account-holder should insist on delivery of Pass Book HERAKUD\n‘ made uptodate as far as possible on the same date; a 6.8%\n- otherwise he should obtain a receipt indicating when the HIRAKYD PIN .#oBlss\nPass Book will be delivered.\n(3) Deposit Rules in vogue can be obtained by account-holder TET. WaT / Asst.\nfrom the Branch on request Q28501 19027145\nPB.NG. }\n\n \n\n \n\n \n\nfe er ee me\n\n \n\x0c'</li><li>' \n\n= 2, ip\nO ~\nN 2\na\n: Y ve re ty\n) 3 x.\nNai] (F) my\n\n \n\ny Viayal chat aloala\nSH PPP ea [sys sys *\nas NB\n2\n=\n\ni x X we\na. = Xt +\n— W\nx 2| > x xv)\n— ~ wa al on\nmh a\n\nx\n@\n\n \n\nSy\n>3\nS\nak\n\n \n\n \n\n= coemeirata nani\nyy“\nxX -~|<\n. q - r " 2 e eee\n| S TTT !\n“ sa S ~\ngaysey Maye oe | toe\n\ni\'s . <4 " = : nics\n: 5 oy Sy . : aR N =\nS Sy = yy > =P OW\n, oe Q\n3 4 WK SS j 2 .\n-~ rs, , 4 i AS ~ si 6 .\nA Se S = Ce 4G ‘ tb. ee bene |\n\na\n\n \n\nes |\nTo a 3,\n-} ™ i] nest -— a Dome: eo . Sp a > Ee eh ao Ty ache oe ewe cede oe oe tee ~\n5 . “i a ( . - i -\n\n \n\n \n\x0c'</li><li>'Interest will be payable @ 24 % p.a. if the invoice is not paid within 30 days of the date of invoice.\n\nABBREVIATION: TB — Tower & Basin\nTO — Tower Only\n\n1. All taxes and duties invoiced herein are subject to revision depending upon the final assessment\n\nby the Statutory Authorities. Any such revision will be to buyer’s account.\n\n2. 
Payments should be made by A/C Payee cheque/Pay oder/bank draft/Online fund transfer\n\nthrough NEFT/RTGS platform in favour of “Paharpur Cooling Towers Ltd.”. Payment towards this\n\nbill made in any other form will be done entirely at your own risk.\n\n3. ALL DISPUTES SUBJECT TO CALCUTTA JURISDICTION ONLY.\n\x0c'</li></ul> |
|
124 |
+
| 1 | <ul><li>'. Ae - PR CSeathetn & 3)\n" J She ase 9 Pao\n\n‘s lad Bank Afr o Steppe\nIN | fave 4 fi foe & ats bent\n\nHINDALCO INDUSTRIES LIMITED\nHIRAKUD\n\nPAYMENT ORDER\n\nPayto Payment to Mr.Dilip Das\n\n|\nTravel expenses for Interview w candidate (A (Admin) J] jo. _| Cash Vr.No. Q pis | l\n\npk check he inkwes IFSC. code Emp.No/s.codeNo. _ OT Pago |\n\nby Cash/Cheque/D.D./Transfer the sum of —_Rs.13,695.00 _ _| AP.Vr.No.\nRupees Thirteen Thousand Six Hundred Ninety Five Only ———__ ; 3 ua 202 |\nDate\n\n \n\n \n\n \n\nX\n\n5\n\nee |\nain & Flight Tickets is. _ 13,195.00\nConvenience expenses Rs. — 500. 00°\n\n \n\n \n\nDetail Travel plan and tickets enclosed\n\nBank Account details also enclosed\n\n \n\n \n \n \n\nPrepared by Recommended by Endorsed by\nDate q Head- HR\n: Hirakud Complex\n\n \n \n \n\n \n \n\n \n\né y Cash 2. DAD ey ‘ZO\n(i \'y Cheque No DVPOVe Bee\n\n \n\n \n \n\nState Bank of India, Burla\nState Bank of India, Hirakud\n\nPunjab National Bank, Sambalpur [PNB-1]\nUCO Bank, Hirakud\n\nUCO Bank, Sambalpur\nIDB! , Sambaipur (IDB! -1)\nIDBI , Sambalpur (IDBI -2)\n\n \n \n \n\n \n\n \n \n\n \n\n \n \n\n \n\n \n \n \n \n \n\n \n\n \n\n \n \n\nCashier\n\n \n\n \n\nReceived Payment Charge Account Checked by\n\n \n\nSignature Signature\n\x0c'</li><li>'HINDALCO INDUSTRIES LIMITED\nHIRAKUD\n\nPAYMENT ORDER\nPay to FRakesh Gupta ; . . | 3898 BA (Q-1 2-15\n\nCash Vr.No.\n\n \n\n \n\n \n\n— - _ Emp.No./S.Code No. $-392 _\nby Cash/Cheque/D.D./Transfer the sum of a | AP vr.No. 91 355%\nRupees Four Thousand Six Hundred Only\n\n \n\n \n\n \n\n22\nDate 48-02-16\nDetails of Payment Amount\nTowards change of Battery of Vehicle No. OR-02-AM-8904\n\nas detailed below: (Bill Attached)\n(i) Bill No. 3898 Dt.19-12-2015\n\n \n\nTotal Rs. . 4,600.00\n\nPrepared by Recommended by Endorsed by Authorised by Approved by\nLanier bnwnnWenuw \\ \\ .\n\\4 = Ww \\ le\n\n\\ov Jv JI 4.) 
ee Zan”\n\nDate Dept Head Plant Head Hed - Location Head\n\n \n\n \n\nPayment made on\n(a) By Cash\n\n(b) By Cheque No.\n\n \n\n \n\nState Bank of India, Burla\n\nState Bank of india, Hirakud\n\nPunjab National Bank, Sambalpur [PNB-1]\nUCO Bank, Hirakud\n\nUCO Bank, Sambaipur\n\n{DBI , Sambalpur (IDB! -1)\n\nIDBI , Sambalpur (IDBI -2)\n\n \n\n \n\n \n\n \n\n \n\nCashier\n\nReceived Payment Charge Account Checked by\n\nSignature Signature\n\x0c'</li><li>'tT) Ce cfd\n\n \n \n \n \n \n \n \n\nADITYA BIRLA HINDALCO INDUSTRIES LIMITED\n874 HIRAKUD POWER\n\naN’ PAYMENT ORDER\n\nPP -200| - AI66\n\nCash Vr.No.\n\n \n \n \n\nAP.Vr.No._G/8Ol tT\n\nby Cash/Cheque/D.D./Transfer the sum of\nELEVEN THOUSAND FIFTY FOUR ONLY\n\n \n\nRupees\n\n \n \n \n \n\nDate:- 8.01.20\n\nENERGY CHARGES OF INTAKE CHAMBER FOR THE MONTH OF DEC 2019,BILL NO- L\n1533 2639.00\n8415.00 ~\n\n“\nTotal Total Rs. 41054.00\n\nPrepared by Recammeded by Endorsed by Authorised By Approved by\n\npu ( Nx\nHead-F&A Head - Sambalpur Cluster\nCharge Account an ou\n\n \n\n \n \n \n \n\n \n\nENERGY CHARGES OF ASH MOUND FOR THE MONTH OF DEC 2019, BILL NO-1532\n\n \n\n \n\n \n\n \n \n \n\n \n\n \n\n \n \n \n \n \n \n \n\nState Bank of india,\nState Bank of India, Buria\n\nPunjab National Bank, Sambalpur [PNB-1]\nPunjab National Bank, Kolkata {[PNB-2]\nUCO Bank, Hirakud\nUCO Bank, Sambalpur\n\n—\n\n \n \n \n \n \n\nes\neee\n\nReceived Payment Charge Account Checked by\n\n \n\nSignature Signature\n\x0c'</li></ul> |
|
125 |
+
|
126 |
+
## Evaluation
|
127 |
+
|
128 |
+
### Metrics
|
129 |
+
| Label | Accuracy |
|
130 |
+
|:--------|:---------|
|
131 |
+
| **all** | 1.0 |
|
132 |
+
|
133 |
+
## Uses
|
134 |
+
|
135 |
+
### Direct Use for Inference
|
136 |
+
|
137 |
+
First install the SetFit library:
|
138 |
+
|
139 |
+
```bash
|
140 |
+
pip install setfit
|
141 |
+
```
|
142 |
+
|
143 |
+
Then you can load this model and run inference.
|
144 |
+
|
145 |
+
```python
|
146 |
+
from setfit import SetFitModel
|
147 |
+
|
148 |
+
# Download from the 🤗 Hub
|
149 |
+
model = SetFitModel.from_pretrained("Gopal2002/CASH_AND_BANK_INVOICE")
|
150 |
+
# Run inference
|
151 |
+
preds = model("""
|
152 |
+
""")
|
153 |
+
```
|
154 |
+
|
155 |
+
<!--
|
156 |
+
### Downstream Use
|
157 |
+
|
158 |
+
*List how someone could finetune this model on their own dataset.*
|
159 |
+
-->
|
160 |
+
|
161 |
+
<!--
|
162 |
+
### Out-of-Scope Use
|
163 |
+
|
164 |
+
*List how the model may foreseeably be misused and address what users ought not to do with the model.*
|
165 |
+
-->
|
166 |
+
|
167 |
+
<!--
|
168 |
+
## Bias, Risks and Limitations
|
169 |
+
|
170 |
+
*What are the known or foreseeable issues stemming from this model? You could also flag here known failure cases or weaknesses of the model.*
|
171 |
+
-->
|
172 |
+
|
173 |
+
<!--
|
174 |
+
### Recommendations
|
175 |
+
|
176 |
+
*What are recommendations with respect to the foreseeable issues? For example, filtering explicit content.*
|
177 |
+
-->
|
178 |
+
|
179 |
+
## Training Details
|
180 |
+
|
181 |
+
### Training Set Metrics
|
182 |
+
| Training set | Min | Median | Max |
|
183 |
+
|:-------------|:----|:---------|:-----|
|
184 |
+
| Word count | 1 | 201.2534 | 4241 |
|
185 |
+
|
186 |
+
| Label | Training Sample Count |
|
187 |
+
|:------|:----------------------|
|
188 |
+
| 0 | 113 |
|
189 |
+
| 1 | 33 |
|
190 |
+
|
191 |
+
### Training Hyperparameters
|
192 |
+
- batch_size: (32, 32)
|
193 |
+
- num_epochs: (2, 2)
|
194 |
+
- max_steps: -1
|
195 |
+
- sampling_strategy: oversampling
|
196 |
+
- body_learning_rate: (2e-05, 1e-05)
|
197 |
+
- head_learning_rate: 0.01
|
198 |
+
- loss: CosineSimilarityLoss
|
199 |
+
- distance_metric: cosine_distance
|
200 |
+
- margin: 0.25
|
201 |
+
- end_to_end: False
|
202 |
+
- use_amp: False
|
203 |
+
- warmup_proportion: 0.1
|
204 |
+
- seed: 42
|
205 |
+
- eval_max_steps: -1
|
206 |
+
- load_best_model_at_end: False
|
207 |
+
|
208 |
+
### Training Results
|
209 |
+
| Epoch | Step | Training Loss | Validation Loss |
|
210 |
+
|:------:|:----:|:-------------:|:---------------:|
|
211 |
+
| 0.0023 | 1 | 0.3054 | - |
|
212 |
+
| 0.1142 | 50 | 0.1162 | - |
|
213 |
+
| 0.2283 | 100 | 0.0043 | - |
|
214 |
+
| 0.3425 | 150 | 0.0015 | - |
|
215 |
+
| 0.4566 | 200 | 0.0014 | - |
|
216 |
+
| 0.5708 | 250 | 0.0008 | - |
|
217 |
+
| 0.6849 | 300 | 0.0013 | - |
|
218 |
+
| 0.7991 | 350 | 0.001 | - |
|
219 |
+
| 0.9132 | 400 | 0.0004 | - |
|
220 |
+
| 1.0274 | 450 | 0.0008 | - |
|
221 |
+
| 1.1416 | 500 | 0.0008 | - |
|
222 |
+
| 1.2557 | 550 | 0.0011 | - |
|
223 |
+
| 1.3699 | 600 | 0.0008 | - |
|
224 |
+
| 1.4840 | 650 | 0.0007 | - |
|
225 |
+
| 1.5982 | 700 | 0.0005 | - |
|
226 |
+
| 1.7123 | 750 | 0.0005 | - |
|
227 |
+
| 1.8265 | 800 | 0.0007 | - |
|
228 |
+
| 1.9406 | 850 | 0.0005 | - |
|
229 |
+
|
230 |
+
### Framework Versions
|
231 |
+
- Python: 3.10.12
|
232 |
+
- SetFit: 1.0.3
|
233 |
+
- Sentence Transformers: 2.2.2
|
234 |
+
- Transformers: 4.35.2
|
235 |
+
- PyTorch: 2.1.0+cu121
|
236 |
+
- Datasets: 2.16.1
|
237 |
+
- Tokenizers: 0.15.0
|
238 |
+
|
239 |
+
## Citation
|
240 |
+
|
241 |
+
### BibTeX
|
242 |
+
```bibtex
|
243 |
+
@article{https://doi.org/10.48550/arxiv.2209.11055,
|
244 |
+
doi = {10.48550/ARXIV.2209.11055},
|
245 |
+
url = {https://arxiv.org/abs/2209.11055},
|
246 |
+
author = {Tunstall, Lewis and Reimers, Nils and Jo, Unso Eun Seo and Bates, Luke and Korat, Daniel and Wasserblat, Moshe and Pereg, Oren},
|
247 |
+
keywords = {Computation and Language (cs.CL), FOS: Computer and information sciences, FOS: Computer and information sciences},
|
248 |
+
title = {Efficient Few-Shot Learning Without Prompts},
|
249 |
+
publisher = {arXiv},
|
250 |
+
year = {2022},
|
251 |
+
copyright = {Creative Commons Attribution 4.0 International}
|
252 |
+
}
|
253 |
+
```
|
254 |
+
|
255 |
+
<!--
|
256 |
+
## Glossary
|
257 |
+
|
258 |
+
*Clearly define terms in order to be accessible across audiences.*
|
259 |
+
-->
|
260 |
+
|
261 |
+
<!--
|
262 |
+
## Model Card Authors
|
263 |
+
|
264 |
+
*Lists the people who create the model card, providing recognition and accountability for the detailed work that goes into its construction.*
|
265 |
+
-->
|
266 |
+
|
267 |
+
<!--
|
268 |
+
## Model Card Contact
|
269 |
+
|
270 |
+
*Provides a way for people who have updates to the Model Card, suggestions, or questions, to contact the Model Card authors.*
|
271 |
+
-->
|
config.json
ADDED
@@ -0,0 +1,31 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "/root/.cache/torch/sentence_transformers/BAAI_bge-small-en-v1.5/",
|
3 |
+
"architectures": [
|
4 |
+
"BertModel"
|
5 |
+
],
|
6 |
+
"attention_probs_dropout_prob": 0.1,
|
7 |
+
"classifier_dropout": null,
|
8 |
+
"hidden_act": "gelu",
|
9 |
+
"hidden_dropout_prob": 0.1,
|
10 |
+
"hidden_size": 384,
|
11 |
+
"id2label": {
|
12 |
+
"0": "LABEL_0"
|
13 |
+
},
|
14 |
+
"initializer_range": 0.02,
|
15 |
+
"intermediate_size": 1536,
|
16 |
+
"label2id": {
|
17 |
+
"LABEL_0": 0
|
18 |
+
},
|
19 |
+
"layer_norm_eps": 1e-12,
|
20 |
+
"max_position_embeddings": 512,
|
21 |
+
"model_type": "bert",
|
22 |
+
"num_attention_heads": 12,
|
23 |
+
"num_hidden_layers": 12,
|
24 |
+
"pad_token_id": 0,
|
25 |
+
"position_embedding_type": "absolute",
|
26 |
+
"torch_dtype": "float32",
|
27 |
+
"transformers_version": "4.35.2",
|
28 |
+
"type_vocab_size": 2,
|
29 |
+
"use_cache": true,
|
30 |
+
"vocab_size": 30522
|
31 |
+
}
|
config_sentence_transformers.json
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"__version__": {
|
3 |
+
"sentence_transformers": "2.2.2",
|
4 |
+
"transformers": "4.28.1",
|
5 |
+
"pytorch": "1.13.0+cu117"
|
6 |
+
}
|
7 |
+
}
|
config_setfit.json
ADDED
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"labels": null,
|
3 |
+
"normalize_embeddings": false
|
4 |
+
}
|
model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a6683dd2051987c3c781a36af15c03ffb0f2fb2d9170ed99e531670496105824
|
3 |
+
size 133462128
|
model_head.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd82f3cf5a9430bb8bf5eef6aff9d54d4beab3926df499e2f3692a3fb2e0480c
|
3 |
+
size 3919
|
modules.json
ADDED
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"idx": 0,
|
4 |
+
"name": "0",
|
5 |
+
"path": "",
|
6 |
+
"type": "sentence_transformers.models.Transformer"
|
7 |
+
},
|
8 |
+
{
|
9 |
+
"idx": 1,
|
10 |
+
"name": "1",
|
11 |
+
"path": "1_Pooling",
|
12 |
+
"type": "sentence_transformers.models.Pooling"
|
13 |
+
},
|
14 |
+
{
|
15 |
+
"idx": 2,
|
16 |
+
"name": "2",
|
17 |
+
"path": "2_Normalize",
|
18 |
+
"type": "sentence_transformers.models.Normalize"
|
19 |
+
}
|
20 |
+
]
|
sentence_bert_config.json
ADDED
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"max_seq_length": 512,
|
3 |
+
"do_lower_case": true
|
4 |
+
}
|
special_tokens_map.json
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"cls_token": "[CLS]",
|
3 |
+
"mask_token": "[MASK]",
|
4 |
+
"pad_token": "[PAD]",
|
5 |
+
"sep_token": "[SEP]",
|
6 |
+
"unk_token": "[UNK]"
|
7 |
+
}
|
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer_config.json
ADDED
@@ -0,0 +1,57 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"added_tokens_decoder": {
|
3 |
+
"0": {
|
4 |
+
"content": "[PAD]",
|
5 |
+
"lstrip": false,
|
6 |
+
"normalized": false,
|
7 |
+
"rstrip": false,
|
8 |
+
"single_word": false,
|
9 |
+
"special": true
|
10 |
+
},
|
11 |
+
"100": {
|
12 |
+
"content": "[UNK]",
|
13 |
+
"lstrip": false,
|
14 |
+
"normalized": false,
|
15 |
+
"rstrip": false,
|
16 |
+
"single_word": false,
|
17 |
+
"special": true
|
18 |
+
},
|
19 |
+
"101": {
|
20 |
+
"content": "[CLS]",
|
21 |
+
"lstrip": false,
|
22 |
+
"normalized": false,
|
23 |
+
"rstrip": false,
|
24 |
+
"single_word": false,
|
25 |
+
"special": true
|
26 |
+
},
|
27 |
+
"102": {
|
28 |
+
"content": "[SEP]",
|
29 |
+
"lstrip": false,
|
30 |
+
"normalized": false,
|
31 |
+
"rstrip": false,
|
32 |
+
"single_word": false,
|
33 |
+
"special": true
|
34 |
+
},
|
35 |
+
"103": {
|
36 |
+
"content": "[MASK]",
|
37 |
+
"lstrip": false,
|
38 |
+
"normalized": false,
|
39 |
+
"rstrip": false,
|
40 |
+
"single_word": false,
|
41 |
+
"special": true
|
42 |
+
}
|
43 |
+
},
|
44 |
+
"clean_up_tokenization_spaces": true,
|
45 |
+
"cls_token": "[CLS]",
|
46 |
+
"do_basic_tokenize": true,
|
47 |
+
"do_lower_case": true,
|
48 |
+
"mask_token": "[MASK]",
|
49 |
+
"model_max_length": 512,
|
50 |
+
"never_split": null,
|
51 |
+
"pad_token": "[PAD]",
|
52 |
+
"sep_token": "[SEP]",
|
53 |
+
"strip_accents": null,
|
54 |
+
"tokenize_chinese_chars": true,
|
55 |
+
"tokenizer_class": "BertTokenizer",
|
56 |
+
"unk_token": "[UNK]"
|
57 |
+
}
|
vocab.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|