Gopal2002 committed on
Commit
2a626bc
1 Parent(s): 9ecd0fd

Push model using huggingface_hub.

1_Pooling/config.json ADDED
@@ -0,0 +1,7 @@
+ {
+   "word_embedding_dimension": 384,
+   "pooling_mode_cls_token": true,
+   "pooling_mode_mean_tokens": false,
+   "pooling_mode_max_tokens": false,
+   "pooling_mode_mean_sqrt_len_tokens": false
+ }
README.md ADDED
@@ -0,0 +1,358 @@
+ ---
+ library_name: setfit
+ tags:
+ - setfit
+ - sentence-transformers
+ - text-classification
+ - generated_from_setfit_trainer
+ metrics:
+ - accuracy
+ widget:
11
+ - text: "* 04 Hindalco Industries Ltd\nHirkaud Smelter Stores\n\n \n\n* Service Recei\
12
+ \ ot\nBUYER _ Lp / GATE ENRTY NO:\noe ADL D vA /2/0A\nRECEIPT DATE: 04-MAR-22\
13
+ \ ATU\" ! : 1-SAMBALPUR\nUNIQUE ENTERPRISES ad ZL POL CPi pg 6 ee Q/748/2022\n\
14
+ ASS Cer ag fe oO\nos \" -\n\n \n \n \n\nORG CODE:\n\nBOE NO:\nBOE DATE:\ncut\n\
15
+ \n \n\nTT\n\nWAY BILL AIRBILL NO\n\nPo\nSoe\nDATE:\n\nTOTAL RECEIVED 21074.8 Nes\
16
+ \ REMARKS/REFERENCE: | SUPPLY FOR PAINTING\nAMOUNT INCL TAX Reverse Charge: No\
17
+ \ ~\n\nINR) : Tax Point Basis : INVOICE\n\nPO Description SUPPLY FOR PAINTER FOR\
18
+ \ 85KA EMD\n\n \n\n \n \n \n\n \n \n \n \n\n \n \n \n\n\
19
+ \ \n \n \n \n\n \n \n \n\n \n \n\nLOCATOR\nShelf Life\nCONTROL\n\n\
20
+ QUANTITY:\nCHALAN/INVOICE\nRECEIVED\n\nQUANTITY:\nACCEPTED\nREJECTED\n\n \n\n\
21
+ \ \n\n \n \n\nITEM CODE DESCRIPTION HSN / SAC\nPR NUMBER SUB INVENTORY\
22
+ \ CODE\n\nPO NO. BU/cost Center/ Account Code along with GL ACCOUNT\n\nREQUESTER\
23
+ \ CODE\n\nNote to receiver\n\n1 - 801015110326 - HIRE: MANPOWER, SKILLED;RATE\
24
+ \ TYP:STANDARD, : MANDAY\nLVL/DSGNTN:PAINTER\n\n[=] = b07-\n\nS/PO/SRV/2122/054\n\
25
+ 2\n\n- Sekhar, Mr.\nChandra Makthala\n\n \n \n\n: No Control\n\n \n \n\n\
26
+ \ \n \n \n\n- 3711.204.910103.50803112.9999.9999.9999.9999.9999\n- Hirakud\
27
+ \ Smelter Plant.Aluminium Smelter.Electrical.Repairs to\nMachinery- Electrical.Default.Default.Default.Default.\
28
+ \ Default\n\nP ruchasuil dG ~L— gw\n\n \n\n4atos- OF + 2622. .e, oer |\nPREPARER\
29
+ \ SECTION HEAD / INSPECTOR SECTION HEAD /\nSTORES KEEPER AREA HEAD -RECEIVING\
30
+ \ AREA HEAD — CUSTODY & ISSUE\nor\n\nals\n\f"
31
+ - text: " \n\n \n\nDELIVERY CHALLAN ~ Phone : (0891) 2577077 |\nALUFLUORIDE LIMITED\n\
32
+ MULAGADA VILLAGE, MINDHI POST,\nVISAKHAPATNAM - 530 012 |\n\n \n\n \n\n \n\n \n\
33
+ \n \n\n \n\n \n\n \n\n \n\nDc Nox: g22 - - : ; “Date 02-02-2016\n| HINDALCO INDUSTRIES\
34
+ \ LTD HIRAKUD\nSAMBALPUR\nODISHA\nPIN CODE: 768016\nYour Order No: ~HKDRM/1516/0001\
35
+ \ DT: 01/04/2015\nReceived the below mentioned in good condition. Carrier No:\
36
+ \ AP 16 TC 9339\n—SI.No | ~~ PARTICULARS” | Qty. | Rate / MT\n: = | ae\n: 7\n\
37
+ ALUMINIUM FLUORIDE . | 21.000 | ; sbatS\n|\n420 BagsX 50.120 kg. = 21.0504 MT\
38
+ \ |\nWeight of Emppty Bags:& Liners: 0.050 MT\nSoa Net Weight of Material: ~ 21.000\
39
+ \ ~MT\nInvoice No.: 822 Date 02-02-2016\"\nAPVAT TIN : 37900106541 Dt: 02.06.2014\
40
+ \ CST No.: 37900106541 Dt: 02.06.2014\nReceiver's Signature Signature\n\n \n\f"
41
+ - text: " \n\n \n\n \n\n \n\n \n\n \n\n| rad nas Bi Tiapz Ke en\nap | pa\
42
+ \ ape EE By EY ED ITT? ON matte / ON moray |\nP| airing swodanraa boc pia oe ne\
43
+ \ ed ee v , 4\n! e i ma | VeACLA Baus §uOQ souBisua¢ of\n| “P io | . [ | seBieUo\
44
+ \ IS | wal VY | Loo abi +A Buipe spun |\n| | fe) De [ nl oman «| OE U :\nmS, (Spe\
45
+ \ fb) to ae\n| eo Ss | | Pepe (GEOUVHO | GE SOF ae\nE 4 ’ : E sapesecascnsctute\
46
+ \ saps Ln + ad et an\nme | | a | es ' | xR Uag ob iw aa ae 32\n' a a] i as aN\
47
+ \ Ne paneer\nRe is pad on\n| ee | Sel Nmd Oe oy ld,\n| ix | ; | ‘lwnov L PP. ‘dg\
48
+ \ py\n| . Pe eh\n\n \n\nmo sory oR! wor,\n\nou d&- ane eer\n\n: \"ORL\n\n \n\
49
+ \ \n\n \n\n‘PO 0Es - “ay Sink /BUSIA,\n‘eyemfes eipug weayediueaewueyepsd JeaK\n\
50
+ \"UINYD BPISGG SE-’-S7Z ON 100G\n\nBu. NOUMIS BNDIOOS\n\ney\nWeve! se\n\n \n\n\
51
+ \ \n\nhceaitbaaor re\n\n! AMoaAM\n\n \n\n \n\n> tewe-3™\n\noy eee\n\nY3WOISH)\
52
+ \ Ad GAUNSNI SI ODUYO\n— MSIH S.HSNMO LY\n\nAdOD HONDIS. NOD\n\nene os roarans\n\
53
+ \n \n\nKINO NOMIC unr\n\nWaalarad Ta soz - ‘Sn\n\n \n\n- “eu = 3 re\n\neagaee\n\
54
+ \nGY oe Ae\n\nBA OFT OVI\nfoe, 17 :\n\n“OL\n\n \n\nivan OL.Givs) NOiAIOSaa\n\
55
+ \n \n\neT ea ‘ON aGOW\n\n \n\n \n\n(sour g) 9292 94924 920P : 181 600 OOF\
56
+ \ - IVAW angus Wi0l <\n‘OVOY OTIS .G 'Zy “.BSNOH X3dINI PVHIA. ¢°O\"H\n\n? tAd\
57
+ \ LHOdSNU 4! 88909 LVENS\n\n-_ wd\nfe\n\n»\n\f"
58
+ - text: "SOT Ue\n\n \n\n \n\noH\n\n| ia\n\nI\nod\n\nHi\n\na\n\n|\nTo) Sig\
59
+ \ Pere\na\n\nal |g\n&%\n5)\n\nwS\\\neB\nSB\n“5\n“O\nS\n€X\n\nBea\n\nem\n\nPe eS\n\
60
+ \nse aE a\n\n4 |] | tat [ety\n\ntt pe Ta\n&\na\n\nOK\n\n¢\n\nSRLS ia Leh coe\n\
61
+ \n \n \n\f"
62
+ - text: " \n \n \n \n\nAUSEOOUSRGSEEENSSRCESRORROGS\n\nMise oaeta\nMis tnaes Lo\
63
+ \ Q) duty at col ane\n\nDate 12.8820\n‘Stra Bort as Corry Ub 2.\n\nexeauscscotecne:\
64
+ \ aneasese\n\nMm. €.M. NBUSTRIES\n\nAn ISO 9001 : 2008 COMPANY\n\n“PODDAR COURT\"\
65
+ , Phones : 2235 2096 / 3985 2494 Lo Wi. TEE OLL, a¥ahe Package Ae 2\natadiee Fax\
66
+ \ 033-2235 1868\n\nE-mail : cables@memindustries.com Tame Ahr SLM, Freight eng\n\
67
+ \n \n\nRaut WAR OKA O Van weg 9 at ai sl age Reve\nCorny u. )\n\nGABLES ARE\
68
+ \ IN GUR CONTROL\n\nFrease sign & return VAT No. : 19570720098 e TIN/ CST No.\
69
+ \ : 19570720292\n—~ = Office : 55, Ezra Street, 2nd Floor, Kolkata - 700 001\n\
70
+ \f"
+ pipeline_tag: text-classification
+ inference: true
+ base_model: BAAI/bge-small-en-v1.5
+ model-index:
+ - name: SetFit with BAAI/bge-small-en-v1.5
+   results:
+   - task:
+       type: text-classification
+       name: Text Classification
+     dataset:
+       name: Unknown
+       type: unknown
+       split: test
+     metrics:
+     - type: accuracy
+       value: 1.0
+       name: Accuracy
+ ---
+
+ # SetFit with BAAI/bge-small-en-v1.5
+
+ This is a [SetFit](https://github.com/huggingface/setfit) model that can be used for Text Classification. This SetFit model uses [BAAI/bge-small-en-v1.5](https://huggingface.co/BAAI/bge-small-en-v1.5) as the Sentence Transformer embedding model. A [LogisticRegression](https://scikit-learn.org/stable/modules/generated/sklearn.linear_model.LogisticRegression.html) instance is used for classification.
+
+ The model has been trained using an efficient few-shot learning technique that involves:
+
+ 1. Fine-tuning a [Sentence Transformer](https://www.sbert.net) with contrastive learning.
+ 2. Training a classification head with features from the fine-tuned Sentence Transformer.
+
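+ A minimal sketch of that two-step procedure with the `setfit` `Trainer` API (the two-row dataset below is a made-up placeholder, not this model's training data):
+
+ ```python
+ from datasets import Dataset
+ from setfit import SetFitModel, Trainer, TrainingArguments
+
+ # Hypothetical labelled examples; substitute your own texts.
+ train_ds = Dataset.from_dict({
+     "text": ["OCR text of a material receipt report", "OCR text of some other document"],
+     "label": [1, 0],
+ })
+
+ model = SetFitModel.from_pretrained("BAAI/bge-small-en-v1.5")
+ args = TrainingArguments(batch_size=32, num_epochs=2)
+
+ trainer = Trainer(model=model, args=args, train_dataset=train_ds)
+ trainer.train()  # step 1: contrastive fine-tuning of the body; step 2: fitting the LogisticRegression head
+ ```
+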
+ ## Model Details
+
+ ### Model Description
+ - **Model Type:** SetFit
+ - **Sentence Transformer body:** [BAAI/bge-small-en-v1.5](https://huggingface.co/BAAI/bge-small-en-v1.5)
+ - **Classification head:** a [LogisticRegression](https://scikit-learn.org/stable/modules/generated/sklearn.linear_model.LogisticRegression.html) instance
+ - **Maximum Sequence Length:** 512 tokens
+ - **Number of Classes:** 2 classes
+ <!-- - **Training Dataset:** [Unknown](https://huggingface.co/datasets/unknown) -->
+ <!-- - **Language:** Unknown -->
+ <!-- - **License:** Unknown -->
+
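+ These properties can be checked on a downloaded copy, assuming the standard `model_body` / `model_head` attributes of a `SetFitModel` (a quick sanity-check sketch, not part of the original card):
+
+ ```python
+ from setfit import SetFitModel
+
+ model = SetFitModel.from_pretrained("Gopal2002/Material_Receipt_Report_ZEON")
+ print(model.model_body.get_sentence_embedding_dimension())  # 384
+ print(model.model_body.max_seq_length)                      # 512
+ print(type(model.model_head).__name__)                      # LogisticRegression
+ ```
+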
+ ### Model Sources
+
+ - **Repository:** [SetFit on GitHub](https://github.com/huggingface/setfit)
+ - **Paper:** [Efficient Few-Shot Learning Without Prompts](https://arxiv.org/abs/2209.11055)
+ - **Blogpost:** [SetFit: Efficient Few-Shot Learning Without Prompts](https://huggingface.co/blog/setfit)
+
+ ### Model Labels
+ | Label | Examples |
+ |:------|:---------|
120
+ | 0 | <ul><li>'_\ni.\nSe\nNew\n~~\ned\nTy\nSw\nNe\nNw\ned\n2:\n\n \n\x0c'</li><li>'ne.\n\n \n \n\n \n \n\n \n\nbBo fy20 5 ‘ )\n- wi Pas BOOKING STATION\nstat” SURAT GEIS TRA: BSPORT HOT. LTE, DIMPLE COURT, 2ND FLOOR,\n<ESEE> H.O.: “VIRAJ IMPEX HOUSE”, 47, D\' M= -toRoaD, + AT_OW. ER’S RISK oer\n\' , a” MUMBAI - 400 009 Tel. : 4076 7676 sianan Gece i al CARGO iS INSUR BY CUSTOMER — PH, : 033-30821697, 22\n{ 1. Consignor’s Name & Address As. ExOme peas Br. Code\ndT ncuer\n| acai denn EE Motie iho. ;\n| Weal © Gab TES 1 eensests Uasansensssssseonsenoereneorsenvenesnneasy\n\n\' 2.Cons ignce Bai:x’s Names wl ke iy at < CoO ale ysien b> € (to!\n\n“Litsakuod smalter f eat Lireatéuel Bor oa thin ~ behets ___\n\n \n\n|\n| %\n| on Sen Me te INS a sna iene tl er sues EES _KM__\nat i ag Se are ~ 7 oo 2 ne\n\'| L. US | - 1265 . - HY f Y -ataucl =\nate OF _ QESCHIPTION (SAIC TD ee wy ss _ WEIGHT at GATE PY 2 FRGH GH\neer . | we Re, ?. i\n\n| UFG Re Matta PS RO [aa =r 52 fences\nwe by “Matrtale O%, EFT Gora), ed\n\nhr\n\niia Sa ea eterna eas ean a\n\n \n\n \n\nTin Me a! pene __ aod i osem ge Wleg\n\' Lone CHARS 4 Hanne oe | 5 & ;\nt—- cee eee a = _ Ss Reece!\n| hig © pap Loading by 7S TAP ut. Crarges fon = aw\ntal | 7 “a eet ci a" or a — © =\n\nfree = w JBODs C } se ren st tet , Re 1 SURAT GOODS TRANSPORT VTALTD. * *\n\nTruck No. / Trailer No. : Capacity __\n\nscreens: eat BY SoH BUNS hs BENESME Pp\n\n \n\n \n\n \n\n. Lo\n\nAeookutd Clerk\n\n \n\x0c'</li><li>'J o\nALL DISPUTES SUBJECT TO KOLKATA JURISDICTION @ : 2236 6735\n\n"os Mobile : 98300 08461\n-*, _ TAXINVOICE RIG UYER\'\n\nUNITED ENTERPRISES\n\n— = Deals in : TARPAULIN, POLYTHENE, HDPE FABRIC, COTTON CLOTH,\nHESSIAN, GRANULES & GENERAL ORDER SUPPLIERS\n\n3, Amartalla Lane, Kolkata - 700 001 ~ 3 MAY 2Ui5\n\n \n \n \n\nws. HlinPAL so Taposreics Limireep | BN. bf LSS nnn\nDato......1 Sf94. LA csanscsonss\n\nSOD LSA LARS Bn Tee. Chalian No.....1.6. AS: ~(§\nDist: caumpac pon Opis HAD Date ....... LOfoy Iss sessssessseee\n\nCC OSECCLETTTECOETSSOECOHH TS ETTSSEOTHAU HE HOVER SHEUMOSECEDSOUCODESCODECE ODI SMousON RE RED\n\nBayar YATIEST No. BSS. za BIG san\n\n \n \n \n \n\n \n\n \n\nCAP TCT o Ce ERE veTe Darden vavoryDEETOeseeEDOOTEEDE\n\nRupees inwords .N.| why Fou These —\nmA YS..ntL ard cl\n\nVat No. 19511424085 dt. 20/3/08\nC.S.T. No. 19511424289 dt. 20/3/06\n\n \n \n \n \n\x0c'</li></ul> |
121
+ | 1 | <ul><li>"Posatis ils. H\n\n \n\niS\nvs\na (uf\n\noe\n\n \n\n-\n\n \n\nSarichor Pls: q\n\nPea :\n\nITEM /\n\n1. Description/ Received Reject Delivered Retur\n\n \n \n\nSPARE TX. Phat\n\n(MARKETED BY MESAPD\n\nPact eta\n\n \n\nMATERIAL RECEIPT REPORT\n\n \n\n \n \n \n\n \n\nCUM nea\n\n00 LeTlooo 0.000\n\nPAS\n\n \n \n\nELT\n\nJUPLICATE FOR TRANSPORTE?-\nOGPY (EMGISE INVOICE) RECEIVED\n\nMite ariant Eee\n\nPRAM MUIMAFE RCL RE\n\n \n\n \n\nFrys\n\n \n\not\n\nSuds oT\n\n \n \n\npeas\n\nee ase\n\n. Tax Gelig\n\nGrand Tooke\n\ni\n\nRM\n\nRate/Unit\n\nMRR SUBMITTED\nwv\n\nITH PARTY'S INVIGCE\n\nEET RY MO SSO OT Soe ELS\n\nLS.\n\n \n\n \n\n \n\nWee\n\n7; Ae 18\n\nTrcic\n\ni\nSu\n\n~s\n\n“en\n\nnny\n\x0c"</li><li>"«= ITER /\ncit BDescription/ Received\n\nms\n\n \n \n\n \n\nIces\n\ne to\n\ntea tae\n\nhoimeryh bea\n\nPorccheninernyh Qerkees\n\nRican dec\n\nrarer:\n\nPAD RP eAR eR\n\nMeare\n\n \n\nMATERIAL RECEIPT\n\n \n\nREPORT\n\n \n\nwe ie 7\nhe\n\nSeba.\nbh ETS\n\n \n\nReject Delivered Retur\n\nTESLA y’\n\n \n\n \n\n \n\nLF PIE\n\nTAIT a\n\nSUPLICATE FOR TRANSPORTER\nOGPY (EXGISE INVOICE) RECEIVED\n\noy\n\nf\n\n“soarewe Pk Beak\nree\n\nRAF |\n\n \n\nep oe:\n\nPATE\n\nenc\n\n \n\nMarat\nmw LA\n\n \n \n\nNeneh cat\n\nMRR SUBMITTED\n\\AITH PARTY'S INVIOCE\n\nvee oat\n\nPO Mea PEC SPR AL?\nPi Davtess Bech.\naS OMMOL\n\nRate/Unit\n\nouts 8\n\nI.\n\nfity ¥\n\n \n\n \n\n \n\n \n\nValue\niRise. }\n\n \n\nhare\n\nfMats Terkalis\n\nCaw Wa\n\nresid\n\nTera l.\n\nHae\n\n \n\nEVheres\n\n \n\n \n\nLrpechaarcies\n\nih\n\nAaB\n\n \n\noa,\n\n_\n\na\n\n_ alls\n\x0c"</li><li>'| ie\n\n \n \n \n \n\n \n\ntn eee i he _#\nTrivveiece Dae oo og OF\n1 Cxors d arimeant hoo &\n\nLearner: £ DA ted\n\n \n \n \n \n \n\n \n\nae ‘Beam teas” 8 GIR-sae? DY .mada 18 & GTR BBse “DT.13.1.38 GENO, S388\n4, Mandar Meum 2 DTV2.2.18 & G.E.NMO.S164 DT. LSeud. Le INV.NO.G5¥=1 71.8-EM-O1BS\nExcess a » DT.?.L.18 :\nSUMAM IND-AGRO SALES PYT. LTD.\n7 i\n(Te Quantity-—----—----— Value\nCAL) sence me i ee et “Received Reject Delivered: en ag ne tec enw\n\nLOCATION\n\nat\nSat OD\n\nROLFES7 5.\n\n \n\nAES FORCE | EXTRACT I,\n\non ie.\n\nDs so17Eave. au\n“6 OMELETTE MOTORISED\n\nhs norzasra 2.000\nCOMPLETE MOTORISED\n\n| GLOBE VALVE\n\nOO PATERIAL~OAS1. SIZE\n\n \n\nest AF 18 BO LEXS\nreli\n\n» COMPLETE MOM PETUBM VaLVr\na VTE TAL -- CAS d. a SIZE SOME,\n\nVALME\ney hai: Pu. WABI SIZE .\n\nALE\nTAMOHIMG TYRE.\n—LOONE ,\n\n \n\nMRR SUBMITTED -\n\n‘MATERIAL RECEIPT + REPORT -_ WITH PARTY S. INVIOCE |\n\neneeiae me\neden\n\n: “RRR Reece i at Pig\n, MARA Re ced pt Dahes\n\nPTY SPRY i Fibs\nOF -FER-LS\n\nv9\nore\n\nPO phos\n\nPEC SFRY v8 Ore\nFO Thahes\n\nOL AU?\n\n-#\n\n9.000 3.600 EET a OK 1SE460. ‘ OO a\n\nNMOS LST Tae oe PEGE IO pS\n860\nON-4as RELIVERY DATE es\nLaF EE 8 Srctual Tax Vailue 4922.20. ;\nOILST. ATTY “CO ; Stabs Torhals LoS\n\n2900\n\nSn encewn es bovese es an be neeven os ones ntES Oe pts wt 90H On eden ov ET Om aUReeR ones Mt eretereneneesa stoner mint o>\n\nOu OK)\nGTs--\n““LEOME,, 800\nDELIVERY DATE\n© Date FETE 1\n\nLE OOOD 00\nIGST Taxaiex\n\n -3ROOGO JOD\n\n- 6BA00.00 |\n\nPEI:\n\na\na\n\nfaz tua dL. Tax MaiLure E8400. 00.\n\nDIST. OTYVEC\n2.000\n\n2,000 oO\npene\n\nste os evenen enan en enetan ue saareberernestenereens eueaan ane ed ateras ony wReniboens mnotvnes cesumewtneey\n\n0.000\nTYRE\n\nnw CHD. BL OOO o OD\n\nABO . OO\nIGST Tax@iex\n\n75600. oe\n\nLOOODELUVERY DATE\n\noo Pe LASS. END CCOMMEDTION - BUTT 2a-FEERIS Actual Tax Value s FBO « 00\nPS. WELD. | . senpoeapcinatimane licleshicisunanpatal fe sini\nkG 2 BIST. 
OTY-/CC Suh Terkale 4PEGOO 00\nSat ya 8h Be KOCH. aetctemnneeetenectnimetnnnngeeeren tienen manent eneeremencinessirnatibioe\n\nmy\n(TW beeeninenminnien casein annnsnene sae wonenaennnnntnnneennneenunedenennineneneniannnecnenucntannennnniennacuccnannpaansuneaancinnnnnennnn nn aeeseanininc\nTN | Grand Total — LAO7F S82. 80\n-~ | SUPLICATE FOR TRANSPORTER : eo\n\n \n\n7 senvecauvenenen eqs quanvernsemn seesmaneseseneasnen amen etetenanenacesense eves anne ne on enemies ests\n\n \n \n\n“Pa ane a: of 2\n\n \n\n \n\noi eoeneens ater et et ote neat eegtas ent cege antes enewen ten mes eeenme webeei anemone anetes eran en seeeaterarts dat aneneree spans cums ct maretenen et seeterieen ment te et arereratet srereveneias cosesnesescipsenaceeie sncbntensuseeeth pesasemmeccnsnsaunsier sees lenses\n\nA ym\n\naren ra nit i\n\nee\n\ni\n\nnoe en Sep eet St ee\n\nagai e teoncrescs 7 aS\n\naaa Se Ss:\n\ncote\n\nco hegiecssoscse\n\nsenalt\n\naa\n\nJI J FF JF JF DF JD\n\nee\n\nee\n\n \n\nKoy\n\nwy \\\nae “ r\n\\\n\nZ\n\n \n\x0c'</li></ul> |
+
+ ## Evaluation
+
+ ### Metrics
+ | Label | Accuracy |
+ |:--------|:---------|
+ | **all** | 1.0 |
+
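+ The accuracy above is computed on the (unpublished) test split. A rough sketch of how such a score could be checked, using hypothetical held-out texts in place of the real split:
+
+ ```python
+ from setfit import SetFitModel
+
+ model = SetFitModel.from_pretrained("Gopal2002/Material_Receipt_Report_ZEON")
+
+ # Hypothetical held-out examples; the actual test split is not published.
+ test_texts = ["OCR text of a material receipt report", "OCR text of an unrelated delivery challan"]
+ test_labels = [1, 0]
+
+ preds = model.predict(test_texts)
+ accuracy = sum(int(p) == y for p, y in zip(preds, test_labels)) / len(test_labels)
+ print(accuracy)
+ ```
+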
+ ## Uses
+
+ ### Direct Use for Inference
+
+ First install the SetFit library:
+
+ ```bash
+ pip install setfit
+ ```
+
+ Then you can load this model and run inference.
+
+ ```python
+ from setfit import SetFitModel
+
+ # Download from the 🤗 Hub
+ model = SetFitModel.from_pretrained("Gopal2002/Material_Receipt_Report_ZEON")
+ # Run inference
+ preds = model("SOT Ue
+
+
+
+
+
+ oH
+
+ | ia
+
+ I
+ od
+
+ Hi
+
+ a
+
+ |
+ To) Sig Pere
+ a
+
+ al |g
+ &%
+ 5)
+
+ wS\
+ eB
+ SB
+ “5
+ “O
+ S
+ €X
+
+ Bea
+
+ em
+
+ Pe eS
+
+ se aE a
+
+ 4 |] | tat [ety
+
+ tt pe Ta
+ &
+ a
+
+ OK
+
+ ¢
+
+ SRLS ia Leh coe
+
+
+
+ ")
+ ```
+
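+ Beyond hard labels, the classifier head can also return class probabilities, assuming the standard `predict_proba` method of recent `setfit` releases (illustrative values only):
+
+ ```python
+ probs = model.predict_proba(["<OCR text of a scanned document>"])
+ print(probs)  # e.g. tensor([[0.02, 0.98]]); columns typically follow the label order 0, 1
+ ```
+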
+ <!--
+ ### Downstream Use
+
+ *List how someone could finetune this model on their own dataset.*
+ -->
+
+ <!--
+ ### Out-of-Scope Use
+
+ *List how the model may foreseeably be misused and address what users ought not to do with the model.*
+ -->
+
+ <!--
+ ## Bias, Risks and Limitations
+
+ *What are the known or foreseeable issues stemming from this model? You could also flag here known failure cases or weaknesses of the model.*
+ -->
+
+ <!--
+ ### Recommendations
+
+ *What are recommendations with respect to the foreseeable issues? For example, filtering explicit content.*
+ -->
+
+ ## Training Details
+
+ ### Training Set Metrics
+ | Training set | Min | Median | Max |
+ |:-------------|:----|:---------|:-----|
+ | Word count | 1 | 182.1336 | 1108 |
+
+ | Label | Training Sample Count |
+ |:------|:----------------------|
+ | 0 | 202 |
+ | 1 | 45 |
+
+ ### Training Hyperparameters
+ - batch_size: (32, 32)
+ - num_epochs: (2, 2)
+ - max_steps: -1
+ - sampling_strategy: oversampling
+ - body_learning_rate: (2e-05, 1e-05)
+ - head_learning_rate: 0.01
+ - loss: CosineSimilarityLoss
+ - distance_metric: cosine_distance
+ - margin: 0.25
+ - end_to_end: False
+ - use_amp: False
+ - warmup_proportion: 0.1
+ - seed: 42
+ - eval_max_steps: -1
+ - load_best_model_at_end: False
+
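+ For reference, under setfit 1.0.x these settings roughly correspond to a `TrainingArguments` object like the sketch below (a reconstruction, not the original training script; values equal to the defaults, such as `distance_metric` and `margin`, are left implicit):
+
+ ```python
+ from sentence_transformers.losses import CosineSimilarityLoss
+ from setfit import TrainingArguments
+
+ args = TrainingArguments(
+     batch_size=(32, 32),              # (embedding phase, classifier phase)
+     num_epochs=(2, 2),
+     body_learning_rate=(2e-05, 1e-05),
+     head_learning_rate=0.01,
+     loss=CosineSimilarityLoss,
+     sampling_strategy="oversampling",
+     warmup_proportion=0.1,
+     end_to_end=False,
+     use_amp=False,
+     seed=42,
+     load_best_model_at_end=False,
+ )
+ ```
+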
+ ### Training Results
+ | Epoch | Step | Training Loss | Validation Loss |
+ |:------:|:----:|:-------------:|:---------------:|
+ | 0.0007 | 1 | 0.2952 | - |
+ | 0.0371 | 50 | 0.2253 | - |
+ | 0.0742 | 100 | 0.1234 | - |
+ | 0.1114 | 150 | 0.0115 | - |
+ | 0.1485 | 200 | 0.0036 | - |
+ | 0.1856 | 250 | 0.0024 | - |
+ | 0.2227 | 300 | 0.0015 | - |
+ | 0.2598 | 350 | 0.0011 | - |
+ | 0.2970 | 400 | 0.0009 | - |
+ | 0.3341 | 450 | 0.0007 | - |
+ | 0.3712 | 500 | 0.0011 | - |
+ | 0.4083 | 550 | 0.0008 | - |
+ | 0.4454 | 600 | 0.0008 | - |
+ | 0.4826 | 650 | 0.0007 | - |
+ | 0.5197 | 700 | 0.0005 | - |
+ | 0.5568 | 750 | 0.0006 | - |
+ | 0.5939 | 800 | 0.0005 | - |
+ | 0.6310 | 850 | 0.0005 | - |
+ | 0.6682 | 900 | 0.0004 | - |
+ | 0.7053 | 950 | 0.0003 | - |
+ | 0.7424 | 1000 | 0.0004 | - |
+ | 0.7795 | 1050 | 0.0005 | - |
+ | 0.8166 | 1100 | 0.0004 | - |
+ | 0.8537 | 1150 | 0.0004 | - |
+ | 0.8909 | 1200 | 0.0005 | - |
+ | 0.9280 | 1250 | 0.0004 | - |
+ | 0.9651 | 1300 | 0.0003 | - |
+ | 1.0022 | 1350 | 0.0003 | - |
+ | 1.0393 | 1400 | 0.0003 | - |
+ | 1.0765 | 1450 | 0.0004 | - |
+ | 1.1136 | 1500 | 0.0003 | - |
+ | 1.1507 | 1550 | 0.0004 | - |
+ | 1.1878 | 1600 | 0.0004 | - |
+ | 1.2249 | 1650 | 0.0004 | - |
+ | 1.2621 | 1700 | 0.0003 | - |
+ | 1.2992 | 1750 | 0.0003 | - |
+ | 1.3363 | 1800 | 0.0003 | - |
+ | 1.3734 | 1850 | 0.0003 | - |
+ | 1.4105 | 1900 | 0.0003 | - |
+ | 1.4477 | 1950 | 0.0002 | - |
+ | 1.4848 | 2000 | 0.0003 | - |
+ | 1.5219 | 2050 | 0.0003 | - |
+ | 1.5590 | 2100 | 0.0003 | - |
+ | 1.5961 | 2150 | 0.0002 | - |
+ | 1.6333 | 2200 | 0.0003 | - |
+ | 1.6704 | 2250 | 0.0004 | - |
+ | 1.7075 | 2300 | 0.0004 | - |
+ | 1.7446 | 2350 | 0.0003 | - |
+ | 1.7817 | 2400 | 0.0002 | - |
+ | 1.8189 | 2450 | 0.0002 | - |
+ | 1.8560 | 2500 | 0.0003 | - |
+ | 1.8931 | 2550 | 0.0002 | - |
+ | 1.9302 | 2600 | 0.0003 | - |
+ | 1.9673 | 2650 | 0.0003 | - |
+
+ ### Framework Versions
+ - Python: 3.10.12
+ - SetFit: 1.0.3
+ - Sentence Transformers: 2.2.2
+ - Transformers: 4.35.2
+ - PyTorch: 2.1.0+cu121
+ - Datasets: 2.16.1
+ - Tokenizers: 0.15.0
+
+ ## Citation
+
+ ### BibTeX
+ ```bibtex
+ @article{https://doi.org/10.48550/arxiv.2209.11055,
+   doi = {10.48550/ARXIV.2209.11055},
+   url = {https://arxiv.org/abs/2209.11055},
+   author = {Tunstall, Lewis and Reimers, Nils and Jo, Unso Eun Seo and Bates, Luke and Korat, Daniel and Wasserblat, Moshe and Pereg, Oren},
+   keywords = {Computation and Language (cs.CL), FOS: Computer and information sciences, FOS: Computer and information sciences},
+   title = {Efficient Few-Shot Learning Without Prompts},
+   publisher = {arXiv},
+   year = {2022},
+   copyright = {Creative Commons Attribution 4.0 International}
+ }
+ ```
+
+ <!--
+ ## Glossary
+
+ *Clearly define terms in order to be accessible across audiences.*
+ -->
+
+ <!--
+ ## Model Card Authors
+
+ *Lists the people who create the model card, providing recognition and accountability for the detailed work that goes into its construction.*
+ -->
+
+ <!--
+ ## Model Card Contact
+
+ *Provides a way for people who have updates to the Model Card, suggestions, or questions, to contact the Model Card authors.*
+ -->
config.json ADDED
@@ -0,0 +1,31 @@
+ {
+   "_name_or_path": "/root/.cache/torch/sentence_transformers/BAAI_bge-small-en-v1.5/",
+   "architectures": [
+     "BertModel"
+   ],
+   "attention_probs_dropout_prob": 0.1,
+   "classifier_dropout": null,
+   "hidden_act": "gelu",
+   "hidden_dropout_prob": 0.1,
+   "hidden_size": 384,
+   "id2label": {
+     "0": "LABEL_0"
+   },
+   "initializer_range": 0.02,
+   "intermediate_size": 1536,
+   "label2id": {
+     "LABEL_0": 0
+   },
+   "layer_norm_eps": 1e-12,
+   "max_position_embeddings": 512,
+   "model_type": "bert",
+   "num_attention_heads": 12,
+   "num_hidden_layers": 12,
+   "pad_token_id": 0,
+   "position_embedding_type": "absolute",
+   "torch_dtype": "float32",
+   "transformers_version": "4.35.2",
+   "type_vocab_size": 2,
+   "use_cache": true,
+   "vocab_size": 30522
+ }
config_sentence_transformers.json ADDED
@@ -0,0 +1,7 @@
+ {
+   "__version__": {
+     "sentence_transformers": "2.2.2",
+     "transformers": "4.28.1",
+     "pytorch": "1.13.0+cu117"
+   }
+ }
config_setfit.json ADDED
@@ -0,0 +1,4 @@
+ {
+   "labels": null,
+   "normalize_embeddings": false
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:19314d8466b95dfcf720db4af8043a2204ba1712b073316801ac2ae96a2f2d86
+ size 133462128
model_head.pkl ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:74868a19f42437be5d2b30e009f4f78c0e55425afa9e2ecab1b0c258959ac380
+ size 3919
modules.json ADDED
@@ -0,0 +1,20 @@
+ [
+   {
+     "idx": 0,
+     "name": "0",
+     "path": "",
+     "type": "sentence_transformers.models.Transformer"
+   },
+   {
+     "idx": 1,
+     "name": "1",
+     "path": "1_Pooling",
+     "type": "sentence_transformers.models.Pooling"
+   },
+   {
+     "idx": 2,
+     "name": "2",
+     "path": "2_Normalize",
+     "type": "sentence_transformers.models.Normalize"
+   }
+ ]
sentence_bert_config.json ADDED
@@ -0,0 +1,4 @@
+ {
+   "max_seq_length": 512,
+   "do_lower_case": true
+ }
special_tokens_map.json ADDED
@@ -0,0 +1,7 @@
+ {
+   "cls_token": "[CLS]",
+   "mask_token": "[MASK]",
+   "pad_token": "[PAD]",
+   "sep_token": "[SEP]",
+   "unk_token": "[UNK]"
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,57 @@
+ {
+   "added_tokens_decoder": {
+     "0": {
+       "content": "[PAD]",
+       "lstrip": false,
+       "normalized": false,
+       "rstrip": false,
+       "single_word": false,
+       "special": true
+     },
+     "100": {
+       "content": "[UNK]",
+       "lstrip": false,
+       "normalized": false,
+       "rstrip": false,
+       "single_word": false,
+       "special": true
+     },
+     "101": {
+       "content": "[CLS]",
+       "lstrip": false,
+       "normalized": false,
+       "rstrip": false,
+       "single_word": false,
+       "special": true
+     },
+     "102": {
+       "content": "[SEP]",
+       "lstrip": false,
+       "normalized": false,
+       "rstrip": false,
+       "single_word": false,
+       "special": true
+     },
+     "103": {
+       "content": "[MASK]",
+       "lstrip": false,
+       "normalized": false,
+       "rstrip": false,
+       "single_word": false,
+       "special": true
+     }
+   },
+   "clean_up_tokenization_spaces": true,
+   "cls_token": "[CLS]",
+   "do_basic_tokenize": true,
+   "do_lower_case": true,
+   "mask_token": "[MASK]",
+   "model_max_length": 512,
+   "never_split": null,
+   "pad_token": "[PAD]",
+   "sep_token": "[SEP]",
+   "strip_accents": null,
+   "tokenize_chinese_chars": true,
+   "tokenizer_class": "BertTokenizer",
+   "unk_token": "[UNK]"
+ }
vocab.txt ADDED
The diff for this file is too large to render. See raw diff