Gopal2002 committed on
Commit
5568b49
1 Parent(s): 47de212

Push model using huggingface_hub.

Browse files
1_Pooling/config.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "word_embedding_dimension": 384,
3
+ "pooling_mode_cls_token": true,
4
+ "pooling_mode_mean_tokens": false,
5
+ "pooling_mode_max_tokens": false,
6
+ "pooling_mode_mean_sqrt_len_tokens": false
7
+ }
README.md ADDED
@@ -0,0 +1,271 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: setfit
3
+ tags:
4
+ - setfit
5
+ - sentence-transformers
6
+ - text-classification
7
+ - generated_from_setfit_trainer
8
+ metrics:
9
+ - accuracy
10
+ widget:
11
+ - text: " \n \n \n\nHIRAKUD POWER / SMELTER\n\n@ - Payment Order\n\n( Address\
12
+ \ )\n\nEmp.No./S.Code No. Qhle\nby Cash/Cheque/D.D./Transfer the sumof ~ 35, +S0/—\n\
13
+ Rupees Thi ei ve therane Seven hun\nFi \\\nMail Id of Initiator: : OF)\n\n \n\n\
14
+ | Details of Payment\n\n;\n| AtMenclance, Cleritage ancl Otner\naa T\n\n|mise:\
15
+ \ Conveyances for ip eome No. |\n2x to 2-9, 3\\ 32 ano 34 of Qo| 2\n\nURL of payment:\n\
16
+ \nin . TotalRs.| 35, too /]- .\n\nPrepared by Recommended by Endorsed by Authorised\
17
+ \ By Approved by\n‘ A =\nPort Sara ee\nA ee EU (NY—\nDate 20/ 19 Plant Head Head-F\
18
+ \ &A Head - Sambalpur Cluster\n\n \n \n\nCharge\nAccount\n\n \n \
19
+ \ \n\nLeqa2\n\n~ Odisha cluoy\n\nOI) 202 Sefer (90\n\nONLINE PAYMENT\n\n \n\n\
20
+ \ \n\nCashier\nReceived Payment | Charge Account Checked by\n\nae eee _\n\n \n\
21
+ \nSignature\n\f"
22
+ - text: " \n\f"
23
+ - text: "Expenses during visit of morning for coal logistic.\n\nSl.no. _ Date Of Visit\
24
+ \ Particulars Amount Remarks\n1 21-Feb-16 Tea,Snax ager mis. - 105.00 Along with\
25
+ \ Mr N K Kar\n\n \n \n\n \n\n \n\n \n\nft eee ‘\n~# “Lunch. ° of AVS\
26
+ \ |\nee ou SATS i\n2 22-Feb-16); | “Fea soe mis, dee aot]\n; 3 . cng! a oa hoy\
27
+ \ ‘ “e i hs ye eo 1\n3 23-Feb-1600). Téa,Snax Andithis. I Along with Mr'N K Kar\
28
+ \ .\nee _ |) Lunch... a 00° oO 2 !\n4 24-Feb-16 Tea,Snax And mis. okt? |\nLinch\
29
+ \ ~ : egthedgtt £92 ox\n5 25-Feb-16\n\nmeted FES entre? i462\n\n- Teaisnax And\
30
+ \ mis. r AS Vi on\n) ie ihe oe » Lunch eres , Mo\n\n6 26-Feb-16 Tea, Snax And\
31
+ \ nis,\n\nyeahh! ct\n\nfeo, 7\n\n \n\n \n \n \n \n \n\n, 140.00; - Pend\
32
+ \ wih iM NK Kar\nlene . : -aaciog par rs :\n’ a7-Febalt Tea,Snax And itis” \"\
33
+ 425.00 Along with Mr. K Kar\nLunch 280,00 es _— ,\n8 29-Feb-16 se Tea,Snax And\
34
+ \ oie Bh i af U5 5.00). \" pe. a!\n9 te Snax ‘And mis. ce n20. to & oe\n\n10\n\
35
+ \neee £50. Alone wit Mr N K Kar bye efort-\n\nevn, enews) :\nLaheue 325. 00 x\
36
+ \ Up £0 perenne os\neerie coer re ue\n\n \n\n,\n\n11\n\nHf figs bh.\n\n \n\n \
37
+ \ \n \n \n \n\n \n\n4\n‘\na\nvt wr 4 ‘\n“ane . mae t\nwha via ‘\n‘\n5\n12 {\n\
38
+ _ o |\n\" nay\ni\n¥\n4\n4\n_\ni\nTew. EN at Rbiew: Caen sere 4\ntA eS : f i :\n\
39
+ i — Eyl 3. 4\nes, j Lax > * awe 4\nwe be oy . “ tyne eel\ni ad\n: oe\nSeog) ayM.\
40
+ \ 44\nwr\na, obo ye eect ee —\n-\n\n \n\f"
41
+ - text: "HINDALCO INDUSTRIES LIMITED EMPLOYEES’ PROVIDENT FUND II\n\n| | B)REASON\
42
+ \ OF LEAVING SERVICE: RESIGNATION\n_ SERVICE TERMINATED ON\n\n \n \n \n \
43
+ \ \n \n \n \n \n\n \n\n|\n\n| | ACCOUNT OF (A) ILL\nHEALTH OF MEMBER\
44
+ \ (8)\nCONTRACTION /\n\nDISCONTINUATION — OF\nEMPLOYER'S BUSINESS OR\n\n(C) OTHER\
45
+ \ CAUSE BEYOND\n\nTHE CONTROL OF THE\n\n| EMBER\n|i PERSONAL REASON _\n\n__\n\n\
46
+ PAYMENT UCO BANK ,HIRAKUD SAMBALPUR ,ODISHA.\n(PLEASE ATTACH A COPY OF cmmntnnmeanisnnennenesennmaneeneisene\
47
+ \ nese\nCANCELLED CHEQUE/ATTESTED\n| COPY OF FIRST PAGE OF BANK PASS | IFS CODE\
48
+ \ ... UCBA0000285\n| BOOK _\nTa) FULL POSTAL ADDRESS WITH E- AT. GUNDRUPADA, PO-HIRAKUD,\
49
+ \ DIST- SAMBALPUR, ODISHA-.\n\n| 12 I BANK ACCOUNT DETAILS “FOR SAVING BANK ACCOUNT\
50
+ \ NO — 02850110044179\n!\n\nMAIL ID (IF ANY)\n\n \n\nPIN ...768016\n| E-MAIL ID\
51
+ \ :-\n\n- INCASE THE AMOUNT IS USED FOR ANY PURPOSE OTHER THAN STATED IN COLUMN\
52
+ \ (9) ABOVE, | AM\nLIABLE TO RETURN THE ENTIRE AMOUNT WITH PENAL INTEREST.\nTHE\
53
+ \ MEMBER HEREBY DECLARES THAT HE HAD NOT BEEN EMPLOYED FOR 2 MONTH (YES/NO)\n\n\
54
+ (APPLICABLE FOR PF SETTLEMENT ONLY)\nve SIG N41\n\nMEMBER SIGNATURE AND DATE\n\
55
+ \nCERTIFIED THAT THE APPLICATION HAS BEEN SIGNED BY THE MEMBER IN MY PRESENCE\
56
+ \ AFTER HE/SHE HAD\nREAD THE CONTENT / THE CONTENT HAD BEEN EXPLAINED TO HIM /\
57
+ \ HER BY ME AND THAT THE\nINFORMATION GIVEN IN THE APPLICATION FORM |S CORRECT\n\
58
+ \nDATE:- : yA\nye\"\nEMPLOYER'S SIGNATURE\n\nDESIGNATION & SEAL OF EMPLOYER\n\
59
+ (OPTIANAL FOR FINAL PF SETTLEMENT)\n\nENCLOSURES: WV SELF ATTESTED AADHAR CARD\
60
+ \ & PANCARD\n2 cory OF CANCELLED CHEQUE / SELF ATTESTED COPY OF 15° PAGE OF PASS\
61
+ \ BOOK.\n\f"
62
+ - text: " \n\nHINDALCO INDUSTRIES LIMITED\nHIRAKUD\n\nPAYMENT ORDER\n\nPayto Simanchal\
63
+ \ Khatai\nCash Vr.No.\n\n \n\nEmp.No/S.Code No. _ ~\nby Cash/Cheque/D.D./Transfer\
64
+ \ the sum of Rs.2,00,000.00 apvrno,lOlY% 3s\nRupees Two Lakh only\n\n \n\nDetails\
65
+ \ of Payment Amount (Rs)\n\n \n\nns . 2,00,000\n\n \n\n \n\n \n\n \n\n \n\n \n\
66
+ \n2,00,000.\nPrepared by Recommeded by Endorsed by Authorised By Approved by\n\
67
+ \n9 ’\nner (wy\nDate Dept. Head Plant Head -F&A Head - Sambalpur Cluster\nPayment\
68
+ \ made on Charge\noem ra\n\n(b) By Cheque ner 2] 2G ~ 2> 7 + DA SHO-KLB (321)\n\
69
+ \nState Bank of india, Burla\nState Bank of India, Hirakud\nPunjab National Bank,\
70
+ \ Sambalpur [PNB-1]\n\n \n\n \n\n \n\n \n\n \n\nUuCcO Hirakud\n\n \n\nUCO’Bank,\
71
+ \ Sambalpur\n{DBI , Sambalpur (IDBI -1)\nIDB! , Sambalpur (IDBI -2)\n\nReceived\
72
+ \ Payment Charge Account Checked by\nSignature\n\n \n\n \n\n \n\n \n\n \n\n \n\
73
+ \f"
74
+ pipeline_tag: text-classification
75
+ inference: true
76
+ base_model: BAAI/bge-small-en-v1.5
77
+ model-index:
78
+ - name: SetFit with BAAI/bge-small-en-v1.5
79
+ results:
80
+ - task:
81
+ type: text-classification
82
+ name: Text Classification
83
+ dataset:
84
+ name: Unknown
85
+ type: unknown
86
+ split: test
87
+ metrics:
88
+ - type: accuracy
89
+ value: 1.0
90
+ name: Accuracy
91
+ ---
92
+
93
+ # SetFit with BAAI/bge-small-en-v1.5
94
+
95
+ This is a [SetFit](https://github.com/huggingface/setfit) model that can be used for Text Classification. This SetFit model uses [BAAI/bge-small-en-v1.5](https://huggingface.co/BAAI/bge-small-en-v1.5) as the Sentence Transformer embedding model. A [LogisticRegression](https://scikit-learn.org/stable/modules/generated/sklearn.linear_model.LogisticRegression.html) instance is used for classification.
96
+
97
+ The model has been trained using an efficient few-shot learning technique that involves:
98
+
99
+ 1. Fine-tuning a [Sentence Transformer](https://www.sbert.net) with contrastive learning.
100
+ 2. Training a classification head with features from the fine-tuned Sentence Transformer.
101
+
102
+ ## Model Details
103
+
104
+ ### Model Description
105
+ - **Model Type:** SetFit
106
+ - **Sentence Transformer body:** [BAAI/bge-small-en-v1.5](https://huggingface.co/BAAI/bge-small-en-v1.5)
107
+ - **Classification head:** a [LogisticRegression](https://scikit-learn.org/stable/modules/generated/sklearn.linear_model.LogisticRegression.html) instance
108
+ - **Maximum Sequence Length:** 512 tokens
109
+ - **Number of Classes:** 2 classes
110
+ <!-- - **Training Dataset:** [Unknown](https://huggingface.co/datasets/unknown) -->
111
+ <!-- - **Language:** Unknown -->
112
+ <!-- - **License:** Unknown -->
113
+
114
+ ### Model Sources
115
+
116
+ - **Repository:** [SetFit on GitHub](https://github.com/huggingface/setfit)
117
+ - **Paper:** [Efficient Few-Shot Learning Without Prompts](https://arxiv.org/abs/2209.11055)
118
+ - **Blogpost:** [SetFit: Efficient Few-Shot Learning Without Prompts](https://huggingface.co/blog/setfit)
119
+
120
+ ### Model Labels
121
+ | Label | Examples |
122
+ |:------|:---------|
123
+ | 0 | <ul><li>'GHt Sa [OI uco Bank\n\nvis Free Number: 180¢-193-9125 _\n\nDICGC INSURANCE UPTO 5 LAC\n\nBRANCH\n\nUCO Bank\nP NT\n(1) Consuitants are requested to note that all moneys\n\nremitted to the Bank should either be sent by Registered\nPost or handed over to the Cash Department, as no\n\n \n\nUco BANK\n\naq\n\nName\n\n"IFSC: uceaocotms\n\' dress\n\nKICK Code: 7428029504\n\nHIRAKUD\n-HIRAKED BRARCH HIRAKUS\nProae:\n\nindividual (s) outside. the Cash Department has/have JHARY EIST\nauthority to receive cash. KADAMPOLA\n(2) The account-holder should insist on delivery of Pass Book HERAKUD\n‘ made uptodate as far as possible on the same date; a 6.8%\n- otherwise he should obtain a receipt indicating when the HIRAKYD PIN .#oBlss\nPass Book will be delivered.\n(3) Deposit Rules in vogue can be obtained by account-holder TET. WaT / Asst.\nfrom the Branch on request Q28501 19027145\nPB.NG. }\n\n \n\n \n\n \n\nfe er ee me\n\n \n\x0c'</li><li>' \n\n= 2, ip\nO ~\nN 2\na\n: Y ve re ty\n) 3 x.\nNai] (F) my\n\n \n\ny Viayal chat aloala\nSH PPP ea [sys sys *\nas NB\n2\n=\n\ni x X we\na. = Xt +\n— W\nx 2| > x xv)\n— ~ wa al on\nmh a\n\nx\n@\n\n \n\nSy\n>3\nS\nak\n\n \n\n \n\n= coemeirata nani\nyy“\nxX -~|<\n. q - r " 2 e eee\n| S TTT !\n“ sa S ~\ngaysey Maye oe | toe\n\ni\'s . <4 " = : nics\n: 5 oy Sy . : aR N =\nS Sy = yy > =P OW\n, oe Q\n3 4 WK SS j 2 .\n-~ rs, , 4 i AS ~ si 6 .\nA Se S = Ce 4G ‘ tb. ee bene |\n\na\n\n \n\nes |\nTo a 3,\n-} ™ i] nest -— a Dome: eo . Sp a > Ee eh ao Ty ache oe ewe cede oe oe tee ~\n5 . “i a ( . - i -\n\n \n\n \n\x0c'</li><li>'Interest will be payable @ 24 % p.a. if the invoice is not paid within 30 days of the date of invoice.\n\nABBREVIATION: TB — Tower & Basin\nTO — Tower Only\n\n1. All taxes and duties invoiced herein are subject to revision depending upon the final assessment\n\nby the Statutory Authorities. Any such revision will be to buyer’s account.\n\n2. 
Payments should be made by A/C Payee cheque/Pay oder/bank draft/Online fund transfer\n\nthrough NEFT/RTGS platform in favour of “Paharpur Cooling Towers Ltd.”. Payment towards this\n\nbill made in any other form will be done entirely at your own risk.\n\n3. ALL DISPUTES SUBJECT TO CALCUTTA JURISDICTION ONLY.\n\x0c'</li></ul> |
124
+ | 1 | <ul><li>'. Ae - PR CSeathetn & 3)\n" J She ase 9 Pao\n\n‘s lad Bank Afr o Steppe\nIN | fave 4 fi foe & ats bent\n\nHINDALCO INDUSTRIES LIMITED\nHIRAKUD\n\nPAYMENT ORDER\n\nPayto Payment to Mr.Dilip Das\n\n|\nTravel expenses for Interview w candidate (A (Admin) J] jo. _| Cash Vr.No. Q pis | l\n\npk check he inkwes IFSC. code Emp.No/s.codeNo. _ OT Pago |\n\nby Cash/Cheque/D.D./Transfer the sum of —_Rs.13,695.00 _ _| AP.Vr.No.\nRupees Thirteen Thousand Six Hundred Ninety Five Only ———__ ; 3 ua 202 |\nDate\n\n \n\n \n\n \n\nX\n\n5\n\nee |\nain & Flight Tickets is. _ 13,195.00\nConvenience expenses Rs. — 500. 00°\n\n \n\n \n\nDetail Travel plan and tickets enclosed\n\nBank Account details also enclosed\n\n \n\n \n \n \n\nPrepared by Recommended by Endorsed by\nDate q Head- HR\n: Hirakud Complex\n\n \n \n \n\n \n \n\n \n\né y Cash 2. DAD ey ‘ZO\n(i \'y Cheque No DVPOVe Bee\n\n \n\n \n \n\nState Bank of India, Burla\nState Bank of India, Hirakud\n\nPunjab National Bank, Sambalpur [PNB-1]\nUCO Bank, Hirakud\n\nUCO Bank, Sambalpur\nIDB! , Sambaipur (IDB! -1)\nIDBI , Sambalpur (IDBI -2)\n\n \n \n \n\n \n\n \n \n\n \n\n \n \n\n \n\n \n \n \n \n \n\n \n\n \n\n \n \n\nCashier\n\n \n\n \n\nReceived Payment Charge Account Checked by\n\n \n\nSignature Signature\n\x0c'</li><li>'HINDALCO INDUSTRIES LIMITED\nHIRAKUD\n\nPAYMENT ORDER\nPay to FRakesh Gupta ; . . | 3898 BA (Q-1 2-15\n\nCash Vr.No.\n\n \n\n \n\n \n\n— - _ Emp.No./S.Code No. $-392 _\nby Cash/Cheque/D.D./Transfer the sum of a | AP vr.No. 91 355%\nRupees Four Thousand Six Hundred Only\n\n \n\n \n\n \n\n22\nDate 48-02-16\nDetails of Payment Amount\nTowards change of Battery of Vehicle No. OR-02-AM-8904\n\nas detailed below: (Bill Attached)\n(i) Bill No. 3898 Dt.19-12-2015\n\n \n\nTotal Rs. . 4,600.00\n\nPrepared by Recommended by Endorsed by Authorised by Approved by\nLanier bnwnnWenuw \\ \\ .\n\\4 = Ww \\ le\n\n\\ov Jv JI 4.) 
ee Zan”\n\nDate Dept Head Plant Head Hed - Location Head\n\n \n\n \n\nPayment made on\n(a) By Cash\n\n(b) By Cheque No.\n\n \n\n \n\nState Bank of India, Burla\n\nState Bank of india, Hirakud\n\nPunjab National Bank, Sambalpur [PNB-1]\nUCO Bank, Hirakud\n\nUCO Bank, Sambaipur\n\n{DBI , Sambalpur (IDB! -1)\n\nIDBI , Sambalpur (IDBI -2)\n\n \n\n \n\n \n\n \n\n \n\nCashier\n\nReceived Payment Charge Account Checked by\n\nSignature Signature\n\x0c'</li><li>'tT) Ce cfd\n\n \n \n \n \n \n \n \n\nADITYA BIRLA HINDALCO INDUSTRIES LIMITED\n874 HIRAKUD POWER\n\naN’ PAYMENT ORDER\n\nPP -200| - AI66\n\nCash Vr.No.\n\n \n \n \n\nAP.Vr.No._G/8Ol tT\n\nby Cash/Cheque/D.D./Transfer the sum of\nELEVEN THOUSAND FIFTY FOUR ONLY\n\n \n\nRupees\n\n \n \n \n \n\nDate:- 8.01.20\n\nENERGY CHARGES OF INTAKE CHAMBER FOR THE MONTH OF DEC 2019,BILL NO- L\n1533 2639.00\n8415.00 ~\n\n“\nTotal Total Rs. 41054.00\n\nPrepared by Recammeded by Endorsed by Authorised By Approved by\n\npu ( Nx\nHead-F&A Head - Sambalpur Cluster\nCharge Account an ou\n\n \n\n \n \n \n \n\n \n\nENERGY CHARGES OF ASH MOUND FOR THE MONTH OF DEC 2019, BILL NO-1532\n\n \n\n \n\n \n\n \n \n \n\n \n\n \n\n \n \n \n \n \n \n \n\nState Bank of india,\nState Bank of India, Buria\n\nPunjab National Bank, Sambalpur [PNB-1]\nPunjab National Bank, Kolkata {[PNB-2]\nUCO Bank, Hirakud\nUCO Bank, Sambalpur\n\n—\n\n \n \n \n \n \n\nes\neee\n\nReceived Payment Charge Account Checked by\n\n \n\nSignature Signature\n\x0c'</li></ul> |
125
+
126
+ ## Evaluation
127
+
128
+ ### Metrics
129
+ | Label | Accuracy |
130
+ |:--------|:---------|
131
+ | **all** | 1.0 |
132
+
133
+ ## Uses
134
+
135
+ ### Direct Use for Inference
136
+
137
+ First install the SetFit library:
138
+
139
+ ```bash
140
+ pip install setfit
141
+ ```
142
+
143
+ Then you can load this model and run inference.
144
+
145
+ ```python
146
+ from setfit import SetFitModel
147
+
148
+ # Download from the 🤗 Hub
149
+ model = SetFitModel.from_pretrained("Gopal2002/CASH_AND_BANK_INVOICE")
150
+ # Run inference
151
+ preds = model("HINDALCO INDUSTRIES LIMITED\nHIRAKUD\n\nPAYMENT ORDER")
152
+
153
+ ```
154
+
155
+ <!--
156
+ ### Downstream Use
157
+
158
+ *List how someone could finetune this model on their own dataset.*
159
+ -->
160
+
161
+ <!--
162
+ ### Out-of-Scope Use
163
+
164
+ *List how the model may foreseeably be misused and address what users ought not to do with the model.*
165
+ -->
166
+
167
+ <!--
168
+ ## Bias, Risks and Limitations
169
+
170
+ *What are the known or foreseeable issues stemming from this model? You could also flag here known failure cases or weaknesses of the model.*
171
+ -->
172
+
173
+ <!--
174
+ ### Recommendations
175
+
176
+ *What are recommendations with respect to the foreseeable issues? For example, filtering explicit content.*
177
+ -->
178
+
179
+ ## Training Details
180
+
181
+ ### Training Set Metrics
182
+ | Training set | Min | Median | Max |
183
+ |:-------------|:----|:---------|:-----|
184
+ | Word count | 1 | 201.2534 | 4241 |
185
+
186
+ | Label | Training Sample Count |
187
+ |:------|:----------------------|
188
+ | 0 | 113 |
189
+ | 1 | 33 |
190
+
191
+ ### Training Hyperparameters
192
+ - batch_size: (32, 32)
193
+ - num_epochs: (2, 2)
194
+ - max_steps: -1
195
+ - sampling_strategy: oversampling
196
+ - body_learning_rate: (2e-05, 1e-05)
197
+ - head_learning_rate: 0.01
198
+ - loss: CosineSimilarityLoss
199
+ - distance_metric: cosine_distance
200
+ - margin: 0.25
201
+ - end_to_end: False
202
+ - use_amp: False
203
+ - warmup_proportion: 0.1
204
+ - seed: 42
205
+ - eval_max_steps: -1
206
+ - load_best_model_at_end: False
207
+
208
+ ### Training Results
209
+ | Epoch | Step | Training Loss | Validation Loss |
210
+ |:------:|:----:|:-------------:|:---------------:|
211
+ | 0.0023 | 1 | 0.3054 | - |
212
+ | 0.1142 | 50 | 0.1162 | - |
213
+ | 0.2283 | 100 | 0.0043 | - |
214
+ | 0.3425 | 150 | 0.0015 | - |
215
+ | 0.4566 | 200 | 0.0014 | - |
216
+ | 0.5708 | 250 | 0.0008 | - |
217
+ | 0.6849 | 300 | 0.0013 | - |
218
+ | 0.7991 | 350 | 0.001 | - |
219
+ | 0.9132 | 400 | 0.0004 | - |
220
+ | 1.0274 | 450 | 0.0008 | - |
221
+ | 1.1416 | 500 | 0.0008 | - |
222
+ | 1.2557 | 550 | 0.0011 | - |
223
+ | 1.3699 | 600 | 0.0008 | - |
224
+ | 1.4840 | 650 | 0.0007 | - |
225
+ | 1.5982 | 700 | 0.0005 | - |
226
+ | 1.7123 | 750 | 0.0005 | - |
227
+ | 1.8265 | 800 | 0.0007 | - |
228
+ | 1.9406 | 850 | 0.0005 | - |
229
+
230
+ ### Framework Versions
231
+ - Python: 3.10.12
232
+ - SetFit: 1.0.3
233
+ - Sentence Transformers: 2.2.2
234
+ - Transformers: 4.35.2
235
+ - PyTorch: 2.1.0+cu121
236
+ - Datasets: 2.16.1
237
+ - Tokenizers: 0.15.0
238
+
239
+ ## Citation
240
+
241
+ ### BibTeX
242
+ ```bibtex
243
+ @article{https://doi.org/10.48550/arxiv.2209.11055,
244
+ doi = {10.48550/ARXIV.2209.11055},
245
+ url = {https://arxiv.org/abs/2209.11055},
246
+ author = {Tunstall, Lewis and Reimers, Nils and Jo, Unso Eun Seo and Bates, Luke and Korat, Daniel and Wasserblat, Moshe and Pereg, Oren},
247
+ keywords = {Computation and Language (cs.CL), FOS: Computer and information sciences, FOS: Computer and information sciences},
248
+ title = {Efficient Few-Shot Learning Without Prompts},
249
+ publisher = {arXiv},
250
+ year = {2022},
251
+ copyright = {Creative Commons Attribution 4.0 International}
252
+ }
253
+ ```
254
+
255
+ <!--
256
+ ## Glossary
257
+
258
+ *Clearly define terms in order to be accessible across audiences.*
259
+ -->
260
+
261
+ <!--
262
+ ## Model Card Authors
263
+
264
+ *Lists the people who create the model card, providing recognition and accountability for the detailed work that goes into its construction.*
265
+ -->
266
+
267
+ <!--
268
+ ## Model Card Contact
269
+
270
+ *Provides a way for people who have updates to the Model Card, suggestions, or questions, to contact the Model Card authors.*
271
+ -->
config.json ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "/root/.cache/torch/sentence_transformers/BAAI_bge-small-en-v1.5/",
3
+ "architectures": [
4
+ "BertModel"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "classifier_dropout": null,
8
+ "hidden_act": "gelu",
9
+ "hidden_dropout_prob": 0.1,
10
+ "hidden_size": 384,
11
+ "id2label": {
12
+ "0": "LABEL_0"
13
+ },
14
+ "initializer_range": 0.02,
15
+ "intermediate_size": 1536,
16
+ "label2id": {
17
+ "LABEL_0": 0
18
+ },
19
+ "layer_norm_eps": 1e-12,
20
+ "max_position_embeddings": 512,
21
+ "model_type": "bert",
22
+ "num_attention_heads": 12,
23
+ "num_hidden_layers": 12,
24
+ "pad_token_id": 0,
25
+ "position_embedding_type": "absolute",
26
+ "torch_dtype": "float32",
27
+ "transformers_version": "4.35.2",
28
+ "type_vocab_size": 2,
29
+ "use_cache": true,
30
+ "vocab_size": 30522
31
+ }
config_sentence_transformers.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "__version__": {
3
+ "sentence_transformers": "2.2.2",
4
+ "transformers": "4.28.1",
5
+ "pytorch": "1.13.0+cu117"
6
+ }
7
+ }
config_setfit.json ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {
2
+ "labels": null,
3
+ "normalize_embeddings": false
4
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6683dd2051987c3c781a36af15c03ffb0f2fb2d9170ed99e531670496105824
3
+ size 133462128
model_head.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd82f3cf5a9430bb8bf5eef6aff9d54d4beab3926df499e2f3692a3fb2e0480c
3
+ size 3919
modules.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "idx": 0,
4
+ "name": "0",
5
+ "path": "",
6
+ "type": "sentence_transformers.models.Transformer"
7
+ },
8
+ {
9
+ "idx": 1,
10
+ "name": "1",
11
+ "path": "1_Pooling",
12
+ "type": "sentence_transformers.models.Pooling"
13
+ },
14
+ {
15
+ "idx": 2,
16
+ "name": "2",
17
+ "path": "2_Normalize",
18
+ "type": "sentence_transformers.models.Normalize"
19
+ }
20
+ ]
sentence_bert_config.json ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {
2
+ "max_seq_length": 512,
3
+ "do_lower_case": true
4
+ }
special_tokens_map.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": "[CLS]",
3
+ "mask_token": "[MASK]",
4
+ "pad_token": "[PAD]",
5
+ "sep_token": "[SEP]",
6
+ "unk_token": "[UNK]"
7
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,57 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "[PAD]",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "100": {
12
+ "content": "[UNK]",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "101": {
20
+ "content": "[CLS]",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "102": {
28
+ "content": "[SEP]",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "103": {
36
+ "content": "[MASK]",
37
+ "lstrip": false,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ }
43
+ },
44
+ "clean_up_tokenization_spaces": true,
45
+ "cls_token": "[CLS]",
46
+ "do_basic_tokenize": true,
47
+ "do_lower_case": true,
48
+ "mask_token": "[MASK]",
49
+ "model_max_length": 512,
50
+ "never_split": null,
51
+ "pad_token": "[PAD]",
52
+ "sep_token": "[SEP]",
53
+ "strip_accents": null,
54
+ "tokenize_chinese_chars": true,
55
+ "tokenizer_class": "BertTokenizer",
56
+ "unk_token": "[UNK]"
57
+ }
vocab.txt ADDED
The diff for this file is too large to render. See raw diff