Ambika14 committed on
Commit
b4baa46
·
verified ·
1 Parent(s): a714464

Upload folder using huggingface_hub

Browse files
1_Pooling/config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "word_embedding_dimension": 768,
3
  "pooling_mode_cls_token": false,
4
  "pooling_mode_mean_tokens": true,
5
  "pooling_mode_max_tokens": false,
 
1
  {
2
+ "word_embedding_dimension": 384,
3
  "pooling_mode_cls_token": false,
4
  "pooling_mode_mean_tokens": true,
5
  "pooling_mode_max_tokens": false,
README.md CHANGED
@@ -5,108 +5,348 @@ tags:
5
  - feature-extraction
6
  - dense
7
  - generated_from_trainer
8
- - dataset_size:294
9
- - loss:TripletLoss
10
- base_model: sentence-transformers/all-mpnet-base-v2
11
  widget:
12
- - source_sentence: filed case msme portal regarding delayed payment rs 221560 invoice
13
- bme 23 24 429 despite previous reminders efforts payment pending customers payment
14
- received within stipulated time frame per msme act kindly confirm case status
15
- provide update expected resolution earliest non receipt payment delayed invoice
16
- msme act user reporting non receipt payment delayed invoice bme 23 24 429 worth
17
- rs 221560 despite previous reminders efforts requesting update case status expected
18
- resolution
19
  sentences:
20
- - Policy and Schemes. Delayed Payment/MSEFC related issues/Online Dispute Resolution
21
- (ODR)
22
- - Starter, Credit and Finance. Fund of Fund scheme of CGTMSE
23
- - UAM/Udyam Registration/Certificate related issues. UAM/Udyam Registration/Certificate
24
- related issues
25
- - source_sentence: ministry micro small medium enterprises sub request equivalent
26
- make acceptance tender ref iocl tender iocl tender 9030m24r51 id 2024 jr 182389
27
- 1 procurement non flp led flood lights would like introduce wm energy lighting
28
- pvt ltd aim conserve electricity wmel manufacturer energy efficient led lights
29
- india assist clients designing installing retrofitting energy efficiency equipment
30
- using latest technologies wmel mse company registered nsic udyam thankful various
31
- initiatives taken govt msme unit like purchase price preference policies help
32
- delayed payment would like draw attention specific make mentioned iocl referred
33
- tender tender specific makes phillips bajaj crompton havells syska ge osaram wipro
34
- polycab jaquar panasonic makes given led lights extract tender document enclosed
35
- reference affecting business growth msme units spite capable meeting pqc criteria
36
- specifications certification like bis iso msme units unable participate various
37
- govt psus tenders due specific makes stated tenders helpful msme organizations
38
- equivalent makes meeting technical specifications standards also permissible msme
39
- humbly requesting review take necessary initiative hoping supportive step msme
40
- units wm energy lighting pvt ltd request equivalent make acceptance public procurement
41
- tender user requesting ministry micro small medium enterprises consider accepting
42
- equivalent makes led flood lights tender iocl tender 9030m24r51 issued iocl specific
43
- makes mentioned tender affecting business growth msme units
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
44
  sentences:
45
- - Policy and Schemes. Related to Public Procurement by PSUs
46
- - Starter, Credit and Finance. Finance Related
47
- - Marketing and Skilling. Export Promotion/WTO
48
- - source_sentence: banks reject cgtmse credit guarantee cover collateral free loan
49
- citing high risk food sector even perfect udyam registration without starter credit
50
- buy ovens hire staff launch please guide banks approve cgtmse new units like mine
51
- fast non approval cgtmse credit guarantee cover collateral free loan user requesting
52
- guidance banks rejecting cgtmse credit guarantee cover collateral free loan food
53
- sector despite perfect udyam registration requesting expedited approval new units
54
- like
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
55
  sentences:
56
- - Starter, Credit and Finance. Credit Guarantee Fund for Micro and SmalI Enterprises(CGTMSE)
57
- - UAM/Udyam Registration/Certificate related issues. UAM/Udyam Registration/Certificate
58
- related issues
59
- - Technology, Quality and Institutions. Related to various Ministries
60
- - source_sentence: please refer subject reference dev creation propritor milan shivlal
61
- bhai dangodara plot 22 keval krupa ind society near masti minral water bhathena
62
- surat pin 395003 gst 24cebpd8513a2z8 comes gst jurisdiction committed default
63
- payment considered five bills bill 07 24 25 08 24 25 11 24 25 13 24 25 17 24 25
64
- worth rs 19 98 625 includes gst absconding place business trading jamalpura khandwa
65
- road burhanpur madhya pradesh 450331 india gst tin 23absfa5162g1zf havings supplied
66
- goods cotton grey fabric 52 48 46 broker mr kailash chawande haveing address babanlal
67
- chawande makan 50 shanwara burhanpur 450331 madhay pradesh adhar aadhaar invoice
68
- bill 07 24 25 dated 01 08 2024 rs 2 34 840 plus igs rs 11 742 total amount rs
69
- 2 46 582 eway bill aadhaar dated 05 08 2024 08 24 25 dated 07 08 2024 rs 2 47
70
- 997 plus igs rs 12 399 total amount rs 2 60 397 eway bill aadhaar dated 08 08
71
- 2024 11 24 25 dated 17 08 2024 rs 4 67 476 plus igs rs 23 374 total amount rs
72
- 4 90 850 eway bill aadhaar dated 19 08 2024 13 24 25 dated 24 08 2024 rs 4 67
73
- 458 plus igs rs 23 373 total amount rs 4 90 831 eway bill aadhaar dated 24 08
74
- 2024 17 24 25 dated 02 09 2024 rs 4 85 681 plus igs 24 284 total amount rs 5 09
75
- 965 eway bill aadhaar dated 03 09 2024 non payment gst dues user reporting default
76
- payment made dev creation falls gst jurisdiction requesting resolution outstanding
77
- amount
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
78
  sentences:
79
- - Technology, Quality and Institutions. Related to Scheme of Coir Board
80
- - Policy and Schemes. Related to GST
81
- - Policy and Schemes. Raising and Accelerating MSME Performance (RAMP)
82
- - source_sentence: filed case msme portal regarding delayed payment rs 221560 invoice
83
- bme 23 24 429 despite previous reminders efforts payment pending customers payment
84
- received within stipulated time frame per msme act kindly confirm case status
85
- provide update expected resolution earliest non receipt payment delayed invoice
86
- msme act user reporting non receipt payment delayed invoice bme 23 24 429 worth
87
- rs 221560 despite previous reminders efforts requesting update case status expected
88
- resolution
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
89
  sentences:
90
- - UAM/Udyam Registration/Certificate related issues. UAM/Udyam Registration/Certificate
91
- related issues
92
- - Policy and Schemes. Delayed Payment/MSEFC related issues/Online Dispute Resolution
93
- (ODR)
94
- - Policy and Schemes. Related to GST
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
95
  pipeline_tag: sentence-similarity
96
  library_name: sentence-transformers
97
  ---
98
 
99
- # SentenceTransformer based on sentence-transformers/all-mpnet-base-v2
100
 
101
- This is a [sentence-transformers](https://www.SBERT.net) model finetuned from [sentence-transformers/all-mpnet-base-v2](https://huggingface.co/sentence-transformers/all-mpnet-base-v2). It maps sentences & paragraphs to a 768-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more.
102
 
103
  ## Model Details
104
 
105
  ### Model Description
106
  - **Model Type:** Sentence Transformer
107
- - **Base model:** [sentence-transformers/all-mpnet-base-v2](https://huggingface.co/sentence-transformers/all-mpnet-base-v2) <!-- at revision e8c3b32edf5434bc2275fc9bab85f82640a19130 -->
108
- - **Maximum Sequence Length:** 384 tokens
109
- - **Output Dimensionality:** 768 dimensions
110
  - **Similarity Function:** Cosine Similarity
111
  <!-- - **Training Dataset:** Unknown -->
112
  <!-- - **Language:** Unknown -->
@@ -122,8 +362,8 @@ This is a [sentence-transformers](https://www.SBERT.net) model finetuned from [s
122
 
123
  ```
124
  SentenceTransformer(
125
- (0): Transformer({'max_seq_length': 384, 'do_lower_case': False, 'architecture': 'MPNetModel'})
126
- (1): Pooling({'word_embedding_dimension': 768, 'pooling_mode_cls_token': False, 'pooling_mode_mean_tokens': True, 'pooling_mode_max_tokens': False, 'pooling_mode_mean_sqrt_len_tokens': False, 'pooling_mode_weightedmean_tokens': False, 'pooling_mode_lasttoken': False, 'include_prompt': True})
127
  (2): Normalize()
128
  )
129
  ```
@@ -146,20 +386,20 @@ from sentence_transformers import SentenceTransformer
146
  model = SentenceTransformer("sentence_transformers_model_id")
147
  # Run inference
148
  sentences = [
149
- 'filed case msme portal regarding delayed payment rs 221560 invoice bme 23 24 429 despite previous reminders efforts payment pending customers payment received within stipulated time frame per msme act kindly confirm case status provide update expected resolution earliest non receipt payment delayed invoice msme act user reporting non receipt payment delayed invoice bme 23 24 429 worth rs 221560 despite previous reminders efforts requesting update case status expected resolution',
150
- 'Policy and Schemes. Delayed Payment/MSEFC related issues/Online Dispute Resolution (ODR)',
151
- 'Policy and Schemes. Related to GST',
152
  ]
153
  embeddings = model.encode(sentences)
154
  print(embeddings.shape)
155
- # [3, 768]
156
 
157
  # Get the similarity scores for the embeddings
158
  similarities = model.similarity(embeddings, embeddings)
159
  print(similarities)
160
- # tensor([[1.0000, 0.5977, 0.6986],
161
- # [0.5977, 1.0000, 0.8466],
162
- # [0.6986, 0.8466, 1.0000]])
163
  ```
164
 
165
  <!--
@@ -204,30 +444,34 @@ You can finetune this model on your own dataset.
204
 
205
  #### Unnamed Dataset
206
 
207
- * Size: 294 training samples
208
- * Columns: <code>sentence_0</code>, <code>sentence_1</code>, and <code>sentence_2</code>
209
- * Approximate statistics based on the first 294 samples:
210
- | | sentence_0 | sentence_1 | sentence_2 |
211
- |:--------|:-------------------------------------------------------------------------------------|:-----------------------------------------------------------------------------------|:-----------------------------------------------------------------------------------|
212
- | type | string | string | string |
213
- | details | <ul><li>min: 20 tokens</li><li>mean: 119.94 tokens</li><li>max: 384 tokens</li></ul> | <ul><li>min: 10 tokens</li><li>mean: 16.98 tokens</li><li>max: 31 tokens</li></ul> | <ul><li>min: 10 tokens</li><li>mean: 15.63 tokens</li><li>max: 31 tokens</li></ul> |
214
  * Samples:
215
- | sentence_0 | sentence_1 | sentence_2 |
216
- |:---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|:-------------------------------------------------------------------------------------|:----------------------------------------------------------------------------------------------------------|
217
- | <code>raising grievance due gross mishandling loan account rbl bank lan blnew007100061309 despite fully serviced emis loan per repayment schedule bank failed release dues certificate ndc additionally bank incorrectly reported overdue amount days past due dpd entries credit bureaus significantly impacted cibil score despite multiple follow ups emails communication channels bank provided resolution clarity matter negligence caused undue stress made ineligible credit facilities extremely disheartening experience unprofessional behavior reputed financial institution therefore request intervene take strict action ensure following immediate issuance ndc rectification incorrect overdue dpd reporting cibil restoration credit score written confirmation loan status corrected erroneous dpd entries removed credit profile provision explanation lapses compensation undue mental agony financial harm caused matter dragging far long trust esteemed offices take prompt action ensure justice accountability non r...</code> | <code>Starter, Credit and Finance. Loan under ECLGS (Emergency Credit of 20%)</code> | <code>Technology, Quality and Institutions. Related to Tool Rooms (Admn. Matters)</code> |
218
- | <code>respected sir mail recived grivances bank baroda rejected loan 3 months going bank baroda regularly took file 2 bank baroda medical branch medical brach said bring noc days went noc madam sitying medical branch harsh said unusail thing kept respect lady bt bank coustomer didint kept didginit raise grivance regected loan cibil score 776 verified noc bt long time machine ware house directly reajected loan oll documents inspection done loan rejected also puth forth vase respected regional manger bank baroda rbi loan rejection msme scheme user expressing disappointment loan rejection bank baroda citing unprofessional behavior bank staff despite good cibil score verified documents</code> | <code>Starter, Credit and Finance. Related to Loan</code> | <code>Technology, Quality and Institutions. Zero Defect Zero Effect (ZED)</code> |
219
- | <code>19 11 2024 honourable minister msme dear sir prime minister employment generation programme pmegp introduced generate employment opportunities rural well urban areas country setting new self employment ventures projects micro enterprises 2022 guidelines loans eligible maximum cost project unit admissible margin money subsidy manufacturing sector 50 00 000 maximum cost project unit admissible margin money subsidy business service sector 20 00 000 non msme activities allowed pmegp application however value addition allowed pmegp farm farm linked activities connection sericulture horticulture floriculture etc allowed following industry business connected animal husbandry also allowed dairy milk dairy products primarily cows also sheep goats camels buffaloes horses donkeys b poultry poultry kept form eggs meat include chickens turkeys geese ducks c aquaculture farming aquatic organisms including fish molluscs crustaceans aquatic plants insects including bees sericulture etc special case pi...</code> | <code>Policy and Schemes. Related to MSME Scheme</code> | <code>Starter, Credit and Finance. Interest Subvention Scheme for Incremental Credit to MSMEs 2018</code> |
220
- * Loss: [<code>TripletLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#tripletloss) with these parameters:
221
  ```json
222
  {
223
- "distance_metric": "TripletDistanceMetric.EUCLIDEAN",
224
- "triplet_margin": 5
 
225
  }
226
  ```
227
 
228
  ### Training Hyperparameters
229
  #### Non-Default Hyperparameters
230
 
 
 
 
231
  - `fp16`: True
232
  - `multi_dataset_batch_sampler`: round_robin
233
 
@@ -237,8 +481,8 @@ You can finetune this model on your own dataset.
237
  - `do_predict`: False
238
  - `eval_strategy`: no
239
  - `prediction_loss_only`: True
240
- - `per_device_train_batch_size`: 8
241
- - `per_device_eval_batch_size`: 8
242
  - `gradient_accumulation_steps`: 1
243
  - `eval_accumulation_steps`: None
244
  - `torch_empty_cache_steps`: None
@@ -248,7 +492,7 @@ You can finetune this model on your own dataset.
248
  - `adam_beta2`: 0.999
249
  - `adam_epsilon`: 1e-08
250
  - `max_grad_norm`: 1
251
- - `num_train_epochs`: 3
252
  - `max_steps`: -1
253
  - `lr_scheduler_type`: linear
254
  - `lr_scheduler_kwargs`: None
@@ -360,15 +604,15 @@ You can finetune this model on your own dataset.
360
  }
361
  ```
362
 
363
- #### TripletLoss
364
  ```bibtex
365
- @misc{hermans2017defense,
366
- title={In Defense of the Triplet Loss for Person Re-Identification},
367
- author={Alexander Hermans and Lucas Beyer and Bastian Leibe},
368
  year={2017},
369
- eprint={1703.07737},
370
  archivePrefix={arXiv},
371
- primaryClass={cs.CV}
372
  }
373
  ```
374
 
 
5
  - feature-extraction
6
  - dense
7
  - generated_from_trainer
8
+ - dataset_size:98
9
+ - loss:MultipleNegativesRankingLoss
10
+ base_model: sentence-transformers/all-MiniLM-L6-v2
11
  widget:
12
+ - source_sentence: ever try get register udyam registration registration getting completed
13
+ issue selection longitude latitude website says login website https webgis3 nic
14
+ bharatmaps rest services able select longitude latitude location please resolve
15
+ glitch issue longitude latitude selection udyam registration user experiencing
16
+ issue completing udyam registration process due problem selecting longitude latitude
17
+ website requires login separate website https webgis3 nic bharatmaps rest services
 
18
  sentences:
19
+ - UAM/Udyam Registration/Certificate related issues. category encompasses grievances
20
+ related identity creation verification eligibility validation micro small medium
21
+ enterprises msmes udyam registration system udyam registration system serves foundational
22
+ gateway msmes access central state government schemes bank loans subsidies credit
23
+ guarantees public procurement benefits statutory advantages scope purpose category
24
+ covers issues directly impact msme ecosystem including registration related issues
25
+ udyam portal errors issued udyam registration certificate migration related grievances
26
+ legacy udyog aadhaar memorandum uam system udyam portal registration related issues
27
+ registration remains pending failure generate registration number system validation
28
+ errors despite correct data submission causes backend verification delays pan
29
+ aadhaar validation errors system downtime incomplete synchronization tax identity
30
+ databases errors issued udyam registration certificate incorrect inconsistent
31
+ details including enterprise classification micro small medium gst number address
32
+ business activity ownership information impact rejection loan applications denial
33
+ scheme benefits disqualification government tenders migration related grievances
34
+ failed migration attempts duplicate already registered system errors loss enterprise
35
+ data inability link historical uam records impact disruption
36
+ - UAM/Udyam Registration/Certificate related issues. category encompasses grievances
37
+ related identity creation verification eligibility validation micro small medium
38
+ enterprises msmes udyam registration system udyam registration system serves foundational
39
+ gateway msmes access central state government schemes bank loans subsidies credit
40
+ guarantees public procurement benefits statutory advantages scope purpose category
41
+ covers issues directly impact msme ecosystem including registration related issues
42
+ udyam portal errors issued udyam registration certificate migration related grievances
43
+ legacy udyog aadhaar memorandum uam system udyam portal registration related issues
44
+ registration remains pending failure generate registration number system validation
45
+ errors despite correct data submission causes backend verification delays pan
46
+ aadhaar validation errors system downtime incomplete synchronization tax identity
47
+ databases errors issued udyam registration certificate incorrect inconsistent
48
+ details including enterprise classification micro small medium gst number address
49
+ business activity ownership information impact rejection loan applications denial
50
+ scheme benefits disqualification government tenders migration related grievances
51
+ failed migration attempts duplicate already registered system errors loss enterprise
52
+ data inability link historical uam records impact disruption
53
+ - UAM/Udyam Registration/Certificate related issues. category encompasses grievances
54
+ related identity creation verification eligibility validation micro small medium
55
+ enterprises msmes udyam registration system udyam registration system serves foundational
56
+ gateway msmes access central state government schemes bank loans subsidies credit
57
+ guarantees public procurement benefits statutory advantages scope purpose category
58
+ covers issues directly impact msme ecosystem including registration related issues
59
+ udyam portal errors issued udyam registration certificate migration related grievances
60
+ legacy udyog aadhaar memorandum uam system udyam portal registration related issues
61
+ registration remains pending failure generate registration number system validation
62
+ errors despite correct data submission causes backend verification delays pan
63
+ aadhaar validation errors system downtime incomplete synchronization tax identity
64
+ databases errors issued udyam registration certificate incorrect inconsistent
65
+ details including enterprise classification micro small medium gst number address
66
+ business activity ownership information impact rejection loan applications denial
67
+ scheme benefits disqualification government tenders migration related grievances
68
+ failed migration attempts duplicate already registered system errors loss enterprise
69
+ data inability link historical uam records impact disruption
70
+ - source_sentence: insurancy company national insurance company limited branch name
71
+ insurance company branch khamgaon branch date application 30 05 2024 policy number
72
+ 281601112410000001 claim kept pending even submitting documents changing requirements
73
+ changed various surveyors delayed insurance claim national insurance company limited
74
+ user reporting insurance claim submitted 30 05 2024 policy number 281601112410000001
75
+ still pending despite submission required documents per changes made various surveyors
76
  sentences:
77
+ - Restructuring of loan. category restructuring loan pertains temporary relief expected
78
+ users periods stress line reserve bank india rbi frameworks key expectations include
79
+ fair restructuring protection declared non performing asset npa transparent restructuring
80
+ terms however practice several failures occur due following reasons failures loan
81
+ restructuring banks delay restructuring account slips npa banks deny restructuring
82
+ without providing written explanations banks fail formally acknowledge micro small
83
+ medium enterprises msme stress banks adopt fear based rejection approaches typical
84
+ grievance scenarios msmes eligible restructuring rbi guidelines refused bank without
85
+ written reasons banks ignore impact covid market slowdowns instead pressure borrowers
86
+ recovery restructuring applications remain undecided month communication loans
87
+ restructured revised emi equated monthly installment terms clearly explained accounts
88
+ declared npa without considering pending restructuring requests branch officials
89
+ claim restructuring targets exhausted despite limits mentioned guidelines operational
90
+ procedural policy institutional causes policy non implementation bank risk aversion
91
+ deliberate timing manipulation
92
+ - Delayed Payment/MSEFC related issues/Online Dispute Resolution (ODR). delayed
93
+ payment msefc related issues category encompasses grievances arising buyer default
94
+ payment micro small enterprises msmes provisions micro small medium enterprises
95
+ development msmed act 2006 specifically sections 15 23 category strictly limited
96
+ cases delayed withheld payments buyers include delays caused banks financial institutions
97
+ loan disbursement processes scope purpose category covers situations msme supplied
98
+ goods services raised valid invoice buyer accepted delivery payment remains pending
99
+ beyond 45 days agreed credit period whichever earlier either fully partially applies
100
+ government departments public sector undertakings psus private sector buyers including
101
+ cases buyers acknowledge dues continue postpone payment without justification
102
+ release partial payments withholding balance without raising quality contractual
103
+ dispute category also covers procedural delays within micro small enterprises
104
+ facilitation council msefc mechanism cases filed msmes listed hearing remain indefinitely
105
+ conciliation stage final orders awards delayed unsigned uploaded despite completion
106
+ hearings submission documents issues scenarios buyer default payment including
107
+ delayed payment beyond 45 days agreed credit period withheld payment without justification
108
+ release partial payments withholding balance non payment despite buyer acknowledgment
109
+ repeated follow ups procedural delays within msefc mechanism including non listing
110
+ cases hearing
111
+ - Insurance Claim related issues. category encompasses grievances related insurance
112
+ claims associated various government backed private insurance products scope includes
113
+ 1 esic employees state insurance corporation insurance benefits 2 epfo employees
114
+ provident fund organisation linked insurance benefits including edli employees
115
+ deposit linked insurance 3 cgtmse credit guarantee fund trust micro small enterprises
116
+ linked insurance elements 4 private general business insurance products government
117
+ department psu public sector undertaking bank acts intermediary implementing authority
118
+ category covers range issues including opaque rejection decisions undocumented
119
+ policy exclusions administrative closure without explanation shifting risk liability
120
+ onto msmes micro small medium enterprises employees document data mismatches across
121
+ multiple systems aadhaar uan universal account number employer filings bank records
122
+ insurance portals delays non responsiveness esic epfo insurer field office levels
123
+ manual bottlenecks officer transfers lack accountability jurisdictional overlaps
124
+ involving labour compliance banking conditions inter agency disputes insurers
125
+ banks employers labour authorities example issues include rejected esic medical
126
+ reimbursement claims due ineligibility despite continuous contribution history
127
+ denied epfo edli insurance claims due alleged break service caused employer side
128
+ portal errors rejected bank linked business insurance claims based undisclosed
129
+ policy clauses unhonoured cg
130
+ - source_sentence: name swarangi swapnil kadam uam mh28d0000281 want migrate uam udyam
131
+ registration dont contact number email id used uam please update new mobile phone
132
+ email id pranjalilingayat1986gmail com profile attaching copy uam along mail please
133
+ update details soon possible migration uam udyam registration user requesting
134
+ migration existing uam uam mh28d0000281 udyam registration updating contact details
135
+ profile
136
  sentences:
137
+ - UAM/Udyam Registration/Certificate related issues. category encompasses grievances
138
+ related identity creation verification eligibility validation micro small medium
139
+ enterprises msmes udyam registration system udyam registration system serves foundational
140
+ gateway msmes access central state government schemes bank loans subsidies credit
141
+ guarantees public procurement benefits statutory advantages scope purpose category
142
+ covers issues directly impact msme ecosystem including registration related issues
143
+ udyam portal errors issued udyam registration certificate migration related grievances
144
+ legacy udyog aadhaar memorandum uam system udyam portal registration related issues
145
+ registration remains pending failure generate registration number system validation
146
+ errors despite correct data submission causes backend verification delays pan
147
+ aadhaar validation errors system downtime incomplete synchronization tax identity
148
+ databases errors issued udyam registration certificate incorrect inconsistent
149
+ details including enterprise classification micro small medium gst number address
150
+ business activity ownership information impact rejection loan applications denial
151
+ scheme benefits disqualification government tenders migration related grievances
152
+ failed migration attempts duplicate already registered system errors loss enterprise
153
+ data inability link historical uam records impact disruption
154
+ - Related to NI-MSME. category encompasses grievances related training capacity
155
+ building certification programs administered national institute micro small medium
156
+ enterprises ni msme micro small medium enterprises msmes entrepreneurs employees
157
+ scope category includes issues arising delivery training programs repeatedly postponed
158
+ schedules without prior notification inaccessible online training portals unclear
159
+ eligibility criteria unavailable trainers insufficient mentoring outdated non
160
+ practical course content additionally category captures certification related
161
+ issues including delayed issuance certificates certificates issued incorrect details
162
+ difficulty verifying certificates online failure deliver certificates course completion
163
+ furthermore category includes course enrollment admission disputes unjustified
164
+ rejection enrollment despite meeting eligibility criteria incorrect fee charges
165
+ delayed refunds confirmed admissions without available training slots miscommunication
166
+ batch size selection criteria grievances reflect administrative friction execution
167
+ gaps ni msme training ecosystem directly impact msmes workforce skill development
168
+ compliance readiness eligibility schemes linked certified training example issues
169
+ include ni msme training program announced schedule postponed multiple times without
170
+ intimation completed ni msme course certificate issued even several months affecting
171
+ eligibility schemes enrollment rejected despite meeting eligibility criteria clarification
172
+ provided online training login working ni msme support responding emails wrong
173
+ details printed ni ms
174
+ - UAM/Udyam Registration/Certificate related issues. category encompasses grievances
175
+ related identity creation verification eligibility validation micro small medium
176
+ enterprises msmes udyam registration system udyam registration system serves foundational
177
+ gateway msmes access central state government schemes bank loans subsidies credit
178
+ guarantees public procurement benefits statutory advantages scope purpose category
179
+ covers issues directly impact msme ecosystem including registration related issues
180
+ udyam portal errors issued udyam registration certificate migration related grievances
181
+ legacy udyog aadhaar memorandum uam system udyam portal registration related issues
182
+ registration remains pending failure generate registration number system validation
183
+ errors despite correct data submission causes backend verification delays pan
184
+ aadhaar validation errors system downtime incomplete synchronization tax identity
185
+ databases errors issued udyam registration certificate incorrect inconsistent
186
+ details including enterprise classification micro small medium gst number address
187
+ business activity ownership information impact rejection loan applications denial
188
+ scheme benefits disqualification government tenders migration related grievances
189
+ failed migration attempts duplicate already registered system errors loss enterprise
190
+ data inability link historical uam records impact disruption
191
+ - source_sentence: vishal kumar unit address vill sanghour babain phone sir mene msme
192
+ scheme ke kvic scheme se 2020 loan liya tha jisme mujhe 35 subsidy mili thi jo
193
+ mujhe bola gya tha ki subsidy ka laabh aapko jb aapka loan ko 3 saal baad mil
194
+ jayega 2023 mere laon ko 3 saal ho gye tb kvic office ambala gya vaha se staff
195
+ ne bola ki aabhi apki verificatian pending hai fir september 2024 meri unit ki
196
+ verification b ho gyi uske baad fir kvic office ambala gya tb b vaha k staff ne
197
+ bola ki abhi time lgega ambala office vala staff bolte h ki verification department
198
+ ki problem h verification department bolta h ki kvic office ambala ki problem
199
+ h mene bhut chaakr lgaa diye office k mujhe koi subsidy realising latter nhi mila
200
+ mujhe sep 2023 k baad loan ki kist continue deni pd rhi hai kisto se jo mujhe
201
+ subsidy kaa laabh milna chaiye tha vo mujhe nhi mila paya hai mujhe extra peyment
202
+ deni pr rhi bhut pershan ho gya hu office k chakkar lgaa lgaa k aapse request
203
+ h ki mujhe subsidy releasing latter mil jayye thankyou non receipt subsidy kvic
204
+ scheme user reporting non receipt subsidy despite eligible completed verification
205
+ process requesting assistance obtaining subsidy realization letter
206
  sentences:
207
+ - Related to DCMSME Scheme. category related grievances dcmsme scheme specifically
208
+ focusing issues related access credit banks micro small medium enterprises msmes
209
+ category applies commercial banks regional rural banks rrbs cooperative banks
210
+ covers cases bottleneck lies entirely bank level excludes issues related rbi policy
211
+ government scheme design credit guarantee mechanisms buyer default rather addresses
212
+ bank side processing conditions conduct extending credit msmes category includes
213
+ cases msmes applied loans submitted required documents followed branches digital
214
+ portals loan application remains pending without formal sanction rejection decision
215
+ captures administrative stalling prolonged process pending verification status
216
+ absence deficiency letters timelines repeated demands already submitted documents
217
+ failure branch offices forward eligible applications regional head offices approval
218
+ additionally category covers situations loans formally sanctioned disbursement
219
+ delayed withheld bank without valid documented reasons includes cases prolonged
220
+ non disbursement despite fulfilment sanction conditions partial disbursement unexplained
221
+ withholding balance amount delays citing internal audits reviews imposition additional
222
+ post sanction conditions mentioned original sanction letter category also includes
223
+ grievances related excessive unreasonable collateral demands banks security requirements
224
+ exceed applicable msme rbi cgtmse guidelines includes insistence collateral despite
225
+ eligibility credit guarantee coverage demands disproportionate collateral value
226
+ rejection loan applications solely due refusal provide personal residential property
227
+ security requirements subcategories 1 tcec division implementation scheme establishment
228
+ new technology centres extension centres 2 economic analysis 3 statistics data
229
+ division 4 national awards 5 entrepreneurship skill development programmes esdp
230
+ 6 vendor development programme ancillarisation 7 export promotion wto 8 msme policy
231
+ industry associations related issues 9 software related 10 zero defect zero effect
232
+ zed 11 technology center system program tcsp 12 north east region cell ner promotion
233
+ msmes ner sikkim 13 international trade fair itf international cooperation ic
234
+ 14 support entrepreneurial managerial development smes incubators nmcp scheme
235
+ 15 building awareness intellectual property rights ipr micro small medium enterprises
236
+ nmcp scheme 16 lean manufacturing competitiveness scheme lmcs 17 design clinic
237
+ scheme nmcp scheme 18 pms scheme 19 technology quality upgradation tequp support
238
+ msmes nmcp scheme 20 digital msme nmcp scheme 21 micro small enterprises cluster
239
+ development programme mse cdp 22 credit linked capital subsidy technology upgradation
240
+ clcs tu special clcs sc st 23 credit guarantee fund micro small enterprises cgtmse
241
+ 24 market development assistance mda msmes
242
+ - Related to Scheme of KVIC. category encompasses grievances related schemes subsidies
243
+ certifications implementation processes administered khadi village industries
244
+ commission kvic implementing authorities including state kvic district industries
245
+ centre dic offices specifically addresses issues originate kvic field level offices
246
+ excluding problems solely banks generic msme schemes non kvic authorities category
247
+ covers range issues including 1 delays failures release pmegp margin money subsidies
248
+ loans already sanctioned units set kvic credited subsidy bank due pending portal
249
+ actions physical verification delays repeated document objections prolonged process
250
+ status without timelines 2 grievances related khadi subsidies including non release
251
+ partial release unexplained reduction admissible subsidy amounts stoppage subsidy
252
+ citing non compliance without sharing inspection reports deviations prescribed
253
+ scheme norms determining subsidy eligibility quantum 3 issues related kvic certification
254
+ registration including pending delayed issuance khadi certificates cancellation
255
+ certification without prior notice stated reasons inspection related delays without
256
+ clarification delayed renewal certificates directly affect eligibility subsidies
257
+ tenders market access subcategories 1 providing financial assistance set new enterprises
258
+ pmegp 2 providing insurance cover khadi artisans aam admi bima yojana 3 providing
259
+ financial assistance khadi institutions mda 4 workshed scheme khadi artisans 5
260
+ loans interest subsidy eligibility certificate scheme isec 6 mission solar charkha
261
+ - UAM/Udyam Registration/Certificate related issues. category encompasses grievances
262
+ related identity creation verification eligibility validation micro small medium
263
+ enterprises msmes udyam registration system udyam registration system serves foundational
264
+ gateway msmes access central state government schemes bank loans subsidies credit
265
+ guarantees public procurement benefits statutory advantages scope purpose category
266
+ covers issues directly impact msme ecosystem including registration related issues
267
+ udyam portal errors issued udyam registration certificate migration related grievances
268
+ legacy udyog aadhaar memorandum uam system udyam portal registration related issues
269
+ registration remains pending failure generate registration number system validation
270
+ errors despite correct data submission causes backend verification delays pan
271
+ aadhaar validation errors system downtime incomplete synchronization tax identity
272
+ databases errors issued udyam registration certificate incorrect inconsistent
273
+ details including enterprise classification micro small medium gst number address
274
+ business activity ownership information impact rejection loan applications denial
275
+ scheme benefits disqualification government tenders migration related grievances
276
+ failed migration attempts duplicate already registered system errors loss enterprise
277
+ data inability link historical uam records impact disruption
278
+ - source_sentence: dear sir mam trying register udyam pan error showing udyam registration
279
+ already done pan registered earlier please guide aadhaar uam pan pan mobile phone
280
+ clarification existing udyam registration user requesting clarification udyam
281
+ registration portal indicates registration already done pan although user states
282
+ registration made
283
  sentences:
284
+ - UAM/Udyam Registration/Certificate related issues. category encompasses grievances
285
+ related identity creation verification eligibility validation micro small medium
286
+ enterprises msmes udyam registration system udyam registration system serves foundational
287
+ gateway msmes access central state government schemes bank loans subsidies credit
288
+ guarantees public procurement benefits statutory advantages scope purpose category
289
+ covers issues directly impact msme ecosystem including registration related issues
290
+ udyam portal errors issued udyam registration certificate migration related grievances
291
+ legacy udyog aadhaar memorandum uam system udyam portal registration related issues
292
+ registration remains pending failure generate registration number system validation
293
+ errors despite correct data submission causes backend verification delays pan
294
+ aadhaar validation errors system downtime incomplete synchronization tax identity
295
+ databases errors issued udyam registration certificate incorrect inconsistent
296
+ details including enterprise classification micro small medium gst number address
297
+ business activity ownership information impact rejection loan applications denial
298
+ scheme benefits disqualification government tenders migration related grievances
299
+ failed migration attempts duplicate already registered system errors loss enterprise
300
+ data inability link historical uam records impact disruption
301
+ - UAM/Udyam Registration/Certificate related issues. category encompasses grievances
302
+ related identity creation verification eligibility validation micro small medium
303
+ enterprises msmes udyam registration system udyam registration system serves foundational
304
+ gateway msmes access central state government schemes bank loans subsidies credit
305
+ guarantees public procurement benefits statutory advantages scope purpose category
306
+ covers issues directly impact msme ecosystem including registration related issues
307
+ udyam portal errors issued udyam registration certificate migration related grievances
308
+ legacy udyog aadhaar memorandum uam system udyam portal registration related issues
309
+ registration remains pending failure generate registration number system validation
310
+ errors despite correct data submission causes backend verification delays pan
311
+ aadhaar validation errors system downtime incomplete synchronization tax identity
312
+ databases errors issued udyam registration certificate incorrect inconsistent
313
+ details including enterprise classification micro small medium gst number address
314
+ business activity ownership information impact rejection loan applications denial
315
+ scheme benefits disqualification government tenders migration related grievances
316
+ failed migration attempts duplicate already registered system errors loss enterprise
317
+ data inability link historical uam records impact disruption
318
+ - UAM/Udyam Registration/Certificate related issues. category encompasses grievances
319
+ related identity creation verification eligibility validation micro small medium
320
+ enterprises msmes udyam registration system udyam registration system serves foundational
321
+ gateway msmes access central state government schemes bank loans subsidies credit
322
+ guarantees public procurement benefits statutory advantages scope purpose category
323
+ covers issues directly impact msme ecosystem including registration related issues
324
+ udyam portal errors issued udyam registration certificate migration related grievances
325
+ legacy udyog aadhaar memorandum uam system udyam portal registration related issues
326
+ registration remains pending failure generate registration number system validation
327
+ errors despite correct data submission causes backend verification delays pan
328
+ aadhaar validation errors system downtime incomplete synchronization tax identity
329
+ databases errors issued udyam registration certificate incorrect inconsistent
330
+ details including enterprise classification micro small medium gst number address
331
+ business activity ownership information impact rejection loan applications denial
332
+ scheme benefits disqualification government tenders migration related grievances
333
+ failed migration attempts duplicate already registered system errors loss enterprise
334
+ data inability link historical uam records impact disruption
335
  pipeline_tag: sentence-similarity
336
  library_name: sentence-transformers
337
  ---
338
 
339
+ # SentenceTransformer based on sentence-transformers/all-MiniLM-L6-v2
340
 
341
+ This is a [sentence-transformers](https://www.SBERT.net) model finetuned from [sentence-transformers/all-MiniLM-L6-v2](https://huggingface.co/sentence-transformers/all-MiniLM-L6-v2). It maps sentences & paragraphs to a 384-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more.
342
 
343
  ## Model Details
344
 
345
  ### Model Description
346
  - **Model Type:** Sentence Transformer
347
+ - **Base model:** [sentence-transformers/all-MiniLM-L6-v2](https://huggingface.co/sentence-transformers/all-MiniLM-L6-v2) <!-- at revision c9745ed1d9f207416be6d2e6f8de32d1f16199bf -->
348
+ - **Maximum Sequence Length:** 64 tokens
349
+ - **Output Dimensionality:** 384 dimensions
350
  - **Similarity Function:** Cosine Similarity
351
  <!-- - **Training Dataset:** Unknown -->
352
  <!-- - **Language:** Unknown -->
 
362
 
363
  ```
364
  SentenceTransformer(
365
+ (0): Transformer({'max_seq_length': 64, 'do_lower_case': False, 'architecture': 'BertModel'})
366
+ (1): Pooling({'word_embedding_dimension': 384, 'pooling_mode_cls_token': False, 'pooling_mode_mean_tokens': True, 'pooling_mode_max_tokens': False, 'pooling_mode_mean_sqrt_len_tokens': False, 'pooling_mode_weightedmean_tokens': False, 'pooling_mode_lasttoken': False, 'include_prompt': True})
367
  (2): Normalize()
368
  )
369
  ```
 
386
  model = SentenceTransformer("sentence_transformers_model_id")
387
  # Run inference
388
  sentences = [
389
+ 'dear sir mam trying register udyam pan error showing udyam registration already done pan registered earlier please guide aadhaar uam pan pan mobile phone clarification existing udyam registration user requesting clarification udyam registration portal indicates registration already done pan although user states registration made',
390
+ 'UAM/Udyam Registration/Certificate related issues. category encompasses grievances related identity creation verification eligibility validation micro small medium enterprises msmes udyam registration system udyam registration system serves foundational gateway msmes access central state government schemes bank loans subsidies credit guarantees public procurement benefits statutory advantages scope purpose category covers issues directly impact msme ecosystem including registration related issues udyam portal errors issued udyam registration certificate migration related grievances legacy udyog aadhaar memorandum uam system udyam portal registration related issues registration remains pending failure generate registration number system validation errors despite correct data submission causes backend verification delays pan aadhaar validation errors system downtime incomplete synchronization tax identity databases errors issued udyam registration certificate incorrect inconsistent details including enterprise classification micro small medium gst number address business activity ownership information impact rejection loan applications denial scheme benefits disqualification government tenders migration related grievances failed migration attempts duplicate already registered system errors loss enterprise data inability link historical uam records impact disruption',
391
+ 'UAM/Udyam Registration/Certificate related issues. category encompasses grievances related identity creation verification eligibility validation micro small medium enterprises msmes udyam registration system udyam registration system serves foundational gateway msmes access central state government schemes bank loans subsidies credit guarantees public procurement benefits statutory advantages scope purpose category covers issues directly impact msme ecosystem including registration related issues udyam portal errors issued udyam registration certificate migration related grievances legacy udyog aadhaar memorandum uam system udyam portal registration related issues registration remains pending failure generate registration number system validation errors despite correct data submission causes backend verification delays pan aadhaar validation errors system downtime incomplete synchronization tax identity databases errors issued udyam registration certificate incorrect inconsistent details including enterprise classification micro small medium gst number address business activity ownership information impact rejection loan applications denial scheme benefits disqualification government tenders migration related grievances failed migration attempts duplicate already registered system errors loss enterprise data inability link historical uam records impact disruption',
392
  ]
393
  embeddings = model.encode(sentences)
394
  print(embeddings.shape)
395
+ # [3, 384]
396
 
397
  # Get the similarity scores for the embeddings
398
  similarities = model.similarity(embeddings, embeddings)
399
  print(similarities)
400
+ # tensor([[1.0000, 0.7274, 0.7274],
401
+ # [0.7274, 1.0000, 1.0000],
402
+ # [0.7274, 1.0000, 1.0000]])
403
  ```
404
 
405
  <!--
 
444
 
445
  #### Unnamed Dataset
446
 
447
+ * Size: 98 training samples
448
+ * Columns: <code>sentence_0</code> and <code>sentence_1</code>
449
+ * Approximate statistics based on the first 98 samples:
450
+ | | sentence_0 | sentence_1 |
451
+ |:--------|:-----------------------------------------------------------------------------------|:----------------------------------------------------------------------------------|
452
+ | type | string | string |
453
+ | details | <ul><li>min: 20 tokens</li><li>mean: 59.08 tokens</li><li>max: 64 tokens</li></ul> | <ul><li>min: 64 tokens</li><li>mean: 64.0 tokens</li><li>max: 64 tokens</li></ul> |
454
  * Samples:
455
+ | sentence_0 | sentence_1 |
456
+ |:---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|:---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|
457
+ | <code>availed pmegp subsidy paper carry bag manufacturing unit 2020 iob bank kottayam three years paid loan amount correctly time without failure inspection needed sanction subsidy done yet since keen paying loan bringing burden financially please needful arrange inspection udyam reg kl 07 0005226 thanking non conduct inspection pmegp subsidy msme dfo user reporting despite timely loan repayment inspection required sanctioning pmegp subsidy paper carry bag manufacturing unit conducted causing financial burden requesting assistance earliest possible inspection</code> | <code>Related to MSME-DFO. category encompasses grievances related field level execution failures msme development facilitation offices dfos responsible facilitating msme schemes loans subsidies services scope category includes field level execution failures non responsive dfo officers failure provide guidance documentation procedures inaction queries submitted champions physical visits inspection delays inconsistencies postponed repeatedly rescheduled site visits delayed inspection reports unnecessary multiple inspections stall loan disbursement subsidy release local facilitation coordination failures misrouting applications offices lack facilitation land utilities approvals unavailability promised local support services poor coordination dfos banks psus state nodal officers resulting projects remaining stuck despite eligibility prior approvals example issues dfo officials responding phone calls emails regarding subsidy applications guidance provided required documents site inspection msme ...</code> |
458
+ | <code>unable edit district udhyam certificate please help editing district udyam certificate user requesting assistance edit district udyam certificate</code> | <code>UAM/Udyam Registration/Certificate related issues. category encompasses grievances related identity creation verification eligibility validation micro small medium enterprises msmes udyam registration system udyam registration system serves foundational gateway msmes access central state government schemes bank loans subsidies credit guarantees public procurement benefits statutory advantages scope purpose category covers issues directly impact msme ecosystem including registration related issues udyam portal errors issued udyam registration certificate migration related grievances legacy udyog aadhaar memorandum uam system udyam portal registration related issues registration remains pending failure generate registration number system validation errors despite correct data submission causes backend verification delays pan aadhaar validation errors system downtime incomplete synchronization tax identity databases errors issued udyam registration certificate incorrect inconsistent detai...</code> |
459
+ | <code>loanagreement isbl00910729978dated26 09 2024 loan payment pending since 29 sep 2024 hdfc bank returned cheque stating alteration rbi guidelines pli nodal agencies contact numbers found service unable connect attached loan agreement pdf reference please support get resolution pending since 29 sep 2024 non receipt loan payment dcmsme scheme user reporting non receipt loan payment since 29 09 2024 citing hdfc bank return cheque alteration rbi guidelines requesting assistance resolving issue</code> | <code>Related to DCMSME Scheme. category related grievances dcmsme scheme specifically focusing issues related access credit banks micro small medium enterprises msmes category applies commercial banks regional rural banks rrbs cooperative banks covers cases bottleneck lies entirely bank level excludes issues related rbi policy government scheme design credit guarantee mechanisms buyer default rather addresses bank side processing conditions conduct extending credit msmes category includes cases msmes applied loans submitted required documents followed branches digital portals loan application remains pending without formal sanction rejection decision captures administrative stalling prolonged process pending verification status absence deficiency letters timelines repeated demands already submitted documents failure branch offices forward eligible applications regional head offices approval additionally category covers situations loans formally sanctioned disbursement delayed withheld bank ...</code> |
460
+ * Loss: [<code>MultipleNegativesRankingLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#multiplenegativesrankingloss) with these parameters:
461
  ```json
462
  {
463
+ "scale": 20.0,
464
+ "similarity_fct": "cos_sim",
465
+ "gather_across_devices": false
466
  }
467
  ```
468
 
469
  ### Training Hyperparameters
470
  #### Non-Default Hyperparameters
471
 
472
+ - `per_device_train_batch_size`: 2
473
+ - `per_device_eval_batch_size`: 2
474
+ - `num_train_epochs`: 2
475
  - `fp16`: True
476
  - `multi_dataset_batch_sampler`: round_robin
477
 
 
481
  - `do_predict`: False
482
  - `eval_strategy`: no
483
  - `prediction_loss_only`: True
484
+ - `per_device_train_batch_size`: 2
485
+ - `per_device_eval_batch_size`: 2
486
  - `gradient_accumulation_steps`: 1
487
  - `eval_accumulation_steps`: None
488
  - `torch_empty_cache_steps`: None
 
492
  - `adam_beta2`: 0.999
493
  - `adam_epsilon`: 1e-08
494
  - `max_grad_norm`: 1
495
+ - `num_train_epochs`: 2
496
  - `max_steps`: -1
497
  - `lr_scheduler_type`: linear
498
  - `lr_scheduler_kwargs`: None
 
604
  }
605
  ```
606
 
607
+ #### MultipleNegativesRankingLoss
608
  ```bibtex
609
+ @misc{henderson2017efficient,
610
+ title={Efficient Natural Language Response Suggestion for Smart Reply},
611
+ author={Matthew Henderson and Rami Al-Rfou and Brian Strope and Yun-hsuan Sung and Laszlo Lukacs and Ruiqi Guo and Sanjiv Kumar and Balint Miklos and Ray Kurzweil},
612
  year={2017},
613
+ eprint={1705.00652},
614
  archivePrefix={arXiv},
615
+ primaryClass={cs.CL}
616
  }
617
  ```
618
 
config.json CHANGED
@@ -1,24 +1,30 @@
1
  {
 
2
  "architectures": [
3
- "MPNetModel"
4
  ],
5
  "attention_probs_dropout_prob": 0.1,
6
- "bos_token_id": 0,
 
7
  "dtype": "float32",
8
- "eos_token_id": 2,
 
9
  "hidden_act": "gelu",
10
  "hidden_dropout_prob": 0.1,
11
- "hidden_size": 768,
12
  "initializer_range": 0.02,
13
- "intermediate_size": 3072,
14
- "layer_norm_eps": 1e-05,
15
- "max_position_embeddings": 514,
16
- "model_type": "mpnet",
 
17
  "num_attention_heads": 12,
18
- "num_hidden_layers": 12,
19
- "pad_token_id": 1,
20
- "relative_attention_num_buckets": 32,
21
  "tie_word_embeddings": true,
22
  "transformers_version": "5.0.0",
23
- "vocab_size": 30527
 
 
24
  }
 
1
  {
2
+ "add_cross_attention": false,
3
  "architectures": [
4
+ "BertModel"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": null,
8
+ "classifier_dropout": null,
9
  "dtype": "float32",
10
+ "eos_token_id": null,
11
+ "gradient_checkpointing": false,
12
  "hidden_act": "gelu",
13
  "hidden_dropout_prob": 0.1,
14
+ "hidden_size": 384,
15
  "initializer_range": 0.02,
16
+ "intermediate_size": 1536,
17
+ "is_decoder": false,
18
+ "layer_norm_eps": 1e-12,
19
+ "max_position_embeddings": 512,
20
+ "model_type": "bert",
21
  "num_attention_heads": 12,
22
+ "num_hidden_layers": 6,
23
+ "pad_token_id": 0,
24
+ "position_embedding_type": "absolute",
25
  "tie_word_embeddings": true,
26
  "transformers_version": "5.0.0",
27
+ "type_vocab_size": 2,
28
+ "use_cache": true,
29
+ "vocab_size": 30522
30
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:df5af0b1556413bbed5ce25011b728de502822d45dde1ed41bc4044fb1e9c519
3
- size 437967648
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bfb2fedc427d6f0ab914cc80fa199fec65b7c465018cd0a684c01f512a2927d4
3
+ size 90864176
sentence_bert_config.json CHANGED
@@ -1,4 +1,4 @@
1
  {
2
- "max_seq_length": 384,
3
  "do_lower_case": false
4
  }
 
1
  {
2
+ "max_seq_length": 64,
3
  "do_lower_case": false
4
  }
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json CHANGED
@@ -1,16 +1,16 @@
1
  {
2
  "backend": "tokenizers",
3
- "bos_token": "<s>",
4
- "cls_token": "<s>",
5
  "do_lower_case": true,
6
- "eos_token": "</s>",
7
  "is_local": false,
8
- "mask_token": "<mask>",
9
- "model_max_length": 384,
10
- "pad_token": "<pad>",
11
- "sep_token": "</s>",
 
12
  "strip_accents": null,
13
  "tokenize_chinese_chars": true,
14
- "tokenizer_class": "MPNetTokenizer",
15
  "unk_token": "[UNK]"
16
  }
 
1
  {
2
  "backend": "tokenizers",
3
+ "cls_token": "[CLS]",
4
+ "do_basic_tokenize": true,
5
  "do_lower_case": true,
 
6
  "is_local": false,
7
+ "mask_token": "[MASK]",
8
+ "model_max_length": 256,
9
+ "never_split": null,
10
+ "pad_token": "[PAD]",
11
+ "sep_token": "[SEP]",
12
  "strip_accents": null,
13
  "tokenize_chinese_chars": true,
14
+ "tokenizer_class": "BertTokenizer",
15
  "unk_token": "[UNK]"
16
  }