Upload folder using huggingface_hub
Browse files
- 1_Pooling/config.json +10 -0
- README.md +554 -3
- config.json +23 -0
- config_sentence_transformers.json +10 -0
- model.safetensors +3 -0
- modules.json +20 -0
- sentence_bert_config.json +4 -0
- special_tokens_map.json +51 -0
- tokenizer.json +0 -0
- tokenizer_config.json +73 -0
- vocab.txt +0 -0
1_Pooling/config.json
ADDED
|
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"word_embedding_dimension": 768,
|
| 3 |
+
"pooling_mode_cls_token": false,
|
| 4 |
+
"pooling_mode_mean_tokens": true,
|
| 5 |
+
"pooling_mode_max_tokens": false,
|
| 6 |
+
"pooling_mode_mean_sqrt_len_tokens": false,
|
| 7 |
+
"pooling_mode_weightedmean_tokens": false,
|
| 8 |
+
"pooling_mode_lasttoken": false,
|
| 9 |
+
"include_prompt": true
|
| 10 |
+
}
|
README.md
CHANGED
|
@@ -1,3 +1,554 @@
|
|
| 1 |
-
---
|
| 2 |
-
|
| 3 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
---
|
| 2 |
+
tags:
|
| 3 |
+
- sentence-transformers
|
| 4 |
+
- sentence-similarity
|
| 5 |
+
- feature-extraction
|
| 6 |
+
- generated_from_trainer
|
| 7 |
+
- dataset_size:27191
|
| 8 |
+
- loss:TripletLoss
|
| 9 |
+
base_model: sentence-transformers/all-mpnet-base-v2
|
| 10 |
+
widget:
|
| 11 |
+
- source_sentence: MySafetyEye offers an innovative and sustainable home surveillance
|
| 12 |
+
and alarm solution that repurposes old smartphones or tablets into monitoring
|
| 13 |
+
devices. Users can install the app on their primary phone and the old device to
|
| 14 |
+
set up a home alarm system in under two minutes. The service includes free home
|
| 15 |
+
surveillance and a subscription-based home alarm feature with motion detection.
|
| 16 |
+
When motion is detected, an alarm notification is sent to the user's primary smartphone,
|
| 17 |
+
providing a picture of the event. The system also supports automatic activation
|
| 18 |
+
and deactivation based on the family's geolocation, enhancing convenience and
|
| 19 |
+
security.
|
| 20 |
+
sentences:
|
| 21 |
+
- CREDO FISH was a Denmark-based company specializing in the import and export of
|
| 22 |
+
seafood products, including tiger-shark and angel-shark. Established on December
|
| 23 |
+
1, 1995, the company was headquartered in Frederikshavn, Nordjylland. It ceased
|
| 24 |
+
operations on December 21, 2021.
|
| 25 |
+
- Software-Pro ApS provides technology consulting services, specializing in testing
|
| 26 |
+
and quality assurance. The company assists clients in testing their software and
|
| 27 |
+
optimizing processes to enhance predictability in software development. Software-Pro
|
| 28 |
+
serves customers in Denmark.
|
| 29 |
+
- Living Places is a comprehensive online resource dedicated to providing detailed
|
| 30 |
+
information about homes, neighborhoods, towns, and counties across the United
|
| 31 |
+
States. The platform offers insights into various residential subdivisions, architectural
|
| 32 |
+
styles, and historical areas, catering to individuals seeking to learn more about
|
| 33 |
+
different living environments. With a focus on U.S. neighborhoods and towns, Living
|
| 34 |
+
Places serves as a valuable guide for those exploring housing options and community
|
| 35 |
+
characteristics.
|
| 36 |
+
- source_sentence: Hindholm Privatskole is a private school located in Fuglebjerg,
|
| 37 |
+
Denmark, offering education from kindergarten through 9th grade. The school emphasizes
|
| 38 |
+
a respectful and inclusive environment, with a focus on holistic development through
|
| 39 |
+
varied learning experiences. Surrounded by nature, the campus features a lake,
|
| 40 |
+
green areas, sports fields, playgrounds, and a forest area utilized for both educational
|
| 41 |
+
and recreational purposes. Hindholm Privatskole maintains small class sizes, with
|
| 42 |
+
a maximum of 24 students per class, and upholds traditions such as daily morning
|
| 43 |
+
singing sessions and annual excursions to enhance the educational experience.
|
| 44 |
+
sentences:
|
| 45 |
+
- Flindt-Kristensen is a Danish engineering firm specializing in product development,
|
| 46 |
+
concept design, structural analysis, and technical drawings. They offer services
|
| 47 |
+
such as transport tools, lifting tools, and special projects, aiming to add value
|
| 48 |
+
through innovation and extensive technical knowledge. Their core values include
|
| 49 |
+
service, dedication, ambition, innovation, and fun.
|
| 50 |
+
- Automators Holding ApS is a Danish company located at Knud Kristensens Gade 11,
|
| 51 |
+
2300 København S. The company is active and has a Legal Entity Identifier (LEI)
|
| 52 |
+
code of 98450061ACA903B44085. As of the latest available data, Automators Holding
|
| 53 |
+
ApS has one employee. Further details about the company's operations, products,
|
| 54 |
+
or services are not readily available from the provided sources.
|
| 55 |
+
- 'Blomsterhaven is an integrated institution for children aged 0-6 years, operating
|
| 56 |
+
under Sydbyens Børnehus. It comprises three houses: Anemonen, Bellis, and Crocus,
|
| 57 |
+
accommodating up to 110 children. Located in a mixed residential and industrial
|
| 58 |
+
area near the local school, each house features large playgrounds tailored to
|
| 59 |
+
different age groups, promoting motor and sensory development. The facility offers
|
| 60 |
+
30 nursery and 80 kindergarten places, staffed by 24 permanent employees and 3
|
| 61 |
+
regular substitutes. Blomsterhaven emphasizes Danish traditions and utilizes the
|
| 62 |
+
surrounding nature for educational activities.'
|
| 63 |
+
- source_sentence: MENSEL & KASTEN RÅDGIVENDE EL-INGENIØRFIRMA is a Danish engineering
|
| 64 |
+
consultancy firm specializing in electrical engineering services for construction
|
| 65 |
+
and civil engineering projects. Established in 1996, the company is based in Løgumkloster,
|
| 66 |
+
Denmark. ([ownr.dk](https://ownr.dk/companies/public-profile/19115976?utm_source=openai))
|
| 67 |
+
The firm focuses on providing expert advice and solutions in the field of electrical
|
| 68 |
+
engineering, catering to various construction and infrastructure projects.
|
| 69 |
+
sentences:
|
| 70 |
+
- Dottir is a dynamic business law firm specializing in technology, intellectual
|
| 71 |
+
property, and data protection. Founded nearly a decade ago by attorneys from top
|
| 72 |
+
law firms, Dottir has evolved to meet the growing demand for legal services in
|
| 73 |
+
the expanding technology sector. Their globally ranked team advises companies
|
| 74 |
+
on a wide range of legal matters arising from technology transactions, regulatory
|
| 75 |
+
requirements, litigation, and regulatory enforcement proceedings. They assist
|
| 76 |
+
fast-growing tech companies in protecting strategic IP assets and translating
|
| 77 |
+
business models into solid legal documents. Their services also cover assisting
|
| 78 |
+
large corporations in outsourcing or transforming business-critical IT systems
|
| 79 |
+
and services, dispute resolution concerning complex technology-related disputes,
|
| 80 |
+
as well as AI, data protection, cybersecurity, and other data-related compliance
|
| 81 |
+
issues.
|
| 82 |
+
- 'Brenstensgård is a Danish partnership established in 2021, specializing in the
|
| 83 |
+
production of slaughter pigs. Located at Splitad 2, 8970 Havndal, the company
|
| 84 |
+
is owned equally by five partners: Valdemar Bay-Smidt, Tina Bay-Smidt, Suzy Storm,
|
| 85 |
+
Lars Bay-Smidt, and Hanne Bay-Smidt Lysgaard, each holding a 20% stake. ([paqle.dk](https://www.paqle.dk/p/brenstensg%C3%A5rd-i-s/6402918?utm_source=openai))'
|
| 86 |
+
- GROVE-NIELSEN ApS is a Danish company that has published financial statements
|
| 87 |
+
for the years 2010 through 2013. The company reported profits in 2012 and 2013,
|
| 88 |
+
with net results of DKK 312,000 and DKK 279,000, respectively. The company's total
|
| 89 |
+
assets increased from DKK 2.821 million in 2012 to DKK 2.986 million in 2013,
|
| 90 |
+
and equity rose from DKK 2.710 million to DKK 2.892 million over the same period.
|
| 91 |
+
Further details about the company's operations or industry are not available from
|
| 92 |
+
the provided information.
|
| 93 |
+
- source_sentence: PM & JØ Holding is a Danish non-financial holding company established
|
| 94 |
+
in 2017, located at Hejrevej 17, 8400 Ebeltoft. The company is co-owned by Palle
|
| 95 |
+
Martin Lund Jensen and Jette Ørnbøl Jeppesen, each holding a 50% stake. As a holding
|
| 96 |
+
entity, PM & JØ Holding primarily manages investments in other companies, including
|
| 97 |
+
L-tek A/S, where Palle Martin Lund Jensen serves as director. The company reported
|
| 98 |
+
a net profit of DKK 1.6 million in 2023, reflecting its financial performance
|
| 99 |
+
in managing its portfolio.
|
| 100 |
+
sentences:
|
| 101 |
+
- FAUNA PASSAGE is a Danish company specializing in the research, development, and
|
| 102 |
+
production of products and concepts aimed at protecting wildlife. Established
|
| 103 |
+
on September 1, 1996, and headquartered at Forskerparken 10, 5230 Odense M, the
|
| 104 |
+
company focuses on creating solutions to safeguard fauna from traffic-related
|
| 105 |
+
challenges. Their offerings include wildlife crossings such as tunnels, bridges,
|
| 106 |
+
and other structures designed to facilitate safe animal passage across human-made
|
| 107 |
+
barriers. The company is led by Director Lars Arthur Briggs.
|
| 108 |
+
- "\x0F8ksenm"
|
| 109 |
+
- Fisker Olesen Holding ApS is a Danish holding company established in 2021, located
|
| 110 |
+
at Gammel Kongevej 112, 3, 1850 Frederiksberg C. The company is involved in managing
|
| 111 |
+
investments and overseeing subsidiaries. As of 2023, it reported a gross profit
|
| 112 |
+
of -1 DKK and a pre-tax result of -12 DKK. The company is led by Nina Fisker Olesen,
|
| 113 |
+
who holds multiple business roles in Denmark. ([proff.dk](https://www.proff.dk/firma/nina-fisker-olesen-holding-aps/frederiksberg-c/holdingselskaper/0P9Q29I06Y4?utm_source=openai),
|
| 114 |
+
[ownr.dk](https://ownr.dk/users/public-profile/4008071852?utm_source=openai))
|
| 115 |
+
- source_sentence: Gammellund Ejendomme is a Danish real estate company based in Odense,
|
| 116 |
+
Denmark. The company specializes in property development, management, and sales
|
| 117 |
+
services. As of 2024, it employs one person and has reported total assets of approximately
|
| 118 |
+
2.9 million DKK. The company is led by Director Brian Gammellund Rasmussen and
|
| 119 |
+
was founded on October 9, 2020.
|
| 120 |
+
sentences:
|
| 121 |
+
- Jørgen Lund Frederiksen is a Danish company specializing in high-quality carpentry
|
| 122 |
+
and joinery services. Established in 1976, the company offers a wide range of
|
| 123 |
+
services, including small repairs and large construction projects, serving private
|
| 124 |
+
clients, businesses, and public institutions. With a team of 35-40 skilled employees,
|
| 125 |
+
Jørgen Lund Frederiksen emphasizes loyalty, flexibility, and responsibility, ensuring
|
| 126 |
+
professional handling of projects from start to finish. The company is also ISPM-15
|
| 127 |
+
certified for manufacturing heat-treated wooden packaging, such as pallets and
|
| 128 |
+
transport boxes, adhering to international standards.
|
| 129 |
+
- KERT INVEST ApS, established on February 6, 2014, is a Danish private limited
|
| 130 |
+
company based in Helsingør. The company specializes in purchasing, renovating,
|
| 131 |
+
and selling real estate, as well as trading securities and related activities.
|
| 132 |
+
([find-virksomhed.dk](https://find-virksomhed.dk/firma/kert-invest-aps-35658173?utm_source=openai))
|
| 133 |
+
The company's registered address is Grønnehavevej 7, 1, 3000 Helsingør. ([lei.bloomberg.com](https://lei.bloomberg.com/gleifs/view/549300IRNKZTEYCVK378?utm_source=openai))
|
| 134 |
+
- GANNI is a Danish contemporary fashion brand founded in 2000 by Frans Truelsen
|
| 135 |
+
and revitalized in 2009 by husband-and-wife duo Ditte and Nicolaj Reffstrup. ([en.wikipedia.org](https://en.wikipedia.org/wiki/Ganni?utm_source=openai))
|
| 136 |
+
The brand offers a wide range of women's apparel, footwear, eyewear, bags, jewelry,
|
| 137 |
+
and accessories, embodying a playful and effortless aesthetic that redefines Scandinavian
|
| 138 |
+
style. ([fashionunited.com](https://fashionunited.com/companies/ganni?utm_source=openai))
|
| 139 |
+
GANNI is committed to responsible practices, striving to make environmentally
|
| 140 |
+
friendly choices and improve daily. ([kristak.com](https://kristak.com/pages/ganni?utm_source=openai))
|
| 141 |
+
pipeline_tag: sentence-similarity
|
| 142 |
+
library_name: sentence-transformers
|
| 143 |
+
metrics:
|
| 144 |
+
- cosine_accuracy
|
| 145 |
+
model-index:
|
| 146 |
+
- name: SentenceTransformer based on sentence-transformers/all-mpnet-base-v2
|
| 147 |
+
results:
|
| 148 |
+
- task:
|
| 149 |
+
type: triplet
|
| 150 |
+
name: Triplet
|
| 151 |
+
dataset:
|
| 152 |
+
name: Unknown
|
| 153 |
+
type: unknown
|
| 154 |
+
metrics:
|
| 155 |
+
- type: cosine_accuracy
|
| 156 |
+
value: 0.9343575239181519
|
| 157 |
+
name: Cosine Accuracy
|
| 158 |
+
---
|
| 159 |
+
|
| 160 |
+
# SentenceTransformer based on sentence-transformers/all-mpnet-base-v2
|
| 161 |
+
|
| 162 |
+
This is a [sentence-transformers](https://www.SBERT.net) model fine-tuned from [sentence-transformers/all-mpnet-base-v2](https://huggingface.co/sentence-transformers/all-mpnet-base-v2) on a CSV dataset. It maps sentences & paragraphs to a 768-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more.
|
| 163 |
+
|
| 164 |
+
## Model Details
|
| 165 |
+
|
| 166 |
+
### Model Description
|
| 167 |
+
- **Model Type:** Sentence Transformer
|
| 168 |
+
- **Base model:** [sentence-transformers/all-mpnet-base-v2](https://huggingface.co/sentence-transformers/all-mpnet-base-v2) <!-- at revision 12e86a3c702fc3c50205a8db88f0ec7c0b6b94a0 -->
|
| 169 |
+
- **Maximum Sequence Length:** 384 tokens
|
| 170 |
+
- **Output Dimensionality:** 768 dimensions
|
| 171 |
+
- **Similarity Function:** Cosine Similarity
|
| 172 |
+
- **Training Dataset:**
|
| 173 |
+
- csv
|
| 174 |
+
<!-- - **Language:** Unknown -->
|
| 175 |
+
<!-- - **License:** Unknown -->
|
| 176 |
+
|
| 177 |
+
### Model Sources
|
| 178 |
+
|
| 179 |
+
- **Documentation:** [Sentence Transformers Documentation](https://sbert.net)
|
| 180 |
+
- **Repository:** [Sentence Transformers on GitHub](https://github.com/UKPLab/sentence-transformers)
|
| 181 |
+
- **Hugging Face:** [Sentence Transformers on Hugging Face](https://huggingface.co/models?library=sentence-transformers)
|
| 182 |
+
|
| 183 |
+
### Full Model Architecture
|
| 184 |
+
|
| 185 |
+
```
|
| 186 |
+
SentenceTransformer(
|
| 187 |
+
(0): Transformer({'max_seq_length': 384, 'do_lower_case': False}) with Transformer model: MPNetModel
|
| 188 |
+
(1): Pooling({'word_embedding_dimension': 768, 'pooling_mode_cls_token': False, 'pooling_mode_mean_tokens': True, 'pooling_mode_max_tokens': False, 'pooling_mode_mean_sqrt_len_tokens': False, 'pooling_mode_weightedmean_tokens': False, 'pooling_mode_lasttoken': False, 'include_prompt': True})
|
| 189 |
+
(2): Normalize()
|
| 190 |
+
)
|
| 191 |
+
```
|
| 192 |
+
|
| 193 |
+
## Usage
|
| 194 |
+
|
| 195 |
+
### Direct Usage (Sentence Transformers)
|
| 196 |
+
|
| 197 |
+
First install the Sentence Transformers library:
|
| 198 |
+
|
| 199 |
+
```bash
|
| 200 |
+
pip install -U sentence-transformers
|
| 201 |
+
```
|
| 202 |
+
|
| 203 |
+
Then you can load this model and run inference.
|
| 204 |
+
```python
|
| 205 |
+
from sentence_transformers import SentenceTransformer
|
| 206 |
+
|
| 207 |
+
# Download from the 🤗 Hub (replace the placeholder ID below with this model's actual Hub repository ID)
|
| 208 |
+
model = SentenceTransformer("sentence_transformers_model_id")
|
| 209 |
+
# Run inference
|
| 210 |
+
sentences = [
|
| 211 |
+
'Gammellund Ejendomme is a Danish real estate company based in Odense, Denmark. The company specializes in property development, management, and sales services. As of 2024, it employs one person and has reported total assets of approximately 2.9 million DKK. The company is led by Director Brian Gammellund Rasmussen and was founded on October 9, 2020.',
|
| 212 |
+
"KERT INVEST ApS, established on February 6, 2014, is a Danish private limited company based in Helsingør. The company specializes in purchasing, renovating, and selling real estate, as well as trading securities and related activities. ([find-virksomhed.dk](https://find-virksomhed.dk/firma/kert-invest-aps-35658173?utm_source=openai)) The company's registered address is Grønnehavevej 7, 1, 3000 Helsingør. ([lei.bloomberg.com](https://lei.bloomberg.com/gleifs/view/549300IRNKZTEYCVK378?utm_source=openai))",
|
| 213 |
+
"GANNI is a Danish contemporary fashion brand founded in 2000 by Frans Truelsen and revitalized in 2009 by husband-and-wife duo Ditte and Nicolaj Reffstrup. ([en.wikipedia.org](https://en.wikipedia.org/wiki/Ganni?utm_source=openai)) The brand offers a wide range of women's apparel, footwear, eyewear, bags, jewelry, and accessories, embodying a playful and effortless aesthetic that redefines Scandinavian style. ([fashionunited.com](https://fashionunited.com/companies/ganni?utm_source=openai)) GANNI is committed to responsible practices, striving to make environmentally friendly choices and improve daily. ([kristak.com](https://kristak.com/pages/ganni?utm_source=openai))",
|
| 214 |
+
]
|
| 215 |
+
embeddings = model.encode(sentences)
|
| 216 |
+
print(embeddings.shape)
|
| 217 |
+
# [3, 768]
|
| 218 |
+
|
| 219 |
+
# Get the similarity scores for the embeddings
|
| 220 |
+
similarities = model.similarity(embeddings, embeddings)
|
| 221 |
+
print(similarities.shape)
|
| 222 |
+
# [3, 3]
|
| 223 |
+
```
|
| 224 |
+
|
| 225 |
+
<!--
|
| 226 |
+
### Direct Usage (Transformers)
|
| 227 |
+
|
| 228 |
+
<details><summary>Click to see the direct usage in Transformers</summary>
|
| 229 |
+
|
| 230 |
+
</details>
|
| 231 |
+
-->
|
| 232 |
+
|
| 233 |
+
<!--
|
| 234 |
+
### Downstream Usage (Sentence Transformers)
|
| 235 |
+
|
| 236 |
+
You can finetune this model on your own dataset.
|
| 237 |
+
|
| 238 |
+
<details><summary>Click to expand</summary>
|
| 239 |
+
|
| 240 |
+
</details>
|
| 241 |
+
-->
|
| 242 |
+
|
| 243 |
+
<!--
|
| 244 |
+
### Out-of-Scope Use
|
| 245 |
+
|
| 246 |
+
*List how the model may foreseeably be misused and address what users ought not to do with the model.*
|
| 247 |
+
-->
|
| 248 |
+
|
| 249 |
+
## Evaluation
|
| 250 |
+
|
| 251 |
+
### Metrics
|
| 252 |
+
|
| 253 |
+
#### Triplet
|
| 254 |
+
|
| 255 |
+
* Evaluated with [<code>TripletEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.TripletEvaluator)
|
| 256 |
+
|
| 257 |
+
| Metric | Value |
|
| 258 |
+
|:--------------------|:-----------|
|
| 259 |
+
| **cosine_accuracy** | **0.9344** |
|
| 260 |
+
|
| 261 |
+
<!--
|
| 262 |
+
## Bias, Risks and Limitations
|
| 263 |
+
|
| 264 |
+
*What are the known or foreseeable issues stemming from this model? You could also flag here known failure cases or weaknesses of the model.*
|
| 265 |
+
-->
|
| 266 |
+
|
| 267 |
+
<!--
|
| 268 |
+
### Recommendations
|
| 269 |
+
|
| 270 |
+
*What are recommendations with respect to the foreseeable issues? For example, filtering explicit content.*
|
| 271 |
+
-->
|
| 272 |
+
|
| 273 |
+
## Training Details
|
| 274 |
+
|
| 275 |
+
### Training Dataset
|
| 276 |
+
|
| 277 |
+
#### csv
|
| 278 |
+
|
| 279 |
+
* Dataset: csv
|
| 280 |
+
* Size: 27,191 training samples
|
| 281 |
+
* Columns: <code>anchor</code>, <code>positive</code>, and <code>negative</code>
|
| 282 |
+
* Approximate statistics based on the first 1000 samples:
|
| 283 |
+
| | anchor | positive | negative |
|
| 284 |
+
|:--------|:-----------------------------------------------------------------------------------|:-----------------------------------------------------------------------------------|:------------------------------------------------------------------------------------|
|
| 285 |
+
| type | string | string | string |
|
| 286 |
+
| details | <ul><li>min: 3 tokens</li><li>mean: 105.8 tokens</li><li>max: 335 tokens</li></ul> | <ul><li>min: 3 tokens</li><li>mean: 105.7 tokens</li><li>max: 361 tokens</li></ul> | <ul><li>min: 3 tokens</li><li>mean: 108.92 tokens</li><li>max: 383 tokens</li></ul> |
|
| 287 |
+
* Samples:
|
| 288 |
+
| anchor | positive | negative |
|
| 289 |
+
|:--------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|:-------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|:-------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|
|
| 290 |
+
| <code>ES Holding Aalborg II was a non-financial holding company based in Støvring, Denmark. Established on November 20, 2019, the company was dissolved after a demerger on December 20, 2019. Its primary purpose was to hold shares in subsidiaries and associated companies, engage in investment and financing activities, and conduct other related business as deemed appropriate by management. The company was registered with a capital of 200,000 DKK and was managed by director Ejner Sørensen. The registered address was Guldbækvej 116, 9530 Støvring, Denmark.</code> | <code>Malver Holding is a Danish non-financial holding company established on October 9, 2018. Based in Copenhagen, it focuses on investment and holding activities. The company is solely owned and directed by Nicklas Malver, who holds 100% ownership and voting rights. As of 2023, Malver Holding reported a net profit of DKK 437,389 and total assets amounting to DKK 3,889,000. The company's registered address is Hjørringgade 1, 3. tv., 2100 København Ø.</code> | <code>Research Infrastructure Consultancy Services is a Danish firm specializing in providing expert guidance and support for the development and management of research infrastructures. Their services encompass strategic planning, project management, and operational optimization to enhance the efficiency and effectiveness of research facilities. By collaborating closely with clients, they aim to tailor solutions that meet the unique needs of various research institutions.</code> |
|
| 291 |
+
| <code>SIGNCONCEPT is a Danish company specializing in the signage and advertising industry. Established in 2006, the company operates from its headquarters at Industrivej 60, 6740 Bramming, Denmark. SIGNCONCEPT offers a range of products and services related to signs and advertising materials, catering to various business needs. The company is registered under CVR number 30502590 and has a workforce of approximately 4 employees. For more information, visit their official website at http://www.signconcept.dk.</code> | <code>Fleet Complete Danmark specializes in fleet management solutions, offering GPS tracking, electronic logbooks, and task management systems to optimize vehicle fleets and mobile workforces. Their services aim to enhance performance, reduce fuel consumption, and integrate seamlessly with existing operational systems.</code> | <code>Lidemark Kirke is a historic church located in Bjæverskov, Denmark. Built in the 12th century in Romanesque style, the original structure comprises an apse, chancel, and nave. Around 1500, additions such as a porch, sacristy, and tower were incorporated. The church is primarily constructed from chalk and split fieldstone. Notable features include an altarpiece with two large columns and a painting titled "Christ in the Resurrection" by F. Storck from 1860. The tower houses a beautifully crafted organ built by K. Olsen in 1870, and the church has two bells dating from 1749 and 1842. A Renaissance gravestone commemorates Hartvig Høcken, a local nobleman who passed away in 1595. The church is part of a collaborative network with Bjæverskov, Gørslev, and Vollerslev churches, sharing clergy and a parish hall.</code> |
|
| 292 |
+
| <code>Indian Guro ApS was a Danish company established in 2017. The company was dissolved after bankruptcy in 2023. ([paqle.dk](https://www.paqle.dk/p/indian-guro-aps/842865?utm_source=openai))</code> | <code>BEG BESLAGSMEDIE ApS was a Danish company established in 2014, specializing in services related to livestock breeding. The company was dissolved after bankruptcy in August 2023. ([paqle.dk](https://www.paqle.dk/p/beg-beslagsmedie-aps/702103?utm_source=openai))</code> | <code>Gilleleje Lægecenter is a medical clinic located in Gilleleje, Denmark, offering same-day consultations for various health concerns. Patients can schedule appointments electronically via the clinic's website or the 'Minlæge' app, or by phone. The clinic provides both in-person and video consultations, emphasizing prompt and accessible healthcare services. ([xn--gillelejelgecenter-xub.dk](https://xn--gillelejelgecenter-xub.dk/?utm_source=openai))</code> |
|
| 293 |
+
* Loss: [<code>TripletLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#tripletloss) with these parameters:
|
| 294 |
+
```json
|
| 295 |
+
{
|
| 296 |
+
"distance_metric": "TripletDistanceMetric.COSINE",
|
| 297 |
+
"triplet_margin": 0.4
|
| 298 |
+
}
|
| 299 |
+
```
|
| 300 |
+
|
| 301 |
+
### Evaluation Dataset
|
| 302 |
+
|
| 303 |
+
#### csv
|
| 304 |
+
|
| 305 |
+
* Dataset: csv
|
| 306 |
+
* Size: 1,432 evaluation samples
|
| 307 |
+
* Columns: <code>anchor</code>, <code>positive</code>, and <code>negative</code>
|
| 308 |
+
* Approximate statistics based on the first 1000 samples:
|
| 309 |
+
| | anchor | positive | negative |
|
| 310 |
+
|:--------|:-----------------------------------------------------------------------------------|:-----------------------------------------------------------------------------------|:------------------------------------------------------------------------------------|
|
| 311 |
+
| type | string | string | string |
|
| 312 |
+
| details | <ul><li>min: 3 tokens</li><li>mean: 106.0 tokens</li><li>max: 325 tokens</li></ul> | <ul><li>min: 3 tokens</li><li>mean: 106.5 tokens</li><li>max: 384 tokens</li></ul> | <ul><li>min: 3 tokens</li><li>mean: 107.84 tokens</li><li>max: 384 tokens</li></ul> |
|
| 313 |
+
* Samples:
|
| 314 |
+
| anchor | positive | negative |
|
| 315 |
+
|:---|:---|:---|
|
| 316 |
+
| <code>Casela ApS is a Danish holding company established on June 17, 2004, located at Haugesundvej 1, 2850 Nærum. The company primarily functions as a non-financial holding entity, owning capital interests in other companies. As of 2023, Casela ApS reported a net profit of 389,125 DKK and an equity of 10,192,000 DKK. The company is led by Director Klaus Kastrup-Larsen, who has been in position since November 7, 2023. The sole owner is Lasse Bo Steenholt, holding 100% of the shares and voting rights since June 17, 2004.</code> | <code>EILKAER HOLDING is a Danish private limited company (Anpartsselskab) established on May 27, 2014. The company is located at Rejnstrupvej 15, 4250 Fuglebjerg, Denmark. Its primary purpose is to own shares and equity interests in other capital companies, manage assets, and engage in related activities as deemed appropriate by the management. The company is led by Director Thomas Bojesen Eilkær, who holds 100% ownership and voting rights. As of 2023, EILKAER HOLDING reported a gross profit of DKK -16,237 and a net income of DKK -4,768. The company is active and operates in the non-financial holding companies industry.</code> | <code>Vesterled Frugtplantage, located on Fejø Island in Denmark, specializes in cultivating high-quality apples, pears, and plums. Benefiting from Fejø's favorable climate, the plantation produces fruit known for its exceptional taste and quality. To ensure freshness, Vesterled Frugtplantage operates its own storage and packing facilities, delivering freshly picked fruit from early August. The plantation adheres to both organic farming practices and the principles of Dansk I.P., minimizing chemical use for the benefit of consumers and the environment.</code> |
|
| 317 |
+
| <code>S/I Margrethe Hjemmet is a private nursing home located in the heart of Roskilde, Denmark. The facility focuses on promoting active aging for both body and soul, providing a harmonious environment for its residents. With 44 apartments spread over two floors, each unit includes a private bathroom and wardrobe, and most feature a terrace or balcony. The home offers various amenities such as a cultural center, dining room, garden, workshop, hair salon, wellness room, and exercise equipment. Emphasizing the importance of family involvement, Margrethe Hjemmet views relatives as valuable resources and staff as catalysts for a meaningful, social, and active elderly life.</code> | <code>Medarbejderfond for ansatte i ISS Facility Services is a foundation established on December 31, 2005, located at Gyngemose Parkvej 50, 2860 Søborg, Denmark. The foundation operates within the industry of general building cleaning services. As of now, there is no official website registered for this organization.</code> | <code>Manbook.dk is a Danish company specializing in providing flexible staffing solutions across Denmark. They offer temporary workers for various tasks, including accounting, legal assignments, transportation, and security services. Their services are available 24/7, with the ability to dispatch personnel within two hours. Manbook.dk emphasizes creating a secure environment for both clients and employees, handling administrative tasks such as payroll, pensions, and holidays. Their office is located at Vallensbækvej 6, 2605 Brøndby, Denmark.</code> |
|
| 318 |
+
| <code>Børnehuset Goethesgade is a self-governing, age-integrated daycare institution located in Sønderborg, Denmark. ([boernehuset-goethesgade.aula.dk](https://boernehuset-goethesgade.aula.dk/velkommen?utm_source=openai)) Established in 1993, it offers a nurturing environment for children aged 0-6 years, comprising a nursery ('bobler') with 18 places and a kindergarten ('stjerner') with 38 places. ([boernehuset-goethesgade.aula.dk](https://boernehuset-goethesgade.aula.dk/velkommen?utm_source=openai)) The institution emphasizes small group activities to cater to individual child development and foster strong peer relationships. ([boernehuset-goethesgade.aula.dk](https://boernehuset-goethesgade.aula.dk/velkommen?utm_source=openai)) Situated centrally, it leverages its proximity to nature and the local community to enhance children's daily experiences. ([boernehuset-goethesgade.aula.dk](https://boernehuset-goethesgade.aula.dk/velkommen?utm_source=openai))</code> | <code>Horsens Gymnasium & HF is an educational institution located in Horsens, Denmark, offering both the general upper secondary education (STX) and the higher preparatory examination (HF). The school provides a range of study programs, including music, biology and chemistry, social sciences, mathematics, physics, chemistry, geoscience, language studies, and biotechnology. It emphasizes a broad educational foundation, preparing students for further education. The institution also boasts an impressive art collection featuring works by artists such as Kasper Bonnén, Michael Kvium, Cathrine Raben Davidsen, and Poul Anker Bech. ([horsens-gym.dk](https://horsens-gym.dk/?utm_source=openai))</code> | <code>Of Holding is a Danish company based in Aalborg SØ, Nordjylland, specializing in the management of companies and enterprises, particularly as a holding company. The key principal is Ole Frøkjær. Further details about the company's operations and services are not publicly available.</code> |
|
| 319 |
+
* Loss: [<code>TripletLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#tripletloss) with these parameters:
|
| 320 |
+
```json
|
| 321 |
+
{
|
| 322 |
+
"distance_metric": "TripletDistanceMetric.COSINE",
|
| 323 |
+
"triplet_margin": 0.4
|
| 324 |
+
}
|
| 325 |
+
```
|
| 326 |
+
|
| 327 |
+
### Training Hyperparameters
|
| 328 |
+
#### Non-Default Hyperparameters
|
| 329 |
+
|
| 330 |
+
- `eval_strategy`: steps
|
| 331 |
+
- `per_device_train_batch_size`: 6
|
| 332 |
+
- `per_device_eval_batch_size`: 6
|
| 333 |
+
- `gradient_accumulation_steps`: 3
|
| 334 |
+
- `num_train_epochs`: 2
|
| 335 |
+
- `warmup_ratio`: 0.1
|
| 336 |
+
- `fp16`: True
|
| 337 |
+
- `dataloader_pin_memory`: False
|
| 338 |
+
|
| 339 |
+
#### All Hyperparameters
|
| 340 |
+
<details><summary>Click to expand</summary>
|
| 341 |
+
|
| 342 |
+
- `overwrite_output_dir`: False
|
| 343 |
+
- `do_predict`: False
|
| 344 |
+
- `eval_strategy`: steps
|
| 345 |
+
- `prediction_loss_only`: True
|
| 346 |
+
- `per_device_train_batch_size`: 6
|
| 347 |
+
- `per_device_eval_batch_size`: 6
|
| 348 |
+
- `per_gpu_train_batch_size`: None
|
| 349 |
+
- `per_gpu_eval_batch_size`: None
|
| 350 |
+
- `gradient_accumulation_steps`: 3
|
| 351 |
+
- `eval_accumulation_steps`: None
|
| 352 |
+
- `torch_empty_cache_steps`: None
|
| 353 |
+
- `learning_rate`: 5e-05
|
| 354 |
+
- `weight_decay`: 0.0
|
| 355 |
+
- `adam_beta1`: 0.9
|
| 356 |
+
- `adam_beta2`: 0.999
|
| 357 |
+
- `adam_epsilon`: 1e-08
|
| 358 |
+
- `max_grad_norm`: 1.0
|
| 359 |
+
- `num_train_epochs`: 2
|
| 360 |
+
- `max_steps`: -1
|
| 361 |
+
- `lr_scheduler_type`: linear
|
| 362 |
+
- `lr_scheduler_kwargs`: {}
|
| 363 |
+
- `warmup_ratio`: 0.1
|
| 364 |
+
- `warmup_steps`: 0
|
| 365 |
+
- `log_level`: passive
|
| 366 |
+
- `log_level_replica`: warning
|
| 367 |
+
- `log_on_each_node`: True
|
| 368 |
+
- `logging_nan_inf_filter`: True
|
| 369 |
+
- `save_safetensors`: True
|
| 370 |
+
- `save_on_each_node`: False
|
| 371 |
+
- `save_only_model`: False
|
| 372 |
+
- `restore_callback_states_from_checkpoint`: False
|
| 373 |
+
- `no_cuda`: False
|
| 374 |
+
- `use_cpu`: False
|
| 375 |
+
- `use_mps_device`: False
|
| 376 |
+
- `seed`: 42
|
| 377 |
+
- `data_seed`: None
|
| 378 |
+
- `jit_mode_eval`: False
|
| 379 |
+
- `use_ipex`: False
|
| 380 |
+
- `bf16`: False
|
| 381 |
+
- `fp16`: True
|
| 382 |
+
- `fp16_opt_level`: O1
|
| 383 |
+
- `half_precision_backend`: auto
|
| 384 |
+
- `bf16_full_eval`: False
|
| 385 |
+
- `fp16_full_eval`: False
|
| 386 |
+
- `tf32`: None
|
| 387 |
+
- `local_rank`: 0
|
| 388 |
+
- `ddp_backend`: None
|
| 389 |
+
- `tpu_num_cores`: None
|
| 390 |
+
- `tpu_metrics_debug`: False
|
| 391 |
+
- `debug`: []
|
| 392 |
+
- `dataloader_drop_last`: False
|
| 393 |
+
- `dataloader_num_workers`: 0
|
| 394 |
+
- `dataloader_prefetch_factor`: None
|
| 395 |
+
- `past_index`: -1
|
| 396 |
+
- `disable_tqdm`: False
|
| 397 |
+
- `remove_unused_columns`: True
|
| 398 |
+
- `label_names`: None
|
| 399 |
+
- `load_best_model_at_end`: False
|
| 400 |
+
- `ignore_data_skip`: False
|
| 401 |
+
- `fsdp`: []
|
| 402 |
+
- `fsdp_min_num_params`: 0
|
| 403 |
+
- `fsdp_config`: {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}
|
| 404 |
+
- `fsdp_transformer_layer_cls_to_wrap`: None
|
| 405 |
+
- `accelerator_config`: {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}
|
| 406 |
+
- `deepspeed`: None
|
| 407 |
+
- `label_smoothing_factor`: 0.0
|
| 408 |
+
- `optim`: adamw_torch
|
| 409 |
+
- `optim_args`: None
|
| 410 |
+
- `adafactor`: False
|
| 411 |
+
- `group_by_length`: False
|
| 412 |
+
- `length_column_name`: length
|
| 413 |
+
- `ddp_find_unused_parameters`: None
|
| 414 |
+
- `ddp_bucket_cap_mb`: None
|
| 415 |
+
- `ddp_broadcast_buffers`: False
|
| 416 |
+
- `dataloader_pin_memory`: False
|
| 417 |
+
- `dataloader_persistent_workers`: False
|
| 418 |
+
- `skip_memory_metrics`: True
|
| 419 |
+
- `use_legacy_prediction_loop`: False
|
| 420 |
+
- `push_to_hub`: False
|
| 421 |
+
- `resume_from_checkpoint`: None
|
| 422 |
+
- `hub_model_id`: None
|
| 423 |
+
- `hub_strategy`: every_save
|
| 424 |
+
- `hub_private_repo`: None
|
| 425 |
+
- `hub_always_push`: False
|
| 426 |
+
- `gradient_checkpointing`: False
|
| 427 |
+
- `gradient_checkpointing_kwargs`: None
|
| 428 |
+
- `include_inputs_for_metrics`: False
|
| 429 |
+
- `include_for_metrics`: []
|
| 430 |
+
- `eval_do_concat_batches`: True
|
| 431 |
+
- `fp16_backend`: auto
|
| 432 |
+
- `push_to_hub_model_id`: None
|
| 433 |
+
- `push_to_hub_organization`: None
|
| 434 |
+
- `mp_parameters`:
|
| 435 |
+
- `auto_find_batch_size`: False
|
| 436 |
+
- `full_determinism`: False
|
| 437 |
+
- `torchdynamo`: None
|
| 438 |
+
- `ray_scope`: last
|
| 439 |
+
- `ddp_timeout`: 1800
|
| 440 |
+
- `torch_compile`: False
|
| 441 |
+
- `torch_compile_backend`: None
|
| 442 |
+
- `torch_compile_mode`: None
|
| 443 |
+
- `include_tokens_per_second`: False
|
| 444 |
+
- `include_num_input_tokens_seen`: False
|
| 445 |
+
- `neftune_noise_alpha`: None
|
| 446 |
+
- `optim_target_modules`: None
|
| 447 |
+
- `batch_eval_metrics`: False
|
| 448 |
+
- `eval_on_start`: False
|
| 449 |
+
- `use_liger_kernel`: False
|
| 450 |
+
- `eval_use_gather_object`: False
|
| 451 |
+
- `average_tokens_across_devices`: False
|
| 452 |
+
- `prompts`: None
|
| 453 |
+
- `batch_sampler`: batch_sampler
|
| 454 |
+
- `multi_dataset_batch_sampler`: proportional
|
| 455 |
+
|
| 456 |
+
</details>
|
| 457 |
+
|
| 458 |
+
### Training Logs
|
| 459 |
+
| Epoch | Step | Training Loss | Validation Loss | cosine_accuracy |
|
| 460 |
+
|:------:|:----:|:-------------:|:---------------:|:---------------:|
|
| 461 |
+
| -1 | -1 | - | - | 0.8275 |
|
| 462 |
+
| 0.0662 | 100 | 0.4326 | - | - |
|
| 463 |
+
| 0.1324 | 200 | 0.2973 | - | - |
|
| 464 |
+
| 0.1655 | 250 | - | 0.0902 | 0.9141 |
|
| 465 |
+
| 0.1986 | 300 | 0.2914 | - | - |
|
| 466 |
+
| 0.2648 | 400 | 0.305 | - | - |
|
| 467 |
+
| 0.3310 | 500 | 0.2878 | 0.0920 | 0.9092 |
|
| 468 |
+
| 0.3972 | 600 | 0.308 | - | - |
|
| 469 |
+
| 0.4634 | 700 | 0.2722 | - | - |
|
| 470 |
+
| 0.4965 | 750 | - | 0.0805 | 0.9218 |
|
| 471 |
+
| 0.5296 | 800 | 0.2591 | - | - |
|
| 472 |
+
| 0.5958 | 900 | 0.2564 | - | - |
|
| 473 |
+
| 0.6620 | 1000 | 0.245 | 0.0815 | 0.9197 |
|
| 474 |
+
| 0.7282 | 1100 | 0.2395 | - | - |
|
| 475 |
+
| 0.7944 | 1200 | 0.2559 | - | - |
|
| 476 |
+
| 0.8274 | 1250 | - | 0.0818 | 0.9232 |
|
| 477 |
+
| 0.8605 | 1300 | 0.2581 | - | - |
|
| 478 |
+
| 0.9267 | 1400 | 0.2692 | - | - |
|
| 479 |
+
| 0.9929 | 1500 | 0.2544 | 0.0738 | 0.9302 |
|
| 480 |
+
| 1.0589 | 1600 | 0.2001 | - | - |
|
| 481 |
+
| 1.1251 | 1700 | 0.2112 | - | - |
|
| 482 |
+
| 1.1582 | 1750 | - | 0.0729 | 0.9302 |
|
| 483 |
+
| 1.1913 | 1800 | 0.1926 | - | - |
|
| 484 |
+
| 1.2575 | 1900 | 0.1801 | - | - |
|
| 485 |
+
| 1.3237 | 2000 | 0.1684 | 0.0706 | 0.9267 |
|
| 486 |
+
| 1.3899 | 2100 | 0.1831 | - | - |
|
| 487 |
+
| 1.4561 | 2200 | 0.1963 | - | - |
|
| 488 |
+
| 1.4892 | 2250 | - | 0.0719 | 0.9281 |
|
| 489 |
+
| 1.5223 | 2300 | 0.1878 | - | - |
|
| 490 |
+
| 1.5885 | 2400 | 0.2028 | - | - |
|
| 491 |
+
| 1.6547 | 2500 | 0.2045 | 0.0685 | 0.9323 |
|
| 492 |
+
| 1.7209 | 2600 | 0.1853 | - | - |
|
| 493 |
+
| 1.7871 | 2700 | 0.1793 | - | - |
|
| 494 |
+
| 1.8202 | 2750 | - | 0.0665 | 0.9344 |
|
| 495 |
+
| 1.8533 | 2800 | 0.1772 | - | - |
|
| 496 |
+
| 1.9195 | 2900 | 0.1722 | - | - |
|
| 497 |
+
| 1.9857 | 3000 | 0.1797 | 0.0658 | 0.9344 |
|
| 498 |
+
|
| 499 |
+
|
| 500 |
+
### Framework Versions
|
| 501 |
+
- Python: 3.13.2
|
| 502 |
+
- Sentence Transformers: 4.1.0
|
| 503 |
+
- Transformers: 4.52.1
|
| 504 |
+
- PyTorch: 2.7.0+cu126
|
| 505 |
+
- Accelerate: 1.7.0
|
| 506 |
+
- Datasets: 3.6.0
|
| 507 |
+
- Tokenizers: 0.21.1
|
| 508 |
+
|
| 509 |
+
## Citation
|
| 510 |
+
|
| 511 |
+
### BibTeX
|
| 512 |
+
|
| 513 |
+
#### Sentence Transformers
|
| 514 |
+
```bibtex
|
| 515 |
+
@inproceedings{reimers-2019-sentence-bert,
|
| 516 |
+
title = "Sentence-BERT: Sentence Embeddings using Siamese BERT-Networks",
|
| 517 |
+
author = "Reimers, Nils and Gurevych, Iryna",
|
| 518 |
+
booktitle = "Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing",
|
| 519 |
+
month = "11",
|
| 520 |
+
year = "2019",
|
| 521 |
+
publisher = "Association for Computational Linguistics",
|
| 522 |
+
url = "https://arxiv.org/abs/1908.10084",
|
| 523 |
+
}
|
| 524 |
+
```
|
| 525 |
+
|
| 526 |
+
#### TripletLoss
|
| 527 |
+
```bibtex
|
| 528 |
+
@misc{hermans2017defense,
|
| 529 |
+
title={In Defense of the Triplet Loss for Person Re-Identification},
|
| 530 |
+
author={Alexander Hermans and Lucas Beyer and Bastian Leibe},
|
| 531 |
+
year={2017},
|
| 532 |
+
eprint={1703.07737},
|
| 533 |
+
archivePrefix={arXiv},
|
| 534 |
+
primaryClass={cs.CV}
|
| 535 |
+
}
|
| 536 |
+
```
|
| 537 |
+
|
| 538 |
+
<!--
|
| 539 |
+
## Glossary
|
| 540 |
+
|
| 541 |
+
*Clearly define terms in order to be accessible across audiences.*
|
| 542 |
+
-->
|
| 543 |
+
|
| 544 |
+
<!--
|
| 545 |
+
## Model Card Authors
|
| 546 |
+
|
| 547 |
+
*Lists the people who create the model card, providing recognition and accountability for the detailed work that goes into its construction.*
|
| 548 |
+
-->
|
| 549 |
+
|
| 550 |
+
<!--
|
| 551 |
+
## Model Card Contact
|
| 552 |
+
|
| 553 |
+
*Provides a way for people who have updates to the Model Card, suggestions, or questions, to contact the Model Card authors.*
|
| 554 |
+
-->
|
config.json
ADDED
|
@@ -0,0 +1,23 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"architectures": [
|
| 3 |
+
"MPNetModel"
|
| 4 |
+
],
|
| 5 |
+
"attention_probs_dropout_prob": 0.1,
|
| 6 |
+
"bos_token_id": 0,
|
| 7 |
+
"eos_token_id": 2,
|
| 8 |
+
"hidden_act": "gelu",
|
| 9 |
+
"hidden_dropout_prob": 0.1,
|
| 10 |
+
"hidden_size": 768,
|
| 11 |
+
"initializer_range": 0.02,
|
| 12 |
+
"intermediate_size": 3072,
|
| 13 |
+
"layer_norm_eps": 1e-05,
|
| 14 |
+
"max_position_embeddings": 514,
|
| 15 |
+
"model_type": "mpnet",
|
| 16 |
+
"num_attention_heads": 12,
|
| 17 |
+
"num_hidden_layers": 12,
|
| 18 |
+
"pad_token_id": 1,
|
| 19 |
+
"relative_attention_num_buckets": 32,
|
| 20 |
+
"torch_dtype": "float32",
|
| 21 |
+
"transformers_version": "4.52.1",
|
| 22 |
+
"vocab_size": 30527
|
| 23 |
+
}
|
config_sentence_transformers.json
ADDED
|
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"__version__": {
|
| 3 |
+
"sentence_transformers": "4.1.0",
|
| 4 |
+
"transformers": "4.52.1",
|
| 5 |
+
"pytorch": "2.7.0+cu126"
|
| 6 |
+
},
|
| 7 |
+
"prompts": {},
|
| 8 |
+
"default_prompt_name": null,
|
| 9 |
+
"similarity_fn_name": "cosine"
|
| 10 |
+
}
|
model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aed345e3c95b9716c8b9775bb6fd8254922bb4433d315a7100243f6f4e8c41d3
|
| 3 |
+
size 437967672
|
modules.json
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"idx": 0,
|
| 4 |
+
"name": "0",
|
| 5 |
+
"path": "",
|
| 6 |
+
"type": "sentence_transformers.models.Transformer"
|
| 7 |
+
},
|
| 8 |
+
{
|
| 9 |
+
"idx": 1,
|
| 10 |
+
"name": "1",
|
| 11 |
+
"path": "1_Pooling",
|
| 12 |
+
"type": "sentence_transformers.models.Pooling"
|
| 13 |
+
},
|
| 14 |
+
{
|
| 15 |
+
"idx": 2,
|
| 16 |
+
"name": "2",
|
| 17 |
+
"path": "2_Normalize",
|
| 18 |
+
"type": "sentence_transformers.models.Normalize"
|
| 19 |
+
}
|
| 20 |
+
]
|
sentence_bert_config.json
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"max_seq_length": 384,
|
| 3 |
+
"do_lower_case": false
|
| 4 |
+
}
|
special_tokens_map.json
ADDED
|
@@ -0,0 +1,51 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"bos_token": {
|
| 3 |
+
"content": "<s>",
|
| 4 |
+
"lstrip": false,
|
| 5 |
+
"normalized": false,
|
| 6 |
+
"rstrip": false,
|
| 7 |
+
"single_word": false
|
| 8 |
+
},
|
| 9 |
+
"cls_token": {
|
| 10 |
+
"content": "<s>",
|
| 11 |
+
"lstrip": false,
|
| 12 |
+
"normalized": false,
|
| 13 |
+
"rstrip": false,
|
| 14 |
+
"single_word": false
|
| 15 |
+
},
|
| 16 |
+
"eos_token": {
|
| 17 |
+
"content": "</s>",
|
| 18 |
+
"lstrip": false,
|
| 19 |
+
"normalized": false,
|
| 20 |
+
"rstrip": false,
|
| 21 |
+
"single_word": false
|
| 22 |
+
},
|
| 23 |
+
"mask_token": {
|
| 24 |
+
"content": "<mask>",
|
| 25 |
+
"lstrip": true,
|
| 26 |
+
"normalized": false,
|
| 27 |
+
"rstrip": false,
|
| 28 |
+
"single_word": false
|
| 29 |
+
},
|
| 30 |
+
"pad_token": {
|
| 31 |
+
"content": "<pad>",
|
| 32 |
+
"lstrip": false,
|
| 33 |
+
"normalized": false,
|
| 34 |
+
"rstrip": false,
|
| 35 |
+
"single_word": false
|
| 36 |
+
},
|
| 37 |
+
"sep_token": {
|
| 38 |
+
"content": "</s>",
|
| 39 |
+
"lstrip": false,
|
| 40 |
+
"normalized": false,
|
| 41 |
+
"rstrip": false,
|
| 42 |
+
"single_word": false
|
| 43 |
+
},
|
| 44 |
+
"unk_token": {
|
| 45 |
+
"content": "[UNK]",
|
| 46 |
+
"lstrip": false,
|
| 47 |
+
"normalized": false,
|
| 48 |
+
"rstrip": false,
|
| 49 |
+
"single_word": false
|
| 50 |
+
}
|
| 51 |
+
}
|
tokenizer.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
tokenizer_config.json
ADDED
|
@@ -0,0 +1,73 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"added_tokens_decoder": {
|
| 3 |
+
"0": {
|
| 4 |
+
"content": "<s>",
|
| 5 |
+
"lstrip": false,
|
| 6 |
+
"normalized": false,
|
| 7 |
+
"rstrip": false,
|
| 8 |
+
"single_word": false,
|
| 9 |
+
"special": true
|
| 10 |
+
},
|
| 11 |
+
"1": {
|
| 12 |
+
"content": "<pad>",
|
| 13 |
+
"lstrip": false,
|
| 14 |
+
"normalized": false,
|
| 15 |
+
"rstrip": false,
|
| 16 |
+
"single_word": false,
|
| 17 |
+
"special": true
|
| 18 |
+
},
|
| 19 |
+
"2": {
|
| 20 |
+
"content": "</s>",
|
| 21 |
+
"lstrip": false,
|
| 22 |
+
"normalized": false,
|
| 23 |
+
"rstrip": false,
|
| 24 |
+
"single_word": false,
|
| 25 |
+
"special": true
|
| 26 |
+
},
|
| 27 |
+
"3": {
|
| 28 |
+
"content": "<unk>",
|
| 29 |
+
"lstrip": false,
|
| 30 |
+
"normalized": true,
|
| 31 |
+
"rstrip": false,
|
| 32 |
+
"single_word": false,
|
| 33 |
+
"special": true
|
| 34 |
+
},
|
| 35 |
+
"104": {
|
| 36 |
+
"content": "[UNK]",
|
| 37 |
+
"lstrip": false,
|
| 38 |
+
"normalized": false,
|
| 39 |
+
"rstrip": false,
|
| 40 |
+
"single_word": false,
|
| 41 |
+
"special": true
|
| 42 |
+
},
|
| 43 |
+
"30526": {
|
| 44 |
+
"content": "<mask>",
|
| 45 |
+
"lstrip": true,
|
| 46 |
+
"normalized": false,
|
| 47 |
+
"rstrip": false,
|
| 48 |
+
"single_word": false,
|
| 49 |
+
"special": true
|
| 50 |
+
}
|
| 51 |
+
},
|
| 52 |
+
"bos_token": "<s>",
|
| 53 |
+
"clean_up_tokenization_spaces": false,
|
| 54 |
+
"cls_token": "<s>",
|
| 55 |
+
"do_lower_case": true,
|
| 56 |
+
"eos_token": "</s>",
|
| 57 |
+
"extra_special_tokens": {},
|
| 58 |
+
"mask_token": "<mask>",
|
| 59 |
+
"max_length": 128,
|
| 60 |
+
"model_max_length": 384,
|
| 61 |
+
"pad_to_multiple_of": null,
|
| 62 |
+
"pad_token": "<pad>",
|
| 63 |
+
"pad_token_type_id": 0,
|
| 64 |
+
"padding_side": "right",
|
| 65 |
+
"sep_token": "</s>",
|
| 66 |
+
"stride": 0,
|
| 67 |
+
"strip_accents": null,
|
| 68 |
+
"tokenize_chinese_chars": true,
|
| 69 |
+
"tokenizer_class": "MPNetTokenizer",
|
| 70 |
+
"truncation_side": "right",
|
| 71 |
+
"truncation_strategy": "longest_first",
|
| 72 |
+
"unk_token": "[UNK]"
|
| 73 |
+
}
|
vocab.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|