Kapturz0ny committed on
Commit
89f10af
·
verified ·
1 Parent(s): 895bc3e

Upload fine-tuned retriever model

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. 1_Pooling/config.json +10 -0
  2. README.md +512 -0
  3. checkpoints/checkpoint-1050/1_Pooling/config.json +10 -0
  4. checkpoints/checkpoint-1050/README.md +512 -0
  5. checkpoints/checkpoint-1050/config.json +31 -0
  6. checkpoints/checkpoint-1050/config_sentence_transformers.json +10 -0
  7. checkpoints/checkpoint-1050/model.safetensors +3 -0
  8. checkpoints/checkpoint-1050/modules.json +20 -0
  9. checkpoints/checkpoint-1050/optimizer.pt +3 -0
  10. checkpoints/checkpoint-1050/rng_state.pth +3 -0
  11. checkpoints/checkpoint-1050/scheduler.pt +3 -0
  12. checkpoints/checkpoint-1050/sentence_bert_config.json +4 -0
  13. checkpoints/checkpoint-1050/special_tokens_map.json +37 -0
  14. checkpoints/checkpoint-1050/tokenizer.json +0 -0
  15. checkpoints/checkpoint-1050/tokenizer_config.json +58 -0
  16. checkpoints/checkpoint-1050/trainer_state.json +48 -0
  17. checkpoints/checkpoint-1050/training_args.bin +3 -0
  18. checkpoints/checkpoint-1050/vocab.txt +0 -0
  19. checkpoints/checkpoint-1053/1_Pooling/config.json +10 -0
  20. checkpoints/checkpoint-1053/README.md +512 -0
  21. checkpoints/checkpoint-1053/config.json +31 -0
  22. checkpoints/checkpoint-1053/config_sentence_transformers.json +10 -0
  23. checkpoints/checkpoint-1053/model.safetensors +3 -0
  24. checkpoints/checkpoint-1053/modules.json +20 -0
  25. checkpoints/checkpoint-1053/optimizer.pt +3 -0
  26. checkpoints/checkpoint-1053/rng_state.pth +3 -0
  27. checkpoints/checkpoint-1053/scheduler.pt +3 -0
  28. checkpoints/checkpoint-1053/sentence_bert_config.json +4 -0
  29. checkpoints/checkpoint-1053/special_tokens_map.json +37 -0
  30. checkpoints/checkpoint-1053/tokenizer.json +0 -0
  31. checkpoints/checkpoint-1053/tokenizer_config.json +58 -0
  32. checkpoints/checkpoint-1053/trainer_state.json +48 -0
  33. checkpoints/checkpoint-1053/training_args.bin +3 -0
  34. checkpoints/checkpoint-1053/vocab.txt +0 -0
  35. checkpoints/checkpoint-875/1_Pooling/config.json +10 -0
  36. checkpoints/checkpoint-875/README.md +511 -0
  37. checkpoints/checkpoint-875/config.json +31 -0
  38. checkpoints/checkpoint-875/config_sentence_transformers.json +10 -0
  39. checkpoints/checkpoint-875/model.safetensors +3 -0
  40. checkpoints/checkpoint-875/modules.json +20 -0
  41. checkpoints/checkpoint-875/optimizer.pt +3 -0
  42. checkpoints/checkpoint-875/rng_state.pth +3 -0
  43. checkpoints/checkpoint-875/scheduler.pt +3 -0
  44. checkpoints/checkpoint-875/sentence_bert_config.json +4 -0
  45. checkpoints/checkpoint-875/special_tokens_map.json +37 -0
  46. checkpoints/checkpoint-875/tokenizer.json +0 -0
  47. checkpoints/checkpoint-875/tokenizer_config.json +58 -0
  48. checkpoints/checkpoint-875/trainer_state.json +41 -0
  49. checkpoints/checkpoint-875/training_args.bin +3 -0
  50. checkpoints/checkpoint-875/vocab.txt +0 -0
1_Pooling/config.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "word_embedding_dimension": 768,
3
+ "pooling_mode_cls_token": true,
4
+ "pooling_mode_mean_tokens": false,
5
+ "pooling_mode_max_tokens": false,
6
+ "pooling_mode_mean_sqrt_len_tokens": false,
7
+ "pooling_mode_weightedmean_tokens": false,
8
+ "pooling_mode_lasttoken": false,
9
+ "include_prompt": true
10
+ }
README.md ADDED
@@ -0,0 +1,512 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - sentence-transformers
4
+ - sentence-similarity
5
+ - feature-extraction
6
+ - generated_from_trainer
7
+ - dataset_size:5604
8
+ - loss:CosineSimilarityLoss
9
+ base_model: BAAI/bge-base-en-v1.5
10
+ widget:
11
+ - source_sentence: what are the powers of the virginia executive branch
12
+ sentences:
13
+ - The 49ers won five Super Bowl championships between 1981 and 1994. Four of those
14
+ came in the 1980s, and were led by Hall of Famers Joe Montana, Jerry Rice, Ronnie
15
+ Lott, Steve Young, Charles Haley, Fred Dean, and coaches Bill Walsh and George
16
+ Seifert. They have been division champions 22 times between 1970 and 2023, making
17
+ them one of the most successful teams in NFL history. The 49ers sit alone in NFL
18
+ history for most playoff wins (38), having been in the league playoffs 30 times
19
+ (29 times in the NFL and one time in the AAFC), and have also played in the most
20
+ NFC Championship games (19), hosting 11 of them, also an NFC record. The team
21
+ has set numerous notable NFL records, including most consecutive away games won
22
+ (18), most consecutive seasons leading the league in scoring (4), most consecutive
23
+ games scored (420 games from 1977 to 2004), most field goals in a season (44),
24
+ most games won in a season (18), and most touchdowns (8) and points scored (55)
25
+ in a Super Bowl. According to Forbes, the 49ers are the sixth most valuable team
26
+ in the NFL, valued at $6.8 billion as of August 2024. In June 2023, the enterprise
27
+ branch of the 49ers completed the acquisition of English soccer club Leeds United
28
+ and in May 2025, it acquired 51% of Scottish soccer club Rangers F.C.
29
+ - In 2008, Triarc purchased Wendy's, and changed its name to Wendy's/Arby's Group,
30
+ to reflect their core businesses. In January 2011, it was announced that Wendy's/Arby's
31
+ Group were looking into selling the Arby's side of the business to focus on the
32
+ Wendy's brand. It was officially announced the companies would split on January
33
+ 21, 2011. In 2009, the Wendy's/Arby's Group signed a franchise deal with the Al
34
+ Jammaz Group of Saudi Arabia to open dual-branded Wendy's/Arby's through the Middle
35
+ East with the first location opening in Dubai in the United Arab Emirates in May
36
+ 2010. The Wendy's/Arby's Group also signed a similar franchise deal in June 2010
37
+ with Tab Gida Sanayi ve Ticaret to open dual-branded restaurants in Turkey. After
38
+ the split, the former Wendy's/Arby's Group became The Wendy's Company.
39
+ - 'Executive: The Chief Executive is responsible for enforcing regional law, can
40
+ force reconsideration of legislation, and appoints Executive Council members and
41
+ principal officials. Acting with the Executive Council, the Chief Executive-in-Council
42
+ can propose new bills, issue subordinate legislation, and has authority to dissolve
43
+ the legislature. In states of emergency or public danger, the Chief Executive-in-Council
44
+ is further empowered to enact any regulation necessary to restore public order.
45
+ Legislature: The unicameral Legislative Council enacts regional law, approves
46
+ budgets, and has the power to impeach a sitting chief executive. Judiciary: The
47
+ Hong Kong Court of Final Appeal and lower courts interpret laws and overturn those
48
+ inconsistent with the Basic Law. Judges are appointed by the chief executive on
49
+ the advice of a recommendation commission. The chief executive is the head of
50
+ government and serves for a maximum of two five-year terms. The State Council
51
+ (led by the Premier of China) appoints the chief executive after nomination by
52
+ the Election Committee, which is composed of 1500 business, community, and government
53
+ leaders.'
54
+ - source_sentence: how many chromosomes does a human diploid cell have
55
+ sentences:
56
+ - The Peace of Cateau-Cambrésis in 1559 concluded the war with France, leaving Spain
57
+ at a considerable advantage. However, the government was still mired in debt,
58
+ and declared bankruptcy that year. Most of the government's revenues came from
59
+ taxes and excise duties, not imported silver and other goods. The Ottoman Empire
60
+ had long menaced the fringes of the Habsburg dominions in Austria and northwest
61
+ Africa. In response Ferdinand and Isabella had sent expeditions to North Africa,
62
+ capturing Melilla in 1497 and Oran in 1509. Charles had preferred to combat the
63
+ Ottomans through a considerably more maritime strategy, hampering Ottoman landings
64
+ on the Venetian territories in the Eastern Mediterranean. Only in response to
65
+ raids on the eastern coast of Spain did Charles personally lead attacks against
66
+ holdings in North Africa (1535). In 1560, the Ottomans battled the Spanish Navy
67
+ off the coast of Tunisia, but in 1565 Ottoman troops landing on the strategically
68
+ vital island of Malta, defended by the Knights of St. John, were defeated. The
69
+ death of Suleiman the Magnificent the following year and his succession by Selim
70
+ II emboldened Philip, who resolved to carry the war to the Ottoman homelands.
71
+ In 1571, a mixed naval expedition of Spanish, Venetian, and Papal ships led by
72
+ Charles' illegitimate son Don John of Austria annihilated the Ottoman fleet at
73
+ the Battle of Lepanto, in the largest naval battle fought in European waters since
74
+ Actium in 31 BC. The fleet included Miguel de Cervantes, future author of the
75
+ historic Spanish novel Don Quixote
76
+ - 'The 1930s were the team''s first golden era, when they improved their game through
77
+ play with more experienced teams. The Combinado del Pacífico (a squad composed
78
+ of Chilean and Peruvian footballers) toured Europe from 1933 to 1934. Starting
79
+ with Ciclista Lima in 1926, Peru''s football clubs toured Latin America with much
80
+ success. During one of these tours—Alianza Lima''s undefeated journey through
81
+ Chile in 1935—emerged the Rodillo Negro ("Black Roller"), a skillful group led
82
+ by forwards Alejandro Villanueva, Teodoro Fernández and goalkeeper Juan Valdivieso.
83
+ Sports historian Richard Witzig described these three as "a soccer triumvirate
84
+ unsurpassed in the world at that time", citing their combined innovation and effectiveness
85
+ at both ends of the field. Peru and the Rodillo Negro impressed at the 1936 Summer
86
+ Olympics, won the inaugural Bolivarian Games in 1938, and finished the decade
87
+ as South American champions. Historian David Goldblatt assessed the decline of
88
+ its previous success: "despite all the apparent preconditions for footballing
89
+ growth and success, Peruvian football disappeared". He attributes this sudden
90
+ decline to Peruvian authorities'' repression of "social, sporting and political
91
+ organisations among the urban and rural poor" during the 1940s and 1950s. Nevertheless,
92
+ Peru performed creditably at the South American Championships, placing third in
93
+ Brazil 1949 and Chile 1955, and missed qualification for the Sweden 1958 World
94
+ Cup finals, over two legs to eventual champions Brazil.'
95
+ - In 1939, at the start of World War II, Poland was partitioned between Nazi Germany
96
+ and the Soviet Union (see Molotov–Ribbentrop Pact). One-fifth of the Polish population
97
+ perished during World War II; the 3,000,000 Polish Jews murdered in the Holocaust,
98
+ who constituted 90% of Polish Jewry, made up half of all Poles killed during the
99
+ war. While the Holocaust occurred largely in German-occupied Poland, it was orchestrated
100
+ and perpetrated by the Nazis. Polish attitudes to the Holocaust varied widely,
101
+ from actively risking death in order to save Jewish lives, and passive refusal
102
+ to inform on them, to indifference, blackmail, and in extreme cases, committing
103
+ premeditated murders such as in the Jedwabne pogrom. Collaboration by non-Jewish
104
+ Polish citizens in the Holocaust was sporadic, but incidents of hostility against
105
+ Jews are well documented and have been a subject of renewed scholarly interest
106
+ during the 21st century.
107
+ - source_sentence: what is the difference between ice brent crude and wti crude
108
+ sentences:
109
+ - ==== Spring and Autumn period (722–476 BC) ====
110
+ - SpaceX has also bought and is modifying several residential properties in Boca
111
+ Chica Village, but apparently planning to leave them in residential use, about
112
+ 2 miles (3.2 km) west of the launch site. In September 2019, SpaceX extended an
113
+ offer to buy each of the houses in Boca Chica Village for three times the fair
114
+ market value along with an offer of VIP invitations to future launch events. The
115
+ 3x offer was said to be "non-negotiable." Homeowners were given two weeks for
116
+ this particular offer to remain valid. In January 2024, the Texas Parks and Wildlife
117
+ Department announced a proposal to transfer 43 acres of Boca Chica State Park
118
+ lands to SpaceX, in exchange for 477 new acres to be added to the Laguna Atascosa
119
+ National Wildlife Refuge.
120
+ - However, exclusive US control of this resource was eventually challenged, and
121
+ the Bering Sea Controversy resulted when the United States seized over 150 sealing
122
+ ships flying the British flag, based out of the coast of British Columbia. The
123
+ conflict between the United States and Britain was resolved by an arbitration
124
+ tribunal in 1893. The waters of the Bering Sea were deemed to be international
125
+ waters, contrary to the US contention that they were an internal sea. The US was
126
+ required to make a payment to Britain, and both nations were required to follow
127
+ regulations developed to preserve the resource.
128
+ - source_sentence: why is there a citgo sign in boston
129
+ sentences:
130
+ - Tucker appeared on Terri Clark's 2012 album Classic in a remake duet of her first
131
+ single "Delta Dawn". In June 2017, Tucker was featured in Rolling Stone as one
132
+ of the 100 Greatest Country Artists of All Time. After the death of former flame
133
+ Glen Campbell on August 8, 2017, Tucker released her first single since 2009,
134
+ "Forever Loving You", a song co-penned by Tennessee State Senator Rusty Crowe.
135
+ The song's release the following day, on the eve of Campbell's funeral, drew ire
136
+ and criticism being exploitative. Tucker claimed that a portion of the proceeds
137
+ will benefit the Alzheimer's Foundation of America, but the foundation stated
138
+ it was not involved in the promotion and has not received any funds. Tucker released
139
+ While I'm Livin', her first collection of original material since 2002's Tanya,
140
+ in 2019 via Fantasy Records. It was produced by Shooter Jennings and Brandi Carlile,
141
+ with Carlile brought onto the project after initially being approached for songs
142
+ by Jennings but after having professed such an admiration of Tucker and her work,
143
+ Jennings felt it necessary for her to co-produce the record alongside him. Tucker
144
+ performed "Bring My Flowers Now" at Loretta Lynn's all-star 87th birthday concert
145
+ at Nashville's Bridgestone Arena with Carlile playing piano. The album's first
146
+ single, "Hard Luck", was released on June 28, along with its accompanying music
147
+ video.
148
+ - ==== Golf ==== Numerous golf courses can be found in the city, with the most famous
149
+ being Bay Hill Club and Lodge, home to the Arnold Palmer Invitational. == Culture
150
+ ==
151
+ - The massive Islamic invasions of the mid-7th century began a long struggle between
152
+ Christianity and Islam throughout the Mediterranean Basin. The Byzantine Empire
153
+ soon lost the lands of the eastern patriarchates of Jerusalem, Alexandria and
154
+ Antioch and was reduced to that of Constantinople, the empire's capital. As a
155
+ result of Islamic domination of the Mediterranean, the Frankish state, centred
156
+ away from that sea, was able to evolve as the dominant power that shaped the Western
157
+ Europe of the Middle Ages. The battles of Toulouse and Tours halted the Islamic
158
+ advance in the West and the failed siege of Constantinople halted it in the East.
159
+ Two or three decades later, in 751, the Byzantine Empire lost to the Lombards
160
+ the city of Ravenna from which it governed the small fragments of Italy, including
161
+ Rome, that acknowledged its sovereignty. The fall of Ravenna meant that confirmation
162
+ by a no longer existent exarch was not asked for during the election in 752 of
163
+ Pope Stephen II, and that the papacy was forced to look elsewhere for a civil
164
+ power to protect it. In 754, at the urgent request of Pope Stephen, the Frankish
165
+ king Pepin the Short conquered the Lombards. He then gifted the lands of the former
166
+ exarchate to the pope, initiating the Papal States. In the 860s, Rome and the
167
+ Byzantine East were in conflict during the Photian schism, when Photius criticized
168
+ the Latin west for adding of the filioque clause, after being excommunicated by
169
+ Nicholas I. Though the schism was reconciled, unresolved issues would lead to
170
+ further division.
171
+ - source_sentence: who organized the native resistance to the british
172
+ sentences:
173
+ - === Engines === == Fifth generation (WL; 2021) ==
174
+ - '=== Unitarism === All states are unitary states, not federations or aggregates
175
+ of local governments. Local governments within them are created by and exist by
176
+ virtue of state law, and local governments within each state are subject to the
177
+ central authority of that particular state. State governments commonly delegate
178
+ some authority to local units and channel policy decisions down to them for implementation.
179
+ In a few states, local units of government are permitted a degree of home rule
180
+ over various matters. The prevailing legal theory of state preeminence over local
181
+ governments, referred to as Dillon''s Rule, holds that, A municipal corporation
182
+ possesses and can exercise the following powers and no others: First, those granted
183
+ in express words; second, those necessarily implied or necessarily incident to
184
+ the powers expressly granted; third, those absolutely essential to the declared
185
+ objects and purposes of the corporation—not simply convenient but indispensable;
186
+ fourth, any fair doubt as to the existence of power is resolved by the courts
187
+ against the corporation—against the existence of the powers. Each state defines
188
+ for itself what powers it will allow local governments. Generally, four categories
189
+ of power may be given to local jurisdictions: Structural – power to choose the
190
+ form of government, charter and enact charter revisions, Functional – power to
191
+ exercise local self-government in a broad or limited manner, Fiscal – authority
192
+ to determine revenue sources, set tax rates, borrow funds and other related financial
193
+ activities, Personnel – authority to set employment rules, remuneration rates,
194
+ employment conditions and collective bargaining. == Relationships =='
195
+ - Throughout the war, the British deported the Acadians to the Thirteen Colonies
196
+ and Europe, which the Acadian militias resisted with assistance from Mi'kmaq and
197
+ Malisteet forces. The Great Upheaval continued from 1755 to 1764. In 1756, a large
198
+ force of French, Canadians, and their Native American allies led by the Marquis
199
+ de Montcalm launched an attack against the key British post at Fort Oswego on
200
+ Lake Ontario from Fort Frontenac and forced the garrison to surrender. The following
201
+ year Montcalm with a huge force of 7,200 French and Canadian troops and 2,400
202
+ Native Americans laid siege to Fort William Henry on the southern shores of Lake
203
+ George, and after three weeks of fighting the British commander Monroe surrendered.
204
+ Montcalm gave him honorable terms to return to England and not to fight for 18
205
+ months. And yet, when the British force with civilians was three miles from the
206
+ fort, the Native American allies massacred about 1,100 of the 1,500 strong force.
207
+ pipeline_tag: sentence-similarity
208
+ library_name: sentence-transformers
209
+ ---
210
+
211
+ # SentenceTransformer based on BAAI/bge-base-en-v1.5
212
+
213
+ This is a [sentence-transformers](https://www.SBERT.net) model finetuned from [BAAI/bge-base-en-v1.5](https://huggingface.co/BAAI/bge-base-en-v1.5). It maps sentences & paragraphs to a 768-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more.
214
+
215
+ ## Model Details
216
+
217
+ ### Model Description
218
+ - **Model Type:** Sentence Transformer
219
+ - **Base model:** [BAAI/bge-base-en-v1.5](https://huggingface.co/BAAI/bge-base-en-v1.5) <!-- at revision a5beb1e3e68b9ab74eb54cfd186867f64f240e1a -->
220
+ - **Maximum Sequence Length:** 512 tokens
221
+ - **Output Dimensionality:** 768 dimensions
222
+ - **Similarity Function:** Cosine Similarity
223
+ <!-- - **Training Dataset:** Unknown -->
224
+ <!-- - **Language:** Unknown -->
225
+ <!-- - **License:** Unknown -->
226
+
227
+ ### Model Sources
228
+
229
+ - **Documentation:** [Sentence Transformers Documentation](https://sbert.net)
230
+ - **Repository:** [Sentence Transformers on GitHub](https://github.com/UKPLab/sentence-transformers)
231
+ - **Hugging Face:** [Sentence Transformers on Hugging Face](https://huggingface.co/models?library=sentence-transformers)
232
+
233
+ ### Full Model Architecture
234
+
235
+ ```
236
+ SentenceTransformer(
237
+ (0): Transformer({'max_seq_length': 512, 'do_lower_case': True}) with Transformer model: BertModel
238
+ (1): Pooling({'word_embedding_dimension': 768, 'pooling_mode_cls_token': True, 'pooling_mode_mean_tokens': False, 'pooling_mode_max_tokens': False, 'pooling_mode_mean_sqrt_len_tokens': False, 'pooling_mode_weightedmean_tokens': False, 'pooling_mode_lasttoken': False, 'include_prompt': True})
239
+ (2): Normalize()
240
+ )
241
+ ```
242
+
243
+ ## Usage
244
+
245
+ ### Direct Usage (Sentence Transformers)
246
+
247
+ First install the Sentence Transformers library:
248
+
249
+ ```bash
250
+ pip install -U sentence-transformers
251
+ ```
252
+
253
+ Then you can load this model and run inference.
254
+ ```python
255
+ from sentence_transformers import SentenceTransformer
256
+
257
+ # Download from the 🤗 Hub
258
+ model = SentenceTransformer("sentence_transformers_model_id")
259
+ # Run inference
260
+ sentences = [
261
+ 'who organized the native resistance to the british',
262
+ "Throughout the war, the British deported the Acadians to the Thirteen Colonies and Europe, which the Acadian militias resisted with assistance from Mi'kmaq and Malisteet forces. The Great Upheaval continued from 1755 to 1764. In 1756, a large force of French, Canadians, and their Native American allies led by the Marquis de Montcalm launched an attack against the key British post at Fort Oswego on Lake Ontario from Fort Frontenac and forced the garrison to surrender. The following year Montcalm with a huge force of 7,200 French and Canadian troops and 2,400 Native Americans laid siege to Fort William Henry on the southern shores of Lake George, and after three weeks of fighting the British commander Monroe surrendered. Montcalm gave him honorable terms to return to England and not to fight for 18 months. And yet, when the British force with civilians was three miles from the fort, the Native American allies massacred about 1,100 of the 1,500 strong force.",
263
+ "=== Unitarism === All states are unitary states, not federations or aggregates of local governments. Local governments within them are created by and exist by virtue of state law, and local governments within each state are subject to the central authority of that particular state. State governments commonly delegate some authority to local units and channel policy decisions down to them for implementation. In a few states, local units of government are permitted a degree of home rule over various matters. The prevailing legal theory of state preeminence over local governments, referred to as Dillon's Rule, holds that, A municipal corporation possesses and can exercise the following powers and no others: First, those granted in express words; second, those necessarily implied or necessarily incident to the powers expressly granted; third, those absolutely essential to the declared objects and purposes of the corporation—not simply convenient but indispensable; fourth, any fair doubt as to the existence of power is resolved by the courts against the corporation—against the existence of the powers. Each state defines for itself what powers it will allow local governments. Generally, four categories of power may be given to local jurisdictions: Structural – power to choose the form of government, charter and enact charter revisions, Functional – power to exercise local self-government in a broad or limited manner, Fiscal – authority to determine revenue sources, set tax rates, borrow funds and other related financial activities, Personnel – authority to set employment rules, remuneration rates, employment conditions and collective bargaining. == Relationships ==",
264
+ ]
265
+ embeddings = model.encode(sentences)
266
+ print(embeddings.shape)
267
+ # [3, 768]
268
+
269
+ # Get the similarity scores for the embeddings
270
+ similarities = model.similarity(embeddings, embeddings)
271
+ print(similarities.shape)
272
+ # [3, 3]
273
+ ```
274
+
275
+ <!--
276
+ ### Direct Usage (Transformers)
277
+
278
+ <details><summary>Click to see the direct usage in Transformers</summary>
279
+
280
+ </details>
281
+ -->
282
+
283
+ <!--
284
+ ### Downstream Usage (Sentence Transformers)
285
+
286
+ You can finetune this model on your own dataset.
287
+
288
+ <details><summary>Click to expand</summary>
289
+
290
+ </details>
291
+ -->
292
+
293
+ <!--
294
+ ### Out-of-Scope Use
295
+
296
+ *List how the model may foreseeably be misused and address what users ought not to do with the model.*
297
+ -->
298
+
299
+ <!--
300
+ ## Bias, Risks and Limitations
301
+
302
+ *What are the known or foreseeable issues stemming from this model? You could also flag here known failure cases or weaknesses of the model.*
303
+ -->
304
+
305
+ <!--
306
+ ### Recommendations
307
+
308
+ *What are recommendations with respect to the foreseeable issues? For example, filtering explicit content.*
309
+ -->
310
+
311
+ ## Training Details
312
+
313
+ ### Training Dataset
314
+
315
+ #### Unnamed Dataset
316
+
317
+ * Size: 5,604 training samples
318
+ * Columns: <code>sentence_0</code>, <code>sentence_1</code>, and <code>label</code>
319
+ * Approximate statistics based on the first 1000 samples:
320
+ | | sentence_0 | sentence_1 | label |
321
+ |:--------|:-----------------------------------------------------------------------------------|:------------------------------------------------------------------------------------|:---------------------------------------------------------------|
322
+ | type | string | string | float |
323
+ | details | <ul><li>min: 10 tokens</li><li>mean: 11.84 tokens</li><li>max: 25 tokens</li></ul> | <ul><li>min: 8 tokens</li><li>mean: 218.19 tokens</li><li>max: 322 tokens</li></ul> | <ul><li>min: 0.0</li><li>mean: 0.37</li><li>max: 1.0</li></ul> |
324
+ * Samples:
325
+ | sentence_0 | sentence_1 | label |
326
+ |:-----------------------------------------------------------------------------------------------------------|:---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|:-----------------|
327
+ | <code>who played guitar solo on reeling in the years</code> | <code>Eric Patrick Clapton (born 30 March 1945) is an English rock and blues guitarist, singer, and songwriter. He is regarded as one of the most successful and influential guitarists in rock music. Clapton ranked second in Rolling Stone's list of the "100 Greatest Guitarists of All Time" and fourth in Gibson's "Top 50 Guitarists of All Time". He was named number five in Time magazine's list of "The 10 Best Electric Guitar Players" in 2009. After playing in a number of different local bands, Clapton joined the Yardbirds from 1963 to 1965, and John Mayall & the Bluesbreakers from 1965 to 1966. After leaving Mayall, he formed the power trio Cream with drummer Ginger Baker and bassist/vocalist Jack Bruce, in which Clapton played sustained blues improvisations and "arty, blues-based psychedelic pop". After four successful albums, Cream broke up in November 1968. Clapton then formed the blues rock band Blind Faith with Baker, Steve Winwood, and Ric Grech, recording one album and performing on one...</code> | <code>1.0</code> |
328
+ | <code>how a population of wolves may have undergone speciation to form the first population of dogs</code> | <code>Geological evidence suggests that approximately 3 million years ago, South America became connected to North America when the Bolivar Trough marine barrier disappeared and the Panamanian land bridge formed. The joining of these two land masses led to the Great American Interchange, in which biota from both continents expanded their ranges. The first species known to have made the northward migration was Pliometanastes, a fossil ground sloth roughly the size of a modern black bear. Migrations to the Southern Hemisphere were undertaken by several North American mammalian carnivores. Fewer species migrated in the opposite direction from south to north. The result of the expansion of a North American fauna was a mass extinction in which hundreds of species disappeared in a relatively short time. About 60% of present-day South American mammals have evolved from North American species. Some South American species were able to adapt and spread into North America. Apart from Pliometanastes, du...</code> | <code>1.0</code> |
329
+ | <code>who is credited with promoting the use of factor analysis and why</code> | <code>The enemies of President Davis proposed that the Confederacy "died of Davis". He was unfavorably compared to George Washington by critics such as Edward Alfred Pollard, editor of the most influential newspaper in the Confederacy, the Daily Richmond Examiner. Beyond the early honeymoon period, Davis was never popular. Ellis Merton Coulter, viewed by historians as a Confederate apologist, argues that Davis was unable to mobilize Confederate nationalism in support of his government effectively, and especially failed to appeal to the small farmers who made up the bulk of the population. Davis failed to build a network of supporters who would speak up when he came under criticism, and he repeatedly alienated governors and other state-based leaders by demanding centralized control of the war effort.</code> | <code>0.0</code> |
330
+ * Loss: [<code>CosineSimilarityLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#cosinesimilarityloss) with these parameters:
331
+ ```json
332
+ {
333
+ "loss_fct": "torch.nn.modules.loss.MSELoss"
334
+ }
335
+ ```
336
+
337
+ ### Training Hyperparameters
338
+ #### Non-Default Hyperparameters
339
+
340
+ - `per_device_train_batch_size`: 16
341
+ - `per_device_eval_batch_size`: 16
342
+ - `multi_dataset_batch_sampler`: round_robin
343
+
344
+ #### All Hyperparameters
345
+ <details><summary>Click to expand</summary>
346
+
347
+ - `overwrite_output_dir`: False
348
+ - `do_predict`: False
349
+ - `eval_strategy`: no
350
+ - `prediction_loss_only`: True
351
+ - `per_device_train_batch_size`: 16
352
+ - `per_device_eval_batch_size`: 16
353
+ - `per_gpu_train_batch_size`: None
354
+ - `per_gpu_eval_batch_size`: None
355
+ - `gradient_accumulation_steps`: 1
356
+ - `eval_accumulation_steps`: None
357
+ - `torch_empty_cache_steps`: None
358
+ - `learning_rate`: 5e-05
359
+ - `weight_decay`: 0.0
360
+ - `adam_beta1`: 0.9
361
+ - `adam_beta2`: 0.999
362
+ - `adam_epsilon`: 1e-08
363
+ - `max_grad_norm`: 1
364
+ - `num_train_epochs`: 3
365
+ - `max_steps`: -1
366
+ - `lr_scheduler_type`: linear
367
+ - `lr_scheduler_kwargs`: {}
368
+ - `warmup_ratio`: 0.0
369
+ - `warmup_steps`: 0
370
+ - `log_level`: passive
371
+ - `log_level_replica`: warning
372
+ - `log_on_each_node`: True
373
+ - `logging_nan_inf_filter`: True
374
+ - `save_safetensors`: True
375
+ - `save_on_each_node`: False
376
+ - `save_only_model`: False
377
+ - `restore_callback_states_from_checkpoint`: False
378
+ - `no_cuda`: False
379
+ - `use_cpu`: False
380
+ - `use_mps_device`: False
381
+ - `seed`: 42
382
+ - `data_seed`: None
383
+ - `jit_mode_eval`: False
384
+ - `use_ipex`: False
385
+ - `bf16`: False
386
+ - `fp16`: False
387
+ - `fp16_opt_level`: O1
388
+ - `half_precision_backend`: auto
389
+ - `bf16_full_eval`: False
390
+ - `fp16_full_eval`: False
391
+ - `tf32`: None
392
+ - `local_rank`: 0
393
+ - `ddp_backend`: None
394
+ - `tpu_num_cores`: None
395
+ - `tpu_metrics_debug`: False
396
+ - `debug`: []
397
+ - `dataloader_drop_last`: False
398
+ - `dataloader_num_workers`: 0
399
+ - `dataloader_prefetch_factor`: None
400
+ - `past_index`: -1
401
+ - `disable_tqdm`: False
402
+ - `remove_unused_columns`: True
403
+ - `label_names`: None
404
+ - `load_best_model_at_end`: False
405
+ - `ignore_data_skip`: False
406
+ - `fsdp`: []
407
+ - `fsdp_min_num_params`: 0
408
+ - `fsdp_config`: {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}
409
+ - `fsdp_transformer_layer_cls_to_wrap`: None
410
+ - `accelerator_config`: {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}
411
+ - `deepspeed`: None
412
+ - `label_smoothing_factor`: 0.0
413
+ - `optim`: adamw_torch
414
+ - `optim_args`: None
415
+ - `adafactor`: False
416
+ - `group_by_length`: False
417
+ - `length_column_name`: length
418
+ - `ddp_find_unused_parameters`: None
419
+ - `ddp_bucket_cap_mb`: None
420
+ - `ddp_broadcast_buffers`: False
421
+ - `dataloader_pin_memory`: True
422
+ - `dataloader_persistent_workers`: False
423
+ - `skip_memory_metrics`: True
424
+ - `use_legacy_prediction_loop`: False
425
+ - `push_to_hub`: False
426
+ - `resume_from_checkpoint`: None
427
+ - `hub_model_id`: None
428
+ - `hub_strategy`: every_save
429
+ - `hub_private_repo`: None
430
+ - `hub_always_push`: False
431
+ - `gradient_checkpointing`: False
432
+ - `gradient_checkpointing_kwargs`: None
433
+ - `include_inputs_for_metrics`: False
434
+ - `include_for_metrics`: []
435
+ - `eval_do_concat_batches`: True
436
+ - `fp16_backend`: auto
437
+ - `push_to_hub_model_id`: None
438
+ - `push_to_hub_organization`: None
439
+ - `mp_parameters`:
440
+ - `auto_find_batch_size`: False
441
+ - `full_determinism`: False
442
+ - `torchdynamo`: None
443
+ - `ray_scope`: last
444
+ - `ddp_timeout`: 1800
445
+ - `torch_compile`: False
446
+ - `torch_compile_backend`: None
447
+ - `torch_compile_mode`: None
448
+ - `include_tokens_per_second`: False
449
+ - `include_num_input_tokens_seen`: False
450
+ - `neftune_noise_alpha`: None
451
+ - `optim_target_modules`: None
452
+ - `batch_eval_metrics`: False
453
+ - `eval_on_start`: False
454
+ - `use_liger_kernel`: False
455
+ - `eval_use_gather_object`: False
456
+ - `average_tokens_across_devices`: False
457
+ - `prompts`: None
458
+ - `batch_sampler`: batch_sampler
459
+ - `multi_dataset_batch_sampler`: round_robin
460
+
461
+ </details>
462
+
463
+ ### Training Logs
464
+ | Epoch | Step | Training Loss |
465
+ |:------:|:----:|:-------------:|
466
+ | 1.4245 | 500 | 0.1336 |
467
+ | 2.8490 | 1000 | 0.0787 |
468
+
469
+
470
+ ### Framework Versions
471
+ - Python: 3.12.3
472
+ - Sentence Transformers: 4.1.0
473
+ - Transformers: 4.52.4
474
+ - PyTorch: 2.7.0+cu128
475
+ - Accelerate: 1.7.0
476
+ - Datasets: 3.6.0
477
+ - Tokenizers: 0.21.1
478
+
479
+ ## Citation
480
+
481
+ ### BibTeX
482
+
483
+ #### Sentence Transformers
484
+ ```bibtex
485
+ @inproceedings{reimers-2019-sentence-bert,
486
+ title = "Sentence-BERT: Sentence Embeddings using Siamese BERT-Networks",
487
+ author = "Reimers, Nils and Gurevych, Iryna",
488
+ booktitle = "Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing",
489
+ month = "11",
490
+ year = "2019",
491
+ publisher = "Association for Computational Linguistics",
492
+ url = "https://arxiv.org/abs/1908.10084",
493
+ }
494
+ ```
495
+
496
+ <!--
497
+ ## Glossary
498
+
499
+ *Clearly define terms in order to be accessible across audiences.*
500
+ -->
501
+
502
+ <!--
503
+ ## Model Card Authors
504
+
505
+ *Lists the people who create the model card, providing recognition and accountability for the detailed work that goes into its construction.*
506
+ -->
507
+
508
+ <!--
509
+ ## Model Card Contact
510
+
511
+ *Provides a way for people who have updates to the Model Card, suggestions, or questions, to contact the Model Card authors.*
512
+ -->
checkpoints/checkpoint-1050/1_Pooling/config.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "word_embedding_dimension": 768,
3
+ "pooling_mode_cls_token": true,
4
+ "pooling_mode_mean_tokens": false,
5
+ "pooling_mode_max_tokens": false,
6
+ "pooling_mode_mean_sqrt_len_tokens": false,
7
+ "pooling_mode_weightedmean_tokens": false,
8
+ "pooling_mode_lasttoken": false,
9
+ "include_prompt": true
10
+ }
checkpoints/checkpoint-1050/README.md ADDED
@@ -0,0 +1,512 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - sentence-transformers
4
+ - sentence-similarity
5
+ - feature-extraction
6
+ - generated_from_trainer
7
+ - dataset_size:5604
8
+ - loss:CosineSimilarityLoss
9
+ base_model: BAAI/bge-base-en-v1.5
10
+ widget:
11
+ - source_sentence: what are the powers of the virginia executive branch
12
+ sentences:
13
+ - The 49ers won five Super Bowl championships between 1981 and 1994. Four of those
14
+ came in the 1980s, and were led by Hall of Famers Joe Montana, Jerry Rice, Ronnie
15
+ Lott, Steve Young, Charles Haley, Fred Dean, and coaches Bill Walsh and George
16
+ Seifert. They have been division champions 22 times between 1970 and 2023, making
17
+ them one of the most successful teams in NFL history. The 49ers sit alone in NFL
18
+ history for most playoff wins (38), having been in the league playoffs 30 times
19
+ (29 times in the NFL and one time in the AAFC), and have also played in the most
20
+ NFC Championship games (19), hosting 11 of them, also an NFC record. The team
21
+ has set numerous notable NFL records, including most consecutive away games won
22
+ (18), most consecutive seasons leading the league in scoring (4), most consecutive
23
+ games scored (420 games from 1977 to 2004), most field goals in a season (44),
24
+ most games won in a season (18), and most touchdowns (8) and points scored (55)
25
+ in a Super Bowl. According to Forbes, the 49ers are the sixth most valuable team
26
+ in the NFL, valued at $6.8 billion as of August 2024. In June 2023, the enterprise
27
+ branch of the 49ers completed the acquisition of English soccer club Leeds United
28
+ and in May 2025, it acquired 51% of Scottish soccer club Rangers F.C.
29
+ - In 2008, Triarc purchased Wendy's, and changed its name to Wendy's/Arby's Group,
30
+ to reflect their core businesses. In January 2011, it was announced that Wendy's/Arby's
31
+ Group were looking into selling the Arby's side of the business to focus on the
32
+ Wendy's brand. It was officially announced the companies would split on January
33
+ 21, 2011. In 2009, the Wendy's/Arby's Group signed a franchise deal with the Al
34
+ Jammaz Group of Saudi Arabia to open dual-branded Wendy's/Arby's through the Middle
35
+ East with the first location opening in Dubai in the United Arab Emirates in May
36
+ 2010. The Wendy's/Arby's Group also signed a similar franchise deal in June 2010
37
+ with Tab Gida Sanayi ve Ticaret to open dual-branded restaurants in Turkey. After
38
+ the split, the former Wendy's/Arby's Group became The Wendy's Company.
39
+ - 'Executive: The Chief Executive is responsible for enforcing regional law, can
40
+ force reconsideration of legislation, and appoints Executive Council members and
41
+ principal officials. Acting with the Executive Council, the Chief Executive-in-Council
42
+ can propose new bills, issue subordinate legislation, and has authority to dissolve
43
+ the legislature. In states of emergency or public danger, the Chief Executive-in-Council
44
+ is further empowered to enact any regulation necessary to restore public order.
45
+ Legislature: The unicameral Legislative Council enacts regional law, approves
46
+ budgets, and has the power to impeach a sitting chief executive. Judiciary: The
47
+ Hong Kong Court of Final Appeal and lower courts interpret laws and overturn those
48
+ inconsistent with the Basic Law. Judges are appointed by the chief executive on
49
+ the advice of a recommendation commission. The chief executive is the head of
50
+ government and serves for a maximum of two five-year terms. The State Council
51
+ (led by the Premier of China) appoints the chief executive after nomination by
52
+ the Election Committee, which is composed of 1500 business, community, and government
53
+ leaders.'
54
+ - source_sentence: how many chromosomes does a human diploid cell have
55
+ sentences:
56
+ - The Peace of Cateau-Cambrésis in 1559 concluded the war with France, leaving Spain
57
+ at a considerable advantage. However, the government was still mired in debt,
58
+ and declared bankruptcy that year. Most of the government's revenues came from
59
+ taxes and excise duties, not imported silver and other goods. The Ottoman Empire
60
+ had long menaced the fringes of the Habsburg dominions in Austria and northwest
61
+ Africa. In response Ferdinand and Isabella had sent expeditions to North Africa,
62
+ capturing Melilla in 1497 and Oran in 1509. Charles had preferred to combat the
63
+ Ottomans through a considerably more maritime strategy, hampering Ottoman landings
64
+ on the Venetian territories in the Eastern Mediterranean. Only in response to
65
+ raids on the eastern coast of Spain did Charles personally lead attacks against
66
+ holdings in North Africa (1535). In 1560, the Ottomans battled the Spanish Navy
67
+ off the coast of Tunisia, but in 1565 Ottoman troops landing on the strategically
68
+ vital island of Malta, defended by the Knights of St. John, were defeated. The
69
+ death of Suleiman the Magnificent the following year and his succession by Selim
70
+ II emboldened Philip, who resolved to carry the war to the Ottoman homelands.
71
+ In 1571, a mixed naval expedition of Spanish, Venetian, and Papal ships led by
72
+ Charles' illegitimate son Don John of Austria annihilated the Ottoman fleet at
73
+ the Battle of Lepanto, in the largest naval battle fought in European waters since
74
+ Actium in 31 BC. The fleet included Miguel de Cervantes, future author of the
75
+ historic Spanish novel Don Quixote
76
+ - 'The 1930s were the team''s first golden era, when they improved their game through
77
+ play with more experienced teams. The Combinado del Pacífico (a squad composed
78
+ of Chilean and Peruvian footballers) toured Europe from 1933 to 1934. Starting
79
+ with Ciclista Lima in 1926, Peru''s football clubs toured Latin America with much
80
+ success. During one of these tours—Alianza Lima''s undefeated journey through
81
+ Chile in 1935—emerged the Rodillo Negro ("Black Roller"), a skillful group led
82
+ by forwards Alejandro Villanueva, Teodoro Fernández and goalkeeper Juan Valdivieso.
83
+ Sports historian Richard Witzig described these three as "a soccer triumvirate
84
+ unsurpassed in the world at that time", citing their combined innovation and effectiveness
85
+ at both ends of the field. Peru and the Rodillo Negro impressed at the 1936 Summer
86
+ Olympics, won the inaugural Bolivarian Games in 1938, and finished the decade
87
+ as South American champions. Historian David Goldblatt assessed the decline of
88
+ its previous success: "despite all the apparent preconditions for footballing
89
+ growth and success, Peruvian football disappeared". He attributes this sudden
90
+ decline to Peruvian authorities'' repression of "social, sporting and political
91
+ organisations among the urban and rural poor" during the 1940s and 1950s. Nevertheless,
92
+ Peru performed creditably at the South American Championships, placing third in
93
+ Brazil 1949 and Chile 1955, and missed qualification for the Sweden 1958 World
94
+ Cup finals, over two legs to eventual champions Brazil.'
95
+ - In 1939, at the start of World War II, Poland was partitioned between Nazi Germany
96
+ and the Soviet Union (see Molotov–Ribbentrop Pact). One-fifth of the Polish population
97
+ perished during World War II; the 3,000,000 Polish Jews murdered in the Holocaust,
98
+ who constituted 90% of Polish Jewry, made up half of all Poles killed during the
99
+ war. While the Holocaust occurred largely in German-occupied Poland, it was orchestrated
100
+ and perpetrated by the Nazis. Polish attitudes to the Holocaust varied widely,
101
+ from actively risking death in order to save Jewish lives, and passive refusal
102
+ to inform on them, to indifference, blackmail, and in extreme cases, committing
103
+ premeditated murders such as in the Jedwabne pogrom. Collaboration by non-Jewish
104
+ Polish citizens in the Holocaust was sporadic, but incidents of hostility against
105
+ Jews are well documented and have been a subject of renewed scholarly interest
106
+ during the 21st century.
107
+ - source_sentence: what is the difference between ice brent crude and wti crude
108
+ sentences:
109
+ - ==== Spring and Autumn period (722–476 BC) ====
110
+ - SpaceX has also bought and is modifying several residential properties in Boca
111
+ Chica Village, but apparently planning to leave them in residential use, about
112
+ 2 miles (3.2 km) west of the launch site. In September 2019, SpaceX extended an
113
+ offer to buy each of the houses in Boca Chica Village for three times the fair
114
+ market value along with an offer of VIP invitations to future launch events. The
115
+ 3x offer was said to be "non-negotiable." Homeowners were given two weeks for
116
+ this particular offer to remain valid. In January 2024, the Texas Parks and Wildlife
117
+ Department announced a proposal to transfer 43 acres of Boca Chica State Park
118
+ lands to SpaceX, in exchange for 477 new acres to be added to the Laguna Atascosa
119
+ National Wildlife Refuge.
120
+ - However, exclusive US control of this resource was eventually challenged, and
121
+ the Bering Sea Controversy resulted when the United States seized over 150 sealing
122
+ ships flying the British flag, based out of the coast of British Columbia. The
123
+ conflict between the United States and Britain was resolved by an arbitration
124
+ tribunal in 1893. The waters of the Bering Sea were deemed to be international
125
+ waters, contrary to the US contention that they were an internal sea. The US was
126
+ required to make a payment to Britain, and both nations were required to follow
127
+ regulations developed to preserve the resource.
128
+ - source_sentence: why is there a citgo sign in boston
129
+ sentences:
130
+ - Tucker appeared on Terri Clark's 2012 album Classic in a remake duet of her first
131
+ single "Delta Dawn". In June 2017, Tucker was featured in Rolling Stone as one
132
+ of the 100 Greatest Country Artists of All Time. After the death of former flame
133
+ Glen Campbell on August 8, 2017, Tucker released her first single since 2009,
134
+ "Forever Loving You", a song co-penned by Tennessee State Senator Rusty Crowe.
135
+ The song's release the following day, on the eve of Campbell's funeral, drew ire
136
+ and criticism being exploitative. Tucker claimed that a portion of the proceeds
137
+ will benefit the Alzheimer's Foundation of America, but the foundation stated
138
+ it was not involved in the promotion and has not received any funds. Tucker released
139
+ While I'm Livin', her first collection of original material since 2002's Tanya,
140
+ in 2019 via Fantasy Records. It was produced by Shooter Jennings and Brandi Carlile,
141
+ with Carlile brought onto the project after initially being approached for songs
142
+ by Jennings but after having professed such an admiration of Tucker and her work,
143
+ Jennings felt it necessary for her to co-produce the record alongside him. Tucker
144
+ performed "Bring My Flowers Now" at Loretta Lynn's all-star 87th birthday concert
145
+ at Nashville's Bridgestone Arena with Carlile playing piano. The album's first
146
+ single, "Hard Luck", was released on June 28, along with its accompanying music
147
+ video.
148
+ - ==== Golf ==== Numerous golf courses can be found in the city, with the most famous
149
+ being Bay Hill Club and Lodge, home to the Arnold Palmer Invitational. == Culture
150
+ ==
151
+ - The massive Islamic invasions of the mid-7th century began a long struggle between
152
+ Christianity and Islam throughout the Mediterranean Basin. The Byzantine Empire
153
+ soon lost the lands of the eastern patriarchates of Jerusalem, Alexandria and
154
+ Antioch and was reduced to that of Constantinople, the empire's capital. As a
155
+ result of Islamic domination of the Mediterranean, the Frankish state, centred
156
+ away from that sea, was able to evolve as the dominant power that shaped the Western
157
+ Europe of the Middle Ages. The battles of Toulouse and Tours halted the Islamic
158
+ advance in the West and the failed siege of Constantinople halted it in the East.
159
+ Two or three decades later, in 751, the Byzantine Empire lost to the Lombards
160
+ the city of Ravenna from which it governed the small fragments of Italy, including
161
+ Rome, that acknowledged its sovereignty. The fall of Ravenna meant that confirmation
162
+ by a no longer existent exarch was not asked for during the election in 752 of
163
+ Pope Stephen II, and that the papacy was forced to look elsewhere for a civil
164
+ power to protect it. In 754, at the urgent request of Pope Stephen, the Frankish
165
+ king Pepin the Short conquered the Lombards. He then gifted the lands of the former
166
+ exarchate to the pope, initiating the Papal States. In the 860s, Rome and the
167
+ Byzantine East were in conflict during the Photian schism, when Photius criticized
168
+ the Latin west for adding of the filioque clause, after being excommunicated by
169
+ Nicholas I. Though the schism was reconciled, unresolved issues would lead to
170
+ further division.
171
+ - source_sentence: who organized the native resistance to the british
172
+ sentences:
173
+ - === Engines === == Fifth generation (WL; 2021) ==
174
+ - '=== Unitarism === All states are unitary states, not federations or aggregates
175
+ of local governments. Local governments within them are created by and exist by
176
+ virtue of state law, and local governments within each state are subject to the
177
+ central authority of that particular state. State governments commonly delegate
178
+ some authority to local units and channel policy decisions down to them for implementation.
179
+ In a few states, local units of government are permitted a degree of home rule
180
+ over various matters. The prevailing legal theory of state preeminence over local
181
+ governments, referred to as Dillon''s Rule, holds that, A municipal corporation
182
+ possesses and can exercise the following powers and no others: First, those granted
183
+ in express words; second, those necessarily implied or necessarily incident to
184
+ the powers expressly granted; third, those absolutely essential to the declared
185
+ objects and purposes of the corporation—not simply convenient but indispensable;
186
+ fourth, any fair doubt as to the existence of power is resolved by the courts
187
+ against the corporation—against the existence of the powers. Each state defines
188
+ for itself what powers it will allow local governments. Generally, four categories
189
+ of power may be given to local jurisdictions: Structural – power to choose the
190
+ form of government, charter and enact charter revisions, Functional – power to
191
+ exercise local self-government in a broad or limited manner, Fiscal – authority
192
+ to determine revenue sources, set tax rates, borrow funds and other related financial
193
+ activities, Personnel – authority to set employment rules, remuneration rates,
194
+ employment conditions and collective bargaining. == Relationships =='
195
+ - Throughout the war, the British deported the Acadians to the Thirteen Colonies
196
+ and Europe, which the Acadian militias resisted with assistance from Mi'kmaq and
197
+ Malisteet forces. The Great Upheaval continued from 1755 to 1764. In 1756, a large
198
+ force of French, Canadians, and their Native American allies led by the Marquis
199
+ de Montcalm launched an attack against the key British post at Fort Oswego on
200
+ Lake Ontario from Fort Frontenac and forced the garrison to surrender. The following
201
+ year Montcalm with a huge force of 7,200 French and Canadian troops and 2,400
202
+ Native Americans laid siege to Fort William Henry on the southern shores of Lake
203
+ George, and after three weeks of fighting the British commander Monroe surrendered.
204
+ Montcalm gave him honorable terms to return to England and not to fight for 18
205
+ months. And yet, when the British force with civilians was three miles from the
206
+ fort, the Native American allies massacred about 1,100 of the 1,500 strong force.
207
+ pipeline_tag: sentence-similarity
208
+ library_name: sentence-transformers
209
+ ---
210
+
211
+ # SentenceTransformer based on BAAI/bge-base-en-v1.5
212
+
213
+ This is a [sentence-transformers](https://www.SBERT.net) model finetuned from [BAAI/bge-base-en-v1.5](https://huggingface.co/BAAI/bge-base-en-v1.5). It maps sentences & paragraphs to a 768-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more.
214
+
215
+ ## Model Details
216
+
217
+ ### Model Description
218
+ - **Model Type:** Sentence Transformer
219
+ - **Base model:** [BAAI/bge-base-en-v1.5](https://huggingface.co/BAAI/bge-base-en-v1.5) <!-- at revision a5beb1e3e68b9ab74eb54cfd186867f64f240e1a -->
220
+ - **Maximum Sequence Length:** 512 tokens
221
+ - **Output Dimensionality:** 768 dimensions
222
+ - **Similarity Function:** Cosine Similarity
223
+ <!-- - **Training Dataset:** Unknown -->
224
+ <!-- - **Language:** Unknown -->
225
+ <!-- - **License:** Unknown -->
226
+
227
+ ### Model Sources
228
+
229
+ - **Documentation:** [Sentence Transformers Documentation](https://sbert.net)
230
+ - **Repository:** [Sentence Transformers on GitHub](https://github.com/UKPLab/sentence-transformers)
231
+ - **Hugging Face:** [Sentence Transformers on Hugging Face](https://huggingface.co/models?library=sentence-transformers)
232
+
233
+ ### Full Model Architecture
234
+
235
+ ```
236
+ SentenceTransformer(
237
+ (0): Transformer({'max_seq_length': 512, 'do_lower_case': True}) with Transformer model: BertModel
238
+ (1): Pooling({'word_embedding_dimension': 768, 'pooling_mode_cls_token': True, 'pooling_mode_mean_tokens': False, 'pooling_mode_max_tokens': False, 'pooling_mode_mean_sqrt_len_tokens': False, 'pooling_mode_weightedmean_tokens': False, 'pooling_mode_lasttoken': False, 'include_prompt': True})
239
+ (2): Normalize()
240
+ )
241
+ ```
242
+
243
+ ## Usage
244
+
245
+ ### Direct Usage (Sentence Transformers)
246
+
247
+ First install the Sentence Transformers library:
248
+
249
+ ```bash
250
+ pip install -U sentence-transformers
251
+ ```
252
+
253
+ Then you can load this model and run inference.
254
+ ```python
255
+ from sentence_transformers import SentenceTransformer
256
+
257
+ # Download from the 🤗 Hub (replace the placeholder ID below with this model's Hub repo ID or a local path)
258
+ model = SentenceTransformer("sentence_transformers_model_id")
259
+ # Run inference
260
+ sentences = [
261
+ 'who organized the native resistance to the british',
262
+ "Throughout the war, the British deported the Acadians to the Thirteen Colonies and Europe, which the Acadian militias resisted with assistance from Mi'kmaq and Malisteet forces. The Great Upheaval continued from 1755 to 1764. In 1756, a large force of French, Canadians, and their Native American allies led by the Marquis de Montcalm launched an attack against the key British post at Fort Oswego on Lake Ontario from Fort Frontenac and forced the garrison to surrender. The following year Montcalm with a huge force of 7,200 French and Canadian troops and 2,400 Native Americans laid siege to Fort William Henry on the southern shores of Lake George, and after three weeks of fighting the British commander Monroe surrendered. Montcalm gave him honorable terms to return to England and not to fight for 18 months. And yet, when the British force with civilians was three miles from the fort, the Native American allies massacred about 1,100 of the 1,500 strong force.",
263
+ "=== Unitarism === All states are unitary states, not federations or aggregates of local governments. Local governments within them are created by and exist by virtue of state law, and local governments within each state are subject to the central authority of that particular state. State governments commonly delegate some authority to local units and channel policy decisions down to them for implementation. In a few states, local units of government are permitted a degree of home rule over various matters. The prevailing legal theory of state preeminence over local governments, referred to as Dillon's Rule, holds that, A municipal corporation possesses and can exercise the following powers and no others: First, those granted in express words; second, those necessarily implied or necessarily incident to the powers expressly granted; third, those absolutely essential to the declared objects and purposes of the corporation—not simply convenient but indispensable; fourth, any fair doubt as to the existence of power is resolved by the courts against the corporation—against the existence of the powers. Each state defines for itself what powers it will allow local governments. Generally, four categories of power may be given to local jurisdictions: Structural – power to choose the form of government, charter and enact charter revisions, Functional – power to exercise local self-government in a broad or limited manner, Fiscal – authority to determine revenue sources, set tax rates, borrow funds and other related financial activities, Personnel – authority to set employment rules, remuneration rates, employment conditions and collective bargaining. == Relationships ==",
264
+ ]
265
+ embeddings = model.encode(sentences)
266
+ print(embeddings.shape)
267
+ # (3, 768)
268
+
269
+ # Get the similarity scores for the embeddings
270
+ similarities = model.similarity(embeddings, embeddings)
271
+ print(similarities.shape)
272
+ # torch.Size([3, 3])
273
+ ```
274
+
275
+ <!--
276
+ ### Direct Usage (Transformers)
277
+
278
+ <details><summary>Click to see the direct usage in Transformers</summary>
279
+
280
+ </details>
281
+ -->
282
+
283
+ <!--
284
+ ### Downstream Usage (Sentence Transformers)
285
+
286
+ You can finetune this model on your own dataset.
287
+
288
+ <details><summary>Click to expand</summary>
289
+
290
+ </details>
291
+ -->
292
+
293
+ <!--
294
+ ### Out-of-Scope Use
295
+
296
+ *List how the model may foreseeably be misused and address what users ought not to do with the model.*
297
+ -->
298
+
299
+ <!--
300
+ ## Bias, Risks and Limitations
301
+
302
+ *What are the known or foreseeable issues stemming from this model? You could also flag here known failure cases or weaknesses of the model.*
303
+ -->
304
+
305
+ <!--
306
+ ### Recommendations
307
+
308
+ *What are recommendations with respect to the foreseeable issues? For example, filtering explicit content.*
309
+ -->
310
+
311
+ ## Training Details
312
+
313
+ ### Training Dataset
314
+
315
+ #### Unnamed Dataset
316
+
317
+ * Size: 5,604 training samples
318
+ * Columns: <code>sentence_0</code>, <code>sentence_1</code>, and <code>label</code>
319
+ * Approximate statistics based on the first 1000 samples:
320
+ | | sentence_0 | sentence_1 | label |
321
+ |:--------|:-----------------------------------------------------------------------------------|:------------------------------------------------------------------------------------|:---------------------------------------------------------------|
322
+ | type | string | string | float |
323
+ | details | <ul><li>min: 10 tokens</li><li>mean: 11.84 tokens</li><li>max: 25 tokens</li></ul> | <ul><li>min: 8 tokens</li><li>mean: 218.19 tokens</li><li>max: 322 tokens</li></ul> | <ul><li>min: 0.0</li><li>mean: 0.37</li><li>max: 1.0</li></ul> |
324
+ * Samples:
325
+ | sentence_0 | sentence_1 | label |
326
+ |:-----------------------------------------------------------------------------------------------------------|:---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|:-----------------|
327
+ | <code>who played guitar solo on reeling in the years</code> | <code>Eric Patrick Clapton (born 30 March 1945) is an English rock and blues guitarist, singer, and songwriter. He is regarded as one of the most successful and influential guitarists in rock music. Clapton ranked second in Rolling Stone's list of the "100 Greatest Guitarists of All Time" and fourth in Gibson's "Top 50 Guitarists of All Time". He was named number five in Time magazine's list of "The 10 Best Electric Guitar Players" in 2009. After playing in a number of different local bands, Clapton joined the Yardbirds from 1963 to 1965, and John Mayall & the Bluesbreakers from 1965 to 1966. After leaving Mayall, he formed the power trio Cream with drummer Ginger Baker and bassist/vocalist Jack Bruce, in which Clapton played sustained blues improvisations and "arty, blues-based psychedelic pop". After four successful albums, Cream broke up in November 1968. Clapton then formed the blues rock band Blind Faith with Baker, Steve Winwood, and Ric Grech, recording one album and performing on one...</code> | <code>1.0</code> |
328
+ | <code>how a population of wolves may have undergone speciation to form the first population of dogs</code> | <code>Geological evidence suggests that approximately 3 million years ago, South America became connected to North America when the Bolivar Trough marine barrier disappeared and the Panamanian land bridge formed. The joining of these two land masses led to the Great American Interchange, in which biota from both continents expanded their ranges. The first species known to have made the northward migration was Pliometanastes, a fossil ground sloth roughly the size of a modern black bear. Migrations to the Southern Hemisphere were undertaken by several North American mammalian carnivores. Fewer species migrated in the opposite direction from south to north. The result of the expansion of a North American fauna was a mass extinction in which hundreds of species disappeared in a relatively short time. About 60% of present-day South American mammals have evolved from North American species. Some South American species were able to adapt and spread into North America. Apart from Pliometanastes, du...</code> | <code>1.0</code> |
329
+ | <code>who is credited with promoting the use of factor analysis and why</code> | <code>The enemies of President Davis proposed that the Confederacy "died of Davis". He was unfavorably compared to George Washington by critics such as Edward Alfred Pollard, editor of the most influential newspaper in the Confederacy, the Daily Richmond Examiner. Beyond the early honeymoon period, Davis was never popular. Ellis Merton Coulter, viewed by historians as a Confederate apologist, argues that Davis was unable to mobilize Confederate nationalism in support of his government effectively, and especially failed to appeal to the small farmers who made up the bulk of the population. Davis failed to build a network of supporters who would speak up when he came under criticism, and he repeatedly alienated governors and other state-based leaders by demanding centralized control of the war effort.</code> | <code>0.0</code> |
330
+ * Loss: [<code>CosineSimilarityLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#cosinesimilarityloss) with these parameters:
331
+ ```json
332
+ {
333
+ "loss_fct": "torch.nn.modules.loss.MSELoss"
334
+ }
335
+ ```
336
+
337
+ ### Training Hyperparameters
338
+ #### Non-Default Hyperparameters
339
+
340
+ - `per_device_train_batch_size`: 16
341
+ - `per_device_eval_batch_size`: 16
342
+ - `multi_dataset_batch_sampler`: round_robin
343
+
344
+ #### All Hyperparameters
345
+ <details><summary>Click to expand</summary>
346
+
347
+ - `overwrite_output_dir`: False
348
+ - `do_predict`: False
349
+ - `eval_strategy`: no
350
+ - `prediction_loss_only`: True
351
+ - `per_device_train_batch_size`: 16
352
+ - `per_device_eval_batch_size`: 16
353
+ - `per_gpu_train_batch_size`: None
354
+ - `per_gpu_eval_batch_size`: None
355
+ - `gradient_accumulation_steps`: 1
356
+ - `eval_accumulation_steps`: None
357
+ - `torch_empty_cache_steps`: None
358
+ - `learning_rate`: 5e-05
359
+ - `weight_decay`: 0.0
360
+ - `adam_beta1`: 0.9
361
+ - `adam_beta2`: 0.999
362
+ - `adam_epsilon`: 1e-08
363
+ - `max_grad_norm`: 1
364
+ - `num_train_epochs`: 3
365
+ - `max_steps`: -1
366
+ - `lr_scheduler_type`: linear
367
+ - `lr_scheduler_kwargs`: {}
368
+ - `warmup_ratio`: 0.0
369
+ - `warmup_steps`: 0
370
+ - `log_level`: passive
371
+ - `log_level_replica`: warning
372
+ - `log_on_each_node`: True
373
+ - `logging_nan_inf_filter`: True
374
+ - `save_safetensors`: True
375
+ - `save_on_each_node`: False
376
+ - `save_only_model`: False
377
+ - `restore_callback_states_from_checkpoint`: False
378
+ - `no_cuda`: False
379
+ - `use_cpu`: False
380
+ - `use_mps_device`: False
381
+ - `seed`: 42
382
+ - `data_seed`: None
383
+ - `jit_mode_eval`: False
384
+ - `use_ipex`: False
385
+ - `bf16`: False
386
+ - `fp16`: False
387
+ - `fp16_opt_level`: O1
388
+ - `half_precision_backend`: auto
389
+ - `bf16_full_eval`: False
390
+ - `fp16_full_eval`: False
391
+ - `tf32`: None
392
+ - `local_rank`: 0
393
+ - `ddp_backend`: None
394
+ - `tpu_num_cores`: None
395
+ - `tpu_metrics_debug`: False
396
+ - `debug`: []
397
+ - `dataloader_drop_last`: False
398
+ - `dataloader_num_workers`: 0
399
+ - `dataloader_prefetch_factor`: None
400
+ - `past_index`: -1
401
+ - `disable_tqdm`: False
402
+ - `remove_unused_columns`: True
403
+ - `label_names`: None
404
+ - `load_best_model_at_end`: False
405
+ - `ignore_data_skip`: False
406
+ - `fsdp`: []
407
+ - `fsdp_min_num_params`: 0
408
+ - `fsdp_config`: {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}
409
+ - `fsdp_transformer_layer_cls_to_wrap`: None
410
+ - `accelerator_config`: {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}
411
+ - `deepspeed`: None
412
+ - `label_smoothing_factor`: 0.0
413
+ - `optim`: adamw_torch
414
+ - `optim_args`: None
415
+ - `adafactor`: False
416
+ - `group_by_length`: False
417
+ - `length_column_name`: length
418
+ - `ddp_find_unused_parameters`: None
419
+ - `ddp_bucket_cap_mb`: None
420
+ - `ddp_broadcast_buffers`: False
421
+ - `dataloader_pin_memory`: True
422
+ - `dataloader_persistent_workers`: False
423
+ - `skip_memory_metrics`: True
424
+ - `use_legacy_prediction_loop`: False
425
+ - `push_to_hub`: False
426
+ - `resume_from_checkpoint`: None
427
+ - `hub_model_id`: None
428
+ - `hub_strategy`: every_save
429
+ - `hub_private_repo`: None
430
+ - `hub_always_push`: False
431
+ - `gradient_checkpointing`: False
432
+ - `gradient_checkpointing_kwargs`: None
433
+ - `include_inputs_for_metrics`: False
434
+ - `include_for_metrics`: []
435
+ - `eval_do_concat_batches`: True
436
+ - `fp16_backend`: auto
437
+ - `push_to_hub_model_id`: None
438
+ - `push_to_hub_organization`: None
439
+ - `mp_parameters`:
440
+ - `auto_find_batch_size`: False
441
+ - `full_determinism`: False
442
+ - `torchdynamo`: None
443
+ - `ray_scope`: last
444
+ - `ddp_timeout`: 1800
445
+ - `torch_compile`: False
446
+ - `torch_compile_backend`: None
447
+ - `torch_compile_mode`: None
448
+ - `include_tokens_per_second`: False
449
+ - `include_num_input_tokens_seen`: False
450
+ - `neftune_noise_alpha`: None
451
+ - `optim_target_modules`: None
452
+ - `batch_eval_metrics`: False
453
+ - `eval_on_start`: False
454
+ - `use_liger_kernel`: False
455
+ - `eval_use_gather_object`: False
456
+ - `average_tokens_across_devices`: False
457
+ - `prompts`: None
458
+ - `batch_sampler`: batch_sampler
459
+ - `multi_dataset_batch_sampler`: round_robin
460
+
461
+ </details>
462
+
463
+ ### Training Logs
464
+ | Epoch | Step | Training Loss |
465
+ |:------:|:----:|:-------------:|
466
+ | 1.4245 | 500 | 0.1336 |
467
+ | 2.8490 | 1000 | 0.0787 |
468
+
469
+
470
+ ### Framework Versions
471
+ - Python: 3.12.3
472
+ - Sentence Transformers: 4.1.0
473
+ - Transformers: 4.52.4
474
+ - PyTorch: 2.7.0+cu128
475
+ - Accelerate: 1.7.0
476
+ - Datasets: 3.6.0
477
+ - Tokenizers: 0.21.1
478
+
479
+ ## Citation
480
+
481
+ ### BibTeX
482
+
483
+ #### Sentence Transformers
484
+ ```bibtex
485
+ @inproceedings{reimers-2019-sentence-bert,
486
+ title = "Sentence-BERT: Sentence Embeddings using Siamese BERT-Networks",
487
+ author = "Reimers, Nils and Gurevych, Iryna",
488
+ booktitle = "Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing",
489
+ month = "11",
490
+ year = "2019",
491
+ publisher = "Association for Computational Linguistics",
492
+ url = "https://arxiv.org/abs/1908.10084",
493
+ }
494
+ ```
495
+
496
+ <!--
497
+ ## Glossary
498
+
499
+ *Clearly define terms in order to be accessible across audiences.*
500
+ -->
501
+
502
+ <!--
503
+ ## Model Card Authors
504
+
505
+ *Lists the people who create the model card, providing recognition and accountability for the detailed work that goes into its construction.*
506
+ -->
507
+
508
+ <!--
509
+ ## Model Card Contact
510
+
511
+ *Provides a way for people who have updates to the Model Card, suggestions, or questions, to contact the Model Card authors.*
512
+ -->
checkpoints/checkpoint-1050/config.json ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "BertModel"
4
+ ],
5
+ "attention_probs_dropout_prob": 0.1,
6
+ "classifier_dropout": null,
7
+ "gradient_checkpointing": false,
8
+ "hidden_act": "gelu",
9
+ "hidden_dropout_prob": 0.1,
10
+ "hidden_size": 768,
11
+ "id2label": {
12
+ "0": "LABEL_0"
13
+ },
14
+ "initializer_range": 0.02,
15
+ "intermediate_size": 3072,
16
+ "label2id": {
17
+ "LABEL_0": 0
18
+ },
19
+ "layer_norm_eps": 1e-12,
20
+ "max_position_embeddings": 512,
21
+ "model_type": "bert",
22
+ "num_attention_heads": 12,
23
+ "num_hidden_layers": 12,
24
+ "pad_token_id": 0,
25
+ "position_embedding_type": "absolute",
26
+ "torch_dtype": "float32",
27
+ "transformers_version": "4.52.4",
28
+ "type_vocab_size": 2,
29
+ "use_cache": true,
30
+ "vocab_size": 30522
31
+ }
checkpoints/checkpoint-1050/config_sentence_transformers.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "__version__": {
3
+ "sentence_transformers": "4.1.0",
4
+ "transformers": "4.52.4",
5
+ "pytorch": "2.7.0+cu128"
6
+ },
7
+ "prompts": {},
8
+ "default_prompt_name": null,
9
+ "similarity_fn_name": "cosine"
10
+ }
checkpoints/checkpoint-1050/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3c22492b93885a269f991e4912889fc64ca6c3858c1c70c987be738dcef7688
3
+ size 437951328
checkpoints/checkpoint-1050/modules.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "idx": 0,
4
+ "name": "0",
5
+ "path": "",
6
+ "type": "sentence_transformers.models.Transformer"
7
+ },
8
+ {
9
+ "idx": 1,
10
+ "name": "1",
11
+ "path": "1_Pooling",
12
+ "type": "sentence_transformers.models.Pooling"
13
+ },
14
+ {
15
+ "idx": 2,
16
+ "name": "2",
17
+ "path": "2_Normalize",
18
+ "type": "sentence_transformers.models.Normalize"
19
+ }
20
+ ]
checkpoints/checkpoint-1050/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f0ff831e8ebad83480d98bba5381f4ee4b2f5a4a19885a5ad94be0b4e29c149
3
+ size 871298443
checkpoints/checkpoint-1050/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89fa75f44154aa9bc84403650f7166a41d177f71d86d3b4b9da11dd2045ca9f9
3
+ size 14645
checkpoints/checkpoint-1050/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:356de2ffe1b65399b40bb30d5b2a7127c39f387944414d23149ed66c1ab0c34b
3
+ size 1465
checkpoints/checkpoint-1050/sentence_bert_config.json ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {
2
+ "max_seq_length": 512,
3
+ "do_lower_case": true
4
+ }
checkpoints/checkpoint-1050/special_tokens_map.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": {
3
+ "content": "[CLS]",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "mask_token": {
10
+ "content": "[MASK]",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": {
17
+ "content": "[PAD]",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "sep_token": {
24
+ "content": "[SEP]",
25
+ "lstrip": false,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ },
30
+ "unk_token": {
31
+ "content": "[UNK]",
32
+ "lstrip": false,
33
+ "normalized": false,
34
+ "rstrip": false,
35
+ "single_word": false
36
+ }
37
+ }
checkpoints/checkpoint-1050/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
checkpoints/checkpoint-1050/tokenizer_config.json ADDED
@@ -0,0 +1,58 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "[PAD]",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "100": {
12
+ "content": "[UNK]",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "101": {
20
+ "content": "[CLS]",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "102": {
28
+ "content": "[SEP]",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "103": {
36
+ "content": "[MASK]",
37
+ "lstrip": false,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ }
43
+ },
44
+ "clean_up_tokenization_spaces": true,
45
+ "cls_token": "[CLS]",
46
+ "do_basic_tokenize": true,
47
+ "do_lower_case": true,
48
+ "extra_special_tokens": {},
49
+ "mask_token": "[MASK]",
50
+ "model_max_length": 512,
51
+ "never_split": null,
52
+ "pad_token": "[PAD]",
53
+ "sep_token": "[SEP]",
54
+ "strip_accents": null,
55
+ "tokenize_chinese_chars": true,
56
+ "tokenizer_class": "BertTokenizer",
57
+ "unk_token": "[UNK]"
58
+ }
checkpoints/checkpoint-1050/trainer_state.json ADDED
@@ -0,0 +1,48 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_global_step": null,
3
+ "best_metric": null,
4
+ "best_model_checkpoint": null,
5
+ "epoch": 2.9914529914529915,
6
+ "eval_steps": 0,
7
+ "global_step": 1050,
8
+ "is_hyper_param_search": false,
9
+ "is_local_process_zero": true,
10
+ "is_world_process_zero": true,
11
+ "log_history": [
12
+ {
13
+ "epoch": 1.4245014245014245,
14
+ "grad_norm": 1.1360502243041992,
15
+ "learning_rate": 1.1673728813559325e-05,
16
+ "loss": 0.1336,
17
+ "step": 500
18
+ },
19
+ {
20
+ "epoch": 2.849002849002849,
21
+ "grad_norm": 1.3151546716690063,
22
+ "learning_rate": 1.0805084745762714e-06,
23
+ "loss": 0.0787,
24
+ "step": 1000
25
+ }
26
+ ],
27
+ "logging_steps": 500,
28
+ "max_steps": 1053,
29
+ "num_input_tokens_seen": 0,
30
+ "num_train_epochs": 3,
31
+ "save_steps": 175,
32
+ "stateful_callbacks": {
33
+ "TrainerControl": {
34
+ "args": {
35
+ "should_epoch_stop": false,
36
+ "should_evaluate": false,
37
+ "should_log": false,
38
+ "should_save": true,
39
+ "should_training_stop": false
40
+ },
41
+ "attributes": {}
42
+ }
43
+ },
44
+ "total_flos": 0.0,
45
+ "train_batch_size": 16,
46
+ "trial_name": null,
47
+ "trial_params": null
48
+ }
checkpoints/checkpoint-1050/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:435635c51c00ae7c9634e1f44d69a2daae13b846b1d2e6a26d23d637a11c7e7f
3
+ size 5969
checkpoints/checkpoint-1050/vocab.txt ADDED
The diff for this file is too large to render. See raw diff
 
checkpoints/checkpoint-1053/1_Pooling/config.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "word_embedding_dimension": 768,
3
+ "pooling_mode_cls_token": true,
4
+ "pooling_mode_mean_tokens": false,
5
+ "pooling_mode_max_tokens": false,
6
+ "pooling_mode_mean_sqrt_len_tokens": false,
7
+ "pooling_mode_weightedmean_tokens": false,
8
+ "pooling_mode_lasttoken": false,
9
+ "include_prompt": true
10
+ }
checkpoints/checkpoint-1053/README.md ADDED
@@ -0,0 +1,512 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - sentence-transformers
4
+ - sentence-similarity
5
+ - feature-extraction
6
+ - generated_from_trainer
7
+ - dataset_size:5604
8
+ - loss:CosineSimilarityLoss
9
+ base_model: BAAI/bge-base-en-v1.5
10
+ widget:
11
+ - source_sentence: what are the powers of the virginia executive branch
12
+ sentences:
13
+ - The 49ers won five Super Bowl championships between 1981 and 1994. Four of those
14
+ came in the 1980s, and were led by Hall of Famers Joe Montana, Jerry Rice, Ronnie
15
+ Lott, Steve Young, Charles Haley, Fred Dean, and coaches Bill Walsh and George
16
+ Seifert. They have been division champions 22 times between 1970 and 2023, making
17
+ them one of the most successful teams in NFL history. The 49ers sit alone in NFL
18
+ history for most playoff wins (38), having been in the league playoffs 30 times
19
+ (29 times in the NFL and one time in the AAFC), and have also played in the most
20
+ NFC Championship games (19), hosting 11 of them, also an NFC record. The team
21
+ has set numerous notable NFL records, including most consecutive away games won
22
+ (18), most consecutive seasons leading the league in scoring (4), most consecutive
23
+ games scored (420 games from 1977 to 2004), most field goals in a season (44),
24
+ most games won in a season (18), and most touchdowns (8) and points scored (55)
25
+ in a Super Bowl. According to Forbes, the 49ers are the sixth most valuable team
26
+ in the NFL, valued at $6.8 billion as of August 2024. In June 2023, the enterprise
27
+ branch of the 49ers completed the acquisition of English soccer club Leeds United
28
+ and in May 2025, it acquired 51% of Scottish soccer club Rangers F.C.
29
+ - In 2008, Triarc purchased Wendy's, and changed its name to Wendy's/Arby's Group,
30
+ to reflect their core businesses. In January 2011, it was announced that Wendy's/Arby's
31
+ Group were looking into selling the Arby's side of the business to focus on the
32
+ Wendy's brand. It was officially announced the companies would split on January
33
+ 21, 2011. In 2009, the Wendy's/Arby's Group signed a franchise deal with the Al
34
+ Jammaz Group of Saudi Arabia to open dual-branded Wendy's/Arby's through the Middle
35
+ East with the first location opening in Dubai in the United Arab Emirates in May
36
+ 2010. The Wendy's/Arby's Group also signed a similar franchise deal in June 2010
37
+ with Tab Gida Sanayi ve Ticaret to open dual-branded restaurants in Turkey. After
38
+ the split, the former Wendy's/Arby's Group became The Wendy's Company.
39
+ - 'Executive: The Chief Executive is responsible for enforcing regional law, can
40
+ force reconsideration of legislation, and appoints Executive Council members and
41
+ principal officials. Acting with the Executive Council, the Chief Executive-in-Council
42
+ can propose new bills, issue subordinate legislation, and has authority to dissolve
43
+ the legislature. In states of emergency or public danger, the Chief Executive-in-Council
44
+ is further empowered to enact any regulation necessary to restore public order.
45
+ Legislature: The unicameral Legislative Council enacts regional law, approves
46
+ budgets, and has the power to impeach a sitting chief executive. Judiciary: The
47
+ Hong Kong Court of Final Appeal and lower courts interpret laws and overturn those
48
+ inconsistent with the Basic Law. Judges are appointed by the chief executive on
49
+ the advice of a recommendation commission. The chief executive is the head of
50
+ government and serves for a maximum of two five-year terms. The State Council
51
+ (led by the Premier of China) appoints the chief executive after nomination by
52
+ the Election Committee, which is composed of 1500 business, community, and government
53
+ leaders.'
54
+ - source_sentence: how many chromosomes does a human diploid cell have
55
+ sentences:
56
+ - The Peace of Cateau-Cambrésis in 1559 concluded the war with France, leaving Spain
57
+ at a considerable advantage. However, the government was still mired in debt,
58
+ and declared bankruptcy that year. Most of the government's revenues came from
59
+ taxes and excise duties, not imported silver and other goods. The Ottoman Empire
60
+ had long menaced the fringes of the Habsburg dominions in Austria and northwest
61
+ Africa. In response Ferdinand and Isabella had sent expeditions to North Africa,
62
+ capturing Melilla in 1497 and Oran in 1509. Charles had preferred to combat the
63
+ Ottomans through a considerably more maritime strategy, hampering Ottoman landings
64
+ on the Venetian territories in the Eastern Mediterranean. Only in response to
65
+ raids on the eastern coast of Spain did Charles personally lead attacks against
66
+ holdings in North Africa (1535). In 1560, the Ottomans battled the Spanish Navy
67
+ off the coast of Tunisia, but in 1565 Ottoman troops landing on the strategically
68
+ vital island of Malta, defended by the Knights of St. John, were defeated. The
69
+ death of Suleiman the Magnificent the following year and his succession by Selim
70
+ II emboldened Philip, who resolved to carry the war to the Ottoman homelands.
71
+ In 1571, a mixed naval expedition of Spanish, Venetian, and Papal ships led by
72
+ Charles' illegitimate son Don John of Austria annihilated the Ottoman fleet at
73
+ the Battle of Lepanto, in the largest naval battle fought in European waters since
74
+ Actium in 31 BC. The fleet included Miguel de Cervantes, future author of the
75
+ historic Spanish novel Don Quixote
76
+ - 'The 1930s were the team''s first golden era, when they improved their game through
77
+ play with more experienced teams. The Combinado del Pacífico (a squad composed
78
+ of Chilean and Peruvian footballers) toured Europe from 1933 to 1934. Starting
79
+ with Ciclista Lima in 1926, Peru''s football clubs toured Latin America with much
80
+ success. During one of these tours—Alianza Lima''s undefeated journey through
81
+ Chile in 1935—emerged the Rodillo Negro ("Black Roller"), a skillful group led
82
+ by forwards Alejandro Villanueva, Teodoro Fernández and goalkeeper Juan Valdivieso.
83
+ Sports historian Richard Witzig described these three as "a soccer triumvirate
84
+ unsurpassed in the world at that time", citing their combined innovation and effectiveness
85
+ at both ends of the field. Peru and the Rodillo Negro impressed at the 1936 Summer
86
+ Olympics, won the inaugural Bolivarian Games in 1938, and finished the decade
87
+ as South American champions. Historian David Goldblatt assessed the decline of
88
+ its previous success: "despite all the apparent preconditions for footballing
89
+ growth and success, Peruvian football disappeared". He attributes this sudden
90
+ decline to Peruvian authorities'' repression of "social, sporting and political
91
+ organisations among the urban and rural poor" during the 1940s and 1950s. Nevertheless,
92
+ Peru performed creditably at the South American Championships, placing third in
93
+ Brazil 1949 and Chile 1955, and missed qualification for the Sweden 1958 World
94
+ Cup finals, over two legs to eventual champions Brazil.'
95
+ - In 1939, at the start of World War II, Poland was partitioned between Nazi Germany
96
+ and the Soviet Union (see Molotov–Ribbentrop Pact). One-fifth of the Polish population
97
+ perished during World War II; the 3,000,000 Polish Jews murdered in the Holocaust,
98
+ who constituted 90% of Polish Jewry, made up half of all Poles killed during the
99
+ war. While the Holocaust occurred largely in German-occupied Poland, it was orchestrated
100
+ and perpetrated by the Nazis. Polish attitudes to the Holocaust varied widely,
101
+ from actively risking death in order to save Jewish lives, and passive refusal
102
+ to inform on them, to indifference, blackmail, and in extreme cases, committing
103
+ premeditated murders such as in the Jedwabne pogrom. Collaboration by non-Jewish
104
+ Polish citizens in the Holocaust was sporadic, but incidents of hostility against
105
+ Jews are well documented and have been a subject of renewed scholarly interest
106
+ during the 21st century.
107
+ - source_sentence: what is the difference between ice brent crude and wti crude
108
+ sentences:
109
+ - ==== Spring and Autumn period (722–476 BC) ====
110
+ - SpaceX has also bought and is modifying several residential properties in Boca
111
+ Chica Village, but apparently planning to leave them in residential use, about
112
+ 2 miles (3.2 km) west of the launch site. In September 2019, SpaceX extended an
113
+ offer to buy each of the houses in Boca Chica Village for three times the fair
114
+ market value along with an offer of VIP invitations to future launch events. The
115
+ 3x offer was said to be "non-negotiable." Homeowners were given two weeks for
116
+ this particular offer to remain valid. In January 2024, the Texas Parks and Wildlife
117
+ Department announced a proposal to transfer 43 acres of Boca Chica State Park
118
+ lands to SpaceX, in exchange for 477 new acres to be added to the Laguna Atascosa
119
+ National Wildlife Refuge.
120
+ - However, exclusive US control of this resource was eventually challenged, and
121
+ the Bering Sea Controversy resulted when the United States seized over 150 sealing
122
+ ships flying the British flag, based out of the coast of British Columbia. The
123
+ conflict between the United States and Britain was resolved by an arbitration
124
+ tribunal in 1893. The waters of the Bering Sea were deemed to be international
125
+ waters, contrary to the US contention that they were an internal sea. The US was
126
+ required to make a payment to Britain, and both nations were required to follow
127
+ regulations developed to preserve the resource.
128
+ - source_sentence: why is there a citgo sign in boston
129
+ sentences:
130
+ - Tucker appeared on Terri Clark's 2012 album Classic in a remake duet of her first
131
+ single "Delta Dawn". In June 2017, Tucker was featured in Rolling Stone as one
132
+ of the 100 Greatest Country Artists of All Time. After the death of former flame
133
+ Glen Campbell on August 8, 2017, Tucker released her first single since 2009,
134
+ "Forever Loving You", a song co-penned by Tennessee State Senator Rusty Crowe.
135
+ The song's release the following day, on the eve of Campbell's funeral, drew ire
136
+ and criticism being exploitative. Tucker claimed that a portion of the proceeds
137
+ will benefit the Alzheimer's Foundation of America, but the foundation stated
138
+ it was not involved in the promotion and has not received any funds. Tucker released
139
+ While I'm Livin', her first collection of original material since 2002's Tanya,
140
+ in 2019 via Fantasy Records. It was produced by Shooter Jennings and Brandi Carlile,
141
+ with Carlile brought onto the project after initially being approached for songs
142
+ by Jennings but after having professed such an admiration of Tucker and her work,
143
+ Jennings felt it necessary for her to co-produce the record alongside him. Tucker
144
+ performed "Bring My Flowers Now" at Loretta Lynn's all-star 87th birthday concert
145
+ at Nashville's Bridgestone Arena with Carlile playing piano. The album's first
146
+ single, "Hard Luck", was released on June 28, along with its accompanying music
147
+ video.
148
+ - ==== Golf ==== Numerous golf courses can be found in the city, with the most famous
149
+ being Bay Hill Club and Lodge, home to the Arnold Palmer Invitational. == Culture
150
+ ==
151
+ - The massive Islamic invasions of the mid-7th century began a long struggle between
152
+ Christianity and Islam throughout the Mediterranean Basin. The Byzantine Empire
153
+ soon lost the lands of the eastern patriarchates of Jerusalem, Alexandria and
154
+ Antioch and was reduced to that of Constantinople, the empire's capital. As a
155
+ result of Islamic domination of the Mediterranean, the Frankish state, centred
156
+ away from that sea, was able to evolve as the dominant power that shaped the Western
157
+ Europe of the Middle Ages. The battles of Toulouse and Tours halted the Islamic
158
+ advance in the West and the failed siege of Constantinople halted it in the East.
159
+ Two or three decades later, in 751, the Byzantine Empire lost to the Lombards
160
+ the city of Ravenna from which it governed the small fragments of Italy, including
161
+ Rome, that acknowledged its sovereignty. The fall of Ravenna meant that confirmation
162
+ by a no longer existent exarch was not asked for during the election in 752 of
163
+ Pope Stephen II, and that the papacy was forced to look elsewhere for a civil
164
+ power to protect it. In 754, at the urgent request of Pope Stephen, the Frankish
165
+ king Pepin the Short conquered the Lombards. He then gifted the lands of the former
166
+ exarchate to the pope, initiating the Papal States. In the 860s, Rome and the
167
+ Byzantine East were in conflict during the Photian schism, when Photius criticized
168
+ the Latin west for adding of the filioque clause, after being excommunicated by
169
+ Nicholas I. Though the schism was reconciled, unresolved issues would lead to
170
+ further division.
171
+ - source_sentence: who organized the native resistance to the british
172
+ sentences:
173
+ - === Engines === == Fifth generation (WL; 2021) ==
174
+ - '=== Unitarism === All states are unitary states, not federations or aggregates
175
+ of local governments. Local governments within them are created by and exist by
176
+ virtue of state law, and local governments within each state are subject to the
177
+ central authority of that particular state. State governments commonly delegate
178
+ some authority to local units and channel policy decisions down to them for implementation.
179
+ In a few states, local units of government are permitted a degree of home rule
180
+ over various matters. The prevailing legal theory of state preeminence over local
181
+ governments, referred to as Dillon''s Rule, holds that, A municipal corporation
182
+ possesses and can exercise the following powers and no others: First, those granted
183
+ in express words; second, those necessarily implied or necessarily incident to
184
+ the powers expressly granted; third, those absolutely essential to the declared
185
+ objects and purposes of the corporation—not simply convenient but indispensable;
186
+ fourth, any fair doubt as to the existence of power is resolved by the courts
187
+ against the corporation—against the existence of the powers. Each state defines
188
+ for itself what powers it will allow local governments. Generally, four categories
189
+ of power may be given to local jurisdictions: Structural – power to choose the
190
+ form of government, charter and enact charter revisions, Functional – power to
191
+ exercise local self-government in a broad or limited manner, Fiscal – authority
192
+ to determine revenue sources, set tax rates, borrow funds and other related financial
193
+ activities, Personnel – authority to set employment rules, remuneration rates,
194
+ employment conditions and collective bargaining. == Relationships =='
195
+ - Throughout the war, the British deported the Acadians to the Thirteen Colonies
196
+ and Europe, which the Acadian militias resisted with assistance from Mi'kmaq and
197
+ Malisteet forces. The Great Upheaval continued from 1755 to 1764. In 1756, a large
198
+ force of French, Canadians, and their Native American allies led by the Marquis
199
+ de Montcalm launched an attack against the key British post at Fort Oswego on
200
+ Lake Ontario from Fort Frontenac and forced the garrison to surrender. The following
201
+ year Montcalm with a huge force of 7,200 French and Canadian troops and 2,400
202
+ Native Americans laid siege to Fort William Henry on the southern shores of Lake
203
+ George, and after three weeks of fighting the British commander Monroe surrendered.
204
+ Montcalm gave him honorable terms to return to England and not to fight for 18
205
+ months. And yet, when the British force with civilians was three miles from the
206
+ fort, the Native American allies massacred about 1,100 of the 1,500 strong force.
207
+ pipeline_tag: sentence-similarity
208
+ library_name: sentence-transformers
209
+ ---
210
+
211
+ # SentenceTransformer based on BAAI/bge-base-en-v1.5
212
+
213
+ This is a [sentence-transformers](https://www.SBERT.net) model finetuned from [BAAI/bge-base-en-v1.5](https://huggingface.co/BAAI/bge-base-en-v1.5). It maps sentences & paragraphs to a 768-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more.
214
+
215
+ ## Model Details
216
+
217
+ ### Model Description
218
+ - **Model Type:** Sentence Transformer
219
+ - **Base model:** [BAAI/bge-base-en-v1.5](https://huggingface.co/BAAI/bge-base-en-v1.5) <!-- at revision a5beb1e3e68b9ab74eb54cfd186867f64f240e1a -->
220
+ - **Maximum Sequence Length:** 512 tokens
221
+ - **Output Dimensionality:** 768 dimensions
222
+ - **Similarity Function:** Cosine Similarity
223
+ <!-- - **Training Dataset:** Unknown -->
224
+ <!-- - **Language:** Unknown -->
225
+ <!-- - **License:** Unknown -->
226
+
227
+ ### Model Sources
228
+
229
+ - **Documentation:** [Sentence Transformers Documentation](https://sbert.net)
230
+ - **Repository:** [Sentence Transformers on GitHub](https://github.com/UKPLab/sentence-transformers)
231
+ - **Hugging Face:** [Sentence Transformers on Hugging Face](https://huggingface.co/models?library=sentence-transformers)
232
+
233
+ ### Full Model Architecture
234
+
235
+ ```
236
+ SentenceTransformer(
237
+ (0): Transformer({'max_seq_length': 512, 'do_lower_case': True}) with Transformer model: BertModel
238
+ (1): Pooling({'word_embedding_dimension': 768, 'pooling_mode_cls_token': True, 'pooling_mode_mean_tokens': False, 'pooling_mode_max_tokens': False, 'pooling_mode_mean_sqrt_len_tokens': False, 'pooling_mode_weightedmean_tokens': False, 'pooling_mode_lasttoken': False, 'include_prompt': True})
239
+ (2): Normalize()
240
+ )
241
+ ```
242
+
243
+ ## Usage
244
+
245
+ ### Direct Usage (Sentence Transformers)
246
+
247
+ First install the Sentence Transformers library:
248
+
249
+ ```bash
250
+ pip install -U sentence-transformers
251
+ ```
252
+
253
+ Then you can load this model and run inference.
254
+ ```python
255
+ from sentence_transformers import SentenceTransformer
256
+
257
+ # Download from the 🤗 Hub (replace the placeholder id below with this model's Hub repo id or a local path)
258
+ model = SentenceTransformer("sentence_transformers_model_id")
259
+ # Run inference
260
+ sentences = [
261
+ 'who organized the native resistance to the british',
262
+ "Throughout the war, the British deported the Acadians to the Thirteen Colonies and Europe, which the Acadian militias resisted with assistance from Mi'kmaq and Malisteet forces. The Great Upheaval continued from 1755 to 1764. In 1756, a large force of French, Canadians, and their Native American allies led by the Marquis de Montcalm launched an attack against the key British post at Fort Oswego on Lake Ontario from Fort Frontenac and forced the garrison to surrender. The following year Montcalm with a huge force of 7,200 French and Canadian troops and 2,400 Native Americans laid siege to Fort William Henry on the southern shores of Lake George, and after three weeks of fighting the British commander Monroe surrendered. Montcalm gave him honorable terms to return to England and not to fight for 18 months. And yet, when the British force with civilians was three miles from the fort, the Native American allies massacred about 1,100 of the 1,500 strong force.",
263
+ "=== Unitarism === All states are unitary states, not federations or aggregates of local governments. Local governments within them are created by and exist by virtue of state law, and local governments within each state are subject to the central authority of that particular state. State governments commonly delegate some authority to local units and channel policy decisions down to them for implementation. In a few states, local units of government are permitted a degree of home rule over various matters. The prevailing legal theory of state preeminence over local governments, referred to as Dillon's Rule, holds that, A municipal corporation possesses and can exercise the following powers and no others: First, those granted in express words; second, those necessarily implied or necessarily incident to the powers expressly granted; third, those absolutely essential to the declared objects and purposes of the corporation—not simply convenient but indispensable; fourth, any fair doubt as to the existence of power is resolved by the courts against the corporation—against the existence of the powers. Each state defines for itself what powers it will allow local governments. Generally, four categories of power may be given to local jurisdictions: Structural – power to choose the form of government, charter and enact charter revisions, Functional – power to exercise local self-government in a broad or limited manner, Fiscal – authority to determine revenue sources, set tax rates, borrow funds and other related financial activities, Personnel – authority to set employment rules, remuneration rates, employment conditions and collective bargaining. == Relationships ==",
264
+ ]
265
+ embeddings = model.encode(sentences)
266
+ print(embeddings.shape)
267
+ # (3, 768)
268
+
269
+ # Get the similarity scores for the embeddings
270
+ similarities = model.similarity(embeddings, embeddings)
271
+ print(similarities.shape)
272
+ # torch.Size([3, 3])
273
+ ```
274
+
275
+ <!--
276
+ ### Direct Usage (Transformers)
277
+
278
+ <details><summary>Click to see the direct usage in Transformers</summary>
279
+
280
+ </details>
281
+ -->
282
+
283
+ <!--
284
+ ### Downstream Usage (Sentence Transformers)
285
+
286
+ You can finetune this model on your own dataset.
287
+
288
+ <details><summary>Click to expand</summary>
289
+
290
+ </details>
291
+ -->
292
+
293
+ <!--
294
+ ### Out-of-Scope Use
295
+
296
+ *List how the model may foreseeably be misused and address what users ought not to do with the model.*
297
+ -->
298
+
299
+ <!--
300
+ ## Bias, Risks and Limitations
301
+
302
+ *What are the known or foreseeable issues stemming from this model? You could also flag here known failure cases or weaknesses of the model.*
303
+ -->
304
+
305
+ <!--
306
+ ### Recommendations
307
+
308
+ *What are recommendations with respect to the foreseeable issues? For example, filtering explicit content.*
309
+ -->
310
+
311
+ ## Training Details
312
+
313
+ ### Training Dataset
314
+
315
+ #### Unnamed Dataset
316
+
317
+ * Size: 5,604 training samples
318
+ * Columns: <code>sentence_0</code>, <code>sentence_1</code>, and <code>label</code>
319
+ * Approximate statistics based on the first 1000 samples:
320
+ | | sentence_0 | sentence_1 | label |
321
+ |:--------|:-----------------------------------------------------------------------------------|:------------------------------------------------------------------------------------|:---------------------------------------------------------------|
322
+ | type | string | string | float |
323
+ | details | <ul><li>min: 10 tokens</li><li>mean: 11.84 tokens</li><li>max: 25 tokens</li></ul> | <ul><li>min: 8 tokens</li><li>mean: 218.19 tokens</li><li>max: 322 tokens</li></ul> | <ul><li>min: 0.0</li><li>mean: 0.37</li><li>max: 1.0</li></ul> |
324
+ * Samples:
325
+ | sentence_0 | sentence_1 | label |
326
+ |:-----------------------------------------------------------------------------------------------------------|:---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|:-----------------|
327
+ | <code>who played guitar solo on reeling in the years</code> | <code>Eric Patrick Clapton (born 30 March 1945) is an English rock and blues guitarist, singer, and songwriter. He is regarded as one of the most successful and influential guitarists in rock music. Clapton ranked second in Rolling Stone's list of the "100 Greatest Guitarists of All Time" and fourth in Gibson's "Top 50 Guitarists of All Time". He was named number five in Time magazine's list of "The 10 Best Electric Guitar Players" in 2009. After playing in a number of different local bands, Clapton joined the Yardbirds from 1963 to 1965, and John Mayall & the Bluesbreakers from 1965 to 1966. After leaving Mayall, he formed the power trio Cream with drummer Ginger Baker and bassist/vocalist Jack Bruce, in which Clapton played sustained blues improvisations and "arty, blues-based psychedelic pop". After four successful albums, Cream broke up in November 1968. Clapton then formed the blues rock band Blind Faith with Baker, Steve Winwood, and Ric Grech, recording one album and performing on one...</code> | <code>1.0</code> |
328
+ | <code>how a population of wolves may have undergone speciation to form the first population of dogs</code> | <code>Geological evidence suggests that approximately 3 million years ago, South America became connected to North America when the Bolivar Trough marine barrier disappeared and the Panamanian land bridge formed. The joining of these two land masses led to the Great American Interchange, in which biota from both continents expanded their ranges. The first species known to have made the northward migration was Pliometanastes, a fossil ground sloth roughly the size of a modern black bear. Migrations to the Southern Hemisphere were undertaken by several North American mammalian carnivores. Fewer species migrated in the opposite direction from south to north. The result of the expansion of a North American fauna was a mass extinction in which hundreds of species disappeared in a relatively short time. About 60% of present-day South American mammals have evolved from North American species. Some South American species were able to adapt and spread into North America. Apart from Pliometanastes, du...</code> | <code>1.0</code> |
329
+ | <code>who is credited with promoting the use of factor analysis and why</code> | <code>The enemies of President Davis proposed that the Confederacy "died of Davis". He was unfavorably compared to George Washington by critics such as Edward Alfred Pollard, editor of the most influential newspaper in the Confederacy, the Daily Richmond Examiner. Beyond the early honeymoon period, Davis was never popular. Ellis Merton Coulter, viewed by historians as a Confederate apologist, argues that Davis was unable to mobilize Confederate nationalism in support of his government effectively, and especially failed to appeal to the small farmers who made up the bulk of the population. Davis failed to build a network of supporters who would speak up when he came under criticism, and he repeatedly alienated governors and other state-based leaders by demanding centralized control of the war effort.</code> | <code>0.0</code> |
330
+ * Loss: [<code>CosineSimilarityLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#cosinesimilarityloss) with these parameters:
331
+ ```json
332
+ {
333
+ "loss_fct": "torch.nn.modules.loss.MSELoss"
334
+ }
335
+ ```
336
+
337
+ ### Training Hyperparameters
338
+ #### Non-Default Hyperparameters
339
+
340
+ - `per_device_train_batch_size`: 16
341
+ - `per_device_eval_batch_size`: 16
342
+ - `multi_dataset_batch_sampler`: round_robin
343
+
344
+ #### All Hyperparameters
345
+ <details><summary>Click to expand</summary>
346
+
347
+ - `overwrite_output_dir`: False
348
+ - `do_predict`: False
349
+ - `eval_strategy`: no
350
+ - `prediction_loss_only`: True
351
+ - `per_device_train_batch_size`: 16
352
+ - `per_device_eval_batch_size`: 16
353
+ - `per_gpu_train_batch_size`: None
354
+ - `per_gpu_eval_batch_size`: None
355
+ - `gradient_accumulation_steps`: 1
356
+ - `eval_accumulation_steps`: None
357
+ - `torch_empty_cache_steps`: None
358
+ - `learning_rate`: 5e-05
359
+ - `weight_decay`: 0.0
360
+ - `adam_beta1`: 0.9
361
+ - `adam_beta2`: 0.999
362
+ - `adam_epsilon`: 1e-08
363
+ - `max_grad_norm`: 1
364
+ - `num_train_epochs`: 3
365
+ - `max_steps`: -1
366
+ - `lr_scheduler_type`: linear
367
+ - `lr_scheduler_kwargs`: {}
368
+ - `warmup_ratio`: 0.0
369
+ - `warmup_steps`: 0
370
+ - `log_level`: passive
371
+ - `log_level_replica`: warning
372
+ - `log_on_each_node`: True
373
+ - `logging_nan_inf_filter`: True
374
+ - `save_safetensors`: True
375
+ - `save_on_each_node`: False
376
+ - `save_only_model`: False
377
+ - `restore_callback_states_from_checkpoint`: False
378
+ - `no_cuda`: False
379
+ - `use_cpu`: False
380
+ - `use_mps_device`: False
381
+ - `seed`: 42
382
+ - `data_seed`: None
383
+ - `jit_mode_eval`: False
384
+ - `use_ipex`: False
385
+ - `bf16`: False
386
+ - `fp16`: False
387
+ - `fp16_opt_level`: O1
388
+ - `half_precision_backend`: auto
389
+ - `bf16_full_eval`: False
390
+ - `fp16_full_eval`: False
391
+ - `tf32`: None
392
+ - `local_rank`: 0
393
+ - `ddp_backend`: None
394
+ - `tpu_num_cores`: None
395
+ - `tpu_metrics_debug`: False
396
+ - `debug`: []
397
+ - `dataloader_drop_last`: False
398
+ - `dataloader_num_workers`: 0
399
+ - `dataloader_prefetch_factor`: None
400
+ - `past_index`: -1
401
+ - `disable_tqdm`: False
402
+ - `remove_unused_columns`: True
403
+ - `label_names`: None
404
+ - `load_best_model_at_end`: False
405
+ - `ignore_data_skip`: False
406
+ - `fsdp`: []
407
+ - `fsdp_min_num_params`: 0
408
+ - `fsdp_config`: {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}
409
+ - `fsdp_transformer_layer_cls_to_wrap`: None
410
+ - `accelerator_config`: {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}
411
+ - `deepspeed`: None
412
+ - `label_smoothing_factor`: 0.0
413
+ - `optim`: adamw_torch
414
+ - `optim_args`: None
415
+ - `adafactor`: False
416
+ - `group_by_length`: False
417
+ - `length_column_name`: length
418
+ - `ddp_find_unused_parameters`: None
419
+ - `ddp_bucket_cap_mb`: None
420
+ - `ddp_broadcast_buffers`: False
421
+ - `dataloader_pin_memory`: True
422
+ - `dataloader_persistent_workers`: False
423
+ - `skip_memory_metrics`: True
424
+ - `use_legacy_prediction_loop`: False
425
+ - `push_to_hub`: False
426
+ - `resume_from_checkpoint`: None
427
+ - `hub_model_id`: None
428
+ - `hub_strategy`: every_save
429
+ - `hub_private_repo`: None
430
+ - `hub_always_push`: False
431
+ - `gradient_checkpointing`: False
432
+ - `gradient_checkpointing_kwargs`: None
433
+ - `include_inputs_for_metrics`: False
434
+ - `include_for_metrics`: []
435
+ - `eval_do_concat_batches`: True
436
+ - `fp16_backend`: auto
437
+ - `push_to_hub_model_id`: None
438
+ - `push_to_hub_organization`: None
439
+ - `mp_parameters`:
440
+ - `auto_find_batch_size`: False
441
+ - `full_determinism`: False
442
+ - `torchdynamo`: None
443
+ - `ray_scope`: last
444
+ - `ddp_timeout`: 1800
445
+ - `torch_compile`: False
446
+ - `torch_compile_backend`: None
447
+ - `torch_compile_mode`: None
448
+ - `include_tokens_per_second`: False
449
+ - `include_num_input_tokens_seen`: False
450
+ - `neftune_noise_alpha`: None
451
+ - `optim_target_modules`: None
452
+ - `batch_eval_metrics`: False
453
+ - `eval_on_start`: False
454
+ - `use_liger_kernel`: False
455
+ - `eval_use_gather_object`: False
456
+ - `average_tokens_across_devices`: False
457
+ - `prompts`: None
458
+ - `batch_sampler`: batch_sampler
459
+ - `multi_dataset_batch_sampler`: round_robin
460
+
461
+ </details>
462
+
463
+ ### Training Logs
464
+ | Epoch | Step | Training Loss |
465
+ |:------:|:----:|:-------------:|
466
+ | 1.4245 | 500 | 0.1336 |
467
+ | 2.8490 | 1000 | 0.0787 |
468
+
469
+
470
+ ### Framework Versions
471
+ - Python: 3.12.3
472
+ - Sentence Transformers: 4.1.0
473
+ - Transformers: 4.52.4
474
+ - PyTorch: 2.7.0+cu128
475
+ - Accelerate: 1.7.0
476
+ - Datasets: 3.6.0
477
+ - Tokenizers: 0.21.1
478
+
479
+ ## Citation
480
+
481
+ ### BibTeX
482
+
483
+ #### Sentence Transformers
484
+ ```bibtex
485
+ @inproceedings{reimers-2019-sentence-bert,
486
+ title = "Sentence-BERT: Sentence Embeddings using Siamese BERT-Networks",
487
+ author = "Reimers, Nils and Gurevych, Iryna",
488
+ booktitle = "Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing",
489
+ month = "11",
490
+ year = "2019",
491
+ publisher = "Association for Computational Linguistics",
492
+ url = "https://arxiv.org/abs/1908.10084",
493
+ }
494
+ ```
495
+
496
+ <!--
497
+ ## Glossary
498
+
499
+ *Clearly define terms in order to be accessible across audiences.*
500
+ -->
501
+
502
+ <!--
503
+ ## Model Card Authors
504
+
505
+ *Lists the people who create the model card, providing recognition and accountability for the detailed work that goes into its construction.*
506
+ -->
507
+
508
+ <!--
509
+ ## Model Card Contact
510
+
511
+ *Provides a way for people who have updates to the Model Card, suggestions, or questions, to contact the Model Card authors.*
512
+ -->
checkpoints/checkpoint-1053/config.json ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "BertModel"
4
+ ],
5
+ "attention_probs_dropout_prob": 0.1,
6
+ "classifier_dropout": null,
7
+ "gradient_checkpointing": false,
8
+ "hidden_act": "gelu",
9
+ "hidden_dropout_prob": 0.1,
10
+ "hidden_size": 768,
11
+ "id2label": {
12
+ "0": "LABEL_0"
13
+ },
14
+ "initializer_range": 0.02,
15
+ "intermediate_size": 3072,
16
+ "label2id": {
17
+ "LABEL_0": 0
18
+ },
19
+ "layer_norm_eps": 1e-12,
20
+ "max_position_embeddings": 512,
21
+ "model_type": "bert",
22
+ "num_attention_heads": 12,
23
+ "num_hidden_layers": 12,
24
+ "pad_token_id": 0,
25
+ "position_embedding_type": "absolute",
26
+ "torch_dtype": "float32",
27
+ "transformers_version": "4.52.4",
28
+ "type_vocab_size": 2,
29
+ "use_cache": true,
30
+ "vocab_size": 30522
31
+ }
checkpoints/checkpoint-1053/config_sentence_transformers.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "__version__": {
3
+ "sentence_transformers": "4.1.0",
4
+ "transformers": "4.52.4",
5
+ "pytorch": "2.7.0+cu128"
6
+ },
7
+ "prompts": {},
8
+ "default_prompt_name": null,
9
+ "similarity_fn_name": "cosine"
10
+ }
checkpoints/checkpoint-1053/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3c22492b93885a269f991e4912889fc64ca6c3858c1c70c987be738dcef7688
3
+ size 437951328
checkpoints/checkpoint-1053/modules.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "idx": 0,
4
+ "name": "0",
5
+ "path": "",
6
+ "type": "sentence_transformers.models.Transformer"
7
+ },
8
+ {
9
+ "idx": 1,
10
+ "name": "1",
11
+ "path": "1_Pooling",
12
+ "type": "sentence_transformers.models.Pooling"
13
+ },
14
+ {
15
+ "idx": 2,
16
+ "name": "2",
17
+ "path": "2_Normalize",
18
+ "type": "sentence_transformers.models.Normalize"
19
+ }
20
+ ]
checkpoints/checkpoint-1053/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a03e5dacb924a89a3d5bbc1745ffadfbc7eaa1842a14c2f01b9b31b9c5762c41
3
+ size 871298443
checkpoints/checkpoint-1053/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69e7c36ebc48e5ab4614ef9885ace5ca0ce2b44bf8627bdbe99df5543059ca9c
3
+ size 14645
checkpoints/checkpoint-1053/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:744864483bede6d7cdca80d8a161998b8653394b0c8e6fbcc2fd07a220b1a8d3
3
+ size 1465
checkpoints/checkpoint-1053/sentence_bert_config.json ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {
2
+ "max_seq_length": 512,
3
+ "do_lower_case": true
4
+ }
checkpoints/checkpoint-1053/special_tokens_map.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": {
3
+ "content": "[CLS]",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "mask_token": {
10
+ "content": "[MASK]",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": {
17
+ "content": "[PAD]",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "sep_token": {
24
+ "content": "[SEP]",
25
+ "lstrip": false,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ },
30
+ "unk_token": {
31
+ "content": "[UNK]",
32
+ "lstrip": false,
33
+ "normalized": false,
34
+ "rstrip": false,
35
+ "single_word": false
36
+ }
37
+ }
checkpoints/checkpoint-1053/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
checkpoints/checkpoint-1053/tokenizer_config.json ADDED
@@ -0,0 +1,58 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "[PAD]",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "100": {
12
+ "content": "[UNK]",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "101": {
20
+ "content": "[CLS]",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "102": {
28
+ "content": "[SEP]",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "103": {
36
+ "content": "[MASK]",
37
+ "lstrip": false,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ }
43
+ },
44
+ "clean_up_tokenization_spaces": true,
45
+ "cls_token": "[CLS]",
46
+ "do_basic_tokenize": true,
47
+ "do_lower_case": true,
48
+ "extra_special_tokens": {},
49
+ "mask_token": "[MASK]",
50
+ "model_max_length": 512,
51
+ "never_split": null,
52
+ "pad_token": "[PAD]",
53
+ "sep_token": "[SEP]",
54
+ "strip_accents": null,
55
+ "tokenize_chinese_chars": true,
56
+ "tokenizer_class": "BertTokenizer",
57
+ "unk_token": "[UNK]"
58
+ }
checkpoints/checkpoint-1053/trainer_state.json ADDED
@@ -0,0 +1,48 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_global_step": null,
3
+ "best_metric": null,
4
+ "best_model_checkpoint": null,
5
+ "epoch": 3.0,
6
+ "eval_steps": 0,
7
+ "global_step": 1053,
8
+ "is_hyper_param_search": false,
9
+ "is_local_process_zero": true,
10
+ "is_world_process_zero": true,
11
+ "log_history": [
12
+ {
13
+ "epoch": 1.4245014245014245,
14
+ "grad_norm": 1.1360502243041992,
15
+ "learning_rate": 1.1673728813559325e-05,
16
+ "loss": 0.1336,
17
+ "step": 500
18
+ },
19
+ {
20
+ "epoch": 2.849002849002849,
21
+ "grad_norm": 1.3151546716690063,
22
+ "learning_rate": 1.0805084745762714e-06,
23
+ "loss": 0.0787,
24
+ "step": 1000
25
+ }
26
+ ],
27
+ "logging_steps": 500,
28
+ "max_steps": 1053,
29
+ "num_input_tokens_seen": 0,
30
+ "num_train_epochs": 3,
31
+ "save_steps": 175,
32
+ "stateful_callbacks": {
33
+ "TrainerControl": {
34
+ "args": {
35
+ "should_epoch_stop": false,
36
+ "should_evaluate": false,
37
+ "should_log": false,
38
+ "should_save": true,
39
+ "should_training_stop": true
40
+ },
41
+ "attributes": {}
42
+ }
43
+ },
44
+ "total_flos": 0.0,
45
+ "train_batch_size": 16,
46
+ "trial_name": null,
47
+ "trial_params": null
48
+ }
checkpoints/checkpoint-1053/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:435635c51c00ae7c9634e1f44d69a2daae13b846b1d2e6a26d23d637a11c7e7f
3
+ size 5969
checkpoints/checkpoint-1053/vocab.txt ADDED
The diff for this file is too large to render. See raw diff
 
checkpoints/checkpoint-875/1_Pooling/config.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "word_embedding_dimension": 768,
3
+ "pooling_mode_cls_token": true,
4
+ "pooling_mode_mean_tokens": false,
5
+ "pooling_mode_max_tokens": false,
6
+ "pooling_mode_mean_sqrt_len_tokens": false,
7
+ "pooling_mode_weightedmean_tokens": false,
8
+ "pooling_mode_lasttoken": false,
9
+ "include_prompt": true
10
+ }
checkpoints/checkpoint-875/README.md ADDED
@@ -0,0 +1,511 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - sentence-transformers
4
+ - sentence-similarity
5
+ - feature-extraction
6
+ - generated_from_trainer
7
+ - dataset_size:5604
8
+ - loss:CosineSimilarityLoss
9
+ base_model: BAAI/bge-base-en-v1.5
10
+ widget:
11
+ - source_sentence: what are the powers of the virginia executive branch
12
+ sentences:
13
+ - The 49ers won five Super Bowl championships between 1981 and 1994. Four of those
14
+ came in the 1980s, and were led by Hall of Famers Joe Montana, Jerry Rice, Ronnie
15
+ Lott, Steve Young, Charles Haley, Fred Dean, and coaches Bill Walsh and George
16
+ Seifert. They have been division champions 22 times between 1970 and 2023, making
17
+ them one of the most successful teams in NFL history. The 49ers sit alone in NFL
18
+ history for most playoff wins (38), having been in the league playoffs 30 times
19
+ (29 times in the NFL and one time in the AAFC), and have also played in the most
20
+ NFC Championship games (19), hosting 11 of them, also an NFC record. The team
21
+ has set numerous notable NFL records, including most consecutive away games won
22
+ (18), most consecutive seasons leading the league in scoring (4), most consecutive
23
+ games scored (420 games from 1977 to 2004), most field goals in a season (44),
24
+ most games won in a season (18), and most touchdowns (8) and points scored (55)
25
+ in a Super Bowl. According to Forbes, the 49ers are the sixth most valuable team
26
+ in the NFL, valued at $6.8 billion as of August 2024. In June 2023, the enterprise
27
+ branch of the 49ers completed the acquisition of English soccer club Leeds United
28
+ and in May 2025, it acquired 51% of Scottish soccer club Rangers F.C.
29
+ - In 2008, Triarc purchased Wendy's, and changed its name to Wendy's/Arby's Group,
30
+ to reflect their core businesses. In January 2011, it was announced that Wendy's/Arby's
31
+ Group were looking into selling the Arby's side of the business to focus on the
32
+ Wendy's brand. It was officially announced the companies would split on January
33
+ 21, 2011. In 2009, the Wendy's/Arby's Group signed a franchise deal with the Al
34
+ Jammaz Group of Saudi Arabia to open dual-branded Wendy's/Arby's through the Middle
35
+ East with the first location opening in Dubai in the United Arab Emirates in May
36
+ 2010. The Wendy's/Arby's Group also signed a similar franchise deal in June 2010
37
+ with Tab Gida Sanayi ve Ticaret to open dual-branded restaurants in Turkey. After
38
+ the split, the former Wendy's/Arby's Group became The Wendy's Company.
39
+ - 'Executive: The Chief Executive is responsible for enforcing regional law, can
40
+ force reconsideration of legislation, and appoints Executive Council members and
41
+ principal officials. Acting with the Executive Council, the Chief Executive-in-Council
42
+ can propose new bills, issue subordinate legislation, and has authority to dissolve
43
+ the legislature. In states of emergency or public danger, the Chief Executive-in-Council
44
+ is further empowered to enact any regulation necessary to restore public order.
45
+ Legislature: The unicameral Legislative Council enacts regional law, approves
46
+ budgets, and has the power to impeach a sitting chief executive. Judiciary: The
47
+ Hong Kong Court of Final Appeal and lower courts interpret laws and overturn those
48
+ inconsistent with the Basic Law. Judges are appointed by the chief executive on
49
+ the advice of a recommendation commission. The chief executive is the head of
50
+ government and serves for a maximum of two five-year terms. The State Council
51
+ (led by the Premier of China) appoints the chief executive after nomination by
52
+ the Election Committee, which is composed of 1500 business, community, and government
53
+ leaders.'
54
+ - source_sentence: how many chromosomes does a human diploid cell have
55
+ sentences:
56
+ - The Peace of Cateau-Cambrésis in 1559 concluded the war with France, leaving Spain
57
+ at a considerable advantage. However, the government was still mired in debt,
58
+ and declared bankruptcy that year. Most of the government's revenues came from
59
+ taxes and excise duties, not imported silver and other goods. The Ottoman Empire
60
+ had long menaced the fringes of the Habsburg dominions in Austria and northwest
61
+ Africa. In response Ferdinand and Isabella had sent expeditions to North Africa,
62
+ capturing Melilla in 1497 and Oran in 1509. Charles had preferred to combat the
63
+ Ottomans through a considerably more maritime strategy, hampering Ottoman landings
64
+ on the Venetian territories in the Eastern Mediterranean. Only in response to
65
+ raids on the eastern coast of Spain did Charles personally lead attacks against
66
+ holdings in North Africa (1535). In 1560, the Ottomans battled the Spanish Navy
67
+ off the coast of Tunisia, but in 1565 Ottoman troops landing on the strategically
68
+ vital island of Malta, defended by the Knights of St. John, were defeated. The
69
+ death of Suleiman the Magnificent the following year and his succession by Selim
70
+ II emboldened Philip, who resolved to carry the war to the Ottoman homelands.
71
+ In 1571, a mixed naval expedition of Spanish, Venetian, and Papal ships led by
72
+ Charles' illegitimate son Don John of Austria annihilated the Ottoman fleet at
73
+ the Battle of Lepanto, in the largest naval battle fought in European waters since
74
+ Actium in 31 BC. The fleet included Miguel de Cervantes, future author of the
75
+ historic Spanish novel Don Quixote
76
+ - 'The 1930s were the team''s first golden era, when they improved their game through
77
+ play with more experienced teams. The Combinado del Pacífico (a squad composed
78
+ of Chilean and Peruvian footballers) toured Europe from 1933 to 1934. Starting
79
+ with Ciclista Lima in 1926, Peru''s football clubs toured Latin America with much
80
+ success. During one of these tours—Alianza Lima''s undefeated journey through
81
+ Chile in 1935—emerged the Rodillo Negro ("Black Roller"), a skillful group led
82
+ by forwards Alejandro Villanueva, Teodoro Fernández and goalkeeper Juan Valdivieso.
83
+ Sports historian Richard Witzig described these three as "a soccer triumvirate
84
+ unsurpassed in the world at that time", citing their combined innovation and effectiveness
85
+ at both ends of the field. Peru and the Rodillo Negro impressed at the 1936 Summer
86
+ Olympics, won the inaugural Bolivarian Games in 1938, and finished the decade
87
+ as South American champions. Historian David Goldblatt assessed the decline of
88
+ its previous success: "despite all the apparent preconditions for footballing
89
+ growth and success, Peruvian football disappeared". He attributes this sudden
90
+ decline to Peruvian authorities'' repression of "social, sporting and political
91
+ organisations among the urban and rural poor" during the 1940s and 1950s. Nevertheless,
92
+ Peru performed creditably at the South American Championships, placing third in
93
+ Brazil 1949 and Chile 1955, and missed qualification for the Sweden 1958 World
94
+ Cup finals, over two legs to eventual champions Brazil.'
95
+ - In 1939, at the start of World War II, Poland was partitioned between Nazi Germany
96
+ and the Soviet Union (see Molotov–Ribbentrop Pact). One-fifth of the Polish population
97
+ perished during World War II; the 3,000,000 Polish Jews murdered in the Holocaust,
98
+ who constituted 90% of Polish Jewry, made up half of all Poles killed during the
99
+ war. While the Holocaust occurred largely in German-occupied Poland, it was orchestrated
100
+ and perpetrated by the Nazis. Polish attitudes to the Holocaust varied widely,
101
+ from actively risking death in order to save Jewish lives, and passive refusal
102
+ to inform on them, to indifference, blackmail, and in extreme cases, committing
103
+ premeditated murders such as in the Jedwabne pogrom. Collaboration by non-Jewish
104
+ Polish citizens in the Holocaust was sporadic, but incidents of hostility against
105
+ Jews are well documented and have been a subject of renewed scholarly interest
106
+ during the 21st century.
107
+ - source_sentence: what is the difference between ice brent crude and wti crude
108
+ sentences:
109
+ - ==== Spring and Autumn period (722–476 BC) ====
110
+ - SpaceX has also bought and is modifying several residential properties in Boca
111
+ Chica Village, but apparently planning to leave them in residential use, about
112
+ 2 miles (3.2 km) west of the launch site. In September 2019, SpaceX extended an
113
+ offer to buy each of the houses in Boca Chica Village for three times the fair
114
+ market value along with an offer of VIP invitations to future launch events. The
115
+ 3x offer was said to be "non-negotiable." Homeowners were given two weeks for
116
+ this particular offer to remain valid. In January 2024, the Texas Parks and Wildlife
117
+ Department announced a proposal to transfer 43 acres of Boca Chica State Park
118
+ lands to SpaceX, in exchange for 477 new acres to be added to the Laguna Atascosa
119
+ National Wildlife Refuge.
120
+ - However, exclusive US control of this resource was eventually challenged, and
121
+ the Bering Sea Controversy resulted when the United States seized over 150 sealing
122
+ ships flying the British flag, based out of the coast of British Columbia. The
123
+ conflict between the United States and Britain was resolved by an arbitration
124
+ tribunal in 1893. The waters of the Bering Sea were deemed to be international
125
+ waters, contrary to the US contention that they were an internal sea. The US was
126
+ required to make a payment to Britain, and both nations were required to follow
127
+ regulations developed to preserve the resource.
128
+ - source_sentence: why is there a citgo sign in boston
129
+ sentences:
130
+ - Tucker appeared on Terri Clark's 2012 album Classic in a remake duet of her first
131
+ single "Delta Dawn". In June 2017, Tucker was featured in Rolling Stone as one
132
+ of the 100 Greatest Country Artists of All Time. After the death of former flame
133
+ Glen Campbell on August 8, 2017, Tucker released her first single since 2009,
134
+ "Forever Loving You", a song co-penned by Tennessee State Senator Rusty Crowe.
135
+ The song's release the following day, on the eve of Campbell's funeral, drew ire
136
+ and criticism being exploitative. Tucker claimed that a portion of the proceeds
137
+ will benefit the Alzheimer's Foundation of America, but the foundation stated
138
+ it was not involved in the promotion and has not received any funds. Tucker released
139
+ While I'm Livin', her first collection of original material since 2002's Tanya,
140
+ in 2019 via Fantasy Records. It was produced by Shooter Jennings and Brandi Carlile,
141
+ with Carlile brought onto the project after initially being approached for songs
142
+ by Jennings but after having professed such an admiration of Tucker and her work,
143
+ Jennings felt it necessary for her to co-produce the record alongside him. Tucker
144
+ performed "Bring My Flowers Now" at Loretta Lynn's all-star 87th birthday concert
145
+ at Nashville's Bridgestone Arena with Carlile playing piano. The album's first
146
+ single, "Hard Luck", was released on June 28, along with its accompanying music
147
+ video.
148
+ - ==== Golf ==== Numerous golf courses can be found in the city, with the most famous
149
+ being Bay Hill Club and Lodge, home to the Arnold Palmer Invitational. == Culture
150
+ ==
151
+ - The massive Islamic invasions of the mid-7th century began a long struggle between
152
+ Christianity and Islam throughout the Mediterranean Basin. The Byzantine Empire
153
+ soon lost the lands of the eastern patriarchates of Jerusalem, Alexandria and
154
+ Antioch and was reduced to that of Constantinople, the empire's capital. As a
155
+ result of Islamic domination of the Mediterranean, the Frankish state, centred
156
+ away from that sea, was able to evolve as the dominant power that shaped the Western
157
+ Europe of the Middle Ages. The battles of Toulouse and Tours halted the Islamic
158
+ advance in the West and the failed siege of Constantinople halted it in the East.
159
+ Two or three decades later, in 751, the Byzantine Empire lost to the Lombards
160
+ the city of Ravenna from which it governed the small fragments of Italy, including
161
+ Rome, that acknowledged its sovereignty. The fall of Ravenna meant that confirmation
162
+ by a no longer existent exarch was not asked for during the election in 752 of
163
+ Pope Stephen II, and that the papacy was forced to look elsewhere for a civil
164
+ power to protect it. In 754, at the urgent request of Pope Stephen, the Frankish
165
+ king Pepin the Short conquered the Lombards. He then gifted the lands of the former
166
+ exarchate to the pope, initiating the Papal States. In the 860s, Rome and the
167
+ Byzantine East were in conflict during the Photian schism, when Photius criticized
168
+ the Latin west for adding of the filioque clause, after being excommunicated by
169
+ Nicholas I. Though the schism was reconciled, unresolved issues would lead to
170
+ further division.
171
+ - source_sentence: who organized the native resistance to the british
172
+ sentences:
173
+ - === Engines === == Fifth generation (WL; 2021) ==
174
+ - '=== Unitarism === All states are unitary states, not federations or aggregates
175
+ of local governments. Local governments within them are created by and exist by
176
+ virtue of state law, and local governments within each state are subject to the
177
+ central authority of that particular state. State governments commonly delegate
178
+ some authority to local units and channel policy decisions down to them for implementation.
179
+ In a few states, local units of government are permitted a degree of home rule
180
+ over various matters. The prevailing legal theory of state preeminence over local
181
+ governments, referred to as Dillon''s Rule, holds that, A municipal corporation
182
+ possesses and can exercise the following powers and no others: First, those granted
183
+ in express words; second, those necessarily implied or necessarily incident to
184
+ the powers expressly granted; third, those absolutely essential to the declared
185
+ objects and purposes of the corporation—not simply convenient but indispensable;
186
+ fourth, any fair doubt as to the existence of power is resolved by the courts
187
+ against the corporation—against the existence of the powers. Each state defines
188
+ for itself what powers it will allow local governments. Generally, four categories
189
+ of power may be given to local jurisdictions: Structural – power to choose the
190
+ form of government, charter and enact charter revisions, Functional – power to
191
+ exercise local self-government in a broad or limited manner, Fiscal – authority
192
+ to determine revenue sources, set tax rates, borrow funds and other related financial
193
+ activities, Personnel – authority to set employment rules, remuneration rates,
194
+ employment conditions and collective bargaining. == Relationships =='
195
+ - Throughout the war, the British deported the Acadians to the Thirteen Colonies
196
+ and Europe, which the Acadian militias resisted with assistance from Mi'kmaq and
197
+ Malisteet forces. The Great Upheaval continued from 1755 to 1764. In 1756, a large
198
+ force of French, Canadians, and their Native American allies led by the Marquis
199
+ de Montcalm launched an attack against the key British post at Fort Oswego on
200
+ Lake Ontario from Fort Frontenac and forced the garrison to surrender. The following
201
+ year Montcalm with a huge force of 7,200 French and Canadian troops and 2,400
202
+ Native Americans laid siege to Fort William Henry on the southern shores of Lake
203
+ George, and after three weeks of fighting the British commander Monroe surrendered.
204
+ Montcalm gave him honorable terms to return to England and not to fight for 18
205
+ months. And yet, when the British force with civilians was three miles from the
206
+ fort, the Native American allies massacred about 1,100 of the 1,500 strong force.
207
+ pipeline_tag: sentence-similarity
208
+ library_name: sentence-transformers
209
+ ---
210
+
211
+ # SentenceTransformer based on BAAI/bge-base-en-v1.5
212
+
213
+ This is a [sentence-transformers](https://www.SBERT.net) model finetuned from [BAAI/bge-base-en-v1.5](https://huggingface.co/BAAI/bge-base-en-v1.5). It maps sentences & paragraphs to a 768-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more.
214
+
215
+ ## Model Details
216
+
217
+ ### Model Description
218
+ - **Model Type:** Sentence Transformer
219
+ - **Base model:** [BAAI/bge-base-en-v1.5](https://huggingface.co/BAAI/bge-base-en-v1.5) <!-- at revision a5beb1e3e68b9ab74eb54cfd186867f64f240e1a -->
220
+ - **Maximum Sequence Length:** 512 tokens
221
+ - **Output Dimensionality:** 768 dimensions
222
+ - **Similarity Function:** Cosine Similarity
223
+ <!-- - **Training Dataset:** Unknown -->
224
+ <!-- - **Language:** Unknown -->
225
+ <!-- - **License:** Unknown -->
226
+
227
+ ### Model Sources
228
+
229
+ - **Documentation:** [Sentence Transformers Documentation](https://sbert.net)
230
+ - **Repository:** [Sentence Transformers on GitHub](https://github.com/UKPLab/sentence-transformers)
231
+ - **Hugging Face:** [Sentence Transformers on Hugging Face](https://huggingface.co/models?library=sentence-transformers)
232
+
233
+ ### Full Model Architecture
234
+
235
+ ```
236
+ SentenceTransformer(
237
+ (0): Transformer({'max_seq_length': 512, 'do_lower_case': True}) with Transformer model: BertModel
238
+ (1): Pooling({'word_embedding_dimension': 768, 'pooling_mode_cls_token': True, 'pooling_mode_mean_tokens': False, 'pooling_mode_max_tokens': False, 'pooling_mode_mean_sqrt_len_tokens': False, 'pooling_mode_weightedmean_tokens': False, 'pooling_mode_lasttoken': False, 'include_prompt': True})
239
+ (2): Normalize()
240
+ )
241
+ ```
242
+
243
+ ## Usage
244
+
245
+ ### Direct Usage (Sentence Transformers)
246
+
247
+ First install the Sentence Transformers library:
248
+
249
+ ```bash
250
+ pip install -U sentence-transformers
251
+ ```
252
+
253
+ Then you can load this model and run inference.
254
+ ```python
255
+ from sentence_transformers import SentenceTransformer
256
+
257
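+ # Download from the 🤗 Hub ("sentence_transformers_model_id" is a placeholder; replace it with this model's Hub repository ID)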
258
+ model = SentenceTransformer("sentence_transformers_model_id")
259
+ # Run inference
260
+ sentences = [
261
+ 'who organized the native resistance to the british',
262
+ "Throughout the war, the British deported the Acadians to the Thirteen Colonies and Europe, which the Acadian militias resisted with assistance from Mi'kmaq and Malisteet forces. The Great Upheaval continued from 1755 to 1764. In 1756, a large force of French, Canadians, and their Native American allies led by the Marquis de Montcalm launched an attack against the key British post at Fort Oswego on Lake Ontario from Fort Frontenac and forced the garrison to surrender. The following year Montcalm with a huge force of 7,200 French and Canadian troops and 2,400 Native Americans laid siege to Fort William Henry on the southern shores of Lake George, and after three weeks of fighting the British commander Monroe surrendered. Montcalm gave him honorable terms to return to England and not to fight for 18 months. And yet, when the British force with civilians was three miles from the fort, the Native American allies massacred about 1,100 of the 1,500 strong force.",
263
+ "=== Unitarism === All states are unitary states, not federations or aggregates of local governments. Local governments within them are created by and exist by virtue of state law, and local governments within each state are subject to the central authority of that particular state. State governments commonly delegate some authority to local units and channel policy decisions down to them for implementation. In a few states, local units of government are permitted a degree of home rule over various matters. The prevailing legal theory of state preeminence over local governments, referred to as Dillon's Rule, holds that, A municipal corporation possesses and can exercise the following powers and no others: First, those granted in express words; second, those necessarily implied or necessarily incident to the powers expressly granted; third, those absolutely essential to the declared objects and purposes of the corporation—not simply convenient but indispensable; fourth, any fair doubt as to the existence of power is resolved by the courts against the corporation—against the existence of the powers. Each state defines for itself what powers it will allow local governments. Generally, four categories of power may be given to local jurisdictions: Structural – power to choose the form of government, charter and enact charter revisions, Functional – power to exercise local self-government in a broad or limited manner, Fiscal – authority to determine revenue sources, set tax rates, borrow funds and other related financial activities, Personnel – authority to set employment rules, remuneration rates, employment conditions and collective bargaining. == Relationships ==",
264
+ ]
265
+ embeddings = model.encode(sentences)
266
+ print(embeddings.shape)
267
+ # (3, 768)
268
+
269
+ # Get the similarity scores for the embeddings
270
+ similarities = model.similarity(embeddings, embeddings)
271
+ print(similarities.shape)
272
+ # torch.Size([3, 3])
273
+ ```
274
+
275
+ <!--
276
+ ### Direct Usage (Transformers)
277
+
278
+ <details><summary>Click to see the direct usage in Transformers</summary>
279
+
280
+ </details>
281
+ -->
282
+
283
+ <!--
284
+ ### Downstream Usage (Sentence Transformers)
285
+
286
+ You can finetune this model on your own dataset.
287
+
288
+ <details><summary>Click to expand</summary>
289
+
290
+ </details>
291
+ -->
292
+
293
+ <!--
294
+ ### Out-of-Scope Use
295
+
296
+ *List how the model may foreseeably be misused and address what users ought not to do with the model.*
297
+ -->
298
+
299
+ <!--
300
+ ## Bias, Risks and Limitations
301
+
302
+ *What are the known or foreseeable issues stemming from this model? You could also flag here known failure cases or weaknesses of the model.*
303
+ -->
304
+
305
+ <!--
306
+ ### Recommendations
307
+
308
+ *What are recommendations with respect to the foreseeable issues? For example, filtering explicit content.*
309
+ -->
310
+
311
+ ## Training Details
312
+
313
+ ### Training Dataset
314
+
315
+ #### Unnamed Dataset
316
+
317
+ * Size: 5,604 training samples
318
+ * Columns: <code>sentence_0</code>, <code>sentence_1</code>, and <code>label</code>
319
+ * Approximate statistics based on the first 1000 samples:
320
+ | | sentence_0 | sentence_1 | label |
321
+ |:--------|:-----------------------------------------------------------------------------------|:------------------------------------------------------------------------------------|:---------------------------------------------------------------|
322
+ | type | string | string | float |
323
+ | details | <ul><li>min: 10 tokens</li><li>mean: 11.84 tokens</li><li>max: 25 tokens</li></ul> | <ul><li>min: 8 tokens</li><li>mean: 218.19 tokens</li><li>max: 322 tokens</li></ul> | <ul><li>min: 0.0</li><li>mean: 0.37</li><li>max: 1.0</li></ul> |
324
+ * Samples:
325
+ | sentence_0 | sentence_1 | label |
326
+ |:-----------------------------------------------------------------------------------------------------------|:---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|:-----------------|
327
+ | <code>who played guitar solo on reeling in the years</code> | <code>Eric Patrick Clapton (born 30 March 1945) is an English rock and blues guitarist, singer, and songwriter. He is regarded as one of the most successful and influential guitarists in rock music. Clapton ranked second in Rolling Stone's list of the "100 Greatest Guitarists of All Time" and fourth in Gibson's "Top 50 Guitarists of All Time". He was named number five in Time magazine's list of "The 10 Best Electric Guitar Players" in 2009. After playing in a number of different local bands, Clapton joined the Yardbirds from 1963 to 1965, and John Mayall & the Bluesbreakers from 1965 to 1966. After leaving Mayall, he formed the power trio Cream with drummer Ginger Baker and bassist/vocalist Jack Bruce, in which Clapton played sustained blues improvisations and "arty, blues-based psychedelic pop". After four successful albums, Cream broke up in November 1968. Clapton then formed the blues rock band Blind Faith with Baker, Steve Winwood, and Ric Grech, recording one album and performing on one...</code> | <code>1.0</code> |
328
+ | <code>how a population of wolves may have undergone speciation to form the first population of dogs</code> | <code>Geological evidence suggests that approximately 3 million years ago, South America became connected to North America when the Bolivar Trough marine barrier disappeared and the Panamanian land bridge formed. The joining of these two land masses led to the Great American Interchange, in which biota from both continents expanded their ranges. The first species known to have made the northward migration was Pliometanastes, a fossil ground sloth roughly the size of a modern black bear. Migrations to the Southern Hemisphere were undertaken by several North American mammalian carnivores. Fewer species migrated in the opposite direction from south to north. The result of the expansion of a North American fauna was a mass extinction in which hundreds of species disappeared in a relatively short time. About 60% of present-day South American mammals have evolved from North American species. Some South American species were able to adapt and spread into North America. Apart from Pliometanastes, du...</code> | <code>1.0</code> |
329
+ | <code>who is credited with promoting the use of factor analysis and why</code> | <code>The enemies of President Davis proposed that the Confederacy "died of Davis". He was unfavorably compared to George Washington by critics such as Edward Alfred Pollard, editor of the most influential newspaper in the Confederacy, the Daily Richmond Examiner. Beyond the early honeymoon period, Davis was never popular. Ellis Merton Coulter, viewed by historians as a Confederate apologist, argues that Davis was unable to mobilize Confederate nationalism in support of his government effectively, and especially failed to appeal to the small farmers who made up the bulk of the population. Davis failed to build a network of supporters who would speak up when he came under criticism, and he repeatedly alienated governors and other state-based leaders by demanding centralized control of the war effort.</code> | <code>0.0</code> |
330
+ * Loss: [<code>CosineSimilarityLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#cosinesimilarityloss) with these parameters:
331
+ ```json
332
+ {
333
+ "loss_fct": "torch.nn.modules.loss.MSELoss"
334
+ }
335
+ ```
336
+
337
+ ### Training Hyperparameters
338
+ #### Non-Default Hyperparameters
339
+
340
+ - `per_device_train_batch_size`: 16
341
+ - `per_device_eval_batch_size`: 16
342
+ - `multi_dataset_batch_sampler`: round_robin
343
+
344
+ #### All Hyperparameters
345
+ <details><summary>Click to expand</summary>
346
+
347
+ - `overwrite_output_dir`: False
348
+ - `do_predict`: False
349
+ - `eval_strategy`: no
350
+ - `prediction_loss_only`: True
351
+ - `per_device_train_batch_size`: 16
352
+ - `per_device_eval_batch_size`: 16
353
+ - `per_gpu_train_batch_size`: None
354
+ - `per_gpu_eval_batch_size`: None
355
+ - `gradient_accumulation_steps`: 1
356
+ - `eval_accumulation_steps`: None
357
+ - `torch_empty_cache_steps`: None
358
+ - `learning_rate`: 5e-05
359
+ - `weight_decay`: 0.0
360
+ - `adam_beta1`: 0.9
361
+ - `adam_beta2`: 0.999
362
+ - `adam_epsilon`: 1e-08
363
+ - `max_grad_norm`: 1
364
+ - `num_train_epochs`: 3
365
+ - `max_steps`: -1
366
+ - `lr_scheduler_type`: linear
367
+ - `lr_scheduler_kwargs`: {}
368
+ - `warmup_ratio`: 0.0
369
+ - `warmup_steps`: 0
370
+ - `log_level`: passive
371
+ - `log_level_replica`: warning
372
+ - `log_on_each_node`: True
373
+ - `logging_nan_inf_filter`: True
374
+ - `save_safetensors`: True
375
+ - `save_on_each_node`: False
376
+ - `save_only_model`: False
377
+ - `restore_callback_states_from_checkpoint`: False
378
+ - `no_cuda`: False
379
+ - `use_cpu`: False
380
+ - `use_mps_device`: False
381
+ - `seed`: 42
382
+ - `data_seed`: None
383
+ - `jit_mode_eval`: False
384
+ - `use_ipex`: False
385
+ - `bf16`: False
386
+ - `fp16`: False
387
+ - `fp16_opt_level`: O1
388
+ - `half_precision_backend`: auto
389
+ - `bf16_full_eval`: False
390
+ - `fp16_full_eval`: False
391
+ - `tf32`: None
392
+ - `local_rank`: 0
393
+ - `ddp_backend`: None
394
+ - `tpu_num_cores`: None
395
+ - `tpu_metrics_debug`: False
396
+ - `debug`: []
397
+ - `dataloader_drop_last`: False
398
+ - `dataloader_num_workers`: 0
399
+ - `dataloader_prefetch_factor`: None
400
+ - `past_index`: -1
401
+ - `disable_tqdm`: False
402
+ - `remove_unused_columns`: True
403
+ - `label_names`: None
404
+ - `load_best_model_at_end`: False
405
+ - `ignore_data_skip`: False
406
+ - `fsdp`: []
407
+ - `fsdp_min_num_params`: 0
408
+ - `fsdp_config`: {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}
409
+ - `fsdp_transformer_layer_cls_to_wrap`: None
410
+ - `accelerator_config`: {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}
411
+ - `deepspeed`: None
412
+ - `label_smoothing_factor`: 0.0
413
+ - `optim`: adamw_torch
414
+ - `optim_args`: None
415
+ - `adafactor`: False
416
+ - `group_by_length`: False
417
+ - `length_column_name`: length
418
+ - `ddp_find_unused_parameters`: None
419
+ - `ddp_bucket_cap_mb`: None
420
+ - `ddp_broadcast_buffers`: False
421
+ - `dataloader_pin_memory`: True
422
+ - `dataloader_persistent_workers`: False
423
+ - `skip_memory_metrics`: True
424
+ - `use_legacy_prediction_loop`: False
425
+ - `push_to_hub`: False
426
+ - `resume_from_checkpoint`: None
427
+ - `hub_model_id`: None
428
+ - `hub_strategy`: every_save
429
+ - `hub_private_repo`: None
430
+ - `hub_always_push`: False
431
+ - `gradient_checkpointing`: False
432
+ - `gradient_checkpointing_kwargs`: None
433
+ - `include_inputs_for_metrics`: False
434
+ - `include_for_metrics`: []
435
+ - `eval_do_concat_batches`: True
436
+ - `fp16_backend`: auto
437
+ - `push_to_hub_model_id`: None
438
+ - `push_to_hub_organization`: None
439
+ - `mp_parameters`:
440
+ - `auto_find_batch_size`: False
441
+ - `full_determinism`: False
442
+ - `torchdynamo`: None
443
+ - `ray_scope`: last
444
+ - `ddp_timeout`: 1800
445
+ - `torch_compile`: False
446
+ - `torch_compile_backend`: None
447
+ - `torch_compile_mode`: None
448
+ - `include_tokens_per_second`: False
449
+ - `include_num_input_tokens_seen`: False
450
+ - `neftune_noise_alpha`: None
451
+ - `optim_target_modules`: None
452
+ - `batch_eval_metrics`: False
453
+ - `eval_on_start`: False
454
+ - `use_liger_kernel`: False
455
+ - `eval_use_gather_object`: False
456
+ - `average_tokens_across_devices`: False
457
+ - `prompts`: None
458
+ - `batch_sampler`: batch_sampler
459
+ - `multi_dataset_batch_sampler`: round_robin
460
+
461
+ </details>
462
+
463
+ ### Training Logs
464
+ | Epoch | Step | Training Loss |
465
+ |:------:|:----:|:-------------:|
466
+ | 1.4245 | 500 | 0.1336 |
467
+
468
+
469
+ ### Framework Versions
470
+ - Python: 3.12.3
471
+ - Sentence Transformers: 4.1.0
472
+ - Transformers: 4.52.4
473
+ - PyTorch: 2.7.0+cu128
474
+ - Accelerate: 1.7.0
475
+ - Datasets: 3.6.0
476
+ - Tokenizers: 0.21.1
477
+
478
+ ## Citation
479
+
480
+ ### BibTeX
481
+
482
+ #### Sentence Transformers
483
+ ```bibtex
484
+ @inproceedings{reimers-2019-sentence-bert,
485
+ title = "Sentence-BERT: Sentence Embeddings using Siamese BERT-Networks",
486
+ author = "Reimers, Nils and Gurevych, Iryna",
487
+ booktitle = "Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing",
488
+ month = "11",
489
+ year = "2019",
490
+ publisher = "Association for Computational Linguistics",
491
+ url = "https://arxiv.org/abs/1908.10084",
492
+ }
493
+ ```
494
+
495
+ <!--
496
+ ## Glossary
497
+
498
+ *Clearly define terms in order to be accessible across audiences.*
499
+ -->
500
+
501
+ <!--
502
+ ## Model Card Authors
503
+
504
+ *Lists the people who create the model card, providing recognition and accountability for the detailed work that goes into its construction.*
505
+ -->
506
+
507
+ <!--
508
+ ## Model Card Contact
509
+
510
+ *Provides a way for people who have updates to the Model Card, suggestions, or questions, to contact the Model Card authors.*
511
+ -->
checkpoints/checkpoint-875/config.json ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "BertModel"
4
+ ],
5
+ "attention_probs_dropout_prob": 0.1,
6
+ "classifier_dropout": null,
7
+ "gradient_checkpointing": false,
8
+ "hidden_act": "gelu",
9
+ "hidden_dropout_prob": 0.1,
10
+ "hidden_size": 768,
11
+ "id2label": {
12
+ "0": "LABEL_0"
13
+ },
14
+ "initializer_range": 0.02,
15
+ "intermediate_size": 3072,
16
+ "label2id": {
17
+ "LABEL_0": 0
18
+ },
19
+ "layer_norm_eps": 1e-12,
20
+ "max_position_embeddings": 512,
21
+ "model_type": "bert",
22
+ "num_attention_heads": 12,
23
+ "num_hidden_layers": 12,
24
+ "pad_token_id": 0,
25
+ "position_embedding_type": "absolute",
26
+ "torch_dtype": "float32",
27
+ "transformers_version": "4.52.4",
28
+ "type_vocab_size": 2,
29
+ "use_cache": true,
30
+ "vocab_size": 30522
31
+ }
checkpoints/checkpoint-875/config_sentence_transformers.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "__version__": {
3
+ "sentence_transformers": "4.1.0",
4
+ "transformers": "4.52.4",
5
+ "pytorch": "2.7.0+cu128"
6
+ },
7
+ "prompts": {},
8
+ "default_prompt_name": null,
9
+ "similarity_fn_name": "cosine"
10
+ }
checkpoints/checkpoint-875/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03748a0a3c686eca813a869f8c058104e3ebc60afe181cf1f84ce350b19700c3
3
+ size 437951328
checkpoints/checkpoint-875/modules.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "idx": 0,
4
+ "name": "0",
5
+ "path": "",
6
+ "type": "sentence_transformers.models.Transformer"
7
+ },
8
+ {
9
+ "idx": 1,
10
+ "name": "1",
11
+ "path": "1_Pooling",
12
+ "type": "sentence_transformers.models.Pooling"
13
+ },
14
+ {
15
+ "idx": 2,
16
+ "name": "2",
17
+ "path": "2_Normalize",
18
+ "type": "sentence_transformers.models.Normalize"
19
+ }
20
+ ]
checkpoints/checkpoint-875/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32c4db7c16f83a330ca3fb70c99ff336f6fb949322d617573d8f6b386dfab6fe
3
+ size 871298443
checkpoints/checkpoint-875/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dab8f58abd1458a3a02165ce5c02b8ea6d425be95636530c1481c4b6a088bf15
3
+ size 14645
checkpoints/checkpoint-875/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d3b5728b1dd51f6dbcb263d93e234d70c8999325b78869b893d0a4f6057dd5eb
3
+ size 1465
checkpoints/checkpoint-875/sentence_bert_config.json ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {
2
+ "max_seq_length": 512,
3
+ "do_lower_case": true
4
+ }
checkpoints/checkpoint-875/special_tokens_map.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": {
3
+ "content": "[CLS]",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "mask_token": {
10
+ "content": "[MASK]",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": {
17
+ "content": "[PAD]",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "sep_token": {
24
+ "content": "[SEP]",
25
+ "lstrip": false,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ },
30
+ "unk_token": {
31
+ "content": "[UNK]",
32
+ "lstrip": false,
33
+ "normalized": false,
34
+ "rstrip": false,
35
+ "single_word": false
36
+ }
37
+ }
checkpoints/checkpoint-875/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
checkpoints/checkpoint-875/tokenizer_config.json ADDED
@@ -0,0 +1,58 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "[PAD]",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "100": {
12
+ "content": "[UNK]",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "101": {
20
+ "content": "[CLS]",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "102": {
28
+ "content": "[SEP]",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "103": {
36
+ "content": "[MASK]",
37
+ "lstrip": false,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ }
43
+ },
44
+ "clean_up_tokenization_spaces": true,
45
+ "cls_token": "[CLS]",
46
+ "do_basic_tokenize": true,
47
+ "do_lower_case": true,
48
+ "extra_special_tokens": {},
49
+ "mask_token": "[MASK]",
50
+ "model_max_length": 512,
51
+ "never_split": null,
52
+ "pad_token": "[PAD]",
53
+ "sep_token": "[SEP]",
54
+ "strip_accents": null,
55
+ "tokenize_chinese_chars": true,
56
+ "tokenizer_class": "BertTokenizer",
57
+ "unk_token": "[UNK]"
58
+ }
checkpoints/checkpoint-875/trainer_state.json ADDED
@@ -0,0 +1,41 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_global_step": null,
3
+ "best_metric": null,
4
+ "best_model_checkpoint": null,
5
+ "epoch": 2.492877492877493,
6
+ "eval_steps": 0,
7
+ "global_step": 875,
8
+ "is_hyper_param_search": false,
9
+ "is_local_process_zero": true,
10
+ "is_world_process_zero": true,
11
+ "log_history": [
12
+ {
13
+ "epoch": 1.4245014245014245,
14
+ "grad_norm": 1.1360502243041992,
15
+ "learning_rate": 1.1673728813559325e-05,
16
+ "loss": 0.1336,
17
+ "step": 500
18
+ }
19
+ ],
20
+ "logging_steps": 500,
21
+ "max_steps": 1053,
22
+ "num_input_tokens_seen": 0,
23
+ "num_train_epochs": 3,
24
+ "save_steps": 175,
25
+ "stateful_callbacks": {
26
+ "TrainerControl": {
27
+ "args": {
28
+ "should_epoch_stop": false,
29
+ "should_evaluate": false,
30
+ "should_log": false,
31
+ "should_save": true,
32
+ "should_training_stop": false
33
+ },
34
+ "attributes": {}
35
+ }
36
+ },
37
+ "total_flos": 0.0,
38
+ "train_batch_size": 16,
39
+ "trial_name": null,
40
+ "trial_params": null
41
+ }
checkpoints/checkpoint-875/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:435635c51c00ae7c9634e1f44d69a2daae13b846b1d2e6a26d23d637a11c7e7f
3
+ size 5969
checkpoints/checkpoint-875/vocab.txt ADDED
The diff for this file is too large to render. See raw diff