Upload fine-tuned retriever model
Browse files — This view is limited to 50 files because it contains too many changes. See raw diff
- 1_Pooling/config.json +10 -0
- README.md +512 -0
- checkpoints/checkpoint-1050/1_Pooling/config.json +10 -0
- checkpoints/checkpoint-1050/README.md +512 -0
- checkpoints/checkpoint-1050/config.json +31 -0
- checkpoints/checkpoint-1050/config_sentence_transformers.json +10 -0
- checkpoints/checkpoint-1050/model.safetensors +3 -0
- checkpoints/checkpoint-1050/modules.json +20 -0
- checkpoints/checkpoint-1050/optimizer.pt +3 -0
- checkpoints/checkpoint-1050/rng_state.pth +3 -0
- checkpoints/checkpoint-1050/scheduler.pt +3 -0
- checkpoints/checkpoint-1050/sentence_bert_config.json +4 -0
- checkpoints/checkpoint-1050/special_tokens_map.json +37 -0
- checkpoints/checkpoint-1050/tokenizer.json +0 -0
- checkpoints/checkpoint-1050/tokenizer_config.json +58 -0
- checkpoints/checkpoint-1050/trainer_state.json +48 -0
- checkpoints/checkpoint-1050/training_args.bin +3 -0
- checkpoints/checkpoint-1050/vocab.txt +0 -0
- checkpoints/checkpoint-1053/1_Pooling/config.json +10 -0
- checkpoints/checkpoint-1053/README.md +512 -0
- checkpoints/checkpoint-1053/config.json +31 -0
- checkpoints/checkpoint-1053/config_sentence_transformers.json +10 -0
- checkpoints/checkpoint-1053/model.safetensors +3 -0
- checkpoints/checkpoint-1053/modules.json +20 -0
- checkpoints/checkpoint-1053/optimizer.pt +3 -0
- checkpoints/checkpoint-1053/rng_state.pth +3 -0
- checkpoints/checkpoint-1053/scheduler.pt +3 -0
- checkpoints/checkpoint-1053/sentence_bert_config.json +4 -0
- checkpoints/checkpoint-1053/special_tokens_map.json +37 -0
- checkpoints/checkpoint-1053/tokenizer.json +0 -0
- checkpoints/checkpoint-1053/tokenizer_config.json +58 -0
- checkpoints/checkpoint-1053/trainer_state.json +48 -0
- checkpoints/checkpoint-1053/training_args.bin +3 -0
- checkpoints/checkpoint-1053/vocab.txt +0 -0
- checkpoints/checkpoint-875/1_Pooling/config.json +10 -0
- checkpoints/checkpoint-875/README.md +511 -0
- checkpoints/checkpoint-875/config.json +31 -0
- checkpoints/checkpoint-875/config_sentence_transformers.json +10 -0
- checkpoints/checkpoint-875/model.safetensors +3 -0
- checkpoints/checkpoint-875/modules.json +20 -0
- checkpoints/checkpoint-875/optimizer.pt +3 -0
- checkpoints/checkpoint-875/rng_state.pth +3 -0
- checkpoints/checkpoint-875/scheduler.pt +3 -0
- checkpoints/checkpoint-875/sentence_bert_config.json +4 -0
- checkpoints/checkpoint-875/special_tokens_map.json +37 -0
- checkpoints/checkpoint-875/tokenizer.json +0 -0
- checkpoints/checkpoint-875/tokenizer_config.json +58 -0
- checkpoints/checkpoint-875/trainer_state.json +41 -0
- checkpoints/checkpoint-875/training_args.bin +3 -0
- checkpoints/checkpoint-875/vocab.txt +0 -0
1_Pooling/config.json
ADDED
|
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"word_embedding_dimension": 768,
|
| 3 |
+
"pooling_mode_cls_token": true,
|
| 4 |
+
"pooling_mode_mean_tokens": false,
|
| 5 |
+
"pooling_mode_max_tokens": false,
|
| 6 |
+
"pooling_mode_mean_sqrt_len_tokens": false,
|
| 7 |
+
"pooling_mode_weightedmean_tokens": false,
|
| 8 |
+
"pooling_mode_lasttoken": false,
|
| 9 |
+
"include_prompt": true
|
| 10 |
+
}
|
README.md
ADDED
|
@@ -0,0 +1,512 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
---
|
| 2 |
+
tags:
|
| 3 |
+
- sentence-transformers
|
| 4 |
+
- sentence-similarity
|
| 5 |
+
- feature-extraction
|
| 6 |
+
- generated_from_trainer
|
| 7 |
+
- dataset_size:5604
|
| 8 |
+
- loss:CosineSimilarityLoss
|
| 9 |
+
base_model: BAAI/bge-base-en-v1.5
|
| 10 |
+
widget:
|
| 11 |
+
- source_sentence: what are the powers of the virginia executive branch
|
| 12 |
+
sentences:
|
| 13 |
+
- The 49ers won five Super Bowl championships between 1981 and 1994. Four of those
|
| 14 |
+
came in the 1980s, and were led by Hall of Famers Joe Montana, Jerry Rice, Ronnie
|
| 15 |
+
Lott, Steve Young, Charles Haley, Fred Dean, and coaches Bill Walsh and George
|
| 16 |
+
Seifert. They have been division champions 22 times between 1970 and 2023, making
|
| 17 |
+
them one of the most successful teams in NFL history. The 49ers sit alone in NFL
|
| 18 |
+
history for most playoff wins (38), having been in the league playoffs 30 times
|
| 19 |
+
(29 times in the NFL and one time in the AAFC), and have also played in the most
|
| 20 |
+
NFC Championship games (19), hosting 11 of them, also an NFC record. The team
|
| 21 |
+
has set numerous notable NFL records, including most consecutive away games won
|
| 22 |
+
(18), most consecutive seasons leading the league in scoring (4), most consecutive
|
| 23 |
+
games scored (420 games from 1977 to 2004), most field goals in a season (44),
|
| 24 |
+
most games won in a season (18), and most touchdowns (8) and points scored (55)
|
| 25 |
+
in a Super Bowl. According to Forbes, the 49ers are the sixth most valuable team
|
| 26 |
+
in the NFL, valued at $6.8 billion as of August 2024. In June 2023, the enterprise
|
| 27 |
+
branch of the 49ers completed the acquisition of English soccer club Leeds United
|
| 28 |
+
and in May 2025, it acquired 51% of Scottish soccer club Rangers F.C.
|
| 29 |
+
- In 2008, Triarc purchased Wendy's, and changed its name to Wendy's/Arby's Group,
|
| 30 |
+
to reflect their core businesses. In January 2011, it was announced that Wendy's/Arby's
|
| 31 |
+
Group were looking into selling the Arby's side of the business to focus on the
|
| 32 |
+
Wendy's brand. It was officially announced the companies would split on January
|
| 33 |
+
21, 2011. In 2009, the Wendy's/Arby's Group signed a franchise deal with the Al
|
| 34 |
+
Jammaz Group of Saudi Arabia to open dual-branded Wendy's/Arby's through the Middle
|
| 35 |
+
East with the first location opening in Dubai in the United Arab Emirates in May
|
| 36 |
+
2010. The Wendy's/Arby's Group also signed a similar franchise deal in June 2010
|
| 37 |
+
with Tab Gida Sanayi ve Ticaret to open dual-branded restaurants in Turkey. After
|
| 38 |
+
the split, the former Wendy's/Arby's Group became The Wendy's Company.
|
| 39 |
+
- 'Executive: The Chief Executive is responsible for enforcing regional law, can
|
| 40 |
+
force reconsideration of legislation, and appoints Executive Council members and
|
| 41 |
+
principal officials. Acting with the Executive Council, the Chief Executive-in-Council
|
| 42 |
+
can propose new bills, issue subordinate legislation, and has authority to dissolve
|
| 43 |
+
the legislature. In states of emergency or public danger, the Chief Executive-in-Council
|
| 44 |
+
is further empowered to enact any regulation necessary to restore public order.
|
| 45 |
+
Legislature: The unicameral Legislative Council enacts regional law, approves
|
| 46 |
+
budgets, and has the power to impeach a sitting chief executive. Judiciary: The
|
| 47 |
+
Hong Kong Court of Final Appeal and lower courts interpret laws and overturn those
|
| 48 |
+
inconsistent with the Basic Law. Judges are appointed by the chief executive on
|
| 49 |
+
the advice of a recommendation commission. The chief executive is the head of
|
| 50 |
+
government and serves for a maximum of two five-year terms. The State Council
|
| 51 |
+
(led by the Premier of China) appoints the chief executive after nomination by
|
| 52 |
+
the Election Committee, which is composed of 1500 business, community, and government
|
| 53 |
+
leaders.'
|
| 54 |
+
- source_sentence: how many chromosomes does a human diploid cell have
|
| 55 |
+
sentences:
|
| 56 |
+
- The Peace of Cateau-Cambrésis in 1559 concluded the war with France, leaving Spain
|
| 57 |
+
at a considerable advantage. However, the government was still mired in debt,
|
| 58 |
+
and declared bankruptcy that year. Most of the government's revenues came from
|
| 59 |
+
taxes and excise duties, not imported silver and other goods. The Ottoman Empire
|
| 60 |
+
had long menaced the fringes of the Habsburg dominions in Austria and northwest
|
| 61 |
+
Africa. In response Ferdinand and Isabella had sent expeditions to North Africa,
|
| 62 |
+
capturing Melilla in 1497 and Oran in 1509. Charles had preferred to combat the
|
| 63 |
+
Ottomans through a considerably more maritime strategy, hampering Ottoman landings
|
| 64 |
+
on the Venetian territories in the Eastern Mediterranean. Only in response to
|
| 65 |
+
raids on the eastern coast of Spain did Charles personally lead attacks against
|
| 66 |
+
holdings in North Africa (1535). In 1560, the Ottomans battled the Spanish Navy
|
| 67 |
+
off the coast of Tunisia, but in 1565 Ottoman troops landing on the strategically
|
| 68 |
+
vital island of Malta, defended by the Knights of St. John, were defeated. The
|
| 69 |
+
death of Suleiman the Magnificent the following year and his succession by Selim
|
| 70 |
+
II emboldened Philip, who resolved to carry the war to the Ottoman homelands.
|
| 71 |
+
In 1571, a mixed naval expedition of Spanish, Venetian, and Papal ships led by
|
| 72 |
+
Charles' illegitimate son Don John of Austria annihilated the Ottoman fleet at
|
| 73 |
+
the Battle of Lepanto, in the largest naval battle fought in European waters since
|
| 74 |
+
Actium in 31 BC. The fleet included Miguel de Cervantes, future author of the
|
| 75 |
+
historic Spanish novel Don Quixote
|
| 76 |
+
- 'The 1930s were the team''s first golden era, when they improved their game through
|
| 77 |
+
play with more experienced teams. The Combinado del Pacífico (a squad composed
|
| 78 |
+
of Chilean and Peruvian footballers) toured Europe from 1933 to 1934. Starting
|
| 79 |
+
with Ciclista Lima in 1926, Peru''s football clubs toured Latin America with much
|
| 80 |
+
success. During one of these tours—Alianza Lima''s undefeated journey through
|
| 81 |
+
Chile in 1935—emerged the Rodillo Negro ("Black Roller"), a skillful group led
|
| 82 |
+
by forwards Alejandro Villanueva, Teodoro Fernández and goalkeeper Juan Valdivieso.
|
| 83 |
+
Sports historian Richard Witzig described these three as "a soccer triumvirate
|
| 84 |
+
unsurpassed in the world at that time", citing their combined innovation and effectiveness
|
| 85 |
+
at both ends of the field. Peru and the Rodillo Negro impressed at the 1936 Summer
|
| 86 |
+
Olympics, won the inaugural Bolivarian Games in 1938, and finished the decade
|
| 87 |
+
as South American champions. Historian David Goldblatt assessed the decline of
|
| 88 |
+
its previous success: "despite all the apparent preconditions for footballing
|
| 89 |
+
growth and success, Peruvian football disappeared". He attributes this sudden
|
| 90 |
+
decline to Peruvian authorities'' repression of "social, sporting and political
|
| 91 |
+
organisations among the urban and rural poor" during the 1940s and 1950s. Nevertheless,
|
| 92 |
+
Peru performed creditably at the South American Championships, placing third in
|
| 93 |
+
Brazil 1949 and Chile 1955, and missed qualification for the Sweden 1958 World
|
| 94 |
+
Cup finals, over two legs to eventual champions Brazil.'
|
| 95 |
+
- In 1939, at the start of World War II, Poland was partitioned between Nazi Germany
|
| 96 |
+
and the Soviet Union (see Molotov–Ribbentrop Pact). One-fifth of the Polish population
|
| 97 |
+
perished during World War II; the 3,000,000 Polish Jews murdered in the Holocaust,
|
| 98 |
+
who constituted 90% of Polish Jewry, made up half of all Poles killed during the
|
| 99 |
+
war. While the Holocaust occurred largely in German-occupied Poland, it was orchestrated
|
| 100 |
+
and perpetrated by the Nazis. Polish attitudes to the Holocaust varied widely,
|
| 101 |
+
from actively risking death in order to save Jewish lives, and passive refusal
|
| 102 |
+
to inform on them, to indifference, blackmail, and in extreme cases, committing
|
| 103 |
+
premeditated murders such as in the Jedwabne pogrom. Collaboration by non-Jewish
|
| 104 |
+
Polish citizens in the Holocaust was sporadic, but incidents of hostility against
|
| 105 |
+
Jews are well documented and have been a subject of renewed scholarly interest
|
| 106 |
+
during the 21st century.
|
| 107 |
+
- source_sentence: what is the difference between ice brent crude and wti crude
|
| 108 |
+
sentences:
|
| 109 |
+
- ==== Spring and Autumn period (722–476 BC) ====
|
| 110 |
+
- SpaceX has also bought and is modifying several residential properties in Boca
|
| 111 |
+
Chica Village, but apparently planning to leave them in residential use, about
|
| 112 |
+
2 miles (3.2 km) west of the launch site. In September 2019, SpaceX extended an
|
| 113 |
+
offer to buy each of the houses in Boca Chica Village for three times the fair
|
| 114 |
+
market value along with an offer of VIP invitations to future launch events. The
|
| 115 |
+
3x offer was said to be "non-negotiable." Homeowners were given two weeks for
|
| 116 |
+
this particular offer to remain valid. In January 2024, the Texas Parks and Wildlife
|
| 117 |
+
Department announced a proposal to transfer 43 acres of Boca Chica State Park
|
| 118 |
+
lands to SpaceX, in exchange for 477 new acres to be added to the Laguna Atascosa
|
| 119 |
+
National Wildlife Refuge.
|
| 120 |
+
- However, exclusive US control of this resource was eventually challenged, and
|
| 121 |
+
the Bering Sea Controversy resulted when the United States seized over 150 sealing
|
| 122 |
+
ships flying the British flag, based out of the coast of British Columbia. The
|
| 123 |
+
conflict between the United States and Britain was resolved by an arbitration
|
| 124 |
+
tribunal in 1893. The waters of the Bering Sea were deemed to be international
|
| 125 |
+
waters, contrary to the US contention that they were an internal sea. The US was
|
| 126 |
+
required to make a payment to Britain, and both nations were required to follow
|
| 127 |
+
regulations developed to preserve the resource.
|
| 128 |
+
- source_sentence: why is there a citgo sign in boston
|
| 129 |
+
sentences:
|
| 130 |
+
- Tucker appeared on Terri Clark's 2012 album Classic in a remake duet of her first
|
| 131 |
+
single "Delta Dawn". In June 2017, Tucker was featured in Rolling Stone as one
|
| 132 |
+
of the 100 Greatest Country Artists of All Time. After the death of former flame
|
| 133 |
+
Glen Campbell on August 8, 2017, Tucker released her first single since 2009,
|
| 134 |
+
"Forever Loving You", a song co-penned by Tennessee State Senator Rusty Crowe.
|
| 135 |
+
The song's release the following day, on the eve of Campbell's funeral, drew ire
|
| 136 |
+
and criticism being exploitative. Tucker claimed that a portion of the proceeds
|
| 137 |
+
will benefit the Alzheimer's Foundation of America, but the foundation stated
|
| 138 |
+
it was not involved in the promotion and has not received any funds. Tucker released
|
| 139 |
+
While I'm Livin', her first collection of original material since 2002's Tanya,
|
| 140 |
+
in 2019 via Fantasy Records. It was produced by Shooter Jennings and Brandi Carlile,
|
| 141 |
+
with Carlile brought onto the project after initially being approached for songs
|
| 142 |
+
by Jennings but after having professed such an admiration of Tucker and her work,
|
| 143 |
+
Jennings felt it necessary for her to co-produce the record alongside him. Tucker
|
| 144 |
+
performed "Bring My Flowers Now" at Loretta Lynn's all-star 87th birthday concert
|
| 145 |
+
at Nashville's Bridgestone Arena with Carlile playing piano. The album's first
|
| 146 |
+
single, "Hard Luck", was released on June 28, along with its accompanying music
|
| 147 |
+
video.
|
| 148 |
+
- ==== Golf ==== Numerous golf courses can be found in the city, with the most famous
|
| 149 |
+
being Bay Hill Club and Lodge, home to the Arnold Palmer Invitational. == Culture
|
| 150 |
+
==
|
| 151 |
+
- The massive Islamic invasions of the mid-7th century began a long struggle between
|
| 152 |
+
Christianity and Islam throughout the Mediterranean Basin. The Byzantine Empire
|
| 153 |
+
soon lost the lands of the eastern patriarchates of Jerusalem, Alexandria and
|
| 154 |
+
Antioch and was reduced to that of Constantinople, the empire's capital. As a
|
| 155 |
+
result of Islamic domination of the Mediterranean, the Frankish state, centred
|
| 156 |
+
away from that sea, was able to evolve as the dominant power that shaped the Western
|
| 157 |
+
Europe of the Middle Ages. The battles of Toulouse and Tours halted the Islamic
|
| 158 |
+
advance in the West and the failed siege of Constantinople halted it in the East.
|
| 159 |
+
Two or three decades later, in 751, the Byzantine Empire lost to the Lombards
|
| 160 |
+
the city of Ravenna from which it governed the small fragments of Italy, including
|
| 161 |
+
Rome, that acknowledged its sovereignty. The fall of Ravenna meant that confirmation
|
| 162 |
+
by a no longer existent exarch was not asked for during the election in 752 of
|
| 163 |
+
Pope Stephen II, and that the papacy was forced to look elsewhere for a civil
|
| 164 |
+
power to protect it. In 754, at the urgent request of Pope Stephen, the Frankish
|
| 165 |
+
king Pepin the Short conquered the Lombards. He then gifted the lands of the former
|
| 166 |
+
exarchate to the pope, initiating the Papal States. In the 860s, Rome and the
|
| 167 |
+
Byzantine East were in conflict during the Photian schism, when Photius criticized
|
| 168 |
+
the Latin west for adding of the filioque clause, after being excommunicated by
|
| 169 |
+
Nicholas I. Though the schism was reconciled, unresolved issues would lead to
|
| 170 |
+
further division.
|
| 171 |
+
- source_sentence: who organized the native resistance to the british
|
| 172 |
+
sentences:
|
| 173 |
+
- === Engines === == Fifth generation (WL; 2021) ==
|
| 174 |
+
- '=== Unitarism === All states are unitary states, not federations or aggregates
|
| 175 |
+
of local governments. Local governments within them are created by and exist by
|
| 176 |
+
virtue of state law, and local governments within each state are subject to the
|
| 177 |
+
central authority of that particular state. State governments commonly delegate
|
| 178 |
+
some authority to local units and channel policy decisions down to them for implementation.
|
| 179 |
+
In a few states, local units of government are permitted a degree of home rule
|
| 180 |
+
over various matters. The prevailing legal theory of state preeminence over local
|
| 181 |
+
governments, referred to as Dillon''s Rule, holds that, A municipal corporation
|
| 182 |
+
possesses and can exercise the following powers and no others: First, those granted
|
| 183 |
+
in express words; second, those necessarily implied or necessarily incident to
|
| 184 |
+
the powers expressly granted; third, those absolutely essential to the declared
|
| 185 |
+
objects and purposes of the corporation—not simply convenient but indispensable;
|
| 186 |
+
fourth, any fair doubt as to the existence of power is resolved by the courts
|
| 187 |
+
against the corporation—against the existence of the powers. Each state defines
|
| 188 |
+
for itself what powers it will allow local governments. Generally, four categories
|
| 189 |
+
of power may be given to local jurisdictions: Structural – power to choose the
|
| 190 |
+
form of government, charter and enact charter revisions, Functional – power to
|
| 191 |
+
exercise local self-government in a broad or limited manner, Fiscal – authority
|
| 192 |
+
to determine revenue sources, set tax rates, borrow funds and other related financial
|
| 193 |
+
activities, Personnel – authority to set employment rules, remuneration rates,
|
| 194 |
+
employment conditions and collective bargaining. == Relationships =='
|
| 195 |
+
- Throughout the war, the British deported the Acadians to the Thirteen Colonies
|
| 196 |
+
and Europe, which the Acadian militias resisted with assistance from Mi'kmaq and
|
| 197 |
+
Malisteet forces. The Great Upheaval continued from 1755 to 1764. In 1756, a large
|
| 198 |
+
force of French, Canadians, and their Native American allies led by the Marquis
|
| 199 |
+
de Montcalm launched an attack against the key British post at Fort Oswego on
|
| 200 |
+
Lake Ontario from Fort Frontenac and forced the garrison to surrender. The following
|
| 201 |
+
year Montcalm with a huge force of 7,200 French and Canadian troops and 2,400
|
| 202 |
+
Native Americans laid siege to Fort William Henry on the southern shores of Lake
|
| 203 |
+
George, and after three weeks of fighting the British commander Monroe surrendered.
|
| 204 |
+
Montcalm gave him honorable terms to return to England and not to fight for 18
|
| 205 |
+
months. And yet, when the British force with civilians was three miles from the
|
| 206 |
+
fort, the Native American allies massacred about 1,100 of the 1,500 strong force.
|
| 207 |
+
pipeline_tag: sentence-similarity
|
| 208 |
+
library_name: sentence-transformers
|
| 209 |
+
---
|
| 210 |
+
|
| 211 |
+
# SentenceTransformer based on BAAI/bge-base-en-v1.5
|
| 212 |
+
|
| 213 |
+
This is a [sentence-transformers](https://www.SBERT.net) model fine-tuned from [BAAI/bge-base-en-v1.5](https://huggingface.co/BAAI/bge-base-en-v1.5). It maps sentences & paragraphs to a 768-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more.
|
| 214 |
+
|
| 215 |
+
## Model Details
|
| 216 |
+
|
| 217 |
+
### Model Description
|
| 218 |
+
- **Model Type:** Sentence Transformer
|
| 219 |
+
- **Base model:** [BAAI/bge-base-en-v1.5](https://huggingface.co/BAAI/bge-base-en-v1.5) <!-- at revision a5beb1e3e68b9ab74eb54cfd186867f64f240e1a -->
|
| 220 |
+
- **Maximum Sequence Length:** 512 tokens
|
| 221 |
+
- **Output Dimensionality:** 768 dimensions
|
| 222 |
+
- **Similarity Function:** Cosine Similarity
|
| 223 |
+
<!-- - **Training Dataset:** Unknown -->
|
| 224 |
+
<!-- - **Language:** Unknown -->
|
| 225 |
+
<!-- - **License:** Unknown -->
|
| 226 |
+
|
| 227 |
+
### Model Sources
|
| 228 |
+
|
| 229 |
+
- **Documentation:** [Sentence Transformers Documentation](https://sbert.net)
|
| 230 |
+
- **Repository:** [Sentence Transformers on GitHub](https://github.com/UKPLab/sentence-transformers)
|
| 231 |
+
- **Hugging Face:** [Sentence Transformers on Hugging Face](https://huggingface.co/models?library=sentence-transformers)
|
| 232 |
+
|
| 233 |
+
### Full Model Architecture
|
| 234 |
+
|
| 235 |
+
```
|
| 236 |
+
SentenceTransformer(
|
| 237 |
+
(0): Transformer({'max_seq_length': 512, 'do_lower_case': True}) with Transformer model: BertModel
|
| 238 |
+
(1): Pooling({'word_embedding_dimension': 768, 'pooling_mode_cls_token': True, 'pooling_mode_mean_tokens': False, 'pooling_mode_max_tokens': False, 'pooling_mode_mean_sqrt_len_tokens': False, 'pooling_mode_weightedmean_tokens': False, 'pooling_mode_lasttoken': False, 'include_prompt': True})
|
| 239 |
+
(2): Normalize()
|
| 240 |
+
)
|
| 241 |
+
```
|
| 242 |
+
|
| 243 |
+
## Usage
|
| 244 |
+
|
| 245 |
+
### Direct Usage (Sentence Transformers)
|
| 246 |
+
|
| 247 |
+
First install the Sentence Transformers library:
|
| 248 |
+
|
| 249 |
+
```bash
|
| 250 |
+
pip install -U sentence-transformers
|
| 251 |
+
```
|
| 252 |
+
|
| 253 |
+
Then you can load this model and run inference:
|
| 254 |
+
```python
|
| 255 |
+
from sentence_transformers import SentenceTransformer
|
| 256 |
+
|
| 257 |
+
# Download from the 🤗 Hub (replace the placeholder below with this model's actual repository ID)
|
| 258 |
+
model = SentenceTransformer("sentence_transformers_model_id")
|
| 259 |
+
# Run inference
|
| 260 |
+
sentences = [
|
| 261 |
+
'who organized the native resistance to the british',
|
| 262 |
+
"Throughout the war, the British deported the Acadians to the Thirteen Colonies and Europe, which the Acadian militias resisted with assistance from Mi'kmaq and Malisteet forces. The Great Upheaval continued from 1755 to 1764. In 1756, a large force of French, Canadians, and their Native American allies led by the Marquis de Montcalm launched an attack against the key British post at Fort Oswego on Lake Ontario from Fort Frontenac and forced the garrison to surrender. The following year Montcalm with a huge force of 7,200 French and Canadian troops and 2,400 Native Americans laid siege to Fort William Henry on the southern shores of Lake George, and after three weeks of fighting the British commander Monroe surrendered. Montcalm gave him honorable terms to return to England and not to fight for 18 months. And yet, when the British force with civilians was three miles from the fort, the Native American allies massacred about 1,100 of the 1,500 strong force.",
|
| 263 |
+
"=== Unitarism === All states are unitary states, not federations or aggregates of local governments. Local governments within them are created by and exist by virtue of state law, and local governments within each state are subject to the central authority of that particular state. State governments commonly delegate some authority to local units and channel policy decisions down to them for implementation. In a few states, local units of government are permitted a degree of home rule over various matters. The prevailing legal theory of state preeminence over local governments, referred to as Dillon's Rule, holds that, A municipal corporation possesses and can exercise the following powers and no others: First, those granted in express words; second, those necessarily implied or necessarily incident to the powers expressly granted; third, those absolutely essential to the declared objects and purposes of the corporation—not simply convenient but indispensable; fourth, any fair doubt as to the existence of power is resolved by the courts against the corporation—against the existence of the powers. Each state defines for itself what powers it will allow local governments. Generally, four categories of power may be given to local jurisdictions: Structural – power to choose the form of government, charter and enact charter revisions, Functional – power to exercise local self-government in a broad or limited manner, Fiscal – authority to determine revenue sources, set tax rates, borrow funds and other related financial activities, Personnel – authority to set employment rules, remuneration rates, employment conditions and collective bargaining. == Relationships ==",
|
| 264 |
+
]
|
| 265 |
+
embeddings = model.encode(sentences)
|
| 266 |
+
print(embeddings.shape)
|
| 267 |
+
# (3, 768)
|
| 268 |
+
|
| 269 |
+
# Get the similarity scores for the embeddings
|
| 270 |
+
similarities = model.similarity(embeddings, embeddings)
|
| 271 |
+
print(similarities.shape)
|
| 272 |
+
# torch.Size([3, 3])
|
| 273 |
+
```
|
| 274 |
+
|
| 275 |
+
<!--
|
| 276 |
+
### Direct Usage (Transformers)
|
| 277 |
+
|
| 278 |
+
<details><summary>Click to see the direct usage in Transformers</summary>
|
| 279 |
+
|
| 280 |
+
</details>
|
| 281 |
+
-->
|
| 282 |
+
|
| 283 |
+
<!--
|
| 284 |
+
### Downstream Usage (Sentence Transformers)
|
| 285 |
+
|
| 286 |
+
You can finetune this model on your own dataset.
|
| 287 |
+
|
| 288 |
+
<details><summary>Click to expand</summary>
|
| 289 |
+
|
| 290 |
+
</details>
|
| 291 |
+
-->
|
| 292 |
+
|
| 293 |
+
<!--
|
| 294 |
+
### Out-of-Scope Use
|
| 295 |
+
|
| 296 |
+
*List how the model may foreseeably be misused and address what users ought not to do with the model.*
|
| 297 |
+
-->
|
| 298 |
+
|
| 299 |
+
<!--
|
| 300 |
+
## Bias, Risks and Limitations
|
| 301 |
+
|
| 302 |
+
*What are the known or foreseeable issues stemming from this model? You could also flag here known failure cases or weaknesses of the model.*
|
| 303 |
+
-->
|
| 304 |
+
|
| 305 |
+
<!--
|
| 306 |
+
### Recommendations
|
| 307 |
+
|
| 308 |
+
*What are recommendations with respect to the foreseeable issues? For example, filtering explicit content.*
|
| 309 |
+
-->
|
| 310 |
+
|
| 311 |
+
## Training Details
|
| 312 |
+
|
| 313 |
+
### Training Dataset
|
| 314 |
+
|
| 315 |
+
#### Unnamed Dataset
|
| 316 |
+
|
| 317 |
+
* Size: 5,604 training samples
|
| 318 |
+
* Columns: <code>sentence_0</code>, <code>sentence_1</code>, and <code>label</code>
|
| 319 |
+
* Approximate statistics based on the first 1000 samples:
|
| 320 |
+
| | sentence_0 | sentence_1 | label |
|
| 321 |
+
|:--------|:-----------------------------------------------------------------------------------|:------------------------------------------------------------------------------------|:---------------------------------------------------------------|
|
| 322 |
+
| type | string | string | float |
|
| 323 |
+
| details | <ul><li>min: 10 tokens</li><li>mean: 11.84 tokens</li><li>max: 25 tokens</li></ul> | <ul><li>min: 8 tokens</li><li>mean: 218.19 tokens</li><li>max: 322 tokens</li></ul> | <ul><li>min: 0.0</li><li>mean: 0.37</li><li>max: 1.0</li></ul> |
|
| 324 |
+
* Samples:
|
| 325 |
+
| sentence_0 | sentence_1 | label |
|
| 326 |
+
|:-----------------------------------------------------------------------------------------------------------|:---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|:-----------------|
|
| 327 |
+
| <code>who played guitar solo on reeling in the years</code> | <code>Eric Patrick Clapton (born 30 March 1945) is an English rock and blues guitarist, singer, and songwriter. He is regarded as one of the most successful and influential guitarists in rock music. Clapton ranked second in Rolling Stone's list of the "100 Greatest Guitarists of All Time" and fourth in Gibson's "Top 50 Guitarists of All Time". He was named number five in Time magazine's list of "The 10 Best Electric Guitar Players" in 2009. After playing in a number of different local bands, Clapton joined the Yardbirds from 1963 to 1965, and John Mayall & the Bluesbreakers from 1965 to 1966. After leaving Mayall, he formed the power trio Cream with drummer Ginger Baker and bassist/vocalist Jack Bruce, in which Clapton played sustained blues improvisations and "arty, blues-based psychedelic pop". After four successful albums, Cream broke up in November 1968. Clapton then formed the blues rock band Blind Faith with Baker, Steve Winwood, and Ric Grech, recording one album and performing on one...</code> | <code>1.0</code> |
|
| 328 |
+
| <code>how a population of wolves may have undergone speciation to form the first population of dogs</code> | <code>Geological evidence suggests that approximately 3 million years ago, South America became connected to North America when the Bolivar Trough marine barrier disappeared and the Panamanian land bridge formed. The joining of these two land masses led to the Great American Interchange, in which biota from both continents expanded their ranges. The first species known to have made the northward migration was Pliometanastes, a fossil ground sloth roughly the size of a modern black bear. Migrations to the Southern Hemisphere were undertaken by several North American mammalian carnivores. Fewer species migrated in the opposite direction from south to north. The result of the expansion of a North American fauna was a mass extinction in which hundreds of species disappeared in a relatively short time. About 60% of present-day South American mammals have evolved from North American species. Some South American species were able to adapt and spread into North America. Apart from Pliometanastes, du...</code> | <code>1.0</code> |
|
| 329 |
+
| <code>who is credited with promoting the use of factor analysis and why</code> | <code>The enemies of President Davis proposed that the Confederacy "died of Davis". He was unfavorably compared to George Washington by critics such as Edward Alfred Pollard, editor of the most influential newspaper in the Confederacy, the Daily Richmond Examiner. Beyond the early honeymoon period, Davis was never popular. Ellis Merton Coulter, viewed by historians as a Confederate apologist, argues that Davis was unable to mobilize Confederate nationalism in support of his government effectively, and especially failed to appeal to the small farmers who made up the bulk of the population. Davis failed to build a network of supporters who would speak up when he came under criticism, and he repeatedly alienated governors and other state-based leaders by demanding centralized control of the war effort.</code> | <code>0.0</code> |
|
| 330 |
+
* Loss: [<code>CosineSimilarityLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#cosinesimilarityloss) with these parameters:
|
| 331 |
+
```json
|
| 332 |
+
{
|
| 333 |
+
"loss_fct": "torch.nn.modules.loss.MSELoss"
|
| 334 |
+
}
|
| 335 |
+
```
|
| 336 |
+
|
| 337 |
+
### Training Hyperparameters
|
| 338 |
+
#### Non-Default Hyperparameters
|
| 339 |
+
|
| 340 |
+
- `per_device_train_batch_size`: 16
|
| 341 |
+
- `per_device_eval_batch_size`: 16
|
| 342 |
+
- `multi_dataset_batch_sampler`: round_robin
|
| 343 |
+
|
| 344 |
+
#### All Hyperparameters
|
| 345 |
+
<details><summary>Click to expand</summary>
|
| 346 |
+
|
| 347 |
+
- `overwrite_output_dir`: False
|
| 348 |
+
- `do_predict`: False
|
| 349 |
+
- `eval_strategy`: no
|
| 350 |
+
- `prediction_loss_only`: True
|
| 351 |
+
- `per_device_train_batch_size`: 16
|
| 352 |
+
- `per_device_eval_batch_size`: 16
|
| 353 |
+
- `per_gpu_train_batch_size`: None
|
| 354 |
+
- `per_gpu_eval_batch_size`: None
|
| 355 |
+
- `gradient_accumulation_steps`: 1
|
| 356 |
+
- `eval_accumulation_steps`: None
|
| 357 |
+
- `torch_empty_cache_steps`: None
|
| 358 |
+
- `learning_rate`: 5e-05
|
| 359 |
+
- `weight_decay`: 0.0
|
| 360 |
+
- `adam_beta1`: 0.9
|
| 361 |
+
- `adam_beta2`: 0.999
|
| 362 |
+
- `adam_epsilon`: 1e-08
|
| 363 |
+
- `max_grad_norm`: 1
|
| 364 |
+
- `num_train_epochs`: 3
|
| 365 |
+
- `max_steps`: -1
|
| 366 |
+
- `lr_scheduler_type`: linear
|
| 367 |
+
- `lr_scheduler_kwargs`: {}
|
| 368 |
+
- `warmup_ratio`: 0.0
|
| 369 |
+
- `warmup_steps`: 0
|
| 370 |
+
- `log_level`: passive
|
| 371 |
+
- `log_level_replica`: warning
|
| 372 |
+
- `log_on_each_node`: True
|
| 373 |
+
- `logging_nan_inf_filter`: True
|
| 374 |
+
- `save_safetensors`: True
|
| 375 |
+
- `save_on_each_node`: False
|
| 376 |
+
- `save_only_model`: False
|
| 377 |
+
- `restore_callback_states_from_checkpoint`: False
|
| 378 |
+
- `no_cuda`: False
|
| 379 |
+
- `use_cpu`: False
|
| 380 |
+
- `use_mps_device`: False
|
| 381 |
+
- `seed`: 42
|
| 382 |
+
- `data_seed`: None
|
| 383 |
+
- `jit_mode_eval`: False
|
| 384 |
+
- `use_ipex`: False
|
| 385 |
+
- `bf16`: False
|
| 386 |
+
- `fp16`: False
|
| 387 |
+
- `fp16_opt_level`: O1
|
| 388 |
+
- `half_precision_backend`: auto
|
| 389 |
+
- `bf16_full_eval`: False
|
| 390 |
+
- `fp16_full_eval`: False
|
| 391 |
+
- `tf32`: None
|
| 392 |
+
- `local_rank`: 0
|
| 393 |
+
- `ddp_backend`: None
|
| 394 |
+
- `tpu_num_cores`: None
|
| 395 |
+
- `tpu_metrics_debug`: False
|
| 396 |
+
- `debug`: []
|
| 397 |
+
- `dataloader_drop_last`: False
|
| 398 |
+
- `dataloader_num_workers`: 0
|
| 399 |
+
- `dataloader_prefetch_factor`: None
|
| 400 |
+
- `past_index`: -1
|
| 401 |
+
- `disable_tqdm`: False
|
| 402 |
+
- `remove_unused_columns`: True
|
| 403 |
+
- `label_names`: None
|
| 404 |
+
- `load_best_model_at_end`: False
|
| 405 |
+
- `ignore_data_skip`: False
|
| 406 |
+
- `fsdp`: []
|
| 407 |
+
- `fsdp_min_num_params`: 0
|
| 408 |
+
- `fsdp_config`: {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}
|
| 409 |
+
- `fsdp_transformer_layer_cls_to_wrap`: None
|
| 410 |
+
- `accelerator_config`: {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}
|
| 411 |
+
- `deepspeed`: None
|
| 412 |
+
- `label_smoothing_factor`: 0.0
|
| 413 |
+
- `optim`: adamw_torch
|
| 414 |
+
- `optim_args`: None
|
| 415 |
+
- `adafactor`: False
|
| 416 |
+
- `group_by_length`: False
|
| 417 |
+
- `length_column_name`: length
|
| 418 |
+
- `ddp_find_unused_parameters`: None
|
| 419 |
+
- `ddp_bucket_cap_mb`: None
|
| 420 |
+
- `ddp_broadcast_buffers`: False
|
| 421 |
+
- `dataloader_pin_memory`: True
|
| 422 |
+
- `dataloader_persistent_workers`: False
|
| 423 |
+
- `skip_memory_metrics`: True
|
| 424 |
+
- `use_legacy_prediction_loop`: False
|
| 425 |
+
- `push_to_hub`: False
|
| 426 |
+
- `resume_from_checkpoint`: None
|
| 427 |
+
- `hub_model_id`: None
|
| 428 |
+
- `hub_strategy`: every_save
|
| 429 |
+
- `hub_private_repo`: None
|
| 430 |
+
- `hub_always_push`: False
|
| 431 |
+
- `gradient_checkpointing`: False
|
| 432 |
+
- `gradient_checkpointing_kwargs`: None
|
| 433 |
+
- `include_inputs_for_metrics`: False
|
| 434 |
+
- `include_for_metrics`: []
|
| 435 |
+
- `eval_do_concat_batches`: True
|
| 436 |
+
- `fp16_backend`: auto
|
| 437 |
+
- `push_to_hub_model_id`: None
|
| 438 |
+
- `push_to_hub_organization`: None
|
| 439 |
+
- `mp_parameters`:
|
| 440 |
+
- `auto_find_batch_size`: False
|
| 441 |
+
- `full_determinism`: False
|
| 442 |
+
- `torchdynamo`: None
|
| 443 |
+
- `ray_scope`: last
|
| 444 |
+
- `ddp_timeout`: 1800
|
| 445 |
+
- `torch_compile`: False
|
| 446 |
+
- `torch_compile_backend`: None
|
| 447 |
+
- `torch_compile_mode`: None
|
| 448 |
+
- `include_tokens_per_second`: False
|
| 449 |
+
- `include_num_input_tokens_seen`: False
|
| 450 |
+
- `neftune_noise_alpha`: None
|
| 451 |
+
- `optim_target_modules`: None
|
| 452 |
+
- `batch_eval_metrics`: False
|
| 453 |
+
- `eval_on_start`: False
|
| 454 |
+
- `use_liger_kernel`: False
|
| 455 |
+
- `eval_use_gather_object`: False
|
| 456 |
+
- `average_tokens_across_devices`: False
|
| 457 |
+
- `prompts`: None
|
| 458 |
+
- `batch_sampler`: batch_sampler
|
| 459 |
+
- `multi_dataset_batch_sampler`: round_robin
|
| 460 |
+
|
| 461 |
+
</details>
|
| 462 |
+
|
| 463 |
+
### Training Logs
|
| 464 |
+
| Epoch | Step | Training Loss |
|
| 465 |
+
|:------:|:----:|:-------------:|
|
| 466 |
+
| 1.4245 | 500 | 0.1336 |
|
| 467 |
+
| 2.8490 | 1000 | 0.0787 |
|
| 468 |
+
|
| 469 |
+
|
| 470 |
+
### Framework Versions
|
| 471 |
+
- Python: 3.12.3
|
| 472 |
+
- Sentence Transformers: 4.1.0
|
| 473 |
+
- Transformers: 4.52.4
|
| 474 |
+
- PyTorch: 2.7.0+cu128
|
| 475 |
+
- Accelerate: 1.7.0
|
| 476 |
+
- Datasets: 3.6.0
|
| 477 |
+
- Tokenizers: 0.21.1
|
| 478 |
+
|
| 479 |
+
## Citation
|
| 480 |
+
|
| 481 |
+
### BibTeX
|
| 482 |
+
|
| 483 |
+
#### Sentence Transformers
|
| 484 |
+
```bibtex
|
| 485 |
+
@inproceedings{reimers-2019-sentence-bert,
|
| 486 |
+
title = "Sentence-BERT: Sentence Embeddings using Siamese BERT-Networks",
|
| 487 |
+
author = "Reimers, Nils and Gurevych, Iryna",
|
| 488 |
+
booktitle = "Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing",
|
| 489 |
+
month = "11",
|
| 490 |
+
year = "2019",
|
| 491 |
+
publisher = "Association for Computational Linguistics",
|
| 492 |
+
url = "https://arxiv.org/abs/1908.10084",
|
| 493 |
+
}
|
| 494 |
+
```
|
| 495 |
+
|
| 496 |
+
<!--
|
| 497 |
+
## Glossary
|
| 498 |
+
|
| 499 |
+
*Clearly define terms in order to be accessible across audiences.*
|
| 500 |
+
-->
|
| 501 |
+
|
| 502 |
+
<!--
|
| 503 |
+
## Model Card Authors
|
| 504 |
+
|
| 505 |
+
*Lists the people who create the model card, providing recognition and accountability for the detailed work that goes into its construction.*
|
| 506 |
+
-->
|
| 507 |
+
|
| 508 |
+
<!--
|
| 509 |
+
## Model Card Contact
|
| 510 |
+
|
| 511 |
+
*Provides a way for people who have updates to the Model Card, suggestions, or questions, to contact the Model Card authors.*
|
| 512 |
+
-->
|
checkpoints/checkpoint-1050/1_Pooling/config.json
ADDED
|
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"word_embedding_dimension": 768,
|
| 3 |
+
"pooling_mode_cls_token": true,
|
| 4 |
+
"pooling_mode_mean_tokens": false,
|
| 5 |
+
"pooling_mode_max_tokens": false,
|
| 6 |
+
"pooling_mode_mean_sqrt_len_tokens": false,
|
| 7 |
+
"pooling_mode_weightedmean_tokens": false,
|
| 8 |
+
"pooling_mode_lasttoken": false,
|
| 9 |
+
"include_prompt": true
|
| 10 |
+
}
|
checkpoints/checkpoint-1050/README.md
ADDED
|
@@ -0,0 +1,512 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
---
|
| 2 |
+
tags:
|
| 3 |
+
- sentence-transformers
|
| 4 |
+
- sentence-similarity
|
| 5 |
+
- feature-extraction
|
| 6 |
+
- generated_from_trainer
|
| 7 |
+
- dataset_size:5604
|
| 8 |
+
- loss:CosineSimilarityLoss
|
| 9 |
+
base_model: BAAI/bge-base-en-v1.5
|
| 10 |
+
widget:
|
| 11 |
+
- source_sentence: what are the powers of the virginia executive branch
|
| 12 |
+
sentences:
|
| 13 |
+
- The 49ers won five Super Bowl championships between 1981 and 1994. Four of those
|
| 14 |
+
came in the 1980s, and were led by Hall of Famers Joe Montana, Jerry Rice, Ronnie
|
| 15 |
+
Lott, Steve Young, Charles Haley, Fred Dean, and coaches Bill Walsh and George
|
| 16 |
+
Seifert. They have been division champions 22 times between 1970 and 2023, making
|
| 17 |
+
them one of the most successful teams in NFL history. The 49ers sit alone in NFL
|
| 18 |
+
history for most playoff wins (38), having been in the league playoffs 30 times
|
| 19 |
+
(29 times in the NFL and one time in the AAFC), and have also played in the most
|
| 20 |
+
NFC Championship games (19), hosting 11 of them, also an NFC record. The team
|
| 21 |
+
has set numerous notable NFL records, including most consecutive away games won
|
| 22 |
+
(18), most consecutive seasons leading the league in scoring (4), most consecutive
|
| 23 |
+
games scored (420 games from 1977 to 2004), most field goals in a season (44),
|
| 24 |
+
most games won in a season (18), and most touchdowns (8) and points scored (55)
|
| 25 |
+
in a Super Bowl. According to Forbes, the 49ers are the sixth most valuable team
|
| 26 |
+
in the NFL, valued at $6.8 billion as of August 2024. In June 2023, the enterprise
|
| 27 |
+
branch of the 49ers completed the acquisition of English soccer club Leeds United
|
| 28 |
+
and in May 2025, it acquired 51% of Scottish soccer club Rangers F.C.
|
| 29 |
+
- In 2008, Triarc purchased Wendy's, and changed its name to Wendy's/Arby's Group,
|
| 30 |
+
to reflect their core businesses. In January 2011, it was announced that Wendy's/Arby's
|
| 31 |
+
Group were looking into selling the Arby's side of the business to focus on the
|
| 32 |
+
Wendy's brand. It was officially announced the companies would split on January
|
| 33 |
+
21, 2011. In 2009, the Wendy's/Arby's Group signed a franchise deal with the Al
|
| 34 |
+
Jammaz Group of Saudi Arabia to open dual-branded Wendy's/Arby's through the Middle
|
| 35 |
+
East with the first location opening in Dubai in the United Arab Emirates in May
|
| 36 |
+
2010. The Wendy's/Arby's Group also signed a similar franchise deal in June 2010
|
| 37 |
+
with Tab Gida Sanayi ve Ticaret to open dual-branded restaurants in Turkey. After
|
| 38 |
+
the split, the former Wendy's/Arby's Group became The Wendy's Company.
|
| 39 |
+
- 'Executive: The Chief Executive is responsible for enforcing regional law, can
|
| 40 |
+
force reconsideration of legislation, and appoints Executive Council members and
|
| 41 |
+
principal officials. Acting with the Executive Council, the Chief Executive-in-Council
|
| 42 |
+
can propose new bills, issue subordinate legislation, and has authority to dissolve
|
| 43 |
+
the legislature. In states of emergency or public danger, the Chief Executive-in-Council
|
| 44 |
+
is further empowered to enact any regulation necessary to restore public order.
|
| 45 |
+
Legislature: The unicameral Legislative Council enacts regional law, approves
|
| 46 |
+
budgets, and has the power to impeach a sitting chief executive. Judiciary: The
|
| 47 |
+
Hong Kong Court of Final Appeal and lower courts interpret laws and overturn those
|
| 48 |
+
inconsistent with the Basic Law. Judges are appointed by the chief executive on
|
| 49 |
+
the advice of a recommendation commission. The chief executive is the head of
|
| 50 |
+
government and serves for a maximum of two five-year terms. The State Council
|
| 51 |
+
(led by the Premier of China) appoints the chief executive after nomination by
|
| 52 |
+
the Election Committee, which is composed of 1500 business, community, and government
|
| 53 |
+
leaders.'
|
| 54 |
+
- source_sentence: how many chromosomes does a human diploid cell have
|
| 55 |
+
sentences:
|
| 56 |
+
- The Peace of Cateau-Cambrésis in 1559 concluded the war with France, leaving Spain
|
| 57 |
+
at a considerable advantage. However, the government was still mired in debt,
|
| 58 |
+
and declared bankruptcy that year. Most of the government's revenues came from
|
| 59 |
+
taxes and excise duties, not imported silver and other goods. The Ottoman Empire
|
| 60 |
+
had long menaced the fringes of the Habsburg dominions in Austria and northwest
|
| 61 |
+
Africa. In response Ferdinand and Isabella had sent expeditions to North Africa,
|
| 62 |
+
capturing Melilla in 1497 and Oran in 1509. Charles had preferred to combat the
|
| 63 |
+
Ottomans through a considerably more maritime strategy, hampering Ottoman landings
|
| 64 |
+
on the Venetian territories in the Eastern Mediterranean. Only in response to
|
| 65 |
+
raids on the eastern coast of Spain did Charles personally lead attacks against
|
| 66 |
+
holdings in North Africa (1535). In 1560, the Ottomans battled the Spanish Navy
|
| 67 |
+
off the coast of Tunisia, but in 1565 Ottoman troops landing on the strategically
|
| 68 |
+
vital island of Malta, defended by the Knights of St. John, were defeated. The
|
| 69 |
+
death of Suleiman the Magnificent the following year and his succession by Selim
|
| 70 |
+
II emboldened Philip, who resolved to carry the war to the Ottoman homelands.
|
| 71 |
+
In 1571, a mixed naval expedition of Spanish, Venetian, and Papal ships led by
|
| 72 |
+
Charles' illegitimate son Don John of Austria annihilated the Ottoman fleet at
|
| 73 |
+
the Battle of Lepanto, in the largest naval battle fought in European waters since
|
| 74 |
+
Actium in 31 BC. The fleet included Miguel de Cervantes, future author of the
|
| 75 |
+
historic Spanish novel Don Quixote
|
| 76 |
+
- 'The 1930s were the team''s first golden era, when they improved their game through
|
| 77 |
+
play with more experienced teams. The Combinado del Pacífico (a squad composed
|
| 78 |
+
of Chilean and Peruvian footballers) toured Europe from 1933 to 1934. Starting
|
| 79 |
+
with Ciclista Lima in 1926, Peru''s football clubs toured Latin America with much
|
| 80 |
+
success. During one of these tours—Alianza Lima''s undefeated journey through
|
| 81 |
+
Chile in 1935—emerged the Rodillo Negro ("Black Roller"), a skillful group led
|
| 82 |
+
by forwards Alejandro Villanueva, Teodoro Fernández and goalkeeper Juan Valdivieso.
|
| 83 |
+
Sports historian Richard Witzig described these three as "a soccer triumvirate
|
| 84 |
+
unsurpassed in the world at that time", citing their combined innovation and effectiveness
|
| 85 |
+
at both ends of the field. Peru and the Rodillo Negro impressed at the 1936 Summer
|
| 86 |
+
Olympics, won the inaugural Bolivarian Games in 1938, and finished the decade
|
| 87 |
+
as South American champions. Historian David Goldblatt assessed the decline of
|
| 88 |
+
its previous success: "despite all the apparent preconditions for footballing
|
| 89 |
+
growth and success, Peruvian football disappeared". He attributes this sudden
|
| 90 |
+
decline to Peruvian authorities'' repression of "social, sporting and political
|
| 91 |
+
organisations among the urban and rural poor" during the 1940s and 1950s. Nevertheless,
|
| 92 |
+
Peru performed creditably at the South American Championships, placing third in
|
| 93 |
+
Brazil 1949 and Chile 1955, and missed qualification for the Sweden 1958 World
|
| 94 |
+
Cup finals, over two legs to eventual champions Brazil.'
|
| 95 |
+
- In 1939, at the start of World War II, Poland was partitioned between Nazi Germany
|
| 96 |
+
and the Soviet Union (see Molotov–Ribbentrop Pact). One-fifth of the Polish population
|
| 97 |
+
perished during World War II; the 3,000,000 Polish Jews murdered in the Holocaust,
|
| 98 |
+
who constituted 90% of Polish Jewry, made up half of all Poles killed during the
|
| 99 |
+
war. While the Holocaust occurred largely in German-occupied Poland, it was orchestrated
|
| 100 |
+
and perpetrated by the Nazis. Polish attitudes to the Holocaust varied widely,
|
| 101 |
+
from actively risking death in order to save Jewish lives, and passive refusal
|
| 102 |
+
to inform on them, to indifference, blackmail, and in extreme cases, committing
|
| 103 |
+
premeditated murders such as in the Jedwabne pogrom. Collaboration by non-Jewish
|
| 104 |
+
Polish citizens in the Holocaust was sporadic, but incidents of hostility against
|
| 105 |
+
Jews are well documented and have been a subject of renewed scholarly interest
|
| 106 |
+
during the 21st century.
|
| 107 |
+
- source_sentence: what is the difference between ice brent crude and wti crude
|
| 108 |
+
sentences:
|
| 109 |
+
- ==== Spring and Autumn period (722–476 BC) ====
|
| 110 |
+
- SpaceX has also bought and is modifying several residential properties in Boca
|
| 111 |
+
Chica Village, but apparently planning to leave them in residential use, about
|
| 112 |
+
2 miles (3.2 km) west of the launch site. In September 2019, SpaceX extended an
|
| 113 |
+
offer to buy each of the houses in Boca Chica Village for three times the fair
|
| 114 |
+
market value along with an offer of VIP invitations to future launch events. The
|
| 115 |
+
3x offer was said to be "non-negotiable." Homeowners were given two weeks for
|
| 116 |
+
this particular offer to remain valid. In January 2024, the Texas Parks and Wildlife
|
| 117 |
+
Department announced a proposal to transfer 43 acres of Boca Chica State Park
|
| 118 |
+
lands to SpaceX, in exchange for 477 new acres to be added to the Laguna Atascosa
|
| 119 |
+
National Wildlife Refuge.
|
| 120 |
+
- However, exclusive US control of this resource was eventually challenged, and
|
| 121 |
+
the Bering Sea Controversy resulted when the United States seized over 150 sealing
|
| 122 |
+
ships flying the British flag, based out of the coast of British Columbia. The
|
| 123 |
+
conflict between the United States and Britain was resolved by an arbitration
|
| 124 |
+
tribunal in 1893. The waters of the Bering Sea were deemed to be international
|
| 125 |
+
waters, contrary to the US contention that they were an internal sea. The US was
|
| 126 |
+
required to make a payment to Britain, and both nations were required to follow
|
| 127 |
+
regulations developed to preserve the resource.
|
| 128 |
+
- source_sentence: why is there a citgo sign in boston
|
| 129 |
+
sentences:
|
| 130 |
+
- Tucker appeared on Terri Clark's 2012 album Classic in a remake duet of her first
|
| 131 |
+
single "Delta Dawn". In June 2017, Tucker was featured in Rolling Stone as one
|
| 132 |
+
of the 100 Greatest Country Artists of All Time. After the death of former flame
|
| 133 |
+
Glen Campbell on August 8, 2017, Tucker released her first single since 2009,
|
| 134 |
+
"Forever Loving You", a song co-penned by Tennessee State Senator Rusty Crowe.
|
| 135 |
+
The song's release the following day, on the eve of Campbell's funeral, drew ire
|
| 136 |
+
and criticism being exploitative. Tucker claimed that a portion of the proceeds
|
| 137 |
+
will benefit the Alzheimer's Foundation of America, but the foundation stated
|
| 138 |
+
it was not involved in the promotion and has not received any funds. Tucker released
|
| 139 |
+
While I'm Livin', her first collection of original material since 2002's Tanya,
|
| 140 |
+
in 2019 via Fantasy Records. It was produced by Shooter Jennings and Brandi Carlile,
|
| 141 |
+
with Carlile brought onto the project after initially being approached for songs
|
| 142 |
+
by Jennings but after having professed such an admiration of Tucker and her work,
|
| 143 |
+
Jennings felt it necessary for her to co-produce the record alongside him. Tucker
|
| 144 |
+
performed "Bring My Flowers Now" at Loretta Lynn's all-star 87th birthday concert
|
| 145 |
+
at Nashville's Bridgestone Arena with Carlile playing piano. The album's first
|
| 146 |
+
single, "Hard Luck", was released on June 28, along with its accompanying music
|
| 147 |
+
video.
|
| 148 |
+
- ==== Golf ==== Numerous golf courses can be found in the city, with the most famous
|
| 149 |
+
being Bay Hill Club and Lodge, home to the Arnold Palmer Invitational. == Culture
|
| 150 |
+
==
|
| 151 |
+
- The massive Islamic invasions of the mid-7th century began a long struggle between
|
| 152 |
+
Christianity and Islam throughout the Mediterranean Basin. The Byzantine Empire
|
| 153 |
+
soon lost the lands of the eastern patriarchates of Jerusalem, Alexandria and
|
| 154 |
+
Antioch and was reduced to that of Constantinople, the empire's capital. As a
|
| 155 |
+
result of Islamic domination of the Mediterranean, the Frankish state, centred
|
| 156 |
+
away from that sea, was able to evolve as the dominant power that shaped the Western
|
| 157 |
+
Europe of the Middle Ages. The battles of Toulouse and Tours halted the Islamic
|
| 158 |
+
advance in the West and the failed siege of Constantinople halted it in the East.
|
| 159 |
+
Two or three decades later, in 751, the Byzantine Empire lost to the Lombards
|
| 160 |
+
the city of Ravenna from which it governed the small fragments of Italy, including
|
| 161 |
+
Rome, that acknowledged its sovereignty. The fall of Ravenna meant that confirmation
|
| 162 |
+
by a no longer existent exarch was not asked for during the election in 752 of
|
| 163 |
+
Pope Stephen II, and that the papacy was forced to look elsewhere for a civil
|
| 164 |
+
power to protect it. In 754, at the urgent request of Pope Stephen, the Frankish
|
| 165 |
+
king Pepin the Short conquered the Lombards. He then gifted the lands of the former
|
| 166 |
+
exarchate to the pope, initiating the Papal States. In the 860s, Rome and the
|
| 167 |
+
Byzantine East were in conflict during the Photian schism, when Photius criticized
|
| 168 |
+
the Latin west for adding of the filioque clause, after being excommunicated by
|
| 169 |
+
Nicholas I. Though the schism was reconciled, unresolved issues would lead to
|
| 170 |
+
further division.
|
| 171 |
+
- source_sentence: who organized the native resistance to the british
|
| 172 |
+
sentences:
|
| 173 |
+
- === Engines === == Fifth generation (WL; 2021) ==
|
| 174 |
+
- '=== Unitarism === All states are unitary states, not federations or aggregates
|
| 175 |
+
of local governments. Local governments within them are created by and exist by
|
| 176 |
+
virtue of state law, and local governments within each state are subject to the
|
| 177 |
+
central authority of that particular state. State governments commonly delegate
|
| 178 |
+
some authority to local units and channel policy decisions down to them for implementation.
|
| 179 |
+
In a few states, local units of government are permitted a degree of home rule
|
| 180 |
+
over various matters. The prevailing legal theory of state preeminence over local
|
| 181 |
+
governments, referred to as Dillon''s Rule, holds that, A municipal corporation
|
| 182 |
+
possesses and can exercise the following powers and no others: First, those granted
|
| 183 |
+
in express words; second, those necessarily implied or necessarily incident to
|
| 184 |
+
the powers expressly granted; third, those absolutely essential to the declared
|
| 185 |
+
objects and purposes of the corporation—not simply convenient but indispensable;
|
| 186 |
+
fourth, any fair doubt as to the existence of power is resolved by the courts
|
| 187 |
+
against the corporation—against the existence of the powers. Each state defines
|
| 188 |
+
for itself what powers it will allow local governments. Generally, four categories
|
| 189 |
+
of power may be given to local jurisdictions: Structural – power to choose the
|
| 190 |
+
form of government, charter and enact charter revisions, Functional – power to
|
| 191 |
+
exercise local self-government in a broad or limited manner, Fiscal – authority
|
| 192 |
+
to determine revenue sources, set tax rates, borrow funds and other related financial
|
| 193 |
+
activities, Personnel – authority to set employment rules, remuneration rates,
|
| 194 |
+
employment conditions and collective bargaining. == Relationships =='
|
| 195 |
+
- Throughout the war, the British deported the Acadians to the Thirteen Colonies
|
| 196 |
+
and Europe, which the Acadian militias resisted with assistance from Mi'kmaq and
|
| 197 |
+
Malisteet forces. The Great Upheaval continued from 1755 to 1764. In 1756, a large
|
| 198 |
+
force of French, Canadians, and their Native American allies led by the Marquis
|
| 199 |
+
de Montcalm launched an attack against the key British post at Fort Oswego on
|
| 200 |
+
Lake Ontario from Fort Frontenac and forced the garrison to surrender. The following
|
| 201 |
+
year Montcalm with a huge force of 7,200 French and Canadian troops and 2,400
|
| 202 |
+
Native Americans laid siege to Fort William Henry on the southern shores of Lake
|
| 203 |
+
George, and after three weeks of fighting the British commander Monroe surrendered.
|
| 204 |
+
Montcalm gave him honorable terms to return to England and not to fight for 18
|
| 205 |
+
months. And yet, when the British force with civilians was three miles from the
|
| 206 |
+
fort, the Native American allies massacred about 1,100 of the 1,500 strong force.
|
| 207 |
+
pipeline_tag: sentence-similarity
|
| 208 |
+
library_name: sentence-transformers
|
| 209 |
+
---
|
| 210 |
+
|
| 211 |
+
# SentenceTransformer based on BAAI/bge-base-en-v1.5
|
| 212 |
+
|
| 213 |
+
This is a [sentence-transformers](https://www.SBERT.net) model finetuned from [BAAI/bge-base-en-v1.5](https://huggingface.co/BAAI/bge-base-en-v1.5). It maps sentences & paragraphs to a 768-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more.
|
| 214 |
+
|
| 215 |
+
## Model Details
|
| 216 |
+
|
| 217 |
+
### Model Description
|
| 218 |
+
- **Model Type:** Sentence Transformer
|
| 219 |
+
- **Base model:** [BAAI/bge-base-en-v1.5](https://huggingface.co/BAAI/bge-base-en-v1.5) <!-- at revision a5beb1e3e68b9ab74eb54cfd186867f64f240e1a -->
|
| 220 |
+
- **Maximum Sequence Length:** 512 tokens
|
| 221 |
+
- **Output Dimensionality:** 768 dimensions
|
| 222 |
+
- **Similarity Function:** Cosine Similarity
|
| 223 |
+
<!-- - **Training Dataset:** Unknown -->
|
| 224 |
+
<!-- - **Language:** Unknown -->
|
| 225 |
+
<!-- - **License:** Unknown -->
|
| 226 |
+
|
| 227 |
+
### Model Sources
|
| 228 |
+
|
| 229 |
+
- **Documentation:** [Sentence Transformers Documentation](https://sbert.net)
|
| 230 |
+
- **Repository:** [Sentence Transformers on GitHub](https://github.com/UKPLab/sentence-transformers)
|
| 231 |
+
- **Hugging Face:** [Sentence Transformers on Hugging Face](https://huggingface.co/models?library=sentence-transformers)
|
| 232 |
+
|
| 233 |
+
### Full Model Architecture
|
| 234 |
+
|
| 235 |
+
```
|
| 236 |
+
SentenceTransformer(
|
| 237 |
+
(0): Transformer({'max_seq_length': 512, 'do_lower_case': True}) with Transformer model: BertModel
|
| 238 |
+
(1): Pooling({'word_embedding_dimension': 768, 'pooling_mode_cls_token': True, 'pooling_mode_mean_tokens': False, 'pooling_mode_max_tokens': False, 'pooling_mode_mean_sqrt_len_tokens': False, 'pooling_mode_weightedmean_tokens': False, 'pooling_mode_lasttoken': False, 'include_prompt': True})
|
| 239 |
+
(2): Normalize()
|
| 240 |
+
)
|
| 241 |
+
```
|
| 242 |
+
|
| 243 |
+
## Usage
|
| 244 |
+
|
| 245 |
+
### Direct Usage (Sentence Transformers)
|
| 246 |
+
|
| 247 |
+
First install the Sentence Transformers library:
|
| 248 |
+
|
| 249 |
+
```bash
|
| 250 |
+
pip install -U sentence-transformers
|
| 251 |
+
```
|
| 252 |
+
|
| 253 |
+
Then you can load this model and run inference.
|
| 254 |
+
```python
|
| 255 |
+
from sentence_transformers import SentenceTransformer
|
| 256 |
+
|
| 257 |
+
# Download from the 🤗 Hub
|
| 258 |
+
model = SentenceTransformer("sentence_transformers_model_id")
|
| 259 |
+
# Run inference
|
| 260 |
+
sentences = [
|
| 261 |
+
'who organized the native resistance to the british',
|
| 262 |
+
"Throughout the war, the British deported the Acadians to the Thirteen Colonies and Europe, which the Acadian militias resisted with assistance from Mi'kmaq and Malisteet forces. The Great Upheaval continued from 1755 to 1764. In 1756, a large force of French, Canadians, and their Native American allies led by the Marquis de Montcalm launched an attack against the key British post at Fort Oswego on Lake Ontario from Fort Frontenac and forced the garrison to surrender. The following year Montcalm with a huge force of 7,200 French and Canadian troops and 2,400 Native Americans laid siege to Fort William Henry on the southern shores of Lake George, and after three weeks of fighting the British commander Monroe surrendered. Montcalm gave him honorable terms to return to England and not to fight for 18 months. And yet, when the British force with civilians was three miles from the fort, the Native American allies massacred about 1,100 of the 1,500 strong force.",
|
| 263 |
+
"=== Unitarism === All states are unitary states, not federations or aggregates of local governments. Local governments within them are created by and exist by virtue of state law, and local governments within each state are subject to the central authority of that particular state. State governments commonly delegate some authority to local units and channel policy decisions down to them for implementation. In a few states, local units of government are permitted a degree of home rule over various matters. The prevailing legal theory of state preeminence over local governments, referred to as Dillon's Rule, holds that, A municipal corporation possesses and can exercise the following powers and no others: First, those granted in express words; second, those necessarily implied or necessarily incident to the powers expressly granted; third, those absolutely essential to the declared objects and purposes of the corporation—not simply convenient but indispensable; fourth, any fair doubt as to the existence of power is resolved by the courts against the corporation—against the existence of the powers. Each state defines for itself what powers it will allow local governments. Generally, four categories of power may be given to local jurisdictions: Structural – power to choose the form of government, charter and enact charter revisions, Functional – power to exercise local self-government in a broad or limited manner, Fiscal – authority to determine revenue sources, set tax rates, borrow funds and other related financial activities, Personnel – authority to set employment rules, remuneration rates, employment conditions and collective bargaining. == Relationships ==",
|
| 264 |
+
]
|
| 265 |
+
embeddings = model.encode(sentences)
|
| 266 |
+
print(embeddings.shape)
|
| 267 |
+
# [3, 768]
|
| 268 |
+
|
| 269 |
+
# Get the similarity scores for the embeddings
|
| 270 |
+
similarities = model.similarity(embeddings, embeddings)
|
| 271 |
+
print(similarities.shape)
|
| 272 |
+
# [3, 3]
|
| 273 |
+
```
|
| 274 |
+
|
| 275 |
+
<!--
|
| 276 |
+
### Direct Usage (Transformers)
|
| 277 |
+
|
| 278 |
+
<details><summary>Click to see the direct usage in Transformers</summary>
|
| 279 |
+
|
| 280 |
+
</details>
|
| 281 |
+
-->
|
| 282 |
+
|
| 283 |
+
<!--
|
| 284 |
+
### Downstream Usage (Sentence Transformers)
|
| 285 |
+
|
| 286 |
+
You can finetune this model on your own dataset.
|
| 287 |
+
|
| 288 |
+
<details><summary>Click to expand</summary>
|
| 289 |
+
|
| 290 |
+
</details>
|
| 291 |
+
-->
|
| 292 |
+
|
| 293 |
+
<!--
|
| 294 |
+
### Out-of-Scope Use
|
| 295 |
+
|
| 296 |
+
*List how the model may foreseeably be misused and address what users ought not to do with the model.*
|
| 297 |
+
-->
|
| 298 |
+
|
| 299 |
+
<!--
|
| 300 |
+
## Bias, Risks and Limitations
|
| 301 |
+
|
| 302 |
+
*What are the known or foreseeable issues stemming from this model? You could also flag here known failure cases or weaknesses of the model.*
|
| 303 |
+
-->
|
| 304 |
+
|
| 305 |
+
<!--
|
| 306 |
+
### Recommendations
|
| 307 |
+
|
| 308 |
+
*What are recommendations with respect to the foreseeable issues? For example, filtering explicit content.*
|
| 309 |
+
-->
|
| 310 |
+
|
| 311 |
+
## Training Details
|
| 312 |
+
|
| 313 |
+
### Training Dataset
|
| 314 |
+
|
| 315 |
+
#### Unnamed Dataset
|
| 316 |
+
|
| 317 |
+
* Size: 5,604 training samples
|
| 318 |
+
* Columns: <code>sentence_0</code>, <code>sentence_1</code>, and <code>label</code>
|
| 319 |
+
* Approximate statistics based on the first 1000 samples:
|
| 320 |
+
| | sentence_0 | sentence_1 | label |
|
| 321 |
+
|:--------|:-----------------------------------------------------------------------------------|:------------------------------------------------------------------------------------|:---------------------------------------------------------------|
|
| 322 |
+
| type | string | string | float |
|
| 323 |
+
| details | <ul><li>min: 10 tokens</li><li>mean: 11.84 tokens</li><li>max: 25 tokens</li></ul> | <ul><li>min: 8 tokens</li><li>mean: 218.19 tokens</li><li>max: 322 tokens</li></ul> | <ul><li>min: 0.0</li><li>mean: 0.37</li><li>max: 1.0</li></ul> |
|
| 324 |
+
* Samples:
|
| 325 |
+
| sentence_0 | sentence_1 | label |
|
| 326 |
+
|:-----------------------------------------------------------------------------------------------------------|:---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|:-----------------|
|
| 327 |
+
| <code>who played guitar solo on reeling in the years</code> | <code>Eric Patrick Clapton (born 30 March 1945) is an English rock and blues guitarist, singer, and songwriter. He is regarded as one of the most successful and influential guitarists in rock music. Clapton ranked second in Rolling Stone's list of the "100 Greatest Guitarists of All Time" and fourth in Gibson's "Top 50 Guitarists of All Time". He was named number five in Time magazine's list of "The 10 Best Electric Guitar Players" in 2009. After playing in a number of different local bands, Clapton joined the Yardbirds from 1963 to 1965, and John Mayall & the Bluesbreakers from 1965 to 1966. After leaving Mayall, he formed the power trio Cream with drummer Ginger Baker and bassist/vocalist Jack Bruce, in which Clapton played sustained blues improvisations and "arty, blues-based psychedelic pop". After four successful albums, Cream broke up in November 1968. Clapton then formed the blues rock band Blind Faith with Baker, Steve Winwood, and Ric Grech, recording one album and performing on one...</code> | <code>1.0</code> |
|
| 328 |
+
| <code>how a population of wolves may have undergone speciation to form the first population of dogs</code> | <code>Geological evidence suggests that approximately 3 million years ago, South America became connected to North America when the Bolivar Trough marine barrier disappeared and the Panamanian land bridge formed. The joining of these two land masses led to the Great American Interchange, in which biota from both continents expanded their ranges. The first species known to have made the northward migration was Pliometanastes, a fossil ground sloth roughly the size of a modern black bear. Migrations to the Southern Hemisphere were undertaken by several North American mammalian carnivores. Fewer species migrated in the opposite direction from south to north. The result of the expansion of a North American fauna was a mass extinction in which hundreds of species disappeared in a relatively short time. About 60% of present-day South American mammals have evolved from North American species. Some South American species were able to adapt and spread into North America. Apart from Pliometanastes, du...</code> | <code>1.0</code> |
|
| 329 |
+
| <code>who is credited with promoting the use of factor analysis and why</code> | <code>The enemies of President Davis proposed that the Confederacy "died of Davis". He was unfavorably compared to George Washington by critics such as Edward Alfred Pollard, editor of the most influential newspaper in the Confederacy, the Daily Richmond Examiner. Beyond the early honeymoon period, Davis was never popular. Ellis Merton Coulter, viewed by historians as a Confederate apologist, argues that Davis was unable to mobilize Confederate nationalism in support of his government effectively, and especially failed to appeal to the small farmers who made up the bulk of the population. Davis failed to build a network of supporters who would speak up when he came under criticism, and he repeatedly alienated governors and other state-based leaders by demanding centralized control of the war effort.</code> | <code>0.0</code> |
|
| 330 |
+
* Loss: [<code>CosineSimilarityLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#cosinesimilarityloss) with these parameters:
|
| 331 |
+
```json
|
| 332 |
+
{
|
| 333 |
+
"loss_fct": "torch.nn.modules.loss.MSELoss"
|
| 334 |
+
}
|
| 335 |
+
```
|
| 336 |
+
|
| 337 |
+
### Training Hyperparameters
|
| 338 |
+
#### Non-Default Hyperparameters
|
| 339 |
+
|
| 340 |
+
- `per_device_train_batch_size`: 16
|
| 341 |
+
- `per_device_eval_batch_size`: 16
|
| 342 |
+
- `multi_dataset_batch_sampler`: round_robin
|
| 343 |
+
|
| 344 |
+
#### All Hyperparameters
|
| 345 |
+
<details><summary>Click to expand</summary>
|
| 346 |
+
|
| 347 |
+
- `overwrite_output_dir`: False
|
| 348 |
+
- `do_predict`: False
|
| 349 |
+
- `eval_strategy`: no
|
| 350 |
+
- `prediction_loss_only`: True
|
| 351 |
+
- `per_device_train_batch_size`: 16
|
| 352 |
+
- `per_device_eval_batch_size`: 16
|
| 353 |
+
- `per_gpu_train_batch_size`: None
|
| 354 |
+
- `per_gpu_eval_batch_size`: None
|
| 355 |
+
- `gradient_accumulation_steps`: 1
|
| 356 |
+
- `eval_accumulation_steps`: None
|
| 357 |
+
- `torch_empty_cache_steps`: None
|
| 358 |
+
- `learning_rate`: 5e-05
|
| 359 |
+
- `weight_decay`: 0.0
|
| 360 |
+
- `adam_beta1`: 0.9
|
| 361 |
+
- `adam_beta2`: 0.999
|
| 362 |
+
- `adam_epsilon`: 1e-08
|
| 363 |
+
- `max_grad_norm`: 1
|
| 364 |
+
- `num_train_epochs`: 3
|
| 365 |
+
- `max_steps`: -1
|
| 366 |
+
- `lr_scheduler_type`: linear
|
| 367 |
+
- `lr_scheduler_kwargs`: {}
|
| 368 |
+
- `warmup_ratio`: 0.0
|
| 369 |
+
- `warmup_steps`: 0
|
| 370 |
+
- `log_level`: passive
|
| 371 |
+
- `log_level_replica`: warning
|
| 372 |
+
- `log_on_each_node`: True
|
| 373 |
+
- `logging_nan_inf_filter`: True
|
| 374 |
+
- `save_safetensors`: True
|
| 375 |
+
- `save_on_each_node`: False
|
| 376 |
+
- `save_only_model`: False
|
| 377 |
+
- `restore_callback_states_from_checkpoint`: False
|
| 378 |
+
- `no_cuda`: False
|
| 379 |
+
- `use_cpu`: False
|
| 380 |
+
- `use_mps_device`: False
|
| 381 |
+
- `seed`: 42
|
| 382 |
+
- `data_seed`: None
|
| 383 |
+
- `jit_mode_eval`: False
|
| 384 |
+
- `use_ipex`: False
|
| 385 |
+
- `bf16`: False
|
| 386 |
+
- `fp16`: False
|
| 387 |
+
- `fp16_opt_level`: O1
|
| 388 |
+
- `half_precision_backend`: auto
|
| 389 |
+
- `bf16_full_eval`: False
|
| 390 |
+
- `fp16_full_eval`: False
|
| 391 |
+
- `tf32`: None
|
| 392 |
+
- `local_rank`: 0
|
| 393 |
+
- `ddp_backend`: None
|
| 394 |
+
- `tpu_num_cores`: None
|
| 395 |
+
- `tpu_metrics_debug`: False
|
| 396 |
+
- `debug`: []
|
| 397 |
+
- `dataloader_drop_last`: False
|
| 398 |
+
- `dataloader_num_workers`: 0
|
| 399 |
+
- `dataloader_prefetch_factor`: None
|
| 400 |
+
- `past_index`: -1
|
| 401 |
+
- `disable_tqdm`: False
|
| 402 |
+
- `remove_unused_columns`: True
|
| 403 |
+
- `label_names`: None
|
| 404 |
+
- `load_best_model_at_end`: False
|
| 405 |
+
- `ignore_data_skip`: False
|
| 406 |
+
- `fsdp`: []
|
| 407 |
+
- `fsdp_min_num_params`: 0
|
| 408 |
+
- `fsdp_config`: {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}
|
| 409 |
+
- `fsdp_transformer_layer_cls_to_wrap`: None
|
| 410 |
+
- `accelerator_config`: {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}
|
| 411 |
+
- `deepspeed`: None
|
| 412 |
+
- `label_smoothing_factor`: 0.0
|
| 413 |
+
- `optim`: adamw_torch
|
| 414 |
+
- `optim_args`: None
|
| 415 |
+
- `adafactor`: False
|
| 416 |
+
- `group_by_length`: False
|
| 417 |
+
- `length_column_name`: length
|
| 418 |
+
- `ddp_find_unused_parameters`: None
|
| 419 |
+
- `ddp_bucket_cap_mb`: None
|
| 420 |
+
- `ddp_broadcast_buffers`: False
|
| 421 |
+
- `dataloader_pin_memory`: True
|
| 422 |
+
- `dataloader_persistent_workers`: False
|
| 423 |
+
- `skip_memory_metrics`: True
|
| 424 |
+
- `use_legacy_prediction_loop`: False
|
| 425 |
+
- `push_to_hub`: False
|
| 426 |
+
- `resume_from_checkpoint`: None
|
| 427 |
+
- `hub_model_id`: None
|
| 428 |
+
- `hub_strategy`: every_save
|
| 429 |
+
- `hub_private_repo`: None
|
| 430 |
+
- `hub_always_push`: False
|
| 431 |
+
- `gradient_checkpointing`: False
|
| 432 |
+
- `gradient_checkpointing_kwargs`: None
|
| 433 |
+
- `include_inputs_for_metrics`: False
|
| 434 |
+
- `include_for_metrics`: []
|
| 435 |
+
- `eval_do_concat_batches`: True
|
| 436 |
+
- `fp16_backend`: auto
|
| 437 |
+
- `push_to_hub_model_id`: None
|
| 438 |
+
- `push_to_hub_organization`: None
|
| 439 |
+
- `mp_parameters`:
|
| 440 |
+
- `auto_find_batch_size`: False
|
| 441 |
+
- `full_determinism`: False
|
| 442 |
+
- `torchdynamo`: None
|
| 443 |
+
- `ray_scope`: last
|
| 444 |
+
- `ddp_timeout`: 1800
|
| 445 |
+
- `torch_compile`: False
|
| 446 |
+
- `torch_compile_backend`: None
|
| 447 |
+
- `torch_compile_mode`: None
|
| 448 |
+
- `include_tokens_per_second`: False
|
| 449 |
+
- `include_num_input_tokens_seen`: False
|
| 450 |
+
- `neftune_noise_alpha`: None
|
| 451 |
+
- `optim_target_modules`: None
|
| 452 |
+
- `batch_eval_metrics`: False
|
| 453 |
+
- `eval_on_start`: False
|
| 454 |
+
- `use_liger_kernel`: False
|
| 455 |
+
- `eval_use_gather_object`: False
|
| 456 |
+
- `average_tokens_across_devices`: False
|
| 457 |
+
- `prompts`: None
|
| 458 |
+
- `batch_sampler`: batch_sampler
|
| 459 |
+
- `multi_dataset_batch_sampler`: round_robin
|
| 460 |
+
|
| 461 |
+
</details>
|
| 462 |
+
|
| 463 |
+
### Training Logs
|
| 464 |
+
| Epoch | Step | Training Loss |
|
| 465 |
+
|:------:|:----:|:-------------:|
|
| 466 |
+
| 1.4245 | 500 | 0.1336 |
|
| 467 |
+
| 2.8490 | 1000 | 0.0787 |
|
| 468 |
+
|
| 469 |
+
|
| 470 |
+
### Framework Versions
|
| 471 |
+
- Python: 3.12.3
|
| 472 |
+
- Sentence Transformers: 4.1.0
|
| 473 |
+
- Transformers: 4.52.4
|
| 474 |
+
- PyTorch: 2.7.0+cu128
|
| 475 |
+
- Accelerate: 1.7.0
|
| 476 |
+
- Datasets: 3.6.0
|
| 477 |
+
- Tokenizers: 0.21.1
|
| 478 |
+
|
| 479 |
+
## Citation
|
| 480 |
+
|
| 481 |
+
### BibTeX
|
| 482 |
+
|
| 483 |
+
#### Sentence Transformers
|
| 484 |
+
```bibtex
|
| 485 |
+
@inproceedings{reimers-2019-sentence-bert,
|
| 486 |
+
title = "Sentence-BERT: Sentence Embeddings using Siamese BERT-Networks",
|
| 487 |
+
author = "Reimers, Nils and Gurevych, Iryna",
|
| 488 |
+
booktitle = "Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing",
|
| 489 |
+
month = "11",
|
| 490 |
+
year = "2019",
|
| 491 |
+
publisher = "Association for Computational Linguistics",
|
| 492 |
+
url = "https://arxiv.org/abs/1908.10084",
|
| 493 |
+
}
|
| 494 |
+
```
|
| 495 |
+
|
| 496 |
+
<!--
|
| 497 |
+
## Glossary
|
| 498 |
+
|
| 499 |
+
*Clearly define terms in order to be accessible across audiences.*
|
| 500 |
+
-->
|
| 501 |
+
|
| 502 |
+
<!--
|
| 503 |
+
## Model Card Authors
|
| 504 |
+
|
| 505 |
+
*Lists the people who create the model card, providing recognition and accountability for the detailed work that goes into its construction.*
|
| 506 |
+
-->
|
| 507 |
+
|
| 508 |
+
<!--
|
| 509 |
+
## Model Card Contact
|
| 510 |
+
|
| 511 |
+
*Provides a way for people who have updates to the Model Card, suggestions, or questions, to contact the Model Card authors.*
|
| 512 |
+
-->
|
checkpoints/checkpoint-1050/config.json
ADDED
|
@@ -0,0 +1,31 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"architectures": [
|
| 3 |
+
"BertModel"
|
| 4 |
+
],
|
| 5 |
+
"attention_probs_dropout_prob": 0.1,
|
| 6 |
+
"classifier_dropout": null,
|
| 7 |
+
"gradient_checkpointing": false,
|
| 8 |
+
"hidden_act": "gelu",
|
| 9 |
+
"hidden_dropout_prob": 0.1,
|
| 10 |
+
"hidden_size": 768,
|
| 11 |
+
"id2label": {
|
| 12 |
+
"0": "LABEL_0"
|
| 13 |
+
},
|
| 14 |
+
"initializer_range": 0.02,
|
| 15 |
+
"intermediate_size": 3072,
|
| 16 |
+
"label2id": {
|
| 17 |
+
"LABEL_0": 0
|
| 18 |
+
},
|
| 19 |
+
"layer_norm_eps": 1e-12,
|
| 20 |
+
"max_position_embeddings": 512,
|
| 21 |
+
"model_type": "bert",
|
| 22 |
+
"num_attention_heads": 12,
|
| 23 |
+
"num_hidden_layers": 12,
|
| 24 |
+
"pad_token_id": 0,
|
| 25 |
+
"position_embedding_type": "absolute",
|
| 26 |
+
"torch_dtype": "float32",
|
| 27 |
+
"transformers_version": "4.52.4",
|
| 28 |
+
"type_vocab_size": 2,
|
| 29 |
+
"use_cache": true,
|
| 30 |
+
"vocab_size": 30522
|
| 31 |
+
}
|
checkpoints/checkpoint-1050/config_sentence_transformers.json
ADDED
|
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"__version__": {
|
| 3 |
+
"sentence_transformers": "4.1.0",
|
| 4 |
+
"transformers": "4.52.4",
|
| 5 |
+
"pytorch": "2.7.0+cu128"
|
| 6 |
+
},
|
| 7 |
+
"prompts": {},
|
| 8 |
+
"default_prompt_name": null,
|
| 9 |
+
"similarity_fn_name": "cosine"
|
| 10 |
+
}
|
checkpoints/checkpoint-1050/model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e3c22492b93885a269f991e4912889fc64ca6c3858c1c70c987be738dcef7688
|
| 3 |
+
size 437951328
|
checkpoints/checkpoint-1050/modules.json
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"idx": 0,
|
| 4 |
+
"name": "0",
|
| 5 |
+
"path": "",
|
| 6 |
+
"type": "sentence_transformers.models.Transformer"
|
| 7 |
+
},
|
| 8 |
+
{
|
| 9 |
+
"idx": 1,
|
| 10 |
+
"name": "1",
|
| 11 |
+
"path": "1_Pooling",
|
| 12 |
+
"type": "sentence_transformers.models.Pooling"
|
| 13 |
+
},
|
| 14 |
+
{
|
| 15 |
+
"idx": 2,
|
| 16 |
+
"name": "2",
|
| 17 |
+
"path": "2_Normalize",
|
| 18 |
+
"type": "sentence_transformers.models.Normalize"
|
| 19 |
+
}
|
| 20 |
+
]
|
checkpoints/checkpoint-1050/optimizer.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1f0ff831e8ebad83480d98bba5381f4ee4b2f5a4a19885a5ad94be0b4e29c149
|
| 3 |
+
size 871298443
|
checkpoints/checkpoint-1050/rng_state.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:89fa75f44154aa9bc84403650f7166a41d177f71d86d3b4b9da11dd2045ca9f9
|
| 3 |
+
size 14645
|
checkpoints/checkpoint-1050/scheduler.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:356de2ffe1b65399b40bb30d5b2a7127c39f387944414d23149ed66c1ab0c34b
|
| 3 |
+
size 1465
|
checkpoints/checkpoint-1050/sentence_bert_config.json
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"max_seq_length": 512,
|
| 3 |
+
"do_lower_case": true
|
| 4 |
+
}
|
checkpoints/checkpoint-1050/special_tokens_map.json
ADDED
|
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"cls_token": {
|
| 3 |
+
"content": "[CLS]",
|
| 4 |
+
"lstrip": false,
|
| 5 |
+
"normalized": false,
|
| 6 |
+
"rstrip": false,
|
| 7 |
+
"single_word": false
|
| 8 |
+
},
|
| 9 |
+
"mask_token": {
|
| 10 |
+
"content": "[MASK]",
|
| 11 |
+
"lstrip": false,
|
| 12 |
+
"normalized": false,
|
| 13 |
+
"rstrip": false,
|
| 14 |
+
"single_word": false
|
| 15 |
+
},
|
| 16 |
+
"pad_token": {
|
| 17 |
+
"content": "[PAD]",
|
| 18 |
+
"lstrip": false,
|
| 19 |
+
"normalized": false,
|
| 20 |
+
"rstrip": false,
|
| 21 |
+
"single_word": false
|
| 22 |
+
},
|
| 23 |
+
"sep_token": {
|
| 24 |
+
"content": "[SEP]",
|
| 25 |
+
"lstrip": false,
|
| 26 |
+
"normalized": false,
|
| 27 |
+
"rstrip": false,
|
| 28 |
+
"single_word": false
|
| 29 |
+
},
|
| 30 |
+
"unk_token": {
|
| 31 |
+
"content": "[UNK]",
|
| 32 |
+
"lstrip": false,
|
| 33 |
+
"normalized": false,
|
| 34 |
+
"rstrip": false,
|
| 35 |
+
"single_word": false
|
| 36 |
+
}
|
| 37 |
+
}
|
checkpoints/checkpoint-1050/tokenizer.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
checkpoints/checkpoint-1050/tokenizer_config.json
ADDED
|
@@ -0,0 +1,58 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"added_tokens_decoder": {
|
| 3 |
+
"0": {
|
| 4 |
+
"content": "[PAD]",
|
| 5 |
+
"lstrip": false,
|
| 6 |
+
"normalized": false,
|
| 7 |
+
"rstrip": false,
|
| 8 |
+
"single_word": false,
|
| 9 |
+
"special": true
|
| 10 |
+
},
|
| 11 |
+
"100": {
|
| 12 |
+
"content": "[UNK]",
|
| 13 |
+
"lstrip": false,
|
| 14 |
+
"normalized": false,
|
| 15 |
+
"rstrip": false,
|
| 16 |
+
"single_word": false,
|
| 17 |
+
"special": true
|
| 18 |
+
},
|
| 19 |
+
"101": {
|
| 20 |
+
"content": "[CLS]",
|
| 21 |
+
"lstrip": false,
|
| 22 |
+
"normalized": false,
|
| 23 |
+
"rstrip": false,
|
| 24 |
+
"single_word": false,
|
| 25 |
+
"special": true
|
| 26 |
+
},
|
| 27 |
+
"102": {
|
| 28 |
+
"content": "[SEP]",
|
| 29 |
+
"lstrip": false,
|
| 30 |
+
"normalized": false,
|
| 31 |
+
"rstrip": false,
|
| 32 |
+
"single_word": false,
|
| 33 |
+
"special": true
|
| 34 |
+
},
|
| 35 |
+
"103": {
|
| 36 |
+
"content": "[MASK]",
|
| 37 |
+
"lstrip": false,
|
| 38 |
+
"normalized": false,
|
| 39 |
+
"rstrip": false,
|
| 40 |
+
"single_word": false,
|
| 41 |
+
"special": true
|
| 42 |
+
}
|
| 43 |
+
},
|
| 44 |
+
"clean_up_tokenization_spaces": true,
|
| 45 |
+
"cls_token": "[CLS]",
|
| 46 |
+
"do_basic_tokenize": true,
|
| 47 |
+
"do_lower_case": true,
|
| 48 |
+
"extra_special_tokens": {},
|
| 49 |
+
"mask_token": "[MASK]",
|
| 50 |
+
"model_max_length": 512,
|
| 51 |
+
"never_split": null,
|
| 52 |
+
"pad_token": "[PAD]",
|
| 53 |
+
"sep_token": "[SEP]",
|
| 54 |
+
"strip_accents": null,
|
| 55 |
+
"tokenize_chinese_chars": true,
|
| 56 |
+
"tokenizer_class": "BertTokenizer",
|
| 57 |
+
"unk_token": "[UNK]"
|
| 58 |
+
}
|
checkpoints/checkpoint-1050/trainer_state.json
ADDED
|
@@ -0,0 +1,48 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"best_global_step": null,
|
| 3 |
+
"best_metric": null,
|
| 4 |
+
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 2.9914529914529915,
|
| 6 |
+
"eval_steps": 0,
|
| 7 |
+
"global_step": 1050,
|
| 8 |
+
"is_hyper_param_search": false,
|
| 9 |
+
"is_local_process_zero": true,
|
| 10 |
+
"is_world_process_zero": true,
|
| 11 |
+
"log_history": [
|
| 12 |
+
{
|
| 13 |
+
"epoch": 1.4245014245014245,
|
| 14 |
+
"grad_norm": 1.1360502243041992,
|
| 15 |
+
"learning_rate": 1.1673728813559325e-05,
|
| 16 |
+
"loss": 0.1336,
|
| 17 |
+
"step": 500
|
| 18 |
+
},
|
| 19 |
+
{
|
| 20 |
+
"epoch": 2.849002849002849,
|
| 21 |
+
"grad_norm": 1.3151546716690063,
|
| 22 |
+
"learning_rate": 1.0805084745762714e-06,
|
| 23 |
+
"loss": 0.0787,
|
| 24 |
+
"step": 1000
|
| 25 |
+
}
|
| 26 |
+
],
|
| 27 |
+
"logging_steps": 500,
|
| 28 |
+
"max_steps": 1053,
|
| 29 |
+
"num_input_tokens_seen": 0,
|
| 30 |
+
"num_train_epochs": 3,
|
| 31 |
+
"save_steps": 175,
|
| 32 |
+
"stateful_callbacks": {
|
| 33 |
+
"TrainerControl": {
|
| 34 |
+
"args": {
|
| 35 |
+
"should_epoch_stop": false,
|
| 36 |
+
"should_evaluate": false,
|
| 37 |
+
"should_log": false,
|
| 38 |
+
"should_save": true,
|
| 39 |
+
"should_training_stop": false
|
| 40 |
+
},
|
| 41 |
+
"attributes": {}
|
| 42 |
+
}
|
| 43 |
+
},
|
| 44 |
+
"total_flos": 0.0,
|
| 45 |
+
"train_batch_size": 16,
|
| 46 |
+
"trial_name": null,
|
| 47 |
+
"trial_params": null
|
| 48 |
+
}
|
checkpoints/checkpoint-1050/training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:435635c51c00ae7c9634e1f44d69a2daae13b846b1d2e6a26d23d637a11c7e7f
|
| 3 |
+
size 5969
|
checkpoints/checkpoint-1050/vocab.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
checkpoints/checkpoint-1053/1_Pooling/config.json
ADDED
|
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"word_embedding_dimension": 768,
|
| 3 |
+
"pooling_mode_cls_token": true,
|
| 4 |
+
"pooling_mode_mean_tokens": false,
|
| 5 |
+
"pooling_mode_max_tokens": false,
|
| 6 |
+
"pooling_mode_mean_sqrt_len_tokens": false,
|
| 7 |
+
"pooling_mode_weightedmean_tokens": false,
|
| 8 |
+
"pooling_mode_lasttoken": false,
|
| 9 |
+
"include_prompt": true
|
| 10 |
+
}
|
checkpoints/checkpoint-1053/README.md
ADDED
|
@@ -0,0 +1,512 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
---
|
| 2 |
+
tags:
|
| 3 |
+
- sentence-transformers
|
| 4 |
+
- sentence-similarity
|
| 5 |
+
- feature-extraction
|
| 6 |
+
- generated_from_trainer
|
| 7 |
+
- dataset_size:5604
|
| 8 |
+
- loss:CosineSimilarityLoss
|
| 9 |
+
base_model: BAAI/bge-base-en-v1.5
|
| 10 |
+
widget:
|
| 11 |
+
- source_sentence: what are the powers of the virginia executive branch
|
| 12 |
+
sentences:
|
| 13 |
+
- The 49ers won five Super Bowl championships between 1981 and 1994. Four of those
|
| 14 |
+
came in the 1980s, and were led by Hall of Famers Joe Montana, Jerry Rice, Ronnie
|
| 15 |
+
Lott, Steve Young, Charles Haley, Fred Dean, and coaches Bill Walsh and George
|
| 16 |
+
Seifert. They have been division champions 22 times between 1970 and 2023, making
|
| 17 |
+
them one of the most successful teams in NFL history. The 49ers sit alone in NFL
|
| 18 |
+
history for most playoff wins (38), having been in the league playoffs 30 times
|
| 19 |
+
(29 times in the NFL and one time in the AAFC), and have also played in the most
|
| 20 |
+
NFC Championship games (19), hosting 11 of them, also an NFC record. The team
|
| 21 |
+
has set numerous notable NFL records, including most consecutive away games won
|
| 22 |
+
(18), most consecutive seasons leading the league in scoring (4), most consecutive
|
| 23 |
+
games scored (420 games from 1977 to 2004), most field goals in a season (44),
|
| 24 |
+
most games won in a season (18), and most touchdowns (8) and points scored (55)
|
| 25 |
+
in a Super Bowl. According to Forbes, the 49ers are the sixth most valuable team
|
| 26 |
+
in the NFL, valued at $6.8 billion as of August 2024. In June 2023, the enterprise
|
| 27 |
+
branch of the 49ers completed the acquisition of English soccer club Leeds United
|
| 28 |
+
and in May 2025, it acquired 51% of Scottish soccer club Rangers F.C.
|
| 29 |
+
- In 2008, Triarc purchased Wendy's, and changed its name to Wendy's/Arby's Group,
|
| 30 |
+
to reflect their core businesses. In January 2011, it was announced that Wendy's/Arby's
|
| 31 |
+
Group were looking into selling the Arby's side of the business to focus on the
|
| 32 |
+
Wendy's brand. It was officially announced the companies would split on January
|
| 33 |
+
21, 2011. In 2009, the Wendy's/Arby's Group signed a franchise deal with the Al
|
| 34 |
+
Jammaz Group of Saudi Arabia to open dual-branded Wendy's/Arby's through the Middle
|
| 35 |
+
East with the first location opening in Dubai in the United Arab Emirates in May
|
| 36 |
+
2010. The Wendy's/Arby's Group also signed a similar franchise deal in June 2010
|
| 37 |
+
with Tab Gida Sanayi ve Ticaret to open dual-branded restaurants in Turkey. After
|
| 38 |
+
the split, the former Wendy's/Arby's Group became The Wendy's Company.
|
| 39 |
+
- 'Executive: The Chief Executive is responsible for enforcing regional law, can
|
| 40 |
+
force reconsideration of legislation, and appoints Executive Council members and
|
| 41 |
+
principal officials. Acting with the Executive Council, the Chief Executive-in-Council
|
| 42 |
+
can propose new bills, issue subordinate legislation, and has authority to dissolve
|
| 43 |
+
the legislature. In states of emergency or public danger, the Chief Executive-in-Council
|
| 44 |
+
is further empowered to enact any regulation necessary to restore public order.
|
| 45 |
+
Legislature: The unicameral Legislative Council enacts regional law, approves
|
| 46 |
+
budgets, and has the power to impeach a sitting chief executive. Judiciary: The
|
| 47 |
+
Hong Kong Court of Final Appeal and lower courts interpret laws and overturn those
|
| 48 |
+
inconsistent with the Basic Law. Judges are appointed by the chief executive on
|
| 49 |
+
the advice of a recommendation commission. The chief executive is the head of
|
| 50 |
+
government and serves for a maximum of two five-year terms. The State Council
|
| 51 |
+
(led by the Premier of China) appoints the chief executive after nomination by
|
| 52 |
+
the Election Committee, which is composed of 1500 business, community, and government
|
| 53 |
+
leaders.'
|
| 54 |
+
- source_sentence: how many chromosomes does a human diploid cell have
|
| 55 |
+
sentences:
|
| 56 |
+
- The Peace of Cateau-Cambrésis in 1559 concluded the war with France, leaving Spain
|
| 57 |
+
at a considerable advantage. However, the government was still mired in debt,
|
| 58 |
+
and declared bankruptcy that year. Most of the government's revenues came from
|
| 59 |
+
taxes and excise duties, not imported silver and other goods. The Ottoman Empire
|
| 60 |
+
had long menaced the fringes of the Habsburg dominions in Austria and northwest
|
| 61 |
+
Africa. In response Ferdinand and Isabella had sent expeditions to North Africa,
|
| 62 |
+
capturing Melilla in 1497 and Oran in 1509. Charles had preferred to combat the
|
| 63 |
+
Ottomans through a considerably more maritime strategy, hampering Ottoman landings
|
| 64 |
+
on the Venetian territories in the Eastern Mediterranean. Only in response to
|
| 65 |
+
raids on the eastern coast of Spain did Charles personally lead attacks against
|
| 66 |
+
holdings in North Africa (1535). In 1560, the Ottomans battled the Spanish Navy
|
| 67 |
+
off the coast of Tunisia, but in 1565 Ottoman troops landing on the strategically
|
| 68 |
+
vital island of Malta, defended by the Knights of St. John, were defeated. The
|
| 69 |
+
death of Suleiman the Magnificent the following year and his succession by Selim
|
| 70 |
+
II emboldened Philip, who resolved to carry the war to the Ottoman homelands.
|
| 71 |
+
In 1571, a mixed naval expedition of Spanish, Venetian, and Papal ships led by
|
| 72 |
+
Charles' illegitimate son Don John of Austria annihilated the Ottoman fleet at
|
| 73 |
+
the Battle of Lepanto, in the largest naval battle fought in European waters since
|
| 74 |
+
Actium in 31 BC. The fleet included Miguel de Cervantes, future author of the
|
| 75 |
+
historic Spanish novel Don Quixote
|
| 76 |
+
- 'The 1930s were the team''s first golden era, when they improved their game through
|
| 77 |
+
play with more experienced teams. The Combinado del Pacífico (a squad composed
|
| 78 |
+
of Chilean and Peruvian footballers) toured Europe from 1933 to 1934. Starting
|
| 79 |
+
with Ciclista Lima in 1926, Peru''s football clubs toured Latin America with much
|
| 80 |
+
success. During one of these tours—Alianza Lima''s undefeated journey through
|
| 81 |
+
Chile in 1935—emerged the Rodillo Negro ("Black Roller"), a skillful group led
|
| 82 |
+
by forwards Alejandro Villanueva, Teodoro Fernández and goalkeeper Juan Valdivieso.
|
| 83 |
+
Sports historian Richard Witzig described these three as "a soccer triumvirate
|
| 84 |
+
unsurpassed in the world at that time", citing their combined innovation and effectiveness
|
| 85 |
+
at both ends of the field. Peru and the Rodillo Negro impressed at the 1936 Summer
|
| 86 |
+
Olympics, won the inaugural Bolivarian Games in 1938, and finished the decade
|
| 87 |
+
as South American champions. Historian David Goldblatt assessed the decline of
|
| 88 |
+
its previous success: "despite all the apparent preconditions for footballing
|
| 89 |
+
growth and success, Peruvian football disappeared". He attributes this sudden
|
| 90 |
+
decline to Peruvian authorities'' repression of "social, sporting and political
|
| 91 |
+
organisations among the urban and rural poor" during the 1940s and 1950s. Nevertheless,
|
| 92 |
+
Peru performed creditably at the South American Championships, placing third in
|
| 93 |
+
Brazil 1949 and Chile 1955, and missed qualification for the Sweden 1958 World
|
| 94 |
+
Cup finals, over two legs to eventual champions Brazil.'
|
| 95 |
+
- In 1939, at the start of World War II, Poland was partitioned between Nazi Germany
|
| 96 |
+
and the Soviet Union (see Molotov–Ribbentrop Pact). One-fifth of the Polish population
|
| 97 |
+
perished during World War II; the 3,000,000 Polish Jews murdered in the Holocaust,
|
| 98 |
+
who constituted 90% of Polish Jewry, made up half of all Poles killed during the
|
| 99 |
+
war. While the Holocaust occurred largely in German-occupied Poland, it was orchestrated
|
| 100 |
+
and perpetrated by the Nazis. Polish attitudes to the Holocaust varied widely,
|
| 101 |
+
from actively risking death in order to save Jewish lives, and passive refusal
|
| 102 |
+
to inform on them, to indifference, blackmail, and in extreme cases, committing
|
| 103 |
+
premeditated murders such as in the Jedwabne pogrom. Collaboration by non-Jewish
|
| 104 |
+
Polish citizens in the Holocaust was sporadic, but incidents of hostility against
|
| 105 |
+
Jews are well documented and have been a subject of renewed scholarly interest
|
| 106 |
+
during the 21st century.
|
| 107 |
+
- source_sentence: what is the difference between ice brent crude and wti crude
|
| 108 |
+
sentences:
|
| 109 |
+
- ==== Spring and Autumn period (722–476 BC) ====
|
| 110 |
+
- SpaceX has also bought and is modifying several residential properties in Boca
|
| 111 |
+
Chica Village, but apparently planning to leave them in residential use, about
|
| 112 |
+
2 miles (3.2 km) west of the launch site. In September 2019, SpaceX extended an
|
| 113 |
+
offer to buy each of the houses in Boca Chica Village for three times the fair
|
| 114 |
+
market value along with an offer of VIP invitations to future launch events. The
|
| 115 |
+
3x offer was said to be "non-negotiable." Homeowners were given two weeks for
|
| 116 |
+
this particular offer to remain valid. In January 2024, the Texas Parks and Wildlife
|
| 117 |
+
Department announced a proposal to transfer 43 acres of Boca Chica State Park
|
| 118 |
+
lands to SpaceX, in exchange for 477 new acres to be added to the Laguna Atascosa
|
| 119 |
+
National Wildlife Refuge.
|
| 120 |
+
- However, exclusive US control of this resource was eventually challenged, and
|
| 121 |
+
the Bering Sea Controversy resulted when the United States seized over 150 sealing
|
| 122 |
+
ships flying the British flag, based out of the coast of British Columbia. The
|
| 123 |
+
conflict between the United States and Britain was resolved by an arbitration
|
| 124 |
+
tribunal in 1893. The waters of the Bering Sea were deemed to be international
|
| 125 |
+
waters, contrary to the US contention that they were an internal sea. The US was
|
| 126 |
+
required to make a payment to Britain, and both nations were required to follow
|
| 127 |
+
regulations developed to preserve the resource.
|
| 128 |
+
- source_sentence: why is there a citgo sign in boston
|
| 129 |
+
sentences:
|
| 130 |
+
- Tucker appeared on Terri Clark's 2012 album Classic in a remake duet of her first
|
| 131 |
+
single "Delta Dawn". In June 2017, Tucker was featured in Rolling Stone as one
|
| 132 |
+
of the 100 Greatest Country Artists of All Time. After the death of former flame
|
| 133 |
+
Glen Campbell on August 8, 2017, Tucker released her first single since 2009,
|
| 134 |
+
"Forever Loving You", a song co-penned by Tennessee State Senator Rusty Crowe.
|
| 135 |
+
The song's release the following day, on the eve of Campbell's funeral, drew ire
|
| 136 |
+
and criticism being exploitative. Tucker claimed that a portion of the proceeds
|
| 137 |
+
will benefit the Alzheimer's Foundation of America, but the foundation stated
|
| 138 |
+
it was not involved in the promotion and has not received any funds. Tucker released
|
| 139 |
+
While I'm Livin', her first collection of original material since 2002's Tanya,
|
| 140 |
+
in 2019 via Fantasy Records. It was produced by Shooter Jennings and Brandi Carlile,
|
| 141 |
+
with Carlile brought onto the project after initially being approached for songs
|
| 142 |
+
by Jennings but after having professed such an admiration of Tucker and her work,
|
| 143 |
+
Jennings felt it necessary for her to co-produce the record alongside him. Tucker
|
| 144 |
+
performed "Bring My Flowers Now" at Loretta Lynn's all-star 87th birthday concert
|
| 145 |
+
at Nashville's Bridgestone Arena with Carlile playing piano. The album's first
|
| 146 |
+
single, "Hard Luck", was released on June 28, along with its accompanying music
|
| 147 |
+
video.
|
| 148 |
+
- ==== Golf ==== Numerous golf courses can be found in the city, with the most famous
|
| 149 |
+
being Bay Hill Club and Lodge, home to the Arnold Palmer Invitational. == Culture
|
| 150 |
+
==
|
| 151 |
+
- The massive Islamic invasions of the mid-7th century began a long struggle between
|
| 152 |
+
Christianity and Islam throughout the Mediterranean Basin. The Byzantine Empire
|
| 153 |
+
soon lost the lands of the eastern patriarchates of Jerusalem, Alexandria and
|
| 154 |
+
Antioch and was reduced to that of Constantinople, the empire's capital. As a
|
| 155 |
+
result of Islamic domination of the Mediterranean, the Frankish state, centred
|
| 156 |
+
away from that sea, was able to evolve as the dominant power that shaped the Western
|
| 157 |
+
Europe of the Middle Ages. The battles of Toulouse and Tours halted the Islamic
|
| 158 |
+
advance in the West and the failed siege of Constantinople halted it in the East.
|
| 159 |
+
Two or three decades later, in 751, the Byzantine Empire lost to the Lombards
|
| 160 |
+
the city of Ravenna from which it governed the small fragments of Italy, including
|
| 161 |
+
Rome, that acknowledged its sovereignty. The fall of Ravenna meant that confirmation
|
| 162 |
+
by a no longer existent exarch was not asked for during the election in 752 of
|
| 163 |
+
Pope Stephen II, and that the papacy was forced to look elsewhere for a civil
|
| 164 |
+
power to protect it. In 754, at the urgent request of Pope Stephen, the Frankish
|
| 165 |
+
king Pepin the Short conquered the Lombards. He then gifted the lands of the former
|
| 166 |
+
exarchate to the pope, initiating the Papal States. In the 860s, Rome and the
|
| 167 |
+
Byzantine East were in conflict during the Photian schism, when Photius criticized
|
| 168 |
+
the Latin west for adding of the filioque clause, after being excommunicated by
|
| 169 |
+
Nicholas I. Though the schism was reconciled, unresolved issues would lead to
|
| 170 |
+
further division.
|
| 171 |
+
- source_sentence: who organized the native resistance to the british
|
| 172 |
+
sentences:
|
| 173 |
+
- === Engines === == Fifth generation (WL; 2021) ==
|
| 174 |
+
- '=== Unitarism === All states are unitary states, not federations or aggregates
|
| 175 |
+
of local governments. Local governments within them are created by and exist by
|
| 176 |
+
virtue of state law, and local governments within each state are subject to the
|
| 177 |
+
central authority of that particular state. State governments commonly delegate
|
| 178 |
+
some authority to local units and channel policy decisions down to them for implementation.
|
| 179 |
+
In a few states, local units of government are permitted a degree of home rule
|
| 180 |
+
over various matters. The prevailing legal theory of state preeminence over local
|
| 181 |
+
governments, referred to as Dillon''s Rule, holds that, A municipal corporation
|
| 182 |
+
possesses and can exercise the following powers and no others: First, those granted
|
| 183 |
+
in express words; second, those necessarily implied or necessarily incident to
|
| 184 |
+
the powers expressly granted; third, those absolutely essential to the declared
|
| 185 |
+
objects and purposes of the corporation—not simply convenient but indispensable;
|
| 186 |
+
fourth, any fair doubt as to the existence of power is resolved by the courts
|
| 187 |
+
against the corporation—against the existence of the powers. Each state defines
|
| 188 |
+
for itself what powers it will allow local governments. Generally, four categories
|
| 189 |
+
of power may be given to local jurisdictions: Structural – power to choose the
|
| 190 |
+
form of government, charter and enact charter revisions, Functional – power to
|
| 191 |
+
exercise local self-government in a broad or limited manner, Fiscal – authority
|
| 192 |
+
to determine revenue sources, set tax rates, borrow funds and other related financial
|
| 193 |
+
activities, Personnel – authority to set employment rules, remuneration rates,
|
| 194 |
+
employment conditions and collective bargaining. == Relationships =='
|
| 195 |
+
- Throughout the war, the British deported the Acadians to the Thirteen Colonies
|
| 196 |
+
and Europe, which the Acadian militias resisted with assistance from Mi'kmaq and
|
| 197 |
+
Malisteet forces. The Great Upheaval continued from 1755 to 1764. In 1756, a large
|
| 198 |
+
force of French, Canadians, and their Native American allies led by the Marquis
|
| 199 |
+
de Montcalm launched an attack against the key British post at Fort Oswego on
|
| 200 |
+
Lake Ontario from Fort Frontenac and forced the garrison to surrender. The following
|
| 201 |
+
year Montcalm with a huge force of 7,200 French and Canadian troops and 2,400
|
| 202 |
+
Native Americans laid siege to Fort William Henry on the southern shores of Lake
|
| 203 |
+
George, and after three weeks of fighting the British commander Monroe surrendered.
|
| 204 |
+
Montcalm gave him honorable terms to return to England and not to fight for 18
|
| 205 |
+
months. And yet, when the British force with civilians was three miles from the
|
| 206 |
+
fort, the Native American allies massacred about 1,100 of the 1,500 strong force.
|
| 207 |
+
pipeline_tag: sentence-similarity
|
| 208 |
+
library_name: sentence-transformers
|
| 209 |
+
---
|
| 210 |
+
|
| 211 |
+
# SentenceTransformer based on BAAI/bge-base-en-v1.5
|
| 212 |
+
|
| 213 |
+
This is a [sentence-transformers](https://www.SBERT.net) model finetuned from [BAAI/bge-base-en-v1.5](https://huggingface.co/BAAI/bge-base-en-v1.5). It maps sentences & paragraphs to a 768-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more.
|
| 214 |
+
|
| 215 |
+
## Model Details
|
| 216 |
+
|
| 217 |
+
### Model Description
|
| 218 |
+
- **Model Type:** Sentence Transformer
|
| 219 |
+
- **Base model:** [BAAI/bge-base-en-v1.5](https://huggingface.co/BAAI/bge-base-en-v1.5) <!-- at revision a5beb1e3e68b9ab74eb54cfd186867f64f240e1a -->
|
| 220 |
+
- **Maximum Sequence Length:** 512 tokens
|
| 221 |
+
- **Output Dimensionality:** 768 dimensions
|
| 222 |
+
- **Similarity Function:** Cosine Similarity
|
| 223 |
+
<!-- - **Training Dataset:** Unknown -->
|
| 224 |
+
<!-- - **Language:** Unknown -->
|
| 225 |
+
<!-- - **License:** Unknown -->
|
| 226 |
+
|
| 227 |
+
### Model Sources
|
| 228 |
+
|
| 229 |
+
- **Documentation:** [Sentence Transformers Documentation](https://sbert.net)
|
| 230 |
+
- **Repository:** [Sentence Transformers on GitHub](https://github.com/UKPLab/sentence-transformers)
|
| 231 |
+
- **Hugging Face:** [Sentence Transformers on Hugging Face](https://huggingface.co/models?library=sentence-transformers)
|
| 232 |
+
|
| 233 |
+
### Full Model Architecture
|
| 234 |
+
|
| 235 |
+
```
|
| 236 |
+
SentenceTransformer(
|
| 237 |
+
(0): Transformer({'max_seq_length': 512, 'do_lower_case': True}) with Transformer model: BertModel
|
| 238 |
+
(1): Pooling({'word_embedding_dimension': 768, 'pooling_mode_cls_token': True, 'pooling_mode_mean_tokens': False, 'pooling_mode_max_tokens': False, 'pooling_mode_mean_sqrt_len_tokens': False, 'pooling_mode_weightedmean_tokens': False, 'pooling_mode_lasttoken': False, 'include_prompt': True})
|
| 239 |
+
(2): Normalize()
|
| 240 |
+
)
|
| 241 |
+
```
|
| 242 |
+
|
| 243 |
+
## Usage
|
| 244 |
+
|
| 245 |
+
### Direct Usage (Sentence Transformers)
|
| 246 |
+
|
| 247 |
+
First install the Sentence Transformers library:
|
| 248 |
+
|
| 249 |
+
```bash
|
| 250 |
+
pip install -U sentence-transformers
|
| 251 |
+
```
|
| 252 |
+
|
| 253 |
+
Then you can load this model and run inference.
|
| 254 |
+
```python
|
| 255 |
+
from sentence_transformers import SentenceTransformer
|
| 256 |
+
|
| 257 |
+
# Download from the 🤗 Hub
|
| 258 |
+
model = SentenceTransformer("sentence_transformers_model_id")
|
| 259 |
+
# Run inference
|
| 260 |
+
sentences = [
|
| 261 |
+
'who organized the native resistance to the british',
|
| 262 |
+
"Throughout the war, the British deported the Acadians to the Thirteen Colonies and Europe, which the Acadian militias resisted with assistance from Mi'kmaq and Malisteet forces. The Great Upheaval continued from 1755 to 1764. In 1756, a large force of French, Canadians, and their Native American allies led by the Marquis de Montcalm launched an attack against the key British post at Fort Oswego on Lake Ontario from Fort Frontenac and forced the garrison to surrender. The following year Montcalm with a huge force of 7,200 French and Canadian troops and 2,400 Native Americans laid siege to Fort William Henry on the southern shores of Lake George, and after three weeks of fighting the British commander Monroe surrendered. Montcalm gave him honorable terms to return to England and not to fight for 18 months. And yet, when the British force with civilians was three miles from the fort, the Native American allies massacred about 1,100 of the 1,500 strong force.",
|
| 263 |
+
"=== Unitarism === All states are unitary states, not federations or aggregates of local governments. Local governments within them are created by and exist by virtue of state law, and local governments within each state are subject to the central authority of that particular state. State governments commonly delegate some authority to local units and channel policy decisions down to them for implementation. In a few states, local units of government are permitted a degree of home rule over various matters. The prevailing legal theory of state preeminence over local governments, referred to as Dillon's Rule, holds that, A municipal corporation possesses and can exercise the following powers and no others: First, those granted in express words; second, those necessarily implied or necessarily incident to the powers expressly granted; third, those absolutely essential to the declared objects and purposes of the corporation—not simply convenient but indispensable; fourth, any fair doubt as to the existence of power is resolved by the courts against the corporation—against the existence of the powers. Each state defines for itself what powers it will allow local governments. Generally, four categories of power may be given to local jurisdictions: Structural – power to choose the form of government, charter and enact charter revisions, Functional – power to exercise local self-government in a broad or limited manner, Fiscal – authority to determine revenue sources, set tax rates, borrow funds and other related financial activities, Personnel – authority to set employment rules, remuneration rates, employment conditions and collective bargaining. == Relationships ==",
|
| 264 |
+
]
|
| 265 |
+
embeddings = model.encode(sentences)
|
| 266 |
+
print(embeddings.shape)
|
| 267 |
+
# [3, 768]
|
| 268 |
+
|
| 269 |
+
# Get the similarity scores for the embeddings
|
| 270 |
+
similarities = model.similarity(embeddings, embeddings)
|
| 271 |
+
print(similarities.shape)
|
| 272 |
+
# [3, 3]
|
| 273 |
+
```
|
| 274 |
+
|
| 275 |
+
<!--
|
| 276 |
+
### Direct Usage (Transformers)
|
| 277 |
+
|
| 278 |
+
<details><summary>Click to see the direct usage in Transformers</summary>
|
| 279 |
+
|
| 280 |
+
</details>
|
| 281 |
+
-->
|
| 282 |
+
|
| 283 |
+
<!--
|
| 284 |
+
### Downstream Usage (Sentence Transformers)
|
| 285 |
+
|
| 286 |
+
You can fine-tune this model on your own dataset.
|
| 287 |
+
|
| 288 |
+
<details><summary>Click to expand</summary>
|
| 289 |
+
|
| 290 |
+
</details>
|
| 291 |
+
-->
|
| 292 |
+
|
| 293 |
+
<!--
|
| 294 |
+
### Out-of-Scope Use
|
| 295 |
+
|
| 296 |
+
*List how the model may foreseeably be misused and address what users ought not to do with the model.*
|
| 297 |
+
-->
|
| 298 |
+
|
| 299 |
+
<!--
|
| 300 |
+
## Bias, Risks and Limitations
|
| 301 |
+
|
| 302 |
+
*What are the known or foreseeable issues stemming from this model? You could also flag here known failure cases or weaknesses of the model.*
|
| 303 |
+
-->
|
| 304 |
+
|
| 305 |
+
<!--
|
| 306 |
+
### Recommendations
|
| 307 |
+
|
| 308 |
+
*What are recommendations with respect to the foreseeable issues? For example, filtering explicit content.*
|
| 309 |
+
-->
|
| 310 |
+
|
| 311 |
+
## Training Details
|
| 312 |
+
|
| 313 |
+
### Training Dataset
|
| 314 |
+
|
| 315 |
+
#### Unnamed Dataset
|
| 316 |
+
|
| 317 |
+
* Size: 5,604 training samples
|
| 318 |
+
* Columns: <code>sentence_0</code>, <code>sentence_1</code>, and <code>label</code>
|
| 319 |
+
* Approximate statistics based on the first 1000 samples:
|
| 320 |
+
| | sentence_0 | sentence_1 | label |
|
| 321 |
+
|:--------|:-----------------------------------------------------------------------------------|:------------------------------------------------------------------------------------|:---------------------------------------------------------------|
|
| 322 |
+
| type | string | string | float |
|
| 323 |
+
| details | <ul><li>min: 10 tokens</li><li>mean: 11.84 tokens</li><li>max: 25 tokens</li></ul> | <ul><li>min: 8 tokens</li><li>mean: 218.19 tokens</li><li>max: 322 tokens</li></ul> | <ul><li>min: 0.0</li><li>mean: 0.37</li><li>max: 1.0</li></ul> |
|
| 324 |
+
* Samples:
|
| 325 |
+
| sentence_0 | sentence_1 | label |
|
| 326 |
+
|:-----------------------------------------------------------------------------------------------------------|:---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|:-----------------|
|
| 327 |
+
| <code>who played guitar solo on reeling in the years</code> | <code>Eric Patrick Clapton (born 30 March 1945) is an English rock and blues guitarist, singer, and songwriter. He is regarded as one of the most successful and influential guitarists in rock music. Clapton ranked second in Rolling Stone's list of the "100 Greatest Guitarists of All Time" and fourth in Gibson's "Top 50 Guitarists of All Time". He was named number five in Time magazine's list of "The 10 Best Electric Guitar Players" in 2009. After playing in a number of different local bands, Clapton joined the Yardbirds from 1963 to 1965, and John Mayall & the Bluesbreakers from 1965 to 1966. After leaving Mayall, he formed the power trio Cream with drummer Ginger Baker and bassist/vocalist Jack Bruce, in which Clapton played sustained blues improvisations and "arty, blues-based psychedelic pop". After four successful albums, Cream broke up in November 1968. Clapton then formed the blues rock band Blind Faith with Baker, Steve Winwood, and Ric Grech, recording one album and performing on one...</code> | <code>1.0</code> |
|
| 328 |
+
| <code>how a population of wolves may have undergone speciation to form the first population of dogs</code> | <code>Geological evidence suggests that approximately 3 million years ago, South America became connected to North America when the Bolivar Trough marine barrier disappeared and the Panamanian land bridge formed. The joining of these two land masses led to the Great American Interchange, in which biota from both continents expanded their ranges. The first species known to have made the northward migration was Pliometanastes, a fossil ground sloth roughly the size of a modern black bear. Migrations to the Southern Hemisphere were undertaken by several North American mammalian carnivores. Fewer species migrated in the opposite direction from south to north. The result of the expansion of a North American fauna was a mass extinction in which hundreds of species disappeared in a relatively short time. About 60% of present-day South American mammals have evolved from North American species. Some South American species were able to adapt and spread into North America. Apart from Pliometanastes, du...</code> | <code>1.0</code> |
|
| 329 |
+
| <code>who is credited with promoting the use of factor analysis and why</code> | <code>The enemies of President Davis proposed that the Confederacy "died of Davis". He was unfavorably compared to George Washington by critics such as Edward Alfred Pollard, editor of the most influential newspaper in the Confederacy, the Daily Richmond Examiner. Beyond the early honeymoon period, Davis was never popular. Ellis Merton Coulter, viewed by historians as a Confederate apologist, argues that Davis was unable to mobilize Confederate nationalism in support of his government effectively, and especially failed to appeal to the small farmers who made up the bulk of the population. Davis failed to build a network of supporters who would speak up when he came under criticism, and he repeatedly alienated governors and other state-based leaders by demanding centralized control of the war effort.</code> | <code>0.0</code> |
|
| 330 |
+
* Loss: [<code>CosineSimilarityLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#cosinesimilarityloss) with these parameters:
|
| 331 |
+
```json
|
| 332 |
+
{
|
| 333 |
+
"loss_fct": "torch.nn.modules.loss.MSELoss"
|
| 334 |
+
}
|
| 335 |
+
```
|
| 336 |
+
|
| 337 |
+
### Training Hyperparameters
|
| 338 |
+
#### Non-Default Hyperparameters
|
| 339 |
+
|
| 340 |
+
- `per_device_train_batch_size`: 16
|
| 341 |
+
- `per_device_eval_batch_size`: 16
|
| 342 |
+
- `multi_dataset_batch_sampler`: round_robin
|
| 343 |
+
|
| 344 |
+
#### All Hyperparameters
|
| 345 |
+
<details><summary>Click to expand</summary>
|
| 346 |
+
|
| 347 |
+
- `overwrite_output_dir`: False
|
| 348 |
+
- `do_predict`: False
|
| 349 |
+
- `eval_strategy`: no
|
| 350 |
+
- `prediction_loss_only`: True
|
| 351 |
+
- `per_device_train_batch_size`: 16
|
| 352 |
+
- `per_device_eval_batch_size`: 16
|
| 353 |
+
- `per_gpu_train_batch_size`: None
|
| 354 |
+
- `per_gpu_eval_batch_size`: None
|
| 355 |
+
- `gradient_accumulation_steps`: 1
|
| 356 |
+
- `eval_accumulation_steps`: None
|
| 357 |
+
- `torch_empty_cache_steps`: None
|
| 358 |
+
- `learning_rate`: 5e-05
|
| 359 |
+
- `weight_decay`: 0.0
|
| 360 |
+
- `adam_beta1`: 0.9
|
| 361 |
+
- `adam_beta2`: 0.999
|
| 362 |
+
- `adam_epsilon`: 1e-08
|
| 363 |
+
- `max_grad_norm`: 1
|
| 364 |
+
- `num_train_epochs`: 3
|
| 365 |
+
- `max_steps`: -1
|
| 366 |
+
- `lr_scheduler_type`: linear
|
| 367 |
+
- `lr_scheduler_kwargs`: {}
|
| 368 |
+
- `warmup_ratio`: 0.0
|
| 369 |
+
- `warmup_steps`: 0
|
| 370 |
+
- `log_level`: passive
|
| 371 |
+
- `log_level_replica`: warning
|
| 372 |
+
- `log_on_each_node`: True
|
| 373 |
+
- `logging_nan_inf_filter`: True
|
| 374 |
+
- `save_safetensors`: True
|
| 375 |
+
- `save_on_each_node`: False
|
| 376 |
+
- `save_only_model`: False
|
| 377 |
+
- `restore_callback_states_from_checkpoint`: False
|
| 378 |
+
- `no_cuda`: False
|
| 379 |
+
- `use_cpu`: False
|
| 380 |
+
- `use_mps_device`: False
|
| 381 |
+
- `seed`: 42
|
| 382 |
+
- `data_seed`: None
|
| 383 |
+
- `jit_mode_eval`: False
|
| 384 |
+
- `use_ipex`: False
|
| 385 |
+
- `bf16`: False
|
| 386 |
+
- `fp16`: False
|
| 387 |
+
- `fp16_opt_level`: O1
|
| 388 |
+
- `half_precision_backend`: auto
|
| 389 |
+
- `bf16_full_eval`: False
|
| 390 |
+
- `fp16_full_eval`: False
|
| 391 |
+
- `tf32`: None
|
| 392 |
+
- `local_rank`: 0
|
| 393 |
+
- `ddp_backend`: None
|
| 394 |
+
- `tpu_num_cores`: None
|
| 395 |
+
- `tpu_metrics_debug`: False
|
| 396 |
+
- `debug`: []
|
| 397 |
+
- `dataloader_drop_last`: False
|
| 398 |
+
- `dataloader_num_workers`: 0
|
| 399 |
+
- `dataloader_prefetch_factor`: None
|
| 400 |
+
- `past_index`: -1
|
| 401 |
+
- `disable_tqdm`: False
|
| 402 |
+
- `remove_unused_columns`: True
|
| 403 |
+
- `label_names`: None
|
| 404 |
+
- `load_best_model_at_end`: False
|
| 405 |
+
- `ignore_data_skip`: False
|
| 406 |
+
- `fsdp`: []
|
| 407 |
+
- `fsdp_min_num_params`: 0
|
| 408 |
+
- `fsdp_config`: {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}
|
| 409 |
+
- `fsdp_transformer_layer_cls_to_wrap`: None
|
| 410 |
+
- `accelerator_config`: {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}
|
| 411 |
+
- `deepspeed`: None
|
| 412 |
+
- `label_smoothing_factor`: 0.0
|
| 413 |
+
- `optim`: adamw_torch
|
| 414 |
+
- `optim_args`: None
|
| 415 |
+
- `adafactor`: False
|
| 416 |
+
- `group_by_length`: False
|
| 417 |
+
- `length_column_name`: length
|
| 418 |
+
- `ddp_find_unused_parameters`: None
|
| 419 |
+
- `ddp_bucket_cap_mb`: None
|
| 420 |
+
- `ddp_broadcast_buffers`: False
|
| 421 |
+
- `dataloader_pin_memory`: True
|
| 422 |
+
- `dataloader_persistent_workers`: False
|
| 423 |
+
- `skip_memory_metrics`: True
|
| 424 |
+
- `use_legacy_prediction_loop`: False
|
| 425 |
+
- `push_to_hub`: False
|
| 426 |
+
- `resume_from_checkpoint`: None
|
| 427 |
+
- `hub_model_id`: None
|
| 428 |
+
- `hub_strategy`: every_save
|
| 429 |
+
- `hub_private_repo`: None
|
| 430 |
+
- `hub_always_push`: False
|
| 431 |
+
- `gradient_checkpointing`: False
|
| 432 |
+
- `gradient_checkpointing_kwargs`: None
|
| 433 |
+
- `include_inputs_for_metrics`: False
|
| 434 |
+
- `include_for_metrics`: []
|
| 435 |
+
- `eval_do_concat_batches`: True
|
| 436 |
+
- `fp16_backend`: auto
|
| 437 |
+
- `push_to_hub_model_id`: None
|
| 438 |
+
- `push_to_hub_organization`: None
|
| 439 |
+
- `mp_parameters`:
|
| 440 |
+
- `auto_find_batch_size`: False
|
| 441 |
+
- `full_determinism`: False
|
| 442 |
+
- `torchdynamo`: None
|
| 443 |
+
- `ray_scope`: last
|
| 444 |
+
- `ddp_timeout`: 1800
|
| 445 |
+
- `torch_compile`: False
|
| 446 |
+
- `torch_compile_backend`: None
|
| 447 |
+
- `torch_compile_mode`: None
|
| 448 |
+
- `include_tokens_per_second`: False
|
| 449 |
+
- `include_num_input_tokens_seen`: False
|
| 450 |
+
- `neftune_noise_alpha`: None
|
| 451 |
+
- `optim_target_modules`: None
|
| 452 |
+
- `batch_eval_metrics`: False
|
| 453 |
+
- `eval_on_start`: False
|
| 454 |
+
- `use_liger_kernel`: False
|
| 455 |
+
- `eval_use_gather_object`: False
|
| 456 |
+
- `average_tokens_across_devices`: False
|
| 457 |
+
- `prompts`: None
|
| 458 |
+
- `batch_sampler`: batch_sampler
|
| 459 |
+
- `multi_dataset_batch_sampler`: round_robin
|
| 460 |
+
|
| 461 |
+
</details>
|
| 462 |
+
|
| 463 |
+
### Training Logs
|
| 464 |
+
| Epoch | Step | Training Loss |
|
| 465 |
+
|:------:|:----:|:-------------:|
|
| 466 |
+
| 1.4245 | 500 | 0.1336 |
|
| 467 |
+
| 2.8490 | 1000 | 0.0787 |
|
| 468 |
+
|
| 469 |
+
|
| 470 |
+
### Framework Versions
|
| 471 |
+
- Python: 3.12.3
|
| 472 |
+
- Sentence Transformers: 4.1.0
|
| 473 |
+
- Transformers: 4.52.4
|
| 474 |
+
- PyTorch: 2.7.0+cu128
|
| 475 |
+
- Accelerate: 1.7.0
|
| 476 |
+
- Datasets: 3.6.0
|
| 477 |
+
- Tokenizers: 0.21.1
|
| 478 |
+
|
| 479 |
+
## Citation
|
| 480 |
+
|
| 481 |
+
### BibTeX
|
| 482 |
+
|
| 483 |
+
#### Sentence Transformers
|
| 484 |
+
```bibtex
|
| 485 |
+
@inproceedings{reimers-2019-sentence-bert,
|
| 486 |
+
title = "Sentence-BERT: Sentence Embeddings using Siamese BERT-Networks",
|
| 487 |
+
author = "Reimers, Nils and Gurevych, Iryna",
|
| 488 |
+
booktitle = "Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing",
|
| 489 |
+
month = "11",
|
| 490 |
+
year = "2019",
|
| 491 |
+
publisher = "Association for Computational Linguistics",
|
| 492 |
+
url = "https://arxiv.org/abs/1908.10084",
|
| 493 |
+
}
|
| 494 |
+
```
|
| 495 |
+
|
| 496 |
+
<!--
|
| 497 |
+
## Glossary
|
| 498 |
+
|
| 499 |
+
*Clearly define terms in order to be accessible across audiences.*
|
| 500 |
+
-->
|
| 501 |
+
|
| 502 |
+
<!--
|
| 503 |
+
## Model Card Authors
|
| 504 |
+
|
| 505 |
+
*Lists the people who create the model card, providing recognition and accountability for the detailed work that goes into its construction.*
|
| 506 |
+
-->
|
| 507 |
+
|
| 508 |
+
<!--
|
| 509 |
+
## Model Card Contact
|
| 510 |
+
|
| 511 |
+
*Provides a way for people who have updates to the Model Card, suggestions, or questions, to contact the Model Card authors.*
|
| 512 |
+
-->
|
checkpoints/checkpoint-1053/config.json
ADDED
|
@@ -0,0 +1,31 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"architectures": [
|
| 3 |
+
"BertModel"
|
| 4 |
+
],
|
| 5 |
+
"attention_probs_dropout_prob": 0.1,
|
| 6 |
+
"classifier_dropout": null,
|
| 7 |
+
"gradient_checkpointing": false,
|
| 8 |
+
"hidden_act": "gelu",
|
| 9 |
+
"hidden_dropout_prob": 0.1,
|
| 10 |
+
"hidden_size": 768,
|
| 11 |
+
"id2label": {
|
| 12 |
+
"0": "LABEL_0"
|
| 13 |
+
},
|
| 14 |
+
"initializer_range": 0.02,
|
| 15 |
+
"intermediate_size": 3072,
|
| 16 |
+
"label2id": {
|
| 17 |
+
"LABEL_0": 0
|
| 18 |
+
},
|
| 19 |
+
"layer_norm_eps": 1e-12,
|
| 20 |
+
"max_position_embeddings": 512,
|
| 21 |
+
"model_type": "bert",
|
| 22 |
+
"num_attention_heads": 12,
|
| 23 |
+
"num_hidden_layers": 12,
|
| 24 |
+
"pad_token_id": 0,
|
| 25 |
+
"position_embedding_type": "absolute",
|
| 26 |
+
"torch_dtype": "float32",
|
| 27 |
+
"transformers_version": "4.52.4",
|
| 28 |
+
"type_vocab_size": 2,
|
| 29 |
+
"use_cache": true,
|
| 30 |
+
"vocab_size": 30522
|
| 31 |
+
}
|
checkpoints/checkpoint-1053/config_sentence_transformers.json
ADDED
|
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"__version__": {
|
| 3 |
+
"sentence_transformers": "4.1.0",
|
| 4 |
+
"transformers": "4.52.4",
|
| 5 |
+
"pytorch": "2.7.0+cu128"
|
| 6 |
+
},
|
| 7 |
+
"prompts": {},
|
| 8 |
+
"default_prompt_name": null,
|
| 9 |
+
"similarity_fn_name": "cosine"
|
| 10 |
+
}
|
checkpoints/checkpoint-1053/model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e3c22492b93885a269f991e4912889fc64ca6c3858c1c70c987be738dcef7688
|
| 3 |
+
size 437951328
|
checkpoints/checkpoint-1053/modules.json
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"idx": 0,
|
| 4 |
+
"name": "0",
|
| 5 |
+
"path": "",
|
| 6 |
+
"type": "sentence_transformers.models.Transformer"
|
| 7 |
+
},
|
| 8 |
+
{
|
| 9 |
+
"idx": 1,
|
| 10 |
+
"name": "1",
|
| 11 |
+
"path": "1_Pooling",
|
| 12 |
+
"type": "sentence_transformers.models.Pooling"
|
| 13 |
+
},
|
| 14 |
+
{
|
| 15 |
+
"idx": 2,
|
| 16 |
+
"name": "2",
|
| 17 |
+
"path": "2_Normalize",
|
| 18 |
+
"type": "sentence_transformers.models.Normalize"
|
| 19 |
+
}
|
| 20 |
+
]
|
checkpoints/checkpoint-1053/optimizer.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a03e5dacb924a89a3d5bbc1745ffadfbc7eaa1842a14c2f01b9b31b9c5762c41
|
| 3 |
+
size 871298443
|
checkpoints/checkpoint-1053/rng_state.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:69e7c36ebc48e5ab4614ef9885ace5ca0ce2b44bf8627bdbe99df5543059ca9c
|
| 3 |
+
size 14645
|
checkpoints/checkpoint-1053/scheduler.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:744864483bede6d7cdca80d8a161998b8653394b0c8e6fbcc2fd07a220b1a8d3
|
| 3 |
+
size 1465
|
checkpoints/checkpoint-1053/sentence_bert_config.json
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"max_seq_length": 512,
|
| 3 |
+
"do_lower_case": true
|
| 4 |
+
}
|
checkpoints/checkpoint-1053/special_tokens_map.json
ADDED
|
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"cls_token": {
|
| 3 |
+
"content": "[CLS]",
|
| 4 |
+
"lstrip": false,
|
| 5 |
+
"normalized": false,
|
| 6 |
+
"rstrip": false,
|
| 7 |
+
"single_word": false
|
| 8 |
+
},
|
| 9 |
+
"mask_token": {
|
| 10 |
+
"content": "[MASK]",
|
| 11 |
+
"lstrip": false,
|
| 12 |
+
"normalized": false,
|
| 13 |
+
"rstrip": false,
|
| 14 |
+
"single_word": false
|
| 15 |
+
},
|
| 16 |
+
"pad_token": {
|
| 17 |
+
"content": "[PAD]",
|
| 18 |
+
"lstrip": false,
|
| 19 |
+
"normalized": false,
|
| 20 |
+
"rstrip": false,
|
| 21 |
+
"single_word": false
|
| 22 |
+
},
|
| 23 |
+
"sep_token": {
|
| 24 |
+
"content": "[SEP]",
|
| 25 |
+
"lstrip": false,
|
| 26 |
+
"normalized": false,
|
| 27 |
+
"rstrip": false,
|
| 28 |
+
"single_word": false
|
| 29 |
+
},
|
| 30 |
+
"unk_token": {
|
| 31 |
+
"content": "[UNK]",
|
| 32 |
+
"lstrip": false,
|
| 33 |
+
"normalized": false,
|
| 34 |
+
"rstrip": false,
|
| 35 |
+
"single_word": false
|
| 36 |
+
}
|
| 37 |
+
}
|
checkpoints/checkpoint-1053/tokenizer.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
checkpoints/checkpoint-1053/tokenizer_config.json
ADDED
|
@@ -0,0 +1,58 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"added_tokens_decoder": {
|
| 3 |
+
"0": {
|
| 4 |
+
"content": "[PAD]",
|
| 5 |
+
"lstrip": false,
|
| 6 |
+
"normalized": false,
|
| 7 |
+
"rstrip": false,
|
| 8 |
+
"single_word": false,
|
| 9 |
+
"special": true
|
| 10 |
+
},
|
| 11 |
+
"100": {
|
| 12 |
+
"content": "[UNK]",
|
| 13 |
+
"lstrip": false,
|
| 14 |
+
"normalized": false,
|
| 15 |
+
"rstrip": false,
|
| 16 |
+
"single_word": false,
|
| 17 |
+
"special": true
|
| 18 |
+
},
|
| 19 |
+
"101": {
|
| 20 |
+
"content": "[CLS]",
|
| 21 |
+
"lstrip": false,
|
| 22 |
+
"normalized": false,
|
| 23 |
+
"rstrip": false,
|
| 24 |
+
"single_word": false,
|
| 25 |
+
"special": true
|
| 26 |
+
},
|
| 27 |
+
"102": {
|
| 28 |
+
"content": "[SEP]",
|
| 29 |
+
"lstrip": false,
|
| 30 |
+
"normalized": false,
|
| 31 |
+
"rstrip": false,
|
| 32 |
+
"single_word": false,
|
| 33 |
+
"special": true
|
| 34 |
+
},
|
| 35 |
+
"103": {
|
| 36 |
+
"content": "[MASK]",
|
| 37 |
+
"lstrip": false,
|
| 38 |
+
"normalized": false,
|
| 39 |
+
"rstrip": false,
|
| 40 |
+
"single_word": false,
|
| 41 |
+
"special": true
|
| 42 |
+
}
|
| 43 |
+
},
|
| 44 |
+
"clean_up_tokenization_spaces": true,
|
| 45 |
+
"cls_token": "[CLS]",
|
| 46 |
+
"do_basic_tokenize": true,
|
| 47 |
+
"do_lower_case": true,
|
| 48 |
+
"extra_special_tokens": {},
|
| 49 |
+
"mask_token": "[MASK]",
|
| 50 |
+
"model_max_length": 512,
|
| 51 |
+
"never_split": null,
|
| 52 |
+
"pad_token": "[PAD]",
|
| 53 |
+
"sep_token": "[SEP]",
|
| 54 |
+
"strip_accents": null,
|
| 55 |
+
"tokenize_chinese_chars": true,
|
| 56 |
+
"tokenizer_class": "BertTokenizer",
|
| 57 |
+
"unk_token": "[UNK]"
|
| 58 |
+
}
|
checkpoints/checkpoint-1053/trainer_state.json
ADDED
|
@@ -0,0 +1,48 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"best_global_step": null,
|
| 3 |
+
"best_metric": null,
|
| 4 |
+
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 3.0,
|
| 6 |
+
"eval_steps": 0,
|
| 7 |
+
"global_step": 1053,
|
| 8 |
+
"is_hyper_param_search": false,
|
| 9 |
+
"is_local_process_zero": true,
|
| 10 |
+
"is_world_process_zero": true,
|
| 11 |
+
"log_history": [
|
| 12 |
+
{
|
| 13 |
+
"epoch": 1.4245014245014245,
|
| 14 |
+
"grad_norm": 1.1360502243041992,
|
| 15 |
+
"learning_rate": 1.1673728813559325e-05,
|
| 16 |
+
"loss": 0.1336,
|
| 17 |
+
"step": 500
|
| 18 |
+
},
|
| 19 |
+
{
|
| 20 |
+
"epoch": 2.849002849002849,
|
| 21 |
+
"grad_norm": 1.3151546716690063,
|
| 22 |
+
"learning_rate": 1.0805084745762714e-06,
|
| 23 |
+
"loss": 0.0787,
|
| 24 |
+
"step": 1000
|
| 25 |
+
}
|
| 26 |
+
],
|
| 27 |
+
"logging_steps": 500,
|
| 28 |
+
"max_steps": 1053,
|
| 29 |
+
"num_input_tokens_seen": 0,
|
| 30 |
+
"num_train_epochs": 3,
|
| 31 |
+
"save_steps": 175,
|
| 32 |
+
"stateful_callbacks": {
|
| 33 |
+
"TrainerControl": {
|
| 34 |
+
"args": {
|
| 35 |
+
"should_epoch_stop": false,
|
| 36 |
+
"should_evaluate": false,
|
| 37 |
+
"should_log": false,
|
| 38 |
+
"should_save": true,
|
| 39 |
+
"should_training_stop": true
|
| 40 |
+
},
|
| 41 |
+
"attributes": {}
|
| 42 |
+
}
|
| 43 |
+
},
|
| 44 |
+
"total_flos": 0.0,
|
| 45 |
+
"train_batch_size": 16,
|
| 46 |
+
"trial_name": null,
|
| 47 |
+
"trial_params": null
|
| 48 |
+
}
|
checkpoints/checkpoint-1053/training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:435635c51c00ae7c9634e1f44d69a2daae13b846b1d2e6a26d23d637a11c7e7f
|
| 3 |
+
size 5969
|
checkpoints/checkpoint-1053/vocab.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
checkpoints/checkpoint-875/1_Pooling/config.json
ADDED
|
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"word_embedding_dimension": 768,
|
| 3 |
+
"pooling_mode_cls_token": true,
|
| 4 |
+
"pooling_mode_mean_tokens": false,
|
| 5 |
+
"pooling_mode_max_tokens": false,
|
| 6 |
+
"pooling_mode_mean_sqrt_len_tokens": false,
|
| 7 |
+
"pooling_mode_weightedmean_tokens": false,
|
| 8 |
+
"pooling_mode_lasttoken": false,
|
| 9 |
+
"include_prompt": true
|
| 10 |
+
}
|
checkpoints/checkpoint-875/README.md
ADDED
|
@@ -0,0 +1,511 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
---
|
| 2 |
+
tags:
|
| 3 |
+
- sentence-transformers
|
| 4 |
+
- sentence-similarity
|
| 5 |
+
- feature-extraction
|
| 6 |
+
- generated_from_trainer
|
| 7 |
+
- dataset_size:5604
|
| 8 |
+
- loss:CosineSimilarityLoss
|
| 9 |
+
base_model: BAAI/bge-base-en-v1.5
|
| 10 |
+
widget:
|
| 11 |
+
- source_sentence: what are the powers of the virginia executive branch
|
| 12 |
+
sentences:
|
| 13 |
+
- The 49ers won five Super Bowl championships between 1981 and 1994. Four of those
|
| 14 |
+
came in the 1980s, and were led by Hall of Famers Joe Montana, Jerry Rice, Ronnie
|
| 15 |
+
Lott, Steve Young, Charles Haley, Fred Dean, and coaches Bill Walsh and George
|
| 16 |
+
Seifert. They have been division champions 22 times between 1970 and 2023, making
|
| 17 |
+
them one of the most successful teams in NFL history. The 49ers sit alone in NFL
|
| 18 |
+
history for most playoff wins (38), having been in the league playoffs 30 times
|
| 19 |
+
(29 times in the NFL and one time in the AAFC), and have also played in the most
|
| 20 |
+
NFC Championship games (19), hosting 11 of them, also an NFC record. The team
|
| 21 |
+
has set numerous notable NFL records, including most consecutive away games won
|
| 22 |
+
(18), most consecutive seasons leading the league in scoring (4), most consecutive
|
| 23 |
+
games scored (420 games from 1977 to 2004), most field goals in a season (44),
|
| 24 |
+
most games won in a season (18), and most touchdowns (8) and points scored (55)
|
| 25 |
+
in a Super Bowl. According to Forbes, the 49ers are the sixth most valuable team
|
| 26 |
+
in the NFL, valued at $6.8 billion as of August 2024. In June 2023, the enterprise
|
| 27 |
+
branch of the 49ers completed the acquisition of English soccer club Leeds United
|
| 28 |
+
and in May 2025, it acquired 51% of Scottish soccer club Rangers F.C.
|
| 29 |
+
- In 2008, Triarc purchased Wendy's, and changed its name to Wendy's/Arby's Group,
|
| 30 |
+
to reflect their core businesses. In January 2011, it was announced that Wendy's/Arby's
|
| 31 |
+
Group were looking into selling the Arby's side of the business to focus on the
|
| 32 |
+
Wendy's brand. It was officially announced the companies would split on January
|
| 33 |
+
21, 2011. In 2009, the Wendy's/Arby's Group signed a franchise deal with the Al
|
| 34 |
+
Jammaz Group of Saudi Arabia to open dual-branded Wendy's/Arby's through the Middle
|
| 35 |
+
East with the first location opening in Dubai in the United Arab Emirates in May
|
| 36 |
+
2010. The Wendy's/Arby's Group also signed a similar franchise deal in June 2010
|
| 37 |
+
with Tab Gida Sanayi ve Ticaret to open dual-branded restaurants in Turkey. After
|
| 38 |
+
the split, the former Wendy's/Arby's Group became The Wendy's Company.
|
| 39 |
+
- 'Executive: The Chief Executive is responsible for enforcing regional law, can
|
| 40 |
+
force reconsideration of legislation, and appoints Executive Council members and
|
| 41 |
+
principal officials. Acting with the Executive Council, the Chief Executive-in-Council
|
| 42 |
+
can propose new bills, issue subordinate legislation, and has authority to dissolve
|
| 43 |
+
the legislature. In states of emergency or public danger, the Chief Executive-in-Council
|
| 44 |
+
is further empowered to enact any regulation necessary to restore public order.
|
| 45 |
+
Legislature: The unicameral Legislative Council enacts regional law, approves
|
| 46 |
+
budgets, and has the power to impeach a sitting chief executive. Judiciary: The
|
| 47 |
+
Hong Kong Court of Final Appeal and lower courts interpret laws and overturn those
|
| 48 |
+
inconsistent with the Basic Law. Judges are appointed by the chief executive on
|
| 49 |
+
the advice of a recommendation commission. The chief executive is the head of
|
| 50 |
+
government and serves for a maximum of two five-year terms. The State Council
|
| 51 |
+
(led by the Premier of China) appoints the chief executive after nomination by
|
| 52 |
+
the Election Committee, which is composed of 1500 business, community, and government
|
| 53 |
+
leaders.'
|
| 54 |
+
- source_sentence: how many chromosomes does a human diploid cell have
|
| 55 |
+
sentences:
|
| 56 |
+
- The Peace of Cateau-Cambrésis in 1559 concluded the war with France, leaving Spain
|
| 57 |
+
at a considerable advantage. However, the government was still mired in debt,
|
| 58 |
+
and declared bankruptcy that year. Most of the government's revenues came from
|
| 59 |
+
taxes and excise duties, not imported silver and other goods. The Ottoman Empire
|
| 60 |
+
had long menaced the fringes of the Habsburg dominions in Austria and northwest
|
| 61 |
+
Africa. In response Ferdinand and Isabella had sent expeditions to North Africa,
|
| 62 |
+
capturing Melilla in 1497 and Oran in 1509. Charles had preferred to combat the
|
| 63 |
+
Ottomans through a considerably more maritime strategy, hampering Ottoman landings
|
| 64 |
+
on the Venetian territories in the Eastern Mediterranean. Only in response to
|
| 65 |
+
raids on the eastern coast of Spain did Charles personally lead attacks against
|
| 66 |
+
holdings in North Africa (1535). In 1560, the Ottomans battled the Spanish Navy
|
| 67 |
+
off the coast of Tunisia, but in 1565 Ottoman troops landing on the strategically
|
| 68 |
+
vital island of Malta, defended by the Knights of St. John, were defeated. The
|
| 69 |
+
death of Suleiman the Magnificent the following year and his succession by Selim
|
| 70 |
+
II emboldened Philip, who resolved to carry the war to the Ottoman homelands.
|
| 71 |
+
In 1571, a mixed naval expedition of Spanish, Venetian, and Papal ships led by
|
| 72 |
+
Charles' illegitimate son Don John of Austria annihilated the Ottoman fleet at
|
| 73 |
+
the Battle of Lepanto, in the largest naval battle fought in European waters since
|
| 74 |
+
Actium in 31 BC. The fleet included Miguel de Cervantes, future author of the
|
| 75 |
+
historic Spanish novel Don Quixote
|
| 76 |
+
- 'The 1930s were the team''s first golden era, when they improved their game through
|
| 77 |
+
play with more experienced teams. The Combinado del Pacífico (a squad composed
|
| 78 |
+
of Chilean and Peruvian footballers) toured Europe from 1933 to 1934. Starting
|
| 79 |
+
with Ciclista Lima in 1926, Peru''s football clubs toured Latin America with much
|
| 80 |
+
success. During one of these tours—Alianza Lima''s undefeated journey through
|
| 81 |
+
Chile in 1935—emerged the Rodillo Negro ("Black Roller"), a skillful group led
|
| 82 |
+
by forwards Alejandro Villanueva, Teodoro Fernández and goalkeeper Juan Valdivieso.
|
| 83 |
+
Sports historian Richard Witzig described these three as "a soccer triumvirate
|
| 84 |
+
unsurpassed in the world at that time", citing their combined innovation and effectiveness
|
| 85 |
+
at both ends of the field. Peru and the Rodillo Negro impressed at the 1936 Summer
|
| 86 |
+
Olympics, won the inaugural Bolivarian Games in 1938, and finished the decade
|
| 87 |
+
as South American champions. Historian David Goldblatt assessed the decline of
|
| 88 |
+
its previous success: "despite all the apparent preconditions for footballing
|
| 89 |
+
growth and success, Peruvian football disappeared". He attributes this sudden
|
| 90 |
+
decline to Peruvian authorities'' repression of "social, sporting and political
|
| 91 |
+
organisations among the urban and rural poor" during the 1940s and 1950s. Nevertheless,
|
| 92 |
+
Peru performed creditably at the South American Championships, placing third in
|
| 93 |
+
Brazil 1949 and Chile 1955, and missed qualification for the Sweden 1958 World
|
| 94 |
+
Cup finals, over two legs to eventual champions Brazil.'
|
| 95 |
+
- In 1939, at the start of World War II, Poland was partitioned between Nazi Germany
|
| 96 |
+
and the Soviet Union (see Molotov–Ribbentrop Pact). One-fifth of the Polish population
|
| 97 |
+
perished during World War II; the 3,000,000 Polish Jews murdered in the Holocaust,
|
| 98 |
+
who constituted 90% of Polish Jewry, made up half of all Poles killed during the
|
| 99 |
+
war. While the Holocaust occurred largely in German-occupied Poland, it was orchestrated
|
| 100 |
+
and perpetrated by the Nazis. Polish attitudes to the Holocaust varied widely,
|
| 101 |
+
from actively risking death in order to save Jewish lives, and passive refusal
|
| 102 |
+
to inform on them, to indifference, blackmail, and in extreme cases, committing
|
| 103 |
+
premeditated murders such as in the Jedwabne pogrom. Collaboration by non-Jewish
|
| 104 |
+
Polish citizens in the Holocaust was sporadic, but incidents of hostility against
|
| 105 |
+
Jews are well documented and have been a subject of renewed scholarly interest
|
| 106 |
+
during the 21st century.
|
| 107 |
+
- source_sentence: what is the difference between ice brent crude and wti crude
|
| 108 |
+
sentences:
|
| 109 |
+
- ==== Spring and Autumn period (722–476 BC) ====
|
| 110 |
+
- SpaceX has also bought and is modifying several residential properties in Boca
|
| 111 |
+
Chica Village, but apparently planning to leave them in residential use, about
|
| 112 |
+
2 miles (3.2 km) west of the launch site. In September 2019, SpaceX extended an
|
| 113 |
+
offer to buy each of the houses in Boca Chica Village for three times the fair
|
| 114 |
+
market value along with an offer of VIP invitations to future launch events. The
|
| 115 |
+
3x offer was said to be "non-negotiable." Homeowners were given two weeks for
|
| 116 |
+
this particular offer to remain valid. In January 2024, the Texas Parks and Wildlife
|
| 117 |
+
Department announced a proposal to transfer 43 acres of Boca Chica State Park
|
| 118 |
+
lands to SpaceX, in exchange for 477 new acres to be added to the Laguna Atascosa
|
| 119 |
+
National Wildlife Refuge.
|
| 120 |
+
- However, exclusive US control of this resource was eventually challenged, and
|
| 121 |
+
the Bering Sea Controversy resulted when the United States seized over 150 sealing
|
| 122 |
+
ships flying the British flag, based out of the coast of British Columbia. The
|
| 123 |
+
conflict between the United States and Britain was resolved by an arbitration
|
| 124 |
+
tribunal in 1893. The waters of the Bering Sea were deemed to be international
|
| 125 |
+
waters, contrary to the US contention that they were an internal sea. The US was
|
| 126 |
+
required to make a payment to Britain, and both nations were required to follow
|
| 127 |
+
regulations developed to preserve the resource.
|
| 128 |
+
- source_sentence: why is there a citgo sign in boston
|
| 129 |
+
sentences:
|
| 130 |
+
- Tucker appeared on Terri Clark's 2012 album Classic in a remake duet of her first
|
| 131 |
+
single "Delta Dawn". In June 2017, Tucker was featured in Rolling Stone as one
|
| 132 |
+
of the 100 Greatest Country Artists of All Time. After the death of former flame
|
| 133 |
+
Glen Campbell on August 8, 2017, Tucker released her first single since 2009,
|
| 134 |
+
"Forever Loving You", a song co-penned by Tennessee State Senator Rusty Crowe.
|
| 135 |
+
The song's release the following day, on the eve of Campbell's funeral, drew ire
|
| 136 |
+
and criticism being exploitative. Tucker claimed that a portion of the proceeds
|
| 137 |
+
will benefit the Alzheimer's Foundation of America, but the foundation stated
|
| 138 |
+
it was not involved in the promotion and has not received any funds. Tucker released
|
| 139 |
+
While I'm Livin', her first collection of original material since 2002's Tanya,
|
| 140 |
+
in 2019 via Fantasy Records. It was produced by Shooter Jennings and Brandi Carlile,
|
| 141 |
+
with Carlile brought onto the project after initially being approached for songs
|
| 142 |
+
by Jennings but after having professed such an admiration of Tucker and her work,
|
| 143 |
+
Jennings felt it necessary for her to co-produce the record alongside him. Tucker
|
| 144 |
+
performed "Bring My Flowers Now" at Loretta Lynn's all-star 87th birthday concert
|
| 145 |
+
at Nashville's Bridgestone Arena with Carlile playing piano. The album's first
|
| 146 |
+
single, "Hard Luck", was released on June 28, along with its accompanying music
|
| 147 |
+
video.
|
| 148 |
+
- ==== Golf ==== Numerous golf courses can be found in the city, with the most famous
|
| 149 |
+
being Bay Hill Club and Lodge, home to the Arnold Palmer Invitational. == Culture
|
| 150 |
+
==
|
| 151 |
+
- The massive Islamic invasions of the mid-7th century began a long struggle between
|
| 152 |
+
Christianity and Islam throughout the Mediterranean Basin. The Byzantine Empire
|
| 153 |
+
soon lost the lands of the eastern patriarchates of Jerusalem, Alexandria and
|
| 154 |
+
Antioch and was reduced to that of Constantinople, the empire's capital. As a
|
| 155 |
+
result of Islamic domination of the Mediterranean, the Frankish state, centred
|
| 156 |
+
away from that sea, was able to evolve as the dominant power that shaped the Western
|
| 157 |
+
Europe of the Middle Ages. The battles of Toulouse and Tours halted the Islamic
|
| 158 |
+
advance in the West and the failed siege of Constantinople halted it in the East.
|
| 159 |
+
Two or three decades later, in 751, the Byzantine Empire lost to the Lombards
|
| 160 |
+
the city of Ravenna from which it governed the small fragments of Italy, including
|
| 161 |
+
Rome, that acknowledged its sovereignty. The fall of Ravenna meant that confirmation
|
| 162 |
+
by a no longer existent exarch was not asked for during the election in 752 of
|
| 163 |
+
Pope Stephen II, and that the papacy was forced to look elsewhere for a civil
|
| 164 |
+
power to protect it. In 754, at the urgent request of Pope Stephen, the Frankish
|
| 165 |
+
king Pepin the Short conquered the Lombards. He then gifted the lands of the former
|
| 166 |
+
exarchate to the pope, initiating the Papal States. In the 860s, Rome and the
|
| 167 |
+
Byzantine East were in conflict during the Photian schism, when Photius criticized
|
| 168 |
+
the Latin west for adding of the filioque clause, after being excommunicated by
|
| 169 |
+
Nicholas I. Though the schism was reconciled, unresolved issues would lead to
|
| 170 |
+
further division.
|
| 171 |
+
- source_sentence: who organized the native resistance to the british
|
| 172 |
+
sentences:
|
| 173 |
+
- === Engines === == Fifth generation (WL; 2021) ==
|
| 174 |
+
- '=== Unitarism === All states are unitary states, not federations or aggregates
|
| 175 |
+
of local governments. Local governments within them are created by and exist by
|
| 176 |
+
virtue of state law, and local governments within each state are subject to the
|
| 177 |
+
central authority of that particular state. State governments commonly delegate
|
| 178 |
+
some authority to local units and channel policy decisions down to them for implementation.
|
| 179 |
+
In a few states, local units of government are permitted a degree of home rule
|
| 180 |
+
over various matters. The prevailing legal theory of state preeminence over local
|
| 181 |
+
governments, referred to as Dillon''s Rule, holds that, A municipal corporation
|
| 182 |
+
possesses and can exercise the following powers and no others: First, those granted
|
| 183 |
+
in express words; second, those necessarily implied or necessarily incident to
|
| 184 |
+
the powers expressly granted; third, those absolutely essential to the declared
|
| 185 |
+
objects and purposes of the corporation—not simply convenient but indispensable;
|
| 186 |
+
fourth, any fair doubt as to the existence of power is resolved by the courts
|
| 187 |
+
against the corporation—against the existence of the powers. Each state defines
|
| 188 |
+
for itself what powers it will allow local governments. Generally, four categories
|
| 189 |
+
of power may be given to local jurisdictions: Structural – power to choose the
|
| 190 |
+
form of government, charter and enact charter revisions, Functional – power to
|
| 191 |
+
exercise local self-government in a broad or limited manner, Fiscal – authority
|
| 192 |
+
to determine revenue sources, set tax rates, borrow funds and other related financial
|
| 193 |
+
activities, Personnel – authority to set employment rules, remuneration rates,
|
| 194 |
+
employment conditions and collective bargaining. == Relationships =='
|
| 195 |
+
- Throughout the war, the British deported the Acadians to the Thirteen Colonies
|
| 196 |
+
and Europe, which the Acadian militias resisted with assistance from Mi'kmaq and
|
| 197 |
+
Malisteet forces. The Great Upheaval continued from 1755 to 1764. In 1756, a large
|
| 198 |
+
force of French, Canadians, and their Native American allies led by the Marquis
|
| 199 |
+
de Montcalm launched an attack against the key British post at Fort Oswego on
|
| 200 |
+
Lake Ontario from Fort Frontenac and forced the garrison to surrender. The following
|
| 201 |
+
year Montcalm with a huge force of 7,200 French and Canadian troops and 2,400
|
| 202 |
+
Native Americans laid siege to Fort William Henry on the southern shores of Lake
|
| 203 |
+
George, and after three weeks of fighting the British commander Monroe surrendered.
|
| 204 |
+
Montcalm gave him honorable terms to return to England and not to fight for 18
|
| 205 |
+
months. And yet, when the British force with civilians was three miles from the
|
| 206 |
+
fort, the Native American allies massacred about 1,100 of the 1,500 strong force.
|
| 207 |
+
pipeline_tag: sentence-similarity
|
| 208 |
+
library_name: sentence-transformers
|
| 209 |
+
---
|
| 210 |
+
|
| 211 |
+
# SentenceTransformer based on BAAI/bge-base-en-v1.5
|
| 212 |
+
|
| 213 |
+
This is a [sentence-transformers](https://www.SBERT.net) model fine-tuned from [BAAI/bge-base-en-v1.5](https://huggingface.co/BAAI/bge-base-en-v1.5). It maps sentences and paragraphs to a 768-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more.
|
| 214 |
+
|
| 215 |
+
## Model Details
|
| 216 |
+
|
| 217 |
+
### Model Description
|
| 218 |
+
- **Model Type:** Sentence Transformer
|
| 219 |
+
- **Base model:** [BAAI/bge-base-en-v1.5](https://huggingface.co/BAAI/bge-base-en-v1.5) <!-- at revision a5beb1e3e68b9ab74eb54cfd186867f64f240e1a -->
|
| 220 |
+
- **Maximum Sequence Length:** 512 tokens
|
| 221 |
+
- **Output Dimensionality:** 768 dimensions
|
| 222 |
+
- **Similarity Function:** Cosine Similarity
|
| 223 |
+
<!-- - **Training Dataset:** Unknown -->
|
| 224 |
+
<!-- - **Language:** Unknown -->
|
| 225 |
+
<!-- - **License:** Unknown -->
|
| 226 |
+
|
| 227 |
+
### Model Sources
|
| 228 |
+
|
| 229 |
+
- **Documentation:** [Sentence Transformers Documentation](https://sbert.net)
|
| 230 |
+
- **Repository:** [Sentence Transformers on GitHub](https://github.com/UKPLab/sentence-transformers)
|
| 231 |
+
- **Hugging Face:** [Sentence Transformers on Hugging Face](https://huggingface.co/models?library=sentence-transformers)
|
| 232 |
+
|
| 233 |
+
### Full Model Architecture
|
| 234 |
+
|
| 235 |
+
```
|
| 236 |
+
SentenceTransformer(
|
| 237 |
+
(0): Transformer({'max_seq_length': 512, 'do_lower_case': True}) with Transformer model: BertModel
|
| 238 |
+
(1): Pooling({'word_embedding_dimension': 768, 'pooling_mode_cls_token': True, 'pooling_mode_mean_tokens': False, 'pooling_mode_max_tokens': False, 'pooling_mode_mean_sqrt_len_tokens': False, 'pooling_mode_weightedmean_tokens': False, 'pooling_mode_lasttoken': False, 'include_prompt': True})
|
| 239 |
+
(2): Normalize()
|
| 240 |
+
)
|
| 241 |
+
```
|
| 242 |
+
|
| 243 |
+
## Usage
|
| 244 |
+
|
| 245 |
+
### Direct Usage (Sentence Transformers)
|
| 246 |
+
|
| 247 |
+
First install the Sentence Transformers library:
|
| 248 |
+
|
| 249 |
+
```bash
|
| 250 |
+
pip install -U sentence-transformers
|
| 251 |
+
```
|
| 252 |
+
|
| 253 |
+
Then you can load this model and run inference.
|
| 254 |
+
```python
|
| 255 |
+
from sentence_transformers import SentenceTransformer
|
| 256 |
+
|
| 257 |
+
# Download from the 🤗 Hub
|
| 258 |
+
model = SentenceTransformer("sentence_transformers_model_id")
|
| 259 |
+
# Run inference
|
| 260 |
+
sentences = [
|
| 261 |
+
'who organized the native resistance to the british',
|
| 262 |
+
"Throughout the war, the British deported the Acadians to the Thirteen Colonies and Europe, which the Acadian militias resisted with assistance from Mi'kmaq and Malisteet forces. The Great Upheaval continued from 1755 to 1764. In 1756, a large force of French, Canadians, and their Native American allies led by the Marquis de Montcalm launched an attack against the key British post at Fort Oswego on Lake Ontario from Fort Frontenac and forced the garrison to surrender. The following year Montcalm with a huge force of 7,200 French and Canadian troops and 2,400 Native Americans laid siege to Fort William Henry on the southern shores of Lake George, and after three weeks of fighting the British commander Monroe surrendered. Montcalm gave him honorable terms to return to England and not to fight for 18 months. And yet, when the British force with civilians was three miles from the fort, the Native American allies massacred about 1,100 of the 1,500 strong force.",
|
| 263 |
+
"=== Unitarism === All states are unitary states, not federations or aggregates of local governments. Local governments within them are created by and exist by virtue of state law, and local governments within each state are subject to the central authority of that particular state. State governments commonly delegate some authority to local units and channel policy decisions down to them for implementation. In a few states, local units of government are permitted a degree of home rule over various matters. The prevailing legal theory of state preeminence over local governments, referred to as Dillon's Rule, holds that, A municipal corporation possesses and can exercise the following powers and no others: First, those granted in express words; second, those necessarily implied or necessarily incident to the powers expressly granted; third, those absolutely essential to the declared objects and purposes of the corporation—not simply convenient but indispensable; fourth, any fair doubt as to the existence of power is resolved by the courts against the corporation—against the existence of the powers. Each state defines for itself what powers it will allow local governments. Generally, four categories of power may be given to local jurisdictions: Structural – power to choose the form of government, charter and enact charter revisions, Functional – power to exercise local self-government in a broad or limited manner, Fiscal – authority to determine revenue sources, set tax rates, borrow funds and other related financial activities, Personnel – authority to set employment rules, remuneration rates, employment conditions and collective bargaining. == Relationships ==",
|
| 264 |
+
]
|
| 265 |
+
embeddings = model.encode(sentences)
|
| 266 |
+
print(embeddings.shape)
|
| 267 |
+
# [3, 768]
|
| 268 |
+
|
| 269 |
+
# Get the similarity scores for the embeddings
|
| 270 |
+
similarities = model.similarity(embeddings, embeddings)
|
| 271 |
+
print(similarities.shape)
|
| 272 |
+
# [3, 3]
|
| 273 |
+
```
|
| 274 |
+
|
| 275 |
+
<!--
|
| 276 |
+
### Direct Usage (Transformers)
|
| 277 |
+
|
| 278 |
+
<details><summary>Click to see the direct usage in Transformers</summary>
|
| 279 |
+
|
| 280 |
+
</details>
|
| 281 |
+
-->
|
| 282 |
+
|
| 283 |
+
<!--
|
| 284 |
+
### Downstream Usage (Sentence Transformers)
|
| 285 |
+
|
| 286 |
+
You can fine-tune this model on your own dataset.
|
| 287 |
+
|
| 288 |
+
<details><summary>Click to expand</summary>
|
| 289 |
+
|
| 290 |
+
</details>
|
| 291 |
+
-->
|
| 292 |
+
|
| 293 |
+
<!--
|
| 294 |
+
### Out-of-Scope Use
|
| 295 |
+
|
| 296 |
+
*List how the model may foreseeably be misused and address what users ought not to do with the model.*
|
| 297 |
+
-->
|
| 298 |
+
|
| 299 |
+
<!--
|
| 300 |
+
## Bias, Risks and Limitations
|
| 301 |
+
|
| 302 |
+
*What are the known or foreseeable issues stemming from this model? You could also flag known failure cases or weaknesses of the model here.*
|
| 303 |
+
-->
|
| 304 |
+
|
| 305 |
+
<!--
|
| 306 |
+
### Recommendations
|
| 307 |
+
|
| 308 |
+
*What are recommendations with respect to the foreseeable issues? For example, filtering explicit content.*
|
| 309 |
+
-->
|
| 310 |
+
|
| 311 |
+
## Training Details
|
| 312 |
+
|
| 313 |
+
### Training Dataset
|
| 314 |
+
|
| 315 |
+
#### Unnamed Dataset
|
| 316 |
+
|
| 317 |
+
* Size: 5,604 training samples
|
| 318 |
+
* Columns: <code>sentence_0</code>, <code>sentence_1</code>, and <code>label</code>
|
| 319 |
+
* Approximate statistics based on the first 1000 samples:
|
| 320 |
+
| | sentence_0 | sentence_1 | label |
|
| 321 |
+
|:--------|:-----------------------------------------------------------------------------------|:------------------------------------------------------------------------------------|:---------------------------------------------------------------|
|
| 322 |
+
| type | string | string | float |
|
| 323 |
+
| details | <ul><li>min: 10 tokens</li><li>mean: 11.84 tokens</li><li>max: 25 tokens</li></ul> | <ul><li>min: 8 tokens</li><li>mean: 218.19 tokens</li><li>max: 322 tokens</li></ul> | <ul><li>min: 0.0</li><li>mean: 0.37</li><li>max: 1.0</li></ul> |
|
| 324 |
+
* Samples:
|
| 325 |
+
| sentence_0 | sentence_1 | label |
|
| 326 |
+
|:-----------------------------------------------------------------------------------------------------------|:---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|:-----------------|
|
| 327 |
+
| <code>who played guitar solo on reeling in the years</code> | <code>Eric Patrick Clapton (born 30 March 1945) is an English rock and blues guitarist, singer, and songwriter. He is regarded as one of the most successful and influential guitarists in rock music. Clapton ranked second in Rolling Stone's list of the "100 Greatest Guitarists of All Time" and fourth in Gibson's "Top 50 Guitarists of All Time". He was named number five in Time magazine's list of "The 10 Best Electric Guitar Players" in 2009. After playing in a number of different local bands, Clapton joined the Yardbirds from 1963 to 1965, and John Mayall & the Bluesbreakers from 1965 to 1966. After leaving Mayall, he formed the power trio Cream with drummer Ginger Baker and bassist/vocalist Jack Bruce, in which Clapton played sustained blues improvisations and "arty, blues-based psychedelic pop". After four successful albums, Cream broke up in November 1968. Clapton then formed the blues rock band Blind Faith with Baker, Steve Winwood, and Ric Grech, recording one album and performing on one...</code> | <code>1.0</code> |
|
| 328 |
+
| <code>how a population of wolves may have undergone speciation to form the first population of dogs</code> | <code>Geological evidence suggests that approximately 3 million years ago, South America became connected to North America when the Bolivar Trough marine barrier disappeared and the Panamanian land bridge formed. The joining of these two land masses led to the Great American Interchange, in which biota from both continents expanded their ranges. The first species known to have made the northward migration was Pliometanastes, a fossil ground sloth roughly the size of a modern black bear. Migrations to the Southern Hemisphere were undertaken by several North American mammalian carnivores. Fewer species migrated in the opposite direction from south to north. The result of the expansion of a North American fauna was a mass extinction in which hundreds of species disappeared in a relatively short time. About 60% of present-day South American mammals have evolved from North American species. Some South American species were able to adapt and spread into North America. Apart from Pliometanastes, du...</code> | <code>1.0</code> |
|
| 329 |
+
| <code>who is credited with promoting the use of factor analysis and why</code> | <code>The enemies of President Davis proposed that the Confederacy "died of Davis". He was unfavorably compared to George Washington by critics such as Edward Alfred Pollard, editor of the most influential newspaper in the Confederacy, the Daily Richmond Examiner. Beyond the early honeymoon period, Davis was never popular. Ellis Merton Coulter, viewed by historians as a Confederate apologist, argues that Davis was unable to mobilize Confederate nationalism in support of his government effectively, and especially failed to appeal to the small farmers who made up the bulk of the population. Davis failed to build a network of supporters who would speak up when he came under criticism, and he repeatedly alienated governors and other state-based leaders by demanding centralized control of the war effort.</code> | <code>0.0</code> |
|
| 330 |
+
* Loss: [<code>CosineSimilarityLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#cosinesimilarityloss) with these parameters:
|
| 331 |
+
```json
|
| 332 |
+
{
|
| 333 |
+
"loss_fct": "torch.nn.modules.loss.MSELoss"
|
| 334 |
+
}
|
| 335 |
+
```
|
| 336 |
+
|
| 337 |
+
### Training Hyperparameters
|
| 338 |
+
#### Non-Default Hyperparameters
|
| 339 |
+
|
| 340 |
+
- `per_device_train_batch_size`: 16
|
| 341 |
+
- `per_device_eval_batch_size`: 16
|
| 342 |
+
- `multi_dataset_batch_sampler`: round_robin
|
| 343 |
+
|
| 344 |
+
#### All Hyperparameters
|
| 345 |
+
<details><summary>Click to expand</summary>
|
| 346 |
+
|
| 347 |
+
- `overwrite_output_dir`: False
|
| 348 |
+
- `do_predict`: False
|
| 349 |
+
- `eval_strategy`: no
|
| 350 |
+
- `prediction_loss_only`: True
|
| 351 |
+
- `per_device_train_batch_size`: 16
|
| 352 |
+
- `per_device_eval_batch_size`: 16
|
| 353 |
+
- `per_gpu_train_batch_size`: None
|
| 354 |
+
- `per_gpu_eval_batch_size`: None
|
| 355 |
+
- `gradient_accumulation_steps`: 1
|
| 356 |
+
- `eval_accumulation_steps`: None
|
| 357 |
+
- `torch_empty_cache_steps`: None
|
| 358 |
+
- `learning_rate`: 5e-05
|
| 359 |
+
- `weight_decay`: 0.0
|
| 360 |
+
- `adam_beta1`: 0.9
|
| 361 |
+
- `adam_beta2`: 0.999
|
| 362 |
+
- `adam_epsilon`: 1e-08
|
| 363 |
+
- `max_grad_norm`: 1
|
| 364 |
+
- `num_train_epochs`: 3
|
| 365 |
+
- `max_steps`: -1
|
| 366 |
+
- `lr_scheduler_type`: linear
|
| 367 |
+
- `lr_scheduler_kwargs`: {}
|
| 368 |
+
- `warmup_ratio`: 0.0
|
| 369 |
+
- `warmup_steps`: 0
|
| 370 |
+
- `log_level`: passive
|
| 371 |
+
- `log_level_replica`: warning
|
| 372 |
+
- `log_on_each_node`: True
|
| 373 |
+
- `logging_nan_inf_filter`: True
|
| 374 |
+
- `save_safetensors`: True
|
| 375 |
+
- `save_on_each_node`: False
|
| 376 |
+
- `save_only_model`: False
|
| 377 |
+
- `restore_callback_states_from_checkpoint`: False
|
| 378 |
+
- `no_cuda`: False
|
| 379 |
+
- `use_cpu`: False
|
| 380 |
+
- `use_mps_device`: False
|
| 381 |
+
- `seed`: 42
|
| 382 |
+
- `data_seed`: None
|
| 383 |
+
- `jit_mode_eval`: False
|
| 384 |
+
- `use_ipex`: False
|
| 385 |
+
- `bf16`: False
|
| 386 |
+
- `fp16`: False
|
| 387 |
+
- `fp16_opt_level`: O1
|
| 388 |
+
- `half_precision_backend`: auto
|
| 389 |
+
- `bf16_full_eval`: False
|
| 390 |
+
- `fp16_full_eval`: False
|
| 391 |
+
- `tf32`: None
|
| 392 |
+
- `local_rank`: 0
|
| 393 |
+
- `ddp_backend`: None
|
| 394 |
+
- `tpu_num_cores`: None
|
| 395 |
+
- `tpu_metrics_debug`: False
|
| 396 |
+
- `debug`: []
|
| 397 |
+
- `dataloader_drop_last`: False
|
| 398 |
+
- `dataloader_num_workers`: 0
|
| 399 |
+
- `dataloader_prefetch_factor`: None
|
| 400 |
+
- `past_index`: -1
|
| 401 |
+
- `disable_tqdm`: False
|
| 402 |
+
- `remove_unused_columns`: True
|
| 403 |
+
- `label_names`: None
|
| 404 |
+
- `load_best_model_at_end`: False
|
| 405 |
+
- `ignore_data_skip`: False
|
| 406 |
+
- `fsdp`: []
|
| 407 |
+
- `fsdp_min_num_params`: 0
|
| 408 |
+
- `fsdp_config`: {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}
|
| 409 |
+
- `fsdp_transformer_layer_cls_to_wrap`: None
|
| 410 |
+
- `accelerator_config`: {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}
|
| 411 |
+
- `deepspeed`: None
|
| 412 |
+
- `label_smoothing_factor`: 0.0
|
| 413 |
+
- `optim`: adamw_torch
|
| 414 |
+
- `optim_args`: None
|
| 415 |
+
- `adafactor`: False
|
| 416 |
+
- `group_by_length`: False
|
| 417 |
+
- `length_column_name`: length
|
| 418 |
+
- `ddp_find_unused_parameters`: None
|
| 419 |
+
- `ddp_bucket_cap_mb`: None
|
| 420 |
+
- `ddp_broadcast_buffers`: False
|
| 421 |
+
- `dataloader_pin_memory`: True
|
| 422 |
+
- `dataloader_persistent_workers`: False
|
| 423 |
+
- `skip_memory_metrics`: True
|
| 424 |
+
- `use_legacy_prediction_loop`: False
|
| 425 |
+
- `push_to_hub`: False
|
| 426 |
+
- `resume_from_checkpoint`: None
|
| 427 |
+
- `hub_model_id`: None
|
| 428 |
+
- `hub_strategy`: every_save
|
| 429 |
+
- `hub_private_repo`: None
|
| 430 |
+
- `hub_always_push`: False
|
| 431 |
+
- `gradient_checkpointing`: False
|
| 432 |
+
- `gradient_checkpointing_kwargs`: None
|
| 433 |
+
- `include_inputs_for_metrics`: False
|
| 434 |
+
- `include_for_metrics`: []
|
| 435 |
+
- `eval_do_concat_batches`: True
|
| 436 |
+
- `fp16_backend`: auto
|
| 437 |
+
- `push_to_hub_model_id`: None
|
| 438 |
+
- `push_to_hub_organization`: None
|
| 439 |
+
- `mp_parameters`:
|
| 440 |
+
- `auto_find_batch_size`: False
|
| 441 |
+
- `full_determinism`: False
|
| 442 |
+
- `torchdynamo`: None
|
| 443 |
+
- `ray_scope`: last
|
| 444 |
+
- `ddp_timeout`: 1800
|
| 445 |
+
- `torch_compile`: False
|
| 446 |
+
- `torch_compile_backend`: None
|
| 447 |
+
- `torch_compile_mode`: None
|
| 448 |
+
- `include_tokens_per_second`: False
|
| 449 |
+
- `include_num_input_tokens_seen`: False
|
| 450 |
+
- `neftune_noise_alpha`: None
|
| 451 |
+
- `optim_target_modules`: None
|
| 452 |
+
- `batch_eval_metrics`: False
|
| 453 |
+
- `eval_on_start`: False
|
| 454 |
+
- `use_liger_kernel`: False
|
| 455 |
+
- `eval_use_gather_object`: False
|
| 456 |
+
- `average_tokens_across_devices`: False
|
| 457 |
+
- `prompts`: None
|
| 458 |
+
- `batch_sampler`: batch_sampler
|
| 459 |
+
- `multi_dataset_batch_sampler`: round_robin
|
| 460 |
+
|
| 461 |
+
</details>
|
| 462 |
+
|
| 463 |
+
### Training Logs
|
| 464 |
+
| Epoch | Step | Training Loss |
|
| 465 |
+
|:------:|:----:|:-------------:|
|
| 466 |
+
| 1.4245 | 500 | 0.1336 |
|
| 467 |
+
|
| 468 |
+
|
| 469 |
+
### Framework Versions
|
| 470 |
+
- Python: 3.12.3
|
| 471 |
+
- Sentence Transformers: 4.1.0
|
| 472 |
+
- Transformers: 4.52.4
|
| 473 |
+
- PyTorch: 2.7.0+cu128
|
| 474 |
+
- Accelerate: 1.7.0
|
| 475 |
+
- Datasets: 3.6.0
|
| 476 |
+
- Tokenizers: 0.21.1
|
| 477 |
+
|
| 478 |
+
## Citation
|
| 479 |
+
|
| 480 |
+
### BibTeX
|
| 481 |
+
|
| 482 |
+
#### Sentence Transformers
|
| 483 |
+
```bibtex
|
| 484 |
+
@inproceedings{reimers-2019-sentence-bert,
|
| 485 |
+
title = "Sentence-BERT: Sentence Embeddings using Siamese BERT-Networks",
|
| 486 |
+
author = "Reimers, Nils and Gurevych, Iryna",
|
| 487 |
+
booktitle = "Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing",
|
| 488 |
+
month = "11",
|
| 489 |
+
year = "2019",
|
| 490 |
+
publisher = "Association for Computational Linguistics",
|
| 491 |
+
url = "https://arxiv.org/abs/1908.10084",
|
| 492 |
+
}
|
| 493 |
+
```
|
| 494 |
+
|
| 495 |
+
<!--
|
| 496 |
+
## Glossary
|
| 497 |
+
|
| 498 |
+
*Clearly define terms in order to be accessible across audiences.*
|
| 499 |
+
-->
|
| 500 |
+
|
| 501 |
+
<!--
|
| 502 |
+
## Model Card Authors
|
| 503 |
+
|
| 504 |
+
*Lists the people who create the model card, providing recognition and accountability for the detailed work that goes into its construction.*
|
| 505 |
+
-->
|
| 506 |
+
|
| 507 |
+
<!--
|
| 508 |
+
## Model Card Contact
|
| 509 |
+
|
| 510 |
+
*Provides a way for people who have updates to the Model Card, suggestions, or questions, to contact the Model Card authors.*
|
| 511 |
+
-->
|
checkpoints/checkpoint-875/config.json
ADDED
|
@@ -0,0 +1,31 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"architectures": [
|
| 3 |
+
"BertModel"
|
| 4 |
+
],
|
| 5 |
+
"attention_probs_dropout_prob": 0.1,
|
| 6 |
+
"classifier_dropout": null,
|
| 7 |
+
"gradient_checkpointing": false,
|
| 8 |
+
"hidden_act": "gelu",
|
| 9 |
+
"hidden_dropout_prob": 0.1,
|
| 10 |
+
"hidden_size": 768,
|
| 11 |
+
"id2label": {
|
| 12 |
+
"0": "LABEL_0"
|
| 13 |
+
},
|
| 14 |
+
"initializer_range": 0.02,
|
| 15 |
+
"intermediate_size": 3072,
|
| 16 |
+
"label2id": {
|
| 17 |
+
"LABEL_0": 0
|
| 18 |
+
},
|
| 19 |
+
"layer_norm_eps": 1e-12,
|
| 20 |
+
"max_position_embeddings": 512,
|
| 21 |
+
"model_type": "bert",
|
| 22 |
+
"num_attention_heads": 12,
|
| 23 |
+
"num_hidden_layers": 12,
|
| 24 |
+
"pad_token_id": 0,
|
| 25 |
+
"position_embedding_type": "absolute",
|
| 26 |
+
"torch_dtype": "float32",
|
| 27 |
+
"transformers_version": "4.52.4",
|
| 28 |
+
"type_vocab_size": 2,
|
| 29 |
+
"use_cache": true,
|
| 30 |
+
"vocab_size": 30522
|
| 31 |
+
}
|
checkpoints/checkpoint-875/config_sentence_transformers.json
ADDED
|
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"__version__": {
|
| 3 |
+
"sentence_transformers": "4.1.0",
|
| 4 |
+
"transformers": "4.52.4",
|
| 5 |
+
"pytorch": "2.7.0+cu128"
|
| 6 |
+
},
|
| 7 |
+
"prompts": {},
|
| 8 |
+
"default_prompt_name": null,
|
| 9 |
+
"similarity_fn_name": "cosine"
|
| 10 |
+
}
|
checkpoints/checkpoint-875/model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:03748a0a3c686eca813a869f8c058104e3ebc60afe181cf1f84ce350b19700c3
|
| 3 |
+
size 437951328
|
checkpoints/checkpoint-875/modules.json
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"idx": 0,
|
| 4 |
+
"name": "0",
|
| 5 |
+
"path": "",
|
| 6 |
+
"type": "sentence_transformers.models.Transformer"
|
| 7 |
+
},
|
| 8 |
+
{
|
| 9 |
+
"idx": 1,
|
| 10 |
+
"name": "1",
|
| 11 |
+
"path": "1_Pooling",
|
| 12 |
+
"type": "sentence_transformers.models.Pooling"
|
| 13 |
+
},
|
| 14 |
+
{
|
| 15 |
+
"idx": 2,
|
| 16 |
+
"name": "2",
|
| 17 |
+
"path": "2_Normalize",
|
| 18 |
+
"type": "sentence_transformers.models.Normalize"
|
| 19 |
+
}
|
| 20 |
+
]
|
checkpoints/checkpoint-875/optimizer.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:32c4db7c16f83a330ca3fb70c99ff336f6fb949322d617573d8f6b386dfab6fe
|
| 3 |
+
size 871298443
|
checkpoints/checkpoint-875/rng_state.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dab8f58abd1458a3a02165ce5c02b8ea6d425be95636530c1481c4b6a088bf15
|
| 3 |
+
size 14645
|
checkpoints/checkpoint-875/scheduler.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d3b5728b1dd51f6dbcb263d93e234d70c8999325b78869b893d0a4f6057dd5eb
|
| 3 |
+
size 1465
|
checkpoints/checkpoint-875/sentence_bert_config.json
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"max_seq_length": 512,
|
| 3 |
+
"do_lower_case": true
|
| 4 |
+
}
|
checkpoints/checkpoint-875/special_tokens_map.json
ADDED
|
@@ -0,0 +1,37 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"cls_token": {
|
| 3 |
+
"content": "[CLS]",
|
| 4 |
+
"lstrip": false,
|
| 5 |
+
"normalized": false,
|
| 6 |
+
"rstrip": false,
|
| 7 |
+
"single_word": false
|
| 8 |
+
},
|
| 9 |
+
"mask_token": {
|
| 10 |
+
"content": "[MASK]",
|
| 11 |
+
"lstrip": false,
|
| 12 |
+
"normalized": false,
|
| 13 |
+
"rstrip": false,
|
| 14 |
+
"single_word": false
|
| 15 |
+
},
|
| 16 |
+
"pad_token": {
|
| 17 |
+
"content": "[PAD]",
|
| 18 |
+
"lstrip": false,
|
| 19 |
+
"normalized": false,
|
| 20 |
+
"rstrip": false,
|
| 21 |
+
"single_word": false
|
| 22 |
+
},
|
| 23 |
+
"sep_token": {
|
| 24 |
+
"content": "[SEP]",
|
| 25 |
+
"lstrip": false,
|
| 26 |
+
"normalized": false,
|
| 27 |
+
"rstrip": false,
|
| 28 |
+
"single_word": false
|
| 29 |
+
},
|
| 30 |
+
"unk_token": {
|
| 31 |
+
"content": "[UNK]",
|
| 32 |
+
"lstrip": false,
|
| 33 |
+
"normalized": false,
|
| 34 |
+
"rstrip": false,
|
| 35 |
+
"single_word": false
|
| 36 |
+
}
|
| 37 |
+
}
|
checkpoints/checkpoint-875/tokenizer.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
checkpoints/checkpoint-875/tokenizer_config.json
ADDED
|
@@ -0,0 +1,58 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"added_tokens_decoder": {
|
| 3 |
+
"0": {
|
| 4 |
+
"content": "[PAD]",
|
| 5 |
+
"lstrip": false,
|
| 6 |
+
"normalized": false,
|
| 7 |
+
"rstrip": false,
|
| 8 |
+
"single_word": false,
|
| 9 |
+
"special": true
|
| 10 |
+
},
|
| 11 |
+
"100": {
|
| 12 |
+
"content": "[UNK]",
|
| 13 |
+
"lstrip": false,
|
| 14 |
+
"normalized": false,
|
| 15 |
+
"rstrip": false,
|
| 16 |
+
"single_word": false,
|
| 17 |
+
"special": true
|
| 18 |
+
},
|
| 19 |
+
"101": {
|
| 20 |
+
"content": "[CLS]",
|
| 21 |
+
"lstrip": false,
|
| 22 |
+
"normalized": false,
|
| 23 |
+
"rstrip": false,
|
| 24 |
+
"single_word": false,
|
| 25 |
+
"special": true
|
| 26 |
+
},
|
| 27 |
+
"102": {
|
| 28 |
+
"content": "[SEP]",
|
| 29 |
+
"lstrip": false,
|
| 30 |
+
"normalized": false,
|
| 31 |
+
"rstrip": false,
|
| 32 |
+
"single_word": false,
|
| 33 |
+
"special": true
|
| 34 |
+
},
|
| 35 |
+
"103": {
|
| 36 |
+
"content": "[MASK]",
|
| 37 |
+
"lstrip": false,
|
| 38 |
+
"normalized": false,
|
| 39 |
+
"rstrip": false,
|
| 40 |
+
"single_word": false,
|
| 41 |
+
"special": true
|
| 42 |
+
}
|
| 43 |
+
},
|
| 44 |
+
"clean_up_tokenization_spaces": true,
|
| 45 |
+
"cls_token": "[CLS]",
|
| 46 |
+
"do_basic_tokenize": true,
|
| 47 |
+
"do_lower_case": true,
|
| 48 |
+
"extra_special_tokens": {},
|
| 49 |
+
"mask_token": "[MASK]",
|
| 50 |
+
"model_max_length": 512,
|
| 51 |
+
"never_split": null,
|
| 52 |
+
"pad_token": "[PAD]",
|
| 53 |
+
"sep_token": "[SEP]",
|
| 54 |
+
"strip_accents": null,
|
| 55 |
+
"tokenize_chinese_chars": true,
|
| 56 |
+
"tokenizer_class": "BertTokenizer",
|
| 57 |
+
"unk_token": "[UNK]"
|
| 58 |
+
}
|
checkpoints/checkpoint-875/trainer_state.json
ADDED
|
@@ -0,0 +1,41 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"best_global_step": null,
|
| 3 |
+
"best_metric": null,
|
| 4 |
+
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 2.492877492877493,
|
| 6 |
+
"eval_steps": 0,
|
| 7 |
+
"global_step": 875,
|
| 8 |
+
"is_hyper_param_search": false,
|
| 9 |
+
"is_local_process_zero": true,
|
| 10 |
+
"is_world_process_zero": true,
|
| 11 |
+
"log_history": [
|
| 12 |
+
{
|
| 13 |
+
"epoch": 1.4245014245014245,
|
| 14 |
+
"grad_norm": 1.1360502243041992,
|
| 15 |
+
"learning_rate": 1.1673728813559325e-05,
|
| 16 |
+
"loss": 0.1336,
|
| 17 |
+
"step": 500
|
| 18 |
+
}
|
| 19 |
+
],
|
| 20 |
+
"logging_steps": 500,
|
| 21 |
+
"max_steps": 1053,
|
| 22 |
+
"num_input_tokens_seen": 0,
|
| 23 |
+
"num_train_epochs": 3,
|
| 24 |
+
"save_steps": 175,
|
| 25 |
+
"stateful_callbacks": {
|
| 26 |
+
"TrainerControl": {
|
| 27 |
+
"args": {
|
| 28 |
+
"should_epoch_stop": false,
|
| 29 |
+
"should_evaluate": false,
|
| 30 |
+
"should_log": false,
|
| 31 |
+
"should_save": true,
|
| 32 |
+
"should_training_stop": false
|
| 33 |
+
},
|
| 34 |
+
"attributes": {}
|
| 35 |
+
}
|
| 36 |
+
},
|
| 37 |
+
"total_flos": 0.0,
|
| 38 |
+
"train_batch_size": 16,
|
| 39 |
+
"trial_name": null,
|
| 40 |
+
"trial_params": null
|
| 41 |
+
}
|
checkpoints/checkpoint-875/training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:435635c51c00ae7c9634e1f44d69a2daae13b846b1d2e6a26d23d637a11c7e7f
|
| 3 |
+
size 5969
|
checkpoints/checkpoint-875/vocab.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|