Upload folder using huggingface_hub
Browse files- .gitattributes +1 -0
- 1_Pooling/config.json +10 -0
- README.md +428 -0
- config.json +27 -0
- config_sentence_transformers.json +14 -0
- config_setfit.json +17 -0
- model.safetensors +3 -0
- model_head.pkl +3 -0
- modules.json +20 -0
- sentence_bert_config.json +4 -0
- special_tokens_map.json +51 -0
- tokenizer.json +3 -0
- tokenizer_config.json +55 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
1_Pooling/config.json
ADDED
|
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"word_embedding_dimension": 768,
|
| 3 |
+
"pooling_mode_cls_token": false,
|
| 4 |
+
"pooling_mode_mean_tokens": true,
|
| 5 |
+
"pooling_mode_max_tokens": false,
|
| 6 |
+
"pooling_mode_mean_sqrt_len_tokens": false,
|
| 7 |
+
"pooling_mode_weightedmean_tokens": false,
|
| 8 |
+
"pooling_mode_lasttoken": false,
|
| 9 |
+
"include_prompt": true
|
| 10 |
+
}
|
README.md
ADDED
|
@@ -0,0 +1,428 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
---
|
| 2 |
+
tags:
|
| 3 |
+
- setfit
|
| 4 |
+
- sentence-transformers
|
| 5 |
+
- text-classification
|
| 6 |
+
- generated_from_setfit_trainer
|
| 7 |
+
widget:
|
| 8 |
+
- text: Isolated 500kHz 1mΩ current sensor ICs. Allegro MicroSystems is exploiting
|
| 9 |
+
tunnel magnetoresistance to measure current with 500kHz bandwidth, and less noise
|
| 10 |
+
that Hall effect isolated current
|
| 11 |
+
- text: Cruz Azul vs Club Leon Prediction and Betting Tips. Mexican Liga MX returns
|
| 12 |
+
with a fresh set of fixtures as Cruz Azul and Club Leon square off at the Estadio
|
| 13 |
+
Olímpico Universitario on Saturday.
|
| 14 |
+
- text: Bavarian PM calls to stop refugee payments for Ukrainians Ambassador responds.
|
| 15 |
+
Read more
|
| 16 |
+
- text: HDFC Bank Bonus Issue One Share For Every One Held Board Approves Plan.
|
| 17 |
+
The record date for determining the eligible shareholders to receive HDFC Bank
|
| 18 |
+
bonus equity shares is Wednesday, Aug. 27, 2025.
|
| 19 |
+
- text: Finding Truth In Other Religions A Call For Openness. Christians do not have
|
| 20 |
+
to believe other religions are absolutely false, indeed, they can believe they
|
| 21 |
+
were inspired and lead to Christ.
|
| 22 |
+
metrics:
|
| 23 |
+
- accuracy
|
| 24 |
+
pipeline_tag: text-classification
|
| 25 |
+
library_name: setfit
|
| 26 |
+
inference: true
|
| 27 |
+
base_model: intfloat/multilingual-e5-base
|
| 28 |
+
model-index:
|
| 29 |
+
- name: SetFit with intfloat/multilingual-e5-base
|
| 30 |
+
results:
|
| 31 |
+
- task:
|
| 32 |
+
type: text-classification
|
| 33 |
+
name: Text Classification
|
| 34 |
+
dataset:
|
| 35 |
+
name: Unknown
|
| 36 |
+
type: unknown
|
| 37 |
+
split: test
|
| 38 |
+
metrics:
|
| 39 |
+
- type: accuracy
|
| 40 |
+
value: 0.8222222222222222
|
| 41 |
+
name: Accuracy
|
| 42 |
+
---
|
| 43 |
+
|
| 44 |
+
# SetFit with intfloat/multilingual-e5-base
|
| 45 |
+
|
| 46 |
+
This is a [SetFit](https://github.com/huggingface/setfit) model that can be used for Text Classification. This SetFit model uses [intfloat/multilingual-e5-base](https://huggingface.co/intfloat/multilingual-e5-base) as the Sentence Transformer embedding model. A [LogisticRegression](https://scikit-learn.org/stable/modules/generated/sklearn.linear_model.LogisticRegression.html) instance is used for classification.
|
| 47 |
+
|
| 48 |
+
The model has been trained using an efficient few-shot learning technique that involves:
|
| 49 |
+
|
| 50 |
+
1. Fine-tuning a [Sentence Transformer](https://www.sbert.net) with contrastive learning.
|
| 51 |
+
2. Training a classification head with features from the fine-tuned Sentence Transformer.
|
| 52 |
+
|
| 53 |
+
## Model Details
|
| 54 |
+
|
| 55 |
+
### Model Description
|
| 56 |
+
- **Model Type:** SetFit
|
| 57 |
+
- **Sentence Transformer body:** [intfloat/multilingual-e5-base](https://huggingface.co/intfloat/multilingual-e5-base)
|
| 58 |
+
- **Classification head:** a [LogisticRegression](https://scikit-learn.org/stable/modules/generated/sklearn.linear_model.LogisticRegression.html) instance
|
| 59 |
+
- **Maximum Sequence Length:** 512 tokens
|
| 60 |
+
- **Number of Classes:** 12 classes
|
| 61 |
+
<!-- - **Training Dataset:** [Unknown](https://huggingface.co/datasets/unknown) -->
|
| 62 |
+
<!-- - **Language:** Unknown -->
|
| 63 |
+
<!-- - **License:** Unknown -->
|
| 64 |
+
|
| 65 |
+
### Model Sources
|
| 66 |
+
|
| 67 |
+
- **Repository:** [SetFit on GitHub](https://github.com/huggingface/setfit)
|
| 68 |
+
- **Paper:** [Efficient Few-Shot Learning Without Prompts](https://arxiv.org/abs/2209.11055)
|
| 69 |
+
- **Blogpost:** [SetFit: Efficient Few-Shot Learning Without Prompts](https://huggingface.co/blog/setfit)
|
| 70 |
+
|
| 71 |
+
### Model Labels
|
| 72 |
+
| Label | Examples |
|
| 73 |
+
|:--------------|:------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|
|
| 74 |
+
| Business | <ul><li>'Atour stock price target raised to 39 by Macquarie By Investing. Atour stock price target raised to 39 by Macquarie'</li><li>'1 Smart Growth Stock to Buy With Under 100 in August. Upstart is on track to generate over 1 billion in annual revenue for the first time in its history.'</li><li>'Circle shares climb as Q2 revenue surges 53 on Stablecoin demand. Circle Internet Group shares rose on Tuesday after the company reported its first quarterly earnings as a public company.'</li></ul> |
|
| 75 |
+
| Politics | <ul><li>'Mieke Vogels Condemns Climate Violence.. Understands Radicalization Amid Belgium s OCAD Report Fallout. Climate activism in Belgium faces concerns over radicalization, as GroenPlus chair Mieke Vogels urges understanding of youth climate urgency.'</li><li>'The Paradox of Slavery in American History. Juneteenth marks the end of slavery in the U.S., yet the legacy of human bondage extends far beyond American shores. From African complicity in the slave trade to Black slaveholders in early America, and the persistence of slavery in parts of modern Africa, this article explores the often overlooked complexities of a global and ongoing issue.'</li><li>'Government of Egypt, UNHCR and UNDP Launch Egypt Refugee and Resilience Response Plan. Government of Egypt, UNHCR and UNDP Launch Egypt Refugee and Resilience Response Plan'</li></ul> |
|
| 76 |
+
| Entertainment | <ul><li>'Proms in the Park back in West Bridgford with Wild Boys headlining. The award-winning Proms in the Park returns to Bridgford Park in West Bridgford on Saturday June 28 from 12.30pm to 9pm with live 80s band Wild Boys'</li><li>'Marvellous thriller with Adolescence and Line of Duty stars streaming free. This underrated period thriller which originally aired on BBC One is now available to watch for free'</li><li>'Jadakiss Reflects On The Lox, Dipset Verzuz Battle I Was Out Of My Mind. Jadakiss reflects on The Lox s legendary Verzuz battle against Dipset in his new podcast with Fat Joe.'</li></ul> |
|
| 77 |
+
| Crime | <ul><li>'Fake buyer dupes seller of four split ACs worth Rs 2 lakh, arrested. Excelsior Correspondent JAMMU, Aug 8 Police have arrested two individuals involved in a fraud case where four split AC units worth nearly Rs 2 lakh were deceitfully taken from a seller. The case came to light after Karamjeet Singh, a resident of Sanjay Nagar, reported that he received a call on August 5 from an unknown number regarding the purchase of four split air conditioners. Believing the caller, Singh sent the units through an auto-rickshaw to the provided location. Upon'</li><li>'Stanislaus Co. worker exposes personal data of nearly 10,000 veterans. The email was initially sent at 2 09 p.m. Monday, followed by a message from the same employee at 3 18 p.m. stating, Please delete, email sent in error.'</li><li>'Odisha Islamists attack ambulance during Muharram procession. An ambulance carrying critically ill children was attacked by an Islamist mob during a Muharram procession in Remuna, Balasore'</li></ul> |
|
| 78 |
+
| Science | <ul><li>'Lost monuments of the people of the cloud forest unearthed at Gran Pajatén. The World Monuments Fund WMF has announced the discovery of more than 100 previously undocumented structures at Gran Pajatén, located within Peru s Río Abiseo National Park.'</li><li>'Green ammonia revolution New electrolyte strategy boosts sustainable fertilizer production. A joint international research team has, for the first time, unveiled the crucial link between the structure of the solid electrolyte interphase SEI and the efficiency of lithium-mediated nitrogen reduction to ammonia, a promising eco-friendly approach to fertilizer production. Using in situ spectroscopy, the team directly observed the previously poorly understood SEI formation process, revealing that the ethanol-to-water ratio in the electrolyte significantly impacts ammonia conversion efficiency. This discovery opens a new avenue for sustainable fertilizer production by reducing reliance on fossil fuels and lowering greenhouse gas emissions.'</li><li>'The Kessler Effect The Haunted Housewives. Author Christopher Lee Jones spoke about the Kessler Effect-- the problem of accumulating space debris. Followed by Theresa Argie and Cathi Weber, known as the Haunted Housewives, with insights from their paranormal investigations.'</li></ul> |
|
| 79 |
+
| Lifestyle | <ul><li>'These are the 15 best things to do in Houston this weekend. weekend event planner'</li><li>'No Better Place to Be Locals embrace Open Day. The team at Capricorn Adventist Retirement Plus rolled out the welcome mat recently for a special open day event, offering ...'</li><li>'Carter s Memorial Day Sale offers 50 off sitewide with deals starting from just 2. Carter s Memorial Day Sale offers 50 off sitewide with deals starting from just 2. Prices are as marked. Customers receive free delivery on orders of 35 or more. One of our top picks from this sale is the 2-Piece Mickey Mouse Polo Shirt and Shorts that s marked down to 19 and originally sold for 38.'</li></ul> |
|
| 80 |
+
| Education | <ul><li>'5 best traditional learning techniques that parents need to teach their children. While modern education is heavily influenced by gadgets, online videos, and digital apps, there s something irreplaceably beautiful about traditional learning techniques. These aren t just old-school methods they are rooted in culture, tested across generations, and carry a kind of warmth that modern tools can never replicate. Many of these techniques don t just aim at stuffing information into the brain they help children build patience, deepen memory, and develop emotional bonding with the learning process itself. Here are 5 such forgotten gems that deserve a comeback.'</li><li>'Classroom Central supports students, teachers for upcoming school year. Christina Klukow, who teaches at Tuckaseegee Elementary, is going into her 14th year of teaching. She said she teaches fourth grade at the best school.'</li><li>'Most Chosen By Older Students. Find the right college for you. Search colleges by cost, size, location, and more to find your best fit.'</li></ul> |
|
| 81 |
+
| Sports | <ul><li>'Siraj Bowls to Harry Maguire, Pant Takes Penalty as Bruno Fernandes Watches Team India Joins Man Utd in Epic Crossover. In a memorable sporting crossover, the Indian cricket team on Sunday linked up with players of the world-renowned football club Manchester United and exchanged jerseys and pleasantries while engaging in some light-hearted drills., Cricket, Times Now'</li><li>'Probable Biggest Trade Moves Between IPL Teams Ahead 2026 Season. The IPL franchises will be looking to compose their teams and be in a position of strength from now on. Here are some trade moves between IPL franchises that can surprise the fans and experts.'</li><li>'La Liga 2025 26 live streaming When does the Spanish league season begin? When and where to watch in India?. Football News La Liga is set to begin on Friday, with Barcelona, Real Madrid, and Atletico Madrid vying for the title. Barcelona, the defending champions, are deter'</li></ul> |
|
| 82 |
+
| Health | <ul><li>'Doctor s five foods that help you full for longer and lose weight. A weight loss expert shared the five foods he recommends to anyone wanting to feel full for longer and shed pounds'</li><li>'Extracellular Vesicles Delivered by a Nanofiber-Hydrogel Composite Enhance Healing In Vivo in a Model of Crohn s Disease Perianal Fistula. ARTICLE Extracellular Vesicles Delivered by a Nanofiber-Hydrogel Composite Enhance Healing In Vivo in a Model of Crohn s Disease Perianal Fistula AUTHORS Ling Li, Zhicheng Yao, Kevan J Salimian5, Jiayuan Kong, Atif Zaheer, Alyssa Parian, Susan L Gearhart, Hai-Quan Mao, Florin M Selaru JOURNAL Adv Healthc Mater. 2025 Mar 14 7 e2402292. doi 10.1002 adhm.202402292. Epub 2024 Sep 6. Abstract Perianal fistulas represent a common, aggressive, and disabling complication of Crohn s disease CD .'</li><li>'Beating the Odds Diagnosed with Stage IV Lung Cancer at 44. At 44, Jennifer Olson was diagnosed with stage IV lung cancer. Ten years later, she s in remission and sharing her powerful story of survival, faith, and resilience. Discover how she beat the odds, found support, and continues to inspire others facing lung cancer.'</li></ul> |
|
| 83 |
+
| General News | <ul><li>'Miss Maddy U d by Yur GF s stepDd. You may like these posts'</li><li>'What s that going to be next to Calvary Baptist Church?. An Edwardsville business will be moving to a new location.'</li><li>'Several Bright Explosions Captured Over Newburgh, New York. A security camera captured two explosive bursts of light that appeared over Newburgh, New York in the early morning hours this weekend.'</li></ul> |
|
| 84 |
+
| Technology | <ul><li>'Centre launches RailOne super app to streamline all passenger services. The Centre on Tuesday launched RailOne , a super app designed to serve as a one-stop platform for all railway-related queries, passenger needs and services INDIA BEYOND'</li><li>'Cherishville s Summer 2025 in Second Life. As I noted back in 2018, America s historic Route 66 has been a popular theme for Second Life region designs over the years. In fact I made the observation about Motorheadz Café Route66, designed by ROCKET Rocket Biedermann - see Another trip on Route 66 in Second Life. Another popular Route 66 destination from'</li><li>'M2 MacBook Air is available with Rs 30,000 discount on Flipkart. Looking for a great laptop deal? The MacBook Air M2 is now under Rs 70,000 on Flipkart powerful, sleek, and packed with impressive features.'</li></ul> |
|
| 85 |
+
| Religion | <ul><li>'Religion growing in importance for S poreans IPS study. Read more at straitstimes. Read more at straitstimes.'</li><li>'Islam s Greatest Stories of Love. Premieres Friday, Aug. 22, 2025 at 8 p.m. on KPBS 2 PBS app. This powerful two-hour documentary about how a heartbroken woman finds solace is told in five great love stories from the Islamic tradition. At the heart of the film is Ariella Gayotto Hohl, a young Muslim woman grappling with the loss of her beloved father.'</li><li>'Free Methodist World Missions. North Macedonia Pray for pastors and leaders as they seek to overcome racial issues, grow the body of Christ and develop healthy disciples.'</li></ul> |
|
| 86 |
+
|
| 87 |
+
## Evaluation
|
| 88 |
+
|
| 89 |
+
### Metrics
|
| 90 |
+
| Label | Accuracy |
|
| 91 |
+
|:--------|:---------|
|
| 92 |
+
| **all** | 0.8222 |
|
| 93 |
+
|
| 94 |
+
## Uses
|
| 95 |
+
|
| 96 |
+
### Direct Use for Inference
|
| 97 |
+
|
| 98 |
+
First install the SetFit library:
|
| 99 |
+
|
| 100 |
+
```bash
|
| 101 |
+
pip install setfit
|
| 102 |
+
```
|
| 103 |
+
|
| 104 |
+
Then you can load this model and run inference.
|
| 105 |
+
|
| 106 |
+
```python
|
| 107 |
+
from setfit import SetFitModel
|
| 108 |
+
|
| 109 |
+
# Download from the 🤗 Hub
|
| 110 |
+
model = SetFitModel.from_pretrained("setfit_model_id")
|
| 111 |
+
# Run inference
|
| 112 |
+
preds = model("Bavarian PM calls to stop refugee payments for Ukrainians Ambassador responds. Read more")
|
| 113 |
+
```
|
| 114 |
+
|
| 115 |
+
<!--
|
| 116 |
+
### Downstream Use
|
| 117 |
+
|
| 118 |
+
*List how someone could finetune this model on their own dataset.*
|
| 119 |
+
-->
|
| 120 |
+
|
| 121 |
+
<!--
|
| 122 |
+
### Out-of-Scope Use
|
| 123 |
+
|
| 124 |
+
*List how the model may foreseeably be misused and address what users ought not to do with the model.*
|
| 125 |
+
-->
|
| 126 |
+
|
| 127 |
+
<!--
|
| 128 |
+
## Bias, Risks and Limitations
|
| 129 |
+
|
| 130 |
+
*What are the known or foreseeable issues stemming from this model? You could also flag here known failure cases or weaknesses of the model.*
|
| 131 |
+
-->
|
| 132 |
+
|
| 133 |
+
<!--
|
| 134 |
+
### Recommendations
|
| 135 |
+
|
| 136 |
+
*What are recommendations with respect to the foreseeable issues? For example, filtering explicit content.*
|
| 137 |
+
-->
|
| 138 |
+
|
| 139 |
+
## Training Details
|
| 140 |
+
|
| 141 |
+
### Training Set Metrics
|
| 142 |
+
| Training set | Min | Median | Max |
|
| 143 |
+
|:-------------|:----|:--------|:----|
|
| 144 |
+
| Word count | 2 | 42.6906 | 454 |
|
| 145 |
+
|
| 146 |
+
| Label | Training Sample Count |
|
| 147 |
+
|:--------------|:----------------------|
|
| 148 |
+
| Business | 346 |
|
| 149 |
+
| Sports | 244 |
|
| 150 |
+
| Politics | 210 |
|
| 151 |
+
| Lifestyle | 186 |
|
| 152 |
+
| General News | 186 |
|
| 153 |
+
| Entertainment | 150 |
|
| 154 |
+
| Crime | 98 |
|
| 155 |
+
| Technology | 71 |
|
| 156 |
+
| Health | 70 |
|
| 157 |
+
| Science | 30 |
|
| 158 |
+
| Religion | 13 |
|
| 159 |
+
| Education | 12 |
|
| 160 |
+
|
| 161 |
+
### Training Hyperparameters
|
| 162 |
+
- batch_size: (16, 16)
|
| 163 |
+
- num_epochs: (5, 5)
|
| 164 |
+
- max_steps: -1
|
| 165 |
+
- sampling_strategy: oversampling
|
| 166 |
+
- num_iterations: 10
|
| 167 |
+
- body_learning_rate: (2e-05, 1e-05)
|
| 168 |
+
- head_learning_rate: 0.01
|
| 169 |
+
- loss: CosineSimilarityLoss
|
| 170 |
+
- distance_metric: cosine_distance
|
| 171 |
+
- margin: 0.25
|
| 172 |
+
- end_to_end: False
|
| 173 |
+
- use_amp: False
|
| 174 |
+
- warmup_proportion: 0.1
|
| 175 |
+
- l2_weight: 0.01
|
| 176 |
+
- seed: 42
|
| 177 |
+
- eval_max_steps: -1
|
| 178 |
+
- load_best_model_at_end: False
|
| 179 |
+
|
| 180 |
+
### Training Results
|
| 181 |
+
| Epoch | Step | Training Loss | Validation Loss |
|
| 182 |
+
|:------:|:-----:|:-------------:|:---------------:|
|
| 183 |
+
| 0.0005 | 1 | 0.1861 | - |
|
| 184 |
+
| 0.0248 | 50 | 0.3204 | - |
|
| 185 |
+
| 0.0495 | 100 | 0.2765 | - |
|
| 186 |
+
| 0.0743 | 150 | 0.2462 | - |
|
| 187 |
+
| 0.0990 | 200 | 0.2192 | - |
|
| 188 |
+
| 0.1238 | 250 | 0.1755 | - |
|
| 189 |
+
| 0.1485 | 300 | 0.135 | - |
|
| 190 |
+
| 0.1733 | 350 | 0.1135 | - |
|
| 191 |
+
| 0.1980 | 400 | 0.092 | - |
|
| 192 |
+
| 0.2228 | 450 | 0.0885 | - |
|
| 193 |
+
| 0.2475 | 500 | 0.0739 | - |
|
| 194 |
+
| 0.2723 | 550 | 0.0762 | - |
|
| 195 |
+
| 0.2970 | 600 | 0.0688 | - |
|
| 196 |
+
| 0.3218 | 650 | 0.0633 | - |
|
| 197 |
+
| 0.3465 | 700 | 0.0535 | - |
|
| 198 |
+
| 0.3713 | 750 | 0.0363 | - |
|
| 199 |
+
| 0.3960 | 800 | 0.0388 | - |
|
| 200 |
+
| 0.4208 | 850 | 0.0339 | - |
|
| 201 |
+
| 0.4455 | 900 | 0.0265 | - |
|
| 202 |
+
| 0.4703 | 950 | 0.0344 | - |
|
| 203 |
+
| 0.4950 | 1000 | 0.016 | - |
|
| 204 |
+
| 0.5198 | 1050 | 0.0231 | - |
|
| 205 |
+
| 0.5446 | 1100 | 0.0152 | - |
|
| 206 |
+
| 0.5693 | 1150 | 0.0118 | - |
|
| 207 |
+
| 0.5941 | 1200 | 0.0102 | - |
|
| 208 |
+
| 0.6188 | 1250 | 0.0089 | - |
|
| 209 |
+
| 0.6436 | 1300 | 0.0125 | - |
|
| 210 |
+
| 0.6683 | 1350 | 0.0082 | - |
|
| 211 |
+
| 0.6931 | 1400 | 0.004 | - |
|
| 212 |
+
| 0.7178 | 1450 | 0.004 | - |
|
| 213 |
+
| 0.7426 | 1500 | 0.0062 | - |
|
| 214 |
+
| 0.7673 | 1550 | 0.004 | - |
|
| 215 |
+
| 0.7921 | 1600 | 0.0039 | - |
|
| 216 |
+
| 0.8168 | 1650 | 0.0111 | - |
|
| 217 |
+
| 0.8416 | 1700 | 0.0024 | - |
|
| 218 |
+
| 0.8663 | 1750 | 0.0047 | - |
|
| 219 |
+
| 0.8911 | 1800 | 0.0013 | - |
|
| 220 |
+
| 0.9158 | 1850 | 0.0023 | - |
|
| 221 |
+
| 0.9406 | 1900 | 0.0039 | - |
|
| 222 |
+
| 0.9653 | 1950 | 0.0036 | - |
|
| 223 |
+
| 0.9901 | 2000 | 0.004 | - |
|
| 224 |
+
| 1.0149 | 2050 | 0.0007 | - |
|
| 225 |
+
| 1.0396 | 2100 | 0.001 | - |
|
| 226 |
+
| 1.0644 | 2150 | 0.0029 | - |
|
| 227 |
+
| 1.0891 | 2200 | 0.0005 | - |
|
| 228 |
+
| 1.1139 | 2250 | 0.0005 | - |
|
| 229 |
+
| 1.1386 | 2300 | 0.0006 | - |
|
| 230 |
+
| 1.1634 | 2350 | 0.0003 | - |
|
| 231 |
+
| 1.1881 | 2400 | 0.0002 | - |
|
| 232 |
+
| 1.2129 | 2450 | 0.0018 | - |
|
| 233 |
+
| 1.2376 | 2500 | 0.0013 | - |
|
| 234 |
+
| 1.2624 | 2550 | 0.0039 | - |
|
| 235 |
+
| 1.2871 | 2600 | 0.0025 | - |
|
| 236 |
+
| 1.3119 | 2650 | 0.0025 | - |
|
| 237 |
+
| 1.3366 | 2700 | 0.0013 | - |
|
| 238 |
+
| 1.3614 | 2750 | 0.0017 | - |
|
| 239 |
+
| 1.3861 | 2800 | 0.0005 | - |
|
| 240 |
+
| 1.4109 | 2850 | 0.0012 | - |
|
| 241 |
+
| 1.4356 | 2900 | 0.0002 | - |
|
| 242 |
+
| 1.4604 | 2950 | 0.0006 | - |
|
| 243 |
+
| 1.4851 | 3000 | 0.0017 | - |
|
| 244 |
+
| 1.5099 | 3050 | 0.0004 | - |
|
| 245 |
+
| 1.5347 | 3100 | 0.0002 | - |
|
| 246 |
+
| 1.5594 | 3150 | 0.0015 | - |
|
| 247 |
+
| 1.5842 | 3200 | 0.0002 | - |
|
| 248 |
+
| 1.6089 | 3250 | 0.0002 | - |
|
| 249 |
+
| 1.6337 | 3300 | 0.0023 | - |
|
| 250 |
+
| 1.6584 | 3350 | 0.0025 | - |
|
| 251 |
+
| 1.6832 | 3400 | 0.0002 | - |
|
| 252 |
+
| 1.7079 | 3450 | 0.0006 | - |
|
| 253 |
+
| 1.7327 | 3500 | 0.0006 | - |
|
| 254 |
+
| 1.7574 | 3550 | 0.0014 | - |
|
| 255 |
+
| 1.7822 | 3600 | 0.0003 | - |
|
| 256 |
+
| 1.8069 | 3650 | 0.0024 | - |
|
| 257 |
+
| 1.8317 | 3700 | 0.0003 | - |
|
| 258 |
+
| 1.8564 | 3750 | 0.001 | - |
|
| 259 |
+
| 1.8812 | 3800 | 0.0005 | - |
|
| 260 |
+
| 1.9059 | 3850 | 0.0014 | - |
|
| 261 |
+
| 1.9307 | 3900 | 0.0007 | - |
|
| 262 |
+
| 1.9554 | 3950 | 0.0016 | - |
|
| 263 |
+
| 1.9802 | 4000 | 0.0013 | - |
|
| 264 |
+
| 2.0050 | 4050 | 0.0007 | - |
|
| 265 |
+
| 2.0297 | 4100 | 0.001 | - |
|
| 266 |
+
| 2.0545 | 4150 | 0.0005 | - |
|
| 267 |
+
| 2.0792 | 4200 | 0.0002 | - |
|
| 268 |
+
| 2.1040 | 4250 | 0.0001 | - |
|
| 269 |
+
| 2.1287 | 4300 | 0.0003 | - |
|
| 270 |
+
| 2.1535 | 4350 | 0.0001 | - |
|
| 271 |
+
| 2.1782 | 4400 | 0.0009 | - |
|
| 272 |
+
| 2.2030 | 4450 | 0.0002 | - |
|
| 273 |
+
| 2.2277 | 4500 | 0.0004 | - |
|
| 274 |
+
| 2.2525 | 4550 | 0.0003 | - |
|
| 275 |
+
| 2.2772 | 4600 | 0.0001 | - |
|
| 276 |
+
| 2.3020 | 4650 | 0.0001 | - |
|
| 277 |
+
| 2.3267 | 4700 | 0.0011 | - |
|
| 278 |
+
| 2.3515 | 4750 | 0.0016 | - |
|
| 279 |
+
| 2.3762 | 4800 | 0.0004 | - |
|
| 280 |
+
| 2.4010 | 4850 | 0.0002 | - |
|
| 281 |
+
| 2.4257 | 4900 | 0.0001 | - |
|
| 282 |
+
| 2.4505 | 4950 | 0.0004 | - |
|
| 283 |
+
| 2.4752 | 5000 | 0.0001 | - |
|
| 284 |
+
| 2.5 | 5050 | 0.0002 | - |
|
| 285 |
+
| 2.5248 | 5100 | 0.0017 | - |
|
| 286 |
+
| 2.5495 | 5150 | 0.0002 | - |
|
| 287 |
+
| 2.5743 | 5200 | 0.0001 | - |
|
| 288 |
+
| 2.5990 | 5250 | 0.0013 | - |
|
| 289 |
+
| 2.6238 | 5300 | 0.0014 | - |
|
| 290 |
+
| 2.6485 | 5350 | 0.0001 | - |
|
| 291 |
+
| 2.6733 | 5400 | 0.0001 | - |
|
| 292 |
+
| 2.6980 | 5450 | 0.0001 | - |
|
| 293 |
+
| 2.7228 | 5500 | 0.0001 | - |
|
| 294 |
+
| 2.7475 | 5550 | 0.0001 | - |
|
| 295 |
+
| 2.7723 | 5600 | 0.0001 | - |
|
| 296 |
+
| 2.7970 | 5650 | 0.0001 | - |
|
| 297 |
+
| 2.8218 | 5700 | 0.0 | - |
|
| 298 |
+
| 2.8465 | 5750 | 0.0 | - |
|
| 299 |
+
| 2.8713 | 5800 | 0.0012 | - |
|
| 300 |
+
| 2.8960 | 5850 | 0.0001 | - |
|
| 301 |
+
| 2.9208 | 5900 | 0.0001 | - |
|
| 302 |
+
| 2.9455 | 5950 | 0.0003 | - |
|
| 303 |
+
| 2.9703 | 6000 | 0.0001 | - |
|
| 304 |
+
| 2.9950 | 6050 | 0.0001 | - |
|
| 305 |
+
| 3.0198 | 6100 | 0.0 | - |
|
| 306 |
+
| 3.0446 | 6150 | 0.0 | - |
|
| 307 |
+
| 3.0693 | 6200 | 0.0 | - |
|
| 308 |
+
| 3.0941 | 6250 | 0.0 | - |
|
| 309 |
+
| 3.1188 | 6300 | 0.0 | - |
|
| 310 |
+
| 3.1436 | 6350 | 0.0 | - |
|
| 311 |
+
| 3.1683 | 6400 | 0.0 | - |
|
| 312 |
+
| 3.1931 | 6450 | 0.0001 | - |
|
| 313 |
+
| 3.2178 | 6500 | 0.0001 | - |
|
| 314 |
+
| 3.2426 | 6550 | 0.0001 | - |
|
| 315 |
+
| 3.2673 | 6600 | 0.0 | - |
|
| 316 |
+
| 3.2921 | 6650 | 0.0 | - |
|
| 317 |
+
| 3.3168 | 6700 | 0.0 | - |
|
| 318 |
+
| 3.3416 | 6750 | 0.0 | - |
|
| 319 |
+
| 3.3663 | 6800 | 0.0 | - |
|
| 320 |
+
| 3.3911 | 6850 | 0.0012 | - |
|
| 321 |
+
| 3.4158 | 6900 | 0.0013 | - |
|
| 322 |
+
| 3.4406 | 6950 | 0.0001 | - |
|
| 323 |
+
| 3.4653 | 7000 | 0.001 | - |
|
| 324 |
+
| 3.4901 | 7050 | 0.0001 | - |
|
| 325 |
+
| 3.5149 | 7100 | 0.0002 | - |
|
| 326 |
+
| 3.5396 | 7150 | 0.0002 | - |
|
| 327 |
+
| 3.5644 | 7200 | 0.0001 | - |
|
| 328 |
+
| 3.5891 | 7250 | 0.0001 | - |
|
| 329 |
+
| 3.6139 | 7300 | 0.0002 | - |
|
| 330 |
+
| 3.6386 | 7350 | 0.0001 | - |
|
| 331 |
+
| 3.6634 | 7400 | 0.0001 | - |
|
| 332 |
+
| 3.6881 | 7450 | 0.0013 | - |
|
| 333 |
+
| 3.7129 | 7500 | 0.0001 | - |
|
| 334 |
+
| 3.7376 | 7550 | 0.0 | - |
|
| 335 |
+
| 3.7624 | 7600 | 0.0 | - |
|
| 336 |
+
| 3.7871 | 7650 | 0.0 | - |
|
| 337 |
+
| 3.8119 | 7700 | 0.0 | - |
|
| 338 |
+
| 3.8366 | 7750 | 0.0 | - |
|
| 339 |
+
| 3.8614 | 7800 | 0.0 | - |
|
| 340 |
+
| 3.8861 | 7850 | 0.0 | - |
|
| 341 |
+
| 3.9109 | 7900 | 0.0 | - |
|
| 342 |
+
| 3.9356 | 7950 | 0.0 | - |
|
| 343 |
+
| 3.9604 | 8000 | 0.0 | - |
|
| 344 |
+
| 3.9851 | 8050 | 0.0 | - |
|
| 345 |
+
| 4.0099 | 8100 | 0.0001 | - |
|
| 346 |
+
| 4.0347 | 8150 | 0.0 | - |
|
| 347 |
+
| 4.0594 | 8200 | 0.0 | - |
|
| 348 |
+
| 4.0842 | 8250 | 0.0 | - |
|
| 349 |
+
| 4.1089 | 8300 | 0.0 | - |
|
| 350 |
+
| 4.1337 | 8350 | 0.0 | - |
|
| 351 |
+
| 4.1584 | 8400 | 0.0 | - |
|
| 352 |
+
| 4.1832 | 8450 | 0.0 | - |
|
| 353 |
+
| 4.2079 | 8500 | 0.0 | - |
|
| 354 |
+
| 4.2327 | 8550 | 0.0 | - |
|
| 355 |
+
| 4.2574 | 8600 | 0.0 | - |
|
| 356 |
+
| 4.2822 | 8650 | 0.0 | - |
|
| 357 |
+
| 4.3069 | 8700 | 0.0 | - |
|
| 358 |
+
| 4.3317 | 8750 | 0.0 | - |
|
| 359 |
+
| 4.3564 | 8800 | 0.0 | - |
|
| 360 |
+
| 4.3812 | 8850 | 0.0 | - |
|
| 361 |
+
| 4.4059 | 8900 | 0.0 | - |
|
| 362 |
+
| 4.4307 | 8950 | 0.0 | - |
|
| 363 |
+
| 4.4554 | 9000 | 0.0 | - |
|
| 364 |
+
| 4.4802 | 9050 | 0.0 | - |
|
| 365 |
+
| 4.5050 | 9100 | 0.0 | - |
|
| 366 |
+
| 4.5297 | 9150 | 0.0 | - |
|
| 367 |
+
| 4.5545 | 9200 | 0.0 | - |
|
| 368 |
+
| 4.5792 | 9250 | 0.0008 | - |
|
| 369 |
+
| 4.6040 | 9300 | 0.0001 | - |
|
| 370 |
+
| 4.6287 | 9350 | 0.0 | - |
|
| 371 |
+
| 4.6535 | 9400 | 0.0 | - |
|
| 372 |
+
| 4.6782 | 9450 | 0.0 | - |
|
| 373 |
+
| 4.7030 | 9500 | 0.0 | - |
|
| 374 |
+
| 4.7277 | 9550 | 0.0013 | - |
|
| 375 |
+
| 4.7525 | 9600 | 0.0001 | - |
|
| 376 |
+
| 4.7772 | 9650 | 0.0 | - |
|
| 377 |
+
| 4.8020 | 9700 | 0.0001 | - |
|
| 378 |
+
| 4.8267 | 9750 | 0.0 | - |
|
| 379 |
+
| 4.8515 | 9800 | 0.0 | - |
|
| 380 |
+
| 4.8762 | 9850 | 0.0 | - |
|
| 381 |
+
| 4.9010 | 9900 | 0.0 | - |
|
| 382 |
+
| 4.9257 | 9950 | 0.0001 | - |
|
| 383 |
+
| 4.9505 | 10000 | 0.0 | - |
|
| 384 |
+
| 4.9752 | 10050 | 0.0 | - |
|
| 385 |
+
| 5.0 | 10100 | 0.0001 | - |
|
| 386 |
+
|
| 387 |
+
### Framework Versions
|
| 388 |
+
- Python: 3.10.12
|
| 389 |
+
- SetFit: 1.1.3
|
| 390 |
+
- Sentence Transformers: 5.1.0
|
| 391 |
+
- Transformers: 4.55.2
|
| 392 |
+
- PyTorch: 2.7.1+cu118
|
| 393 |
+
- Datasets: 4.0.0
|
| 394 |
+
- Tokenizers: 0.21.4
|
| 395 |
+
|
| 396 |
+
## Citation
|
| 397 |
+
|
| 398 |
+
### BibTeX
|
| 399 |
+
```bibtex
|
| 400 |
+
@article{https://doi.org/10.48550/arxiv.2209.11055,
|
| 401 |
+
doi = {10.48550/ARXIV.2209.11055},
|
| 402 |
+
url = {https://arxiv.org/abs/2209.11055},
|
| 403 |
+
author = {Tunstall, Lewis and Reimers, Nils and Jo, Unso Eun Seo and Bates, Luke and Korat, Daniel and Wasserblat, Moshe and Pereg, Oren},
|
| 404 |
+
keywords = {Computation and Language (cs.CL), FOS: Computer and information sciences, FOS: Computer and information sciences},
|
| 405 |
+
title = {Efficient Few-Shot Learning Without Prompts},
|
| 406 |
+
publisher = {arXiv},
|
| 407 |
+
year = {2022},
|
| 408 |
+
copyright = {Creative Commons Attribution 4.0 International}
|
| 409 |
+
}
|
| 410 |
+
```
|
| 411 |
+
|
| 412 |
+
<!--
|
| 413 |
+
## Glossary
|
| 414 |
+
|
| 415 |
+
*Clearly define terms in order to be accessible across audiences.*
|
| 416 |
+
-->
|
| 417 |
+
|
| 418 |
+
<!--
|
| 419 |
+
## Model Card Authors
|
| 420 |
+
|
| 421 |
+
*Lists the people who create the model card, providing recognition and accountability for the detailed work that goes into its construction.*
|
| 422 |
+
-->
|
| 423 |
+
|
| 424 |
+
<!--
|
| 425 |
+
## Model Card Contact
|
| 426 |
+
|
| 427 |
+
*Provides a way for people who have updates to the Model Card, suggestions, or questions, to contact the Model Card authors.*
|
| 428 |
+
-->
|
config.json
ADDED
|
@@ -0,0 +1,27 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"architectures": [
|
| 3 |
+
"XLMRobertaModel"
|
| 4 |
+
],
|
| 5 |
+
"attention_probs_dropout_prob": 0.1,
|
| 6 |
+
"bos_token_id": 0,
|
| 7 |
+
"classifier_dropout": null,
|
| 8 |
+
"eos_token_id": 2,
|
| 9 |
+
"hidden_act": "gelu",
|
| 10 |
+
"hidden_dropout_prob": 0.1,
|
| 11 |
+
"hidden_size": 768,
|
| 12 |
+
"initializer_range": 0.02,
|
| 13 |
+
"intermediate_size": 3072,
|
| 14 |
+
"layer_norm_eps": 1e-05,
|
| 15 |
+
"max_position_embeddings": 514,
|
| 16 |
+
"model_type": "xlm-roberta",
|
| 17 |
+
"num_attention_heads": 12,
|
| 18 |
+
"num_hidden_layers": 12,
|
| 19 |
+
"output_past": true,
|
| 20 |
+
"pad_token_id": 1,
|
| 21 |
+
"position_embedding_type": "absolute",
|
| 22 |
+
"torch_dtype": "float32",
|
| 23 |
+
"transformers_version": "4.55.2",
|
| 24 |
+
"type_vocab_size": 1,
|
| 25 |
+
"use_cache": true,
|
| 26 |
+
"vocab_size": 250002
|
| 27 |
+
}
|
config_sentence_transformers.json
ADDED
|
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"model_type": "SentenceTransformer",
|
| 3 |
+
"__version__": {
|
| 4 |
+
"sentence_transformers": "5.1.0",
|
| 5 |
+
"transformers": "4.55.2",
|
| 6 |
+
"pytorch": "2.7.1+cu118"
|
| 7 |
+
},
|
| 8 |
+
"prompts": {
|
| 9 |
+
"query": "",
|
| 10 |
+
"document": ""
|
| 11 |
+
},
|
| 12 |
+
"default_prompt_name": null,
|
| 13 |
+
"similarity_fn_name": "cosine"
|
| 14 |
+
}
|
config_setfit.json
ADDED
|
@@ -0,0 +1,17 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"labels": [
|
| 3 |
+
"Business",
|
| 4 |
+
"Sports",
|
| 5 |
+
"Politics",
|
| 6 |
+
"Lifestyle",
|
| 7 |
+
"General News",
|
| 8 |
+
"Entertainment",
|
| 9 |
+
"Crime",
|
| 10 |
+
"Technology",
|
| 11 |
+
"Health",
|
| 12 |
+
"Science",
|
| 13 |
+
"Religion",
|
| 14 |
+
"Education"
|
| 15 |
+
],
|
| 16 |
+
"normalize_embeddings": false
|
| 17 |
+
}
|
model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a8fd2f98d0a89a73d43df9c2f5bb5695e5e9805c2a997f64dcfea380747ae6a9
|
| 3 |
+
size 1112197096
|
model_head.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:71f16511fe2b5a59ca1a69dba4b4367efb212dbfc1fecc204e4acf68cea1cc02
|
| 3 |
+
size 75287
|
modules.json
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"idx": 0,
|
| 4 |
+
"name": "0",
|
| 5 |
+
"path": "",
|
| 6 |
+
"type": "sentence_transformers.models.Transformer"
|
| 7 |
+
},
|
| 8 |
+
{
|
| 9 |
+
"idx": 1,
|
| 10 |
+
"name": "1",
|
| 11 |
+
"path": "1_Pooling",
|
| 12 |
+
"type": "sentence_transformers.models.Pooling"
|
| 13 |
+
},
|
| 14 |
+
{
|
| 15 |
+
"idx": 2,
|
| 16 |
+
"name": "2",
|
| 17 |
+
"path": "2_Normalize",
|
| 18 |
+
"type": "sentence_transformers.models.Normalize"
|
| 19 |
+
}
|
| 20 |
+
]
|
sentence_bert_config.json
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"max_seq_length": 512,
|
| 3 |
+
"do_lower_case": false
|
| 4 |
+
}
|
special_tokens_map.json
ADDED
|
@@ -0,0 +1,51 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"bos_token": {
|
| 3 |
+
"content": "<s>",
|
| 4 |
+
"lstrip": false,
|
| 5 |
+
"normalized": false,
|
| 6 |
+
"rstrip": false,
|
| 7 |
+
"single_word": false
|
| 8 |
+
},
|
| 9 |
+
"cls_token": {
|
| 10 |
+
"content": "<s>",
|
| 11 |
+
"lstrip": false,
|
| 12 |
+
"normalized": false,
|
| 13 |
+
"rstrip": false,
|
| 14 |
+
"single_word": false
|
| 15 |
+
},
|
| 16 |
+
"eos_token": {
|
| 17 |
+
"content": "</s>",
|
| 18 |
+
"lstrip": false,
|
| 19 |
+
"normalized": false,
|
| 20 |
+
"rstrip": false,
|
| 21 |
+
"single_word": false
|
| 22 |
+
},
|
| 23 |
+
"mask_token": {
|
| 24 |
+
"content": "<mask>",
|
| 25 |
+
"lstrip": true,
|
| 26 |
+
"normalized": false,
|
| 27 |
+
"rstrip": false,
|
| 28 |
+
"single_word": false
|
| 29 |
+
},
|
| 30 |
+
"pad_token": {
|
| 31 |
+
"content": "<pad>",
|
| 32 |
+
"lstrip": false,
|
| 33 |
+
"normalized": false,
|
| 34 |
+
"rstrip": false,
|
| 35 |
+
"single_word": false
|
| 36 |
+
},
|
| 37 |
+
"sep_token": {
|
| 38 |
+
"content": "</s>",
|
| 39 |
+
"lstrip": false,
|
| 40 |
+
"normalized": false,
|
| 41 |
+
"rstrip": false,
|
| 42 |
+
"single_word": false
|
| 43 |
+
},
|
| 44 |
+
"unk_token": {
|
| 45 |
+
"content": "<unk>",
|
| 46 |
+
"lstrip": false,
|
| 47 |
+
"normalized": false,
|
| 48 |
+
"rstrip": false,
|
| 49 |
+
"single_word": false
|
| 50 |
+
}
|
| 51 |
+
}
|
tokenizer.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:883b037111086fd4dfebbbc9b7cee11e1517b5e0c0514879478661440f137085
|
| 3 |
+
size 17082987
|
tokenizer_config.json
ADDED
|
@@ -0,0 +1,55 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"added_tokens_decoder": {
|
| 3 |
+
"0": {
|
| 4 |
+
"content": "<s>",
|
| 5 |
+
"lstrip": false,
|
| 6 |
+
"normalized": false,
|
| 7 |
+
"rstrip": false,
|
| 8 |
+
"single_word": false,
|
| 9 |
+
"special": true
|
| 10 |
+
},
|
| 11 |
+
"1": {
|
| 12 |
+
"content": "<pad>",
|
| 13 |
+
"lstrip": false,
|
| 14 |
+
"normalized": false,
|
| 15 |
+
"rstrip": false,
|
| 16 |
+
"single_word": false,
|
| 17 |
+
"special": true
|
| 18 |
+
},
|
| 19 |
+
"2": {
|
| 20 |
+
"content": "</s>",
|
| 21 |
+
"lstrip": false,
|
| 22 |
+
"normalized": false,
|
| 23 |
+
"rstrip": false,
|
| 24 |
+
"single_word": false,
|
| 25 |
+
"special": true
|
| 26 |
+
},
|
| 27 |
+
"3": {
|
| 28 |
+
"content": "<unk>",
|
| 29 |
+
"lstrip": false,
|
| 30 |
+
"normalized": false,
|
| 31 |
+
"rstrip": false,
|
| 32 |
+
"single_word": false,
|
| 33 |
+
"special": true
|
| 34 |
+
},
|
| 35 |
+
"250001": {
|
| 36 |
+
"content": "<mask>",
|
| 37 |
+
"lstrip": true,
|
| 38 |
+
"normalized": false,
|
| 39 |
+
"rstrip": false,
|
| 40 |
+
"single_word": false,
|
| 41 |
+
"special": true
|
| 42 |
+
}
|
| 43 |
+
},
|
| 44 |
+
"bos_token": "<s>",
|
| 45 |
+
"clean_up_tokenization_spaces": true,
|
| 46 |
+
"cls_token": "<s>",
|
| 47 |
+
"eos_token": "</s>",
|
| 48 |
+
"extra_special_tokens": {},
|
| 49 |
+
"mask_token": "<mask>",
|
| 50 |
+
"model_max_length": 512,
|
| 51 |
+
"pad_token": "<pad>",
|
| 52 |
+
"sep_token": "</s>",
|
| 53 |
+
"tokenizer_class": "XLMRobertaTokenizer",
|
| 54 |
+
"unk_token": "<unk>"
|
| 55 |
+
}
|