Add new SentenceTransformer model
Browse files
- 1_Pooling/config.json +10 -0
- README.md +567 -0
- config.json +23 -0
- config_sentence_transformers.json +10 -0
- model.safetensors +3 -0
- modules.json +20 -0
- sentence_bert_config.json +4 -0
- special_tokens_map.json +51 -0
- tokenizer.json +0 -0
- tokenizer_config.json +73 -0
- vocab.txt +0 -0
1_Pooling/config.json
ADDED
|
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"word_embedding_dimension": 768,
|
| 3 |
+
"pooling_mode_cls_token": false,
|
| 4 |
+
"pooling_mode_mean_tokens": true,
|
| 5 |
+
"pooling_mode_max_tokens": false,
|
| 6 |
+
"pooling_mode_mean_sqrt_len_tokens": false,
|
| 7 |
+
"pooling_mode_weightedmean_tokens": false,
|
| 8 |
+
"pooling_mode_lasttoken": false,
|
| 9 |
+
"include_prompt": true
|
| 10 |
+
}
|
README.md
ADDED
|
@@ -0,0 +1,567 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
---
|
| 2 |
+
tags:
|
| 3 |
+
- sentence-transformers
|
| 4 |
+
- sentence-similarity
|
| 5 |
+
- feature-extraction
|
| 6 |
+
- generated_from_trainer
|
| 7 |
+
- dataset_size:108121
|
| 8 |
+
- loss:TripletLoss
|
| 9 |
+
base_model: sentence-transformers/all-mpnet-base-v2
|
| 10 |
+
widget:
|
| 11 |
+
- source_sentence: "NAME: Zucchini, Peppers, and Tomatoes\n\nCATEGORY: Lunch/Snacks\n\
|
| 12 |
+
\nKEYWORDS: Peppers, Vegetable, Low Protein, Low Cholesterol, < 60 Mins, Inexpensive,\
|
| 13 |
+
\ Lunch/Snacks\n\nTOOLS: pan\n\nINGREDIENTS: zucchini, butter, olive oil, onion,\
|
| 14 |
+
\ bell pepper, chopped tomato, basil, oregano, feta cheese, parmesan cheese, black\
|
| 15 |
+
\ olive\n\nINSTRUCTIONS: \nWash, trim, and slice zucchini.\nSalt zucchini lightly\
|
| 16 |
+
\ and allow to drain for about ten minutes, then pat dry.\nHeat the butter and\
|
| 17 |
+
\ oil, sauté onions until wilted.\nAdd the zucchini and peppers, cook 2 to 3 minutes.\n\
|
| 18 |
+
Stir in tomatoes, herbs, and add salt and pepper to taste.\nCook 4 to 5 minutes,\
|
| 19 |
+
\ or until the vegetables are tender.\nIf the tomatoes are especially juicy, cook\
|
| 20 |
+
\ briefly over high heat to reduce pan juices.\nRemove from heat, stir in optional\
|
| 21 |
+
\ feta and olives or parmesan, if desired."
|
| 22 |
+
sentences:
|
| 23 |
+
- "NAME: Zuvers Barbecue Sauce\n\nCATEGORY: Sauces\n\nKEYWORDS: < 30 Mins, Sauces\n\
|
| 24 |
+
\nTOOLS: sauce pan, separate bowl\n\nINGREDIENTS: molasses, ketchup, apple cider\
|
| 25 |
+
\ vinegar, worcestershire sauce, liquid smoke, brown sugar, onion powder, chili\
|
| 26 |
+
\ powder, dry mustard, garlic powder, cornstarch, water\n\nINSTRUCTIONS: \nMix\
|
| 27 |
+
\ first 5 ingredients in sauce pan. Turn burner on low.\nMix next 5 dry ingredients\
|
| 28 |
+
\ in a separate bowl, and stir into the wet ingredients a little at a time, to\
|
| 29 |
+
\ make sure everything is smooth.\nOnce it is all mixed together, turn burner\
|
| 30 |
+
\ to medium and bring to a simmer, stirring occassionally. Simmer 15 minutes\
|
| 31 |
+
\ to meld flavors.\nMix cornstarch and water, stir into sauce and simmer 5 more\
|
| 32 |
+
\ minutes."
|
| 33 |
+
- "NAME: Honey BBQ Wings Like Kfc's\n\nCATEGORY: < 4 Hours\n\nKEYWORDS: < 4 Hours\n\
|
| 34 |
+
\nTOOLS: cooling rack, small saucepan\n\nINGREDIENTS: purpose flour, salt, black\
|
| 35 |
+
\ pepper, chicken wing, bbq sauce, honey\n\nINSTRUCTIONS: \nIn a shallow dish,\
|
| 36 |
+
\ combine flour, salt, and pepper.\nCoat chicken in flour mixture; refrigerate\
|
| 37 |
+
\ for 1 hour; coat chicken again with remaining flour mixture.\nIn a small saucepan,\
|
| 38 |
+
\ heat BBQ sauce and honey until warm; turn heat to low and keep warm.\nDeep-fry\
|
| 39 |
+
\ chicken, 8-10 pieces at a time, in 375 degree oil for 13 minutes.\nDrain chicken\
|
| 40 |
+
\ on cooling racks.\nImmediately toss fried chicken with BBQ sauce mixture.\n\
|
| 41 |
+
Repeat with remaining chicken."
|
| 42 |
+
- "NAME: Whipped Carrots\n\nCATEGORY: Vegetable\n\nKEYWORDS: Low Protein, < 60 Mins,\
|
| 43 |
+
\ Easy, Vegetable\n\nTOOLS: peeler, mixer, mixing bowl, large saucepan, knife\n\
|
| 44 |
+
\nINGREDIENTS: carrot, butter, nutmeg, milk, salt\n\nINSTRUCTIONS: \nWash the\
|
| 45 |
+
\ carrots and peel and trim ends.\nCut the carrots in half and place in a large\
|
| 46 |
+
\ saucepan with enough water to cover them. Add salt and bring to a boil.\nCook\
|
| 47 |
+
\ until tender.\nDrain the carrots and place them in a mixing bowl. Add milk,\
|
| 48 |
+
\ butter and nutmeg. Beat with an electric beater until smooth."
|
| 49 |
+
- source_sentence: "NAME: Beef and Cabbage Soup a La Shoneys\n\nCATEGORY: Low Cholesterol\n\
|
| 50 |
+
\nKEYWORDS: < 60 Mins, Low Cholesterol\n\nTOOLS: knife, pan\n\nINGREDIENTS: ground\
|
| 51 |
+
\ beef, cabbage, celery rib, bell pepper, onion, kidney bean, tomato, beef bouillon\
|
| 52 |
+
\ cube, garlic clove, worcestershire sauce, water, pepper\n\nINSTRUCTIONS: \n\
|
| 53 |
+
Dice the vegetables.\nBrown the ground beef.\nDrain.\nAdd onion, celery, bell\
|
| 54 |
+
\ pepper and garlic.\nCook until wilted.\nAdd the diced cabbage.\nAdd tomatoes\
|
| 55 |
+
\ juice and all.\nAdd Worcestershire sauce.\nAdd pepper.\nAdd 2 cups water.\n\
|
| 56 |
+
add boullion cubes\nAdd drained beans.\nCook 30 minutes."
|
| 57 |
+
sentences:
|
| 58 |
+
- "NAME: Lemon Cupcakes\n\nCATEGORY: Dessert\n\nKEYWORDS: Lemon, Citrus, Fruit,\
|
| 59 |
+
\ < 60 Mins, Dessert\n\nTOOLS: oven, wire rack, spatula, mixing bowl, cake pan,\
|
| 60 |
+
\ eletric mixer, toothpick\n\nINGREDIENTS: butter, butter, lemon, white flour,\
|
| 61 |
+
\ baking powder, salt, egg, sugar, butter, powdered sugar, lemon juice\n\nINSTRUCTIONS:\
|
| 62 |
+
\ \nPreheat the oven to 325°F Insert liners into medium cupcake pans.\nPrepare\
|
| 63 |
+
\ cupcakes. Melt butter and lemon zest on low heat; the heat helps release the\
|
| 64 |
+
\ flavors and spice the butter.\nIn a bowl, sift flour, baking powder and salt.\n\
|
| 65 |
+
Place eggs and sugar in a mixing bowl, beating on medium speed.\nGradually add\
|
| 66 |
+
\ in the dry ingredients, alternating with the melted butter and mix until mixture\
|
| 67 |
+
\ is light and airy.\nFill the cupcake liners two-third full.\nBake for 20-25\
|
| 68 |
+
\ minutes or until cupcakes are springy to the touch and a toothpick inserted\
|
| 69 |
+
\ in cupcake's center comes out clean.\nRemove from oven and cool on wire rack\
|
| 70 |
+
\ for 10 minutes.\nPrepare glaze: in an eletric mixer,beat butter with powdered\
|
| 71 |
+
\ sugar and lemon juice until frosting is integrated and smooth (add 1 more tablespoon\
|
| 72 |
+
\ of lemon juice for creamier texture if desired).\nUsing a spatula, spread frosting\
|
| 73 |
+
\ on each cupcake, decorating with lemon zest."
|
| 74 |
+
- "NAME: Scones\n\nCATEGORY: Scones\n\nKEYWORDS: Quick Breads, Breads, Healthy,\
|
| 75 |
+
\ Kid Friendly, Brunch, < 15 Mins, Easy, Scones\n\nTOOLS: bowl, knife, glass\n\
|
| 76 |
+
\nINGREDIENTS: self raising flour, salt, butter, milk, flour\n\nINSTRUCTIONS:\
|
| 77 |
+
\ \nSift flour and salt into a bowl.\nMelt butter and pour into flour.\nAdd milk\
|
| 78 |
+
\ gradually, stirring with a knife, until you have a moist dough.\nTurn onto a\
|
| 79 |
+
\ floured board, knead lightly, then press dough out until it is about 1 inch\
|
| 80 |
+
\ thick.\nCut with a cookie cutter or glass, and place on a hot floured tray,\
|
| 81 |
+
\ with each scone touching.\nBake at 220C for 10-15 minutes.\nServe hot with chilled\
|
| 82 |
+
\ butter, and strawberry jam!"
|
| 83 |
+
- "NAME: Asparagus, Bean, and Feta Salad\n\nCATEGORY: Vegetable\n\nKEYWORDS: Low\
|
| 84 |
+
\ Cholesterol, Healthy, < 30 Mins, Easy, Vegetable\n\nTOOLS: steamer, large bowl,\
|
| 85 |
+
\ whisk\n\nINGREDIENTS: asparagus, cannellini bean, radish, feta cheese, green\
|
| 86 |
+
\ onion, lemon juice, mint, olive oil, salt, black pepper\n\nINSTRUCTIONS: \n\
|
| 87 |
+
steam the asparagus, covered, 2 minutes or until crsip-tender. Rinse asparagus\
|
| 88 |
+
\ with cold water and drain.\nCombine asparagus and next 4 ingredients in a large\
|
| 89 |
+
\ bowl.\nCombine the juice and remaining ingredients in a small bowl; stir well\
|
| 90 |
+
\ with a whisk. Pour over asparagus mixture and toss gently to coat."
|
| 91 |
+
- source_sentence: "NAME: Lemon Broccoli\n\nCATEGORY: Vegetable\n\nKEYWORDS: Low Protein,\
|
| 92 |
+
\ < 15 Mins, Stove Top, Easy, Vegetable\n\nTOOLS: \n\nINGREDIENTS: broccoli floret,\
|
| 93 |
+
\ lemon juice, butter, lemon rind\n\nINSTRUCTIONS: \nSteam florets until they\
|
| 94 |
+
\ are crisp-tender, about 6 minutes.\nDrain well.\nToss with lemon juice, butter,\
|
| 95 |
+
\ and lemon rind."
|
| 96 |
+
sentences:
|
| 97 |
+
- "NAME: Party Pinwheels\n\nCATEGORY: < 30 Mins\n\nKEYWORDS: Easy, < 30 Mins\n\n\
|
| 98 |
+
TOOLS: platter, bowl\n\nINGREDIENTS: cream cheese, dill weed, green onion, bell\
|
| 99 |
+
\ pepper, celery, flour tortilla, salsa\n\nINSTRUCTIONS: \nMix first three ingredients\
|
| 100 |
+
\ together. Mix well.\nSpread on Tortillas.\nIf using peppers and/or celery sprinkle\
|
| 101 |
+
\ over tortillas.\nRoll up each tortilla tightly.\nWrap in saran wrap.\nChill\
|
| 102 |
+
\ at least 2 hours. I recommend overnight.\nBefore serving, slice into 1 inch\
|
| 103 |
+
\ slices and put on platter. Serve with a bowl of salsa or taco sauce."
|
| 104 |
+
- "NAME: Healthy Veggie Scramble\n\nCATEGORY: Breakfast\n\nKEYWORDS: Vegetable,\
|
| 105 |
+
\ Very Low Carbs, < 15 Mins, Easy, Breakfast\n\nTOOLS: \n\nINGREDIENTS: egg, spinach,\
|
| 106 |
+
\ onion, green pepper, mushroom, tomato\n\nINSTRUCTIONS: \nSautee veggies with\
|
| 107 |
+
\ non-fat cooking spray, add scrambled eggs, cook until done."
|
| 108 |
+
- "NAME: Baked Banana Oatmeal\n\nCATEGORY: Breakfast\n\nKEYWORDS: Healthy, Kid Friendly,\
|
| 109 |
+
\ Brunch, < 60 Mins, Easy, From Scratch, Breakfast\n\nTOOLS: oven, knife, prepared\
|
| 110 |
+
\ pan\n\nINGREDIENTS: rolled oat, oat, baking powder, salt, cinnamon, sugar, egg,\
|
| 111 |
+
\ banana, skim milk, vanilla, brown sugar\n\nINSTRUCTIONS: \nPreheat oven to 375.\n\
|
| 112 |
+
Spray an 8 inch square pan with cooking spray.\nStir together oats, baking powder,\
|
| 113 |
+
\ salt and cinnamon.\nAdd sugar, an egg, 1 mashed banana, milk and vanilla. Stir\
|
| 114 |
+
\ just until combined.\nPour into prepared pan and top with a layer of sliced\
|
| 115 |
+
\ bananas.\nBake for 25 minutes.\nTop with brown sugar and broil until golden.\
|
| 116 |
+
\ About 3-4 minutes, but watch it carefully!"
|
| 117 |
+
- source_sentence: "NAME: Carrots and Mushrooms Saute\n\nCATEGORY: Vegetable\n\nKEYWORDS:\
|
| 118 |
+
\ European, Low Protein, Low Cholesterol, Hanukkah, < 60 Mins, Stove Top, Easy,\
|
| 119 |
+
\ Vegetable\n\nTOOLS: large skillet, pot, medium saucepan\n\nINGREDIENTS: carrot,\
|
| 120 |
+
\ olive oil, garlic clove, mushroom, sugar, dry thyme, salt, black pepper\n\n\
|
| 121 |
+
INSTRUCTIONS: \nPlace carrots in a medium saucepan. Add water to cover by one\
|
| 122 |
+
\ inch. Bring to a boil. Partially cover and boil until tender crisp, about\
|
| 123 |
+
\ 5-8 minutes. Drain.\nHeat olive oil in a large skillet over medium low heat.\
|
| 124 |
+
\ Add garlic and mushrooms and saute, stirring occasionally, until mushroom liquid\
|
| 125 |
+
\ evaporates, about 6 minutes.\nAdd carrots, sugar, thyme, salt and pepper, cover\
|
| 126 |
+
\ and cook over low heat 15 minutes. Uncover, remove garlic; discard. Increase\
|
| 127 |
+
\ heat to medium-high; cook, stirring often, until carrots and mushrooms are very\
|
| 128 |
+
\ lightly browned, 2-5 minutes."
|
| 129 |
+
sentences:
|
| 130 |
+
- "NAME: Yummy Garlicky Green Beans\n\nCATEGORY: Vegetable\n\nKEYWORDS: Low Protein,\
|
| 131 |
+
\ Low Cholesterol, < 30 Mins, Easy, Vegetable\n\nTOOLS: skillet, pan, knife block\n\
|
| 132 |
+
\nINGREDIENTS: olive oil, green bean, salt, garlic clove\n\nINSTRUCTIONS: \nHeat\
|
| 133 |
+
\ the olive oil in a skillet on medium heat. Add green beans making sure that\
|
| 134 |
+
\ olive oil is distributed evenly, season with salt depending on your taste. Saute\
|
| 135 |
+
\ for about 10-15 minutes until softened but still crispy. Add minced garlic coating\
|
| 136 |
+
\ all green beans evenly for about 2-3 minutes, not too long as you don't want\
|
| 137 |
+
\ the garlic to brown at all--this can leave a bitter flavor. Immediately take\
|
| 138 |
+
\ off heat, let sit for another 2-3 minute Enjoy!\nI love garlic and usually use\
|
| 139 |
+
\ the 6 cloves, but you can use less to your taste."
|
| 140 |
+
- "NAME: Ramadan Date Bars\n\nCATEGORY: Bar Cookie\n\nKEYWORDS: Dessert, Cookie\
|
| 141 |
+
\ & Brownie, Fruit, Toddler Friendly, Kid Friendly, Ramadan, < 60 Mins, Easy,\
|
| 142 |
+
\ Bar Cookie\n\nTOOLS: knife, oven, mixer, pan\n\nINGREDIENTS: butter, brown sugar,\
|
| 143 |
+
\ egg, vanilla essence, self raising flour, date, walnut\n\nINSTRUCTIONS: \nPreheat\
|
| 144 |
+
\ oven to 350 F.\nCream the butter and sugar together.\nBeat in the egg and vanilla\
|
| 145 |
+
\ essence.\nFold in the flour, mix well.\nadd in chopped dates and walnuts.\n\
|
| 146 |
+
baked in a greased 9x13 pan for 20 - 25 minutes\ncut into bars or squares when\
|
| 147 |
+
\ cooled."
|
| 148 |
+
- "NAME: Easiest BBQ Chicken Ever\n\nCATEGORY: Chicken\n\nKEYWORDS: Poultry, Meat,\
|
| 149 |
+
\ Weeknight, Oven, < 4 Hours, Easy, Chicken\n\nTOOLS: glass casserole dish, oven,\
|
| 150 |
+
\ glass\n\nINGREDIENTS: chicken breast, bbq sauce, brown sugar, butter, chili\
|
| 151 |
+
\ powder\n\nINSTRUCTIONS: \nMelt butter in glass casserole dish, put in frozen\
|
| 152 |
+
\ chicken, top with brown sugar, chili powder and pour bbq sauce over; bake at\
|
| 153 |
+
\ 400 for one hour."
|
| 154 |
+
- source_sentence: "NAME: Lemon-Limeade Concentrate\n\nCATEGORY: Beverages\n\nKEYWORDS:\
|
| 155 |
+
\ Lemon, Lime, Citrus, Fruit, Canadian, Low Protein, Low Cholesterol, Healthy,\
|
| 156 |
+
\ Summer, < 15 Mins, Refrigerator, Beginner Cook, Stove Top, Easy, Beverages\n\
|
| 157 |
+
\nTOOLS: pot, fridge\n\nINGREDIENTS: sugar, water, lemon juice, lime juice\n\n\
|
| 158 |
+
INSTRUCTIONS: \nCombine sugar and water.\nBring to a boil, stirring occasionally.\n\
|
| 159 |
+
Boil 5 minutes, stirring occasionally.\nLet cool.\nStir in lemon and lime juices.\n\
|
| 160 |
+
Put in a jar with a tight fitting lid.\nSeal and refrigerate at least 6 hours\
|
| 161 |
+
\ before using.\nThis can be kept in the fridge for up to 2 weeks."
|
| 162 |
+
sentences:
|
| 163 |
+
- "NAME: Party Punch Ice Ring\n\nCATEGORY: Punch Beverage\n\nKEYWORDS: Beverages,\
|
| 164 |
+
\ Fruit, Low Protein, Low Cholesterol, Healthy, Free Of..., Potluck, Spring, Summer,\
|
| 165 |
+
\ Winter, Christmas, Hanukkah, Ramadan, Weeknight, St. Patrick's Day, Freezer,\
|
| 166 |
+
\ < 4 Hours, Easy, Punch Beverage\n\nTOOLS: punch bowl\n\nINGREDIENTS: ginger\
|
| 167 |
+
\ ale, lemon juice\n\nINSTRUCTIONS: \nDecoration suggestions:\nApricot halves.\n\
|
| 168 |
+
mint leaves.\norange peel.\ngreen grapes.\nstrawberries.\nMix ginger ale with\
|
| 169 |
+
\ lemon juice.\nPour 2 1/2 cups of the mixture into a 1 quart ring.\nFreeze.\n\
|
| 170 |
+
Arrange desired decorations on top of the ice.\nSlowly, pour remaining juice mixture\
|
| 171 |
+
\ over the top so that you don't disturb your decorations.\nFreeze -- To unmold,\
|
| 172 |
+
\ run cold water over the bottom; it will then slip out.\nFloat in the top of\
|
| 173 |
+
\ your punch bowl for a very pretty presentation."
|
| 174 |
+
- "NAME: Crock Pot Cream of Spinach Soup\n\nCATEGORY: Spinach\n\nKEYWORDS: Cheese,\
|
| 175 |
+
\ Greens, Vegetable, Very Low Carbs, Winter, Brunch, < 15 Mins, Beginner Cook,\
|
| 176 |
+
\ Easy, Inexpensive, Spinach\n\nTOOLS: to crock pot, pan\n\nINGREDIENTS: frozen\
|
| 177 |
+
\ spinach, cream cheese, milk, chicken broth, onion, cayenne pepper, paprika\n\
|
| 178 |
+
\nINSTRUCTIONS: \nDrain the spinach and add to crock pot.\nDump all the other\
|
| 179 |
+
\ ingredients into the crock pot.\nCook on low for 6-8 hours.\nENJOY!"
|
| 180 |
+
- "NAME: Spiced Mushrooms\n\nCATEGORY: Lunch/Snacks\n\nKEYWORDS: Vegetable, Asian,\
|
| 181 |
+
\ Indian, Low Protein, Vegan, Spicy, Savory, < 30 Mins, Lunch/Snacks\n\nTOOLS:\
|
| 182 |
+
\ bowl, wok, glass\n\nINGREDIENTS: button mushroom, ground cardamom, ground black\
|
| 183 |
+
\ pepper, ground nutmeg, ground cumin, ground coriander, ground turmeric, olive\
|
| 184 |
+
\ oil\n\nINSTRUCTIONS: \nPlace mushrooms into a large ceramic, glass or plastic\
|
| 185 |
+
\ bowl.\nCombine two thirds of oil, cardamom, pepper, nutmeg, cumin, coriander\
|
| 186 |
+
\ and turmeric in a small jug.\nPour mixture over mushrooms and toss well to coat\
|
| 187 |
+
\ mushrooms in mixture.\nSet aside to marinate for 15 minutes.\nHeat a wok over\
|
| 188 |
+
\ high heat until hot.\nAdd remaining oil and mushrooms and stir-fry for 3-4 minutes\
|
| 189 |
+
\ or until golden and just tender.\nServe hot."
|
| 190 |
+
pipeline_tag: sentence-similarity
|
| 191 |
+
library_name: sentence-transformers
|
| 192 |
+
metrics:
|
| 193 |
+
- cosine_accuracy
|
| 194 |
+
model-index:
|
| 195 |
+
- name: SentenceTransformer based on sentence-transformers/all-mpnet-base-v2
|
| 196 |
+
results:
|
| 197 |
+
- task:
|
| 198 |
+
type: triplet
|
| 199 |
+
name: Triplet
|
| 200 |
+
dataset:
|
| 201 |
+
name: dev
|
| 202 |
+
type: dev
|
| 203 |
+
metrics:
|
| 204 |
+
- type: cosine_accuracy
|
| 205 |
+
value: 0.9024872183799744
|
| 206 |
+
name: Cosine Accuracy
|
| 207 |
+
---
|
| 208 |
+
|
| 209 |
+
# SentenceTransformer based on sentence-transformers/all-mpnet-base-v2
|
| 210 |
+
|
| 211 |
+
This is a [sentence-transformers](https://www.SBERT.net) model fine-tuned from [sentence-transformers/all-mpnet-base-v2](https://huggingface.co/sentence-transformers/all-mpnet-base-v2). It maps sentences and paragraphs to a 768-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more.
|
| 212 |
+
|
| 213 |
+
## Model Details
|
| 214 |
+
|
| 215 |
+
### Model Description
|
| 216 |
+
- **Model Type:** Sentence Transformer
|
| 217 |
+
- **Base model:** [sentence-transformers/all-mpnet-base-v2](https://huggingface.co/sentence-transformers/all-mpnet-base-v2) <!-- at revision 12e86a3c702fc3c50205a8db88f0ec7c0b6b94a0 -->
|
| 218 |
+
- **Maximum Sequence Length:** 384 tokens
|
| 219 |
+
- **Output Dimensionality:** 768 dimensions
|
| 220 |
+
- **Similarity Function:** Cosine Similarity
|
| 221 |
+
<!-- - **Training Dataset:** Unknown -->
|
| 222 |
+
<!-- - **Language:** Unknown -->
|
| 223 |
+
<!-- - **License:** Unknown -->
|
| 224 |
+
|
| 225 |
+
### Model Sources
|
| 226 |
+
|
| 227 |
+
- **Documentation:** [Sentence Transformers Documentation](https://sbert.net)
|
| 228 |
+
- **Repository:** [Sentence Transformers on GitHub](https://github.com/UKPLab/sentence-transformers)
|
| 229 |
+
- **Hugging Face:** [Sentence Transformers on Hugging Face](https://huggingface.co/models?library=sentence-transformers)
|
| 230 |
+
|
| 231 |
+
### Full Model Architecture
|
| 232 |
+
|
| 233 |
+
```
|
| 234 |
+
SentenceTransformer(
|
| 235 |
+
(0): Transformer({'max_seq_length': 384, 'do_lower_case': False}) with Transformer model: MPNetModel
|
| 236 |
+
(1): Pooling({'word_embedding_dimension': 768, 'pooling_mode_cls_token': False, 'pooling_mode_mean_tokens': True, 'pooling_mode_max_tokens': False, 'pooling_mode_mean_sqrt_len_tokens': False, 'pooling_mode_weightedmean_tokens': False, 'pooling_mode_lasttoken': False, 'include_prompt': True})
|
| 237 |
+
(2): Normalize()
|
| 238 |
+
)
|
| 239 |
+
```
|
| 240 |
+
|
| 241 |
+
## Usage
|
| 242 |
+
|
| 243 |
+
### Direct Usage (Sentence Transformers)
|
| 244 |
+
|
| 245 |
+
First install the Sentence Transformers library:
|
| 246 |
+
|
| 247 |
+
```bash
|
| 248 |
+
pip install -U sentence-transformers
|
| 249 |
+
```
|
| 250 |
+
|
| 251 |
+
Then you can load this model and run inference.
|
| 252 |
+
```python
|
| 253 |
+
from sentence_transformers import SentenceTransformer
|
| 254 |
+
|
| 255 |
+
# Download from the 🤗 Hub
|
| 256 |
+
model = SentenceTransformer("GPTasty/TastyRecipesEmbedderV2")
|
| 257 |
+
# Run inference
|
| 258 |
+
sentences = [
|
| 259 |
+
'NAME: Lemon-Limeade Concentrate\n\nCATEGORY: Beverages\n\nKEYWORDS: Lemon, Lime, Citrus, Fruit, Canadian, Low Protein, Low Cholesterol, Healthy, Summer, < 15 Mins, Refrigerator, Beginner Cook, Stove Top, Easy, Beverages\n\nTOOLS: pot, fridge\n\nINGREDIENTS: sugar, water, lemon juice, lime juice\n\nINSTRUCTIONS: \nCombine sugar and water.\nBring to a boil, stirring occasionally.\nBoil 5 minutes, stirring occasionally.\nLet cool.\nStir in lemon and lime juices.\nPut in a jar with a tight fitting lid.\nSeal and refrigerate at least 6 hours before using.\nThis can be kept in the fridge for up to 2 weeks.',
|
| 260 |
+
"NAME: Party Punch Ice Ring\n\nCATEGORY: Punch Beverage\n\nKEYWORDS: Beverages, Fruit, Low Protein, Low Cholesterol, Healthy, Free Of..., Potluck, Spring, Summer, Winter, Christmas, Hanukkah, Ramadan, Weeknight, St. Patrick's Day, Freezer, < 4 Hours, Easy, Punch Beverage\n\nTOOLS: punch bowl\n\nINGREDIENTS: ginger ale, lemon juice\n\nINSTRUCTIONS: \nDecoration suggestions:\nApricot halves.\nmint leaves.\norange peel.\ngreen grapes.\nstrawberries.\nMix ginger ale with lemon juice.\nPour 2 1/2 cups of the mixture into a 1 quart ring.\nFreeze.\nArrange desired decorations on top of the ice.\nSlowly, pour remaining juice mixture over the top so that you don't disturb your decorations.\nFreeze -- To unmold, run cold water over the bottom; it will then slip out.\nFloat in the top of your punch bowl for a very pretty presentation.",
|
| 261 |
+
'NAME: Crock Pot Cream of Spinach Soup\n\nCATEGORY: Spinach\n\nKEYWORDS: Cheese, Greens, Vegetable, Very Low Carbs, Winter, Brunch, < 15 Mins, Beginner Cook, Easy, Inexpensive, Spinach\n\nTOOLS: to crock pot, pan\n\nINGREDIENTS: frozen spinach, cream cheese, milk, chicken broth, onion, cayenne pepper, paprika\n\nINSTRUCTIONS: \nDrain the spinach and add to crock pot.\nDump all the other ingredients into the crock pot.\nCook on low for 6-8 hours.\nENJOY!',
|
| 262 |
+
]
|
| 263 |
+
embeddings = model.encode(sentences)
|
| 264 |
+
print(embeddings.shape)
|
| 265 |
+
# (3, 768)
|
| 266 |
+
|
| 267 |
+
# Get the similarity scores for the embeddings
|
| 268 |
+
similarities = model.similarity(embeddings, embeddings)
|
| 269 |
+
print(similarities.shape)
|
| 270 |
+
# torch.Size([3, 3])
|
| 271 |
+
```
|
| 272 |
+
|
| 273 |
+
<!--
|
| 274 |
+
### Direct Usage (Transformers)
|
| 275 |
+
|
| 276 |
+
<details><summary>Click to see the direct usage in Transformers</summary>
|
| 277 |
+
|
| 278 |
+
</details>
|
| 279 |
+
-->
|
| 280 |
+
|
| 281 |
+
<!--
|
| 282 |
+
### Downstream Usage (Sentence Transformers)
|
| 283 |
+
|
| 284 |
+
You can finetune this model on your own dataset.
|
| 285 |
+
|
| 286 |
+
<details><summary>Click to expand</summary>
|
| 287 |
+
|
| 288 |
+
</details>
|
| 289 |
+
-->
|
| 290 |
+
|
| 291 |
+
<!--
|
| 292 |
+
### Out-of-Scope Use
|
| 293 |
+
|
| 294 |
+
*List how the model may foreseeably be misused and address what users ought not to do with the model.*
|
| 295 |
+
-->
|
| 296 |
+
|
| 297 |
+
## Evaluation
|
| 298 |
+
|
| 299 |
+
### Metrics
|
| 300 |
+
|
| 301 |
+
#### Triplet
|
| 302 |
+
|
| 303 |
+
* Dataset: `dev`
|
| 304 |
+
* Evaluated with [<code>TripletEvaluator</code>](https://sbert.net/docs/package_reference/sentence_transformer/evaluation.html#sentence_transformers.evaluation.TripletEvaluator)
|
| 305 |
+
|
| 306 |
+
| Metric | Value |
|
| 307 |
+
|:--------------------|:-----------|
|
| 308 |
+
| **cosine_accuracy** | **0.9025** |
|
| 309 |
+
|
| 310 |
+
<!--
|
| 311 |
+
## Bias, Risks and Limitations
|
| 312 |
+
|
| 313 |
+
*What are the known or foreseeable issues stemming from this model? You could also flag here known failure cases or weaknesses of the model.*
|
| 314 |
+
-->
|
| 315 |
+
|
| 316 |
+
<!--
|
| 317 |
+
### Recommendations
|
| 318 |
+
|
| 319 |
+
*What are recommendations with respect to the foreseeable issues? For example, filtering explicit content.*
|
| 320 |
+
-->
|
| 321 |
+
|
| 322 |
+
## Training Details
|
| 323 |
+
|
| 324 |
+
### Training Dataset
|
| 325 |
+
|
| 326 |
+
#### Unnamed Dataset
|
| 327 |
+
|
| 328 |
+
* Size: 108,121 training samples
|
| 329 |
+
* Columns: <code>sentence_0</code>, <code>sentence_1</code>, and <code>sentence_2</code>
|
| 330 |
+
* Approximate statistics based on the first 1000 samples:
|
| 331 |
+
| | sentence_0 | sentence_1 | sentence_2 |
|
| 332 |
+
|:--------|:-------------------------------------------------------------------------------------|:-------------------------------------------------------------------------------------|:-------------------------------------------------------------------------------------|
|
| 333 |
+
| type | string | string | string |
|
| 334 |
+
| details | <ul><li>min: 46 tokens</li><li>mean: 180.14 tokens</li><li>max: 384 tokens</li></ul> | <ul><li>min: 44 tokens</li><li>mean: 182.29 tokens</li><li>max: 384 tokens</li></ul> | <ul><li>min: 54 tokens</li><li>mean: 204.96 tokens</li><li>max: 384 tokens</li></ul> |
|
| 335 |
+
* Samples:
|
| 336 |
+
| sentence_0 | sentence_1 | sentence_2 |
|
| 337 |
+
|:-----------|:-----------|:-----------|
|
| 338 |
+
| <code>NAME: Cupcake Cream Cheese Frosting<br><br>CATEGORY: Dessert<br><br>KEYWORDS: < 15 Mins, Easy, Dessert<br><br>TOOLS: <br><br>INGREDIENTS: cream cheese, butter, vanilla, powdered sugar<br><br>INSTRUCTIONS: <br>Blend all ingredients until smooth.</code> | <code>NAME: Creamy Caramel Apple Cider<br><br>CATEGORY: Beverages<br><br>KEYWORDS: Thanksgiving, Halloween, Sweet, < 30 Mins, Easy, Beverages<br><br>TOOLS: medium saucepan, steamer, small chilled bowl<br><br>INGREDIENTS: heavy cream, brown sugar, apple cider, water, heavy cream, brown sugar<br><br>INSTRUCTIONS: <br>First, bring the cream and brown sugar to a boil in a medium saucepan over medium heat. Stir in the cider and the water and raise the heat to medium high, heating just until the cider begins to steam, about 4 minutes.<br>Divide among 4 mugs, top each one with 2 tablespoons of caramel whipped cream (recipe follows) and serve immediately.<br>Caramel Whipped Cream: In a small chilled bowl, whip the heavy cream with the brown sugar until soft peaks form.</code> | <code>NAME: My Mom's Burger Soup<br><br>CATEGORY: Potato<br><br>KEYWORDS: Vegetable, Meat, Kid Friendly, < 60 Mins, Easy, Potato<br><br>TOOLS: large pot, pan<br><br>INGREDIENTS: lean ground beef, onion, corn, tomato sauce, potato, water<br><br>INSTRUCTIONS: <br>Put ground beef and onion in a large pot, break up beef as it browns over medium heat.<br>When meat is browned, add corn, tomato sauce, then potatoes.<br>Add enough water to fill pot almost to the top (I use a 6qt. pot).<br>Bring to a boil, reduce heat and simmer until the potatoes are cooked.<br>Season with salt and pepper.<br>Serve with crusty bread and butter.</code> |
|
| 339 |
+
| <code>NAME: Green Bean & Bacon Wraps<br><br>CATEGORY: Beans<br><br>KEYWORDS: Low Protein, Low Cholesterol, < 60 Mins, Easy, Beans<br><br>TOOLS: baking dish, oven<br><br>INGREDIENTS: green bean, bacon<br><br>INSTRUCTIONS: <br>Drain water off of green beans.<br>Take five green beans and wrap with bacon end to end.<br>Lay in shallow baking dish.<br>Bake for 35 min at 375 degrees or until bacon is done.<br>Add salt and pepper to taste.</code> | <code>NAME: German Warm Cabbage Salad (Krautsalat)<br><br>CATEGORY: Vegetable<br><br>KEYWORDS: German, European, Low Protein, Low Cholesterol, Free Of..., Savory, < 60 Mins, Easy, Inexpensive, Vegetable<br><br>TOOLS: frying pan, knife<br><br>INGREDIENTS: cabbage, bacon, onion, cider vinegar, garlic<br><br>INSTRUCTIONS: <br>Cut the bacon into tiny bits.<br>Fry it in a big deep frying pan and fish out all the bits after they are crisp.<br>Cut up the onion and garlic and fry them in the bacon fat.<br>When they are brown, pour in the vinegar.<br>Bring it just up to a simmer, add all the cabbage and bacon, toss it as you would a salad, and serve it.<br>The cabbage doesn't cook, but it wilts a little under the hot vinegar.</code> | <code>NAME: Scandinavian Christmas Crispy Krumkake<br><br>CATEGORY: Dessert<br><br>KEYWORDS: Cookie & Brownie, Scandinavian, European, Christmas, < 30 Mins, Dessert<br><br>TOOLS: oven, knife, mixer, spoon, medium bowl<br><br>INGREDIENTS: sugar, butter, egg, milk, purpose flour, water<br><br>INSTRUCTIONS: <br>In a medium bowl, cream the sugar with the butter. Beat in the eggs until mixture is light and lemon colored. Beat in the milk and flour until blended and smooth. Let stand 30 minutes.<br>Preheat krumkake iron over medium heat on top of range until a drop of water sizzles when dropped on top.<br>Open iron; lightly brush inside top and bottom with shortening, oil or melted butter. Spoon 1 tablespoon batter onto center of hot iron. Close iron. Bake about 1 minute on each side until cookie is lightly browned. Insert tip of a knife under cookie to remove from iron; roll hot cookie into a cigar or cone shape. Cool on rack. Cookies become crisp as they cool. Repeat with remaining batter. Batter will thicken as you use it...</code> |
|
| 340 |
+
| <code>NAME: Orlando Bloom's Pasta Au Pistou<br><br>CATEGORY: Lunch/Snacks<br><br>KEYWORDS: Vegetable, Caribbean, Low Cholesterol, Healthy, < 30 Mins, Small Appliance, Lunch/Snacks<br><br>TOOLS: blender, saucepan, food processor<br><br>INGREDIENTS: spaghetti, parsley, basil, garlic clove, parmesan cheese, salt, olive oil, onion, tomato, brown sugar<br><br>INSTRUCTIONS: <br>Cook the pasta according to directions until al dente, then drain and rinse. Pour the pasta back into the saucepan, and replace the lid to keep warm.<br>In a blender or food processor, combine the parsley, basil, garlic, Parmesan, salt and 1 tablespoon of the oil. Process to a smooth paste.<br>Heat the remaining tablespoon of oil in a medium frying pan. Add the onion and cook, stirring occasionally, for about 7 minutes or until soft.<br>Add the tomatoes and cook for about 5 minutes. Reduce the heat and season, adding the brown sugar and cook for about 5 minutes.<br>Remove from the heat and stir in the herb mixture. Toss the pasta with the sauce and serve immediately.</code> | <code>NAME: Tomato and Basil Pasta<br><br>CATEGORY: Penne<br><br>KEYWORDS: Vegetable, European, Low Cholesterol, Toddler Friendly, Healthy, Kid Friendly, < 30 Mins, Beginner Cook, Easy, Inexpensive, Penne<br><br>TOOLS: knife, cooking pot, pan, potato masher, fork<br><br>INGREDIENTS: olive oil, garlic clove, basil, crushed red pepper flake, chopped tomato, pasta, parmesan cheese, romano cheese<br><br>INSTRUCTIONS: <br>Cook pasta as per box instructions.<br>While pasta is cooking, heat oil with copped garlic.<br>Add a handful of chopped FRESH basil.<br>Heat five minutes.<br>Slowly stir in chopped tomatoes, juice and all.<br>Add as much crushed red pepper flakes as you like, no more than 1 table.<br>Cook until tomatoes are soft enough to crush, about 20 minutes on med-low.<br>Crush tomatoes in pan with fork or potato masher.<br>Drain pasta and return to cooking pot.<br>Slowly add sauce and mix together.<br>It will look like not enough sauce to cover pasta, but this is a lite sauce and not to overpowering.<br>Add fresh grated parmasiano cheese or fresh romano ...</code> | <code>NAME: Spaghetti Kugel<br><br>CATEGORY: < 60 Mins<br><br>KEYWORDS: < 60 Mins<br><br>TOOLS: pan, baking dish<br><br>INGREDIENTS: cream cheese, butter, margarine, egg, sour cream, sugar, salt, vanilla, golden raisin, cinnamon<br><br>INSTRUCTIONS: <br>Cream cheese and butter, mixing until well blended.<br>Blend in eggs, sour cream, sugar, vanilla, and salt.<br>Add cooked spaghetti and raisins. Mix well.<br>Pour mixture into a 2 1/2 quart baking dish.<br>Sprinkle with cinnamon.<br>Bake at 375 degrees for 30 to 35 minutes or until set.</code> |
|
| 341 |
+
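* Loss: [<code>TripletLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#tripletloss) with these parameters (note: the model ends in a <code>Normalize()</code> module, so Euclidean distances between embeddings never exceed 2; a <code>triplet_margin</code> of 5 therefore cannot be satisfied and the loss cannot drop below 3, consistent with the plateau near 3.5 in the training logs):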
|
| 342 |
+
```json
|
| 343 |
+
{
|
| 344 |
+
"distance_metric": "TripletDistanceMetric.EUCLIDEAN",
|
| 345 |
+
"triplet_margin": 5
|
| 346 |
+
}
|
| 347 |
+
```
|
| 348 |
+
|
| 349 |
+
### Training Hyperparameters
|
| 350 |
+
#### Non-Default Hyperparameters
|
| 351 |
+
|
| 352 |
+
- `eval_strategy`: steps
|
| 353 |
+
- `num_train_epochs`: 1
|
| 354 |
+
- `fp16`: True
|
| 355 |
+
- `multi_dataset_batch_sampler`: round_robin
|
| 356 |
+
|
| 357 |
+
#### All Hyperparameters
|
| 358 |
+
<details><summary>Click to expand</summary>
|
| 359 |
+
|
| 360 |
+
- `overwrite_output_dir`: False
|
| 361 |
+
- `do_predict`: False
|
| 362 |
+
- `eval_strategy`: steps
|
| 363 |
+
- `prediction_loss_only`: True
|
| 364 |
+
- `per_device_train_batch_size`: 8
|
| 365 |
+
- `per_device_eval_batch_size`: 8
|
| 366 |
+
- `per_gpu_train_batch_size`: None
|
| 367 |
+
- `per_gpu_eval_batch_size`: None
|
| 368 |
+
- `gradient_accumulation_steps`: 1
|
| 369 |
+
- `eval_accumulation_steps`: None
|
| 370 |
+
- `torch_empty_cache_steps`: None
|
| 371 |
+
- `learning_rate`: 5e-05
|
| 372 |
+
- `weight_decay`: 0.0
|
| 373 |
+
- `adam_beta1`: 0.9
|
| 374 |
+
- `adam_beta2`: 0.999
|
| 375 |
+
- `adam_epsilon`: 1e-08
|
| 376 |
+
- `max_grad_norm`: 1.0
|
| 377 |
+
- `num_train_epochs`: 1
|
| 378 |
+
- `max_steps`: -1
|
| 379 |
+
- `lr_scheduler_type`: linear
|
| 380 |
+
- `lr_scheduler_kwargs`: {}
|
| 381 |
+
- `warmup_ratio`: 0.0
|
| 382 |
+
- `warmup_steps`: 0
|
| 383 |
+
- `log_level`: passive
|
| 384 |
+
- `log_level_replica`: warning
|
| 385 |
+
- `log_on_each_node`: True
|
| 386 |
+
- `logging_nan_inf_filter`: True
|
| 387 |
+
- `save_safetensors`: True
|
| 388 |
+
- `save_on_each_node`: False
|
| 389 |
+
- `save_only_model`: False
|
| 390 |
+
- `restore_callback_states_from_checkpoint`: False
|
| 391 |
+
- `no_cuda`: False
|
| 392 |
+
- `use_cpu`: False
|
| 393 |
+
- `use_mps_device`: False
|
| 394 |
+
- `seed`: 42
|
| 395 |
+
- `data_seed`: None
|
| 396 |
+
- `jit_mode_eval`: False
|
| 397 |
+
- `use_ipex`: False
|
| 398 |
+
- `bf16`: False
|
| 399 |
+
- `fp16`: True
|
| 400 |
+
- `fp16_opt_level`: O1
|
| 401 |
+
- `half_precision_backend`: auto
|
| 402 |
+
- `bf16_full_eval`: False
|
| 403 |
+
- `fp16_full_eval`: False
|
| 404 |
+
- `tf32`: None
|
| 405 |
+
- `local_rank`: 0
|
| 406 |
+
- `ddp_backend`: None
|
| 407 |
+
- `tpu_num_cores`: None
|
| 408 |
+
- `tpu_metrics_debug`: False
|
| 409 |
+
- `debug`: []
|
| 410 |
+
- `dataloader_drop_last`: False
|
| 411 |
+
- `dataloader_num_workers`: 0
|
| 412 |
+
- `dataloader_prefetch_factor`: None
|
| 413 |
+
- `past_index`: -1
|
| 414 |
+
- `disable_tqdm`: False
|
| 415 |
+
- `remove_unused_columns`: True
|
| 416 |
+
- `label_names`: None
|
| 417 |
+
- `load_best_model_at_end`: False
|
| 418 |
+
- `ignore_data_skip`: False
|
| 419 |
+
- `fsdp`: []
|
| 420 |
+
- `fsdp_min_num_params`: 0
|
| 421 |
+
- `fsdp_config`: {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}
|
| 422 |
+
- `tp_size`: 0
|
| 423 |
+
- `fsdp_transformer_layer_cls_to_wrap`: None
|
| 424 |
+
- `accelerator_config`: {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}
|
| 425 |
+
- `deepspeed`: None
|
| 426 |
+
- `label_smoothing_factor`: 0.0
|
| 427 |
+
- `optim`: adamw_torch
|
| 428 |
+
- `optim_args`: None
|
| 429 |
+
- `adafactor`: False
|
| 430 |
+
- `group_by_length`: False
|
| 431 |
+
- `length_column_name`: length
|
| 432 |
+
- `ddp_find_unused_parameters`: None
|
| 433 |
+
- `ddp_bucket_cap_mb`: None
|
| 434 |
+
- `ddp_broadcast_buffers`: False
|
| 435 |
+
- `dataloader_pin_memory`: True
|
| 436 |
+
- `dataloader_persistent_workers`: False
|
| 437 |
+
- `skip_memory_metrics`: True
|
| 438 |
+
- `use_legacy_prediction_loop`: False
|
| 439 |
+
- `push_to_hub`: False
|
| 440 |
+
- `resume_from_checkpoint`: None
|
| 441 |
+
- `hub_model_id`: None
|
| 442 |
+
- `hub_strategy`: every_save
|
| 443 |
+
- `hub_private_repo`: None
|
| 444 |
+
- `hub_always_push`: False
|
| 445 |
+
- `gradient_checkpointing`: False
|
| 446 |
+
- `gradient_checkpointing_kwargs`: None
|
| 447 |
+
- `include_inputs_for_metrics`: False
|
| 448 |
+
- `include_for_metrics`: []
|
| 449 |
+
- `eval_do_concat_batches`: True
|
| 450 |
+
- `fp16_backend`: auto
|
| 451 |
+
- `push_to_hub_model_id`: None
|
| 452 |
+
- `push_to_hub_organization`: None
|
| 453 |
+
- `mp_parameters`:
|
| 454 |
+
- `auto_find_batch_size`: False
|
| 455 |
+
- `full_determinism`: False
|
| 456 |
+
- `torchdynamo`: None
|
| 457 |
+
- `ray_scope`: last
|
| 458 |
+
- `ddp_timeout`: 1800
|
| 459 |
+
- `torch_compile`: False
|
| 460 |
+
- `torch_compile_backend`: None
|
| 461 |
+
- `torch_compile_mode`: None
|
| 462 |
+
- `dispatch_batches`: None
|
| 463 |
+
- `split_batches`: None
|
| 464 |
+
- `include_tokens_per_second`: False
|
| 465 |
+
- `include_num_input_tokens_seen`: False
|
| 466 |
+
- `neftune_noise_alpha`: None
|
| 467 |
+
- `optim_target_modules`: None
|
| 468 |
+
- `batch_eval_metrics`: False
|
| 469 |
+
- `eval_on_start`: False
|
| 470 |
+
- `use_liger_kernel`: False
|
| 471 |
+
- `eval_use_gather_object`: False
|
| 472 |
+
- `average_tokens_across_devices`: False
|
| 473 |
+
- `prompts`: None
|
| 474 |
+
- `batch_sampler`: batch_sampler
|
| 475 |
+
- `multi_dataset_batch_sampler`: round_robin
|
| 476 |
+
|
| 477 |
+
</details>
|
| 478 |
+
|
| 479 |
+
### Training Logs
|
| 480 |
+
| Epoch | Step | Training Loss | dev_cosine_accuracy |
|
| 481 |
+
|:------:|:-----:|:-------------:|:-------------------:|
|
| 482 |
+
| 0 | 0 | - | 0.9943 |
|
| 483 |
+
| 0.0370 | 500 | 4.1105 | 0.9579 |
|
| 484 |
+
| 0.0740 | 1000 | 3.6849 | 0.9568 |
|
| 485 |
+
| 0.1110 | 1500 | 3.7002 | 0.9688 |
|
| 486 |
+
| 0.1480 | 2000 | 3.6835 | 0.9553 |
|
| 487 |
+
| 0.1850 | 2500 | 3.6524 | 0.9438 |
|
| 488 |
+
| 0.2220 | 3000 | 3.647 | 0.9512 |
|
| 489 |
+
| 0.2590 | 3500 | 3.6126 | 0.9459 |
|
| 490 |
+
| 0.2959 | 4000 | 3.5819 | 0.9468 |
|
| 491 |
+
| 0.3329 | 4500 | 3.608 | 0.9456 |
|
| 492 |
+
| 0.3699 | 5000 | 3.6183 | 0.9493 |
|
| 493 |
+
| 0.4069 | 5500 | 3.6224 | 0.9166 |
|
| 494 |
+
| 0.4439 | 6000 | 3.6505 | 0.9380 |
|
| 495 |
+
| 0.4809 | 6500 | 3.5647 | 0.9055 |
|
| 496 |
+
| 0.5179 | 7000 | 3.578 | 0.9109 |
|
| 497 |
+
| 0.5549 | 7500 | 3.5536 | 0.9250 |
|
| 498 |
+
| 0.5919 | 8000 | 3.5693 | 0.9340 |
|
| 499 |
+
| 0.6289 | 8500 | 3.5777 | 0.9241 |
|
| 500 |
+
| 0.6659 | 9000 | 3.5123 | 0.9003 |
|
| 501 |
+
| 0.7029 | 9500 | 3.5304 | 0.9094 |
|
| 502 |
+
| 0.7399 | 10000 | 3.5692 | 0.9126 |
|
| 503 |
+
| 0.7769 | 10500 | 3.5485 | 0.8999 |
|
| 504 |
+
| 0.8139 | 11000 | 3.5491 | 0.9145 |
|
| 505 |
+
| 0.8508 | 11500 | 3.5322 | 0.9135 |
|
| 506 |
+
| 0.8878 | 12000 | 3.5212 | 0.9034 |
|
| 507 |
+
| 0.9248 | 12500 | 3.5389 | 0.9024 |
|
| 508 |
+
| 0.9618 | 13000 | 3.5122 | 0.9002 |
|
| 509 |
+
| 0.9988 | 13500 | 3.5146 | 0.9018 |
|
| 510 |
+
| 1.0 | 13516 | - | 0.9025 |
|
| 511 |
+
|
| 512 |
+
|
| 513 |
+
### Framework Versions
|
| 514 |
+
- Python: 3.11.3
|
| 515 |
+
- Sentence Transformers: 3.4.1
|
| 516 |
+
- Transformers: 4.50.0
|
| 517 |
+
- PyTorch: 2.6.0+cu126
|
| 518 |
+
- Accelerate: 1.5.2
|
| 519 |
+
- Datasets: 3.4.1
|
| 520 |
+
- Tokenizers: 0.21.1
|
| 521 |
+
|
| 522 |
+
## Citation
|
| 523 |
+
|
| 524 |
+
### BibTeX
|
| 525 |
+
|
| 526 |
+
#### Sentence Transformers
|
| 527 |
+
```bibtex
|
| 528 |
+
@inproceedings{reimers-2019-sentence-bert,
|
| 529 |
+
title = "Sentence-BERT: Sentence Embeddings using Siamese BERT-Networks",
|
| 530 |
+
author = "Reimers, Nils and Gurevych, Iryna",
|
| 531 |
+
booktitle = "Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing",
|
| 532 |
+
month = "11",
|
| 533 |
+
year = "2019",
|
| 534 |
+
publisher = "Association for Computational Linguistics",
|
| 535 |
+
url = "https://arxiv.org/abs/1908.10084",
|
| 536 |
+
}
|
| 537 |
+
```
|
| 538 |
+
|
| 539 |
+
#### TripletLoss
|
| 540 |
+
```bibtex
|
| 541 |
+
@misc{hermans2017defense,
|
| 542 |
+
title={In Defense of the Triplet Loss for Person Re-Identification},
|
| 543 |
+
author={Alexander Hermans and Lucas Beyer and Bastian Leibe},
|
| 544 |
+
year={2017},
|
| 545 |
+
eprint={1703.07737},
|
| 546 |
+
archivePrefix={arXiv},
|
| 547 |
+
primaryClass={cs.CV}
|
| 548 |
+
}
|
| 549 |
+
```
|
| 550 |
+
|
| 551 |
+
<!--
|
| 552 |
+
## Glossary
|
| 553 |
+
|
| 554 |
+
*Clearly define terms in order to be accessible across audiences.*
|
| 555 |
+
-->
|
| 556 |
+
|
| 557 |
+
<!--
|
| 558 |
+
## Model Card Authors
|
| 559 |
+
|
| 560 |
+
*Lists the people who create the model card, providing recognition and accountability for the detailed work that goes into its construction.*
|
| 561 |
+
-->
|
| 562 |
+
|
| 563 |
+
<!--
|
| 564 |
+
## Model Card Contact
|
| 565 |
+
|
| 566 |
+
*Provides a way for people who have updates to the Model Card, suggestions, or questions, to contact the Model Card authors.*
|
| 567 |
+
-->
|
config.json
ADDED
|
@@ -0,0 +1,23 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"architectures": [
|
| 3 |
+
"MPNetModel"
|
| 4 |
+
],
|
| 5 |
+
"attention_probs_dropout_prob": 0.1,
|
| 6 |
+
"bos_token_id": 0,
|
| 7 |
+
"eos_token_id": 2,
|
| 8 |
+
"hidden_act": "gelu",
|
| 9 |
+
"hidden_dropout_prob": 0.1,
|
| 10 |
+
"hidden_size": 768,
|
| 11 |
+
"initializer_range": 0.02,
|
| 12 |
+
"intermediate_size": 3072,
|
| 13 |
+
"layer_norm_eps": 1e-05,
|
| 14 |
+
"max_position_embeddings": 514,
|
| 15 |
+
"model_type": "mpnet",
|
| 16 |
+
"num_attention_heads": 12,
|
| 17 |
+
"num_hidden_layers": 12,
|
| 18 |
+
"pad_token_id": 1,
|
| 19 |
+
"relative_attention_num_buckets": 32,
|
| 20 |
+
"torch_dtype": "float32",
|
| 21 |
+
"transformers_version": "4.50.0",
|
| 22 |
+
"vocab_size": 30527
|
| 23 |
+
}
|
config_sentence_transformers.json
ADDED
|
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"__version__": {
|
| 3 |
+
"sentence_transformers": "3.4.1",
|
| 4 |
+
"transformers": "4.50.0",
|
| 5 |
+
"pytorch": "2.6.0+cu126"
|
| 6 |
+
},
|
| 7 |
+
"prompts": {},
|
| 8 |
+
"default_prompt_name": null,
|
| 9 |
+
"similarity_fn_name": "cosine"
|
| 10 |
+
}
|
model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:39e978c7daacd439c379021f25f248fb12d351f17706c99897da554731699607
|
| 3 |
+
size 437967672
|
modules.json
ADDED
|
@@ -0,0 +1,20 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"idx": 0,
|
| 4 |
+
"name": "0",
|
| 5 |
+
"path": "",
|
| 6 |
+
"type": "sentence_transformers.models.Transformer"
|
| 7 |
+
},
|
| 8 |
+
{
|
| 9 |
+
"idx": 1,
|
| 10 |
+
"name": "1",
|
| 11 |
+
"path": "1_Pooling",
|
| 12 |
+
"type": "sentence_transformers.models.Pooling"
|
| 13 |
+
},
|
| 14 |
+
{
|
| 15 |
+
"idx": 2,
|
| 16 |
+
"name": "2",
|
| 17 |
+
"path": "2_Normalize",
|
| 18 |
+
"type": "sentence_transformers.models.Normalize"
|
| 19 |
+
}
|
| 20 |
+
]
|
sentence_bert_config.json
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"max_seq_length": 384,
|
| 3 |
+
"do_lower_case": false
|
| 4 |
+
}
|
special_tokens_map.json
ADDED
|
@@ -0,0 +1,51 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"bos_token": {
|
| 3 |
+
"content": "<s>",
|
| 4 |
+
"lstrip": false,
|
| 5 |
+
"normalized": false,
|
| 6 |
+
"rstrip": false,
|
| 7 |
+
"single_word": false
|
| 8 |
+
},
|
| 9 |
+
"cls_token": {
|
| 10 |
+
"content": "<s>",
|
| 11 |
+
"lstrip": false,
|
| 12 |
+
"normalized": false,
|
| 13 |
+
"rstrip": false,
|
| 14 |
+
"single_word": false
|
| 15 |
+
},
|
| 16 |
+
"eos_token": {
|
| 17 |
+
"content": "</s>",
|
| 18 |
+
"lstrip": false,
|
| 19 |
+
"normalized": false,
|
| 20 |
+
"rstrip": false,
|
| 21 |
+
"single_word": false
|
| 22 |
+
},
|
| 23 |
+
"mask_token": {
|
| 24 |
+
"content": "<mask>",
|
| 25 |
+
"lstrip": true,
|
| 26 |
+
"normalized": false,
|
| 27 |
+
"rstrip": false,
|
| 28 |
+
"single_word": false
|
| 29 |
+
},
|
| 30 |
+
"pad_token": {
|
| 31 |
+
"content": "<pad>",
|
| 32 |
+
"lstrip": false,
|
| 33 |
+
"normalized": false,
|
| 34 |
+
"rstrip": false,
|
| 35 |
+
"single_word": false
|
| 36 |
+
},
|
| 37 |
+
"sep_token": {
|
| 38 |
+
"content": "</s>",
|
| 39 |
+
"lstrip": false,
|
| 40 |
+
"normalized": false,
|
| 41 |
+
"rstrip": false,
|
| 42 |
+
"single_word": false
|
| 43 |
+
},
|
| 44 |
+
"unk_token": {
|
| 45 |
+
"content": "[UNK]",
|
| 46 |
+
"lstrip": false,
|
| 47 |
+
"normalized": false,
|
| 48 |
+
"rstrip": false,
|
| 49 |
+
"single_word": false
|
| 50 |
+
}
|
| 51 |
+
}
|
tokenizer.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
tokenizer_config.json
ADDED
|
@@ -0,0 +1,73 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"added_tokens_decoder": {
|
| 3 |
+
"0": {
|
| 4 |
+
"content": "<s>",
|
| 5 |
+
"lstrip": false,
|
| 6 |
+
"normalized": false,
|
| 7 |
+
"rstrip": false,
|
| 8 |
+
"single_word": false,
|
| 9 |
+
"special": true
|
| 10 |
+
},
|
| 11 |
+
"1": {
|
| 12 |
+
"content": "<pad>",
|
| 13 |
+
"lstrip": false,
|
| 14 |
+
"normalized": false,
|
| 15 |
+
"rstrip": false,
|
| 16 |
+
"single_word": false,
|
| 17 |
+
"special": true
|
| 18 |
+
},
|
| 19 |
+
"2": {
|
| 20 |
+
"content": "</s>",
|
| 21 |
+
"lstrip": false,
|
| 22 |
+
"normalized": false,
|
| 23 |
+
"rstrip": false,
|
| 24 |
+
"single_word": false,
|
| 25 |
+
"special": true
|
| 26 |
+
},
|
| 27 |
+
"3": {
|
| 28 |
+
"content": "<unk>",
|
| 29 |
+
"lstrip": false,
|
| 30 |
+
"normalized": true,
|
| 31 |
+
"rstrip": false,
|
| 32 |
+
"single_word": false,
|
| 33 |
+
"special": true
|
| 34 |
+
},
|
| 35 |
+
"104": {
|
| 36 |
+
"content": "[UNK]",
|
| 37 |
+
"lstrip": false,
|
| 38 |
+
"normalized": false,
|
| 39 |
+
"rstrip": false,
|
| 40 |
+
"single_word": false,
|
| 41 |
+
"special": true
|
| 42 |
+
},
|
| 43 |
+
"30526": {
|
| 44 |
+
"content": "<mask>",
|
| 45 |
+
"lstrip": true,
|
| 46 |
+
"normalized": false,
|
| 47 |
+
"rstrip": false,
|
| 48 |
+
"single_word": false,
|
| 49 |
+
"special": true
|
| 50 |
+
}
|
| 51 |
+
},
|
| 52 |
+
"bos_token": "<s>",
|
| 53 |
+
"clean_up_tokenization_spaces": false,
|
| 54 |
+
"cls_token": "<s>",
|
| 55 |
+
"do_lower_case": true,
|
| 56 |
+
"eos_token": "</s>",
|
| 57 |
+
"extra_special_tokens": {},
|
| 58 |
+
"mask_token": "<mask>",
|
| 59 |
+
"max_length": 128,
|
| 60 |
+
"model_max_length": 384,
|
| 61 |
+
"pad_to_multiple_of": null,
|
| 62 |
+
"pad_token": "<pad>",
|
| 63 |
+
"pad_token_type_id": 0,
|
| 64 |
+
"padding_side": "right",
|
| 65 |
+
"sep_token": "</s>",
|
| 66 |
+
"stride": 0,
|
| 67 |
+
"strip_accents": null,
|
| 68 |
+
"tokenize_chinese_chars": true,
|
| 69 |
+
"tokenizer_class": "MPNetTokenizer",
|
| 70 |
+
"truncation_side": "right",
|
| 71 |
+
"truncation_strategy": "longest_first",
|
| 72 |
+
"unk_token": "[UNK]"
|
| 73 |
+
}
|
vocab.txt
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|