Tom Aarsen committed
Commit d1cf1c1 · 1 Parent(s): 0b0237d

Update code snippets, MRL
Files changed (1): README.md (+42 −18)
````diff
@@ -32,7 +32,7 @@ tags:
 - Model Size: 0.5B
 - Embedding Dimension: 896
 - Max Input Tokens: 32k
-- MLR: 896 512 256 128 64
+- MRL dimensions: 896, 512, 256, 128, and 64
 - Attn: Bidirectional attention
 - Pooling: Mean pooling
 
@@ -93,20 +93,32 @@ Then you can use the model like this:
 
 ```python
 from sentence_transformers import SentenceTransformer
-
-sentences = ["This is an example sentence", "Each sentence is converted"]
-
-model = SentenceTransformer("{MODEL_NAME_OR_PATH}", trust_remote_code=True, model_kwargs={"torch_dtype": torch.bfloat16, "attn_implementation": "flash_attention_2"})
+import torch
+
+model = SentenceTransformer(
+    "KaLM-Embedding/KaLM-embedding-multilingual-mini-instruct-v2.5",
+    trust_remote_code=True,
+    model_kwargs={
+        "torch_dtype": torch.bfloat16,
+        "attn_implementation": "flash_attention_2",  # Optional
+    },
+)
 model.max_seq_length = 512
 
+sentences = ["This is an example sentence", "Each sentence is converted"]
 embeddings = model.encode(
     sentences,
     normalize_embeddings=True,
     batch_size=256,
-    show_progress_bar=True
-)
+    show_progress_bar=True,
+)
 print(embeddings)
+'''
+[[-0.01043701 -0.02172852  0.0100708  ... -0.02807617  0.00157166
+  -0.03637695]
+ [-0.00424194  0.02966309  0.03686523 ... -0.02587891  0.01953125
+  -0.00125122]]
+'''
 ```
 
 We add task instructions for asymmetric tasks: retrieval, reranking, classification, and clustering.
@@ -115,22 +127,34 @@ If you want to add task instructions to the query, you can use the model like this:
 
 ```python
 from sentence_transformers import SentenceTransformer
-
-sentences = ["This is an example sentence", "Each sentence is converted"]
-
-model = SentenceTransformer("{MODEL_NAME_OR_PATH}", trust_remote_code=True, model_kwargs={"torch_dtype": torch.bfloat16, "attn_implementation": "flash_attention_2"})
+import torch
+
+model = SentenceTransformer(
+    "KaLM-Embedding/KaLM-embedding-multilingual-mini-instruct-v2.5",
+    trust_remote_code=True,
+    model_kwargs={
+        "torch_dtype": torch.bfloat16,
+        "attn_implementation": "flash_attention_2",  # Optional
+    },
+)
 model.max_seq_length = 512
 
-prompt = "Instruct: Classifying the category of french news. \n Query: "
+sentences = ["This is an example sentence", "Each sentence is converted"]
+prompt = "Instruct: Classifying the category of french news.\nQuery:"
 embeddings = model.encode(
     sentences,
     prompt=prompt,
     normalize_embeddings=True,
     batch_size=256,
-    show_progress_bar=True
-)
+    show_progress_bar=True,
+)
 print(embeddings)
+'''
+[[-0.01867676  0.02319336  0.00280762 ... -0.02075195  0.00196838
+  -0.0703125 ]
+ [-0.0067749   0.03491211  0.01434326 ... -0.0043335   0.00509644
+  -0.04174805]]
+'''
 ```
 
 ### vllm support
````
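
The "MRL dimensions" line this commit corrects refers to Matryoshka Representation Learning: the 896-dimensional embedding can be truncated to a prefix (512, 256, 128, or 64 dimensions) and re-normalized. A minimal numpy sketch of that post-processing; the `truncate_embeddings` helper name is ours, not part of the model's API, and the toy vectors stand in for real model output:

```python
import numpy as np

def truncate_embeddings(embeddings: np.ndarray, dim: int) -> np.ndarray:
    """Keep the first `dim` dimensions and re-normalize each row to unit length."""
    truncated = embeddings[..., :dim]
    norms = np.linalg.norm(truncated, axis=-1, keepdims=True)
    return truncated / norms

# Toy full-size embeddings (the real model outputs 896 dimensions).
rng = np.random.default_rng(0)
full = rng.normal(size=(2, 896))
full /= np.linalg.norm(full, axis=-1, keepdims=True)

small = truncate_embeddings(full, 128)
print(small.shape)  # (2, 128)
```

Because MRL-trained models pack the most information into the leading dimensions, cosine similarity on the truncated vectors stays close to the full-size similarity at a fraction of the storage cost.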
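
In the second snippet, `encode(..., prompt=prompt)` has sentence-transformers prepend the instruction to each input before tokenization; roughly, it is equivalent to encoding the concatenated strings yourself. A small sketch of that formatting (string handling only, no model involved):

```python
prompt = "Instruct: Classifying the category of french news.\nQuery:"
sentences = ["This is an example sentence", "Each sentence is converted"]

# encode(sentences, prompt=prompt) roughly encodes these concatenated strings:
formatted = [prompt + s for s in sentences]
print(formatted[0])
```

Only the query side carries the instruction for asymmetric tasks; documents are encoded without a prompt.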
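
The card lists mean pooling as the aggregation step. A sketch of masked mean pooling in numpy, assuming a `(batch, seq, hidden)` array of token embeddings and a 0/1 attention mask, so padding tokens do not dilute the average; the shapes and helper name are illustrative, not the model's internals:

```python
import numpy as np

def mean_pool(token_embeddings: np.ndarray, attention_mask: np.ndarray) -> np.ndarray:
    """Average token embeddings, counting only non-padding positions."""
    mask = attention_mask[..., None].astype(token_embeddings.dtype)  # (batch, seq, 1)
    summed = (token_embeddings * mask).sum(axis=1)                   # (batch, hidden)
    counts = np.clip(mask.sum(axis=1), 1e-9, None)                   # avoid divide-by-zero
    return summed / counts

hidden = np.arange(24, dtype=np.float64).reshape(2, 3, 4)  # toy token embeddings
mask = np.array([[1, 1, 0], [1, 1, 1]])                    # first sequence has one pad token
pooled = mean_pool(hidden, mask)
print(pooled.shape)  # (2, 4)
```

Combined with the bidirectional attention noted in the card, every non-padding token contributes equally to the sentence embedding.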