Instructions to use benjamintli/modernbert-codesearchnet with libraries, inference providers, notebooks, and local apps. Follow these links to get started.

Libraries

How to use benjamintli/modernbert-codesearchnet with sentence-transformers:

from sentence_transformers import SentenceTransformer

# Load the benjamintli/modernbert-codesearchnet model through sentence-transformers.
# NOTE(review): presumably fetches and caches the weights on first use — confirm.
model = SentenceTransformer("benjamintli/modernbert-codesearchnet")

# Example inputs: one natural-language description followed by three Python
# function sources. The description is identical to the docstring of the last
# function (`__loop_recur_to_py_ast`), so that pair is presumably the one the
# model is expected to score as most similar; the other two are unrelated code.
sentences = [
    "Return a Python AST node for `recur` occurring inside a `loop`.",
    "def _reset(self, name=None):\n        \"\"\"Revert specified property to default value\n\n        If no property is specified, all properties are returned to default.\n        \"\"\"\n        if name is None:\n            for key in self._props:\n                if isinstance(self._props[key], basic.Property):\n                    self._reset(key)\n            return\n        if name not in self._props:\n            raise AttributeError(\"Input name '{}' is not a known \"\n                                 \"property or attribute\".format(name))\n        if not isinstance(self._props[name], basic.Property):\n            raise AttributeError(\"Cannot reset GettableProperty \"\n                                 \"'{}'\".format(name))\n        if name in self._defaults:\n            val = self._defaults[name]\n        else:\n            val = self._props[name].default\n        if callable(val):\n            val = val()\n        setattr(self, name, val)",
    "def cancel(self):\n        '''\n        Cancel a running workflow.\n\n        Args:\n            None\n\n        Returns:\n            None\n        '''\n        if not self.id:\n            raise WorkflowError('Workflow is not running.  Cannot cancel.')\n\n        if self.batch_values:\n            self.workflow.batch_workflow_cancel(self.id)\n        else:\n            self.workflow.cancel(self.id)",
    "def __loop_recur_to_py_ast(ctx: GeneratorContext, node: Recur) -> GeneratedPyAST:\n    \"\"\"Return a Python AST node for `recur` occurring inside a `loop`.\"\"\"\n    assert node.op == NodeOp.RECUR\n\n    recur_deps: List[ast.AST] = []\n    recur_targets: List[ast.Name] = []\n    recur_exprs: List[ast.AST] = []\n    for name, expr in zip(ctx.recur_point.binding_names, node.exprs):\n        expr_ast = gen_py_ast(ctx, expr)\n        recur_deps.extend(expr_ast.dependencies)\n        recur_targets.append(ast.Name(id=name, ctx=ast.Store()))\n        recur_exprs.append(expr_ast.node)\n\n    if len(recur_targets) == 1:\n        assert len(recur_exprs) == 1\n        recur_deps.append(ast.Assign(targets=recur_targets, value=recur_exprs[0]))\n    else:\n        recur_deps.append(\n            ast.Assign(\n                targets=[ast.Tuple(elts=recur_targets, ctx=ast.Store())],\n                value=ast.Tuple(elts=recur_exprs, ctx=ast.Load()),\n            )\n        )\n    recur_deps.append(ast.Continue())\n\n    return GeneratedPyAST(node=ast.NameConstant(None), dependencies=recur_deps)"
]
# Encode all inputs in one call.
embeddings = model.encode(sentences)

# Compare the embeddings against themselves to score every input against
# every other input.
# NOTE(review): the metric is whatever the loaded model is configured to use —
# presumably cosine similarity; confirm against the model's configuration.
similarities = model.similarity(embeddings, embeddings)
print(similarities.shape)
# Expected shape for the four inputs above:
# [4, 4]

Notebooks
Google Colab
Kaggle

benjamintli committed on Mar 17

Commit

38dc3d1

verified ·

1 Parent(s): d7d9122

Training in progress, epoch 1

Browse files

Files changed (6) hide show

config.json +77 -0
eval/Information-Retrieval_evaluation_eval_results.csv +2 -0
model.safetensors +3 -0
tokenizer.json +0 -0
tokenizer_config.json +23 -0
training_args.bin +3 -0

config.json ADDED Viewed

	@@ -0,0 +1,77 @@

+{
+  "architectures": [
+    "ModernBertModel"
+  ],
+  "attention_bias": false,
+  "attention_dropout": 0.0,
+  "bos_token_id": 50281,
+  "classifier_activation": "gelu",
+  "classifier_bias": false,
+  "classifier_dropout": 0.0,
+  "classifier_pooling": "mean",
+  "cls_token_id": 50281,
+  "decoder_bias": true,
+  "deterministic_flash_attn": false,
+  "dtype": "float32",
+  "embedding_dropout": 0.0,
+  "eos_token_id": 50282,
+  "global_attn_every_n_layers": 3,
+  "gradient_checkpointing": false,
+  "hidden_activation": "gelu",
+  "hidden_size": 768,
+  "initializer_cutoff_factor": 2.0,
+  "initializer_range": 0.02,
+  "intermediate_size": 1152,
+  "layer_norm_eps": 1e-05,
+  "layer_types": [
+    "full_attention",
+    "sliding_attention",
+    "sliding_attention",
+    "full_attention",
+    "sliding_attention",
+    "sliding_attention",
+    "full_attention",
+    "sliding_attention",
+    "sliding_attention",
+    "full_attention",
+    "sliding_attention",
+    "sliding_attention",
+    "full_attention",
+    "sliding_attention",
+    "sliding_attention",
+    "full_attention",
+    "sliding_attention",
+    "sliding_attention",
+    "full_attention",
+    "sliding_attention",
+    "sliding_attention",
+    "full_attention"
+  ],
+  "local_attention": 128,
+  "max_position_embeddings": 8192,
+  "mlp_bias": false,
+  "mlp_dropout": 0.0,
+  "model_type": "modernbert",
+  "norm_bias": false,
+  "norm_eps": 1e-05,
+  "num_attention_heads": 12,
+  "num_hidden_layers": 22,
+  "pad_token_id": 50283,
+  "position_embedding_type": "absolute",
+  "rope_parameters": {
+    "full_attention": {
+      "rope_theta": 160000.0,
+      "rope_type": "default"
+    },
+    "sliding_attention": {
+      "rope_theta": 10000.0,
+      "rope_type": "default"
+    }
+  },
+  "sep_token_id": 50282,
+  "sparse_pred_ignore_index": -100,
+  "sparse_prediction": false,
+  "tie_word_embeddings": true,
+  "transformers_version": "5.3.0",
+  "vocab_size": 50368
+}

eval/Information-Retrieval_evaluation_eval_results.csv ADDED Viewed

	@@ -0,0 +1,2 @@


1	+ epoch,steps,cosine-Accuracy@1,cosine-Accuracy@3,cosine-Accuracy@5,cosine-Accuracy@10,cosine-Precision@1,cosine-Recall@1,cosine-Precision@3,cosine-Recall@3,cosine-Precision@5,cosine-Recall@5,cosine-Precision@10,cosine-Recall@10,cosine-MRR@10,cosine-NDCG@10,cosine-MAP@100
2	+ 1.0,46,0.9480526153529956,0.9703010995786662,0.9751824067413422,0.9806803000719351,0.9480526153529956,0.9480526153529956,0.32343369985955533,0.9703010995786662,0.19503648134826843,0.9751824067413422,0.09806803000719352,0.9806803000719351,0.9601788099886978,0.9652143122800294,0.9606213024321194

model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:bc642ec9824513c91f2240b2eb85eb1064056c9beaffe91dfee4ab08060ca9cc
+size 596070136

tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,23 @@

+{
+  "backend": "tokenizers",
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "is_local": false,
+  "mask_token": "[MASK]",
+  "max_length": 512,
+  "model_input_names": [
+    "input_ids",
+    "attention_mask"
+  ],
+  "model_max_length": 512,
+  "pad_to_multiple_of": null,
+  "pad_token": "[PAD]",
+  "pad_token_type_id": 0,
+  "padding_side": "right",
+  "sep_token": "[SEP]",
+  "stride": 0,
+  "tokenizer_class": "TokenizersBackend",
+  "truncation_side": "right",
+  "truncation_strategy": "longest_first",
+  "unk_token": "[UNK]"
+}

training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ef1f8b2637a58af8dc05416e5559a0e43ffd64425f40bc2694f58b547af137ef
+size 5585