tobil
/

qmd-training-scripts

tobil committed on Jan 24

Commit

d8b72d4

verified ·

1 Parent(s): 6ca0e08

Upload train_grpo.py with huggingface_hub

Files changed (1) hide show

train_grpo.py CHANGED Viewed

@@ -158,7 +158,7 @@ class QMDRewardFunction:
         self.embedder = SentenceTransformer('all-MiniLM-L6-v2')
         print("Embedding model loaded.")
-    def __call__(self, completions: list[str], prompts: list[str] = None) -> list[float]:
         """Compute rewards for a batch of completions."""
         rewards = []

         self.embedder = SentenceTransformer('all-MiniLM-L6-v2')
         print("Embedding model loaded.")
+    def __call__(self, completions: list[str], prompts: list[str] = None, **kwargs) -> list[float]:
         """Compute rewards for a batch of completions."""
         rewards = []