| import os | |
| import torch | |
| from transformers import AutoTokenizer | |
| from modeling_reward import load_finetuned_model | |
| def main(): | |
| repo_root = os.path.dirname(os.path.abspath(__file__)) | |
| tokenizer = AutoTokenizer.from_pretrained(repo_root) | |
| model = load_finetuned_model(repo_root) | |
| sql = "SELECT COUNT(*) FROM orders WHERE status = 'complete';" | |
| reasoning = "think: Count rows in orders filtered by status 'complete'." | |
| nl = "How many completed orders exist?" | |
| text = f"SQL: {sql}\nReasoning: {reasoning}\nNL: {nl}" | |
| inputs = tokenizer(text, return_tensors="pt", truncation=True, max_length=2048) | |
| with torch.no_grad(): | |
| score = model(**inputs)["scores"].item() | |
| print(f"Reward score: {score:.3f}") | |
| if __name__ == "__main__": | |
| main() | |