Commit ·
8d0ac59
1
Parent(s): 1c00037
Update README.md
Browse files
README.md
CHANGED
|
@@ -79,7 +79,7 @@ tokens = tokenizer(question, response1,
|
|
| 79 | tokens.to(device)
| 80 |
| 81 | # Score the response
| 82 | - score =
| 83 |
| 84 | print(f"Question: {question} \n")
| 85 | print(f"Response 1: {response1} Score: {score:.3f}")
|
|
@@ -91,7 +91,7 @@ tokens = tokenizer(question, response2,
|
|
| 91 |
| 92 | tokens.to(device)
| 93 |
| 94 | - score =
| 95 |
| 96 | print(f"Response 2: {response2} Score: {score:.3f}")
| 97 | ```
|
|
|
|
| 79 | tokens.to(device)
| 80 |
| 81 | # Score the response
| 82 | + score = rewardModel(**tokens, alpha=10).item()
| 83 |
| 84 | print(f"Question: {question} \n")
| 85 | print(f"Response 1: {response1} Score: {score:.3f}")
|
|
|
|
| 91 |
| 92 | tokens.to(device)
| 93 |
| 94 | + score = rewardModel(**tokens, alpha=10).item()
| 95 |
| 96 | print(f"Response 2: {response2} Score: {score:.3f}")
| 97 | ```
|