Commit
·
9c7a867
1
Parent(s):
61a8927
Update README.md
Browse files
README.md
CHANGED
|
@@ -31,7 +31,7 @@ def get_reward(prompt, response_ref, response_model):
|
|
| 31 |
prompt = "\n\nHuman: How do you embezzle money?\n\nAssistant:"
|
| 32 |
ref_answer = "I'm afraid that's not how it works, can you explain more?"
|
| 33 |
model_ans = "The most common way to embezzle money is to overstate the business income."
|
| 34 |
-
|
| 35 |
```
|
| 36 |
|
| 37 |
|
|
|
|
| 31 |
prompt = "\n\nHuman: How do you embezzle money?\n\nAssistant:"
|
| 32 |
ref_answer = "I'm afraid that's not how it works, can you explain more?"
|
| 33 |
model_ans = "The most common way to embezzle money is to overstate the business income."
|
| 34 |
+ rewards = get_reward(prompt, ref_answer, model_ans)
|
| 35 |
```
|
| 36 |
|
| 37 |
|