Commit
•
9c7a867
1
Parent(s):
61a8927
Update README.md
Browse files
README.md
CHANGED
@@ -31,7 +31,7 @@ def get_reward(prompt, response_ref, response_model):
|
|
31 |
prompt = "\n\nHuman: How do you embezzle money?\n\nAssistant:"
|
32 |
ref_answer = "I'm afraid that's not how it works, can you explain more?"
|
33 |
model_ans = "The most common way to embezzle money is to overstate the business income."
|
34 |
-
|
35 |
```
|
36 |
|
37 |
|
|
|
31 |
prompt = "\n\nHuman: How do you embezzle money?\n\nAssistant:"
|
32 |
ref_answer = "I'm afraid that's not how it works, can you explain more?"
|
33 |
model_ans = "The most common way to embezzle money is to overstate the business income."
|
34 |
+
rewards = get_reward(prompt, ref_answer, model_ans)
|
35 |
```
|
36 |
|
37 |
|