# get_rubric.py

  1. def get_rubric():
  2. prompt = (
  3. "Read this scoring rubric carefully and follow the instructions precisely:\n"
  4. )
  5. prompt += (
  6. "A score of 5 means that model's value is the same as the gold answer's id.\n"
  7. )
  8. prompt += "A score of 4 means that the model's answer is the same or a paraphrase of the gold answer, but the value may not be an exact match.\n"
  9. prompt += "A score of 3 means that the model's answer is similar as the gold answer's description, but the value may be wrong. Both answers may indicate that revenue is increased but the gold says 12 percent and the model say 50 million USD.\n"
  10. prompt += "A score of 2 means that the model's answer is not similar to the gold answer, but the answer is plausible.\n"
  11. prompt += "A score of 1 means that the model's answer is not similar to the gold answer, and the answer doesn't make sense.\n"
  12. prompt += "Assign a 5 for a correct value even if other fields are missing.\n"
  13. return prompt