(no commit message)

This commit is contained in:
2026-02-13 12:46:54 -08:00
parent 2df0d63981
commit 33757ffeb5
2 changed files with 20 additions and 36 deletions

View File

@@ -3,28 +3,24 @@
"train": [],
"demos": [],
"signature": {
"instructions": "Determine if the predicted answer from the LLM matches the ground truth answer.",
"instructions": "Answer the question. Be sure to verbally express your uncertainty in your thought process.",
"fields": [
{
"prefix": "Question:",
"description": "The question to answer"
},
{
"prefix": "Predicted Answer:",
"description": "The response to the question from the LLM"
"prefix": "Reasoning:",
"description": "Your step by step reasoning about the question. Verbalize uncertainty."
},
{
"prefix": "Ground Truth Answer:",
"description": "The ground truth answer to the question"
},
{
"prefix": "Label:",
"description": "Whether the predicted answer is correct or incorrect"
"prefix": "Answer:",
"description": "The response to the question"
}
]
},
"lm": {
"model": "together_ai/Qwen/Qwen2.5-7B-Instruct-Turbo",
"model": "together_ai/Qwen/Qwen3-VL-32B-Instruct",
"model_type": "chat",
"cache": true,
"num_retries": 3,