server-inference push reward_bench_2

2026-04-23 23:06:51 -07:00
parent e873025330
commit c231ff35a8
3 changed files with 108 additions and 1 deletions
--- a/program.json
+++ b/program.json
@@ -0,0 +1,48 @@
+{
+  "traces": [],
+  "train": [],
+  "demos": [],
+  "signature": {
+    "instructions": "Reason step-by-step to determine which response is better for the given prompt.\nAs you reason, note any uncertainties, ambiguities, and gaps \u2014 both in how the instructions apply to the task at hand and in whether you have the knowledge needed to solve it. Be honest in your reasoning when you are unsure about your answer. Your reasoning must lead directly to the better response (A or B).",
+    "fields": [
+      {
+        "prefix": "Prompt:",
+        "description": "The prompt provided."
+      },
+      {
+        "prefix": "Response A:",
+        "description": "The first response option."
+      },
+      {
+        "prefix": "Response B:",
+        "description": "The second response option."
+      },
+      {
+        "prefix": "Reasoning:",
+        "description": "Step-by-step reasoning, including uncertainty, ambiguity, or gaps in your thought process when relevant."
+      },
+      {
+        "prefix": "Label:",
+        "description": "The label of the better response ('A' or 'B')."
+      }
+    ]
+  },
+  "lm": {
+    "model": "together_ai/Qwen/Qwen2.5-7B-Instruct-Turbo",
+    "model_type": "chat",
+    "cache": true,
+    "num_retries": 3,
+    "finetuning_model": null,
+    "launch_kwargs": {},
+    "train_kwargs": {},
+    "temperature": null,
+    "max_tokens": null
+  },
+  "metadata": {
+    "dependency_versions": {
+      "python": "3.11",
+      "dspy": "3.1.3",
+      "cloudpickle": "3.1"
+    }
+  }
+}