From c231ff35a8bb8f7b4c6799f3751453be2789edb1 Mon Sep 17 00:00:00 2001
From: Tyrin Todd <tyrin@modaic.dev>
Date: Thu, 23 Apr 2026 23:06:51 -0700
Subject: [PATCH] server-inference push reward_bench_2

---
 README.md    |  5 ++++-
 config.json  | 56 ++++++++++++++++++++++++++++++++++++++++++++++++++++
 program.json | 48 ++++++++++++++++++++++++++++++++++++++++++++
 3 files changed, 108 insertions(+), 1 deletion(-)
 create mode 100644 config.json
 create mode 100644 program.json

diff --git a/README.md b/README.md
index 4756645..b0d7062 100644
--- a/README.md
+++ b/README.md
@@ -1,2 +1,5 @@
-# reward_bench_2
+---
+{}
+---
 
+# reward_bench_2
\ No newline at end of file
diff --git a/config.json b/config.json
new file mode 100644
index 0000000..56de063
--- /dev/null
+++ b/config.json
@@ -0,0 +1,56 @@
+{
+  "model": null,
+  "signature": {
+    "description": "Reason step-by-step to determine which response is better for the given prompt.\nAs you reason, note any uncertainties, ambiguities, and gaps \u2014 both in how the instructions apply to the task at hand and in whether you have the knowledge needed to solve it. Be honest in your reasoning when you are unsure about your answer. Your reasoning must lead directly to the better response (A or B).",
+    "properties": {
+      "prompt": {
+        "__dspy_field_type": "input",
+        "desc": "The prompt provided.",
+        "prefix": "Prompt:",
+        "title": "Prompt",
+        "type": "string"
+      },
+      "response_A": {
+        "__dspy_field_type": "input",
+        "desc": "The first response option.",
+        "prefix": "Response A:",
+        "title": "Response A",
+        "type": "string"
+      },
+      "response_B": {
+        "__dspy_field_type": "input",
+        "desc": "The second response option.",
+        "prefix": "Response B:",
+        "title": "Response B",
+        "type": "string"
+      },
+      "reasoning": {
+        "__dspy_field_type": "output",
+        "desc": "Step-by-step reasoning, including uncertainty or ambiguity in your thought process when relevant.",
+        "prefix": "Reasoning:",
+        "title": "Reasoning",
+        "type": "string"
+      },
+      "label": {
+        "__dspy_field_type": "output",
+        "desc": "The label of the better response ('A' or 'B').",
+        "enum": [
+          "A",
+          "B"
+        ],
+        "prefix": "Label:",
+        "title": "Label",
+        "type": "string"
+      }
+    },
+    "required": [
+      "prompt",
+      "response_A",
+      "response_B",
+      "reasoning",
+      "label"
+    ],
+    "title": "PromptPreferenceJudgeSig",
+    "type": "object"
+  }
+}
\ No newline at end of file
diff --git a/program.json b/program.json
new file mode 100644
index 0000000..b6b76df
--- /dev/null
+++ b/program.json
@@ -0,0 +1,48 @@
+{
+  "traces": [],
+  "train": [],
+  "demos": [],
+  "signature": {
+    "instructions": "Reason step-by-step to determine which response is better for the given prompt.\nAs you reason, note any uncertainties, ambiguities, and gaps \u2014 both in how the instructions apply to the task at hand and in whether you have the knowledge needed to solve it. Be honest in your reasoning when you are unsure about your answer. Your reasoning must lead directly to the better response (A or B).",
+    "fields": [
+      {
+        "prefix": "Prompt:",
+        "description": "The prompt provided."
+      },
+      {
+        "prefix": "Response A:",
+        "description": "The first response option."
+      },
+      {
+        "prefix": "Response B:",
+        "description": "The second response option."
+      },
+      {
+        "prefix": "Reasoning:",
+        "description": "Step-by-step reasoning, including uncertainty or ambiguity in your thought process when relevant."
+      },
+      {
+        "prefix": "Label:",
+        "description": "The label of the better response ('A' or 'B')."
+      }
+    ]
+  },
+  "lm": {
+    "model": "together_ai/Qwen/Qwen2.5-7B-Instruct-Turbo",
+    "model_type": "chat",
+    "cache": true,
+    "num_retries": 3,
+    "finetuning_model": null,
+    "launch_kwargs": {},
+    "train_kwargs": {},
+    "temperature": null,
+    "max_tokens": null
+  },
+  "metadata": {
+    "dependency_versions": {
+      "python": "3.11",
+      "dspy": "3.1.3",
+      "cloudpickle": "3.1"
+    }
+  }
+}
\ No newline at end of file