Files
code-generator-trl-grpo/program.json
2025-12-24 00:30:21 -08:00

39 lines
913 B
JSON

{
"answer_question": {
"traces": [],
"train": [],
"demos": [],
"signature": {
"instructions": "Given the fields `query`, produce the fields `code`.",
"fields": [
{
"prefix": "Query:",
"description": "The query to generate code for."
},
{
"prefix": "Code:",
"description": "The code to generate as a python function."
}
]
},
"lm": {
"model": "openai//models/checkpoint-5",
"model_type": "chat",
"cache": true,
"num_retries": 3,
"finetuning_model": null,
"launch_kwargs": {},
"train_kwargs": {},
"temperature": 0.7,
"max_tokens": 1024,
"api_base": "https://modaic-ai--grpo-demo-serve.modal.run/v1"
}
},
"metadata": {
"dependency_versions": {
"python": "3.13",
"dspy": "3.0.4",
"cloudpickle": "3.1"
}
}
}