(no commit message)

This commit is contained in:
2025-12-24 00:33:38 -08:00
parent 76508b0062
commit 3982ab9745
3 changed files with 7 additions and 7 deletions

View File

@@ -1,6 +1,6 @@
{ {
"model": "openai//models/checkpoint-5", "model": "openai//models/checkpoint-5",
"api_base": "https://modaic-ai--grpo-demo-serve.modal.run/v1", "api_base": "https://modaic-ai--grpo-demo-serve.modal.run/v1",
"max_tokens": 1024, "max_tokens": 10000,
"temperature": 0.7 "temperature": 2
} }

View File

@@ -4,8 +4,8 @@ from modaic import PrecompiledProgram, PrecompiledConfig
class CodeGeneratorConfig(PrecompiledConfig): class CodeGeneratorConfig(PrecompiledConfig):
model : str = "openai//models/checkpoint-5" model : str = "openai//models/checkpoint-5"
api_base : str = "https://modaic-ai--grpo-demo-serve.modal.run/v1" api_base : str = "https://modaic-ai--grpo-demo-serve.modal.run/v1"
max_tokens : int = 1024 max_tokens : int = 10000
temperature : float = 0.7 temperature : float = 2
class CodeGeneration(dspy.Signature): class CodeGeneration(dspy.Signature):
@@ -32,6 +32,6 @@ class CodeGenerator(PrecompiledProgram):
code_generator = CodeGenerator(CodeGeneratorConfig()) code_generator = CodeGenerator(CodeGeneratorConfig())
print(code_generator(query="Write a python function that returns the sum of two numbers.").code) print(code_generator(query="Write a python function that returns the sum of two numbers.").code)
code_generator.push_to_hub("modaic/code-generator-trl-grpo", with_code=True, tag="v1") code_generator.push_to_hub("modaic/code-generator-trl-grpo", with_code=True, tag="v2")

View File

@@ -24,8 +24,8 @@
"finetuning_model": null, "finetuning_model": null,
"launch_kwargs": {}, "launch_kwargs": {},
"train_kwargs": {}, "train_kwargs": {},
"temperature": 0.7, "temperature": 2,
"max_tokens": 1024, "max_tokens": 10000,
"api_base": "https://modaic-ai--grpo-demo-serve.modal.run/v1" "api_base": "https://modaic-ai--grpo-demo-serve.modal.run/v1"
} }
}, },