2 Commits
v1 ... v2.0.1

Author SHA1 Message Date
fb1efa3b4a (no commit message) 2025-12-24 00:34:33 -08:00
3982ab9745 (no commit message) 2025-12-24 00:33:38 -08:00
3 changed files with 4 additions and 4 deletions

View File

@@ -1,6 +1,6 @@
{ {
"model": "openai//models/checkpoint-5", "model": "openai//models/checkpoint-5",
"api_base": "https://modaic-ai--grpo-demo-serve.modal.run/v1", "api_base": "https://modaic-ai--grpo-demo-serve.modal.run/v1",
"max_tokens": 1024, "max_tokens": 10000,
"temperature": 0.7 "temperature": 0.7
} }

View File

@@ -4,7 +4,7 @@ from modaic import PrecompiledProgram, PrecompiledConfig
class CodeGeneratorConfig(PrecompiledConfig): class CodeGeneratorConfig(PrecompiledConfig):
model : str = "openai//models/checkpoint-5" model : str = "openai//models/checkpoint-5"
api_base : str = "https://modaic-ai--grpo-demo-serve.modal.run/v1" api_base : str = "https://modaic-ai--grpo-demo-serve.modal.run/v1"
max_tokens : int = 1024 max_tokens : int = 10000
temperature : float = 0.7 temperature : float = 0.7
@@ -32,6 +32,6 @@ class CodeGenerator(PrecompiledProgram):
code_generator = CodeGenerator(CodeGeneratorConfig()) code_generator = CodeGenerator(CodeGeneratorConfig())
print(code_generator(query="Write a python function that returns the sum of two numbers.").code) print(code_generator(query="Write a python function that returns the sum of two numbers.").code)
code_generator.push_to_hub("modaic/code-generator-trl-grpo", with_code=True, tag="v1") code_generator.push_to_hub("modaic/code-generator-trl-grpo", with_code=True, tag="v2.0.1")

View File

@@ -25,7 +25,7 @@
"launch_kwargs": {}, "launch_kwargs": {},
"train_kwargs": {}, "train_kwargs": {},
"temperature": 0.7, "temperature": 0.7,
"max_tokens": 1024, "max_tokens": 10000,
"api_base": "https://modaic-ai--grpo-demo-serve.modal.run/v1" "api_base": "https://modaic-ai--grpo-demo-serve.modal.run/v1"
} }
}, },