(no commit message)
This commit is contained in:
@@ -2,5 +2,5 @@
|
||||
"model": "openai//models/checkpoint-5",
|
||||
"api_base": "https://modaic-ai--grpo-demo-serve.modal.run/v1",
|
||||
"max_tokens": 10000,
|
||||
"temperature": 2
|
||||
"temperature": 0.7
|
||||
}
|
||||
4
main.py
4
main.py
@@ -5,7 +5,7 @@ class CodeGeneratorConfig(PrecompiledConfig):
|
||||
model : str = "openai//models/checkpoint-5"
|
||||
api_base : str = "https://modaic-ai--grpo-demo-serve.modal.run/v1"
|
||||
max_tokens : int = 10000
|
||||
temperature : float = 2
|
||||
temperature : float = 0.7
|
||||
|
||||
|
||||
class CodeGeneration(dspy.Signature):
|
||||
@@ -32,6 +32,6 @@ class CodeGenerator(PrecompiledProgram):
|
||||
|
||||
code_generator = CodeGenerator(CodeGeneratorConfig())
|
||||
print(code_generator(query="Write a python function that returns the sum of two numbers.").code)
|
||||
code_generator.push_to_hub("modaic/code-generator-trl-grpo", with_code=True, tag="v2")
|
||||
code_generator.push_to_hub("modaic/code-generator-trl-grpo", with_code=True, tag="v2.0.1")
|
||||
|
||||
|
||||
@@ -24,7 +24,7 @@
|
||||
"finetuning_model": null,
|
||||
"launch_kwargs": {},
|
||||
"train_kwargs": {},
|
||||
"temperature": 2,
|
||||
"temperature": 0.7,
|
||||
"max_tokens": 10000,
|
||||
"api_base": "https://modaic-ai--grpo-demo-serve.modal.run/v1"
|
||||
}
|
||||
|
||||
Reference in New Issue
Block a user