This commit is contained in:
2025-10-21 14:13:38 -04:00
parent a413e05023
commit 7b1535f925
3 changed files with 108 additions and 6 deletions

View File

@@ -85,7 +85,6 @@ class AttackProgram(dspy.Module):
critique = critique.critique
return self.try_attacks[-1](harmful_intent=harmful_intent, critique=critique)
def metric(
self,
intent: str | dspy.Example,
@@ -100,7 +99,10 @@ class AttackProgram(dspy.Module):
target_client,
self.target_model_name,
attack_prompt,
inference_params={"max_tokens": self.max_attack_tokens, "temperature": self.temperature},
inference_params={
"max_tokens": self.max_attack_tokens,
"temperature": self.temperature,
},
)
if use_verdict:
score = verdict_judge(intent, response)[0] / 5
@@ -110,7 +112,6 @@ class AttackProgram(dspy.Module):
score = round(score)
return score
def eval_program(self, prog, eval_set):
evaluate = Evaluate(
devset=eval_set,