File size: 448 Bytes
a1382fa
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
--- a/benchmarks/validate.py
+++ b/benchmarks/validate.py
@@ -107,7 +107,7 @@
 def make_mock(task_name):
     mock = MockLLMBackend()
     t = TASKS[task_name]
     def actor(msgs):
         text = " ".join(m.content for m in msgs)
-        has_h = "Learned Strategies" in text and "None yet" not in text
+        has_h = ("Learned Strategies" in text or "When:" in text) and "None yet" not in text
         code = t["good"] if has_h else t["bad"]