mirror of
https://github.com/GammaTauAI/reflexion-human-eval
synced 2024-11-16 00:12:59 +00:00
cleanup
This commit is contained in:
parent
f2f507f7fd
commit
e88370e0f1
@ -34,8 +34,10 @@ def run_reflexion(
|
||||
|
||||
# if solved, exit early
|
||||
if is_passing:
|
||||
is_solved = True
|
||||
num_success += 1
|
||||
is_passing = exe.evaluate(
|
||||
item["entry_point"], cur_func_impl, item["test"], timeout=10)
|
||||
is_solved = is_passing
|
||||
num_success += int(is_passing)
|
||||
break
|
||||
|
||||
# use self-reflection to iteratively improve
|
||||
|
@ -74,7 +74,7 @@ def run_reflexion_ucs(
|
||||
# if solved, exit early
|
||||
if is_passing:
|
||||
debug_print("solved at first attempt")
|
||||
is_solved = exe.evaluate(item["prompt"], cur_func_impl, item["test"])
|
||||
is_solved = exe.evaluate(item["entry_point"], cur_func_impl, item["test"])
|
||||
num_success += 1 if is_solved else 0
|
||||
break
|
||||
|
||||
|
Loading…
Reference in New Issue
Block a user