Commit cc6917f5 by nzy

step4: fix small bugs

parent 24071725
...@@ -100,7 +100,5 @@ if __name__ == "__main__": ...@@ -100,7 +100,5 @@ if __name__ == "__main__":
) )
groups = group_results(results) groups = group_results(results)
eval_results = [] eval_results = [score_pass_at_k(groups, k, orm_test_model) for k in range(16)]
for k in range(16):
eval_results.append(score_pass_at_k(groups, 1))
save_jsonl(eval_results, cfg["orm"][orm_test_model]["eval_result_path"]) save_jsonl(eval_results, cfg["orm"][orm_test_model]["eval_result_path"])
...@@ -70,7 +70,7 @@ def pass_at_k(groups, k): ...@@ -70,7 +70,7 @@ def pass_at_k(groups, k):
def score_pass_at_k(groups, k, strategy): def score_pass_at_k(groups, k, strategy):
result = {"strategy": f"{strategy} * pass@k={k}"} result = {"strategy": strategy, "k": k}
for difficulty, problems in groups.items(): for difficulty, problems in groups.items():
num_samples, num_correct = [], [] num_samples, num_correct = [], []
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment