Commit a611bcf1 by nanziyuan

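fix bugs: select the 4 highest-similarity pairs per task (sort descending) and add the preference-pair selection step to the run script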

parent f3dd6691
...@@ -98,20 +98,13 @@ if __name__ == "__main__": ...@@ -98,20 +98,13 @@ if __name__ == "__main__":
# select pairs # select pairs
ds = defaultdict(dict)
for item in dataset:
ds[item["task_id"]][item["solution_id"]] = item
sorted_pairinfo = sorted(pairinfo, key=lambda x: x["similarity"])
task_groups = defaultdict(list) task_groups = defaultdict(list)
for item in pairinfo: for item in pairinfo:
task_groups[item["task_id"]].append(item) task_groups[item["task_id"]].append(item)
# Step 2: Select the 4 pairs with the smallest score for each task
selected_pairs = [] selected_pairs = []
for task, items in task_groups.items(): for task, items in task_groups.items():
# Sort items for this task by score and select the top 4 sorted_items = sorted(items, key=lambda x: x["similarity"], reverse=True)[:4]
sorted_items = sorted(items, key=lambda x: x["similarity"])[:4]
selected_pairs.extend(sorted_items) selected_pairs.extend(sorted_items)
save_jsonl(selected_pairs, args.output) save_jsonl(selected_pairs, args.output)
...@@ -4,15 +4,22 @@ model="/lustre/S/huangdi/open_for_out/models/Qwen2.5-Coder-7B-Instruct/" ...@@ -4,15 +4,22 @@ model="/lustre/S/huangdi/open_for_out/models/Qwen2.5-Coder-7B-Instruct/"
project="/lustre/S/nanziyuan/projects/ccc" project="/lustre/S/nanziyuan/projects/ccc"
modelname="qwen25_coder_inst" modelname="qwen25_coder_inst"
# APPS trainset="${project}/data/train/${modelname}-apps-train.jsonl"
# CUDA_VISIBLE_DEVICES=0,1,2,3 \ testset="${project}/data/test/${modelname}-apps-test.jsonl"
python -m codecritic.cli.gen_dataset \
--model ${model} \ train_selected_pairs="${project}/data/train/${modelname}-apps-train-selected_pairs.jsonl"
--apps /lustre/S/nanziyuan/datasets/apps/ \
--train "${project}/data/train/${modelname}-apps-train.jsonl" \ export CUDA_VISIBLE_DEVICES=0,1,2,3
--test "${project}/data/test/${modelname}-apps-test.jsonl"
## Sampling
# HumanEval & MBPP ## APPS
# python -m codecritic.cli.gen_dataset \
# --model ${model} \
# --apps /lustre/S/nanziyuan/datasets/apps/ \
# --train ${trainset} \
# --test ${testset}
## HumanEval & MBPP
# evalplus.evaluate \ # evalplus.evaluate \
# --model ${model} \ # --model ${model} \
# --n_samples 50 \ # --n_samples 50 \
...@@ -29,6 +36,11 @@ python -m codecritic.cli.gen_dataset \ ...@@ -29,6 +36,11 @@ python -m codecritic.cli.gen_dataset \
# --root "${project}/data/test/${modelname}-mbpp" \ # --root "${project}/data/test/${modelname}-mbpp" \
# --backend vllm # --backend vllm
# HumanEvalPack ## HumanEvalPack
## BigCodeBench
# BigCodeBench ## Training dataset
python -m codecritic.cli.select_preference_pairs \
--dataset ${trainset} \
--output ${train_selected_pairs}
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment