Commit 527f2798 by nanziyuan

inference 32b model

parent d66937e2
...@@ -13,7 +13,6 @@ def generate_worker(cuda_device, prompts, model_path, sampling_params): ...@@ -13,7 +13,6 @@ def generate_worker(cuda_device, prompts, model_path, sampling_params):
model=model_path, model=model_path,
seed=42, seed=42,
max_model_len=8 * 1024, max_model_len=8 * 1024,
swap_space=16,
tensor_parallel_size=len(cuda_device), tensor_parallel_size=len(cuda_device),
) )
...@@ -57,7 +56,6 @@ def score_worker(cuda_device, prompts, model_path, positive_token, negative_toke ...@@ -57,7 +56,6 @@ def score_worker(cuda_device, prompts, model_path, positive_token, negative_toke
model=model_path, model=model_path,
seed=42, seed=42,
max_model_len=8 * 1024, max_model_len=8 * 1024,
swap_space=16,
tensor_parallel_size=len(cuda_device), tensor_parallel_size=len(cuda_device),
) )
......
...@@ -3,6 +3,7 @@ set -xe ...@@ -3,6 +3,7 @@ set -xe
model="/lustre/S/huangdi/open_for_out/models/Qwen2.5-Coder-32B-Instruct" model="/lustre/S/huangdi/open_for_out/models/Qwen2.5-Coder-32B-Instruct"
project="/lustre/S/nanziyuan/projects/ccc" project="/lustre/S/nanziyuan/projects/ccc"
modelname="qwen25_coder_inst_32b" modelname="qwen25_coder_inst_32b"
tp=4
# APPS # APPS
# CUDA_VISIBLE_DEVICES=0,1,2,3 \ # CUDA_VISIBLE_DEVICES=0,1,2,3 \
...@@ -11,7 +12,7 @@ python -m codecritic.cli.gen_dataset \ ...@@ -11,7 +12,7 @@ python -m codecritic.cli.gen_dataset \
--apps /lustre/S/nanziyuan/datasets/apps/ \ --apps /lustre/S/nanziyuan/datasets/apps/ \
--train "${project}/data/train/${modelname}-apps-train.jsonl" \ --train "${project}/data/train/${modelname}-apps-train.jsonl" \
--test "${project}/data/test/${modelname}-apps-test.jsonl" \ --test "${project}/data/test/${modelname}-apps-test.jsonl" \
--tp 2 --tp ${tp}
# HumanEval & MBPP # HumanEval & MBPP
evalplus.evaluate \ evalplus.evaluate \
...@@ -21,7 +22,7 @@ evalplus.evaluate \ ...@@ -21,7 +22,7 @@ evalplus.evaluate \
--dataset humaneval \ --dataset humaneval \
--root "${project}/data/test/${modelname}-humaneval" \ --root "${project}/data/test/${modelname}-humaneval" \
--backend vllm \ --backend vllm \
--tp 2 --tp ${tp}
evalplus.evaluate \ evalplus.evaluate \
--model ${model} \ --model ${model} \
...@@ -30,7 +31,7 @@ evalplus.evaluate \ ...@@ -30,7 +31,7 @@ evalplus.evaluate \
--dataset mbpp \ --dataset mbpp \
--root "${project}/data/test/${modelname}-mbpp" \ --root "${project}/data/test/${modelname}-mbpp" \
--backend vllm \ --backend vllm \
--tp 2 --tp ${tp}
# HumanEvalPack # HumanEvalPack
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment