Commit ee225d88 by nanziyuan

fix script

parent 944b6831
...@@ -12,19 +12,19 @@ train_selected_pairs="${project}/data/train/${modelname}-apps-train-selected_pai ...@@ -12,19 +12,19 @@ train_selected_pairs="${project}/data/train/${modelname}-apps-train-selected_pai
apps="/lustre/S/nanziyuan/datasets/apps/" apps="/lustre/S/nanziyuan/datasets/apps/"
sft="${project}/data/train/${modelname}-sft.jsonl" sft="${project}/data/train/${modelname}-sft.jsonl"
ftmodel="${project}/model/algolr" ftmodel="${project}/model/qwen25_coder_inst_7b-algolr"
export CUDA_VISIBLE_DEVICES=0,1,2,3 ### export CUDA_VISIBLE_DEVICES=0,1,2,3
# python -m codecritic.cli.algolr \ python -m codecritic.cli.algolr \
# --model ${model} \ --model ${model} \
# --dataset ${trainset} \ --dataset ${trainset} \
# --pairinfo ${train_selected_pairs} \ --pairinfo ${train_selected_pairs} \
# --apps ${apps} \ --apps ${apps} \
# --output ${sft} \ --output ${sft} \
# --level beginner \ --level beginner \
# --tp 1 --tp 1
deepspeed --module \ deepspeed --module \
...@@ -34,7 +34,7 @@ openrlhf.cli.train_sft \ ...@@ -34,7 +34,7 @@ openrlhf.cli.train_sft \
--input_key question \ --input_key question \
--output_key response \ --output_key response \
--apply_chat_template \ --apply_chat_template \
--train_batch_size 32 \ --train_batch_size 256 \
--micro_train_batch_size 2 \ --micro_train_batch_size 2 \
--max_samples 500000 \ --max_samples 500000 \
--pretrain ${model} \ --pretrain ${model} \
...@@ -49,4 +49,4 @@ openrlhf.cli.train_sft \ ...@@ -49,4 +49,4 @@ openrlhf.cli.train_sft \
--learning_rate 5e-6 \ --learning_rate 5e-6 \
--load_checkpoint \ --load_checkpoint \
--gradient_checkpointing \ --gradient_checkpointing \
--use_tensorboard ${ftmodel}/runs --use_tensorboard "${ftmodel}_log"
...@@ -2,6 +2,7 @@ set -xe ...@@ -2,6 +2,7 @@ set -xe
dataset="/lustre/S/nanziyuan/projects/ccc/data/train/qwen25_coder_inst-apps-train-reward_dataset.jsonl" dataset="/lustre/S/nanziyuan/projects/ccc/data/train/qwen25_coder_inst-apps-train-reward_dataset.jsonl"
project="/lustre/S/nanziyuan/projects/ccc"
model="/lustre/S/huangdi/open_for_out/models/Qwen2.5-Coder-7B-Instruct/" model="/lustre/S/huangdi/open_for_out/models/Qwen2.5-Coder-7B-Instruct/"
ftmodel="${project}/model/qwen25_coder_inst_7b-orm" ftmodel="${project}/model/qwen25_coder_inst_7b-orm"
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment