mirror of
https://github.com/hpcaitech/ColossalAI.git
synced 2025-06-22 05:29:36 +00:00
* add grpo, support rlvr * add grpo, support rlvr * tested deepseek r1 pipeline * add ci * verify grpo r1 * verify grpo r1 * update readme, remove unused code * [pre-commit.ci] auto fixes from pre-commit.com hooks for more information, see https://pre-commit.ci * remove path * clean code * fix circular import * fix ci OOM * fix ci OOM * skip kto tp, fix qwen generation --------- Co-authored-by: pre-commit-ci[bot] <66853113+pre-commit-ci[bot]@users.noreply.github.com>
17 lines
455 B
Bash
Executable File
17 lines
455 B
Bash
Executable File
# run under /ColossalAI/applications/ColossalChat
#
# Exports the environment variables below and creates the model/dataset
# directories they point to. All paths are relative to the current working
# directory. Source this file (rather than executing it) if the exported
# variables must remain visible in the calling shell.

export NCCL_SHM_DISABLE=1
export MAX_JOBS=1

# Model and dataset locations.
export PRETRAINED_MODEL_PATH=./models
export SFT_DATASET=./sft_data
export PROMPT_DATASET=./prompt_data
# Points at the same directory as PROMPT_DATASET.
export PROMPT_RLVR_DATASET=./prompt_data
export PREFERENCE_DATASET=./preference_data
export KTO_DATASET=./kto_data

# Create the directories from the exported variables so the two can never
# drift apart. -p makes the step re-runnable: a directory that already exists
# is not an error.
mkdir -p -- \
  "$PRETRAINED_MODEL_PATH" \
  "$SFT_DATASET" \
  "$PROMPT_DATASET" \
  "$PREFERENCE_DATASET" \
  "$KTO_DATASET"

# ./tests/test_data_preparation.sh
# ./tests/test_train.sh