mirror of
https://github.com/hpcaitech/ColossalAI.git
synced 2025-09-06 03:20:52 +00:00
[moe] init mixtral impl
This commit is contained in:
19
applications/ColossalMoE/train.sh
Normal file
19
applications/ColossalMoE/train.sh
Normal file
@@ -0,0 +1,19 @@
|
||||
# Launch script for the ColossalMoE Mixtral training entry point (train.py).
# Edit the settings below, then run this script from the directory that
# contains train.py and the "hostfile" passed to the launcher.

NUM_GPU=8                            # forwarded to --nproc_per_node
MODEL="mistralai/Mixtral-8x7B-v0.1"  # forwarded to --model_name
# NOTE(review): SEQ_LENGTH is defined but not passed to train.py below;
# confirm whether a sequence-length flag should be forwarded.
SEQ_LENGTH=2048
BATCH_SIZE=1                         # forwarded to --batch_size
LR=0.00001                           # forwarded to --lr

# hybrid
# Alternative launcher, kept for reference:
# torchrun --standalone --nproc_per_node $NUM_GPU \
# Expansions are quoted so an edited value containing spaces or glob
# characters is still passed as a single argument. The last argument line
# carries no trailing backslash, so nothing after it can be swallowed into
# the command.
colossalai run --nproc_per_node "$NUM_GPU" --hostfile "hostfile" \
    train.py \
    --num_epoch 1 \
    --model_name "$MODEL" \
    --plugin "hybrid" \
    --batch_size "$BATCH_SIZE" \
    --lr "$LR" \
    --zero_stage 1 \
    --pp_size 2 \
    --dp_size 1 \
    --ep_size 8
|
Reference in New Issue
Block a user