[fix] Fix Mixtral modeling & policy; update wait handles; benchmark Llama hybrid

This commit is contained in:
duanjunwen
2024-11-15 05:58:56 +00:00
parent 014afbdb59
commit 5c2ebbfd48
4 changed files with 12 additions and 6 deletions

View File

@@ -122,7 +122,7 @@ def main():
num_ckpt_layers_per_stage=[19, 19, 19, 13],
),
"num_layers_per_stage": [19, 20, 20, 21],
# "pp_style": "interleaved",
"pp_style": "interleaved",
}
if args.custom_ckpt
else {}