From c7d3d0dc8f1d410d8acca1117158393c36965725 Mon Sep 17 00:00:00 2001 From: Tong Li Date: Thu, 19 Jun 2025 07:14:16 +0000 Subject: [PATCH] remove unused parameter --- colossalai/shardformer/modeling/qwen2.py | 1 - 1 file changed, 1 deletion(-) diff --git a/colossalai/shardformer/modeling/qwen2.py b/colossalai/shardformer/modeling/qwen2.py index 27571309e..8777ae77f 100644 --- a/colossalai/shardformer/modeling/qwen2.py +++ b/colossalai/shardformer/modeling/qwen2.py @@ -824,7 +824,6 @@ def get_lm_forward_with_dist_cross_entropy(shard_config: ShardConfig): output_attentions=output_attentions, output_hidden_states=output_hidden_states, return_dict=return_dict, - force_sp_output_gather=False, ) hidden_states = outputs[0]