Tested after rebasing; fix importance sampling bug

This commit is contained in:
YeAnbang
2025-08-06 06:15:15 +00:00
parent 3746f73854
commit 32b2148670
4 changed files with 4 additions and 3 deletions

View File

@@ -273,6 +273,7 @@ class Qwen3PipelineForwards:
hidden_states: Optional[torch.FloatTensor] = None,
stage_index: Optional[List[int]] = None,
shard_config: ShardConfig = None,
**kwargs
):
r"""
Args: