tested after rebasing, fix importance sampling bug

This commit is contained in:
YeAnbang 2025-08-06 06:15:15 +00:00
parent 3746f73854
commit 32b2148670
4 changed files with 4 additions and 3 deletions

View File

@@ -1,4 +1,4 @@
pandas>=1.4.1
sentencepiece
-colossalai==0.4.7
+colossalai>=0.4.7
prompt_toolkit

View File

@@ -1,4 +1,4 @@
-transformers==4.39.3
+transformers>=4.39.3
tqdm
datasets==2.14.7
loralib

View File

@@ -152,7 +152,7 @@ if __name__ == "__main__":
"-ei",
"--eval-interval",
type=int,
-default=100,
+default=-1,
help="Interval for evaluation. Evaluate every ei training steps.",
)
parser.add_argument(

View File

@@ -273,6 +273,7 @@ class Qwen3PipelineForwards:
hidden_states: Optional[torch.FloatTensor] = None,
stage_index: Optional[List[int]] = None,
shard_config: ShardConfig = None,
+**kwargs
):
r"""
Args: