Fix logprob; add filtering, temperature annealing, and learning-rate (lr) descent

This commit is contained in:
YeAnbang
2025-03-21 10:24:24 +08:00
parent 7ee4452f8c
commit 0472f44163
7 changed files with 74 additions and 27 deletions

View File

@@ -22,7 +22,7 @@ if __name__ == "__main__":
inference_model_config = dict(path=args.model)
train_model_config = dict(path=args.model)
-generate_config = dict(top_k=50, top_p=0.9, temperature=0.7)
+generate_config = dict(top_k=50, top_p=0.75, temperature=0.9)
if args.backend == "transformers":
inference_model_config.update(