diff --git a/libs/langchain/langchain/llms/vllm.py b/libs/langchain/langchain/llms/vllm.py index d02b6ff02f2..46da858c775 100644 --- a/libs/langchain/langchain/llms/vllm.py +++ b/libs/langchain/langchain/llms/vllm.py @@ -54,6 +54,9 @@ class VLLM(BaseLLM): max_new_tokens: int = 512 """Maximum number of tokens to generate per output sequence.""" + logprobs: Optional[int] = None + """Number of log probabilities to return per output token.""" + client: Any #: :meta private: @root_validator() @@ -91,6 +94,7 @@ class VLLM(BaseLLM): "stop": self.stop, "ignore_eos": self.ignore_eos, "use_beam_search": self.use_beam_search, + "logprobs": self.logprobs, } def _generate(