Mirror of https://github.com/hwchase17/langchain.git, synced 2025-09-03 03:59:42 +00:00
community[patch]: allows using text-generation-inference /generate route with HuggingFaceEndpoint (#20100)
- **Description:** allows using the /generate route of `text-generation-inference` with the `HuggingFaceEndpoint`.
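
For context, a minimal sketch of the call pattern this enables against a self-hosted text-generation-inference server (the endpoint URL and generation parameters below are placeholders, not values from the PR):

from langchain_community.llms import HuggingFaceEndpoint

# Point the wrapper at a self-hosted text-generation-inference server;
# with this patch the non-streaming /generate response is parsed correctly.
llm = HuggingFaceEndpoint(
    endpoint_url="http://localhost:8080",  # hypothetical TGI server
    max_new_tokens=128,
    temperature=0.7,
)

print(llm.invoke("What is Deep Learning?"))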
@@ -258,7 +258,10 @@ class HuggingFaceEndpoint(LLM):
                 stream=False,
                 task=self.task,
             )
-            response_text = json.loads(response.decode())[0]["generated_text"]
+            try:
+                response_text = json.loads(response.decode())[0]["generated_text"]
+            except KeyError:
+                response_text = json.loads(response.decode())["generated_text"]
 
             # Maybe the generation has stopped at one of the stop sequences:
             # then we remove this stop sequence from the end of the generated text
@@ -289,7 +292,10 @@ class HuggingFaceEndpoint(LLM):
                 stream=False,
                 task=self.task,
             )
-            response_text = json.loads(response.decode())[0]["generated_text"]
+            try:
+                response_text = json.loads(response.decode())[0]["generated_text"]
+            except KeyError:
+                response_text = json.loads(response.decode())["generated_text"]
 
             # Maybe the generation has stopped at one of the stop sequences:
             # then remove this stop sequence from the end of the generated text
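
The try/except added in both hunks covers the two response shapes the endpoint can return: a list of generations versus the single JSON object returned by text-generation-inference's /generate route. A self-contained sketch of that fallback, with hypothetical payloads:

import json

def parse_generated_text(response: bytes) -> str:
    """Return the generated text from either response shape."""
    payload = json.loads(response.decode())
    try:
        # List-shaped payload, e.g. [{"generated_text": "..."}]
        return payload[0]["generated_text"]
    except KeyError:
        # Object-shaped payload from the /generate route, e.g. {"generated_text": "..."}
        return payload["generated_text"]

# Hypothetical payloads illustrating both shapes:
assert parse_generated_text(b'[{"generated_text": "hi"}]') == "hi"
assert parse_generated_text(b'{"generated_text": "hi"}') == "hi"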