fix(community): allow support for disabling max_tokens args (#21534)

This PR fixes an issue where it was not possible to request unlimited/infinite
tokens from the underlying provider when using the LiteLLM integration.

This matters in agent environments, where token usage can increase
drastically beyond the initially configured value, causing unexpected
behavior.
This commit is contained in:
Ayo Ayibiowu 2024-06-27 22:28:59 +02:00 committed by GitHub
parent 2a0d6788f7
commit c6f700b7cb
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@ -191,7 +191,7 @@ class ChatLiteLLM(BaseChatModel):
n: int = 1
"""Number of chat completions to generate for each prompt. Note that the API may
not return the full n completions if duplicates are generated."""
max_tokens: int = 256
max_tokens: Optional[int] = None
max_retries: int = 6