diff --git a/src/nio_llm/__main__.py b/src/nio_llm/__main__.py index 183ef39..d2113e9 100644 --- a/src/nio_llm/__main__.py +++ b/src/nio_llm/__main__.py @@ -23,7 +23,7 @@ def main( openai_api_endpoint: str = "http://localhost:8000/v1", openai_temperature: float = 0, openai_max_tokens: int = 256, - history_size: int = 3, + history_size: int = 5, ) -> None: """Instantiate and start the client. @@ -60,7 +60,7 @@ def main( Defaults to `256`. history_size (`int`): The number of messages to keep in history. - Defaults to `3`. + Defaults to `5`. """ # create the client client = LLMClient( diff --git a/src/nio_llm/client.py b/src/nio_llm/client.py index f7e318d..7453437 100644 --- a/src/nio_llm/client.py +++ b/src/nio_llm/client.py @@ -181,7 +181,6 @@ class LLMClient(AsyncClient): for message in self.history ], ], - stop=["<|im_end|>"], temperature=self.openai_temperature, max_tokens=self.openai_max_tokens, )