🚚 split logic in two separate files, create nio_llm module

2024-09-19 19:45:28 +00:00 · 2023-05-24 21:57:48 +02:00 · 2023-05-24 21:57:48 +02:00 · 69e24bfbd6
parent aa6e8e79c2
commit 69e24bfbd6
4 changed files with 104 additions and 119 deletions
--- a/nio-llm/test.py
+++ b/nio-llm/test.py
@ -1,28 +0,0 @@
-from textwrap import dedent
-
-from llama_cpp import Llama
-
-llm = Llama(model_path="../../../llama.cpp/models/sv13B/stable-vicuna-13B.ggml.q5_1.bin", n_threads=12)
-
-msg = dedent(
-    """
-    You are pipobot, an arrogant assistant. Answer as concisely as possible.
-    <@fainsil:inpt.fr>: Qu'est ce qu'une intégrale de Lebesgue ?
-    <@pipobot:inpt.fr>:
-    """,
-).strip()
-
-print(msg)
-print(repr(msg))
-
-output = llm(
-    msg,
-    max_tokens=100,
-    stop=["<@fainsil:inpt.fr>:", "\n"],
-    echo=True,
-)
-
-print(output)
-res = output["choices"][0]["text"]
-print(res)
-print(res.removeprefix(msg).strip())
--- a/nio_llm/__init__.py
+++ b/nio_llm/__init__.py
--- a/nio_llm/client.py
+++ b/nio_llm/client.py
@ -1,17 +1,14 @@
 """A Matrix client that uses Llama to respond to messages."""

-import asyncio
 import logging
 import time
+from pathlib import Path
 from textwrap import dedent

-import click
-from huggingface_hub import hf_hub_download
 from llama_cpp import Llama
 from nio import AsyncClient, MatrixRoom, RoomMessageText
-from rich.logging import RichHandler

-logger = logging.getLogger("nio-llm")
+logger = logging.getLogger("nio-llm.client")


 class LLMClient(AsyncClient):
@ -23,7 +20,7 @@ class LLMClient(AsyncClient):
        homeserver: str,
        device_id: str,
        preprompt: str,
-        ggml_path: str,
+        ggml_path: Path,
        room: str,
    ):
        """Create a new LLMClient instance."""
@ -42,7 +39,7 @@ class LLMClient(AsyncClient):

        # create the Llama instance
        self.llm = Llama(
-            model_path=ggml_path,
+            model_path=str(ggml_path),
            n_threads=12,
        )

@ -125,87 +122,3 @@ class LLMClient(AsyncClient):
                "body": output,
            },
        )
-
-
-@click.command()
-@click.option("--homeserver", "-h", help="The homeserver to connect to.", required=True)
-@click.option("--device-id", "-d", help="The device ID to use.", required=True)
-@click.option("--username", "-u", help="The username to log in as.", required=True)
-@click.option("--password", "-p", help="The password to log in with.", required=True)
-@click.option("--room", "-r", help="The room to join.", required=True)
-@click.option("--preprompt", "-t", help="The preprompt to use.", required=True)
-def main(
-    homeserver: str,
-    device_id: str,
-    username: str,
-    password: str,
-    room: str,
-    preprompt: str,
-) -> None:
-    """Run the main program.
-
-    Download the model from HuggingFace Hub and start the async loop.
-    """
-    # download the model
-    ggml_path = hf_hub_download(
-        repo_id="TheBloke/stable-vicuna-13B-GGML",
-        filename="stable-vicuna-13B.ggmlv3.q5_1.bin",
-    )
-
-    asyncio.get_event_loop().run_until_complete(
-        _main(
-            ggml_path=ggml_path,
-            homeserver=homeserver,
-            device_id=device_id,
-            username=username,
-            password=password,
-            preprompt=preprompt,
-            room=room,
-        ),
-    )
-
-
-async def _main(
-    homeserver: str,
-    device_id: str,
-    username: str,
-    password: str,
-    room: str,
-    preprompt: str,
-    ggml_path: str,
-) -> None:
-    """Run the async main program.
-
-    Create the client, login, join the room, and sync forever.
-    """
-    # create the client
-    client = LLMClient(
-        homeserver=homeserver,
-        device_id=device_id,
-        username=username,
-        room=room,
-        preprompt=preprompt,
-        ggml_path=ggml_path,
-    )
-
-    # Login to the homeserver
-    logger.debug(await client.login(password))
-
-    # Join the room, if not already joined
-    logger.debug(await client.join(room))
-
-    # Sync with the server forever
-    await client.sync_forever(timeout=30000)
-
-
-if __name__ == "__main__":
-    # set up logging
-    logging.captureWarnings(True)
-    logging.basicConfig(
-        level="DEBUG",
-        format="%(name)s: %(message)s",
-        handlers=[RichHandler(markup=True)],
-    )
-
-    # run the main program (with environment variables)
-    main(auto_envvar_prefix="NIOLLM")
--- a/nio_llm/main.py
+++ b/nio_llm/main.py
@ -0,0 +1,100 @@
+"""The main program for nio-llm."""
+
+import asyncio
+import logging
+from pathlib import Path
+
+import click
+from huggingface_hub import hf_hub_download
+from rich.logging import RichHandler
+
+from nio_llm.client import LLMClient
+
+logger = logging.getLogger("nio-llm.main")
+
+
+@click.command()
+@click.option("--homeserver", "-h", help="The homeserver to connect to.", required=True)
+@click.option("--device-id", "-d", help="The device ID to use.", required=True)
+@click.option("--username", "-u", help="The username to log in as.", required=True)
+@click.option("--password", "-p", help="The password to log in with.", required=True)
+@click.option("--room", "-r", help="The room to join.", required=True)
+@click.option("--preprompt", "-t", help="The preprompt to use.", required=True)
+def main(
+    homeserver: str,
+    device_id: str,
+    username: str,
+    password: str,
+    room: str,
+    preprompt: str,
+) -> None:
+    """Run the main program.
+
+    Download the model from HuggingFace Hub and start the async loop.
+    """
+    # download the model
+    ggml_path = Path(
+        hf_hub_download(
+            repo_id="TheBloke/stable-vicuna-13B-GGML",
+            filename="stable-vicuna-13B.ggmlv3.q5_1.bin",
+        ),
+    )
+
+    # start the async loop
+    asyncio.get_event_loop().run_until_complete(
+        _main(
+            ggml_path=ggml_path,
+            homeserver=homeserver,
+            device_id=device_id,
+            username=username,
+            password=password,
+            preprompt=preprompt,
+            room=room,
+        ),
+    )
+
+
+async def _main(
+    homeserver: str,
+    device_id: str,
+    username: str,
+    password: str,
+    room: str,
+    preprompt: str,
+    ggml_path: Path,
+) -> None:
+    """Run the async main program.
+
+    Create the client, login, join the room, and sync forever.
+    """
+    # create the client
+    client = LLMClient(
+        homeserver=homeserver,
+        device_id=device_id,
+        username=username,
+        room=room,
+        preprompt=preprompt,
+        ggml_path=ggml_path,
+    )
+
+    # Login to the homeserver
+    logger.debug(await client.login(password))
+
+    # Join the room, if not already joined
+    logger.debug(await client.join(room))
+
+    # Sync with the server forever
+    await client.sync_forever(timeout=30000)
+
+
+if __name__ == "__main__":
+    # set up logging
+    logging.captureWarnings(True)
+    logging.basicConfig(
+        level="DEBUG",
+        format="%(name)s: %(message)s",
+        handlers=[RichHandler(markup=True)],
+    )
+
+    # run the main program (with environment variables)
+    main(auto_envvar_prefix="NIOLLM")