Enable load-balanced servers

2024-01-10 15:11:36 +00:00 · 2024-01-10 15:11:36 +00:00 · f3aadd2ce0
commit f3aadd2ce0
parent 4028afce3d
1 changed files with 12 additions and 4 deletions
--- a/src/cogs/ollama.py
+++ b/src/cogs/ollama.py
@ -1,5 +1,4 @@
 import asyncio
-import collections
 import json
 import logging
 import textwrap
@ -35,6 +34,13 @@ class Ollama(commands.Cog):
    def __init__(self, bot: commands.Bot):
        self.bot = bot
        self.log = logging.getLogger("jimmy.cogs.ollama")
+        self.last_server = 0
+
+    def next_server(self, increment: bool = True) -> str:
+        """Returns the next server key."""
+        if increment:
+            self.last_server += 1
+        return SERVER_KEYS[self.last_server % len(SERVER_KEYS)]

    async def ollama_stream(self, iterator: aiohttp.StreamReader) -> typing.AsyncIterator[dict]:
        async for line in iterator:
@ -73,7 +79,7 @@ class Ollama(commands.Cog):
                discord.Option(
                    str,
                    "The server to use for ollama.",
-                    default=SERVER_KEYS[0],
+                    default="next",
                    choices=SERVER_KEYS
                )
            ],
@ -86,12 +92,14 @@ class Ollama(commands.Cog):
        try:
            model, tag = model.split(":", 1)
            model = model + ":" + tag
-            self.log.debug("Model %r already has a tag")
+            self.log.debug("Model %r already has a tag", model)
        except ValueError:
            model = model + ":latest"
            self.log.debug("Resolved model to %r" % model)

-        if server not in CONFIG["ollama"]:
+        if server == "next":
+            server = self.next_server()
+        elif server not in CONFIG["ollama"]:
            await ctx.respond("Invalid server")
            return