From 474fe98b38cee2f68b705b343b078678ceb84274 Mon Sep 17 00:00:00 2001
From: nex <me@nexy7574.co.uk>
Date: Sat, 11 Nov 2023 18:42:33 +0000
Subject: [PATCH] Add killswitch

---
 cogs/other.py | 30 ++++++++++++++++++++++++------
 1 file changed, 24 insertions(+), 6 deletions(-)
diff --git a/cogs/other.py b/cogs/other.py
index adb296a..19e0667 100644
--- a/cogs/other.py
+++ b/cogs/other.py
@@ -1831,7 +1831,9 @@ class OtherCog(commands.Cog):
                 await interaction.edit_original_response(view=self)
                 self.stop()
 
-    @commands.command(hidden=True)
+    @commands.command(
+        usage="[model:<name:tag>] [server:<ip[:port]>] <query>"
+    )
     @commands.is_owner()
     @commands.max_concurrency(1, wait=True)
     async def ollama(self, ctx: commands.Context, *, query: str):
@@ -1846,8 +1848,19 @@ class OtherCog(commands.Cog):
         else:
             model = "orca-mini"
 
-        msg = await ctx.reply(f"Preparing {model!r} <a:loading:1101463077586735174>")
-        async with httpx.AsyncClient(base_url="http://192.168.0.90:11434/api") as client:
+        if query.startswith("server:"):
+            host, query = query.split(" ", 1)
+            host = host[7:]
+            try:  # accept "ip" or "ip:port"; anything else falls back to the default port
+                host, port = host.split(":", 1)  # ValueError here means no port was given
+                host += f":{int(port)}"  # re-attach the validated port instead of dropping it
+            except ValueError:
+                host += ":11434"
+        else:
+            host = "192.168.0.90:11434"
+
+        msg = await ctx.reply(f"Preparing [{model!r}](http://{host}) <a:loading:1101463077586735174>")
+        async with httpx.AsyncClient(base_url=f"http://{host}/api") as client:
             # get models
             try:
                 response = await client.post("/show", json={"name": model})
@@ -1910,8 +1923,10 @@ class OtherCog(commands.Cog):
                     if response.status_code != 200:
                         error = await response.aread()
                         return await msg.edit(content="Failed to generate text: `%s`" % error.decode())
+                    self.ollama_locks[msg] = asyncio.Event()
+                    view = self.OllamaKillSwitchView(ctx, msg)
+                    await msg.edit(view=view)
                     async for chunk in ollama_stream_reader(response):
-                        print(chunk)
                         if "done" not in chunk.keys() or "response" not in chunk.keys():
                             continue
                         else:
@@ -1921,7 +1936,9 @@ class OtherCog(commands.Cog):
                             output.description += chunk["response"]
                             last_edit = msg.edited_at.timestamp() if msg.edited_at else msg.created_at.timestamp()
                             if (time() - last_edit) >= 5 or chunk["done"] is True:
-                                await msg.edit(content=content, embed=output)
+                                await msg.edit(content=content, embed=output, view=view)
+                            if self.ollama_locks[msg].is_set():
+                                return await msg.edit(content="Aborted.", embed=output, view=None)
 
                     def get_time_spent(nanoseconds: int) -> str:
                         hours, minutes, seconds = 0, 0, 0
@@ -1963,7 +1980,8 @@ class OtherCog(commands.Cog):
                             tokens_per_second
                         ),
                     )
-                    await msg.edit(content=None, embed=output)
+                    await msg.edit(content=None, embed=output, view=None)
+                    self.ollama_locks.pop(msg, None)
 
 
 def setup(bot):