Allow using system prompt and large user prompt

Nexus 2024-03-22 09:08:03 +00:00
parent 7cd2032de9
commit 50c648a618
Signed by: nex (GPG key ID: 0FA334385D0B689F)


@@ -8,6 +8,7 @@ import typing
 import base64
 import io
 import redis
+from discord import Interaction
 from discord.ui import View, button
 from fnmatch import fnmatch
@@ -89,7 +90,7 @@ class ChatHistory:
             "threads:" + thread_id, json.dumps(self._internal[thread_id])
         )
 
-    def create_thread(self, member: discord.Member) -> str:
+    def create_thread(self, member: discord.Member, default: str | None = None) -> str:
        """
        Creates a thread, returns its ID.
        """
@@ -100,7 +101,7 @@ class ChatHistory:
            "messages": []
        }
        with open("./assets/ollama-prompt.txt") as file:
-            system_prompt = file.read()
+            system_prompt = default or file.read()
        self.add_message(
            key,
            "system",
@@ -190,6 +191,32 @@ class ChatHistory:
 SERVER_KEYS = list(CONFIG["ollama"].keys())
 
 
+class OllamaGetPrompt(discord.ui.Modal):
+    def __init__(self, ctx: discord.ApplicationContext, prompt_type: str = "User"):
+        super().__init__(
+            discord.ui.InputText(
+                style=discord.InputTextStyle.long,
+                label="%s prompt" % prompt_type,
+                placeholder="Enter your prompt here.",
+            ),
+            timeout=300,
+            title="Ollama %s prompt" % prompt_type,
+        )
+        self.ctx = ctx
+        self.prompt_type = prompt_type
+        self.value = None
+
+    async def interaction_check(self, interaction: discord.Interaction) -> bool:
+        return interaction.user == self.ctx.user
+
+    async def callback(self, interaction: Interaction):
+        await interaction.response.defer()
+        self.ctx.interaction = interaction
+        self.value = self.children[0].value
+        self.stop()
+
+
 class Ollama(commands.Cog):
     def __init__(self, bot: commands.Bot):
         self.bot = bot
@@ -286,7 +313,28 @@ class Ollama(commands.Cog):
        if not self.history.get_thread(context):
            await ctx.respond("Invalid context key.")
            return
 
-        await ctx.defer()
+        if query.startswith("$$"):
+            prompt = OllamaGetPrompt(ctx, "System")
+            await ctx.send_modal(prompt)
+            await prompt.wait()
+            system_query = prompt.value
+            if not system_query:
+                return await ctx.respond("No prompt provided. Aborting.")
+        else:
+            system_query = None
+
+        if query == "$":
+            prompt = OllamaGetPrompt(ctx)
+            await ctx.send_modal(prompt)
+            await prompt.wait()
+            query = prompt.value
+            if not query:
+                return await ctx.respond("No prompt provided. Aborting.")
+
+        try:
+            await ctx.defer()
+        except discord.HTTPException:
+            pass
 
        model = model.casefold()
        try:
@@ -294,7 +342,7 @@ class Ollama(commands.Cog):
            model = model + ":" + tag
            self.log.debug("Model %r already has a tag", model)
        except ValueError:
-            model = model + ":latest"
+            model += ":latest"
        self.log.debug("Resolved model to %r" % model)
 
        if image:
@@ -315,7 +363,7 @@ class Ollama(commands.Cog):
            data = io.BytesIO()
            await image.save(data)
            data.seek(0)
-            image_data = base64.b64encode(data.read()).decode("utf-8")
+            image_data = base64.b64encode(data.read()).decode()
        else:
            image_data = None
@@ -336,7 +384,12 @@ class Ollama(commands.Cog):
        async with aiohttp.ClientSession(
            base_url=server_config["base_url"],
-            timeout=aiohttp.ClientTimeout(0)
+            timeout=aiohttp.ClientTimeout(
+                connect=30,
+                sock_read=10800,
+                sock_connect=30,
+                total=10830
+            )
        ) as session:
            embed = discord.Embed(
                title="Checking server...",
@@ -482,7 +535,7 @@ class Ollama(commands.Cog):
        self.log.debug("Beginning to generate response with key %r.", key)
        if context is None:
-            context = self.history.create_thread(ctx.user)
+            context = self.history.create_thread(ctx.user, system_query)
        elif context is not None and self.history.get_thread(context) is None:
            __thread = self.history.find_thread(context)
            if not __thread:
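
For reference, a minimal sketch of how the pieces above fit together end to end. This is not part of the commit; it only restates the flow from the hunks, using the names introduced there (OllamaGetPrompt, create_thread) and assuming py-cord's Modal / send_modal / wait() API as used in the diff.

    # Sketch only: how the "$" / "$$" prefixes collect prompts via a modal.
    async def collect_prompts(ctx, query: str) -> tuple[str | None, str | None]:
        system_query = None
        if query.startswith("$$"):              # "$$" -> ask for a custom system prompt
            modal = OllamaGetPrompt(ctx, "System")
            await ctx.send_modal(modal)
            await modal.wait()                  # resumes once callback() calls self.stop()
            system_query = modal.value
        if query == "$":                        # "$" -> ask for a long user prompt
            modal = OllamaGetPrompt(ctx)
            await ctx.send_modal(modal)
            await modal.wait()
            query = modal.value
        return system_query, query

    # system_query is later passed to ChatHistory.create_thread(ctx.user, system_query),
    # where it takes precedence over the default ./assets/ollama-prompt.txt system prompt.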