Add OCR tech

2024-09-19 18:16:34 +01:00 · 2023-05-05 10:35:17 +01:00 · 2023-05-05 10:35:17 +01:00 · 34e63104f9
commit 34e63104f9
parent 7d9ed0f6ad
2 changed files with 50 additions and 0 deletions
--- a/cogs/other.py
+++ b/cogs/other.py
@ -21,6 +21,8 @@ from typing import Literal
 from typing import Tuple, Optional, Dict
 from pathlib import Path
 from urllib.parse import urlparse
+from PIL import Image
+import pytesseract

 import aiohttp
 import discord
@ -1521,6 +1523,52 @@ class OtherCog(commands.Cog):
        else:
            return await ctx.respond(result, view=GenerateNewView())

+    @commands.slash_command()
+    @commands.cooldown(1, 30, commands.BucketType.user)
+    @commands.max_concurrency(1, commands.BucketType.user)
+    async def ocr(
+            self,
+            ctx: discord.ApplicationContext,
+            attachment: discord.Option(
+                discord.SlashCommandOptionType.attachment,
+                description="Image to perform OCR on",
+            )
+    ):
+        """OCRs an image"""
+        await ctx.defer()
+        attachment: discord.Attachment
+        data = await attachment.read()
+        file = io.BytesIO(data)
+        file.seek(0)
+        img = await self.bot.loop.run_in_executor(None, Image.open, file)
+        try:
+            text = await self.bot.loop.run_in_executor(None, pytesseract.image_to_string, img)
+        except pytesseract.TesseractError as e:
+            return await ctx.respond(f"Failed to perform OCR: `{e}`")
+
+        if len(text) > ctx.guild.filesize_limit - 100:
+            try:
+                response = await self.http.put(
+                    "https://api.mystb.in/paste",
+                    json={
+                        "files": [
+                            {
+                                "filename": "ocr.txt",
+                                "content": text
+                            }
+                        ],
+                    }
+                )
+                response.raise_for_status()
+            except httpx.HTTPError:
+                return await ctx.respond("OCR content too large to post.")
+            else:
+                data = response.json()
+                return await ctx.respond("https://mystb.in/%s" % data["id"])
+
+        out_file = io.BytesIO(text.encode("utf-8", "replace"))
+        return await ctx.respond(file=discord.File(out_file, filename="ocr.txt"))
+

 def setup(bot):
    bot.add_cog(OtherCog(bot))
--- a/requirements.txt
+++ b/requirements.txt
@ -17,3 +17,5 @@ pyttsx3>=2.90
 yt-dlp
 beautifulsoup4>=4.12.0
 lxml>=4.9.2
+pytesseract>=0.3.10
+pillow>=9.5.0