markov: avoid float division in uint_to_bytes

It seems as though the float division could cause an issue where the actual value should be an integer but the float representation is slightly higher than that, causing the addition of an extra unnecessary byte. Although this works fine as long as the same function is used, it could cause problems if seemingly inconsequential details change. I switch to using divmod and checking for the presence of a remainder. This should ensure use of the exact minimum required number of bytes in the blob.
author: Arjun Satarkar <me@arjunsatarkar.net> 2024-03-20 03:07:54 +0000
committer: Arjun Satarkar <me@arjunsatarkar.net> 2024-03-20 03:07:54 +0000
commit: 16aeaa50db79e3c17194128a93d22370bf5daa33 (patch)
tree: cbcef052ca3afb49274513446514438fa1ed1604 /markov
parent: 92a0d3eb4fd919ff9ed33b81d379ccb77af43026 (diff)
download: aps-cogs-16aeaa50db79e3c17194128a93d22370bf5daa33.tar
aps-cogs-16aeaa50db79e3c17194128a93d22370bf5daa33.tar.gz
aps-cogs-16aeaa50db79e3c17194128a93d22370bf5daa33.zip
1 files changed, 17 insertions, 14 deletions
diff --git a/markov/markov.py b/markov/markov.py
index e206800..73ac08e 100644
--- a/markov/markov.py
+++ b/markov/markov.py
@@ -151,13 +151,29 @@ class Markov(commands.Cog):
     def uint_to_bytes(self, x: int):
         if x < 0:
             raise ValueError(f"x must be non-negative (got {x})")
-        return x.to_bytes(math.ceil(x.bit_length() / 8), byteorder="big", signed=False)
+        byte_length, remainder = divmod(x.bit_length(), 8)
+        if remainder:
+            byte_length += 1
+        return x.to_bytes(byte_length, byteorder="big", signed=False)
 
     def get_base_channel(self, channel_or_thread):
         if isinstance(channel_or_thread, discord.Thread):
             return channel_or_thread.parent
         return channel_or_thread
 
+    def append_token(self, text, token):
+        # NOTE: if changing PUNCTUATION, also change the regex in process_message() with the corresponding note
+        PUNCTUATION = r".,!?/;()"
+        if token == "/":
+            text = text[:-1] + token
+        elif token == "(":
+            text += token
+        elif token in PUNCTUATION:
+            text = text[:-1] + token + " "
+        else:
+            text += token + " "
+        return text
+
     @commands.group()
     async def markov(self, _ctx):
         """
@@ -385,19 +401,6 @@ class Markov(commands.Cog):
             await db.commit()
         await ctx.reply("All markov data for this guild has been deleted.")
 
-    def append_token(self, text, token):
-        # NOTE: if changing PUNCTUATION, also change the regex in process_message() with the corresponding note
-        PUNCTUATION = r".,!?/;()"
-        if token == "/":
-            text = text[:-1] + token
-        elif token == "(":
-            text += token
-        elif token in PUNCTUATION:
-            text = text[:-1] + token + " "
-        else:
-            text += token + " "
-        return text
-
     @markov.command()
     async def generate(self, ctx, member: discord.Member | None):
         if not await self.config.guild(ctx.guild).use_messages():
author	Arjun Satarkar <me@arjunsatarkar.net>	2024-03-20 03:07:54 +0000
committer	Arjun Satarkar <me@arjunsatarkar.net>	2024-03-20 03:07:54 +0000
commit	16aeaa50db79e3c17194128a93d22370bf5daa33 (patch)
tree	cbcef052ca3afb49274513446514438fa1ed1604 /markov
parent	92a0d3eb4fd919ff9ed33b81d379ccb77af43026 (diff)
download	aps-cogs-16aeaa50db79e3c17194128a93d22370bf5daa33.tar aps-cogs-16aeaa50db79e3c17194128a93d22370bf5daa33.tar.gz aps-cogs-16aeaa50db79e3c17194128a93d22370bf5daa33.zip