From a269979b29fccdc69c070ef6644c5a837621b1da Mon Sep 17 00:00:00 2001
From: ctih <78687256+ctih1@users.noreply.github.com>
Date: Mon, 6 Jan 2025 11:55:55 +0200
Subject: [PATCH 1/2] Fixed issues with creating a model, and added progress
 indicators

---
 customcommands/tf.py | 99 +++++++++++++++++++++++++++++++-------------
 1 file changed, 70 insertions(+), 29 deletions(-)

diff --git a/customcommands/tf.py b/customcommands/tf.py
index 9f74093..8043f57 100644
--- a/customcommands/tf.py
+++ b/customcommands/tf.py
@@ -6,7 +6,10 @@ import numpy as np
 import json
 from time import strftime, localtime
 import pickle
+import functools
 import re
+import time
+import asyncio
 
 ready: bool = True
 MODEL_MATCH_STRING = "[0-9]{2}_[0-9]{2}_[0-9]{4}-[0-9]{2}_[0-9]{2}"
@@ -30,6 +33,34 @@ except ImportError:
     ))
     ready = False
 
+class TFCallback(keras.callbacks.Callback):
+    def __init__(self,bot, progress_embed:discord.Embed, message):
+        self.embed:discord.Embed = progress_embed
+        self.bot:commands.Bot = bot
+        self.message = message
+        self.times:List[float] = [time.time()]
+
+    def on_train_begin(self, logs=None):
+        pass
+
+    async def send_message(self,message:str, description:str, **kwargs):
+        if "epoch" in kwargs:
+            self.times.append(time.time())
+            average_epoch_time:float = np.average(np.diff(np.array(self.times)))
+            description = f"ETA: {round(average_epoch_time)}s"
+        self.embed.add_field(name=f" - {message}",value=description,inline=False)
+        await self.message.edit(embed=self.embed)
+
+    def on_train_end(self,logs=None):
+        self.bot.loop.create_task(self.send_message("Training stopped", "training has been stopped."))
+
+    def on_epoch_begin(self, epoch, logs=None):
+        self.bot.loop.create_task(self.send_message(f"Starting epoch {epoch}","This might take a while", epoch=True))
+
+    def on_epoch_end(self, epoch, logs=None):
+        self.bot.loop.create_task(self.send_message(f"Epoch {epoch} ended",f"Accuracy: {round(logs.get('accuracy',0.0),4)}"))
+
+
 class Ai:
     def __init__(self):
         model_path = settings.get("model_path")
@@ -39,10 +70,7 @@ class Ai:
         self.batch_size = 64
 
     def get_model_name_from_path(self,path:str):
-        print(path)
         match:re.Match = re.search(MODEL_MATCH_STRING, path)
-
-        print(match.start)
         return path[match.start():][:match.end()]
 
     def generate_model_name(self) -> str:
@@ -96,7 +124,11 @@ class Ai:
         model_path:str = settings.get("model_path")
         if model_path:
             self.model = self.__load_model(model_path)
-
+            self.is_loaded = True
+
+    async def run_async(self,func,bot,*args,**kwargs):
+        func = functools.partial(func,*args,**kwargs)
+        return await bot.loop.run_in_executor(None,func)
 
 class Learning(Ai):
     def __init__(self):
@@ -117,7 +149,8 @@ class Learning(Ai):
 
         return x,y, tokenizer
 
-    def create_model(self,memory: List[str], iters:int=2):
+    def create_model(self,memory: list, iters:int=2):
+        memory = memory[:2000]
         X,y,tokenizer = self.__generate_labels_and_inputs(memory)
         maxlen:int = max([len(x) for x in X])
         x_pad = pad_sequences(X, maxlen=maxlen, padding="pre")
@@ -130,8 +163,10 @@ class Learning(Ai):
         model.add(Dense(VOCAB_SIZE, activation="softmax"))
 
         model.compile(optimizer="adam", loss="sparse_categorical_crossentropy", metrics=["accuracy"])
-        history = model.fit(x_pad, y, epochs=iters, batch_size=32)
+        history = model.fit(x_pad, y, epochs=iters, batch_size=64, callbacks=[tf_callback])
         self.save_model(model, tokenizer, history)
+        return
+
 
     def add_training(self,memory: List[str], iters:int=2):
         tokenizer_path = os.path.join(settings.get("model_path"),"tokenizer.pkl")
@@ -144,8 +179,9 @@ class Learning(Ai):
         x_pad = pad_sequences(X, maxlen=maxlen, padding="pre")
         y = np.array(y)
 
-        history = self.model.fit(x_pad,y, epochs=iters, validation_data=(x_pad,y), batch_size=64) # Idelaly, validation data would be seperate from the actual data
+        history = self.model.fit(x_pad,y, epochs=iters, validation_data=(x_pad,y), batch_size=64, callbacks=[tf_callback]) # Ideally, validation data would be separate from the actual data
         self.save_model(self.model,tokenizer,history,self.get_model_name_from_path(settings.get("model_path")))
+        return
 
 class Generation(Ai):
     def __init__(self):
@@ -173,16 +209,16 @@ class Generation(Ai):
 
 VOCAB_SIZE = 100_000
 
-
 
 SETTINGS_TYPE = TypedDict("SETTINGS_TYPE", {
     "model_path":str, # path to the base folder of the model, aka .../models/05-01-2025-22_31/
     "tokenizer_path":str,
 })
-
+tf_callback:TFCallback
 
 model_dropdown_items = []
 settings: SETTINGS_TYPE = {}
+target_message:int
 learning:Learning
 generation: Generation
 
@@ -236,27 +272,15 @@ class DropdownView(discord.ui.View):
         self.add_item(Dropdown(models))
 
 
-class Tf(commands.Cog):
-    @staticmethod
-    def needs_ready(func):
-        def inner(args:tuple, kwargs:dict):
-            if not ready:
-                raise AttributeError("Not ready!")
-            a = func(*args, **kwargs)
-            return a
-        return inner
-
-
+class Tf(commands.Cog):
     def __init__(self,bot):
-        global learning, generation
-        global ready
+        global learning, generation, ready
        os.makedirs(os.path.join(".","models"),exist_ok=True)
         Settings().load()
         self.bot = bot
         learning = Learning()
         generation = Generation()
-
 
     @commands.command()
     async def start(self,ctx):
         await ctx.defer()
@@ -268,19 +292,36 @@ class Tf(commands.Cog):
         await ctx.send(generation.generate_sentence(word_amount,seed))
 
     @commands.command()
-    async def create(self,ctx):
+    async def create(self,ctx:commands.Context, epochs:int=3):
+        global tf_callback
         await ctx.defer()
         with open("memory.json","r") as f:
             memory:List[str] = json.load(f)
-        learning.create_model(memory) # TODO: CHANGE
-        await ctx.send("Trained succesfully!")
+        await ctx.send("Initializing tensorflow")
+        embed = discord.Embed(title="Creating a model...", description="Progress of creating a model")
+        embed.set_footer(text="Note: Progress tracking might report delayed / wrong data, since the function is run asynchronously")
+        target_message:discord.Message = await ctx.send(embed=embed)
+
+        tf_callback = TFCallback(self.bot,embed,target_message)
+        await learning.run_async(learning.create_model,self.bot,memory,epochs)
+        embed = target_message.embeds[0]
+        embed.add_field(name=f" Finished",value="Model saved.")
+        await target_message.edit(embed=embed)
+
 
 
     @commands.command()
-    async def train(self,ctx):
+    async def train(self,ctx, epochs:int=2):
+        global tf_callback
+        await ctx.defer()
         with open("memory.json","r") as f:
             memory:List[str] = json.load(f)
-        learning.add_training(memory,2)
+
+        embed = discord.Embed(title="Training model...", description="Progress of training model")
+        target_message = await ctx.send(embed=embed)
+        tf_callback = TFCallback(self.bot,embed,target_message)
+
+        await learning.run_async(learning.add_training,self.bot,memory,epochs)
         await ctx.send("Finished!")
 
     @commands.command()
@@ -296,4 +337,4 @@ class Tf(commands.Cog):
         generation.reload_model()
 
 async def setup(bot):
-    await bot.add_cog(Tf(bot))
\ No newline at end of file
+    await bot.add_cog(Tf(bot))

From 65190d791ed02000441f8bdfb3882ea5f7d0904f Mon Sep 17 00:00:00 2001
From: ctih <78687256+ctih1@users.noreply.github.com>
Date: Mon, 6 Jan 2025 12:01:55 +0200
Subject: [PATCH 2/2] Fixed python ver

---
 customcommands/README.md | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/customcommands/README.md b/customcommands/README.md
index 05a4ac0..f85f562 100644
--- a/customcommands/README.md
+++ b/customcommands/README.md
@@ -9,4 +9,4 @@ by PowerPCFan
 by expect
 
 [TensorFlow integration](https://github.com/WhatDidYouExpect/goober/blob/main/customcommands/tf.py)
-by SuperSilly2 (requires Python 3.11, tensorflow-metal/tensorflow-gpu and tensorflow/tensorflow-macos)
+by SuperSilly2 (requires Python 3.7 - 3.10, tensorflow-metal/tensorflow-gpu and tensorflow/tensorflow-macos)
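
Editor's sketch (not part of either patch): a minimal, self-contained example of the progress-reporting idea the first patch wires up through TFCallback and Ai.run_async -- a Keras callback that times epochs and pushes status text to an asyncio event loop while the blocking model.fit() call runs in an executor thread. The names ProgressCallback and report(), and the toy model/data, are invented for illustration, and the cross-thread hand-off deliberately uses asyncio.run_coroutine_threadsafe rather than loop.create_task; treat it as a hedged illustration of the pattern, not as the patch's implementation.

# Illustrative only -- assumptions noted above.
import asyncio
import time

import numpy as np
from tensorflow import keras


class ProgressCallback(keras.callbacks.Callback):
    """Reports epoch progress to an asyncio loop that lives in another thread."""

    def __init__(self, loop: asyncio.AbstractEventLoop, report):
        self.loop = loop      # the bot's event loop (main thread)
        self.report = report  # async callable taking a status string
        self.times = [time.time()]

    def on_epoch_begin(self, epoch, logs=None):
        # Rough per-epoch ETA from the gaps between epoch starts, like TFCallback.
        self.times.append(time.time())
        eta = float(np.average(np.diff(self.times)))
        # fit() runs in a worker thread here, so hand the coroutine to the loop
        # with run_coroutine_threadsafe instead of calling create_task directly.
        asyncio.run_coroutine_threadsafe(
            self.report(f"Epoch {epoch} starting, ~{eta:.1f}s per epoch"), self.loop)

    def on_epoch_end(self, epoch, logs=None):
        accuracy = (logs or {}).get("accuracy", 0.0)
        asyncio.run_coroutine_threadsafe(
            self.report(f"Epoch {epoch} done, accuracy {accuracy:.4f}"), self.loop)


async def main():
    async def report(text: str):
        print(text)  # a Discord cog would edit an embed here instead

    # Tiny invented dataset and model so the sketch runs end to end.
    x = np.random.rand(256, 8).astype("float32")
    y = np.random.randint(0, 2, size=(256,))
    model = keras.Sequential([
        keras.layers.Dense(16, activation="relu"),
        keras.layers.Dense(2, activation="softmax"),
    ])
    model.compile(optimizer="adam", loss="sparse_categorical_crossentropy",
                  metrics=["accuracy"])

    loop = asyncio.get_running_loop()
    callback = ProgressCallback(loop, report)
    # Same shape as Ai.run_async: push the blocking fit() call into an executor.
    await loop.run_in_executor(
        None, lambda: model.fit(x, y, epochs=3, verbose=0, callbacks=[callback]))


if __name__ == "__main__":
    asyncio.run(main())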