From db009105c77bfd114807f0926bb742d4a1285574 Mon Sep 17 00:00:00 2001
From: Jonathan Lucas <bucolucas@gmail.com>
Date: Sun, 18 Aug 2024 07:35:52 -0500
Subject: [PATCH] Add ability to switch models

---
 prompts/developer_prompt.txt |  2 +-
 telegram_inference_bot.py    | 42 ++++++++++++++++++++++--------------
 2 files changed, 27 insertions(+), 17 deletions(-)

diff --git a/prompts/developer_prompt.txt b/prompts/developer_prompt.txt
index 5dcd149..e3a5c85 100644
--- a/prompts/developer_prompt.txt
+++ b/prompts/developer_prompt.txt
@@ -2,7 +2,7 @@ Imagine you're a savvy developer with a trusty toolkit, working in harmony with
 
 As you navigate the repository, keep in mind the following principles:
 
-Practicality: When updating files, consider that you're writing them in their entirety to disk. DO NOT omit code in your output.
+Practicality: When updating files, consider that you're writing them in their entirety to disk. DO NOT omit code, especially when sending to a function or tool.
 Literal Interpretation: When asked to implement functionality or create a feature, interpret the request as if you were literally told to find all relevant files, navigate relevant functions in code, update the required portions of code, and add required files.
 Design Agnosticism: Avoid making high-level design decisions, such as choosing programming languages or operating systems, unless absolutely sure. If unsure, ask before proceeding.
 Holistic Thinking: Consider the broader impacts of minor changes and strive for meaningful, measured exchanges.
diff --git a/telegram_inference_bot.py b/telegram_inference_bot.py
index f535faa..ac84025 100644
--- a/telegram_inference_bot.py
+++ b/telegram_inference_bot.py
@@ -19,22 +19,18 @@ client = OpenAI()
 GPT_4O = "gpt-4o"
 GPT_4O_MINI = "gpt-4o-mini"
 
-class StringFilter(logging.Filter):
-    def __init__(self, strings_to_filter):
-        super().__init__()
-        self.strings_to_filter = strings_to_filter
+model_max_tokens = {
+    GPT_4O: 4096,
+    GPT_4O_MINI: 16384
+}
 
-    def filter(self, record):
-        return not any(s in record.getMessage() for s in self.strings_to_filter)
-
-strings_to_filter = ['unwanted_string_1', 'unwanted_string_2']  # Change these to the specific strings you want to filter out
+use_smart_model = True
 
 # Set up logging to console and file
-logging.basicConfig(level=logging.INFO, handlers=[
+logging.basicConfig(level=logging.WARNING, handlers=[
     logging.StreamHandler(),
     logging.FileHandler('logs/output.log', mode='a')
 ])
-logging.getLogger().addFilter(StringFilter(strings_to_filter))
 
 # Set up Telegram bot
 TELEGRAM_BOT_TOKEN = os.getenv('TELEGRAM_BOT_TOKEN')
@@ -139,14 +135,14 @@ async def handle_message(update: Update, context: ContextTypes.DEFAULT_TYPE) ->
             del user_images[user_id]
         else:
             # Call OpenAI API for inference (text-only)
-            response = get_chat_response(client, messages, 4096, GPT_4O)
+            response = get_chat_response(client, messages, GPT_4O if use_smart_model else GPT_4O_MINI)
 
         # Extract the assistant's reply
         assistant_message = response.choices[0].message
         toolUseCount = 0
         if hasattr(assistant_message, 'function_call') and assistant_message.function_call:
             while hasattr(assistant_message, 'function_call') and assistant_message.function_call and toolUseCount < 50: # Todo: put amount in env
-                tool_response = call_tool(assistant_message.function_call, messages)
+                tool_response = call_tool(assistant_message.function_call)
                 
                 conversation_history[user_id].append({"role": "function", "name": assistant_message.function_call.name, "content": json.dumps(tool_response)})
                 messages.append({
@@ -156,7 +152,7 @@ async def handle_message(update: Update, context: ContextTypes.DEFAULT_TYPE) ->
                 })
 
                 # Call API again to get the final response
-                assistant_message = get_chat_response(client, messages, 4096, GPT_4O).choices[0].message
+                assistant_message = get_chat_response(client, messages, GPT_4O if use_smart_model else GPT_4O_MINI).choices[0].message
                 if not hasattr(assistant_message, 'function_call') or not assistant_message.function_call:
                     assistant_reply = assistant_message.content
                     conversation_history[user_id].append({"role": "assistant", "content": assistant_reply})
@@ -178,7 +174,7 @@ async def handle_message(update: Update, context: ContextTypes.DEFAULT_TYPE) ->
         logging.error(f"An error occurred: {str(e)}")
         await update.message.reply_text("Sorry, an error occurred while processing your request.")
 
-def call_tool(function_call, messages):
+def call_tool(function_call):
     # Execute the function
     function_name = function_call.name
     function_args = function_call.arguments
@@ -186,16 +182,28 @@ def call_tool(function_call, messages):
         if function_name in [f["name"] for f in tool.get_functions()]:
             return tool.execute(function_name, **eval(function_args))
 
-def get_chat_response(client, messages, max_tokens, model):
+def get_chat_response(client, messages, model):
     response = client.chat.completions.create(
         model=model,
         messages=messages,
         functions=functions,
         function_call="auto",
-        max_tokens=max_tokens
+        max_tokens=model_max_tokens[model]
     )
     return response
 
+def switch(update: Update, context: ContextTypes.DEFAULT_TYPE) -> None:
+    global use_smart_model
+    use_smart_model = not use_smart_model
+    model = GPT_4O if use_smart_model else GPT_4O_MINI
+    logging.info(f"Switched to model: {model}")
+    update.message.reply_text(f"Switched to model: {model}")
+
+async def status(update: Update, context: ContextTypes.DEFAULT_TYPE) -> None:
+    model = GPT_4O if use_smart_model else GPT_4O_MINI
+    await update.message.reply_text(f"Currently using model model: {model}")
+    pass
+
 def main() -> None:
     # Create the Application and pass it your bot's token
     application = Application.builder().token(TELEGRAM_BOT_TOKEN).build()
@@ -203,6 +211,8 @@ def main() -> None:
     # Add handlers
     application.add_handler(CommandHandler("start", start))
     application.add_handler(CommandHandler("clear", clear))
+    application.add_handler(CommandHandler("switch", switch))
+    application.add_handler(CommandHandler("status", status))
     application.add_handler(MessageHandler(filters.PHOTO, handle_image))
     application.add_handler(MessageHandler(filters.TEXT & ~filters.COMMAND, handle_message))