272 lines
14 KiB
Python
272 lines
14 KiB
Python
import os
|
|
import json
|
|
import logging
|
|
from anthropic import Anthropic, APIError, RateLimitError
|
|
from base_telegram_inference_bot import BaseTelegramInferenceBot
|
|
from telegram_helper import TelegramHelper # Used in main, not class
|
|
|
|
class AnthropicTelegramInferenceBot(BaseTelegramInferenceBot):
|
|
DEFAULT_SMALL_MODEL_NAME = "claude-3-haiku-20240307"
|
|
DEFAULT_SMALL_MODEL_MAX_TOKENS = "2048"
|
|
DEFAULT_LARGE_MODEL_NAME = "claude-3-opus-20240229"
|
|
DEFAULT_LARGE_MODEL_MAX_TOKENS = "4096"
|
|
|
|
def __init__(
|
|
self,
|
|
anthropic_client: Anthropic | None = None,
|
|
api_key: str | None = None,
|
|
small_model_name: str | None = None,
|
|
small_model_max_tokens: str | None = None,
|
|
large_model_name: str | None = None,
|
|
large_model_max_tokens: str | None = None,
|
|
system_prompt_content: str | None = None,
|
|
system_prompt_path: str | None = None
|
|
):
|
|
super().__init__(system_prompt_content=system_prompt_content, system_prompt_path=system_prompt_path)
|
|
|
|
if anthropic_client:
|
|
self.anthropic_client = anthropic_client
|
|
else:
|
|
_api_key = api_key or os.environ.get("ANTHROPIC_API_KEY")
|
|
if not _api_key:
|
|
raise ValueError("Anthropic API key must be provided either via argument or ANTHROPIC_API_KEY environment variable.")
|
|
self.anthropic_client = Anthropic(api_key=_api_key)
|
|
|
|
self.small_model_name = small_model_name or os.environ.get("ANTHROPIC_SMALL_MODEL") or self.DEFAULT_SMALL_MODEL_NAME
|
|
self.small_model_max_tokens_str = small_model_max_tokens or os.environ.get("ANTHROPIC_SMALL_MODEL_MAX_TOKENS") or self.DEFAULT_SMALL_MODEL_MAX_TOKENS
|
|
self.large_model_name = large_model_name or os.environ.get("ANTHROPIC_LARGE_MODEL") or self.DEFAULT_LARGE_MODEL_NAME
|
|
self.large_model_max_tokens_str = large_model_max_tokens or os.environ.get("ANTHROPIC_LARGE_MODEL_MAX_TOKENS") or self.DEFAULT_LARGE_MODEL_MAX_TOKENS
|
|
|
|
# Initialize with the small model by default
|
|
self._configure_model_and_tokens(
|
|
self.small_model_name,
|
|
self.small_model_max_tokens_str,
|
|
default_max_tokens=int(self.DEFAULT_SMALL_MODEL_MAX_TOKENS) # pass int for default
|
|
)
|
|
|
|
def _configure_model_and_tokens(self, model_name: str, max_tokens_str: str, default_max_tokens: int = 2048):
|
|
self.model = model_name
|
|
try:
|
|
self.max_tokens = int(max_tokens_str) if max_tokens_str is not None else default_max_tokens
|
|
except ValueError:
|
|
logging.error(f"Invalid value for Anthropic max_tokens: {max_tokens_str}. Using default {default_max_tokens}.")
|
|
self.max_tokens = default_max_tokens
|
|
logging.info(f"Configured to use Anthropic model: {self.model} with max_tokens: {self.max_tokens}")
|
|
|
|
def get_llm_description(self) -> str:
|
|
return f"LLM: {self.model}, Max Tokens: {self.max_tokens}"
|
|
|
|
def get_chat_response(self, messages_history):
|
|
current_system_prompt = self.system_prompt if self.system_prompt else ""
|
|
anthropic_tools = []
|
|
if hasattr(self, 'functions') and self.functions:
|
|
anthropic_tools = [
|
|
{
|
|
"name": function['function']['name'],
|
|
"description": function['function']['description'],
|
|
"input_schema": function['function']['parameters'] if function['function']['parameters'] not in [None, {}] else {"type": "object", "properties": {}}
|
|
}
|
|
for function in self.functions
|
|
]
|
|
|
|
try:
|
|
response = self.anthropic_client.messages.create(
|
|
model=self.model,
|
|
system=current_system_prompt,
|
|
messages=messages_history,
|
|
max_tokens=self.max_tokens,
|
|
tools=anthropic_tools if anthropic_tools else None,
|
|
tool_choice={"type": "auto"} if anthropic_tools else None
|
|
)
|
|
return response
|
|
except (APIError, RateLimitError) as e:
|
|
logging.error(f"Anthropic API error: {e}")
|
|
raise
|
|
except Exception as e:
|
|
logging.error(f"An unexpected error occurred during Anthropic API call: {e}")
|
|
raise
|
|
|
|
def _format_tool_response_for_anthropic(self, tool_response_data):
|
|
if isinstance(tool_response_data, str):
|
|
# Wrap plain string in a list of text blocks if not already structured
|
|
return [{"type": "text", "text": tool_response_data}]
|
|
elif isinstance(tool_response_data, list) and all(isinstance(item, dict) and "type" in item for item in tool_response_data):
|
|
# Already a list of content blocks
|
|
return tool_response_data
|
|
elif isinstance(tool_response_data, (dict, list)):
|
|
# Attempt to JSON dump other dicts/lists if not already in content block format
|
|
try:
|
|
return [{"type": "text", "text": json.dumps(tool_response_data)}]
|
|
except (TypeError, json.JSONDecodeError):
|
|
return [{"type": "text", "text": str(tool_response_data)}] # Fallback to string
|
|
else:
|
|
# Fallback for other types (int, float, etc.)
|
|
return [{"type": "text", "text": str(tool_response_data)}]
|
|
|
|
async def handle_message(self, user_id, user_message):
|
|
if user_id not in self.conversation_history:
|
|
self.conversation_history[user_id] = []
|
|
|
|
self.conversation_history[user_id].append({"role": "user", "content": user_message})
|
|
current_turn_messages = list(self.conversation_history[user_id])
|
|
|
|
MAX_TOOL_ITERATIONS = 5
|
|
tool_use_count = 0
|
|
assistant_response_content = ""
|
|
|
|
while tool_use_count < MAX_TOOL_ITERATIONS:
|
|
response = self.get_chat_response(current_turn_messages)
|
|
|
|
if not response or not response.content:
|
|
logging.error("No valid response content from Anthropic LLM.")
|
|
self.conversation_history[user_id] = current_turn_messages # Save current state
|
|
return "Error: Could not get a valid response from the LLM."
|
|
|
|
assistant_current_turn_content_blocks = response.content
|
|
current_turn_messages.append({"role": "assistant", "content": assistant_current_turn_content_blocks})
|
|
|
|
text_parts_from_assistant = []
|
|
tool_calls_from_response = []
|
|
for block in assistant_current_turn_content_blocks:
|
|
if block.type == "text":
|
|
text_parts_from_assistant.append(block.text)
|
|
elif block.type == "tool_use":
|
|
tool_calls_from_response.append(block)
|
|
|
|
assistant_response_content = "".join(text_parts_from_assistant)
|
|
|
|
if not tool_calls_from_response:
|
|
break
|
|
|
|
tool_results_for_model = []
|
|
for tool_call in tool_calls_from_response:
|
|
tool_name = tool_call.name
|
|
tool_input = tool_call.input
|
|
tool_use_id = tool_call.id
|
|
|
|
logging.info(f"Attempting to call Anthropic tool: {tool_name} with input: {tool_input}")
|
|
try:
|
|
tool_response_data = self.call_tool(tool_name, tool_input)
|
|
tool_result_content_block = self._format_tool_response_for_anthropic(tool_response_data)
|
|
tool_results_for_model.append({
|
|
"type": "tool_result",
|
|
"tool_use_id": tool_use_id,
|
|
"content": tool_result_content_block
|
|
})
|
|
except Exception as e:
|
|
logging.error(f"Error calling tool {tool_name}: {e}")
|
|
tool_results_for_model.append({
|
|
"type": "tool_result",
|
|
"tool_use_id": tool_use_id,
|
|
"content": [{"type": "text", "text": f"Error executing tool {tool_name}: {str(e)}"}],
|
|
"is_error": True
|
|
})
|
|
|
|
current_turn_messages.append({"role": "user", "content": tool_results_for_model}) # Anthropic expects tool results as a user message
|
|
|
|
tool_use_count += 1
|
|
if tool_use_count >= MAX_TOOL_ITERATIONS:
|
|
logging.warning(f"Max tool iterations ({MAX_TOOL_ITERATIONS}) reached for Anthropic.")
|
|
# Update assistant_response_content with any text from the last assistant turn before breaking
|
|
if not assistant_response_content and text_parts_from_assistant:
|
|
assistant_response_content = "".join(text_parts_from_assistant)
|
|
assistant_response_content += "\n[Max tool iterations reached]"
|
|
break
|
|
|
|
self.conversation_history[user_id] = current_turn_messages
|
|
|
|
if len(self.conversation_history[user_id]) > 20:
|
|
self.conversation_history[user_id] = self.conversation_history[user_id][-20:]
|
|
|
|
if assistant_response_content:
|
|
return assistant_response_content
|
|
else:
|
|
# Fallback if no text parts were found but there was an assistant message
|
|
if current_turn_messages:
|
|
last_message_in_turn = current_turn_messages[-1]
|
|
# Check if the last message content has text blocks (Anthropic specific structure)
|
|
if last_message_in_turn.get("role") == "assistant" and isinstance(last_message_in_turn.get("content"), list):
|
|
for block in reversed(last_message_in_turn["content"]):
|
|
if block.type == "text" and hasattr(block, 'text') and block.text:
|
|
return block.text # Return the first non-empty text found from the end
|
|
return "No textual response generated by the assistant after processing." # More informative default
|
|
|
|
async def start(self):
|
|
logging.info("Anthropic Bot started")
|
|
|
|
# clear_conversation_history is inherited from BaseTelegramInferenceBot and calls super().clear_conversation_history
|
|
# No need to override if the base implementation is sufficient, unless specific logging is needed.
|
|
# async def clear_conversation_history(self, user_id):
|
|
# super().clear_conversation_history(user_id)
|
|
# logging.info(f"Cleared conversation history for Anthropic bot, user {user_id}")
|
|
|
|
async def abort_processing(self, user_id):
|
|
# This abort is a soft abort, as actual Anthropic API call is synchronous within handle_message
|
|
# It primarily clears state and prevents further processing in the bot's loop if any.
|
|
if user_id in self.processing_status:
|
|
self.processing_status[user_id]["processing"] = False # Mark as not processing
|
|
# self.clear_processing_status(user_id) # Use base class method to remove entry
|
|
# Clearing history might be too aggressive for a simple abort, depends on desired UX
|
|
# For now, let's just stop processing and clear the flag.
|
|
# Consider if conversation history should be cleared here or if that is a separate user action.
|
|
# super().clear_conversation_history(user_id) # Moved to be less aggressive
|
|
logging.info(f"Abort requested for user {user_id}. Processing flag cleared.")
|
|
return "Processing aborted. You can send a new message or /clear the conversation."
|
|
|
|
async def switch_model(self):
|
|
if not self.small_model_name or not self.large_model_name:
|
|
logging.warning("Small or Large model names for Anthropic are not defined. Cannot switch model.")
|
|
return f"Model switching not fully configured. Currently using {self.model}."
|
|
|
|
current_is_small = self.model == self.small_model_name
|
|
current_is_large = self.model == self.large_model_name
|
|
|
|
if current_is_small:
|
|
target_model = self.large_model_name
|
|
target_max_tokens_str = self.large_model_max_tokens_str
|
|
default_target_max_tokens = int(self.DEFAULT_LARGE_MODEL_MAX_TOKENS)
|
|
elif current_is_large:
|
|
target_model = self.small_model_name
|
|
target_max_tokens_str = self.small_model_max_tokens_str
|
|
default_target_max_tokens = int(self.DEFAULT_SMALL_MODEL_MAX_TOKENS)
|
|
else:
|
|
logging.warning(f"Current model {self.model} is unrecognized. Switching to default small model.")
|
|
target_model = self.small_model_name
|
|
target_max_tokens_str = self.small_model_max_tokens_str
|
|
default_target_max_tokens = int(self.DEFAULT_SMALL_MODEL_MAX_TOKENS)
|
|
|
|
self._configure_model_and_tokens(target_model, target_max_tokens_str, default_max_tokens=default_target_max_tokens)
|
|
logging.info(f"Switched Anthropic model to: {self.model}")
|
|
return f"Switched to Anthropic model: {self.model} (Max Tokens: {self.max_tokens})"
|
|
|
|
|
|
# The main function is for standalone execution and basic testing, not part of the class itself.
|
|
# It's good practice to update it to reflect changes if you use it for quick tests.
|
|
# For unit tests, we'll instantiate the class with mocked dependencies.
|
|
def main():
|
|
logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(name)s - %(levelname)s - %(message)s')
|
|
|
|
# Example of how to instantiate with new constructor (assuming API key is in ENV for this example)
|
|
# For real tests, you'd mock Anthropic() or pass a mock client.
|
|
try:
|
|
# These would typically come from a config file or CLI args in a real app if not ENV
|
|
# For this example, we rely on ENV or defaults being handled by constructor if not provided.
|
|
bot = AnthropicTelegramInferenceBot(
|
|
api_key=os.environ.get("ANTHROPIC_API_KEY") # Explicitly pass, or let constructor handle ENV
|
|
)
|
|
except ValueError as e:
|
|
logging.error(f"Failed to initialize bot: {e}")
|
|
return
|
|
except Exception as e: # Catch any other init errors
|
|
logging.error(f"An unexpected error occurred during bot initialization: {e}")
|
|
return
|
|
|
|
# TelegramHelper also updated, ensure it's instantiated correctly for this main context.
|
|
# For this basic main, we might not pass all configurable paths to TelegramHelper,
|
|
# letting them use defaults.
|
|
telegram_helper = TelegramHelper(bot)
|
|
telegram_helper.run()
|
|
|
|
if __name__ == '__main__':
|
|
main()
|