Fix RAG inference

This commit is contained in:
2025-08-07 15:38:01 -05:00
parent 4327e1c581
commit e504407190
9 changed files with 222 additions and 31 deletions
+8 -6
View File
@@ -97,11 +97,12 @@ class OpenAICompatibleInferenceBot(InferenceBot):
num_tokens = 0
for message in messages:
num_tokens += 4
for key, value in message.items():
if isinstance(value, str):
num_tokens += len(encoding.encode(value))
if key == "name":
num_tokens += 1
if hasattr(message, "items"):
for key, value in message.items():
if isinstance(value, str):
num_tokens += len(encoding.encode(value))
if key == "name":
num_tokens += 1
num_tokens += 2
return num_tokens
@@ -132,7 +133,8 @@ class OpenAICompatibleInferenceBot(InferenceBot):
messages=messages,
tools=cleaned_tools,
tool_choice="auto" if cleaned_tools else None,
max_tokens=self.max_tokens
max_tokens=self.max_tokens,
)
return response
except Exception as e: