Fix RAG inference
This commit is contained in:
@@ -97,11 +97,12 @@ class OpenAICompatibleInferenceBot(InferenceBot):
         num_tokens = 0
         for message in messages:
             num_tokens += 4
-            for key, value in message.items():
-                if isinstance(value, str):
-                    num_tokens += len(encoding.encode(value))
-                if key == "name":
-                    num_tokens += 1
+            if hasattr(message, "items"):
+                for key, value in message.items():
+                    if isinstance(value, str):
+                        num_tokens += len(encoding.encode(value))
+                    if key == "name":
+                        num_tokens += 1
         num_tokens += 2
         return num_tokens
 
@@ -132,7 +133,8 @@ class OpenAICompatibleInferenceBot(InferenceBot):
                 messages=messages,
                 tools=cleaned_tools,
                 tool_choice="auto" if cleaned_tools else None,
-                max_tokens=self.max_tokens
+                max_tokens=self.max_tokens,
+
             )
             return response
         except Exception as e:
Reference in New Issue
Block a user