Improve multimodal functionality (#2297)

This commit is contained in:
Dev Khant
2025-03-10 23:33:18 +05:30
committed by GitHub
parent e9a0be66d8
commit 9c0954133f
4 changed files with 123 additions and 26 deletions

View File

@@ -115,7 +115,10 @@ class Memory(MemoryBase):
if isinstance(messages, str):
messages = [{"role": "user", "content": messages}]
-messages = parse_vision_messages(messages)
+if self.config.llm.config.get("enable_vision"):
+messages = parse_vision_messages(messages, self.llm, self.config.llm.config.get("vision_details"))
+else:
+messages = parse_vision_messages(messages)
with concurrent.futures.ThreadPoolExecutor() as executor:
future1 = executor.submit(self._add_to_vector_store, messages, metadata, filters)