Files
t6_mem0/mem0/vector_stores/configs.py
2024-08-03 21:48:27 +05:30

108 lines
4.2 KiB
Python

from typing import Any, Optional

from chromadb.api.client import Client as ChromaDbClient
from pydantic import BaseModel, ConfigDict, Field, field_validator, model_validator
from qdrant_client import QdrantClient
def create_default_config(provider: str):
    """Build the out-of-the-box configuration object for a vector store.

    Args:
        provider: Name of the vector store backend. Only ``"qdrant"`` and
            ``"chromadb"`` are recognised.

    Returns:
        A ``QdrantConfig`` or ``ChromaDbConfig`` pointing at a local
        directory under ``/tmp``.

    Raises:
        ValueError: If ``provider`` is not one of the recognised names.
    """
    # Guard-clause layout: each recognised provider returns immediately, so
    # falling off the end means the provider is unknown.
    if provider == "qdrant":
        return QdrantConfig(path="/tmp/qdrant")
    if provider == "chromadb":
        return ChromaDbConfig(path="/tmp/chromadb")
    raise ValueError(f"Unsupported vector store provider: {provider}")
class QdrantConfig(BaseModel):
    """Connection and collection settings for a Qdrant vector store.

    The raw input must identify a Qdrant instance in at least one way:
    an existing ``client``, a local ``path``, a ``host``/``port`` pair, or a
    ``url``/``api_key`` pair.
    """

    # QdrantClient is not a Pydantic-aware type, so arbitrary types must be
    # allowed. ``model_config`` is the Pydantic v2 form of the deprecated
    # v1-style inner ``class Config``.
    model_config = ConfigDict(arbitrary_types_allowed=True)

    collection_name: str = Field("mem0", description="Name of the collection")
    embedding_model_dims: Optional[int] = Field(1536, description="Dimensions of the embedding model")
    client: Optional[QdrantClient] = Field(None, description="Existing Qdrant client instance")
    host: Optional[str] = Field(None, description="Host address for Qdrant server")
    port: Optional[int] = Field(None, description="Port for Qdrant server")
    path: Optional[str] = Field("/tmp/qdrant", description="Path for local Qdrant database")
    url: Optional[str] = Field(None, description="Full URL for Qdrant server")
    api_key: Optional[str] = Field(None, description="API key for Qdrant server")

    @model_validator(mode="before")
    @classmethod
    def check_host_port_or_path(cls, values: Any) -> Any:
        """Reject input that does not say how to reach a Qdrant instance.

        This runs on the raw input, before field defaults are applied, so the
        default value of ``path`` does not satisfy the check by itself.

        Args:
            values: Raw data handed to the model. Usually a dict, but a
                "before" validator may receive any object.

        Returns:
            ``values`` unchanged.

        Raises:
            ValueError: If a dict input supplies none of ``client``, ``path``,
                ``host`` + ``port`` or ``url`` + ``api_key``.
        """
        # Non-dict input (e.g. an existing model instance) has no ``.get``;
        # hand it back and let Pydantic's own validation accept or reject it.
        if not isinstance(values, dict):
            return values

        # An already-built client is taken as sufficient on its own
        # (presumably the store uses it directly - confirm against the
        # Qdrant store implementation).
        if values.get("client") is not None:
            return values

        has_local_path = bool(values.get("path"))
        has_host_and_port = bool(values.get("host") and values.get("port"))
        has_url_and_key = bool(values.get("url") and values.get("api_key"))
        if not (has_local_path or has_host_and_port or has_url_and_key):
            raise ValueError(
                "Either 'host' and 'port' or 'url' and 'api_key' or 'path' must be provided."
            )
        return values
class ChromaDbConfig(BaseModel):
    """Connection and collection settings for a ChromaDB vector store.

    The raw input must identify a database in at least one way: an existing
    ``client``, a local ``path``, or a ``host``/``port`` pair.
    """

    # The ChromaDB client is not a Pydantic-aware type, so arbitrary types
    # must be allowed. ``model_config`` is the Pydantic v2 form of the
    # deprecated v1-style inner ``class Config``.
    model_config = ConfigDict(arbitrary_types_allowed=True)

    collection_name: str = Field("mem0", description="Default name for the collection")
    client: Optional[ChromaDbClient] = Field(None, description="Existing ChromaDB client instance")
    path: Optional[str] = Field(None, description="Path to the database directory")
    host: Optional[str] = Field(None, description="Database connection remote host")
    # NOTE(review): port is declared as ``str`` here but ``int`` in
    # QdrantConfig; Pydantic v2 does not coerce int -> str, so ``port=8000``
    # is rejected. Confirm which type the ChromaDB client expects.
    port: Optional[str] = Field(None, description="Database connection remote port")

    @model_validator(mode="before")
    @classmethod
    def check_host_port_or_path(cls, values: Any) -> Any:
        """Reject input that does not say how to reach a ChromaDB database.

        This runs on the raw input, before field defaults are applied.

        Args:
            values: Raw data handed to the model. Usually a dict, but a
                "before" validator may receive any object.

        Returns:
            ``values`` unchanged.

        Raises:
            ValueError: If a dict input supplies none of ``client``, ``path``
                or ``host`` + ``port``.
        """
        # Non-dict input (e.g. an existing model instance) has no ``.get``;
        # hand it back and let Pydantic's own validation accept or reject it.
        if not isinstance(values, dict):
            return values

        # An already-built client is taken as sufficient on its own
        # (presumably the store uses it directly - confirm against the
        # ChromaDB store implementation).
        if values.get("client") is not None:
            return values

        has_local_path = bool(values.get("path"))
        has_host_and_port = bool(values.get("host") and values.get("port"))
        if not (has_local_path or has_host_and_port):
            raise ValueError("Either 'host' and 'port' or 'path' must be provided.")
        return values
class VectorStoreConfig(BaseModel):
    """Top-level vector store selection: a provider name plus its settings.

    ``config`` is declared as an optional dict, but after validation it holds
    a ``QdrantConfig`` or ``ChromaDbConfig`` instance when ``provider`` is
    ``"qdrant"`` or ``"chromadb"``. A dict supplied for any other provider is
    kept as a plain dict.
    """

    provider: str = Field(
        description="Provider of the vector store (e.g., 'qdrant', 'chromadb', 'elasticsearch')",
        default="qdrant",
    )
    config: Optional[dict] = Field(
        description="Configuration for the specific vector store",
        default=None,
    )

    @staticmethod
    def _build_config(provider: Any, config: Any) -> Any:
        """Turn ``config`` into the provider-specific config object when possible.

        Shared by both validators so the conversion rules live in one place.

        Args:
            provider: Provider name; may be ``None`` if it failed validation.
            config: ``None``, a raw settings dict, or an already-built object.

        Returns:
            The provider's default config when ``config`` is ``None``; a
            ``QdrantConfig``/``ChromaDbConfig`` built from a dict for those
            providers; otherwise ``config`` unchanged.

        Raises:
            ValueError: If ``config`` is ``None`` and the provider has no
                default configuration.
        """
        if config is None:
            return create_default_config(provider)
        if not isinstance(config, dict):
            return config
        # Build a new dict instead of writing into the one we were given;
        # keys present in ``config`` override the default path.
        if provider == "qdrant":
            return QdrantConfig(**{"path": "/tmp/qdrant", **config})
        if provider == "chromadb":
            return ChromaDbConfig(**{"path": "/tmp/chromadb", **config})
        # No dedicated model for this provider: pass the dict through as-is.
        return config

    @field_validator("config")
    @classmethod
    def validate_config(cls, v: Any, info: Any) -> Any:
        """Convert an explicitly supplied ``config`` for the chosen provider.

        Args:
            v: The validated ``config`` value (``None`` or a dict).
            info: Pydantic validation info; ``info.data`` holds the fields
                validated so far, including ``provider``.

        Returns:
            The converted configuration (see ``_build_config``).
        """
        return cls._build_config(info.data.get("provider"), v)

    @model_validator(mode="after")
    def ensure_config_type(self) -> "VectorStoreConfig":
        """Guarantee ``config`` is populated once the model is validated.

        Field validators do not run for omitted fields that fall back to
        their default, so the default for a missing ``config`` is filled in
        here.

        Returns:
            The validated instance, as required of "after" model validators.

        Raises:
            ValueError: If ``config`` ends up as something other than a dict,
                ``QdrantConfig`` or ``ChromaDbConfig``, or if no default
                exists for the provider.
        """
        resolved = self._build_config(self.provider, self.config)
        if not isinstance(resolved, (dict, QdrantConfig, ChromaDbConfig)):
            raise ValueError(f"Invalid config type for provider {self.provider}")
        self.config = resolved
        return self