学习如何使用 MongoDB 中包含用户特定元数据的 PDF 文档来过滤知识库搜索。
from agno.agent import Agent
from agno.knowledge.pdf import PDFKnowledgeBase
from agno.utils.media import (
SampleDataFileExtension,
download_knowledge_filters_sample_data,
)
from agno.vectordb.mongodb import MongoDb
# 下载所有示例简历并获取其路径
downloaded_cv_paths = download_knowledge_filters_sample_data(
num_files=5, file_extension=SampleDataFileExtension.PDF
)
mdb_connection_string = "mongodb+srv://<username>:<password>@cluster0.mongodb.net/?retryWrites=true&w=majority"
# 步骤 1:使用文档和元数据初始化知识库
# ------------------------------------------------------------------------------
# 在初始化知识库时,我们可以附加将用于过滤的元数据
# 此元数据可以包括用户 ID、文档类型、日期或任何其他属性
knowledge_base = PDFKnowledgeBase(
path=[
{
"path": downloaded_cv_paths[0],
"metadata": {
"user_id": "jordan_mitchell",
"document_type": "cv",
"year": 2025,
},
},
{
"path": downloaded_cv_paths[1],
"metadata": {
"user_id": "taylor_brooks",
"document_type": "cv",
"year": 2025,
},
},
{
"path": downloaded_cv_paths[2],
"metadata": {
"user_id": "morgan_lee",
"document_type": "cv",
"year": 2025,
},
},
{
"path": downloaded_cv_paths[3],
"metadata": {
"user_id": "casey_jordan",
"document_type": "cv",
"year": 2025,
},
},
{
"path": downloaded_cv_paths[4],
"metadata": {
"user_id": "alex_rivera",
"document_type": "cv",
"year": 2025,
},
},
],
vector_db=MongoDb(
collection_name="filters",
db_url=mdb_connection_string,
search_index_name="filters",
),
)
# 将所有文档加载到向量数据库中
knowledge_base.load(recreate=True)
# 步骤 2:使用不同的过滤组合查询知识库
# ------------------------------------------------------------------------------
agent = Agent(
knowledge=knowledge_base,
search_knowledge=True,
)
agent.print_response(
"Tell me about Jordan Mitchell's experience and skills",
knowledge_filters={"user_id": "jordan_mitchell"},
markdown=True,
)
安装库
pip install -U agno pymongo openai
运行示例
python cookbook/agent_concepts/knowledge/filters/filtering_mongo_db.py