当前位置：首页 > article >正文

构建一个文档助手Agent：提升知识管理效率的实践

article 2025/2/4 1:54:33

在上一篇文章中,我们讨论了如何构建一个数据分析Agent。今天,我想分享另一个实际项目:如何构建一个文档助手Agent。这个项目源于我们一个技术团队的真实需求 - 提升文档管理效率,加强知识沉淀。

从团队痛点说起

记得和技术团队讨论时的场景：

小王：我们的文档太分散了,找起来很费劲
小李：是啊,而且很多文档都过时了,不知道该信哪个
我：主要是哪些类型的文档？
小王：技术方案、API文档、使用手册这些
我：这些场景很适合用AI Agent来管理

经过需求分析,我们确定了几个核心功能：

智能文档检索
自动文档更新
知识图谱构建
问答系统集成

技术方案设计

首先是整体架构：

from typing import List, Dict, Any, Optional
from enum import Enum
from pydantic import BaseModel
import asyncio

class DocumentTask(Enum):
    SEARCH = "search"
    UPDATE = "update"
    KNOWLEDGE = "knowledge"
    QA = "qa"

class DocumentContext(BaseModel):
    query: str
    doc_type: str
    language: str
    user_role: str
    history: List[Dict[str, str]]

class DocumentAssistant:
    def __init__(
        self,
        config: Dict[str, Any]
    ):
        # 1. 初始化文档模型
        self.doc_model = DocumentLLM(
            model="gpt-4",
            temperature=0.3,
            context_length=8000
        )

        # 2. 初始化知识库
        self.knowledge_base = VectorStore(
            embeddings=TextEmbeddings(),
            collection="doc_knowledge"
        )

        # 3. 初始化工具集
        self.tools = {
            "indexer": DocumentIndexer(),
            "updater": DocumentUpdater(),
            "grapher": KnowledgeGrapher(),
            "qa": QASystem()
        }

    async def process_request(
        self,
        context: DocumentContext
    ) -> Dict[str, Any]:
        # 1. 理解用户意图
        intent = await self._understand_intent(
            context
        )

        # 2. 准备相关知识
        knowledge = await self._prepare_knowledge(
            intent,
            context
        )

        # 3. 生成处理方案
        plan = await self._generate_plan(
            intent,
            knowledge
        )

        # 4. 执行任务
        result = await self._execute_task(
            plan,
            context
        )

        return result

    async def _understand_intent(
        self,
        context: DocumentContext
    ) -> Dict[str, Any]:
        # 1. 分析查询意图
        query_intent = await self.doc_model.analyze_query(
            context.query
        )

        # 2. 识别文档类型
        doc_type = await self._identify_doc_type(
            context
        )

        # 3. 确定用户需求
        requirements = await self._identify_requirements(
            context,
            query_intent
        )

        return {
            "query_intent": query_intent,
            "doc_type": doc_type,
            "requirements": requirements
        }

文档检索功能

首先实现文档检索功能：

class DocumentSearcher:
    def __init__(
        self,
        model: DocumentLLM,
        knowledge_base: VectorStore
    ):
        self.model = model
        self.knowledge_base = knowledge_base

    async def search_documents(
        self,
        context: DocumentContext
    ) -> Dict[str, Any]:
        # 1. 构建检索查询
        query = await self._build_query(
            context
        )

        # 2. 执行语义搜索
        results = await self._semantic_search(
            query
        )

        # 3. 优化搜索结果
        optimized = await self._optimize_results(
            results,
            context
        )

        return optimized

    async def _build_query(
        self,
        context: DocumentContext
    ) -> Dict[str, Any]:
        # 1. 提取关键词
        keywords = await self._extract_keywords(
            context.query
        )

        # 2. 扩展查询
        expanded = await self._expand_query(
            keywords,
            context
        )

        # 3. 添加过滤条件
        filtered = await self._add_filters(
            expanded,
            context
        )

        return filtered

    async def _semantic_search(
        self,
        query: Dict[str, Any]
    ) -> List[Dict[str, Any]]:
        # 1. 向量检索
        vector_results = await self.knowledge_base.search(
            query["vector"],
            top_k=10
        )

        # 2. 关键词匹配
        keyword_results = await self._keyword_match(
            query["keywords"]
        )

        # 3. 结果融合
        merged = await self._merge_results(
            vector_results,
            keyword_results
        )

        return merged

文档更新功能

接下来是文档更新功能：

class DocumentUpdater:
    def __init__(
        self,
        model: DocumentLLM
    ):
        self.model = model

    async def update_document(
        self,
        doc: Dict[str, Any],
        context: DocumentContext
    ) -> Dict[str, Any]:
        # 1. 检查更新需求
        needs = await self._check_update_needs(
            doc,
            context
        )

        # 2. 生成更新内容
        updates = await self._generate_updates(
            doc,
            needs
        )

        # 3. 应用更新
        updated = await self._apply_updates(
            doc,
            updates
        )

        return updated

    async def _check_update_needs(
        self,
        doc: Dict[str, Any],
        context: DocumentContext
    ) -> List[Dict[str, Any]]:
        needs = []

        # 1. 检查内容过期
        outdated = await self._check_outdated(
            doc
        )
        needs.extend(outdated)

        # 2. 检查格式问题
        format_issues = await self._check_format(
            doc
        )
        needs.extend(format_issues)

        # 3. 检查完整性
        completeness = await self._check_completeness(
            doc
        )
        needs.extend(completeness)

        return needs

    async def _generate_updates(
        self,
        doc: Dict[str, Any],
        needs: List[Dict[str, Any]]
    ) -> List[Dict[str, Any]]:
        updates = []

        for need in needs:
            # 1. 生成更新内容
            content = await self._generate_content(
                doc,
                need
            )

            # 2. 验证更新
            validated = await self._validate_update(
                content,
                doc
            )

            # 3. 格式化更新
            formatted = await self._format_update(
                validated,
                doc
            )

            updates.append(formatted)

        return updates

知识图谱功能

再来实现知识图谱功能：

class KnowledgeGrapher:
    def __init__(
        self,
        model: DocumentLLM
    ):
        self.model = model

    async def build_knowledge_graph(
        self,
        docs: List[Dict[str, Any]]
    ) -> Dict[str, Any]:
        # 1. 提取实体关系
        entities = await self._extract_entities(
            docs
        )

        # 2. 构建图谱
        graph = await self._build_graph(
            entities
        )

        # 3. 优化图谱
        optimized = await self._optimize_graph(
            graph
        )

        return optimized

    async def _extract_entities(
        self,
        docs: List[Dict[str, Any]]
    ) -> Dict[str, Any]:
        entities = {
            "concepts": [],
            "relations": []
        }

        for doc in docs:
            # 1. 提取概念
            concepts = await self._extract_concepts(
                doc
            )
            entities["concepts"].extend(concepts)

            # 2. 提取关系
            relations = await self._extract_relations(
                doc,
                concepts
            )
            entities["relations"].extend(relations)

        return entities

    async def _build_graph(
        self,
        entities: Dict[str, Any]
    ) -> Dict[str, Any]:
        # 1. 创建节点
        nodes = await self._create_nodes(
            entities["concepts"]
        )

        # 2. 创建边
        edges = await self._create_edges(
            entities["relations"]
        )

        # 3. 构建索引
        indices = await self._build_indices(
            nodes,
            edges
        )

        return {
            "nodes": nodes,
            "edges": edges,
            "indices": indices
        }

问答系统功能

最后是问答系统功能：

class QASystem:
    def __init__(
        self,
        model: DocumentLLM,
        knowledge_base: VectorStore
    ):
        self.model = model
        self.knowledge_base = knowledge_base

    async def answer_question(
        self,
        context: DocumentContext
    ) -> Dict[str, Any]:
        # 1. 理解问题
        question = await self._understand_question(
            context
        )

        # 2. 检索相关文档
        docs = await self._retrieve_documents(
            question
        )

        # 3. 生成答案
        answer = await self._generate_answer(
            question,
            docs
        )

        return answer

    async def _understand_question(
        self,
        context: DocumentContext
    ) -> Dict[str, Any]:
        # 1. 提取问题类型
        q_type = await self._identify_question_type(
            context.query
        )

        # 2. 识别关键实体
        entities = await self._extract_entities(
            context.query
        )

        # 3. 确定答案要求
        requirements = await self._identify_requirements(
            context
        )

        return {
            "type": q_type,
            "entities": entities,
            "requirements": requirements
        }

    async def _generate_answer(
        self,
        question: Dict[str, Any],
        docs: List[Dict[str, Any]]
    ) -> Dict[str, Any]:
        # 1. 提取相关段落
        passages = await self._extract_relevant_passages(
            docs,
            question
        )

        # 2. 生成答案
        answer = await self.model.generate_answer(
            question,
            passages
        )

        # 3. 添加引用
        cited = await self._add_citations(
            answer,
            passages
        )

        return cited