fix 文档管理模块 & 法规对话模块
This commit is contained in:
@@ -1,7 +1,7 @@
|
||||
"""Initialize the app.domain.documents package."""
|
||||
|
||||
from .models import Chunk, Document, DocumentStatus, ParsedDocument
|
||||
from .ports import ChunkBuilder, DocumentBinaryStore, DocumentParser, DocumentRepository
|
||||
from .ports import ChunkBuilder, DocumentBinaryStore, DocumentParser, DocumentRepository, ParseArtifactStore
|
||||
# Keep package boundaries explicit so backend imports stay predictable.
|
||||
|
||||
|
||||
@@ -14,4 +14,5 @@ __all__ = [
|
||||
"DocumentBinaryStore",
|
||||
"DocumentParser",
|
||||
"DocumentRepository",
|
||||
"ParseArtifactStore",
|
||||
]
|
||||
|
||||
@@ -31,6 +31,11 @@ class DocumentRepository(ABC):
|
||||
"""Handle list for the Document Repository instance."""
|
||||
pass
|
||||
|
||||
@abstractmethod
def delete(self, doc_id: str) -> bool:
    """Remove the document record identified by ``doc_id``.

    Returns:
        ``True`` when a record was deleted, ``False`` when no record
        with that id was found.
    """
|
||||
|
||||
@abstractmethod
|
||||
def update_status(
|
||||
self,
|
||||
@@ -94,3 +99,32 @@ class ChunkBuilder(ABC):
|
||||
) -> list[Chunk]:
|
||||
"""Handle build for the Chunk Builder instance."""
|
||||
pass
|
||||
|
||||
|
||||
class ParseArtifactStore(ABC):
    """Port for persisting a document's parse artifacts.

    The artifacts are structure nodes and semantic blocks, stored so that
    they can be used for relational queries.
    """

    @abstractmethod
    def save(self, doc_id: str, structure_nodes: list[dict], semantic_blocks: list[dict]) -> None:
        """Store the structure nodes and semantic blocks of document ``doc_id``."""

    @abstractmethod
    def delete(self, doc_id: str) -> None:
        """Delete every parse artifact belonging to document ``doc_id``."""

    @abstractmethod
    def get_semantic_blocks(self, doc_id: str) -> list[dict]:
        """Fetch all semantic blocks stored for document ``doc_id``."""

    @abstractmethod
    def get_structure_nodes(self, doc_id: str) -> list[dict]:
        """Fetch all structure nodes stored for document ``doc_id``."""
|
||||
|
||||
@@ -1,8 +1,8 @@
|
||||
"""Initialize the app.domain.retrieval package."""
|
||||
|
||||
from .models import RetrievalQuery, RetrievedChunk
|
||||
from .ports import EmbeddingProvider, Retriever, VectorIndex
|
||||
from .ports import EmbeddingProvider, Reranker, Retriever, VectorIndex
|
||||
# Keep package boundaries explicit so backend imports stay predictable.
|
||||
|
||||
|
||||
__all__ = ["RetrievalQuery", "RetrievedChunk", "EmbeddingProvider", "Retriever", "VectorIndex"]
|
||||
__all__ = ["RetrievalQuery", "RetrievedChunk", "EmbeddingProvider", "Reranker", "Retriever", "VectorIndex"]
|
||||
|
||||
@@ -10,7 +10,6 @@ from .models import RetrievalQuery, RetrievedChunk
|
||||
# Keep domain contracts explicit so adapters can swap implementations cleanly.
|
||||
|
||||
|
||||
|
||||
class EmbeddingProvider(ABC):
|
||||
"""Provide the Embedding Provider provider."""
|
||||
@abstractmethod
|
||||
@@ -41,12 +40,35 @@ class VectorIndex(ABC):
|
||||
"""Handle search for the Vector Index instance."""
|
||||
pass
|
||||
|
||||
@abstractmethod
def count_by_document(self) -> dict[str, int]:
    """Report how many chunks the vector store holds per document.

    Returns:
        A dict keyed by ``doc_id`` whose values are chunk counts.
    """
|
||||
|
||||
@abstractmethod
def list_document_metadata(self) -> list[dict]:
    """List one metadata row per document held in the vector store.

    Returns:
        Rows that each carry at least ``doc_id``, ``doc_name`` and
        ``chunk_count``; ``regulation_type`` and ``version`` are optional.
    """
|
||||
|
||||
@abstractmethod
def health(self) -> dict:
    """Report health information for this vector index.

    The keys of the returned dict are left to the implementation; this
    interface does not specify them.
    """
|
||||
|
||||
|
||||
class Reranker(ABC):
    """Port for re-scoring and re-ordering a candidate list.

    Implementations use a cross-encoder model to score the candidates.
    """

    @abstractmethod
    def rerank(self, query: str, chunks: list[RetrievedChunk], top_k: int) -> list[RetrievedChunk]:
        """Pick the ``top_k`` best chunks for ``query``.

        Returns:
            The selected chunks ordered by cross-encoder score, highest
            first.
        """
|
||||
|
||||
|
||||
class Retriever(ABC):
|
||||
"""Provide the Retriever retriever."""
|
||||
@abstractmethod
|
||||
|
||||
Reference in New Issue
Block a user