Refactor code structure for improved readability and maintainability
This commit is contained in:
@@ -1,7 +1,6 @@
|
||||
# src/services/embedding/__init__.py
|
||||
"""嵌入和分块服务"""
|
||||
|
||||
from .text_chunker import RegulationChunker
|
||||
from .bge_m3_embedder import BGEM3Embedder
|
||||
|
||||
__all__ = ["RegulationChunker", "BGEM3Embedder"]
|
||||
__all__ = ["RegulationChunker", "BGEM3Embedder"]
|
||||
|
||||
@@ -1,4 +1,3 @@
|
||||
# src/services/embedding/bge_m3_embedder.py
|
||||
"""BGE-M3嵌入服务 - Dense+Sparse双路向量生成"""
|
||||
|
||||
import numpy as np
|
||||
@@ -293,4 +292,4 @@ def embed_single_text(
|
||||
) -> Dict:
|
||||
"""便捷函数:对单个文本生成嵌入"""
|
||||
embedder = BGEM3Embedder(model_name=model_name, **kwargs)
|
||||
return embedder.embed_single(text)
|
||||
return embedder.embed_single(text)
|
||||
|
||||
@@ -1,4 +1,3 @@
|
||||
# src/services/embedding/text_chunker.py
|
||||
"""智能分块器 - 章节级+条款级双粒度切割"""
|
||||
|
||||
import re
|
||||
@@ -446,4 +445,4 @@ def chunk_regulation_document(
|
||||
doc_name,
|
||||
regulation_type,
|
||||
version
|
||||
)
|
||||
)
|
||||
|
||||
Reference in New Issue
Block a user