46 lines
761 B
Plaintext
46 lines
761 B
Plaintext
|
|
# AI+合规智能中枢 - 法律法规文档解析入库
|
|||
|
|
# MVP核心依赖包
|
|||
|
|
|
|||
|
|
# 向量数据库
|
|||
|
|
pymilvus>=2.4.0
|
|||
|
|
|
|||
|
|
# API框架
|
|||
|
|
fastapi>=0.100.0
|
|||
|
|
uvicorn[standard]>=0.23.0
|
|||
|
|
python-multipart>=0.0.6
|
|||
|
|
|
|||
|
|
# RAG框架
|
|||
|
|
langchain>=0.1.0
|
|||
|
|
langchain-milvus>=0.1.0
|
|||
|
|
|
|||
|
|
# PDF解析
|
|||
|
|
pymupdf>=1.24.0 # PyMuPDF
|
|||
|
|
|
|||
|
|
# Word文档解析
|
|||
|
|
python-docx>=0.8.11
|
|||
|
|
|
|||
|
|
# MinerU多模态PDF解析(可选,需要额外配置)
|
|||
|
|
# magic-pdf[full]>=0.6.0
|
|||
|
|
|
|||
|
|
# 嵌入模型
|
|||
|
|
FlagEmbedding>=1.2.0
|
|||
|
|
sentence-transformers>=2.2.0
|
|||
|
|
|
|||
|
|
# 任务队列(可选;如不需要异步任务,可注释掉以下两项)
|
|||
|
|
celery>=5.3.0
|
|||
|
|
redis>=4.5.0
|
|||
|
|
|
|||
|
|
# 对象存储(可选;如不使用 MinIO,可注释掉下面一项)
|
|||
|
|
minio>=7.1.0
|
|||
|
|
|
|||
|
|
# 关系型数据库(默认使用 PostgreSQL 驱动)
|
|||
|
|
psycopg2-binary>=2.9.0
|
|||
|
|
# mysql-connector-python>=8.0.0  # 如改用 MySQL,请取消注释此行
|
|||
|
|
|
|||
|
|
# 工具库
|
|||
|
|
pydantic>=2.0.0
|
|||
|
|
pydantic-settings>=2.0.0
|
|||
|
|
python-dotenv>=1.0.0
|
|||
|
|
loguru>=0.7.0
|
|||
|
|
tenacity>=8.2.0
|
|||
|
|
httpx>=0.24.0
|