Files
ash66 30c7bda389 Refactor document handling and update Milvus collection settings
- Removed multiple failed document entries from `documents.json`.
- Added a new document entry with updated metadata and changed the index name to `regulations_dense_1024_v2`.
- Updated architecture documentation to reflect changes in the Milvus collection name.
- Adjusted requirements by removing the sqlalchemy dependency.
- Modified test cases to align with new document structure and naming conventions.
- Introduced a new test file for Milvus vector index runtime recovery and error handling.
- Updated assertions in various test files to ensure compatibility with the new schema.
2026-05-26 20:21:31 +08:00

38 lines
1.5 KiB
JSON

{
"7cbdfe3c": {
"doc_id": "7cbdfe3c",
"doc_name": "使用RSA Token连接CheckPoint VPN及PIN码设置_220.181.114.93 or 10.25.134.3.docx",
"file_name": "使用RSA Token连接CheckPoint VPN及PIN码设置_220.181.114.93 or 10.25.134.3.docx",
"object_name": "7cbdfe3c/使用RSA Token连接CheckPoint VPN及PIN码设置_220.181.114.93 or 10.25.134.3.docx",
"content_type": "application/vnd.openxmlformats-officedocument.wordprocessingml.document",
"size_bytes": 1199920,
"status": "indexed",
"regulation_type": "",
"version": "",
"summary": "",
"summary_latency_ms": 0,
"chunk_count": 34,
"parser_name": "aliyun_docmind",
"index_name": "regulations_dense_1024_v2",
"error_message": "",
"created_at": "2026-05-26T12:18:27.206125+00:00",
"updated_at": "2026-05-26T12:18:51.171308+00:00",
"metadata": {
"generate_summary": true,
"parser_backend": "aliyun_docmind",
"parse_task_id": "docmind-20260526-10b94713ccb348498b12180a5dcf32ff",
"layout_count": 48,
"structure_node_count": 6,
"semantic_block_count": 33,
"vector_chunk_count": 34,
"artifact_keys": {
"layouts": "artifacts/7cbdfe3c/layouts.json",
"structure_nodes": "artifacts/7cbdfe3c/structure_nodes.json",
"semantic_blocks": "artifacts/7cbdfe3c/semantic_blocks.json",
"vector_chunks": "artifacts/7cbdfe3c/vector_chunks.json"
},
"processing_stage": "indexed",
"index_collection": "regulations_dense_1024_v2"
}
}
}