export default { translation: { common: { back: 'Back', operationFailed: 'Operation failed', noResults: 'No results.', selectPlaceholder: 'select value', selectAll: 'Select All', delete: 'Delete', deleteModalTitle: 'Are you sure to delete this item?', ok: 'Yes', cancel: 'No', no: 'No', total: 'Total', rename: 'Rename', name: 'Name', save: 'Save', namePlaceholder: 'Please input name', next: 'Next', create: 'Create', edit: 'Edit', update: 'Update', configure: 'Configure', upload: 'Upload', english: 'English', portugueseBr: 'Portuguese (Brazil)', chinese: 'Simplified Chinese', traditionalChinese: 'Traditional Chinese', language: 'Language', languageMessage: 'Please input your language!', loading: 'Loading...', close: 'Close', languagePlaceholder: 'select your language', copy: 'Copy', copied: 'Copied', comingSoon: 'Coming soon', download: 'Download', preview: 'Preview', move: 'Move', warn: 'Warn', action: 'Action', s: 'S', pleaseSelect: 'Please select', pleaseInput: 'Please input', submit: 'Submit', clear: 'Clear', embedIntoSite: 'Embed into webpage', previousPage: 'Previous', nextPage: 'Next', add: 'Add', remove: 'Remove', search: 'Search', noDataFound: 'No data found.', noData: 'No data', promptPlaceholder: `Please input or use / to quickly insert variables.`, all: 'All', refresh: 'Refresh', submitting: 'Submitting...', description: 'Description', confirm: 'Confirm', enabled: 'Enabled', disabled: 'Disabled', clearFilter: 'Clear Filter', confirmFilter: 'Confirm Filter', private: 'Private', moreActions: 'More Actions', disable: 'Disable', enable: 'Enable', onlyMe: 'Only Me', team: 'Team', public: 'Public', unknown: 'Unknown', noDescription: 'No description', viewAll: 'View All', viewDetails: 'View Details', mcp: { namePlaceholder: 'My MCP Server', nameRequired: 'It must be 1–64 characters long and can only contain letters, numbers, hyphens, and underscores.', urlPlaceholder: 'https://api.example.com/v1/mcp', tokenPlaceholder: 'e.g. eyJhbGciOiJIUzI1Ni...', }, }, knowledgeSettings: { submitData: 'Submit data:', basicInfoUpdateSuccess: 'Basic information updated successfully', parseConfigUpdateSuccess: 'Parse configuration updated successfully', updateFailed: '{{type}} update failed', basicInfo: 'Basic Information', parseConfig: 'Parse Configuration', knowledgeBase: 'Knowledge Base', knowledgeBaseDetail: 'Knowledge Base Detail', settings: 'Settings', overview: 'Overview', fileLogs: 'File Logs', knowledgeBaseSettings: 'Knowledge Base Settings', settingsTabs: 'Settings Tabs', backToKnowledgeDetail: 'Back to Knowledge Base Detail', }, form: { fieldRequired: '{{field}} is required', minValueExceeded: '{{field}} cannot be less than {{min}}', maxValueExceeded: '{{field}} cannot be greater than {{max}}', configurationError: 'Form configuration error', chipListPlaceholder: 'Type and press Enter to add', maxChipsExceeded: '{{field}} can have at most {{max}} tags', noChips: 'No tags', formConfigError: 'Form configuration error', }, knowledge: { basicInfo: 'Basic Information', uploadAvatar: 'Upload Avatar', nameRequired: 'Knowledge base name cannot be empty', knowledgeBaseName: 'Knowledge Base Name', descriptionPlaceholder: 'Please enter knowledge base description...', permissionSettings: 'Permission Settings', onlyMe: 'Only Me', teamMembers: 'Team Members', retrievalTest: 'Retrieval Test', configSettings: 'Configuration Settings', knowledgeBaseActions: 'Knowledge Base Actions', filter: 'Filter', runStatus: { unstart: 'Not Started', running: 'Running', cancel: 'Cancelled', done: 'Done', fail: 'Failed', unknown: 'Unknown', parsing: 'Parsing' }, runStatusFilter: 'Run Status', fileName: 'File Name', actions: 'Actions', fileType: 'File Type', fileTypeFilter: 'File Type', searchFiles: 'Search Files', uploadFile: 'Upload File', fileCount: 'File Count', chunkCount: 'Chunk Count', tokenCount: 'Token Count', size: 'Size', createTime: 'Create Time', updateTime: 'Update Time', language: 'Language', permission: 'Permission', embeddingModel: 'Embedding Model', parser: 'Parser', type: 'Type', status: 'Status', parseStatus: 'Parse Status', uploadTime: 'Upload Time', documentCount: 'Document Count', lastUpdate: 'Last Update', creator: 'Creator', testPrompt: 'Test Prompt', testResultOverview: 'Test Result Overview', matchedChunks: 'Matched Chunks', relatedDocuments: 'Related Documents', returnedChunks: 'Returned Chunks', documentFilter: 'Document Filter', selectDocuments: 'Select Documents', noContent: 'No content', keywords: 'Keywords', relatedDocumentStats: 'Related Document Statistics', selectParserMethod: 'Select Parser Method', unknown: 'Unknown', description: 'Description', pageRank: 'Page Rank', edge: 'Edge', missingIds: 'missing IDs', nodeNotExists: 'node not exists', noGraphData: 'No graph data available', legend: 'Legend', graphStats: 'Graph Statistics', reparse: 'Reparse', cancelRun: 'Cancel Run', renameFile: 'Rename File', viewDetails: 'View Details', viewFileDetails: 'View File Details', matchedChunksCount: 'Matched Chunks Count', matchedChunksTitle: 'Matched Chunks Title', totalMatchedChunks: 'Total Matched Chunks', similarity: 'Similarity', vectorSimilarity: 'Vector Similarity', termSimilarity: 'Term Similarity', nodeCount: 'Node Count', edgeCount: 'Edge Count', noMatchingKnowledgeBases: 'No matching knowledge bases', noKnowledgeBases: 'No knowledge bases', tryAdjustingFilters: 'Try adjusting your filters', createFirstKnowledgeBase: 'Create your first knowledge base', createKnowledgeBase: 'Create Knowledge Base', noDescription: 'No description', config: { basicConfig: 'Basic Configuration', pageRankAndAutoExtract: 'PageRank and Auto Extract', raptorStrategy: 'RAPTOR Strategy', knowledgeGraph: 'Knowledge Graph', chunkMethod: 'Chunk Method', selectChunkMethod: 'Select chunk method', pageRank: 'Page Rank', enterPageRank: 'Enter page rank', autoKeywords: 'Auto Keywords Extraction', enterKeywordCount: 'Enter keyword count', autoQuestions: 'Auto Questions Extraction', enterQuestionCount: 'Enter question count', pdfParser: 'PDF Parser', plainText: 'Naive', minerU: 'MinerU', experimental: 'Experimental', tocEnhance: 'TOC Enhance', delimiter: 'Delimiter', enterDelimiter: 'Enter delimiter', embeddingModel: 'Embedding Model', pageRankConfigTodo: 'PageRank Configuration - To be implemented', entityTypeConfigTodo: 'Entity Type Configuration - To be implemented', maxTokenConfigTodo: 'Max Token Configuration (Max: 16384) - To be implemented', delimiterConfigTodo: 'Delimiter Configuration - To be implemented', chunkTokenSize: 'Suggested chunk token size', htmlForExcel: 'Table to HTML', tags: 'Tags', useRaptorStrategy: 'Use Retrieval-Augmented RAPTOR Strategy', prompt: 'Prompt', raptorPromptDefault: 'Please summarize the following paragraphs. Be careful with numbers and do not make up information. Paragraphs:\n{cluster_content}\nThe above is the content you need to summarize.', maxTokens: 'Max tokens', threshold: 'Threshold', maxClusterCount: 'Max cluster count', randomSeed: 'Random seed', extractKnowledgeGraph: 'Extract knowledge graph', entityTypes: '*Entity types', method: 'Method', entityNormalization: 'Entity normalization', communityReportGeneration: 'Community report generation', parser: { general: 'General Parser', qa: 'Q&A Parser', resume: 'Resume Parser', manual: 'Manual Parser', table: 'Table Parser', paper: 'Paper Parser', book: 'Book Parser', laws: 'Laws Parser', presentation: 'Presentation Parser', one: 'One Parser', tag: 'Tag Parser' } } }, login: { login: 'Sign in', signUp: 'Sign up', loginDescription: 'We’re so excited to see you again!', registerDescription: 'Glad to have you on board!', emailLabel: 'Email', emailPlaceholder: 'Please input email', emailInvalid: 'Invalid email address', passwordLabel: 'Password', passwordPlaceholder: 'Please input password', confirmPasswordRequired: 'Please confirm your password', confirmPassword: 'Confirm password', confirmPasswordMessage: 'Please confirm your password!', confirmPasswordNonMatchMessage: 'The confirm password that you entered do not match!', rememberMe: 'Remember me', signInTip: 'Don’t have an account?', signUpTip: 'Already have an account?', nicknameLabel: 'Nickname', nicknamePlaceholder: 'Please input nickname', register: 'Create an account', continue: 'Continue', title: 'Start building your smart assistants.', description: 'Sign up for free to explore top RAG technology. Create knowledge bases and AIs to empower your business.', review: 'from 500+ reviews', }, header: { knowledgeBase: 'Knowledge Bases', chat: 'Chat', register: 'Register', signin: 'Sign in', home: 'Home', setting: 'Settings', logout: 'Log out', fileManager: 'File Management', agents: 'Agents', models: 'Models', mcp: 'MCP', search: 'Search', welcome: 'Welcome to', }, knowledgeHooks: { fetchKnowledgeListFailed: 'Failed to fetch knowledge base list', fetchKnowledgeDetailFailed: 'Failed to fetch knowledge base details', fetchKnowledgeGraphFailed: 'Failed to fetch knowledge graph', createKnowledgeFailed: 'Failed to create knowledge base', updateKnowledgeBasicInfoFailed: 'Failed to update knowledge base basic information', updateKnowledgeModelConfigFailed: 'Failed to update knowledge base model configuration', deleteKnowledgeFailed: 'Failed to delete knowledge base', batchDeleteKnowledgeFailed: 'Failed to batch delete knowledge bases', batchDeleteFailedKnowledgeBases: 'Failed to delete knowledge bases', }, knowledgeTesting: { retrievalTestComplete: 'Retrieval test completed', retrievalTestFailed: 'Retrieval test failed', paginationRequestFailed: 'Pagination request failed', knowledgeBase: 'Knowledge Base', knowledgeBaseDetail: 'Knowledge Base Detail', testing: 'Testing', knowledgeBaseTesting: 'Knowledge Base Testing', testConfiguration: 'Test Configuration', testQuestion: 'Test Question', pleaseEnterTestQuestion: 'Please enter test question', testQuestionPlaceholder: 'Please enter the question you want to test...', similarityThreshold: 'Similarity Threshold', vectorSimilarityWeight: 'Vector Similarity Weight', rerankModel: 'Rerank Model (Optional)', noRerank: 'No reranking', pleaseEnterResultCount: 'Please enter result count', minValue1: 'Minimum value is 1', maxValue2048: 'Maximum value is 2048', useWithRerankModel: 'Use with Rerank model', crossLanguageSearch: 'Cross-language Search', useKnowledgeGraph: 'Use Knowledge Graph', startTest: 'Start Test', languages: { english: 'English', chinese: 'Chinese', japanese: 'Japanese', korean: 'Korean', french: 'French', german: 'German', spanish: 'Spanish', italian: 'Italian', portuguese: 'Portuguese', russian: 'Russian', arabic: 'Arabic', hindi: 'Hindi', thai: 'Thai', vietnamese: 'Vietnamese', indonesian: 'Indonesian', malay: 'Malay', filipino: 'Filipino', turkish: 'Turkish', polish: 'Polish', dutch: 'Dutch', swedish: 'Swedish', danish: 'Danish', norwegian: 'Norwegian', finnish: 'Finnish', hebrew: 'Hebrew', czech: 'Czech', slovak: 'Slovak', hungarian: 'Hungarian', romanian: 'Romanian', bulgarian: 'Bulgarian', croatian: 'Croatian', serbian: 'Serbian', slovenian: 'Slovenian', estonian: 'Estonian', latvian: 'Latvian', lithuanian: 'Lithuanian', maltese: 'Maltese', irish: 'Irish', welsh: 'Welsh', basque: 'Basque', catalan: 'Catalan', galician: 'Galician', icelandic: 'Icelandic', macedonian: 'Macedonian', albanian: 'Albanian', belarusian: 'Belarusian', ukrainian: 'Ukrainian', kazakh: 'Kazakh', kyrgyz: 'Kyrgyz', uzbek: 'Uzbek', tajik: 'Tajik', mongolian: 'Mongolian', georgian: 'Georgian', armenian: 'Armenian', azerbaijani: 'Azerbaijani', persian: 'Persian', urdu: 'Urdu', bengali: 'Bengali', tamil: 'Tamil', telugu: 'Telugu', malayalam: 'Malayalam', kannada: 'Kannada', gujarati: 'Gujarati', punjabi: 'Punjabi', odia: 'Odia', assamese: 'Assamese', nepali: 'Nepali', sinhala: 'Sinhala', burmese: 'Burmese', khmer: 'Khmer', lao: 'Lao', swahili: 'Swahili', amharic: 'Amharic', yoruba: 'Yoruba', igbo: 'Igbo', hausa: 'Hausa', zulu: 'Zulu', xhosa: 'Xhosa', afrikaans: 'Afrikaans', } }, knowledgeList: { welcome: 'Welcome back', description: 'Which knowledge bases will you use today?', createKnowledgeBase: 'Create Knowledge Base', name: 'Name', namePlaceholder: 'Please input name!', doc: 'Docs', searchKnowledgePlaceholder: 'Search', noMoreData: `That's all. Nothing more.`, confirmDeleteKnowledge: 'Are you sure to delete knowledge base', teamFilter: 'Team Filter', loadError: 'Failed to load knowledge base list', paginationInfo: 'Total {{total}} knowledge bases, page {{current}} of {{totalPages}}', }, knowledgeDetails: { fileSize: 'File Size', fileType: 'File Type', uploadedBy: 'Uploaded by', notGenerated: 'Not generated', generatedOn: 'Generated on', subbarFiles: 'Files', generateKnowledgeGraph: 'This will extract entities and relationships from all your documents in this dataset. The process may take a while to complete.', generateRaptor: 'This will extract entities and relationships from all your documents in this dataset. The process may take a while to complete.', generate: 'Generate', raptor: 'Raptor', processingType: 'Processing Type', dataPipeline: 'Data Pipeline', ingestionPipeline: 'Ingestion Pipeline', operations: 'Operations', taskId: 'Task ID', duration: 'Duration', details: 'Details', status: 'Status', task: 'Task', startDate: 'Start Date', source: 'Source', fileName: 'File Name', datasetLogs: 'Dataset Logs', fileLogs: 'File Logs', overview: 'Overview', success: 'Success', failed: 'Failed', completed: 'Completed', datasetLog: 'Dataset Log', created: 'Created', learnMore: 'Learn More', localUpload: 'Local Upload', general: 'General', chunkMethodTab: 'Chunk Method', testResults: 'Test Results', testSetting: 'Test Setting', retrievalTesting: 'Retrieval Testing', retrievalTestingDescription: 'Conduct a retrieval test to check if RAGFlow can recover the intended content for the LLM.', Parse: 'Parse', file: 'File', dataset: 'Dataset', testing: 'Retrieval testing', files: 'Files List', configuration: 'Configuration', knowledgeGraph: 'Knowledge Graph', name: 'Name', namePlaceholder: 'Please input name!', // 新增的字段 deleteFileFailed: 'Delete file failed', uploadFiles: 'Upload files:', uploadFileFailed: 'Upload file failed', reparseFailed: 'Reparse failed', renameFailed: 'Rename failed', changeStatusFailed: 'Change status failed', viewDetails: 'View Details', viewProcessDetails: 'View Process Details', knowledgeBase: 'Knowledge Base', knowledgeBaseDetail: 'Knowledge Base Detail', documents: 'Documents', graph: 'Graph', deleteFiles: 'Delete files:', newSelectionModel: 'New selection model:', uploadFilesToKnowledge: 'Upload files to knowledge base', confirmDelete: 'Confirm Delete', confirmDeleteMessage: 'Are you sure you want to delete the selected {{count}} files? This action cannot be undone.', documentProcessDetails: 'Document Process Details', basicInfo: 'Basic Information', parserId: 'Parser ID', notSpecified: 'Not specified', processStatus: 'Process Status', startTime: 'Start Time', notStarted: 'Not started', processingTime: 'Processing Time', notCompleted: 'Not completed', progress: 'Progress', processDetails: 'Process Details', seconds: 'seconds', doc: 'Docs', datasetDescription: 'Please wait for your files to finish parsing before starting an AI-powered chat.', addFile: 'Add file', searchFiles: 'Search your files', localFiles: 'Local files', emptyFiles: 'Create empty file', webCrawl: 'Web Crawl', chunkNumber: 'Chunk Number', uploadDate: 'Upload Date', chunkMethod: 'Chunking method', enabled: 'Enable', disabled: 'Disable', action: 'Action', parsingStatus: 'Parsing Status', parsingStatusTip: 'Document parsing time varies based on several factors. Enabling features like Knowledge Graph, RAPTOR, Auto Question Extraction, or Auto Keyword Extraction will significantly increase processing time. If the progress bar stalls, please consult these two FAQs: https://ragflow.io/docs/dev/faq#why-does-my-document-parsing-stall-at-under-one-percent.', processBeginAt: 'Begin at', processDuration: 'Duration', progressMsg: 'Progress', noTestResultsForRuned: 'No relevant results found. Try adjusting your query or parameters.', noTestResultsForNotRuned: 'No test has been run yet. Results will appear here.', testingDescription: 'Conduct a retrieval test to check if RAGFlow can recover the intended content for the LLM. If you have adjusted the default settings, such as keyword similarity weight or similarity threshold, to achieve the optimal results, be aware that these changes will not be automatically saved. You must apply them to your chat assistant settings or the Retrieval agent component settings.', similarityThreshold: 'Similarity threshold', similarityThresholdTip: 'RAGFlow employs either a combination of weighted keyword similarity and weighted vector cosine similarity, or a combination of weighted keyword similarity and weighted reranking score during retrieval. This parameter sets the threshold for similarities between the user query and chunks. Any chunk with a similarity score below this threshold will be excluded from the results. By default, the threshold is set to 0.2. This means that only chunks with hybrid similarity score of 20 or higher will be retrieved.', vectorSimilarityWeight: 'Vector similarity weight', vectorSimilarityWeightTip: 'This sets the weight of keyword similarity in the combined similarity score, either used with vector cosine similarity or with reranking score. The total of the two weights must equal 1.0.', keywordSimilarityWeight: 'Keyword similarity weight', keywordSimilarityWeightTip: 'This sets the weight of keyword similarity in the combined similarity score, either used with vector cosine similarity or with reranking score. The total of the two weights must equal 1.0.', testText: 'Test text', testTextPlaceholder: 'Input your question here!', testingLabel: 'Testing', similarity: 'Hybrid similarity', termSimilarity: 'Term similarity', vectorSimilarity: 'Vector similarity', hits: 'Hits', view: 'View', filesSelected: 'Files selected', upload: 'Upload', run: 'Parse', runningStatus0: 'PENDING', runningStatus1: 'PARSING', runningStatus2: 'CANCELED', runningStatus3: 'SUCCESS', runningStatus4: 'FAIL', pageRanges: 'Page Ranges', pageRangesTip: 'Range of pages to be parsed; pages outside this range will not be processed.', fromPlaceholder: 'from', fromMessage: 'Missing start page number', toPlaceholder: 'to', toMessage: 'Missing end page number (excluded)', layoutRecognize: 'PDF parser', layoutRecognizeTip: 'Use a visual model for PDF layout analysis to effectively locate document titles, text blocks, images, and tables. If the naive option is chosen, only the plain text in the PDF will be retrieved. Please note that this option currently works ONLY for PDF documents.', taskPageSize: 'Task page size', taskPageSizeMessage: 'Please input your task page size!', taskPageSizeTip: `During layout recognition, a PDF file is split into chunks and processed in parallel to increase processing speed. This parameter sets the size of each chunk. A larger chunk size reduces the likelihood of splitting continuous text between pages.`, addPage: 'Add page', greaterThan: 'The current value must be greater than to!', greaterThanPrevious: 'The current value must be greater than the previous to!', selectFiles: 'Select files', changeSpecificCategory: 'Change specific category', uploadTitle: 'Drag and drop your file here to upload', uploadDescription: 'Supports single or batch file upload. For a locally deployed RAGFlow: the total file size limit per upload is 1GB, with a batch upload limit of 32 files. There is no cap on the total number of files per account. For demo.ragflow.io, the total file size limit per upload is 10MB, with each file not exceeding 10MB and a maximum of 128 files per account.', chunk: 'Chunk', bulk: 'Bulk', cancel: 'Cancel', close: 'Close', rerankModel: 'Rerank model', rerankPlaceholder: 'Please select', rerankTip: `Optional. If left empty, RAGFlow will use a combination of weighted keyword similarity and weighted vector cosine similarity; if a rerank model is selected, a weighted reranking score will replace the weighted vector cosine similarity. Please be aware that using a rerank model will significantly increase the system's response time. If you wish to use a rerank model, ensure you use a SaaS reranker; if you prefer a locally deployed rerank model, ensure you start RAGFlow with docker-compose-gpu.yml.`, topK: 'Top-K', topKTip: `Used together with the Rerank model, this setting defines the number of text chunks to be sent to the specified reranking model.`, delimiter: `Delimiter for text`, delimiterTip: 'A delimiter or separator can consist of one or multiple special characters. If it is multiple characters, ensure they are enclosed in backticks( ``). For example, if you configure your delimiters like this: \\n`##`;, then your texts will be separated at line breaks, double hash symbols (##), and semicolons.', html4excel: 'Excel to HTML', html4excelTip: `Use with the General chunking method. When disabled, spreadsheets (XLSX or XLS(Excel 97-2003)) in the knowledge base will be parsed into key-value pairs. When enabled, they will be parsed into HTML tables, splitting every 12 rows if the original table has more than 12 rows. See https://ragflow.io/docs/dev/enable_excel2html for details.`, autoKeywords: 'Auto-keyword', autoKeywordsTip: `Automatically extract N keywords for each chunk to increase their ranking for queries containing those keywords. Be aware that extra tokens will be consumed by the chat model specified in 'System model settings'. You can check or update the added keywords for a chunk from the chunk list. For details, see https://ragflow.io/docs/dev/autokeyword_autoquestion.`, autoQuestions: 'Auto-question', autoQuestionsTip: `Automatically extract N questions for each chunk to increase their ranking for queries containing those questions. You can check or update the added questions for a chunk from the chunk list. This feature will not disrupt the chunking process if an error occurs, except that it may add an empty result to the original chunk. Be aware that extra tokens will be consumed by the LLM specified in 'System model settings'. For details, see https://ragflow.io/docs/dev/autokeyword_autoquestion.`, redo: 'Do you want to clear the existing {{chunkNum}} chunks?', setMetaData: 'Set Meta Data', pleaseInputJson: 'Please enter JSON', documentMetaTips: `
The meta data is in Json format(it's not searchable). It will be added into prompt for LLM if any chunks of this document are included in the prompt.
Examples:
The meta data is:
{
"Author": "Alex Dowson",
"Date": "2024-11-12"
}
Document: the_name_of_document
Author: Alex Dowson
Date: 2024-11-12
Relevant fragments as following:
Deleting the generated {{type}} results will remove all derived entities and relationships from this dataset. Your original files will remain intact.
Do you want to continue?
`,
extractRaptor: 'Extract Raptor',
extractKnowledgeGraph: 'Extract Knowledge Graph',
filterPlaceholder: 'please input filter',
fileFilterTip: '',
fileFilter: 'File Filter',
setDefaultTip: '',
setDefault: 'Set as Default',
eidtLinkDataPipeline: 'Edit Data Pipeline',
linkPipelineSetTip: 'Manage data pipeline linkage with this dataset',
default: 'Default',
buildMode: 'Build Mode',
dataPipeline: 'Data Pipeline',
linkDataPipeline: 'Link Data Pipeline',
enableAutoGenerate: 'Enable Auto Generate',
teamPlaceholder: 'Please select a team.',
dataFlowPlaceholder: 'Please select a pipeline.',
buildItFromScratch: 'Build it from scratch',
dataFlow: 'Pipeline',
parseType: 'Ingestion pipeline',
manualSetup: 'Manual Setup',
builtIn: 'Built-in',
titleDescription:
'Update your knowledge base configuration here, particularly the chunking method.',
name: 'Knowledge base name',
photo: 'Knowledge base photo',
photoTip: 'You can upload a file with 4 MB',
description: 'Description',
language: 'Document language',
languageMessage: 'Please input your language!',
languagePlaceholder: 'Please input your language!',
permissions: 'Permissions',
embeddingModel: 'Embedding model',
chunkTokenNumber: 'Recommended chunk size',
chunkTokenNumberMessage: 'Chunk token number for text is required',
embeddingModelTip:
'The default embedding model for the knowledge base. It cannot be changed once the knowledge base has chunks. To switch to a different default embedding model, you must delete all existing chunks in the knowledge base.',
permissionsTip:
"If it is set to 'Team', all your team members will be able to manage the knowledge base.",
chunkTokenNumberTip:
'It kind of sets the token threshold for a creating a chunk. A segment with fewer tokens than this threshold will be combined with the following segments until the token count exceeds the threshold, at which point a chunk is created. No new chunk is created unless a delimiter is encountered, even if the threshold is exceeded.',
chunkMethod: 'Chunking method',
chunkMethodTip: 'View the tips on the right.',
upload: 'Upload',
english: 'English',
chinese: 'Chinese',
portugueseBr: 'Portuguese (Brazil)',
embeddingModelPlaceholder: 'Please select a embedding model.',
chunkMethodPlaceholder: 'Please select a chunking method.',
save: 'Save',
me: 'Only me',
team: 'Team',
cancel: 'Cancel',
methodTitle: 'Chunking method description',
methodExamples: 'Examples',
methodExamplesDescription:
'The following screenshots are provided for clarification.',
dialogueExamplesTitle: 'view',
methodEmpty:
'This will display a visual explanation of the knowledge base categories',
book: `
Supported file formats are DOCX, PDF, TXT.
For each book in PDF, please set the page ranges to remove unwanted information and reduce analysis time.
`, laws: `Supported file formats are DOCX, PDF, TXT.
Legal documents typically follow a rigorous writing format. We use text feature to identify split point.
The chunk has a granularity consistent with 'ARTICLE', ensuring all upper level text is included in the chunk.
`, manual: `Only PDF is supported.
We assume that the manual has a hierarchical section structure, using the lowest section titles as basic unit for chunking documents. Therefore, figures and tables in the same section will not be separated, which may result in larger chunk sizes.
`, naive: `Supported file formats are MD, MDX, DOCX, XLSX, XLS (Excel 97-2003), PPT, PDF, TXT, JPEG, JPG, PNG, TIF, GIF, CSV, JSON, EML, HTML.
This method chunks files using a 'naive' method:
Only PDF file is supported.
Papers will be split by section, such as abstract, 1.1, 1.2.
This approach enables the LLM to summarize the paper more effectively and to provide more comprehensive, understandable responses. However, it also increases the context for AI conversations and adds to the computational cost for the LLM. So during a conversation, consider reducing the value of ‘topN’.
`, presentation: `Supported file formats are PDF, PPTX.
Every page in the slides is treated as a chunk, with its thumbnail image stored.
This chunking method is automatically applied to all uploaded PPT files, so you do not need to specify it manually.
`, qa: `This chunking method supports XLSX and CSV/TXT file formats.
Lines of texts that fail to follow the above rules will be ignored, and each Q&A pair will be considered a distinct chunk.
`, resume: `Supported file formats are DOCX, PDF, TXT.
Résumés of various forms are parsed and organized into structured data to facilitate candidate search for recruiters.
`, table: `Supported file formats are XLSX and CSV/TXT.
Here are some prerequisites and tips:
Here are some examples of headers:
Image files are supported, with video support coming soon.
This method employs an OCR model to extract texts from images.
If the text extracted by the OCR model is deemed insufficient, a specified visual LLM will be used to provide a description of the image.
`, one: `Supported file formats are DOCX, XLSX, XLS (Excel 97-2003), PDF, TXT.
This method treats each document in its entirety as a chunk.
Applicable when you require the LLM to summarize the entire document, provided it can handle that amount of context length.
`, knowledgeGraph: `Supported file formats are DOCX, EXCEL, PPT, IMAGE, PDF, TXT, MD, JSON, EML
This approach chunks files using the 'naive'/'General' method. It splits a document into segments and then combines adjacent segments until the token count exceeds the threshold specified by 'Chunk token number for text', at which point a chunk is created.
The chunks are then fed to the LLM to extract entities and relationships for a knowledge graph and a mind map.
Ensure that you set the Entity types.
`, tag: `A knowledge base using the 'Tag' chunking method functions as a tag set. Other knowledge bases use it to tag their chunks, and queries to these knowledge bases are also tagged using this tag set.
A tag set will NOT be directly involved in a Retrieval-Augmented Generation (RAG) process.
Each chunk in this knowledge base is an independent description-tag pair.
Supported file formats include XLSX and CSV/TXT:
If a file is in XLSX format, it should contain two columns without headers: one for tag descriptions and the other for tag names, with the Description column preceding the Tag column. Multiple sheets are acceptable, provided the columns are properly structured.
If a file is in CSV/TXT format, it must be UTF-8 encoded with TAB as the delimiter to separate descriptions and tags.
In a Tag column, comma is used to separate tags.
Lines of texts that fail to follow the above rules will be ignored. `, useRaptor: 'RAPTOR', useRaptorTip: 'Enable RAPTOR for multi-hop question-answering tasks. See https://ragflow.io/docs/dev/enable_raptor for details.', prompt: 'Prompt', promptTip: 'Use the system prompt to describe the task for the LLM, specify how it should respond, and outline other miscellaneous requirements. The system prompt is often used in conjunction with keys (variables), which serve as various data inputs for the LLM. Use a forward slash `/` or the (x) button to show the keys to use.', promptMessage: 'Prompt is required', promptText: `Please summarize the following paragraphs. Be careful with the numbers, do not make things up. Paragraphs as following: {cluster_content} The above is the content you need to summarize.`, maxToken: 'Max token', maxTokenTip: 'The maximum number of tokens per generated summary chunk.', maxTokenMessage: 'Max token is required', threshold: 'Threshold', thresholdTip: 'In RAPTOR, chunks are clustered by their semantic similarity. The Threshold parameter sets the minimum similarity required for chunks to be grouped together. A higher Threshold means fewer chunks in each cluster, while a lower one means more.', thresholdMessage: 'Threshold is required', maxCluster: 'Max cluster', maxClusterTip: 'The maximum number of clusters to create.', maxClusterMessage: 'Max cluster is required', randomSeed: 'Random seed', randomSeedMessage: 'Random seed is required', entityTypes: 'Entity types', vietnamese: 'Vietnamese', pageRank: 'Page rank', pageRankTip: `You can assign a higher PageRank score to specific knowledge bases during retrieval. The corresponding score is added to the hybrid similarity scores of retrieved chunks from these knowledge bases, increasing their ranking. See https://ragflow.io/docs/dev/set_page_rank for details.`, tagName: 'Tag', frequency: 'Frequency', searchTags: 'Search tags', tagCloud: 'Cloud', tagTable: 'Table', tagSet: 'Tag sets', tagSetTip: `Select one or multiple tag knowledge bases to auto-tag chunks in your knowledge base. See https://ragflow.io/docs/dev/use_tag_sets for details.
The user query will also be auto-tagged.
This auto-tagging feature enhances retrieval by adding another layer of domain-specific knowledge to the existing dataset.Difference between auto-tag and auto-keyword: