mirror of
https://git.mirrors.martin98.com/https://github.com/infiniflow/ragflow.git
synced 2025-05-29 17:45:33 +08:00
### What problem does this PR solve?

feat: Make Excel parsing configurable: either an HTML table or row-based text #2516

### Type of change

- [ ] Bug Fix (non-breaking change which fixes an issue)
- [x] New Feature (non-breaking change which adds functionality)
- [ ] Documentation Update
- [ ] Refactoring
- [ ] Performance Improvement
- [ ] Other (please describe):
This commit is contained in:
parent
db1be22a2f
commit
dd019e7ba1
@ -24,6 +24,7 @@ import { useFetchParserListOnMount } from './hooks';
|
|||||||
import { useTranslate } from '@/hooks/common-hooks';
|
import { useTranslate } from '@/hooks/common-hooks';
|
||||||
import Delimiter from '../delimiter';
|
import Delimiter from '../delimiter';
|
||||||
import EntityTypesItem from '../entity-types-item';
|
import EntityTypesItem from '../entity-types-item';
|
||||||
|
import ExcelToHtml from '../excel-to-html';
|
||||||
import LayoutRecognize from '../layout-recognize';
|
import LayoutRecognize from '../layout-recognize';
|
||||||
import ParseConfiguration, {
|
import ParseConfiguration, {
|
||||||
showRaptorParseConfiguration,
|
showRaptorParseConfiguration,
|
||||||
@ -104,6 +105,9 @@ const ChunkMethodModal: React.FC<IProps> = ({
|
|||||||
|
|
||||||
const showEntityTypes = selectedTag === 'knowledge_graph';
|
const showEntityTypes = selectedTag === 'knowledge_graph';
|
||||||
|
|
||||||
|
const showExcelToHtml =
|
||||||
|
selectedTag === 'naive' && documentExtension === 'xlsx';
|
||||||
|
|
||||||
const afterClose = () => {
|
const afterClose = () => {
|
||||||
form.resetFields();
|
form.resetFields();
|
||||||
};
|
};
|
||||||
@ -279,6 +283,7 @@ const ChunkMethodModal: React.FC<IProps> = ({
|
|||||||
<Delimiter></Delimiter>
|
<Delimiter></Delimiter>
|
||||||
</>
|
</>
|
||||||
)}
|
)}
|
||||||
|
{showExcelToHtml && <ExcelToHtml></ExcelToHtml>}
|
||||||
{showRaptorParseConfiguration(selectedTag) && (
|
{showRaptorParseConfiguration(selectedTag) && (
|
||||||
<ParseConfiguration></ParseConfiguration>
|
<ParseConfiguration></ParseConfiguration>
|
||||||
)}
|
)}
|
||||||
|
19
web/src/components/excel-to-html.tsx
Normal file
19
web/src/components/excel-to-html.tsx
Normal file
@ -0,0 +1,19 @@
|
|||||||
|
import { useTranslate } from '@/hooks/common-hooks';
|
||||||
|
import { Form, Switch } from 'antd';
|
||||||
|
|
||||||
|
/**
 * Form field bound to `parser_config.html4excel`.
 *
 * Renders an antd `Switch` inside a `Form.Item`. The switch is bound through
 * the `checked` prop and starts out off (`initialValue={false}`). The label
 * and tooltip texts are resolved from the `knowledgeDetails` translation
 * namespace.
 */
function ExcelToHtml() {
  const { t: translate } = useTranslate('knowledgeDetails');

  // Nested path: the value is stored under `parser_config.html4excel`.
  const fieldPath = ['parser_config', 'html4excel'];
  const fieldLabel = translate('html4excel');
  const fieldTooltip = translate('html4excelTip');

  return (
    <Form.Item
      name={fieldPath}
      label={fieldLabel}
      tooltip={fieldTooltip}
      valuePropName="checked"
      initialValue={false}
    >
      <Switch />
    </Form.Item>
  );
}
|
||||||
|
|
||||||
|
export default ExcelToHtml;
|
@ -150,6 +150,8 @@ export default {
|
|||||||
topK: 'Top-K',
|
topK: 'Top-K',
|
||||||
topKTip: `K chunks will be fed into rerank models.`,
|
topKTip: `K chunks will be fed into rerank models.`,
|
||||||
delimiter: `Delimiter`,
|
delimiter: `Delimiter`,
|
||||||
|
html4excel: 'Excel to HTML',
|
||||||
|
html4excelTip: `Excel will be parsed into HTML table or not. If it's FALSE, every row in Excel will be formed as a chunk.`,
|
||||||
},
|
},
|
||||||
knowledgeConfiguration: {
|
knowledgeConfiguration: {
|
||||||
titleDescription:
|
titleDescription:
|
||||||
|
@ -146,6 +146,8 @@ export default {
|
|||||||
topK: 'Top-K',
|
topK: 'Top-K',
|
||||||
topKTip: `K塊將被送入Rerank型號。`,
|
topKTip: `K塊將被送入Rerank型號。`,
|
||||||
delimiter: `分段標識符`,
|
delimiter: `分段標識符`,
|
||||||
|
html4excel: '表格轉HTML',
|
||||||
|
html4excelTip: `Excel 是否會被解析為 HTML 表格。如果為 FALSE,Excel 中的每一行都會形成一個區塊。`,
|
||||||
},
|
},
|
||||||
knowledgeConfiguration: {
|
knowledgeConfiguration: {
|
||||||
titleDescription: '在這裡更新您的知識庫詳細信息,尤其是解析方法。',
|
titleDescription: '在這裡更新您的知識庫詳細信息,尤其是解析方法。',
|
||||||
|
@ -147,6 +147,8 @@ export default {
|
|||||||
topK: 'Top-K',
|
topK: 'Top-K',
|
||||||
topKTip: `K块将被送入Rerank型号。`,
|
topKTip: `K块将被送入Rerank型号。`,
|
||||||
delimiter: `分段标识符`,
|
delimiter: `分段标识符`,
|
||||||
|
html4excel: '表格转HTML',
|
||||||
|
html4excelTip: `Excel 是否将被解析为 HTML 表。如果为 FALSE,Excel 中的每一行都将形成一个块。`,
|
||||||
},
|
},
|
||||||
knowledgeConfiguration: {
|
knowledgeConfiguration: {
|
||||||
titleDescription: '在这里更新您的知识库详细信息,尤其是解析方法。',
|
titleDescription: '在这里更新您的知识库详细信息,尤其是解析方法。',
|
||||||
|
@ -1,5 +1,6 @@
|
|||||||
import Delimiter from '@/components/delimiter';
|
import Delimiter from '@/components/delimiter';
|
||||||
import EntityTypesItem from '@/components/entity-types-item';
|
import EntityTypesItem from '@/components/entity-types-item';
|
||||||
|
import ExcelToHtml from '@/components/excel-to-html';
|
||||||
import LayoutRecognize from '@/components/layout-recognize';
|
import LayoutRecognize from '@/components/layout-recognize';
|
||||||
import MaxTokenNumber from '@/components/max-token-number';
|
import MaxTokenNumber from '@/components/max-token-number';
|
||||||
import ParseConfiguration, {
|
import ParseConfiguration, {
|
||||||
@ -124,6 +125,7 @@ const ConfigurationForm = ({ form }: { form: FormInstance }) => {
|
|||||||
<MaxTokenNumber></MaxTokenNumber>
|
<MaxTokenNumber></MaxTokenNumber>
|
||||||
<Delimiter></Delimiter>
|
<Delimiter></Delimiter>
|
||||||
<LayoutRecognize></LayoutRecognize>
|
<LayoutRecognize></LayoutRecognize>
|
||||||
|
<ExcelToHtml></ExcelToHtml>
|
||||||
</>
|
</>
|
||||||
)}
|
)}
|
||||||
{showRaptorParseConfiguration(parserId) && (
|
{showRaptorParseConfiguration(parserId) && (
|
||||||
|
Loading…
x
Reference in New Issue
Block a user