From c900a186b786af965dbec6211243d928079dc6c4 Mon Sep 17 00:00:00 2001
From: Wenwei Lin
Date: Sun, 9 Feb 2025 18:24:25 +0800
Subject: [PATCH] =?UTF-8?q?feat:=20=E7=9F=A5=E8=AF=86=E5=BA=93=E6=96=87?=
 =?UTF-8?q?=E4=BB=B6=E6=94=AF=E6=8C=81=20html=20=E7=B1=BB=E5=9E=8B?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 src/main/services/KnowledgeService.ts                 | 11 +++++++++++
 src/renderer/src/pages/knowledge/KnowledgeContent.tsx |  2 +-
 2 files changed, 12 insertions(+), 1 deletion(-)

diff --git a/src/main/services/KnowledgeService.ts b/src/main/services/KnowledgeService.ts
index 95634a7d..ccbf2bb3 100644
--- a/src/main/services/KnowledgeService.ts
+++ b/src/main/services/KnowledgeService.ts
@@ -178,6 +178,17 @@ class KnowledgeService {
 
       const fileContent = fs.readFileSync(file.path, 'utf-8')
 
+      if (['.html'].includes(file.ext)) {
+        return await ragApplication.addLoader(
+          new WebLoader({
+            urlOrContent: fileContent,
+            chunkSize: base.chunkSize,
+            chunkOverlap: base.chunkOverlap
+          }) as any,
+          forceReload
+        )
+      }
+
       return await ragApplication.addLoader(
         new TextLoader({ text: fileContent, chunkSize: base.chunkSize, chunkOverlap: base.chunkOverlap }),
         forceReload
diff --git a/src/renderer/src/pages/knowledge/KnowledgeContent.tsx b/src/renderer/src/pages/knowledge/KnowledgeContent.tsx
index 857be2ea..6474e08e 100644
--- a/src/renderer/src/pages/knowledge/KnowledgeContent.tsx
+++ b/src/renderer/src/pages/knowledge/KnowledgeContent.tsx
@@ -33,7 +33,7 @@ interface KnowledgeContentProps {
   selectedBase: KnowledgeBase
 }
 
-const fileTypes = ['.pdf', '.docx', '.pptx', '.xlsx', '.txt', '.md']
+const fileTypes = ['.pdf', '.docx', '.pptx', '.xlsx', '.txt', '.md', '.html']
 
 const KnowledgeContent: FC = ({ selectedBase }) => {
   const { t } = useTranslation()