diff --git a/api/apps/dataset_api.py b/api/apps/dataset_api.py index d00c52bb..f8e2d193 100644 --- a/api/apps/dataset_api.py +++ b/api/apps/dataset_api.py @@ -381,6 +381,8 @@ def upload_documents(dataset_id): doc["parser_id"] = ParserType.AUDIO.value if re.search(r"\.(ppt|pptx|pages)$", filename): doc["parser_id"] = ParserType.PRESENTATION.value + if re.search(r"\.(eml)$", filename): + doc["parser_id"] = ParserType.EMAIL.value DocumentService.insert(doc) FileService.add_file_from_kb(doc, kb_folder["id"], dataset.tenant_id) diff --git a/api/apps/document_app.py b/api/apps/document_app.py index b33bff4c..0f69dc5e 100644 --- a/api/apps/document_app.py +++ b/api/apps/document_app.py @@ -139,6 +139,8 @@ def web_crawl(): doc["parser_id"] = ParserType.AUDIO.value if re.search(r"\.(ppt|pptx|pages)$", filename): doc["parser_id"] = ParserType.PRESENTATION.value + if re.search(r"\.(eml)$", filename): + doc["parser_id"] = ParserType.EMAIL.value DocumentService.insert(doc) FileService.add_file_from_kb(doc, kb_folder["id"], kb.tenant_id) except Exception as e: