Added description for .ppt, specify the reason for unstructured.io (#9452)

Co-authored-by: crazywoola <427733928@qq.com>
This commit is contained in:
Zixuan Cheng 2024-10-24 07:13:06 -07:00 committed by GitHub
parent e71f494839
commit 88dec6ef2b
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@ -121,6 +121,8 @@ class ExtractProcessor:
extractor = UnstructuredEmailExtractor(file_path, unstructured_api_url, unstructured_api_key)
elif file_extension == ".ppt":
extractor = UnstructuredPPTExtractor(file_path, unstructured_api_url, unstructured_api_key)
# NOTE: unstructured_api_key must be configured beforehand,
# because it is required to parse .ppt documents.
elif file_extension == ".pptx":
extractor = UnstructuredPPTXExtractor(file_path, unstructured_api_url, unstructured_api_key)
elif file_extension == ".xml":