chardet
filetype
python-magic
lxml
nltk
tabulate
requests

[all-docs]
python-pptx
msg_parser
pypandoc
pdf2image
xlrd
pandas
markdown
python-docx
unstructured-inference==0.5.7
pdfminer.six
Pillow<10
openpyxl

[azure]
adlfs
fsspec

[box]
boxfs
fsspec

[confluence]
atlassian-python-api

[csv]
pandas

[discord]
discord-py

[docx]
python-docx

[dropbox]
dropboxdrivefs
fsspec

[elasticsearch]
elasticsearch
jq

[epub]
pypandoc

[gcs]
gcsfs
fsspec

[github]
pygithub==1.58.2

[gitlab]
python-gitlab

[google-drive]
google-api-python-client

[huggingface]
langdetect
sacremoses
sentencepiece
torch
transformers

[image]
pdf2image
pdfminer.six
Pillow<10
unstructured-inference==0.5.7

[local-inference]
python-pptx
msg_parser
pypandoc
pdf2image
xlrd
pandas
markdown
python-docx
unstructured-inference==0.5.7
pdfminer.six
Pillow<10
openpyxl

[md]
markdown

[msg]
msg_parser

[odt]
python-docx
pypandoc

[onedrive]
msal
Office365-REST-Python-Client==2.4.2
cryptography==41.0.2

[org]
pypandoc

[outlook]
msal
Office365-REST-Python-Client==2.4.2
cryptography==41.0.2

[pdf]
pdf2image
pdfminer.six
Pillow<10
unstructured-inference==0.5.7

[pptx]
python-pptx

[reddit]
praw

[rst]
pypandoc

[rtf]
pypandoc

[s3]
s3fs
fsspec

[slack]
slack_sdk

[tsv]
pandas

[wikipedia]
wikipedia

[xlsx]
openpyxl
pandas
xlrd
