# Unconditional requirements: these lines come before any `[extra]` section
# header, so they are not tied to an optional extra.
# NOTE(review): the layout matches a setuptools-generated `requires.txt`; if
# that is what this is, change the project's packaging config instead of
# hand-editing this file -- confirm.
httpx<=0.26,>=0.15
# `~=1.2.0` is a compatible-release pin: >=1.2.0 and ==1.2.*
deprecated~=1.2.0
packaging>=20.0
pydantic>=1.10.7
wrapt<1.15,>=1.14
tqdm<5.0.0,>=4.66.1
backoff
monotonic
# Excludes exactly 13.1.0; the reason is not recorded here.
rich!=13.1.0
typer<0.10.0,>=0.6.0
python-dotenv
minio
html5lib
fastapi<1.0.0
pypandoc~=1.13
beautifulsoup4~=4.12.2
pandas~=2.2.2
pandera[io]~=0.19.3
numpy~=1.26.4
spacy~=3.7.2
# Any 14.x release.
pyarrow==14.*
natsort~=8.4.0
rapidfuzz~=3.8.1
dill~=0.3.8
json-repair~=0.19.2
fastparquet
tiktoken
pymupdf
# llama-index and llama-index-core share the same 0.10.x compatible-release pin.
llama-index~=0.10.40
llama-index-core~=0.10.40
llama-index-callbacks-langfuse~=0.1.4
llama-index-llms-openai
llama-index-embeddings-openai
llama-index-multi-modal-llms-openai
weaviate-client>=4
llama-index-vector-stores-weaviate~=1.0.0

[integrations]
# Requirements that apply only when the `integrations` extra is requested.
PyYAML<6.1.0,>=5.4.1
datasets!=2.3.2,>1.17.0
huggingface_hub>=0.5.0
flair>=0.12.2
faiss-cpu
flyingsquid
pgmpy
plotly>=4.1.0
snorkel>=0.9.7
# No upper bound on spacy: the unconditional list at the top of this file
# requires spacy~=3.7.2, and a `<3.7.0` cap here would make this extra
# impossible to resolve.
spacy>=3.5.0
spacy-transformers>=1.2.5
spacy-huggingface-hub>=0.0.10
transformers[torch]>=4.30.0
evaluate
seqeval
# Single entry for sentence-transformers; an additional unpinned line would be
# redundant because all specifiers for one package are combined anyway.
sentence-transformers<3.0.0,>=2.0.0
setfit>=1.0.0
span_marker
textdescriptives<3.0.0,>=2.7.0
# NOTE(review): openai is capped below 1.0 here while the unconditional list
# pulls in llama-index-llms-openai / llama-index-embeddings-openai; verify that
# those packages still resolve with openai 0.x -- TODO confirm.
openai<1.0.0,>=0.27.10
peft
trl>=0.5.0
ipynbname

[listeners]
# `listeners` extra: schedule on the 1.1.x line (compatible-release pin, >=1.1.0).
schedule~=1.1.0

[nlp]
# `nlp` extra. textdescriptives is unbounded here, whereas the `integrations`
# section bounds it to >=2.7.0,<3.0.0.
textdescriptives
# setfit is held to 0.7.x here, but the `integrations` section requires
# setfit>=1.0.0, so the two extras cannot be installed together as written.
setfit~=0.7.0

[ocr]
# `ocr` extra: nougat-ocr with its `api` extra, plus pinned timm/transformers.
nougat-ocr[api]
# Exact pin; the reason is not recorded here.
timm==0.5.4
# transformers is held to 4.25.x here, but the `integrations` section requires
# transformers[torch]>=4.30.0, so the two extras cannot be installed together
# as written.
transformers~=4.25.1

[pdf]
# `pdf` extra. The `~=` entries are compatible-release pins (e.g. ~=0.12.3
# means >=0.12.3 and ==0.12.*); the remaining entries are unbounded.
unstructured[pdf]~=0.12.3
llmsherpa~=0.1.3
python-doctr~=0.8.1
deepdoctection
pypdf
pypdfium2
# pymupdf is also in the unconditional list at the top of this file, so this
# entry adds no new constraint.
pymupdf
pdf2image~=1.16.0

[server]
# `server` extra: extralit-server on the 0.2.x line (>=0.2.1).
extralit-server~=0.2.1

[server-postgresql]
# `server-postgresql` extra: the same extralit-server pin as the `server`
# section, with that package's own `postgresql` extra enabled.
extralit-server[postgresql]~=0.2.1

[tests]
# `tests` extra: pytest and its plugins are unbounded; only factory_boy is
# pinned.
pytest
pytest-cov
pytest-mock
pytest-xdist
pytest-asyncio
pytest-env
# Compatible-release pin: >=3.2.1 and ==3.2.*
factory_boy~=3.2.1
