# Python package requirements in pip requirements-file format: one
# distribution per line.
#
# NOTE(review): every entry except pre-commit is listed without a version
# specifier, so the versions actually installed depend on when and where the
# install runs. Consider pinning (or adding a constraints file) if
# reproducible environments matter -- confirm with the project owners.
requests
numpy
pandas
fasttext
omegaconf
datasets
pyspark
scipy
trafilatura
html2text
faker
awscli
boto3
# The only pinned entry: exactly version 3.6.0.
pre-commit==3.6.0
