# PySpark dependencies (required)
py4j

# PySpark dependencies (optional)
numpy
pyarrow
pandas
scipy
plotly
mlflow>=1.0
sklearn
matplotlib<3.3.0

# PySpark test dependencies
xmlrunner

# PySpark test dependencies (optional)
coverage

# Linter
mypy
pytest-mypy-plugins==1.9.3
flake8==3.9.0
# See SPARK-38680.
pandas-stubs<1.2.0.54

# Documentation (SQL)
mkdocs

# Documentation (Python)
pydata_sphinx_theme
ipython
nbsphinx
numpydoc
jinja2<3.0.0
sphinx<3.1.0
sphinx-plotly-directive
docutils<0.18.0

# Development scripts
jira
PyGithub

# pandas API on Spark Code formatter.
black
py
