| # PySpark dependencies (required) |
| py4j |
| |
| # PySpark dependencies (optional) |
| numpy |
| pyarrow |
| pandas |
| scipy |
| plotly |
| mlflow>=1.0 |
| sklearn |
| matplotlib<3.3.0 |
| |
| # PySpark test dependencies |
| xmlrunner |
| |
| # PySpark test dependencies (optional) |
| coverage |
| |
| # Linter |
| mypy |
| pytest-mypy-plugins==1.9.3 |
| flake8==3.9.0 |
| # See SPARK-38680. |
| pandas-stubs<1.2.0.54 |
| |
| # Documentation (SQL) |
| mkdocs |
| |
| # Documentation (Python) |
| pydata_sphinx_theme |
| ipython |
| nbsphinx |
| numpydoc |
| jinja2<3.0.0 |
| sphinx<3.1.0 |
| sphinx-plotly-directive |
| |
| # Development scripts |
| jira |
| PyGithub |
| |
| # pandas API on Spark Code formatter. |
| black |