# blob: d6530d8ce282179625bbaa66d0445d4033369332 [file] [log] [blame]
# PySpark dependencies (required)
py4j>=0.10.9.7
# PySpark dependencies (optional)
numpy>=1.21
pyarrow>=4.0.0
six==1.16.0
pandas>=1.4.4
scipy
plotly
mlflow>=2.3.1
scikit-learn
matplotlib
memory-profiler>=0.61.0
# PySpark test dependencies
unittest-xml-reporting
openpyxl
# PySpark test dependencies (optional)
coverage
# Linter
mypy==1.8.0
pytest-mypy-plugins==1.9.3
flake8==3.9.0
# pandas-stubs is capped below 1.2.0.54; see SPARK-38680.
pandas-stubs<1.2.0.54
# Documentation (SQL)
mkdocs
# Documentation (Python)
pydata_sphinx_theme>=0.13
ipython
nbsphinx
numpydoc
jinja2
sphinx==4.5.0
sphinx-plotly-directive
sphinx-copybutton
docutils<0.18.0
markupsafe
# Development scripts
jira>=3.5.2
PyGithub
# Code formatter for pandas API on Spark.
black==23.9.1
py
# Spark Connect (required)
grpcio>=1.62.0
grpcio-status>=1.62.0
googleapis-common-protos>=1.56.4
# Spark Connect Python proto generation plugin (optional)
mypy-protobuf==3.3.0
googleapis-common-protos-stubs==2.2.0
grpc-stubs==1.24.11
# TorchDistributor dependencies
torch
torchvision
torcheval
# DeepspeedTorchDistributor dependencies
deepspeed; sys_platform != 'darwin'