blob: 76652df7448156203a13371d078e0b399799b2f5 [file] [log] [blame]
# PySpark dependencies (required)
py4j>=0.10.9.9
# PySpark dependencies (optional)
numpy>=1.22
pyarrow>=15.0.0
six==1.16.0
pandas>=2.2.0
scipy
plotly<6.0.0
mlflow>=2.3.1
scikit-learn
matplotlib
memory-profiler>=0.61.0
pyyaml>=3.11
# PySpark test dependencies
unittest-xml-reporting
openpyxl
# PySpark test dependencies (optional)
coverage
# Linter
mypy==1.8.0
pytest-mypy-plugins==1.9.3
flake8==3.9.0
# See SPARK-38680.
pandas-stubs<1.2.0.54
scipy-stubs; python_version>='3.10'
types-PyYAML
# Documentation (SQL)
mkdocs
# Documentation (Python)
pydata_sphinx_theme>=0.13
ipython
nbsphinx
numpydoc
jinja2
sphinx==4.5.0
# With sphinx 4.5.0, we need to set the upperbound version of sphinxcontrib*, it should be removed after upgrading sphinx>=5
sphinxcontrib-applehelp<=1.0.4
sphinxcontrib-devhelp<=1.0.2
sphinxcontrib-htmlhelp<=2.0.1
sphinxcontrib-jsmath<=1.0.1
sphinxcontrib-qthelp<=1.0.3
sphinxcontrib-serializinghtml<=1.1.5
sphinx-plotly-directive
sphinx-copybutton
docutils<0.18.0
markupsafe
# Development scripts
jira>=3.5.2
PyGithub
# pandas API on Spark Code formatter.
black==23.12.1
py
# Spark Connect (required)
grpcio>=1.67.0
grpcio-status>=1.67.0
googleapis-common-protos>=1.65.0
protobuf==5.29.5
# Spark Connect python proto generation plugin (optional)
mypy-protobuf==3.3.0
googleapis-common-protos-stubs==2.2.0
grpc-stubs==1.24.11
# Debug for Spark and Spark Connect
graphviz==0.20.3
flameprof==0.4
# TorchDistributor dependencies
torch
torchvision
torcheval
# DeepspeedTorchDistributor dependencies
deepspeed; sys_platform != 'darwin'