Skip to content

Commit

Permalink
Adding support for Spark 3.5 (#210)
Browse files Browse the repository at this point in the history
* Adding support for Spark 3.5

Skipping Spark 3.4 for now due to a dependency issue with Breeze; this will be revisited in a future PR.

* Added Spark 3.5 to workflow
  • Loading branch information
rdsharma26 authored Jul 2, 2024
1 parent 7ecb7da commit 11bafa3
Show file tree
Hide file tree
Showing 4 changed files with 5 additions and 4 deletions.
2 changes: 1 addition & 1 deletion .github/workflows/base.yml
Original file line number Diff line number Diff line change
Expand Up @@ -12,7 +12,7 @@ jobs:
strategy:
fail-fast: false
matrix:
- PYSPARK_VERSION: ["3.1.3", "3.2", "3.3"]
+ PYSPARK_VERSION: ["3.1.3", "3.2", "3.3", "3.5"]

steps:
- uses: actions/checkout@v3
Expand Down
4 changes: 2 additions & 2 deletions Dockerfile
Original file line number Diff line number Diff line change
Expand Up @@ -22,8 +22,8 @@ COPY poetry.lock /python-deequ
WORKDIR python-deequ

RUN poetry install -vvv
- RUN poetry add pyspark==3.3 -vvv
+ RUN poetry add pyspark==3.5.0 -vvv

- ENV SPARK_VERSION=3.3
+ ENV SPARK_VERSION=3.5
COPY . /python-deequ
CMD poetry run python -m pytest -s tests
1 change: 1 addition & 0 deletions pydeequ/configs.py
Original file line number Diff line number Diff line change
Expand Up @@ -5,6 +5,7 @@


SPARK_TO_DEEQU_COORD_MAPPING = {
+ "3.5": "com.amazon.deequ:deequ:2.0.7-spark-3.5",
"3.3": "com.amazon.deequ:deequ:2.0.7-spark-3.3",
"3.2": "com.amazon.deequ:deequ:2.0.7-spark-3.2",
"3.1": "com.amazon.deequ:deequ:2.0.7-spark-3.1"
Expand Down
2 changes: 1 addition & 1 deletion pyproject.toml
Original file line number Diff line number Diff line change
Expand Up @@ -28,7 +28,7 @@ classifiers = [


[tool.poetry.dependencies]
- python = ">=3.7,<4"
+ python = ">=3.8,<4"
numpy = ">=1.14.1"
pandas = ">=0.23.0"
pyspark = { version = ">=2.4.7, <3.3.0", optional = true }
Expand Down

0 comments on commit 11bafa3

Please sign in to comment.