From 574d2215ef0bffec08bd8c06c76ad5c8b7d9832c Mon Sep 17 00:00:00 2001 From: Tim Liu Date: Mon, 22 Jan 2024 23:05:34 +0800 Subject: [PATCH] Smoke test with '--packages' to fetch the plugin jar Fixes https://github.com/NVIDIA/spark-rapids/issues/10160. Run SPARK_SHELL_SMOKE_TEST with '--packages' to fetch the plugin jar. The plugin jar can be downloaded from a specified artifact repo via '--repositories'. This test can fetch the plugin jar from an internal Maven repo, Maven Central, or the Sonatype staging repo. Signed-off-by: Tim Liu --- integration_tests/run_pyspark_from_build.sh | 7 ++++++- jenkins/spark-tests.sh | 5 +++++ 2 files changed, 11 insertions(+), 1 deletion(-) diff --git a/integration_tests/run_pyspark_from_build.sh b/integration_tests/run_pyspark_from_build.sh index f6e32c72161..f98f167766c 100755 --- a/integration_tests/run_pyspark_from_build.sh +++ b/integration_tests/run_pyspark_from_build.sh @@ -1,5 +1,5 @@ #!/bin/bash -# Copyright (c) 2020-2023, NVIDIA CORPORATION. +# Copyright (c) 2020-2024, NVIDIA CORPORATION. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License.
@@ -333,6 +333,11 @@ EOF --driver-class-path "${PYSP_TEST_spark_driver_extraClassPath}" --conf spark.executor.extraClassPath="${PYSP_TEST_spark_driver_extraClassPath}" ) + elif [[ -n "$PYSP_TEST_spark_jars_packages" ]]; then + SPARK_SHELL_ARGS_ARR+=(--packages "${PYSP_TEST_spark_jars_packages}") + if [[ -n "$PYSP_TEST_spark_jars_repositories" ]]; then + SPARK_SHELL_ARGS_ARR+=(--repositories "${PYSP_TEST_spark_jars_repositories}") + fi else SPARK_SHELL_ARGS_ARR+=(--jars "${PYSP_TEST_spark_jars}") fi diff --git a/jenkins/spark-tests.sh b/jenkins/spark-tests.sh index 368a62ac1e8..0a455afcb10 100755 --- a/jenkins/spark-tests.sh +++ b/jenkins/spark-tests.sh @@ -304,6 +304,11 @@ if [[ $TEST_MODE == "DEFAULT" ]]; then PYSP_TEST_spark_shuffle_manager=com.nvidia.spark.rapids.${SHUFFLE_SPARK_SHIM}.RapidsShuffleManager \ ./run_pyspark_from_build.sh + SPARK_SHELL_SMOKE_TEST=1 \ + PYSP_TEST_spark_jars_packages=com.nvidia:rapids-4-spark_${SCALA_BINARY_VER}:${PROJECT_VER} \ + PYSP_TEST_spark_jars_repositories=${PROJECT_REPO} \ + ./run_pyspark_from_build.sh + # ParquetCachedBatchSerializer cache_test PYSP_TEST_spark_sql_cache_serializer=com.nvidia.spark.ParquetCachedBatchSerializer \ ./run_pyspark_from_build.sh -k cache_test