-
Notifications
You must be signed in to change notification settings - Fork 29
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Merge remote-tracking branch 'upstream/branch-0.37' into test-cuda-12.2
- Loading branch information
Showing
31 changed files
with
816 additions
and
219 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -57,3 +57,41 @@ jobs: | |
branch: ${{ inputs.branch }} | ||
date: ${{ inputs.date }} | ||
sha: ${{ inputs.sha }} | ||
wheel-build-ucxx: | ||
secrets: inherit | ||
uses: rapidsai/shared-workflows/.github/workflows/[email protected] | ||
with: | ||
build_type: ${{ inputs.build_type || 'branch' }} | ||
branch: ${{ inputs.branch }} | ||
sha: ${{ inputs.sha }} | ||
date: ${{ inputs.date }} | ||
script: ci/build_wheel_ucxx.sh | ||
wheel-publish-ucxx: | ||
needs: wheel-build-ucxx | ||
secrets: inherit | ||
uses: rapidsai/shared-workflows/.github/workflows/[email protected] | ||
with: | ||
build_type: ${{ inputs.build_type || 'branch' }} | ||
branch: ${{ inputs.branch }} | ||
sha: ${{ inputs.sha }} | ||
date: ${{ inputs.date }} | ||
package-name: ucxx | ||
wheel-build-distributed-ucxx: | ||
secrets: inherit | ||
uses: rapidsai/shared-workflows/.github/workflows/[email protected] | ||
with: | ||
build_type: ${{ inputs.build_type || 'branch' }} | ||
branch: ${{ inputs.branch }} | ||
sha: ${{ inputs.sha }} | ||
date: ${{ inputs.date }} | ||
script: ci/build_wheel_distributed_ucxx.sh | ||
wheel-publish-distributed-ucxx: | ||
needs: [wheel-build-ucxx, wheel-build-distributed-ucxx] | ||
secrets: inherit | ||
uses: rapidsai/shared-workflows/.github/workflows/[email protected] | ||
with: | ||
build_type: ${{ inputs.build_type || 'branch' }} | ||
branch: ${{ inputs.branch }} | ||
sha: ${{ inputs.sha }} | ||
date: ${{ inputs.date }} | ||
package-name: distributed_ucxx |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -17,6 +17,10 @@ jobs: | |
- docs-build | ||
- conda-cpp-tests | ||
- conda-python-tests | ||
- wheel-build-ucxx | ||
- wheel-tests-ucxx | ||
- wheel-build-distributed-ucxx | ||
- wheel-tests-distributed-ucxx | ||
secrets: inherit | ||
uses: rapidsai/shared-workflows/.github/workflows/[email protected] | ||
checks: | ||
|
@@ -54,3 +58,33 @@ jobs: | |
with: | ||
build_type: pull-request | ||
container-options: "--cap-add CAP_SYS_PTRACE --shm-size=8g --ulimit=nofile=1000000:1000000" | ||
wheel-build-ucxx: | ||
needs: checks | ||
secrets: inherit | ||
uses: rapidsai/shared-workflows/.github/workflows/[email protected] | ||
with: | ||
build_type: pull-request | ||
script: ci/build_wheel_ucxx.sh | ||
wheel-tests-ucxx: | ||
needs: wheel-build-ucxx | ||
secrets: inherit | ||
uses: rapidsai/shared-workflows/.github/workflows/[email protected] | ||
with: | ||
build_type: pull-request | ||
container-options: "--cap-add CAP_SYS_PTRACE --shm-size=8g --ulimit=nofile=1000000:1000000" | ||
script: ci/test_wheel_ucxx.sh | ||
wheel-build-distributed-ucxx: | ||
needs: checks | ||
secrets: inherit | ||
uses: rapidsai/shared-workflows/.github/workflows/[email protected] | ||
with: | ||
build_type: pull-request | ||
script: ci/build_wheel_distributed_ucxx.sh | ||
wheel-tests-distributed-ucxx: | ||
needs: [wheel-build-ucxx, wheel-build-distributed-ucxx] | ||
secrets: inherit | ||
uses: rapidsai/shared-workflows/.github/workflows/[email protected] | ||
with: | ||
build_type: pull-request | ||
container-options: "--cap-add CAP_SYS_PTRACE --shm-size=8g --ulimit=nofile=1000000:1000000" | ||
script: ci/test_wheel_distributed_ucxx.sh |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -32,3 +32,23 @@ jobs: | |
date: ${{ inputs.date }} | ||
sha: ${{ inputs.sha }} | ||
container-options: "--cap-add CAP_SYS_PTRACE --shm-size=8g --ulimit=nofile=1000000:1000000" | ||
wheel-tests-ucxx: | ||
secrets: inherit | ||
uses: rapidsai/shared-workflows/.github/workflows/[email protected] | ||
with: | ||
build_type: nightly | ||
branch: ${{ inputs.branch }} | ||
date: ${{ inputs.date }} | ||
sha: ${{ inputs.sha }} | ||
container-options: "--cap-add CAP_SYS_PTRACE --shm-size=8g --ulimit=nofile=1000000:1000000" | ||
script: ci/test_wheel_ucxx.sh | ||
wheel-tests-distributed-ucxx: | ||
secrets: inherit | ||
uses: rapidsai/shared-workflows/.github/workflows/[email protected] | ||
with: | ||
build_type: nightly | ||
branch: ${{ inputs.branch }} | ||
date: ${{ inputs.date }} | ||
sha: ${{ inputs.sha }} | ||
container-options: "--cap-add CAP_SYS_PTRACE --shm-size=8g --ulimit=nofile=1000000:1000000" | ||
script: ci/test_wheel_distributed_ucxx.sh |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1 @@ | ||
0.37.00 |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,147 @@ | ||
#!/bin/bash | ||
# Copyright (c) 2024, NVIDIA CORPORATION. | ||
|
||
set -euo pipefail | ||
|
||
package_name=$1 | ||
package_dir=$2 | ||
|
||
source rapids-configure-sccache | ||
source rapids-date-string | ||
|
||
version=$(rapids-generate-version) | ||
commit=$(git rev-parse HEAD) | ||
|
||
RAPIDS_PY_CUDA_SUFFIX="$(rapids-wheel-ctk-name-gen ${RAPIDS_CUDA_VERSION})" | ||
|
||
# This is the version of the suffix with a preceding hyphen. It's used | ||
# everywhere except in the final wheel name. | ||
PACKAGE_CUDA_SUFFIX="-${RAPIDS_PY_CUDA_SUFFIX}" | ||
|
||
# Patch project metadata files to include the CUDA version suffix and version override. | ||
pyproject_file="${package_dir}/pyproject.toml" | ||
|
||
sed -i -E "s/^name = \"${package_name}(.*)?\"$/name = \"${package_name}${PACKAGE_CUDA_SUFFIX}\"/g" ${pyproject_file} | ||
echo "${version}" > VERSION | ||
sed -i "/^__git_commit__/ s/= .*/= \"${commit}\"/g" "${package_dir}/${package_name//-/_}/_version.py" | ||
|
||
# For nightlies we want to ensure that we're pulling in alphas as well. The | ||
# easiest way to do so is to augment the spec with a constraint containing a | ||
# min alpha version that doesn't affect the version bounds but does allow usage | ||
# of alpha versions for that dependency without --pre | ||
alpha_spec='' | ||
if ! rapids-is-release-build; then | ||
alpha_spec=',>=0.0.0a0' | ||
fi | ||
|
||
if [[ ${package_name} == "distributed-ucxx" ]]; then | ||
sed -r -i "s/rapids-dask-dependency==(.*)\"/rapids-dask-dependency==\1${alpha_spec}\"/g" ${pyproject_file} | ||
sed -r -i "s/\"ucxx(.*)\"/\"ucxx${PACKAGE_CUDA_SUFFIX}\1${alpha_spec}\"/g" ${pyproject_file} | ||
|
||
python -m pip wheel "${package_dir}/" -w "${package_dir}/dist" -vvv --no-deps --disable-pip-version-check | ||
|
||
RAPIDS_PY_WHEEL_NAME="distributed_ucxx_${RAPIDS_PY_CUDA_SUFFIX}" rapids-upload-wheels-to-s3 ${package_dir}/dist | ||
elif [[ ${package_name} == "ucxx" ]]; then | ||
# Add -cuXX to package name | ||
sed -r -i "s/rapids-dask-dependency==(.*)\"/rapids-dask-dependency==\1${alpha_spec}\"/g" ${pyproject_file} | ||
sed -r -i "s/rmm(.*)\"/rmm${PACKAGE_CUDA_SUFFIX}\1${alpha_spec}\"/g" ${pyproject_file} | ||
sed -r -i "s/cudf(.*)\"/cudf${PACKAGE_CUDA_SUFFIX}\1${alpha_spec}\"/g" ${pyproject_file} | ||
|
||
# Update cupy package name (different suffix from RAPIDS) | ||
if [[ $PACKAGE_CUDA_SUFFIX == "-cu12" ]]; then | ||
sed -i "s/cupy-cuda11x/cupy-cuda12x/g" ${pyproject_file} | ||
fi | ||
|
||
SKBUILD_CMAKE_ARGS="-DUCXX_ENABLE_RMM=ON" \ | ||
python -m pip wheel "${package_dir}"/ -w "${package_dir}"/dist -vvv --no-deps --disable-pip-version-check | ||
|
||
python -m auditwheel repair -w ${package_dir}/final_dist ${package_dir}/dist/* | ||
|
||
# Auditwheel rewrites dynamic libraries that are referenced at link time in the | ||
# package. However, UCX loads a number of sub-libraries at runtime via dlopen; | ||
# these are not picked up by auditwheel. Since we have a priori knowledge of | ||
# what these libraries are, we mimic the behaviour of auditwheel by using the | ||
# same hash-based uniqueness scheme and rewriting the link paths. | ||
|
||
WHL=$(realpath ${package_dir}/final_dist/ucxx*manylinux*.whl) | ||
|
||
# first grab the auditwheel hashes for libuc{tms} | ||
LIBUCM=$(unzip -l $WHL | awk 'match($4, /libucm-[^\.]+\./) { print substr($4, RSTART) }') | ||
LIBUCT=$(unzip -l $WHL | awk 'match($4, /libuct-[^\.]+\./) { print substr($4, RSTART) }') | ||
LIBUCS=$(unzip -l $WHL | awk 'match($4, /libucs-[^\.]+\./) { print substr($4, RSTART) }') | ||
LIBNUMA=$(unzip -l $WHL | awk 'match($4, /libnuma-[^\.]+\./) { print substr($4, RSTART) }') | ||
|
||
# Extract the libraries that have already been patched in by auditwheel | ||
mkdir -p repair_dist/ucxx_${RAPIDS_PY_CUDA_SUFFIX}.libs/ucx | ||
unzip $WHL "ucxx_${RAPIDS_PY_CUDA_SUFFIX}.libs/*.so*" -d repair_dist/ | ||
|
||
# Patch the RPATH to include ORIGIN for each library | ||
pushd repair_dist/ucxx_${RAPIDS_PY_CUDA_SUFFIX}.libs | ||
for f in libu*.so* | ||
do | ||
if [[ -f $f ]]; then | ||
patchelf --add-rpath '$ORIGIN' $f | ||
fi | ||
done | ||
|
||
popd | ||
|
||
# Now copy in all the extra libraries that are only ever loaded at runtime | ||
pushd repair_dist/ucxx_${RAPIDS_PY_CUDA_SUFFIX}.libs/ucx | ||
if [[ -d /usr/lib64/ucx ]]; then | ||
cp -P /usr/lib64/ucx/* . | ||
elif [[ -d /usr/lib/ucx ]]; then | ||
cp -P /usr/lib/ucx/* . | ||
else | ||
echo "Could not find ucx libraries" | ||
exit 1 | ||
fi | ||
|
||
# we link against <python>/lib/site-packages/ucxx_${RAPIDS_PY_CUDA_SUFFIX}.lib/libuc{ptsm} | ||
# we also amend the rpath to search one directory above to *find* libuc{tsm} | ||
for f in libu*.so* | ||
do | ||
# Avoid patching symlinks, which is redundant | ||
if [[ ! -L $f ]]; then | ||
patchelf --replace-needed libuct.so.0 $LIBUCT $f | ||
patchelf --replace-needed libucs.so.0 $LIBUCS $f | ||
patchelf --replace-needed libucm.so.0 $LIBUCM $f | ||
patchelf --replace-needed libnuma.so.1 $LIBNUMA $f | ||
patchelf --add-rpath '$ORIGIN/..' $f | ||
fi | ||
done | ||
|
||
# Bring in cudart as well. To avoid symbol collision with other libraries e.g. | ||
# cupy we mimic auditwheel by renaming the libraries to include the hashes of | ||
# their names. Since there will typically be a chain of symlinks | ||
# libcudart.so->libcudart.so.X->libcudart.so.X.Y.Z we need to follow the chain | ||
# and rename all of them. | ||
|
||
find /usr/local/cuda/ -name "libcudart*.so*" | xargs cp -P -t . | ||
src=libcudart.so | ||
hash=$(sha256sum ${src} | awk '{print substr($1, 0, 8)}') | ||
target=$(basename $(readlink -f ${src})) | ||
|
||
mv ${target} ${target/libcudart/libcudart-${hash}} | ||
while readlink ${src} > /dev/null; do | ||
target=$(readlink ${src}) | ||
ln -s ${target/libcudart/libcudart-${hash}} ${src/libcudart/libcudart-${hash}} | ||
rm -f ${src} | ||
src=${target} | ||
done | ||
|
||
to_rewrite=$(ldd libuct_cuda.so | awk '/libcudart/ { print $1 }') | ||
patchelf --replace-needed ${to_rewrite} libcudart-${hash}.so libuct_cuda.so | ||
patchelf --add-rpath '$ORIGIN' libuct_cuda.so | ||
|
||
popd | ||
|
||
pushd repair_dist | ||
zip -r $WHL ucxx_${RAPIDS_PY_CUDA_SUFFIX}.libs/ | ||
popd | ||
|
||
RAPIDS_PY_WHEEL_NAME="ucxx_${RAPIDS_PY_CUDA_SUFFIX}" rapids-upload-wheels-to-s3 ${package_dir}/final_dist | ||
else | ||
echo "Unknown package '${package_name}'" | ||
exit 1 | ||
fi |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,8 @@ | ||
#!/bin/bash | ||
# Copyright (c) 2024, NVIDIA CORPORATION. | ||
|
||
set -euo pipefail | ||
|
||
package_dir="python/distributed-ucxx" | ||
|
||
./ci/build_wheel.sh distributed-ucxx ${package_dir} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,8 @@ | ||
#!/bin/bash | ||
# Copyright (c) 2024, NVIDIA CORPORATION. | ||
|
||
set -euo pipefail | ||
|
||
package_dir="python" | ||
|
||
./ci/build_wheel.sh ucxx ${package_dir} |
Oops, something went wrong.