diff --git a/.github/workflows/release-worker.yml b/.github/workflows/release-worker.yml index 71e6565a1..86aff4128 100644 --- a/.github/workflows/release-worker.yml +++ b/.github/workflows/release-worker.yml @@ -32,7 +32,7 @@ jobs: id: login-ecr with: registry-type: public - mask-password: 'true' + mask-password: "true" - name: Set version id: set-version @@ -49,3 +49,6 @@ jobs: ${{ steps.login-ecr.outputs.registry }}/n4e0e1y0/beta9-worker:latest target: final platforms: linux/amd64 + build-args: | + CEDANA_TOKEN=${{ secrets.CEDANA_TOKEN }} + CEDANA_BASE_URL=${{ secrets.CEDANA_BASE_URL }} diff --git a/docker/Dockerfile.worker b/docker/Dockerfile.worker index f0eec083a..636f682c6 100644 --- a/docker/Dockerfile.worker +++ b/docker/Dockerfile.worker @@ -88,9 +88,6 @@ RUN apt-get update && \ apt-get install psmisc RUN curl -L https://beam-runner-python-deps.s3.amazonaws.com/juicefs -o /usr/local/bin/juicefs && chmod +x /usr/local/bin/juicefs -RUN curl -L https://beam-runner-python-deps.s3.amazonaws.com/cedana-gpu-controller -o /usr/local/bin/cedana-gpu-controller && chmod +x /usr/local/bin/cedana-gpu-controller -RUN curl -L https://beam-runner-python-deps.s3.amazonaws.com/libcedana-gpu.so -o /usr/local/lib/libcedana-gpu.so && chmod +x /usr/local/lib/libcedana-gpu.so - RUN curl -fsSL https://tailscale.com/install.sh | sh RUN apt-get install -y --no-install-recommends nvidia-container-toolkit-base nvidia-container-toolkit @@ -107,7 +104,7 @@ if [ "$(uname -m)" = "x86_64" ]; then fi EOT -ARG CEDANA_VERSION=0.9.233 +ARG CEDANA_VERSION=0.9.234 RUN < - C/R failed: %v\n", containerId, err) } if restored { - // HOTFIX: If we restored from a checkpoint, we need to use the container ID of the restored container - // instead of the original container ID - containerInstance, exists := s.containerInstances.Get(request.ContainerId) - if exists { - containerInstance.Id = restoredContainerId - s.containerInstances.Set(containerId, containerInstance) - containerId = restoredContainerId - } - exitCode = s.waitForRestoredContainer(ctx, containerId, startedChan, outputChan, request, spec) return }