diff --git a/.github/workflows/GithubActionTests.yml b/.github/workflows/GithubActionTests.yml index c4577ebddc1..9356003b5da 100644 --- a/.github/workflows/GithubActionTests.yml +++ b/.github/workflows/GithubActionTests.yml @@ -6,6 +6,7 @@ concurrency: jobs: test-linux: + if: ${{ false }} # FIXME name: Linux tests runs-on: ubuntu-latest strategy: @@ -34,13 +35,6 @@ jobs: conda list python setup.py install - - name: Build docker container - run: | - docker build -t quay.io/bioconda/bioconda-utils-build-env-cos7:latest ./ - docker history quay.io/bioconda/bioconda-utils-build-env-cos7:latest - docker run --rm -t quay.io/bioconda/bioconda-utils-build-env-cos7:latest sh -lec 'type -t conda && conda info --verbose && conda list' - docker build -t quay.io/bioconda/bioconda-utils-test-env-cos7:latest -f ./Dockerfile.test ./ - - name: Run tests '${{ matrix.py_test_marker }}' run: | eval "$(conda shell.bash hook)" @@ -51,6 +45,7 @@ jobs: echo "Skipping pytest - only docs modified" fi test-macosx: + if: ${{ false }} # FIXME name: OSX tests runs-on: macos-13 steps: @@ -83,6 +78,7 @@ jobs: fi autobump-test: + if: ${{ false }} # FIXME name: autobump test runs-on: ubuntu-latest steps: diff --git a/.github/workflows/build-image.yml b/.github/workflows/build-image.yml deleted file mode 100644 index 1ae6a9ec7bd..00000000000 --- a/.github/workflows/build-image.yml +++ /dev/null @@ -1,63 +0,0 @@ -name: Build image -concurrency: - group: ${{ github.workflow }}-${{ github.ref }} - cancel-in-progress: true - -on: - pull_request: - paths-ignore: - - '.circleci/**' - - 'docs/**' - - 'test/**' - -jobs: - build: - name: Build image - runs-on: ubuntu-20.04 - strategy: - matrix: - include: - - arch: arm64 - image: bioconda-utils-build-env-cos7-aarch64 - base_image: quay.io/condaforge/linux-anvil-aarch64 - - arch: amd64 - image: bioconda-utils-build-env-cos7 - base_image: quay.io/condaforge/linux-anvil-cos7-x86_64 - steps: - - uses: actions/checkout@v4 - with: - fetch-depth: 0 - - - id: get-tag - run: | - tag=${{ github.event.release && github.event.release.tag_name || github.sha }} - - # https://github.blog/changelog/2022-10-11-github-actions-deprecating-save-state-and-set-output-commands/ - # printf %s "::set-output name=tag::${tag#v}" - printf %s "tag=${tag#v}" >> $GITHUB_OUTPUT - - - name: Install qemu dependency - run: | - sudo apt-get update - sudo apt-get install -y qemu-user-static - - - name: Build image - id: buildah-build - uses: redhat-actions/buildah-build@v2 - with: - image: ${{ matrix.image }} - arch: ${{ matrix.arch }} - build-args: | - BASE_IMAGE=${{ matrix.base_image }} - tags: >- - latest - ${{ steps.get-tag.outputs.tag }} - dockerfiles: | - ./Dockerfile - - - name: Test built image - run: | - image='${{ steps.buildah-build.outputs.image }}' - for tag in ${{ steps.buildah-build.outputs.tags }} ; do - podman run --rm "${image}:${tag}" bioconda-utils --version - done diff --git a/.github/workflows/build-images.yml b/.github/workflows/build-images.yml new file mode 100644 index 00000000000..bcd3586e7f2 --- /dev/null +++ b/.github/workflows/build-images.yml @@ -0,0 +1,285 @@ +# Build all container images. +# +name: Build images +concurrency: + group: ${{ github.workflow }}-${{ github.ref }} + cancel-in-progress: true + +on: + pull_request: + paths-ignore: + - '.circleci/**' + - 'docs/**' + - 'test/**' +env: + # Used to override BIOCONDA_UTILS_VERSION in images/versions.sh + BIOCONDA_UTILS_VERSION: ${{ github.event.release && github.event.release.tag_name || github.head_ref || github.ref_name }} + +jobs: + + # JOBS FOR BUILDING IMAGES + # ---------------------------------------------------------------------- + # These jobs will build images for archs, put them into a manifest, and push + # that to GitHub Container Registry. Later, the testing jobs will test and + # push to quay.io. + + build-base-debian: + name: Build base-debian + runs-on: ubuntu-22.04 + outputs: + # A note on these TAG_EXISTS_* outputs: these allow subsequent jobs to + # change behavior (e.g., skip building or skip pushing to ghcr) depending + # on whether an image has already been created. + TAG_EXISTS_base-debian: ${{ steps.base-debian.outputs.TAG_EXISTS_base-debian }} + steps: + + - uses: actions/checkout@v4 + with: + fetch-depth: 0 + + - name: Install qemu dependency + run: | + sudo apt-get update + sudo apt-get install -y qemu-user-static + + - name: base-debian + id: base-debian + run: | + source images/versions.sh + if [ $(tag_exists $BASE_DEBIAN_IMAGE_NAME $BASE_TAG) ]; then + echo "TAG_EXISTS_base-debian=true" >> $GITHUB_OUTPUT + else + cd images && bash build.sh base-glibc-debian-bash + fi + + - name: push to ghcr + if: '${{ ! steps.base-debian.outputs.TAG_EXISTS_base-debian }}' + run: | + echo '${{ secrets.GITHUB_TOKEN }}' | podman login ghcr.io -u '${{ github.actor }}' --password-stdin + source images/versions.sh + push_to_ghcr $BASE_DEBIAN_IMAGE_NAME $BASE_TAG + + build-base-busybox: + name: Build base-busybox + runs-on: ubuntu-22.04 + outputs: + TAG_EXISTS_base-busybox: ${{ steps.base-busybox.outputs.TAG_EXISTS_base-busybox }} + steps: + + - uses: actions/checkout@v4 + with: + fetch-depth: 0 + + - name: Install qemu dependency + run: | + sudo apt-get update + sudo apt-get install -y qemu-user-static + + - name: base-busybox + id: base-busybox + run: | + source images/versions.sh + if [ $(tag_exists $BASE_BUSYBOX_IMAGE_NAME $BASE_TAG) ]; then + echo "TAG_EXISTS_base-busybox=true" >> $GITHUB_OUTPUT + else + cd images && bash build.sh base-glibc-busybox-bash + fi + + - name: push to ghcr + if: '${{ ! steps.base-busybox.outputs.TAG_EXISTS_base-busybox }}' + run: | + echo '${{ secrets.GITHUB_TOKEN }}' | podman login ghcr.io -u '${{ github.actor }}' --password-stdin + source images/versions.sh + push_to_ghcr $BASE_BUSYBOX_IMAGE_NAME $BASE_TAG + + build-build-env: + name: Build build-env + outputs: + TAG_EXISTS_build-env: ${{ steps.build-env.outputs.TAG_EXISTS_build-env }} + runs-on: ubuntu-22.04 + steps: + - uses: actions/checkout@v4 + with: + fetch-depth: 0 + + - name: Install qemu dependency + run: | + sudo apt-get update + sudo apt-get install -y qemu-user-static + + - name: build-env + id: build-env + run: | + source images/versions.sh + if [ $(tag_exists $BUILD_ENV_IMAGE_NAME $BIOCONDA_IMAGE_TAG) ]; then + echo "TAG_EXISTS_build-env=true" >> $GITHUB_OUTPUT + else + cd images && bash build.sh bioconda-utils-build-env-cos7 + fi + + - name: push to ghcr + if: '${{ ! steps.build-env.outputs.TAG_EXISTS_build-env }}' + run: | + echo '${{ secrets.GITHUB_TOKEN }}' | podman login ghcr.io -u '${{ github.actor }}' --password-stdin + source images/versions.sh + push_to_ghcr $BUILD_ENV_IMAGE_NAME $BIOCONDA_IMAGE_TAG + + build-create-env: + name: Build create-env + needs: [build-build-env, build-base-busybox] + outputs: + TAG_EXISTS_create-env: ${{ steps.create-env.outputs.TAG_EXISTS_create-env }} + runs-on: ubuntu-22.04 + steps: + - uses: actions/checkout@v4 + with: + fetch-depth: 0 + + - name: Install qemu dependency + run: | + sudo apt-get update + sudo apt-get install -y qemu-user-static + + - name: Build create-env + id: create-env + run: | + source images/versions.sh + echo '${{ secrets.GITHUB_TOKEN }}' | podman login ghcr.io -u '${{ github.actor }}' --password-stdin + if [ $(tag_exists $CREATE_ENV_IMAGE_NAME $BIOCONDA_IMAGE_TAG) ]; then + echo "TAG_EXISTS_create-env=true" >> $GITHUB_OUTPUT + else + cd images && bash build.sh create-env + fi + + - name: push to ghcr + if: '${{ ! steps.create-env.outputs.TAG_EXISTS_create-env }}' + run: | + echo '${{ secrets.GITHUB_TOKEN }}' | podman login ghcr.io -u '${{ github.actor }}' --password-stdin + source images/versions.sh + push_to_ghcr $CREATE_ENV_IMAGE_NAME $BIOCONDA_IMAGE_TAG + + + # END OF BUILDING IMAGES + # ---------------------------------------------------------------------- + # START TESTING + # These testing jobs will run the respective Dockerfile.test in each image + # directory. + + test: + name: test bioconda-utils with images + runs-on: ubuntu-20.04 + needs: [build-base-debian, build-base-busybox, build-build-env, build-create-env] + steps: + + - uses: actions/checkout@v4 + with: + fetch-depth: 0 + + # # Clone bioconda-recipes to use as part of the tests. + # - uses: actions/checkout@v4 + # with: + # fetch-depth: 0 + # repository: bioconda/bioconda-recipes + # path: recipes + + # - name: set path + # run: echo "/opt/mambaforge/bin" >> $GITHUB_PATH + + - name: Install bioconda-utils + run: | + export BIOCONDA_DISABLE_BUILD_PREP=1 + BRANCH=simplify-unify-containers + wget https://raw.githubusercontent.com/bioconda/bioconda-common/${BRANCH}/{common,install-and-set-up-conda,configure-conda}.sh + source images/versions.sh + + # Ensure install-and-set-up-conda uses same version as in the container + # (which uses images/versions.sh + export BIOCONDA_UTILS_TAG=$BIOCONDA_UTILS_VERSION + bash install-and-set-up-conda.sh + eval "$(conda shell.bash hook)" + conda create -n bioconda -y --file test-requirements.txt --file bioconda_utils/bioconda_utils-requirements.txt + conda activate bioconda + python setup.py install + + - name: test + run: | + eval "$(conda shell.bash hook)" + conda activate bioconda + + source images/versions.sh + + # Figure out which registry to use for each image, based on what was built. + [ ${{ needs.build-build-env.outputs.TAG_EXISTS_build-env }} ] && BUILD_ENV_REGISTRY='quay.io/bioconda' || BUILD_ENV_REGISTRY="ghcr.io/bioconda" + [ ${{ needs.build-create-env.outputs.TAG_EXISTS_create-env }} ] && CREATE_ENV_REGISTRY='quay.io/bioconda' || CREATE_ENV_REGISTRY="ghcr.io/bioconda" + [ ${{ needs.build-base-busybox.outputs.TAG_EXISTS_base_busybox }} ] && DEST_BASE_REGISTRY='quay.io/bioconda' || DEST_BASE_REGISTRY="ghcr.io/bioconda" + [ ${{ needs.build-base-debian.outputs.TAG_EXISTS_base_debian }} ] && DEST_EXTENDED_BASE_REGISTRY='quay.io/bioconda' || DEST_EXTENDED_BASE_REGISTRY="ghcr.io/bioconda" + + # Tell mulled-build which image to use + export DEST_BASE_IMAGE="${DEST_BASE_IMAGE_REGISTRY}/${BASE_BUSYBOX_IMAGE_NAME}:${BASE_TAG}" + export DEFAULT_BASE_IMAGE="${DEST_BASE_REGISTRY}/${BASE_BUSYBOX_IMAGE_NAME}" + export DEFAULT_EXTENDED_BASE_IMAGE="${DEST_EXTENDED_BASE_REGISTRY}/${BASE_DEBIAN_IMAGE_NAME}" + export BUILD_ENV_IMAGE="${BUILD_ENV_REGISTRY}/${BUILD_ENV_IMAGE_NAME}:${BIOCONDA_IMAGE_TAG}" + export CREATE_ENV_IMAGE="${CREATE_ENV_REGISTRY}/${CREATE_ENV_IMAGE_NAME}:${BIOCONDA_IMAGE_TAG}" + + # # Build a package with containers. + # cd recipes + # bioconda-utils build \ + # --docker-base-image "${BUILD_ENV_REGISTRY}/${BUILD_ENV_IMAGE_NAME}:${BIOCONDA_IMAGE_TAG}" \ + # --mulled-conda-image "${CREATE_ENV_REGISTRY}/${CREATE_ENV_IMAGE_NAME}:${BIOCONDA_IMAGE_TAG}" \ + # --packages seqtk \ + # --docker \ + # --mulled-test \ + # --force + + py.test --durations=0 test/ -v --log-level=DEBUG -k "docker" --tb=native + + # END TESTING + # ------------------------------------------------------------------------ + # START PUSHING IMAGES + + # For these push steps, a repository must first exist on quay.io/bioconda + # AND that repository must also be configured to allow write access for the + # appropriate service account. This must be done by a user with admin + # access to quay.io/bioconda. + # + # This uses the TAG_EXISTS_* outputs from previous jobs to determine if + # a push to quay.io should happen. + + push: + name: push images + runs-on: ubuntu-20.04 + needs: [build-base-debian, build-base-busybox, build-build-env, build-create-env, test] + steps: + + - uses: actions/checkout@v4 + with: + fetch-depth: 0 + + - name: push base-debian + if: ${{ ! needs.base-debian.outputs.TAG_EXISTS_base-debian }} + run: | + echo '${{ secrets.QUAY_BIOCONDA_TOKEN }}' | podman login quay.io -u '${{ secrets.QUAY_BIOCONDA_USERNAME }}' --password-stdin + source images/versions.sh + move_from_ghcr_to_quay ${BASE_DEBIAN_IMAGE_NAME} ${BASE_TAG} + + + - name: push base-busybox + if: ${{ ! needs.base-busybox.outputs.TAG_EXISTS_base-busybox }} + run: | + echo '${{ secrets.QUAY_BIOCONDA_TOKEN }}' | podman login quay.io -u '${{ secrets.QUAY_BIOCONDA_USERNAME }}' --password-stdin + source images/versions.sh + move_from_ghcr_to_quay ${BASE_BUSYBOX_IMAGE_NAME} ${BASE_TAG} + + - name: push create-env + if: ${{ ! needs.create-env.outputs.TAG_EXISTS_create-env }} + run: | + echo '${{ secrets.QUAY_BIOCONDA_TOKEN }}' | podman login quay.io -u '${{ secrets.QUAY_BIOCONDA_USERNAME }}' --password-stdin + source images/versions.sh + move_from_ghcr_to_quay ${CREATE_ENV_IMAGE_NAME} ${BIOCONDA_IMAGE_TAG} + + - name: push build-env + if: ${{ ! needs.build-env.outputs.TAG_EXISTS_build-env }} + run: | + echo '${{ secrets.QUAY_BIOCONDA_TOKEN }}' | podman login quay.io -u '${{ secrets.QUAY_BIOCONDA_USERNAME }}' --password-stdin + source images/versions.sh + move_from_ghcr_to_quay ${BUILD_ENV_IMAGE_NAME} ${BIOCONDA_IMAGE_TAG} diff --git a/.gitignore b/.gitignore index 1b98ca9bb87..1c13699dcea 100644 --- a/.gitignore +++ b/.gitignore @@ -15,3 +15,10 @@ docs/source/developer/_autosummary # Mac OS Files .DS_Store +env +recipes/ + +# files created when building images +images/*/metadata.txt +images/bioconda-utils-build-env-cos7/bioconda-utils +images/bioconda-utils-build-env-cos7/C.utf8 diff --git a/bioconda_utils/build.py b/bioconda_utils/build.py index 9ba35d7495b..358db668f33 100644 --- a/bioconda_utils/build.py +++ b/bioconda_utils/build.py @@ -56,7 +56,7 @@ def build(recipe: str, pkg_paths: List[str] = None, docker_builder: docker_utils.RecipeBuilder = None, raise_error: bool = False, linter=None, - mulled_conda_image: str = pkg_test.MULLED_CONDA_IMAGE, + mulled_conda_image: str = pkg_test.CREATE_ENV_IMAGE, record_build_failure: bool = False, dag: Optional[nx.DiGraph] = None, skiplist_leafs: bool = False, @@ -317,7 +317,7 @@ def build_recipes(recipe_folder: str, config_path: str, recipes: List[str], n_workers: int = 1, worker_offset: int = 0, keep_old_work: bool = False, - mulled_conda_image: str = pkg_test.MULLED_CONDA_IMAGE, + mulled_conda_image: str = pkg_test.CREATE_ENV_IMAGE, record_build_failures: bool = False, skiplist_leafs: bool = False, live_logs: bool = True, diff --git a/bioconda_utils/cli.py b/bioconda_utils/cli.py index 8f75948ce0f..eaed2c40f8b 100644 --- a/bioconda_utils/cli.py +++ b/bioconda_utils/cli.py @@ -445,7 +445,7 @@ def build(recipe_folder, config, packages="*", git_range=None, testonly=False, pkg_dir=None, anaconda_upload=False, mulled_upload_target=None, build_image=False, keep_image=False, lint=False, lint_exclude=None, check_channels=None, n_workers=1, worker_offset=0, keep_old_work=False, - mulled_conda_image=pkg_test.MULLED_CONDA_IMAGE, + mulled_conda_image=pkg_test.CREATE_ENV_IMAGE, docker_base_image=None, record_build_failures=False, skiplist_leafs=False, @@ -476,7 +476,12 @@ def build(recipe_folder, config, packages="*", git_range=None, testonly=False, logger.warning(f"Using tag {image_tag} for docker image, since there is no image for a not yet release version ({VERSION}).") else: image_tag = VERSION - docker_base_image = docker_base_image or f"quay.io/bioconda/bioconda-utils-build-env-cos7:{image_tag}" + + docker_base_image = ( + docker_base_image or + os.getenv("BUILD_ENV_IMAGE", None) or + docker_base_image or f"quay.io/bioconda/bioconda-utils-build-env-cos7:{image_tag}" + ) logger.info(f"Using docker image {docker_base_image} for building.") docker_builder = docker_utils.RecipeBuilder( diff --git a/bioconda_utils/pkg_test.py b/bioconda_utils/pkg_test.py index 97cea7f38b6..8d78d9f5a18 100644 --- a/bioconda_utils/pkg_test.py +++ b/bioconda_utils/pkg_test.py @@ -18,7 +18,8 @@ logger = logging.getLogger(__name__) -MULLED_CONDA_IMAGE = "quay.io/bioconda/create-env:latest" +# Will be provided to mulled-build via "CONDA_IMAGE" env var. +CREATE_ENV_IMAGE = os.getenv("CREATE_ENV_IMAGE", "quay.io/bioconda/create-env:latest") def get_tests(path): @@ -98,7 +99,7 @@ def test_package( channels=("conda-forge", "local", "bioconda"), mulled_args="", base_image=None, - conda_image=MULLED_CONDA_IMAGE, + conda_image=CREATE_ENV_IMAGE, live_logs = True, ): """ @@ -179,7 +180,10 @@ def test_package( env = os.environ.copy() if base_image is not None: env["DEST_BASE_IMAGE"] = base_image - env["CONDA_IMAGE"] = conda_image + if os.getenv("CONDA_IMAGE", None): + raise ValueError("CONDA_IMAGE env var already exists!") + else: + env["CONDA_IMAGE"] = conda_image with tempfile.TemporaryDirectory() as d: with utils.Progress(): p = utils.run(cmd, env=env, cwd=d, mask=False, live=live_logs) diff --git a/images/README.md b/images/README.md new file mode 100644 index 00000000000..565ca37c550 --- /dev/null +++ b/images/README.md @@ -0,0 +1,26 @@ +The intended use is to run `build.sh`, providing it an image directory. + + +Image directories must at least contain the following: + +- `prepare.sh` script, where the first line should be `source ../versions.sh` +- `Dockerfile` for building +- `Dockerfile.test` for testing. + +`build.sh` sources `/prepare.sh`, which sources `versions.sh` to +populate the env vars needed for that particular image. +`/prepare.sh` should also do any other needed work in preparation +for building. + +A note on locale: we prepare the C.utf8 locale ahead of time in +`locale/generate_locale.sh`. This can be copied over to image dirs if/when +needed by `prepare.sh`. Previously, we were preparing the locale each time in +an image and copying that out to subsequent image. Since this is expected to +change infrequently, storing it separately like this in the repo allows us to +remove the dependency of building that first image. + +E.g., + +``` +bash build.sh base-glibc-busybox-bash +``` diff --git a/images/base-glibc-busybox-bash/Dockerfile b/images/base-glibc-busybox-bash/Dockerfile new file mode 100644 index 00000000000..e875a2d41ac --- /dev/null +++ b/images/base-glibc-busybox-bash/Dockerfile @@ -0,0 +1,116 @@ +# Don't use Debian's busybox package since it only provides a smaller subset of +# BusyBox's functions (e.g., no administrative tools like adduser etc.). +# Since we create a glibc image anyway, we can also use a the slightly smaller +# dynamically linked binary. + +ARG debian_version +FROM "debian:${debian_version}-slim" AS build_base +RUN [ ! -f /etc/apt/sources.list ] || sed --in-place= --regexp-extended \ + '/ stretch/ { s,-updates,-backports, ; s,/(deb|security)\.,/archive., }' \ + /etc/apt/sources.list + + +FROM build_base AS rootfs_builder + +ARG busybox_image +COPY --from="${busybox_image}" /build /build +WORKDIR /busybox-rootfs +RUN arch="$( uname -m )" \ + && \ + mkdir -p ./bin ./sbin ./usr/bin ./usr/sbin \ + && \ + cp -al "/build/busybox.${arch}" ./bin/busybox \ + && \ + ldd ./bin/busybox \ + | grep --only-matching --extended-regexp '/lib\S+' \ + | xargs -n1 sh -xc 'mkdir -p ".${1%/*}" && cp -aL "${1}" ".${1%/*}"' -- \ + && \ + chroot . /bin/busybox --install \ + && \ + rm -rf ./lib* + +WORKDIR /rootfs + +RUN mkdir -p ./etc ./home ./opt ./root ./run /tmp ./usr ./var/log \ + && \ + for dir in bin lib sbin ; do \ + mkdir "./usr/${dir}" \ + && \ + if [ -L "/bin" ] ; then \ + ln -s "usr/${dir}" "./${dir}" ; \ + else \ + mkdir "./${dir}" ; \ + fi ; \ + done + +RUN find /busybox-rootfs -type f \ + -exec sh -c 'cp -al -- "${1}" "./${1#/busybox-rootfs/}"' -- '{}' ';' + +# Install helper tools used by install-pkgs. +RUN apt-get update -qq \ + && \ + DEBIAN_FRONTEND=noninteractive \ + apt-get install --yes --no-install-recommends \ + patchelf + +COPY install-pkgs /usr/local/bin +RUN install-pkgs "$( pwd )" /tmp/work \ + bash \ + base-passwd \ + libc-bin \ + login \ + ncurses-base \ + && \ + # Remove contents of /usr/local as downstream images overwrite those. + find ./usr/local/ \ + -mindepth 1 -depth \ + -delete + +RUN while IFS=: read _ _ uid gid _ home _ ; do \ + [ -n "${home##/var/run/*}" ] || home="${home#/var}" \ + && \ + [ -d "./${home#/}" ] || [ "${home}" = "/nonexistent" ] && continue ; \ + mkdir -p "./${home#/}" \ + && \ + chown "${uid}:${gid}" "./${home#/}" \ + && \ + chmod 775 "./${home#/}" \ + ; done < ./etc/passwd \ + && \ + pwck --read-only --root "$( pwd )" \ + | { ! grep -v -e 'no changes' -e '/nonexistent' ; } \ + && \ + grpck --read-only --root "$( pwd )" \ + && \ + find \ + -xdev -type f \! -path ./var/\* \! -path ./usr/share/\* \! -name \*.pl \ + | xargs -P0 -n100 sh -c \ + 'chroot . ldd -- "${@}" 2> /dev/null | sed -n "/:/h; /not found/{x;p;x;p}"' -- \ + | { ! grep . ; } + +# env-activate.sh (+ optionally env-execute) should be overwritten downstream. +# - env-activate.sh: +# Is sourced (via symlink in /etc/profile.d/) to activate the /usr/local env. +# - env-execute: +# Is set as the ENTRYPOINT to activate /usr/local before exec'ing CMD. +RUN touch ./usr/local/env-activate.sh \ + && \ + touch ./usr/local/env-execute \ + && \ + chmod +x ./usr/local/env-execute \ + && \ + ln -s \ + /usr/local/env-activate.sh \ + ./etc/profile.d/env-activate.sh \ + && \ + printf '%s\n' \ + '#! /bin/bash' \ + ". '/usr/local/env-activate.sh'" \ + 'exec "${@}"' \ + > ./usr/local/env-execute + +FROM scratch +COPY --from=rootfs_builder /rootfs / +ENV LANG=C.UTF-8 +ENTRYPOINT [ "/usr/local/env-execute" ] +CMD [ "bash" ] diff --git a/images/base-glibc-busybox-bash/Dockerfile.busybox b/images/base-glibc-busybox-bash/Dockerfile.busybox new file mode 100644 index 00000000000..fcbd60bd350 --- /dev/null +++ b/images/base-glibc-busybox-bash/Dockerfile.busybox @@ -0,0 +1,23 @@ +# Build busybox ourselves to have more fine-grained control over what we want +# (or not want) to include. +# Use old Debian version to ensure compatible (low glibc requirement) binaries. +FROM debian:9-slim AS busybox_builder +RUN [ ! -f /etc/apt/sources.list ] || sed --in-place= --regexp-extended \ + '/ stretch/ { s,-updates,-backports, ; s,/(deb|security)\.,/archive., }' \ + /etc/apt/sources.list \ + && \ + apt-get update && \ + DEBIAN_FRONTEND=noninteractive \ + apt-get install --yes --no-install-recommends \ + bzip2 curl ca-certificates tar \ + gcc libc6-dev \ + gcc-aarch64-linux-gnu libc6-dev-arm64-cross \ + make patch + +WORKDIR /build +COPY build-busybox ./ +ARG busybox_version +RUN ./build-busybox \ + "${busybox_version}" \ + x86_64 aarch64 + diff --git a/images/base-glibc-busybox-bash/Dockerfile.test b/images/base-glibc-busybox-bash/Dockerfile.test new file mode 100644 index 00000000000..feba4402b8a --- /dev/null +++ b/images/base-glibc-busybox-bash/Dockerfile.test @@ -0,0 +1,27 @@ +ARG base +FROM "${base}" + +# Check if env-activate.sh gets sourced for login shell and in env-execute. +RUN [ "$( sh -lc 'printf world' )" = 'world' ] \ + && \ + [ "$( /usr/local/env-execute sh -c 'printf world' )" = 'world' ] \ + && \ + printf '%s\n' \ + 'printf "hello "' \ + > /usr/local/env-activate.sh \ + && \ + [ "$( sh -lc 'printf world' )" = 'hello world' ] \ + && \ + [ "$( /usr/local/env-execute sh -c 'printf world' )" = 'hello world' ] \ + && \ + printf '' \ + > /usr/local/env-activate.sh + +RUN arch=$(uname -m) \ + && \ + wget --quiet \ + "https://github.com/conda-forge/miniforge/releases/latest/download/Miniforge3-Linux-${arch}.sh" \ + && \ + sh ./Miniforge3-Linux-${arch}.sh -bp /opt/conda \ + && \ + /opt/conda/bin/conda info --all diff --git a/images/base-glibc-busybox-bash/build-busybox b/images/base-glibc-busybox-bash/build-busybox new file mode 100755 index 00000000000..902b33753d8 --- /dev/null +++ b/images/base-glibc-busybox-bash/build-busybox @@ -0,0 +1,140 @@ +#! /bin/sh +set -xeu + +download() { + curl --location --silent \ + "https://busybox.net/downloads/busybox-${version}.tar.bz2" \ + | tar -xjf- --strip-components=1 +} + +patch() { + case "${version}" in 1.36.* ) + # Small fix to let it build with older glibc versions. + curl --location --silent \ + 'https://git.busybox.net/busybox/patch/miscutils/seedrng.c?id=200a9669fbf6f06894e4243cccc9fc11a1a6073a' \ + 'https://git.busybox.net/busybox/patch/miscutils/seedrng.c?id=cb57abb46f06f4ede8d9ccbdaac67377fdf416cf' \ + | command patch --strip=1 + esac + + # Add support for running busybox wget without OpenSSL under QEMU. + # (NB: If we run into other QEMU+BusyBox problems that needs debugging: That + # vfork issue might affect other BusyBox parts, so check for it first.) + command patch --strip=1 <<'EOP' +From e7b57533ffcd5842fa93f5aa96949b3eaed54b67 Mon Sep 17 00:00:00 2001 +From: Marcel Bargull +Date: Sat, 14 Oct 2023 22:58:42 +0200 +Subject: [PATCH] wget: don't assume vfork blocking for openssl exec + +Under QEMU, busybox wget fails to fallback to busybox ssl_client in case +openssl s_client can't be executed because QEMU's vfork does not block. +Ref.: https://man7.org/linux/man-pages/man2/vfork.2.html#VERSIONS + +Signed-off-by: Marcel Bargull +--- + networking/wget.c | 24 +++++++++++++++++++++--- + 1 file changed, 21 insertions(+), 3 deletions(-) + +diff --git a/networking/wget.c b/networking/wget.c +index 9ec0e67b9..4bcc26e86 100644 +--- a/networking/wget.c ++++ b/networking/wget.c +@@ -683,3 +683,9 @@ static int spawn_https_helper_openssl(const char *host, unsigned port) + int pid; +- IF_FEATURE_WGET_HTTPS(volatile int child_failed = 0;) ++ ++# if ENABLE_FEATURE_WGET_HTTPS ++ struct fd_pair status; ++ int exec_errno = 0; ++ ++ xpiped_pair(status); ++# endif + +@@ -701,2 +707,7 @@ static int spawn_https_helper_openssl(const char *host, unsigned port) + ++# if ENABLE_FEATURE_WGET_HTTPS ++ close(status.rd); ++ if (fcntl(status.wr, F_SETFD, FD_CLOEXEC) != 0) ++ bb_simple_perror_msg_and_die("fcntl"); ++# endif + close(sp[0]); +@@ -743,5 +754,8 @@ static int spawn_https_helper_openssl(const char *host, unsigned port) + BB_EXECVP(argv[0], argv); ++ exec_errno = errno; + xmove_fd(3, 2); + # if ENABLE_FEATURE_WGET_HTTPS +- child_failed = 1; ++ if (write(status.wr, &exec_errno, sizeof(exec_errno)) != sizeof(exec_errno)) ++ bb_simple_perror_msg_and_die("write"); ++ close(status.wr); + xfunc_die(); +@@ -758,3 +772,7 @@ static int spawn_https_helper_openssl(const char *host, unsigned port) + # if ENABLE_FEATURE_WGET_HTTPS +- if (child_failed) { ++ close(status.wr); ++ if (read(status.rd, &exec_errno, sizeof(exec_errno)) == -1) ++ bb_simple_perror_msg_and_die("read"); ++ close(status.rd); ++ if (exec_errno) { + close(sp[0]); +EOP +} + +config() { + make defconfig + mv .config .defconfig + # Set CONFIG_SUBST_WCHAR=0 for better Unicode support and remove big components. + printf %s\\n \ + CONFIG_AR=y \ + CONFIG_FEATURE_AR_CREATE=y \ + CONFIG_FEATURE_AR_LONG_FILENAMES=y \ + CONFIG_SUBST_WCHAR=0 \ + CONFIG_RPM=n \ + CONFIG_RPM2CPIO=n \ + CONFIG_FSCK_MINIX=n \ + CONFIG_MKFS_MINIX=n \ + CONFIG_BC=n \ + CONFIG_DC=n \ + CONFIG_HDPARM=n \ + CONFIG_HEXEDIT=n \ + CONFIG_I2CGET=n \ + CONFIG_I2CSET=n \ + CONFIG_I2CDUMP=n \ + CONFIG_I2CDETECT=n \ + CONFIG_I2CTRANSFER=n \ + CONFIG_DNSD=n \ + CONFIG_FTPD=n \ + CONFIG_HTTPD=n \ + CONFIG_TCPSVD=n \ + CONFIG_UDPSVD=n \ + CONFIG_UDHCPD=n \ + CONFIG_SH_IS_ASH=n \ + CONFIG_SH_IS_NONE=y \ + CONFIG_SHELL_ASH=n \ + CONFIG_ASH=n \ + CONFIG_HUSH=n \ + CONFIG_SHELL_HUSH=n \ + | cat - .defconfig \ + > .config + # make still asks which shell to use for sh although CONFIG_SH_IS_NONE=y is set!? + printf \\n | make oldconfig +} + +build() { + make -j "$( nproc )" busybox +} + +main() { + version="${1}" + shift + download + patch + for target ; do + export MAKEFLAGS="ARCH=${target} CROSS_COMPILE=${target}-linux-gnu-" + make clean + config + build + cp -al ./busybox "./busybox.${target}" + done +} + +main "${@}" diff --git a/images/base-glibc-busybox-bash/install-pkgs b/images/base-glibc-busybox-bash/install-pkgs new file mode 100755 index 00000000000..fdb483dd268 --- /dev/null +++ b/images/base-glibc-busybox-bash/install-pkgs @@ -0,0 +1,361 @@ +#! /bin/sh +set -xeu + +arch=$(uname -m) + +prepare_remove_docs() { + # remove lintian and docs (apart from copyright) + rm -rf \ + ./usr/share/lintian \ + ./usr/share/man + find ./usr/share/doc/ -type f ! -name copyright -delete + find ./usr/share/doc/ -type d -empty -delete +} + + +prepare_usrmerge() { + # If we are on Debian >=12, /bin et al. are symlinks to /usr/ counterparts. + # Since we don't do full apt installs, we accomodate for it here. + if [ -L "${root_fs}/bin" ] ; then + for dir in bin lib* sbin ; do + [ -d "./${dir}" ] || continue + [ -L "./${dir}" ] && continue + mkdir -p ./usr + cp -ral "./${dir}" ./usr/ + rm -rf "./${dir}" + ln -s "usr/${dir}" "${dir}" + done + fi +} + + +add_rpath() { + local binary="${1}" + shift + local new_rpath="${1}" + shift + local rpath + rpath="$( + patchelf \ + --print-rpath \ + "${binary}" + )" + patchelf \ + --set-rpath \ + "${rpath:+${rpath}:}${new_rpath}" \ + "${binary}" +} + + +prepare() { + local pkg="${1}" + shift + local destdir="${1}" + shift + + case "${pkg}" in + libc6 ) + # To reduce image size, remove all charset conversion modules apart + # from smaller ones for some common encodings. + # Update gconv-modules accordingly. + # NOTE: When adding/removing any, check required dyn. linked libs! + + local gconv_path="./usr/lib/${arch}-linux-gnu/gconv" + local gconv_modules_regex + if [ -e "${gconv_path}/gconv-modules.d/gconv-modules-extra.conf" ] ; then + gconv_modules_regex="$( + sed -nE 's/^module\s+\S+\s+\S+\s+(\S+)\s+.*/\1/p' \ + < "${gconv_path}/gconv-modules" \ + | sort -u \ + | tr '\n' '|' \ + | sed 's/|$//' + )" + : > "${gconv_path}/gconv-modules.d/gconv-modules-extra.conf" + else + gconv_modules_regex='UTF-\w+|UNICODE|ISO8859-(1|15)|CP1252|ANSI_X3\.110' + local gconv_modules_file_tmp='./.tmp.gconv-modules' + + mv "${gconv_path}"/gconv-modules "${gconv_modules_file_tmp}" + + grep -E \ + '^\s*$|^#|^(alias\s+.*|module\s+[^\s]+\s+[^\s]+)\s+\<('"${gconv_modules_regex}"')(//|\s)' \ + "${gconv_modules_file_tmp}" \ + | sed -nEe '1N;N;/^(#.*)\n.*\1/{D;D};P;D' | cat -s \ + > "${gconv_path}"/gconv-modules + rm "${gconv_modules_file_tmp}" + fi + + find "${gconv_path}" \ + -mindepth 1 -maxdepth 1 \ + -name '*.so' \ + -type f \ + -regextype posix-extended \ + ! -regex '.*/('"${gconv_modules_regex}"').so' \ + -print -delete + + iconvconfig --prefix ./ + + ;; + bash ) + rm -rf ./usr/share/locale + # Add custom rpath for libtinfo (see below) to bash binaries. + local new_rpath="/lib/${arch}-linux-gnu/terminfo:/usr/lib/${arch}-linux-gnu/terminfo" + add_rpath ./bin/bash "${new_rpath}" + add_rpath ./usr/bin/clear_console "${new_rpath}" + ;; + libtinfo* ) + # Move libtinfo libraries to a custom path to ensure it is not + # unintentionally used in downstream images. + find ./usr/lib/${arch}-linux-gnu -type f \ + | { + while read binary ; do + add_rpath "${binary}" "/lib/${arch}-linux-gnu/terminfo" + done + } + + mv ./lib/${arch}-linux-gnu ./temp + mkdir ./lib/${arch}-linux-gnu + mv ./temp ./lib/${arch}-linux-gnu/terminfo + + mv ./usr/lib/${arch}-linux-gnu ./temp + mkdir ./usr/lib/${arch}-linux-gnu + mv ./temp ./usr/lib/${arch}-linux-gnu/terminfo + ;; + base-passwd ) + # The dependencies libdebconfclient0 (and libselinux1 for Debian>=12) + # are needed for update-passwd, but we ignore them => remove the binary. + rm ./usr/sbin/update-passwd + ;; + login ) + rm -rf ./usr/share/locale + # The following binaries provided by BusyBox or pull in more dependencies + # (PAM, libselinux1, and their dependencies) => remove them. + rm -f \ + ./bin/login \ + ./bin/su \ + ./usr/bin/lastlog \ + ./usr/bin/newgrp \ + ./usr/bin/sg + ;; + libc-bin | \ + libgcc1 | \ + base-files | \ + gcc-*-base | \ + libcrypt1 | \ + libgcc-s1 | \ + libdebconfclient0 | \ + libpcre* | \ + libselinux1 | \ + ncurses-base | \ + zlib1g ) + : + ;; + * ) + # Abort if we get an unexpected package. + printf %s\\n "\`prepare\` not defined for ${pkg}" >&2 + return 1 + ;; + esac + prepare_remove_docs + prepare_usrmerge +} + + +postinst_ldconfig_trigger() { + ldconfig --verbose -r ./ +} + + +postinst() { + local pkg="${1}" + shift + local destdir="${1}" + shift + + case "${pkg}" in + libc-bin ) + cp -p --remove-destination \ + ./usr/share/libc-bin/nsswitch.conf \ + ./etc/nsswitch.conf + postinst_ldconfig_trigger + ;; + base-files ) + cp "${destdir}/DEBIAN/postinst" ./base-files-postinst + chroot ./ sh /base-files-postinst configure + rm ./base-files-postinst + ;; + base-passwd ) + mkdir -p "${destdir}/etc" + cp -p --remove-destination \ + "${destdir}/usr/share/base-passwd/group.master" \ + ./etc/group + cp -p --remove-destination \ + "${destdir}/usr/share/base-passwd/passwd.master" \ + ./etc/passwd + DPKG_ROOT="$( pwd )" \ + shadowconfig on + ;; + login ) + for file in /var/log/faillog /etc/subuid /etc/subgid ; do + [ -f "./${file}" ] || continue + touch "${file}" + chown 0:0 "${file}" + chmod 644 "${file}" + done + ;; + bash ) + # Replace BusyBox's sh by Bash + rm -f ./bin/sh + ln -s /bin/bash ./bin/sh + chroot ./ add-shell /bin/sh + chroot ./ add-shell /bin/bash + chroot ./ add-shell /bin/rbash + # Bash 4.* did not have default key bindings for control-arrow-key key + # combinations. Add some for convenience: + cat >> ./etc/inputrc <<'EOF' + +"\e[5C": forward-word +"\e[5D": backward-word +"\e\e[C": forward-word +"\e\e[D": backward-word +"\e[1;5C": forward-word +"\e[1;5D": backward-word +EOF + ;; + libc6 | \ + libdebconfclient0 | \ + libgcc1 | \ + libcrypt1 | \ + libgcc-s1 | \ + libpcre* | \ + libselinux1 | \ + libtinfo* | \ + zlib1g ) + postinst_ldconfig_trigger + ;; + gcc-*-base | \ + ncurses-base ) + : + ;; + * ) + # Abort if we get an unexpected package. + printf %s\\n "\`postinst\` not defined for ${pkg}" >&2 + return 1 + ;; + esac +} + + +install_pkg() { + local pkg="${1}" + shift + + local work_dir="${work_base}/${pkg}" + mkdir "${work_dir}" + cd "${work_dir}" + + # Download package + apt-get download "${pkg}" + local deb_file + deb_file="$( find "$( pwd )" -maxdepth 1 -name '*.deb' )" + + # Prepare package + local destdir="${work_dir}/destdir" + mkdir "${destdir}" + cd "${destdir}" + dpkg-deb --raw-extract "${deb_file}" ./ + prepare "${pkg}" "${destdir}" + dpkg-deb --build ./ "${deb_file}" + cd "${work_dir}" + + # Extract package + dpkg-deb --vextract "${deb_file}" "${root_fs}" + rm "${deb_file}" + printf %s\\n "$( basename "${deb_file}" )" >> "${root_fs}/.deb.lst" + + # Finalize package installation + cd "${root_fs}" + postinst "${pkg}" "${destdir}" + + cd "${work_base}" + rm -rf "${work_dir}" + printf %s\\n "${pkg}" >> "${root_fs}/.pkg.lst" +} + + +get_deps() { + [ -z "${*}" ] && return 0 + + # Instead of using `apt-cache depends --recurse` or `debfoster -d`, recurse + # manually so that we can exclude some packages that are either already + # installed or would pull in files/packages we don't need. + + local ignore_pkgs + ignore_pkgs="$( + printf %s\\n \ + base-files '' debianutils dash \ + libdebconfclient0 libselinux1 \ + libaudit1 libpam-modules libpam-runtime libpam0g \ + | grep -vFx "$( printf %s\\n "${@}" )" + )" + [ -f "${root_fs}/.pkg.lst" ] && \ + ignore_pkgs=$( printf %s\\n ${ignore_pkgs} $( cat -s "${root_fs}/.pkg.lst" ) ) + + local new_pkgs="${*}" + local old_pkgs='' + while ! [ "${new_pkgs}" = "${old_pkgs}" ] ; do + old_pkgs="${new_pkgs}" + new_pkgs="$( + apt-cache depends \ + --no-recommends --no-suggests --no-conflicts \ + --no-breaks --no-replaces --no-enhances \ + ${old_pkgs} \ + | sed -n 's/.*Depends: //p' | cat -s + )" + new_pkgs="$( + printf %s\\n ${old_pkgs} ${new_pkgs} \ + | sort -u \ + | grep -vFx "$( printf %s\\n ${ignore_pkgs} )" + )" + done + printf %s\\n ${new_pkgs} +} + + +install_with_deps() { + get_deps "${@}" | while read -r pkg ; do + install_pkg "${pkg}" + done +} + + +main() { + root_fs="${1}" + shift + work_base="${1}" + shift + + mkdir -p "${work_base}" + cd "${work_base}" + + apt-get update + + # Unconditionally install glibc (package libc6). + # Also install dependencies acc. to `apt-cache depends`: + # - libgcc1 only consists of libgcc_s.so.1 (+ docs, which we remove). + # - gcc-*-base only has empty directories (+ docs, which we remove). + install_with_deps libc6 + + # libc-bin must be in ${@} for Unicode support (C.UTF-8 locale). + install_with_deps "${@}" + + # base-files contains /usr/share/common-licenses/, /etc/profile, etc. + # Install base-files afterwards so we have a working sh for the postinst. + install_with_deps base-files + + cd "${root_fs}" + rm -rf "${work_base}" +} + + +main "${@}" diff --git a/images/base-glibc-busybox-bash/prepare.sh b/images/base-glibc-busybox-bash/prepare.sh new file mode 100644 index 00000000000..c97209955da --- /dev/null +++ b/images/base-glibc-busybox-bash/prepare.sh @@ -0,0 +1,24 @@ +source ../versions.sh +IMAGE_NAME="${BASE_BUSYBOX_IMAGE_NAME}" +TAG="$BASE_TAG" + +# Build busybox binaries for each arch. +# +# The respective busybox base containers for each arch will later extract the +# relevant binary from this image. + +BUILD_ARGS=() +BUILD_ARGS+=("--build-arg=debian_version=${DEBIAN_VERSION}") +BUILD_ARGS+=("--build-arg=busybox_version=${BUSYBOX_VERSION}") +iidfile="$( mktemp )" +buildah bud \ + --iidfile="${iidfile}" \ + --file=Dockerfile.busybox \ + ${BUILD_ARGS[@]} +busybox_image="$( cat "${iidfile}" )" +rm "${iidfile}" + +# Override build args for what's needed in main Dockerfile +BUILD_ARGS=() +BUILD_ARGS+=("--build-arg=debian_version=${DEBIAN_VERSION}") +BUILD_ARGS+=("--build-arg=busybox_image=${busybox_image}") diff --git a/images/base-glibc-debian-bash/Dockerfile b/images/base-glibc-debian-bash/Dockerfile new file mode 100644 index 00000000000..c0adc29222d --- /dev/null +++ b/images/base-glibc-debian-bash/Dockerfile @@ -0,0 +1,131 @@ +ARG debian_version + +FROM "debian:${debian_version}-slim" +RUN [ ! -f /etc/apt/sources.list ] || sed --in-place= --regexp-extended \ + '/ stretch/ { s,-updates,-backports, ; s,/(deb|security)\.,/archive., }' \ + /etc/apt/sources.list \ + && \ + apt-get update -qq \ + && \ + # Add en_US.UTF-8 locale. + printf '%s\n' 'en_US.UTF-8 UTF-8' \ + >> /etc/locale.gen \ + && \ + DEBIAN_FRONTEND=noninteractive \ + apt-get install --yes --no-install-recommends \ + $( \ + . /etc/os-release \ + && \ + [ "${VERSION_ID-10}" -lt 10 ] \ + && \ + printf '%s\n' \ + libegl1-mesa \ + libgl1-mesa-glx \ + || \ + printf '%s\n' \ + libegl1 \ + libgl1 \ + libglx-mesa0 \ + ) \ + libglvnd0 \ + libopengl0 \ + locales \ + openssh-client \ + procps \ + && \ + # Remove "locales" package, but keep the generated locale. + sed -i \ + 's/\s*rm .*locale-archive$/: &/' \ + /var/lib/dpkg/info/locales.prerm \ + && \ + DEBIAN_FRONTEND=noninteractive \ + apt-get remove --yes \ + locales \ + && \ + # On Debian 10 (and 11) libgl1-mesa-glx pulls in libgl1-mesa-dri (which in + # turn has more heavy-weight dependencies). We leave these out of the image + # (by manually removing it from "Depends:" list) like we do with Debian 9. + sed -i \ + '/^Depends:/ s/, libgl1-mesa-dri\>//g' \ + /var/lib/dpkg/status \ + && \ + DEBIAN_FRONTEND=noninteractive \ + apt-get autoremove --yes \ + && \ + # Remove apt package lists. + rm -rf /var/lib/apt/lists/* \ + && \ + # Remove contents of /usr/local as downstream images overwrite those. + find ./usr/local/ \ + -mindepth 1 -depth \ + -delete + +RUN dpkg-query --show --showformat \ + '${db:Status-Status} ${Package}\n' \ + | sed -n 's/:/%3a/g ; s/^installed //p' \ + > /.pkg.lst \ + && \ + dpkg-query --show --showformat \ + '${db:Status-Status} ${Package}_${Version}_${Architecture}\n' \ + | sed -n 's/:/%3a/g ; s/$/.deb/ ; s/^installed //p' \ + > /.deb.lst + +RUN while IFS=: read _ _ uid gid _ home _ ; do \ + [ -n "${home##/var/run/*}" ] || home="${home#/var}" \ + && \ + [ -d "./${home#/}" ] || [ "${home}" = "/nonexistent" ] && continue ; \ + mkdir -p "./${home#/}" \ + && \ + chown "${uid}:${gid}" "./${home#/}" \ + && \ + chmod 775 "./${home#/}" \ + ; done < ./etc/passwd \ + && \ + pwck --read-only --root "$( pwd )" \ + | { ! grep -v -e 'no changes' -e '/nonexistent' ; } \ + && \ + grpck --read-only --root "$( pwd )" \ + && \ + find \ + -xdev -type f \! -path ./var/\* \! -path ./usr/share/\* \! -name \*.pl \ + | xargs -P0 -n100 sh -c \ + 'chroot . ldd -- "${@}" 2> /dev/null | sed -n "/:/h; /not found/{x;p;x;p}"' -- \ + | { ! grep . ; } + +# Bash 4.* did not have default key bindings for control-arrow-key key +# combinations. Add some for convenience: +RUN >> /etc/inputrc \ + printf '%s\n' \ + '' \ + '"\e[5C": forward-word' \ + '"\e[5D": backward-word' \ + '"\e\e[C": forward-word' \ + '"\e\e[D": backward-word' \ + '"\e[1;5C": forward-word' \ + '"\e[1;5D": backward-word' \ + ; + +# env-activate.sh (+ optionally env-execute) should be overwritten downstream. +# - env-activate.sh: +# Is sourced (via symlink in /etc/profile.d/) to activate the /usr/local env. +# - env-execute: +# Is set as the ENTRYPOINT to activate /usr/local before exec'ing CMD. +RUN touch /usr/local/env-activate.sh \ + && \ + touch /usr/local/env-execute \ + && \ + chmod +x /usr/local/env-execute \ + && \ + ln -s \ + /usr/local/env-activate.sh \ + /etc/profile.d/env-activate.sh \ + && \ + printf '%s\n' \ + '#! /bin/bash' \ + ". '/usr/local/env-activate.sh'" \ + 'exec "${@}"' \ + > /usr/local/env-execute + +ENV LANG=C.UTF-8 +ENTRYPOINT [ "/usr/local/env-execute" ] +CMD [ "bash" ] diff --git a/images/base-glibc-debian-bash/Dockerfile.test b/images/base-glibc-debian-bash/Dockerfile.test new file mode 100644 index 00000000000..f2f0bace3a8 --- /dev/null +++ b/images/base-glibc-debian-bash/Dockerfile.test @@ -0,0 +1,39 @@ +ARG base +FROM "${base}" + +# Check if env-activate.sh gets sourced for login shell and in env-execute. +RUN [ "$( sh -lc 'printf world' )" = 'world' ] \ + && \ + [ "$( /usr/local/env-execute sh -c 'printf world' )" = 'world' ] \ + && \ + printf '%s\n' \ + 'printf "hello "' \ + > /usr/local/env-activate.sh \ + && \ + [ "$( sh -lc 'printf world' )" = 'hello world' ] \ + && \ + [ "$( /usr/local/env-execute sh -c 'printf world' )" = 'hello world' ] \ + && \ + printf '' \ + > /usr/local/env-activate.sh + +# Check if all desired locales are there. +RUN locale -a | grep -i 'c\.utf-\?8' \ + && \ + locale -a | grep -i 'en_us\.utf-\?8' + +RUN apt-get update -qq \ + && \ + DEBIAN_FRONTEND=noninteractive \ + apt-get install --yes --no-install-recommends \ + ca-certificates \ + wget \ + && \ + arch=$(uname -m) \ + && \ + wget --quiet \ + "https://github.com/conda-forge/miniforge/releases/latest/download/Miniforge3-Linux-${arch}.sh" \ + && \ + sh ./Miniforge3-Linux-${arch}.sh -bp /opt/conda \ + && \ + /opt/conda/bin/conda info --all diff --git a/images/base-glibc-debian-bash/prepare.sh b/images/base-glibc-debian-bash/prepare.sh new file mode 100644 index 00000000000..d3459adb0fc --- /dev/null +++ b/images/base-glibc-debian-bash/prepare.sh @@ -0,0 +1,5 @@ +source ../versions.sh +IMAGE_NAME="${BASE_DEBIAN_IMAGE_NAME}" +TAG="$BASE_TAG" +BUILD_ARGS=() +BUILD_ARGS+=("--build-arg=debian_version=$DEBIAN_VERSION") diff --git a/images/bioconda-recipes-issue-responder/Dockerfile b/images/bioconda-recipes-issue-responder/Dockerfile new file mode 100644 index 00000000000..9b94896414c --- /dev/null +++ b/images/bioconda-recipes-issue-responder/Dockerfile @@ -0,0 +1,40 @@ +ARG base=quay.io/bioconda/base-glibc-busybox-bash:2.0.0 + +FROM quay.io/bioconda/create-env:2.0.0 as build +RUN /opt/create-env/env-execute \ + create-env \ + --conda=mamba \ + --strip-files=\* \ + --remove-paths=\*.a \ + --remove-paths=\*.pyc \ + /usr/local \ + aiohttp \ + anaconda-client \ + ca-certificates \ + git \ + openssh \ + python=3.8 \ + pyyaml \ + skopeo \ + && \ + # Workaround for https://github.com/conda/conda/issues/10490 + export CONDA_REPODATA_THREADS=1 && \ + # We don't need Perl (used by Git for some functionalities). + # => Remove perl package to reduce image size. + /opt/create-env/env-execute \ + conda remove --yes \ + --prefix=/usr/local \ + --force-remove \ + perl + +FROM "${base}" +COPY --from=build /usr/local /usr/local +COPY ./issue-responder /usr/local/bin/ + +# Used environment variables: +# - JOB_CONTEXT +# - BOT_TOKEN +# - GITTER_TOKEN +# - ANACONDA_TOKEN +# - QUAY_OAUTH_TOKEN +# - QUAY_LOGIN diff --git a/images/bioconda-recipes-issue-responder/Dockerfile.test b/images/bioconda-recipes-issue-responder/Dockerfile.test new file mode 100644 index 00000000000..665dc72ed0a --- /dev/null +++ b/images/bioconda-recipes-issue-responder/Dockerfile.test @@ -0,0 +1,7 @@ +ARG base + + +FROM "${base}" +RUN JOB_CONTEXT='{"event": {"issue": {}}}' \ + /usr/local/env-execute \ + issue-responder diff --git a/images/bioconda-recipes-issue-responder/issue-responder b/images/bioconda-recipes-issue-responder/issue-responder new file mode 100755 index 00000000000..9d915f2f528 --- /dev/null +++ b/images/bioconda-recipes-issue-responder/issue-responder @@ -0,0 +1,615 @@ +#! /usr/bin/env python + +import logging +import os +import re +import sys +from asyncio import gather, run, sleep +from asyncio.subprocess import create_subprocess_exec +from pathlib import Path +from shutil import which +from subprocess import check_call +from typing import Any, Dict, List, Optional, Set, Tuple +from zipfile import ZipFile + +from aiohttp import ClientSession +from yaml import safe_load + +logger = logging.getLogger(__name__) +log = logger.info + + +async def async_exec( + command: str, *arguments: str, env: Optional[Dict[str, str]] = None +) -> None: + process = await create_subprocess_exec(command, *arguments, env=env) + return_code = await process.wait() + if return_code != 0: + raise RuntimeError( + f"Failed to execute {command} {arguments} (return code: {return_code})" + ) + + +# Post a comment on a given issue/PR with text in message +async def send_comment(session: ClientSession, issue_number: int, message: str) -> None: + token = os.environ["BOT_TOKEN"] + url = ( + f"https://api.github.com/repos/bioconda/bioconda-recipes/issues/{issue_number}/comments" + ) + headers = { + "Authorization": f"token {token}", + "User-Agent": "BiocondaCommentResponder", + } + payload = {"body": message} + log("Sending comment: url=%s", url) + log("Sending comment: payload=%s", payload) + async with session.post(url, headers=headers, json=payload) as response: + status_code = response.status + log("the response code was %d", status_code) + if status_code < 200 or status_code > 202: + sys.exit(1) + + +def list_zip_contents(fname: str) -> [str]: + f = ZipFile(fname) + return [e.filename for e in f.infolist() if e.filename.endswith('.tar.gz') or e.filename.endswith('.tar.bz2')] + + +# Download a zip file from url to zipName.zip and return that path +# Timeout is 30 minutes to compensate for any network issues +async def download_file(session: ClientSession, zipName: str, url: str) -> str: + async with session.get(url, timeout=60*30) as response: + if response.status == 200: + ofile = f"{zipName}.zip" + with open(ofile, 'wb') as fd: + while True: + chunk = await response.content.read(1024*1024*1024) + if not chunk: + break + fd.write(chunk) + return ofile + return None + + +# Find artifact zip files, download them and return their URLs and contents +async def fetch_azure_zip_files(session: ClientSession, buildId: str) -> [(str, str)]: + artifacts = [] + + url = f"https://dev.azure.com/bioconda/bioconda-recipes/_apis/build/builds/{buildId}/artifacts?api-version=4.1" + log("contacting azure %s", url) + async with session.get(url) as response: + # Sometimes we get a 301 error, so there are no longer artifacts available + if response.status == 301: + return artifacts + res = await response.text() + + res_object = safe_load(res) + if res_object['count'] == 0: + return artifacts + + for artifact in res_object['value']: + zipName = artifact['name'] # LinuxArtifacts or OSXArtifacts + zipUrl = artifact['resource']['downloadUrl'] + log(f"zip name is {zipName} url {zipUrl}") + fname = await download_file(session, zipName, zipUrl) + if not fname: + continue + pkgsImages = list_zip_contents(fname) + for pkg in pkgsImages: + artifacts.append((zipUrl, pkg)) + + return artifacts + + +def parse_azure_build_id(url: str) -> str: + return re.search("buildId=(\d+)", url).group(1) + + +# Given a PR and commit sha, fetch a list of the artifact zip files URLs and their contents +async def fetch_pr_sha_artifacts(session: ClientSession, pr: int, sha: str) -> List[Tuple[str, str]]: + url = f"https://api.github.com/repos/bioconda/bioconda-recipes/commits/{sha}/check-runs" + + headers = { + "User-Agent": "BiocondaCommentResponder", + "Accept": "application/vnd.github.antiope-preview+json", + } + async with session.get(url, headers=headers) as response: + response.raise_for_status() + res = await response.text() + check_runs = safe_load(res) + log(f"DEBUG url was {url} returned {check_runs}") + + for check_run in check_runs["check_runs"]: + # The names are "bioconda.bioconda-recipes (test_osx test_osx)" or similar + if check_run["name"].startswith("bioconda.bioconda-recipes (test_"): + # The azure build ID is in the details_url as buildId=\d+ + buildID = parse_azure_build_id(check_run["details_url"]) + log(f"DEBUG buildID is {buildID}") + zipFiles = await fetch_azure_zip_files(session, buildID) + log(f"DEBUG zipFiles are {zipFiles}") + return zipFiles # We've already fetched all possible artifacts + + return [] + + +# Given a PR and commit sha, post a comment with any artifacts +async def make_artifact_comment(session: ClientSession, pr: int, sha: str) -> None: + artifacts = await fetch_pr_sha_artifacts(session, pr, sha) + nPackages = len(artifacts) + log(f"DEBUG the artifacts are {artifacts}") + + if nPackages > 0: + comment = "Package(s) built on Azure are ready for inspection:\n\n" + comment += "Arch | Package | Zip File\n-----|---------|---------\n" + install_noarch = "" + install_linux = "" + install_osx = "" + + # Table of packages and repodata.json + for URL, artifact in artifacts: + if not (package_match := re.match(r"^((.+)\/(.+)\/(.+)\/(.+\.tar\.bz2))$", artifact)): + continue + url, archdir, basedir, subdir, packageName = package_match.groups() + urlBase = URL[:-3] # trim off zip from format= + urlBase += "file&subPath=%2F{}".format("%2F".join([basedir, subdir])) + conda_install_url = urlBase + # N.B., the zip file URL is nearly identical to the URL for the individual member files. It's unclear if there's an API for getting the correct URL to the files themselves + #pkgUrl = "%2F".join([urlBase, packageName]) + #repoUrl = "%2F".join([urlBase, "current_repodata.json"]) + #resp = await session.get(repoUrl) + + if subdir == "noarch": + comment += "noarch |" + elif subdir == "linux-64": + comment += "linux-64 |" + else: + comment += "osx-64 |" + comment += f" {packageName} | [{archdir}]({URL})\n" + + # Conda install examples + comment += "***\n\nYou may also use `conda` to install these after downloading and extracting the appropriate zip file. From the LinuxArtifacts or OSXArtifacts directories:\n\n" + comment += "```conda install -c ./packages \n```\n" + + # Table of containers + comment += "***\n\nDocker image(s) built (images are in the LinuxArtifacts zip file above):\n\n" + comment += "Package | Tag | Install with `docker`\n" + comment += "--------|-----|----------------------\n" + + for URL, artifact in artifacts: + if artifact.endswith(".tar.gz"): + image_name = artifact.split("/").pop()[: -len(".tar.gz")] + if ':' in image_name: + package_name, tag = image_name.split(':', 1) + #image_url = URL[:-3] # trim off zip from format= + #image_url += "file&subPath=%2F{}.tar.gz".format("%2F".join(["images", '%3A'.join([package_name, tag])])) + comment += f"[{package_name}] | {tag} | " + comment += f'
show`gzip -dc LinuxArtifacts/images/{image_name}.tar.gz \\| docker load`\n' + comment += "\n\n" + else: + comment = ( + "No artifacts found on the most recent Azure build. " + "Either the build failed, the artifacts have were removed due to age, or the recipe was blacklisted/skipped." + ) + await send_comment(session, pr, comment) + + +# Post a comment on a given PR with its CircleCI artifacts +async def artifact_checker(session: ClientSession, issue_number: int) -> None: + url = f"https://api.github.com/repos/bioconda/bioconda-recipes/pulls/{issue_number}" + headers = { + "User-Agent": "BiocondaCommentResponder", + } + async with session.get(url, headers=headers) as response: + response.raise_for_status() + res = await response.text() + pr_info = safe_load(res) + + await make_artifact_comment(session, issue_number, pr_info["head"]["sha"]) + + +# Return true if a user is a member of bioconda +async def is_bioconda_member(session: ClientSession, user: str) -> bool: + token = os.environ["BOT_TOKEN"] + url = f"https://api.github.com/orgs/bioconda/members/{user}" + headers = { + "Authorization": f"token {token}", + "User-Agent": "BiocondaCommentResponder", + } + rc = 404 + async with session.get(url, headers=headers) as response: + try: + response.raise_for_status() + rc = response.status + except: + # Do nothing, this just prevents things from crashing on 404 + pass + + return rc == 204 + + +# Reposts a quoted message in a given issue/PR if the user isn't a bioconda member +async def comment_reposter(session: ClientSession, user: str, pr: int, message: str) -> None: + if await is_bioconda_member(session, user): + log("Not reposting for %s", user) + return + log("Reposting for %s", user) + await send_comment( + session, + pr, + f"Reposting for @{user} to enable pings (courtesy of the BiocondaBot):\n\n> {message}", + ) + + +# Fetch and return the JSON of a PR +# This can be run to trigger a test merge +async def get_pr_info(session: ClientSession, pr: int) -> Any: + token = os.environ["BOT_TOKEN"] + url = f"https://api.github.com/repos/bioconda/bioconda-recipes/pulls/{pr}" + headers = { + "Authorization": f"token {token}", + "User-Agent": "BiocondaCommentResponder", + } + async with session.get(url, headers=headers) as response: + response.raise_for_status() + res = await response.text() + pr_info = safe_load(res) + return pr_info + + +# Update a branch from upstream master, this should be run in a try/catch +async def update_from_master_runner(session: ClientSession, pr: int) -> None: + async def git(*args: str) -> None: + return await async_exec("git", *args) + + # Setup git, otherwise we can't push + await git("config", "--global", "user.email", "biocondabot@gmail.com") + await git("config", "--global", "user.name", "BiocondaBot") + + pr_info = await get_pr_info(session, pr) + remote_branch = pr_info["head"]["ref"] + remote_repo = pr_info["head"]["repo"]["full_name"] + + max_depth = 2000 + # Clone + await git( + "clone", + f"--depth={max_depth}", + f"--branch={remote_branch}", + f"git@github.com:{remote_repo}.git", + "bioconda-recipes", + ) + + async def git_c(*args: str) -> None: + return await git("-C", "bioconda-recipes", *args) + + # Add/pull upstream + await git_c("remote", "add", "upstream", "https://github.com/bioconda/bioconda-recipes") + await git_c("fetch", f"--depth={max_depth}", "upstream", "master") + + # Merge + await git_c("merge", "upstream/master") + + await git_c("push") + + +# Merge the upstream master branch into a PR branch, leave a message on error +async def update_from_master(session: ClientSession, pr: int) -> None: + try: + await update_from_master_runner(session, pr) + except Exception as e: + await send_comment( + session, + pr, + "I encountered an error updating your PR branch. You can report this to bioconda/core if you'd like.\n-The Bot", + ) + sys.exit(1) + + +# Ensure there's at least one approval by a member +async def approval_review(session: ClientSession, issue_number: int) -> bool: + token = os.environ["BOT_TOKEN"] + url = f"https://api.github.com/repos/bioconda/bioconda-recipes/pulls/{issue_number}/reviews" + headers = { + "Authorization": f"token {token}", + "User-Agent": "BiocondaCommentResponder", + } + async with session.get(url, headers=headers) as response: + response.raise_for_status() + res = await response.text() + reviews = safe_load(res) + + approved_reviews = [review for review in reviews if review["state"] == "APPROVED"] + if not approved_reviews: + return False + + # Ensure the review author is a member + return any( + gather( + *( + is_bioconda_member(session, review["user"]["login"]) + for review in approved_reviews + ) + ) + ) + + +# Check the mergeable state of a PR +async def check_is_mergeable( + session: ClientSession, issue_number: int, second_try: bool = False +) -> bool: + token = os.environ["BOT_TOKEN"] + # Sleep a couple of seconds to allow the background process to finish + if second_try: + await sleep(3) + + # PR info + url = f"https://api.github.com/repos/bioconda/bioconda-recipes/pulls/{issue_number}" + headers = { + "Authorization": f"token {token}", + "User-Agent": "BiocondaCommentResponder", + } + async with session.get(url, headers=headers) as response: + response.raise_for_status() + res = await response.text() + pr_info = safe_load(res) + + # We need mergeable == true and mergeable_state == clean, an approval by a member and + if pr_info.get("mergeable") is None and not second_try: + return await check_is_mergeable(session, issue_number, True) + elif ( + pr_info.get("mergeable") is None + or not pr_info["mergeable"] + or pr_info["mergeable_state"] != "clean" + ): + return False + + return await approval_review(session, issue_number) + + +# Ensure uploaded containers are in repos that have public visibility +async def toggle_visibility(session: ClientSession, container_repo: str) -> None: + url = f"https://quay.io/api/v1/repository/biocontainers/{container_repo}/changevisibility" + QUAY_OAUTH_TOKEN = os.environ["QUAY_OAUTH_TOKEN"] + headers = { + "Authorization": f"Bearer {QUAY_OAUTH_TOKEN}", + "Content-Type": "application/json", + } + body = {"visibility": "public"} + rc = 0 + try: + async with session.post(url, headers=headers, json=body) as response: + rc = response.status + except: + # Do nothing + pass + log("Trying to toggle visibility (%s) returned %d", url, rc) + + +# Download an artifact from CircleCI, rename and upload it +async def download_and_upload(session: ClientSession, x: str) -> None: + basename = x.split("/").pop() + # the tarball needs a regular name without :, the container needs pkg:tag + image_name = basename.replace("%3A", ":").replace("\n", "").replace(".tar.gz", "") + file_name = basename.replace("%3A", "_").replace("\n", "") + + async with session.get(x) as response: + with open(file_name, "wb") as file: + logged = 0 + loaded = 0 + while chunk := await response.content.read(256 * 1024): + file.write(chunk) + loaded += len(chunk) + if loaded - logged >= 50 * 1024 ** 2: + log("Downloaded %.0f MiB: %s", max(1, loaded / 1024 ** 2), x) + logged = loaded + log("Downloaded %.0f MiB: %s", max(1, loaded / 1024 ** 2), x) + + if x.endswith(".gz"): + # Container + log("uploading with skopeo: %s", file_name) + # This can fail, retry with 5 second delays + count = 0 + maxTries = 5 + success = False + QUAY_LOGIN = os.environ["QUAY_LOGIN"] + env = os.environ.copy() + # TODO: Fix skopeo package to find certificates on its own. + skopeo_path = which("skopeo") + if not skopeo_path: + raise RuntimeError("skopeo not found") + env["SSL_CERT_DIR"] = str(Path(skopeo_path).parents[1].joinpath("ssl")) + while count < maxTries: + try: + await async_exec( + "skopeo", + "--command-timeout", + "600s", + "copy", + f"docker-archive:{file_name}", + f"docker://quay.io/biocontainers/{image_name}", + "--dest-creds", + QUAY_LOGIN, + env=env, + ) + success = True + break + except: + count += 1 + if count == maxTries: + raise + await sleep(5) + if success: + await toggle_visibility(session, basename.split("%3A")[0]) + elif x.endswith(".bz2"): + # Package + log("uploading package") + ANACONDA_TOKEN = os.environ["ANACONDA_TOKEN"] + await async_exec("anaconda", "-t", ANACONDA_TOKEN, "upload", file_name, "--force") + + log("cleaning up") + os.remove(file_name) + + +# Upload artifacts to quay.io and anaconda, return the commit sha +# Only call this for mergeable PRs! +async def upload_artifacts(session: ClientSession, pr: int) -> str: + # Get last sha + pr_info = await get_pr_info(session, pr) + sha: str = pr_info["head"]["sha"] + + # Fetch the artifacts + artifacts = await fetch_pr_sha_artifacts(session, pr, sha) + artifacts = [artifact for artifact in artifacts if artifact.endswith((".gz", ".bz2"))] + assert artifacts + + # Download/upload Artifacts + for artifact in artifacts: + await download_and_upload(session, artifact) + + return sha + + +# Assume we have no more than 250 commits in a PR, which is probably reasonable in most cases +async def get_pr_commit_message(session: ClientSession, issue_number: int) -> str: + token = os.environ["BOT_TOKEN"] + url = f"https://api.github.com/repos/bioconda/bioconda-recipes/pulls/{issue_number}/commits" + headers = { + "Authorization": f"token {token}", + "User-Agent": "BiocondaCommentResponder", + } + async with session.get(url, headers=headers) as response: + response.raise_for_status() + res = await response.text() + commits = safe_load(res) + message = "".join(f" * {commit['commit']['message']}\n" for commit in reversed(commits)) + return message + + +# Merge a PR +async def merge_pr(session: ClientSession, pr: int) -> None: + token = os.environ["BOT_TOKEN"] + await send_comment( + session, + pr, + "I will attempt to upload artifacts and merge this PR. This may take some time, please have patience.", + ) + + try: + mergeable = await check_is_mergeable(session, pr) + log("mergeable state of %s is %s", pr, mergeable) + if not mergeable: + await send_comment(session, pr, "Sorry, this PR cannot be merged at this time.") + else: + log("uploading artifacts") + sha = await upload_artifacts(session, pr) + log("artifacts uploaded") + + # Carry over last 250 commit messages + msg = await get_pr_commit_message(session, pr) + + # Hit merge + url = f"https://api.github.com/repos/bioconda/bioconda-recipes/pulls/{pr}/merge" + headers = { + "Authorization": f"token {token}", + "User-Agent": "BiocondaCommentResponder", + } + payload = { + "sha": sha, + "commit_title": f"[ci skip] Merge PR {pr}", + "commit_message": f"Merge PR #{pr}, commits were: \n{msg}", + "merge_method": "squash", + } + log("Putting merge commit") + async with session.put(url, headers=headers, json=payload) as response: + rc = response.status + log("body %s", payload) + log("merge_pr the response code was %s", rc) + except: + await send_comment( + session, + pr, + "I received an error uploading the build artifacts or merging the PR!", + ) + logger.exception("Upload failed", exc_info=True) + + +# Add the "Please review and merge" label to a PR +async def add_pr_label(session: ClientSession, pr: int) -> None: + token = os.environ["BOT_TOKEN"] + url = f"https://api.github.com/repos/bioconda/bioconda-recipes/issues/{pr}/labels" + headers = { + "Authorization": f"token {token}", + "User-Agent": "BiocondaCommentResponder", + } + payload = {"labels": ["please review & merge"]} + async with session.post(url, headers=headers, json=payload) as response: + response.raise_for_status() + + +async def gitter_message(session: ClientSession, msg: str) -> None: + token = os.environ["GITTER_TOKEN"] + room_id = "57f3b80cd73408ce4f2bba26" + url = f"https://api.gitter.im/v1/rooms/{room_id}/chatMessages" + headers = { + "Authorization": f"Bearer {token}", + "Content-Type": "application/json", + "Accept": "application/json", + "User-Agent": "BiocondaCommentResponder", + } + payload = {"text": msg} + log("Sending request to %s", url) + async with session.post(url, headers=headers, json=payload) as response: + response.raise_for_status() + + +async def notify_ready(session: ClientSession, pr: int) -> None: + try: + await gitter_message( + session, + f"PR ready for review: https://github.com/bioconda/bioconda-recipes/pull/{pr}", + ) + except Exception: + logger.exception("Posting to Gitter failed", exc_info=True) + # Do not die if we can't post to gitter! + + +# This requires that a JOB_CONTEXT environment variable, which is made with `toJson(github)` +async def main() -> None: + job_context = safe_load(os.environ["JOB_CONTEXT"]) + log("%s", job_context) + if job_context["event"]["issue"].get("pull_request") is None: + return + issue_number = job_context["event"]["issue"]["number"] + + original_comment = job_context["event"]["comment"]["body"] + log("the comment is: %s", original_comment) + + comment = original_comment.lower() + async with ClientSession() as session: + if comment.startswith(("@bioconda-bot", "@biocondabot")): + if "please update" in comment: + await update_from_master(session, issue_number) + elif " hello" in comment: + await send_comment(session, issue_number, "Yes?") + elif " please fetch artifacts" in comment or " please fetch artefacts" in comment: + await artifact_checker(session, issue_number) + elif " please merge" in comment: + await send_comment(session, issue_number, "Sorry, I'm currently disabled") + #await merge_pr(session, issue_number) + elif " please add label" in comment: + await add_pr_label(session, issue_number) + await notify_ready(session, issue_number) + # else: + # # Methods in development can go below, flanked by checking who is running them + # if job_context["actor"] != "dpryan79": + # console.log("skipping") + # sys.exit(0) + elif "@bioconda/" in comment: + await comment_reposter( + session, job_context["actor"], issue_number, original_comment + ) + + +if __name__ == "__main__": + logging.basicConfig(level=logging.INFO) + run(main()) diff --git a/images/bioconda-utils-build-env-cos7/Dockerfile b/images/bioconda-utils-build-env-cos7/Dockerfile new file mode 100644 index 00000000000..bae6f61430f --- /dev/null +++ b/images/bioconda-utils-build-env-cos7/Dockerfile @@ -0,0 +1,66 @@ +ARG base_image +FROM ${base_image} as base + +COPY ./C.utf8 /usr/lib/locale/C.utf8 + +# Provide system deps unconditionally until we are able to offer per-recipe installs. +# (Addresses, e.g., "ImportError: libGL.so.1" in tests directly invoked by conda-build.) +# Also install packages that have been installed historically (openssh-client). +RUN yum install -y mesa-libGL-devel \ + && \ + yum install -y openssh-clients \ + && \ + yum install -y git \ + && \ + yum clean all && \ + rm -rf /var/cache/yum/* + +# This changes root's .condarc which ENTRYPOINT copies to /home/conda/.condarc later. +RUN . /opt/conda/etc/profile.d/conda.sh && \ + conda config \ + --add channels defaults \ + --add channels bioconda \ + --add channels conda-forge \ + && \ + { conda config --remove repodata_fns current_repodata.json 2> /dev/null || true ; } && \ + conda config --prepend repodata_fns repodata.json && \ + conda config --set channel_priority strict && \ + conda config --set auto_update_conda False + +FROM base as build +WORKDIR /tmp/repo +ARG BIOCONDA_UTILS_FOLDER=./bioconda-utils +COPY ${BIOCONDA_UTILS_FOLDER} ./ + +RUN . /opt/conda/etc/profile.d/conda.sh && conda list +RUN . /opt/conda/etc/profile.d/conda.sh && conda activate base && \ + pip wheel . && \ + mkdir - /opt/bioconda-utils && \ + cp ./bioconda_utils-*.whl \ + ./bioconda_utils/bioconda_utils-requirements.txt \ + /opt/bioconda-utils/ \ + && \ + chgrp -R lucky /opt/bioconda-utils && \ + chmod -R g=u /opt/bioconda-utils + +FROM base +COPY --from=build /opt/bioconda-utils /opt/bioconda-utils +RUN . /opt/conda/etc/profile.d/conda.sh && conda activate base && \ + # Make sure we get the (working) conda we want before installing the rest. + sed -nE \ + '/^conda([>/d' recipe/meta.yaml \ +# && \ +# conda-build -m .ci_support/linux_64_.yaml recipe/ +ARG packages= +ARG python=3.8 +ARG prefix=/usr/local +RUN . /opt/create-env/env-activate.sh && \ + export CONDA_ADD_PIP_AS_PYTHON_DEPENDENCY=0 \ + && \ + create-env \ + --conda=mamba \ + --strip-files=\* \ + --remove-paths=\*.a \ + --remove-paths=\*.c \ + --remove-paths=\*.pyc \ + --remove-paths=\*.pyi \ + --remove-paths=\*.pyx \ + --remove-paths=\*.pyx \ + --remove-paths=include/\* \ + --remove-paths=share/doc/\* \ + --remove-paths=share/man/\* \ + --remove-paths='share/terminfo/[!x]/*' \ + --remove-paths=share/locale/\* \ + --remove-paths=lib/python*/ensurepip/\* \ + "${prefix}" \ + --channel=local \ + --channel=conda-forge \ + --override-channels \ + pip wheel setuptools \ + python="${python}" \ + aiohttp \ + ca-certificates \ + idna\<3 \ + pyyaml \ + ${packages} \ + && \ + # Remove tk since no tkinter & co. are needed. + conda remove \ + --yes \ + --force-remove \ + --prefix="${prefix}" \ + tk \ + && \ + # Get rid of Perl pulled in by Git. + # (Bot only uses non-Perl Git functionality => remove baggage.) + if conda list --prefix="${prefix}" | grep -q '^perl\s' ; then \ + conda remove \ + --yes \ + --force-remove \ + --prefix="${prefix}" \ + perl \ + ; fi +# Install bioconda_bot. +WORKDIR /tmp/bot +COPY . ./ +RUN . "${prefix}/env-activate.sh" && \ + pip wheel --no-deps . \ + && \ + pip install --no-deps --find-links . bioconda_bot + +FROM "${base}" +COPY --from=build /usr/local /usr/local diff --git a/images/bot/Dockerfile.test b/images/bot/Dockerfile.test new file mode 100644 index 00000000000..5a6fdcbbd5b --- /dev/null +++ b/images/bot/Dockerfile.test @@ -0,0 +1,9 @@ +ARG base +FROM "${base}" +RUN . /usr/local/env-activate.sh && \ + ls -lA /usr/local/conda-meta/*.json && \ + bioconda-bot --help && \ + bioconda-bot comment --help && \ + bioconda-bot merge --help && \ + bioconda-bot update --help && \ + bioconda-bot change --help diff --git a/images/bot/pyproject.toml b/images/bot/pyproject.toml new file mode 100644 index 00000000000..9787c3bdf00 --- /dev/null +++ b/images/bot/pyproject.toml @@ -0,0 +1,3 @@ +[build-system] +requires = ["setuptools", "wheel"] +build-backend = "setuptools.build_meta" diff --git a/images/bot/setup.cfg b/images/bot/setup.cfg new file mode 100644 index 00000000000..749dfc7ed74 --- /dev/null +++ b/images/bot/setup.cfg @@ -0,0 +1,20 @@ +[metadata] +name = bioconda-bot +version = 0.0.1 + +[options] +python_requires = >=3.8 +install_requires = + aiohttp + PyYaml + +packages = find: +package_dir = + = src + +[options.packages.find] +where = src + +[options.entry_points] +console_scripts = + bioconda-bot = bioconda_bot.cli:main diff --git a/images/bot/src/bioconda_bot/__init__.py b/images/bot/src/bioconda_bot/__init__.py new file mode 100644 index 00000000000..e69de29bb2d diff --git a/images/bot/src/bioconda_bot/automerge.py b/images/bot/src/bioconda_bot/automerge.py new file mode 100644 index 00000000000..a09ee4148d0 --- /dev/null +++ b/images/bot/src/bioconda_bot/automerge.py @@ -0,0 +1,138 @@ +import logging +import os + +from typing import Any, Dict, List, Optional, Set, Tuple + +from aiohttp import ClientSession +from yaml import safe_load + +from .common import ( + get_job_context, + get_prs_for_sha, + get_sha_for_status_check, + get_sha_for_workflow_run, +) +from .merge import MergeState, request_merge + +logger = logging.getLogger(__name__) +log = logger.info + + +async def get_pr_labels(session: ClientSession, pr: int) -> Set[str]: + token = os.environ["BOT_TOKEN"] + url = f"https://api.github.com/repos/bioconda/bioconda-recipes/issues/{pr}/labels" + headers = { + "Authorization": f"token {token}", + "User-Agent": "BiocondaCommentResponder", + } + async with session.get(url, headers=headers) as response: + response.raise_for_status() + res = await response.text() + labels = safe_load(res) + return {label["name"] for label in labels} + + +async def is_automerge_labeled(session: ClientSession, pr: int) -> bool: + labels = await get_pr_labels(session, pr) + return "automerge" in labels + + +async def merge_if_labeled(session: ClientSession, pr: int) -> MergeState: + if not await is_automerge_labeled(session, pr): + return MergeState.UNKNOWN + return await request_merge(session, pr) + + +async def get_check_runs(session: ClientSession, sha: str) -> Any: + url = f"https://api.github.com/repos/bioconda/bioconda-recipes/commits/{sha}/check-runs" + + headers = { + "User-Agent": "BiocondaCommentResponder", + "Accept": "application/vnd.github.antiope-preview+json", + } + async with session.get(url, headers=headers) as response: + response.raise_for_status() + res = await response.text() + check_runs = [ + check_run + for check_run in safe_load(res)["check_runs"] or [] + if check_run["name"] != "bioconda-bot automerge" + ] + log("Got %d check_runs for SHA %s", len(check_runs or []), sha) + return check_runs + + +async def all_checks_completed(session: ClientSession, sha: str) -> bool: + check_runs = await get_check_runs(session, sha) + + is_all_completed = all(check_run["status"] == "completed" for check_run in check_runs) + if not is_all_completed: + log("Some check_runs are not completed yet.") + for i, check_run in enumerate(check_runs, 1): + log("check_run %d / %d: %s", i, len(check_runs), check_run) + return is_all_completed + + +async def all_checks_passed(session: ClientSession, sha: str) -> bool: + check_runs = await get_check_runs(session, sha) + + # TODO: "neutral" might be a valid conclusion to consider in the future. + valid_conclusions = {"success", "skipped"} + if any(check_run["conclusion"] not in valid_conclusions for check_run in check_runs): + log(f"Some check_runs are not marked as {'/'.join(valid_conclusions)} yet.") + for i, check_run in enumerate(check_runs, 1): + log("check_run %d / %d: %s", i, len(check_runs), check_run) + return False + return True + + +async def merge_automerge_passed(sha: str) -> None: + async with ClientSession() as session: + if not await all_checks_passed(session, sha): + return + prs = await get_prs_for_sha(session, sha) + if not prs: + log("No PRs found for SHA %s", sha) + for pr in prs: + merge_state = await merge_if_labeled(session, pr) + log("PR %d has merge state %s", pr, merge_state) + if merge_state is MergeState.MERGED: + break + + +async def get_sha_for_review(job_context: Dict[str, Any]) -> Optional[str]: + if job_context["event_name"] != "pull_request_review": + return None + log("Got %s event", "pull_request_review") + event = job_context["event"] + if event["review"]["state"] != "approved": + return None + sha: Optional[str] = event["pull_request"]["head"]["sha"] + log("Use %s event SHA %s", "pull_request_review", sha) + return sha + + +async def get_sha_for_labeled_pr(job_context: Dict[str, Any]) -> Optional[str]: + if job_context["event_name"] != "pull_request": + return None + log("Got %s event", "pull_request") + event = job_context["event"] + if event["action"] != "labeled" or event["label"]["name"] != "automerge": + return None + sha: Optional[str] = event["pull_request"]["head"]["sha"] + log("Use %s event SHA %s", "pull_request", sha) + return sha + + +# This requires that a JOB_CONTEXT environment variable, which is made with `toJson(github)` +async def main() -> None: + job_context = await get_job_context() + + sha = ( + await get_sha_for_status_check(job_context) + or await get_sha_for_workflow_run(job_context) + or await get_sha_for_review(job_context) + or await get_sha_for_labeled_pr(job_context) + ) + if sha: + await merge_automerge_passed(sha) diff --git a/images/bot/src/bioconda_bot/changeVisibility.py b/images/bot/src/bioconda_bot/changeVisibility.py new file mode 100644 index 00000000000..ba036f83479 --- /dev/null +++ b/images/bot/src/bioconda_bot/changeVisibility.py @@ -0,0 +1,63 @@ +import logging +import os +import re +import sys +from asyncio import gather, sleep +from asyncio.subprocess import create_subprocess_exec +from enum import Enum, auto +from pathlib import Path +from shutil import which +from typing import Any, Dict, List, Optional, Set, Tuple +from zipfile import ZipFile, ZipInfo + +from aiohttp import ClientSession +from yaml import safe_load + +from .common import ( + async_exec, + fetch_pr_sha_artifacts, + get_job_context, + get_pr_comment, + get_pr_info, + is_bioconda_member, + send_comment, +) + +logger = logging.getLogger(__name__) +log = logger.info + + +# Ensure uploaded containers are in repos that have public visibility +# TODO: This should ping @bioconda/core if it fails +async def toggle_visibility(session: ClientSession, container_repo: str) -> None: + url = f"https://quay.io/api/v1/repository/biocontainers/{container_repo}/changevisibility" + QUAY_OAUTH_TOKEN = os.environ["QUAY_OAUTH_TOKEN"] + headers = { + "Authorization": f"Bearer {QUAY_OAUTH_TOKEN}", + "Content-Type": "application/json", + } + body = {"visibility": "public"} + rc = 0 + try: + async with session.post(url, headers=headers, json=body) as response: + rc = response.status + except: + # Do nothing + pass + log("Trying to toggle visibility (%s) returned %d", url, rc) + + +# This requires that a JOB_CONTEXT environment variable, which is made with `toJson(github)` +async def main() -> None: + job_context = await get_job_context() + issue_number, original_comment = await get_pr_comment(job_context) + if issue_number is None or original_comment is None: + return + + comment = original_comment.lower() + if comment.startswith(("@bioconda-bot", "@biocondabot")): + if " please toggle visibility" in comment: + pkg = comment.split("please change visibility")[1].strip().split()[0] + async with ClientSession() as session: + await toggle_visibility(session, pkg) + await send_comment(session, issue_number, "Visibility changed.") diff --git a/images/bot/src/bioconda_bot/cli.py b/images/bot/src/bioconda_bot/cli.py new file mode 100644 index 00000000000..a88601d5370 --- /dev/null +++ b/images/bot/src/bioconda_bot/cli.py @@ -0,0 +1,81 @@ +from logging import INFO, basicConfig + +from argparse import ArgumentDefaultsHelpFormatter, ArgumentParser +from asyncio import run +from typing import List, Optional + + +def build_parser_comment(parser: ArgumentParser) -> None: + def run_command() -> None: + from .comment import main as main_ + + run(main_()) + + parser.set_defaults(run_command=run_command) + + +def build_parser_merge(parser: ArgumentParser) -> None: + def run_command() -> None: + from .merge import main as main_ + + run(main_()) + + parser.set_defaults(run_command=run_command) + + +def build_parser_update(parser: ArgumentParser) -> None: + def run_command() -> None: + from .update import main as main_ + + run(main_()) + + parser.set_defaults(run_command=run_command) + + +def build_parser_automerge(parser: ArgumentParser) -> None: + def run_command() -> None: + from .automerge import main as main_ + + run(main_()) + + parser.set_defaults(run_command=run_command) + + +def build_parser_changeVisibility(parser: ArgumentParser) -> None: + def run_command() -> None: + from .changeVisibility import main as main_ + + run(main_()) + + parser.set_defaults(run_command=run_command) + + +def get_argument_parser() -> ArgumentParser: + parser = ArgumentParser( + prog="bioconda-bot", + formatter_class=ArgumentDefaultsHelpFormatter, + ) + sub_parsers = parser.add_subparsers( + dest="command", + required=True, + ) + for command_name, build_parser in ( + ("comment", build_parser_comment), + ("merge", build_parser_merge), + ("update", build_parser_update), + ("automerge", build_parser_automerge), + ("change", build_parser_changeVisibility), + ): + sub_parser = sub_parsers.add_parser( + command_name, + formatter_class=ArgumentDefaultsHelpFormatter, + ) + build_parser(sub_parser) + return parser + + +def main(args: Optional[List[str]] = None) -> None: + basicConfig(level=INFO) + parser = get_argument_parser() + parsed_args = parser.parse_args(args) + parsed_args.run_command() diff --git a/images/bot/src/bioconda_bot/comment.py b/images/bot/src/bioconda_bot/comment.py new file mode 100644 index 00000000000..eb9e13fb7b0 --- /dev/null +++ b/images/bot/src/bioconda_bot/comment.py @@ -0,0 +1,197 @@ +import logging +import os +import re + +from aiohttp import ClientSession +from yaml import safe_load + +from .common import ( + async_exec, + fetch_pr_sha_artifacts, + get_job_context, + get_pr_comment, + get_pr_info, + get_prs_for_sha, + get_sha_for_status_check, + is_bioconda_member, + send_comment, +) + +logger = logging.getLogger(__name__) +log = logger.info + + +# Given a PR and commit sha, post a comment with any artifacts +async def make_artifact_comment(session: ClientSession, pr: int, sha: str) -> None: + artifacts = await fetch_pr_sha_artifacts(session, pr, sha) + nPackages = len(artifacts) + + if nPackages > 0: + comment = "Package(s) built on Azure are ready for inspection:\n\n" + comment += "Arch | Package | Zip File\n-----|---------|---------\n" + install_noarch = "" + install_linux = "" + install_osx = "" + + # Table of packages and repodata.json + for URL, artifact in artifacts: + if not (package_match := re.match(r"^((.+)\/(.+)\/(.+)\/(.+\.tar\.bz2))$", artifact)): + continue + url, archdir, basedir, subdir, packageName = package_match.groups() + urlBase = URL[:-3] # trim off zip from format= + urlBase += "file&subPath=%2F{}".format("%2F".join([basedir, subdir])) + conda_install_url = urlBase + # N.B., the zip file URL is nearly identical to the URL for the individual member files. It's unclear if there's an API for getting the correct URL to the files themselves + #pkgUrl = "%2F".join([urlBase, packageName]) + #repoUrl = "%2F".join([urlBase, "current_repodata.json"]) + #resp = await session.get(repoUrl) + + if subdir == "noarch": + comment += "noarch |" + elif subdir == "linux-64": + comment += "linux-64 |" + elif subdir == "linux-aarch64": + comment += "linux-aarch64 |" + else: + comment += "osx-64 |" + comment += f" {packageName} | [{archdir}]({URL})\n" + + # Conda install examples + comment += "***\n\nYou may also use `conda` to install these after downloading and extracting the appropriate zip file. From the LinuxArtifacts or OSXArtifacts directories:\n\n" + comment += "```\nconda install -c ./packages \n```\n" + + # Table of containers + comment += "***\n\nDocker image(s) built (images are in the LinuxArtifacts zip file above):\n\n" + comment += "Package | Tag | Install with `docker`\n" + comment += "--------|-----|----------------------\n" + + for URL, artifact in artifacts: + if artifact.endswith(".tar.gz"): + image_name = artifact.split("/").pop()[: -len(".tar.gz")] + if ':' in image_name: + package_name, tag = image_name.split(':', 1) + #image_url = URL[:-3] # trim off zip from format= + #image_url += "file&subPath=%2F{}.tar.gz".format("%2F".join(["images", '%3A'.join([package_name, tag])])) + comment += f"{package_name} | {tag} | " + comment += f'
show`gzip -dc LinuxArtifacts/images/{image_name}.tar.gz \\| docker load`\n' + comment += "\n\n" + else: + comment = ( + "No artifacts found on the most recent Azure build. " + "Either the build failed, the artifacts have were removed due to age, or the recipe was blacklisted/skipped." + ) + await send_comment(session, pr, comment) + + +# Post a comment on a given PR with its CircleCI artifacts +async def artifact_checker(session: ClientSession, issue_number: int) -> None: + url = f"https://api.github.com/repos/bioconda/bioconda-recipes/pulls/{issue_number}" + headers = { + "User-Agent": "BiocondaCommentResponder", + } + async with session.get(url, headers=headers) as response: + response.raise_for_status() + res = await response.text() + pr_info = safe_load(res) + + await make_artifact_comment(session, issue_number, pr_info["head"]["sha"]) + + +# Reposts a quoted message in a given issue/PR if the user isn't a bioconda member +async def comment_reposter(session: ClientSession, user: str, pr: int, message: str) -> None: + if await is_bioconda_member(session, user): + log("Not reposting for %s", user) + return + log("Reposting for %s", user) + await send_comment( + session, + pr, + f"Reposting for @{user} to enable pings (courtesy of the BiocondaBot):\n\n> {message}", + ) + + +# Add the "Please review and merge" label to a PR +async def add_pr_label(session: ClientSession, pr: int) -> None: + token = os.environ["BOT_TOKEN"] + url = f"https://api.github.com/repos/bioconda/bioconda-recipes/issues/{pr}/labels" + headers = { + "Authorization": f"token {token}", + "User-Agent": "BiocondaCommentResponder", + } + payload = {"labels": ["please review & merge"]} + async with session.post(url, headers=headers, json=payload) as response: + response.raise_for_status() + + +async def gitter_message(session: ClientSession, msg: str) -> None: + token = os.environ["GITTER_TOKEN"] + room_id = "57f3b80cd73408ce4f2bba26" + url = f"https://api.gitter.im/v1/rooms/{room_id}/chatMessages" + headers = { + "Authorization": f"Bearer {token}", + "Content-Type": "application/json", + "Accept": "application/json", + "User-Agent": "BiocondaCommentResponder", + } + payload = {"text": msg} + log("Sending request to %s", url) + async with session.post(url, headers=headers, json=payload) as response: + response.raise_for_status() + + +async def notify_ready(session: ClientSession, pr: int) -> None: + try: + await gitter_message( + session, + f"PR ready for review: https://github.com/bioconda/bioconda-recipes/pull/{pr}", + ) + except Exception: + logger.exception("Posting to Gitter failed", exc_info=True) + # Do not die if we can't post to gitter! + + +# This requires that a JOB_CONTEXT environment variable, which is made with `toJson(github)` +async def main() -> None: + job_context = await get_job_context() + + sha = await get_sha_for_status_check(job_context) + if sha: + # This is a successful status or check_suite event => post artifact lists. + async with ClientSession() as session: + for pr in await get_prs_for_sha(session, sha): + await artifact_checker(session, pr) + return + + issue_number, original_comment = await get_pr_comment(job_context) + if issue_number is None or original_comment is None: + return + + comment = original_comment.lower() + async with ClientSession() as session: + if comment.startswith(("@bioconda-bot", "@biocondabot")): + if "please update" in comment: + log("This should have been directly invoked via bioconda-bot-update") + from .update import update_from_master + + await update_from_master(session, issue_number) + elif " hello" in comment: + await send_comment(session, issue_number, "Yes?") + elif " please fetch artifacts" in comment or " please fetch artefacts" in comment: + await artifact_checker(session, issue_number) + #elif " please merge" in comment: + # await send_comment(session, issue_number, "Sorry, I'm currently disabled") + # #log("This should have been directly invoked via bioconda-bot-merge") + # #from .merge import request_merge + # #await request_merge(session, issue_number) + elif " please add label" in comment: + await add_pr_label(session, issue_number) + await notify_ready(session, issue_number) + # else: + # # Methods in development can go below, flanked by checking who is running them + # if job_context["actor"] != "dpryan79": + # console.log("skipping") + # sys.exit(0) + elif "@bioconda/" in comment: + await comment_reposter( + session, job_context["actor"], issue_number, original_comment + ) diff --git a/images/bot/src/bioconda_bot/common.py b/images/bot/src/bioconda_bot/common.py new file mode 100644 index 00000000000..565674fdd00 --- /dev/null +++ b/images/bot/src/bioconda_bot/common.py @@ -0,0 +1,249 @@ +import logging +import os +import re +import sys +from asyncio import gather, sleep +from asyncio.subprocess import create_subprocess_exec +from pathlib import Path +from shutil import which +from typing import Any, Dict, List, Optional, Set, Tuple +from zipfile import ZipFile + +from aiohttp import ClientSession +from yaml import safe_load + +logger = logging.getLogger(__name__) +log = logger.info + + +async def async_exec( + command: str, *arguments: str, env: Optional[Dict[str, str]] = None +) -> None: + process = await create_subprocess_exec(command, *arguments, env=env) + return_code = await process.wait() + if return_code != 0: + raise RuntimeError( + f"Failed to execute {command} {arguments} (return code: {return_code})" + ) + + +# Post a comment on a given issue/PR with text in message +async def send_comment(session: ClientSession, issue_number: int, message: str) -> None: + token = os.environ["BOT_TOKEN"] + url = ( + f"https://api.github.com/repos/bioconda/bioconda-recipes/issues/{issue_number}/comments" + ) + headers = { + "Authorization": f"token {token}", + "User-Agent": "BiocondaCommentResponder", + } + payload = {"body": message} + log("Sending comment: url=%s", url) + log("Sending comment: payload=%s", payload) + async with session.post(url, headers=headers, json=payload) as response: + status_code = response.status + log("the response code was %d", status_code) + if status_code < 200 or status_code > 202: + sys.exit(1) + + +# Return true if a user is a member of bioconda +async def is_bioconda_member(session: ClientSession, user: str) -> bool: + token = os.environ["BOT_TOKEN"] + url = f"https://api.github.com/orgs/bioconda/members/{user}" + headers = { + "Authorization": f"token {token}", + "User-Agent": "BiocondaCommentResponder", + } + rc = 404 + async with session.get(url, headers=headers) as response: + try: + response.raise_for_status() + rc = response.status + except: + # Do nothing, this just prevents things from crashing on 404 + pass + + return rc == 204 + + +# Fetch and return the JSON of a PR +# This can be run to trigger a test merge +async def get_pr_info(session: ClientSession, pr: int) -> Any: + token = os.environ["BOT_TOKEN"] + url = f"https://api.github.com/repos/bioconda/bioconda-recipes/pulls/{pr}" + headers = { + "Authorization": f"token {token}", + "User-Agent": "BiocondaCommentResponder", + } + async with session.get(url, headers=headers) as response: + response.raise_for_status() + res = await response.text() + pr_info = safe_load(res) + return pr_info + + +def list_zip_contents(fname: str) -> [str]: + f = ZipFile(fname) + return [e.filename for e in f.infolist() if e.filename.endswith('.tar.gz') or e.filename.endswith('.tar.bz2')] + + +# Download a zip file from url to zipName.zip and return that path +# Timeout is 30 minutes to compensate for any network issues +async def download_file(session: ClientSession, zipName: str, url: str) -> str: + async with session.get(url, timeout=60*30) as response: + if response.status == 200: + ofile = f"{zipName}.zip" + with open(ofile, 'wb') as fd: + while True: + chunk = await response.content.read(1024*1024*1024) + if not chunk: + break + fd.write(chunk) + return ofile + return None + + +# Find artifact zip files, download them and return their URLs and contents +async def fetch_azure_zip_files(session: ClientSession, buildId: str) -> [(str, str)]: + artifacts = [] + + url = f"https://dev.azure.com/bioconda/bioconda-recipes/_apis/build/builds/{buildId}/artifacts?api-version=4.1" + log("contacting azure %s", url) + async with session.get(url) as response: + # Sometimes we get a 301 error, so there are no longer artifacts available + if response.status == 301: + return artifacts + res = await response.text() + + res_object = safe_load(res) + if res_object['count'] == 0: + return artifacts + + for artifact in res_object['value']: + zipName = artifact['name'] # LinuxArtifacts or OSXArtifacts + zipUrl = artifact['resource']['downloadUrl'] + log(f"zip name is {zipName} url {zipUrl}") + fname = await download_file(session, zipName, zipUrl) + if not fname: + continue + pkgsImages = list_zip_contents(fname) + for pkg in pkgsImages: + artifacts.append((zipUrl, pkg)) + + return artifacts + + +def parse_azure_build_id(url: str) -> str: + return re.search("buildId=(\d+)", url).group(1) + + +# Given a PR and commit sha, fetch a list of the artifact zip files URLs and their contents +async def fetch_pr_sha_artifacts(session: ClientSession, pr: int, sha: str) -> List[Tuple[str, str]]: + url = f"https://api.github.com/repos/bioconda/bioconda-recipes/commits/{sha}/check-runs" + + headers = { + "User-Agent": "BiocondaCommentResponder", + "Accept": "application/vnd.github.antiope-preview+json", + } + async with session.get(url, headers=headers) as response: + response.raise_for_status() + res = await response.text() + check_runs = safe_load(res) + + for check_run in check_runs["check_runs"]: + # The names are "bioconda.bioconda-recipes (test_osx test_osx)" or similar + if check_run["name"].startswith("bioconda.bioconda-recipes (test_"): + # The azure build ID is in the details_url as buildId=\d+ + buildID = parse_azure_build_id(check_run["details_url"]) + zipFiles = await fetch_azure_zip_files(session, buildID) + return zipFiles # We've already fetched all possible artifacts + + return [] + + +async def get_sha_for_status(job_context: Dict[str, Any]) -> Optional[str]: + if job_context["event_name"] != "status": + return None + log("Got %s event", "status") + event = job_context["event"] + if event["state"] != "success": + return None + branches = event.get("branches") + if not branches: + return None + sha: Optional[str] = branches[0]["commit"]["sha"] + log("Use %s event SHA %s", "status", sha) + return sha + + +async def get_sha_for_check_suite_or_workflow( + job_context: Dict[str, Any], event_name: str +) -> Optional[str]: + if job_context["event_name"] != event_name: + return None + log("Got %s event", event_name) + event_source = job_context["event"][event_name] + if event_source["conclusion"] != "success": + return None + sha: Optional[str] = event_source.get("head_sha") + if not sha: + pull_requests = event_source.get("pull_requests") + if pull_requests: + sha = pull_requests[0]["head"]["sha"] + if not sha: + return None + log("Use %s event SHA %s", event_name, sha) + return sha + + +async def get_sha_for_check_suite(job_context: Dict[str, Any]) -> Optional[str]: + return await get_sha_for_check_suite_or_workflow(job_context, "check_suite") + + +async def get_sha_for_workflow_run(job_context: Dict[str, Any]) -> Optional[str]: + return await get_sha_for_check_suite_or_workflow(job_context, "workflow_run") + + +async def get_prs_for_sha(session: ClientSession, sha: str) -> List[int]: + headers = { + "User-Agent": "BiocondaCommentResponder", + "Accept": "application/vnd.github.v3+json", + } + pr_numbers: List[int] = [] + per_page = 100 + for page in range(1, 20): + url = ( + "https://api.github.com/repos/bioconda/bioconda-recipes/pulls" + f"?per_page={per_page}" + f"&page={page}" + ) + async with session.get(url, headers=headers) as response: + response.raise_for_status() + res = await response.text() + prs = safe_load(res) + pr_numbers.extend(pr["number"] for pr in prs if pr["head"]["sha"] == sha) + if len(prs) < per_page: + break + return pr_numbers + + +async def get_sha_for_status_check(job_context: Dict[str, Any]) -> Optional[str]: + return await get_sha_for_status(job_context) or await get_sha_for_check_suite(job_context) + + +async def get_job_context() -> Any: + job_context = safe_load(os.environ["JOB_CONTEXT"]) + log("%s", job_context) + return job_context + + +async def get_pr_comment(job_context: Dict[str, Any]) -> Tuple[Optional[int], Optional[str]]: + event = job_context["event"] + if event["issue"].get("pull_request") is None: + return None, None + issue_number = event["issue"]["number"] + + original_comment = event["comment"]["body"] + log("the comment is: %s", original_comment) + return issue_number, original_comment diff --git a/images/bot/src/bioconda_bot/merge.py b/images/bot/src/bioconda_bot/merge.py new file mode 100644 index 00000000000..455c7f31d39 --- /dev/null +++ b/images/bot/src/bioconda_bot/merge.py @@ -0,0 +1,371 @@ +import logging +import os +import re +import sys +from asyncio import gather, sleep +from asyncio.subprocess import create_subprocess_exec +from enum import Enum, auto +from pathlib import Path +from shutil import which +from typing import Any, Dict, List, Optional, Set, Tuple +from zipfile import ZipFile, ZipInfo + +from aiohttp import ClientSession +from yaml import safe_load + +from .common import ( + async_exec, + fetch_pr_sha_artifacts, + get_job_context, + get_pr_comment, + get_pr_info, + is_bioconda_member, + send_comment, +) + +logger = logging.getLogger(__name__) +log = logger.info + + +class MergeState(Enum): + UNKNOWN = auto() + MERGEABLE = auto() + NOT_MERGEABLE = auto() + NEEDS_REVIEW = auto() + MERGED = auto() + + +# Ensure there's at least one approval by a member +async def approval_review(session: ClientSession, issue_number: int) -> bool: + token = os.environ["BOT_TOKEN"] + url = f"https://api.github.com/repos/bioconda/bioconda-recipes/pulls/{issue_number}/reviews" + headers = { + "Authorization": f"token {token}", + "User-Agent": "BiocondaCommentResponder", + } + async with session.get(url, headers=headers) as response: + response.raise_for_status() + res = await response.text() + reviews = safe_load(res) + + approved_reviews = [review for review in reviews if review["state"] == "APPROVED"] + if not approved_reviews: + return False + + # Ensure the review author is a member + return any( + gather( + *( + is_bioconda_member(session, review["user"]["login"]) + for review in approved_reviews + ) + ) + ) + + +# Check the mergeable state of a PR +async def check_is_mergeable( + session: ClientSession, issue_number: int, second_try: bool = False +) -> MergeState: + token = os.environ["BOT_TOKEN"] + # Sleep a couple of seconds to allow the background process to finish + if second_try: + await sleep(3) + + # PR info + url = f"https://api.github.com/repos/bioconda/bioconda-recipes/pulls/{issue_number}" + headers = { + "Authorization": f"token {token}", + "User-Agent": "BiocondaCommentResponder", + } + async with session.get(url, headers=headers) as response: + response.raise_for_status() + res = await response.text() + pr_info = safe_load(res) + + if pr_info.get("merged"): + return MergeState.MERGED + + # We need mergeable == true and mergeable_state == clean, an approval by a member and + if pr_info.get("mergeable") is None and not second_try: + return await check_is_mergeable(session, issue_number, True) + + # Check approved reviews beforehand because we (somehow?) get NOT_MERGEABLE otherwise. + if not await approval_review(session, issue_number): + return MergeState.NEEDS_REVIEW + + if ( + pr_info.get("mergeable") is None + or not pr_info["mergeable"] + or pr_info["mergeable_state"] != "clean" + ): + return MergeState.NOT_MERGEABLE + + return MergeState.MERGEABLE + + +# Ensure uploaded containers are in repos that have public visibility +# TODO: This should ping @bioconda/core if it fails +async def toggle_visibility(session: ClientSession, container_repo: str) -> None: + url = f"https://quay.io/api/v1/repository/biocontainers/{container_repo}/changevisibility" + QUAY_OAUTH_TOKEN = os.environ["QUAY_OAUTH_TOKEN"] + headers = { + "Authorization": f"Bearer {QUAY_OAUTH_TOKEN}", + "Content-Type": "application/json", + } + body = {"visibility": "public"} + rc = 0 + try: + async with session.post(url, headers=headers, json=body) as response: + rc = response.status + except: + # Do nothing + pass + log("Trying to toggle visibility (%s) returned %d", url, rc) + + +## Download an artifact from CircleCI, rename and upload it +#async def download_and_upload(session: ClientSession, x: str) -> None: +# basename = x.split("/").pop() +# # the tarball needs a regular name without :, the container needs pkg:tag +# image_name = basename.replace("%3A", ":").replace("\n", "").replace(".tar.gz", "") +# file_name = basename.replace("%3A", "_").replace("\n", "") +# +# async with session.get(x) as response: +# with open(file_name, "wb") as file: +# logged = 0 +# loaded = 0 +# while chunk := await response.content.read(256 * 1024): +# file.write(chunk) +# loaded += len(chunk) +# if loaded - logged >= 50 * 1024 ** 2: +# log("Downloaded %.0f MiB: %s", max(1, loaded / 1024 ** 2), x) +# logged = loaded +# log("Downloaded %.0f MiB: %s", max(1, loaded / 1024 ** 2), x) +# +# if x.endswith(".gz"): +# # Container +# log("uploading with skopeo: %s", file_name) +# # This can fail, retry with 5 second delays +# count = 0 +# maxTries = 5 +# success = False +# QUAY_LOGIN = os.environ["QUAY_LOGIN"] +# env = os.environ.copy() +# # TODO: Fix skopeo package to find certificates on its own. +# skopeo_path = which("skopeo") +# if not skopeo_path: +# raise RuntimeError("skopeo not found") +# env["SSL_CERT_DIR"] = str(Path(skopeo_path).parents[1].joinpath("ssl")) +# while count < maxTries: +# try: +# await async_exec( +# "skopeo", +# "--command-timeout", +# "600s", +# "copy", +# f"docker-archive:{file_name}", +# f"docker://quay.io/biocontainers/{image_name}", +# "--dest-creds", +# QUAY_LOGIN, +# env=env, +# ) +# success = True +# break +# except: +# count += 1 +# if count == maxTries: +# raise +# await sleep(5) +# if success: +# await toggle_visibility(session, basename.split("%3A")[0]) +# elif x.endswith(".bz2"): +# # Package +# log("uploading package") +# ANACONDA_TOKEN = os.environ["ANACONDA_TOKEN"] +# await async_exec("anaconda", "-t", ANACONDA_TOKEN, "upload", file_name, "--force") +# +# log("cleaning up") +# os.remove(file_name) + + +async def upload_package(session: ClientSession, zf: ZipFile, e: ZipInfo): + log(f"extracting {e.filename}") + fName = zf.extract(e) + + log(f"uploading {fName}") + ANACONDA_TOKEN = os.environ["ANACONDA_TOKEN"] + await async_exec("anaconda", "-t", ANACONDA_TOKEN, "upload", fName, "--force") + + log("cleaning up") + os.remove(fName) + + +async def upload_image(session: ClientSession, zf: ZipFile, e: ZipInfo): + basename = e.filename.split("/").pop() + image_name = basename.replace("\n", "").replace(".tar.gz", "") + + log(f"extracting {e.filename}") + fName = zf.extract(e) + # Skopeo can't handle a : in the file name, so we need to remove it + newFName = fName.replace(":", "") + os.rename(fName, newFName) + + log(f"uploading with skopeo: {newFName} {image_name}") + # This can fail, retry with 5 second delays + count = 0 + maxTries = 5 + success = False + QUAY_LOGIN = os.environ["QUAY_LOGIN"] + env = os.environ.copy() + # TODO: Fix skopeo package to find certificates on its own. + skopeo_path = which("skopeo") + if not skopeo_path: + raise RuntimeError("skopeo not found") + env["SSL_CERT_DIR"] = str(Path(skopeo_path).parents[1].joinpath("ssl")) + while count < maxTries: + try: + await async_exec( + "skopeo", + "--command-timeout", + "600s", + "copy", + f"docker-archive:{newFName}", + f"docker://quay.io/biocontainers/{image_name}", + "--dest-creds", + QUAY_LOGIN, + env=env, + ) + success = True + break + except: + count += 1 + if count == maxTries: + raise + await sleep(5) + if success: + await toggle_visibility(session, basename.split(":")[0] if ":" in basename else basename.split("%3A")[0]) + + log("cleaning up") + os.remove(newFName) + + +# Given an already downloaded zip file name in the current working directory, upload the contents +async def extract_and_upload(session: ClientSession, fName: str) -> int: + if os.path.exists(fName): + zf = ZipFile(fName) + for e in zf.infolist(): + if e.filename.endswith('.tar.bz2'): + await upload_package(session, zf, e) + elif e.filename.endswith('.tar.gz'): + await upload_image(session, zf, e) + return 0 + return 1 + + +# Upload artifacts to quay.io and anaconda, return the commit sha +# Only call this for mergeable PRs! +async def upload_artifacts(session: ClientSession, pr: int) -> str: + # Get last sha + pr_info = await get_pr_info(session, pr) + sha: str = pr_info["head"]["sha"] + + # Fetch the artifacts (a list of (URL, artifact) tuples actually) + artifacts = await fetch_pr_sha_artifacts(session, pr, sha) + artifacts = [artifact for (URL, artifact) in artifacts if artifact.endswith((".gz", ".bz2"))] + assert artifacts + + # Download/upload Artifacts + for zipFileName in ["LinuxArtifacts.zip", "OSXArtifacts.zip"]: + await extract_and_upload(session, zipFileName) + + return sha + + +# Assume we have no more than 250 commits in a PR, which is probably reasonable in most cases +async def get_pr_commit_message(session: ClientSession, issue_number: int) -> str: + token = os.environ["BOT_TOKEN"] + url = f"https://api.github.com/repos/bioconda/bioconda-recipes/pulls/{issue_number}/commits" + headers = { + "Authorization": f"token {token}", + "User-Agent": "BiocondaCommentResponder", + } + async with session.get(url, headers=headers) as response: + response.raise_for_status() + res = await response.text() + commits = safe_load(res) + message = "".join(f" * {commit['commit']['message']}\n" for commit in reversed(commits)) + return message + + +# Merge a PR +async def merge_pr(session: ClientSession, pr: int, init_message: str) -> MergeState: + token = os.environ["BOT_TOKEN"] + mergeable = await check_is_mergeable(session, pr) + log("mergeable state of %s is %s", pr, mergeable) + if mergeable is not MergeState.MERGEABLE: + return mergeable + + if init_message: + await send_comment(session, pr, init_message) + try: + log("uploading artifacts") + sha = await upload_artifacts(session, pr) + log("artifacts uploaded") + + # Carry over last 250 commit messages + msg = await get_pr_commit_message(session, pr) + + # Hit merge + url = f"https://api.github.com/repos/bioconda/bioconda-recipes/pulls/{pr}/merge" + headers = { + "Authorization": f"token {token}", + "User-Agent": "BiocondaCommentResponder", + } + payload = { + "sha": sha, + "commit_title": f"[ci skip] Merge PR {pr}", + "commit_message": f"Merge PR #{pr}, commits were: \n{msg}", + "merge_method": "squash", + } + log("Putting merge commit") + async with session.put(url, headers=headers, json=payload) as response: + rc = response.status + log("body %s", payload) + log("merge_pr the response code was %s", rc) + except: + await send_comment( + session, + pr, + "I received an error uploading the build artifacts or merging the PR!", + ) + logger.exception("Upload failed", exc_info=True) + return MergeState.MERGED + + +async def request_merge(session: ClientSession, pr: int) -> MergeState: + init_message = "I will attempt to upload artifacts and merge this PR. This may take some time, please have patience." + merged = await merge_pr(session, pr, init_message) + if merged is MergeState.NEEDS_REVIEW: + await send_comment( + session, + pr, + "Sorry, this PR cannot be merged until it's approved by a Bioconda member.", + ) + elif merged is MergeState.NOT_MERGEABLE: + await send_comment(session, pr, "Sorry, this PR cannot be merged at this time.") + return merged + + +# This requires that a JOB_CONTEXT environment variable, which is made with `toJson(github)` +async def main() -> None: + job_context = await get_job_context() + issue_number, original_comment = await get_pr_comment(job_context) + if issue_number is None or original_comment is None: + return + + comment = original_comment.lower() + if comment.startswith(("@bioconda-bot", "@biocondabot")): + if " please merge" in comment: + async with ClientSession() as session: + await request_merge(session, issue_number) diff --git a/images/bot/src/bioconda_bot/update.py b/images/bot/src/bioconda_bot/update.py new file mode 100644 index 00000000000..0af1f8db09e --- /dev/null +++ b/images/bot/src/bioconda_bot/update.py @@ -0,0 +1,78 @@ +import logging +import sys + +from aiohttp import ClientSession + +from .common import ( + async_exec, + get_job_context, + get_pr_comment, + get_pr_info, + send_comment, +) + +logger = logging.getLogger(__name__) +log = logger.info + + +# Update a branch from upstream master, this should be run in a try/catch +async def update_from_master_runner(session: ClientSession, pr: int) -> None: + async def git(*args: str) -> None: + return await async_exec("git", *args) + + # Setup git, otherwise we can't push + await git("config", "--global", "user.email", "biocondabot@gmail.com") + await git("config", "--global", "user.name", "BiocondaBot") + + pr_info = await get_pr_info(session, pr) + remote_branch = pr_info["head"]["ref"] + remote_repo = pr_info["head"]["repo"]["full_name"] + + max_depth = 2000 + # Clone + await git( + "clone", + f"--depth={max_depth}", + f"--branch={remote_branch}", + f"git@github.com:{remote_repo}.git", + "bioconda-recipes", + ) + + async def git_c(*args: str) -> None: + return await git("-C", "bioconda-recipes", *args) + + # Add/pull upstream + await git_c("remote", "add", "upstream", "https://github.com/bioconda/bioconda-recipes") + await git_c("fetch", f"--depth={max_depth}", "upstream", "master") + + # Merge + await git_c("merge", "upstream/master") + + await git_c("push") + + +# Merge the upstream master branch into a PR branch, leave a message on error +async def update_from_master(session: ClientSession, pr: int) -> None: + try: + await update_from_master_runner(session, pr) + except Exception as e: + await send_comment( + session, + pr, + "I encountered an error updating your PR branch. You can report this to bioconda/core if you'd like.\n-The Bot", + ) + sys.exit(1) + + +# This requires that a JOB_CONTEXT environment variable, which is made with `toJson(github)` +async def main() -> None: + job_context = await get_job_context() + issue_number, original_comment = await get_pr_comment(job_context) + if issue_number is None or original_comment is None: + return + + comment = original_comment.lower() + if comment.startswith(("@bioconda-bot", "@biocondabot")): + if "please update" in comment: + async with ClientSession() as session: + await update_from_master(session, issue_number) diff --git a/images/build.sh b/images/build.sh new file mode 100644 index 00000000000..caa695243eb --- /dev/null +++ b/images/build.sh @@ -0,0 +1,79 @@ +#!/bin/bash + +# This script builds multi-arch images and a manifest that points to them. The +# manifest can be then pushed to a registry with e.g. podman manifest push. +# +# Usage: +# +# build.sh +# +# The only arg directly provided to this script is the image directory, +# containing at least a Dockerfile. +# +# In that directory, if prepare.sh exists it will be sourced. Use prepare.sh to +# create all required env vars and do any image-specific prep work. +# +# Expected env vars to be populated by prepare.sh +# ----------------------------------------------- +# TAG: tag to build +# ARCHS: space-separated string of archs to build +# IMAGE_NAME: name of image; created manifest will be IMAGE_NAME:tag +# BUILD_ARGS: array of arguments like ("--build-arg=argument1=the-value", "--build-arg=arg2=a") + +set -xeu + +IMAGE_DIR=$1 + +cd $IMAGE_DIR + +[ -e prepare.sh ] && source prepare.sh + + +# Clean up any manifests before we start. +# IMAGE_NAME and TAG should be created by prepare.sh +buildah manifest rm "${IMAGE_NAME}:${TAG}" || true +buildah manifest create "${IMAGE_NAME}:${TAG}" + +# ARCHS should be created by prepare.sh +for arch in $ARCHS; do + + # This logic is specific to the build-env. We need an arch-specific base + # image, but the nomenclature is inconsistent. So we directly map arch names + # to conda-forge base images. + BASE_IMAGE_BUILD_ARG="" + if [ "${IS_BUILD_ENV:-false}" == "true" ]; then + if [ "$arch" == "amd64" ]; then + BASE_IMAGE_BUILD_ARG="--build-arg=base_image=quay.io/condaforge/linux-anvil-cos7-x86_64" + fi + if [ "$arch" == "arm64" ]; then + BASE_IMAGE_BUILD_ARG="--build-arg=base_image=quay.io/condaforge/linux-anvil-aarch64" + fi + fi + + # Actual building happens here. We will keep track of the built image in + # $image_id. + iidfile="$( mktemp )" + buildah bud \ + --arch="${arch}" \ + --iidfile="${iidfile}" \ + --file=Dockerfile \ + ${BUILD_ARGS[@]} \ + $BASE_IMAGE_BUILD_ARG + image_id="$( cat "${iidfile}" )" + rm "${iidfile}" + + # In order for GitHub Actions to inherit container permissions from the repo + # permissions, we need to add a special label. However `buildah config + # --label` operates on a container, not an image. So we add the label to + # a temporary container and then save the resulting image. + container="$( buildah from "${image_id}" )" + buildah config \ + --label="org.opencontainers.image.source=https://github.com/bioconda/bioconda-utils" \ + "${container}" + image_id="$( buildah commit "${container}" )" + buildah rm "${container}" + + # Add image to manifest + buildah tag "${image_id}" "${IMAGE_NAME}:${TAG}-${arch}" + buildah manifest add "${IMAGE_NAME}:${TAG}" "${image_id}" +done diff --git a/images/create-env/CHANGELOG.md b/images/create-env/CHANGELOG.md new file mode 100644 index 00000000000..cd5a8d32db5 --- /dev/null +++ b/images/create-env/CHANGELOG.md @@ -0,0 +1,152 @@ +# Changelog + + +## bioconda/create-env 3.0 (2023-10-17) + +### Changed + +- Add linux-aarch64 image; bioconda/create-env is now a multiplatform manifest. + +- Change to a simple "major.minor" version scheme and offer mutable "major" tag. + +- Drop defaults channel from included config. + +- Use Miniforge installer to build this image. + +- Rebuilt on the latest base image with Debian 12.2 / BusyBox 1.36.1. + +- Do not install findutils, sed if provided by the base image (as is currently). + + +## bioconda/create-env 2.2.1 (2022-10-14) + +### Changed + +- Limit open fd (ulimit -n) for strip (small number chosen arbitrarily). + + The container image itself had unstripped binaries in 2.2.0. + + +## bioconda/create-env 2.2.0 (2022-10-14) + +### Changed + +- Use the exact conda, mamba versions as used in bioconda-recipes' builds. + + +## bioconda/create-env 2.1.0 (2021-04-14) + +### Changed + +- Copy instead of hardlink licenses, exit on error + + Hardlink fails if copying spans cross devices (e.g., via bound volumes). + + +## bioconda/create-env 2.0.0 (2021-04-13) + +### Changed + +- Rename `--remove-files` to `--remove-paths` + +- Replace `--strip` by `--strip-files=GLOB` + +- Replace `CONDA_ALWAYS_COPY=1` usage by config option + +- Use `/bin/bash` for entrypoints + + `/bin/sh` fails on some Conda packages' activations scripts' Bashisms. + + +## bioconda/create-env 1.2.1 (2021-04-09) + +### Fixed + +- Fail `--strip` if `strip` is not available + +### Changed + +- Delete links/dirs for `--remove-files` + + +## bioconda/create-env 1.2.0 (2021-03-30) + +### Added + +- Add license copying + +- Add status messages + +- Add help texts + +### Changed + +- Suppress `bash -i` ioctl warning + + +## bioconda/create-env 1.1.1 (2021-03-27) + +### Changed + +- Use `CONDA_ALWAYS_COPY=1` + + +## bioconda/create-env 1.1.0 (2021-03-27) + +### Added + +- Add option to change `create --copy` + +### Changed + +- Rebuild with `python` pinned to `3.8` + + To avoid hitting + - https://github.com/conda/conda/issues/10490 + - https://bugs.python.org/issue43517 + + +## bioconda/create-env 1.0.2 (2021-03-22) + +### Changed + +- Rebuild on new Debian 10 base images + + +## bioconda/create-env 1.0.1 (2021-03-22) + +### Fixed + +- Use entrypoint from `/opt/create-env/` + + `/usr/local` gets "overwritten" (=bind-mounted) when building via mulled. + + +## bioconda/create-env 1.0.0 (2021-03-21) + +### Added + +- Initial release + + + diff --git a/images/create-env/Dockerfile b/images/create-env/Dockerfile new file mode 100644 index 00000000000..a84d9219dbc --- /dev/null +++ b/images/create-env/Dockerfile @@ -0,0 +1,38 @@ +ARG BUSYBOX_IMAGE +FROM ${BUSYBOX_IMAGE} as build + +WORKDIR /tmp/work +COPY install-conda print-env-activate create-env ./ +RUN arch="$( uname -m )" \ + && \ + wget --quiet -O ./miniconda.sh \ + "https://github.com/conda-forge/miniforge/releases/latest/download/Miniforge3-Linux-${arch}.sh" + +# Install exact versions of conda/mamba +ARG CONDA_VERSION +RUN echo -e "$CONDA_VERSION" > requirements.txt +RUN ./install-conda ./requirements.txt /opt/create-env + +ARG BUSYBOX_IMAGE +FROM ${BUSYBOX_IMAGE} +COPY --from=build /opt/create-env /opt/create-env + +# Copy (Bioconda-specific) Conda configuration created by the install-conda script. +COPY --from=build /root/.condarc /root/ + +RUN \ + # Use a per-user config (instead of conda config --sys) for more flexibility. + cp /root/.condarc /etc/skel/ \ + && \ + # Enable conda shell function for login shells. + ln -s /opt/create-env/etc/profile.d/conda.sh /etc/profile.d/ \ + && \ + # Enable conda function in interactive Bash (via .bashrc) and POSIX shells (via ENV). + printf '%s\n' \ + '\. /etc/profile.d/conda.sh' \ + | tee -a /root/.bashrc \ + >> /etc/skel/.bashrc +ENV ENV=/etc/profile.d/conda.sh + +ENTRYPOINT [ "/opt/create-env/bin/tini", "--", "/opt/create-env/env-execute" ] +CMD [ "bash" ] diff --git a/images/create-env/Dockerfile.test b/images/create-env/Dockerfile.test new file mode 100644 index 00000000000..f04649005ef --- /dev/null +++ b/images/create-env/Dockerfile.test @@ -0,0 +1,80 @@ +ARG base +ARG BUSYBOX_IMAGE +FROM "${base}" +RUN set -x && \ + CONDA_PKGS_DIRS="/tmp/pkgs" \ + /opt/create-env/env-execute \ + create-env \ + /usr/local \ + file findutils grep +RUN set -x && \ + . /usr/local/env-activate.sh && \ + if find /opt/create-env \ + -xdev \ + -type f \ + -exec file {} \+ \ + | grep 'not stripped' \ + ; then \ + >&2 printf 'found unstripped binaries\n' ; exit 1 \ + ; fi +RUN set -x && \ + . /usr/local/env-activate.sh && \ + if find /opt/create-env \ + -xdev \ + -type f \ + -name \*.a \ + | grep . \ + ; then \ + >&2 printf 'found static libraries\n' ; exit 1 \ + ; fi + + +FROM "${base}" as build_bioconda_package +RUN set -x && \ + /opt/create-env/env-execute \ + create-env \ + --strip-files=\* \ + /usr/local \ + python + +FROM "${BUSYBOX_IMAGE}" +COPY --from=build_bioconda_package /usr/local /usr/local +RUN set -x && \ + /usr/local/env-execute \ + python --version \ + && \ + [ ! "${CONDA_PREFIX}" = /usr/local ] \ + && \ + { set -x && . /usr/local/env-activate.sh && set +x ; } \ + && \ + [ "${CONDA_PREFIX}" = /usr/local ] \ + && \ + python --version + + +FROM "${base}" as build_conda +RUN set -x && \ + /opt/create-env/env-execute \ + create-env \ + --env-activate-args='--prefix-is-base' \ + --strip-files=\* \ + --remove-paths=\*.a \ + --remove-paths=\*.pyc \ + /opt/conda \ + conda + +FROM "${BUSYBOX_IMAGE}" +COPY --from=build_conda /opt/conda /opt/conda +COPY --from=build_conda /opt/conda/env-activate.sh /usr/local/ +RUN set -x && \ + /usr/local/env-execute \ + conda info --all \ + && \ + { set -x && . /usr/local/env-activate.sh && set +x ; } \ + && \ + . "${CONDA_PREFIX}/etc/profile.d/conda.sh" \ + && \ + conda activate \ + && \ + conda info \ + | grep 'base environment.*/opt/conda' diff --git a/images/create-env/README.md b/images/create-env/README.md new file mode 100644 index 00000000000..cc84f3b4765 --- /dev/null +++ b/images/create-env/README.md @@ -0,0 +1,96 @@ +# bioconda/create-env + +The `create-env` container image, available as [`quay.io/bioconda/create-env`](https://quay.io/repository/bioconda/create-env?tab=tags), provides [`conda`](https://github.com/conda/conda/) alongside a convenience wrapper `create-env` to create small container images based on Conda packages. + + +## Options + +`create-env` runs `conda create` for a given `PREFIX` plus a set of packages and (optionally) runs post-processing steps on the created environment. + +Post-processing steps are triggered by arguments to `create-env`: + +- `--env-activate-script=FILE`: + + Create a shell activation script `FILE` (defaults to `PREFIX/env-activate.sh`) which contains the environment activation instructions as executed per `conda activate PREFIX`. + + Example usage: `sh -c '. PREFIX/env-activate.sh && command-to-run-from-PREFIX'`. + +- `--env-execute-script=FILE`: + + Create an executable `FILE` (defaults to `PREFIX/env-execute`) which runs a given program in the activated `PREFIX` environment. + + Example usage: `PREFIX/env-execute command-to-run-from-PREFIX`. + +- `--remove-paths=GLOB`: + + Remove some paths from `PREFIX` to reduce the target container image size. + +- `--strip-files=GLOB`: + + Run [`strip`](https://sourceware.org/binutils/docs/binutils/strip.html) on files in `PREFIX` whose paths match `GLOB` to reduce the target container image size. + +- `licenses-path=PATH`: + + Directory in which to copy license files for the installed packages (defaults to `PREFIX/conda-meta`). + + +## Usage example: +```Dockerfile +FROM quay.io/bioconda/create-env:2.1.0 as build +# Create an environment containing python=3.9 at /usr/local, strip +# files and remove some less important files: +RUN export CONDA_ADD_PIP_AS_PYTHON_DEPENDENCY=0 \ + && \ + /opt/create-env/env-execute \ + create-env \ + --strip-files='bin/*' \ + --strip-files='lib/*' \ + --remove-paths='*.a' \ + --remove-paths='share/terminfo/[!x]*' \ + /usr/local \ + python=3.9 + +# The base image below (quay.io/bioconda/base-glibc-busybox-bash:2.1.0) defines +# /usr/local/env-execute as the ENTRYPOINT so that created containers always +# start in an activated environment. +FROM quay.io/bioconda/base-glibc-busybox-bash:2.1.0 as target +COPY --from=build /usr/local /usr/local + +FROM target as test +RUN /usr/local/env-execute python -c 'import sys; print(sys.version)' +RUN /usr/local/env-activate.sh && python -c 'import sys; print(sys.version)' + +# Build and test with, e.g.: +# buildah bud --target=target --tag=localhost/python:3.9 . +# podman run --rm localhost/python:3.9 python -c 'import sys; print(sys.version)' +``` + +## Miscellaneous information: + +- Run `podman run --rm quay.io/bioconda/create-env create-env --help` for usage information. + +- Run `podman run --rm quay.io/bioconda/create-env conda config --show-sources` to see predefined configuration options. + +- The environment in which `create-env` runs has been itself created by `create-env`. + As such, `/opt/create-env/env-activate.sh` and `/opt/create-env/env-execute` scripts can be used to activate/execute in `create-env`'s environment in a `Dockerfile` context. + In other contexts when a container is run via the image's entrypoint, the environments is activated automatically. + + The separate `/opt/create-env` path is used to avoid collisions with environments created at, e.g., `/usr/local` or `/opt/conda`. + +- By default, package files are copied rather than hard-linked to avoid altering Conda package cachge files when running `strip`. + + If the target image should contain multiple environments, it is advisable to set `CONDA_ALWAYS_COPY=0` to allow hardlinks between the environments (to reduce the overall image size) and run `strip` after the environments have been created. + This can be done by invoking `create-env` twice whilst omitting the environment creation during the second invocation (using `--conda=:`). + + E.g.: + ```sh + . /opt/create-env/env-activate.sh + export CONDA_ALWAYS_COPY=0 + create-env --conda=: --strip-files=\* /opt/python-3.8 + create-env --conda=: --strip-files=\* /opt/python-3.9 + ``` + +- Container images created as in the example above are meant to be lightweight and as such do **not** contain `conda`. + Hence, there is no `conda activate PREFIX` available but only the source-able `PREFIX/env-activate.sh` scripts and the `PREFIX/env-execute` launchers. + These scripts are generated at build time and assume no previously activated Conda environment. + Likewise, the environments are not expected to be deactivated, which is why no corresponding deactivate scripts are provided. diff --git a/images/create-env/create-env b/images/create-env/create-env new file mode 100755 index 00000000000..fde5bffc334 --- /dev/null +++ b/images/create-env/create-env @@ -0,0 +1,242 @@ +#! /bin/sh -eu + +for arg do + case "${arg}" in + --help ) + cat <<'end-of-help' +Usage: create-env [OPTIONS]... [--] PREFIX [CONDA_CREATE_ARGS]... +Use conda (or mamba via --conda=mamba) to create a Conda environment at PREFIX +according to specifications given by CONDA_CREATE_ARGS. + + --conda=CONDA Conda implementation to run CONDA CREATE for. + E.g.: "conda", "mamba", "conda env", "mamba env". + Use ":" to skip env creation. (default: conda) + --create-command=CREATE Conda command to run. E.g.: "create", "install". + (default: create) + --env-activate-args=ARGS Single string of arguments to pass on to + print-env-activate. (default: --prefix=PREFIX) + --env-activate-script=FILE Destination path of environment activation + script. (default: PREFIX/env-activate.sh) + --env-execute-script=FILE Destination path of environment execution script. + (default: PREFIX/env-execute) + --remove-paths=GLOB Glob of paths to remove from PREFIX after its + creation. Can be passed on multiple times. Will + be passed on to `find -path PREFIX/GLOB`. + (no default) + --strip-files=GLOB Glob of paths in PREFIX to run `strip` on. Will + be passed on to `find -type f -path PREFIX/GLOB`. + Error messages from `strip` are suppressed, i.e., + --strip-files=* may be used to run `strip` on all + files. Can be passed on multiple times. + (no default) + --licenses-path=PATH Destination path to copy package license files + to (relative to PREFIX or absolute). Pass on + empty path (--licenses-path=) to skip copying. + (default: conda-meta) +end-of-help + exit 0 ;; + --conda=* ) + conda_impl="${arg#--conda=}" + shift ;; + --create-command=* ) + create_command="${arg#--create-command=}" + shift ;; + --env-activate-args=* ) + env_activate_args="${arg#--env-activate-args=}" + shift ;; + --env-activate-script=* ) + env_activate_file="${arg#--env-activate-script=}" + shift ;; + --env-execute-script=* ) + env_execute_file="${arg#--env-execute-script=}" + shift ;; + --remove-paths=* ) + remove_paths_globs="$( + printf '%s\n' \ + ${remove_paths_globs+"${remove_paths_globs}"} \ + "${arg#--remove-paths=}" + )" + shift ;; + --strip-files=* ) + strip_files_globs="$( + printf '%s\n' \ + ${strip_files_globs+"${strip_files_globs}"} \ + "${arg#--strip-files=}" + )" + shift ;; + --licenses-path=* ) + licenses_path="${arg#--licenses-path=}" + shift ;; + -- ) + break ;; + -* ) + printf 'unknown option: %s\n' "${arg}" + exit 1 ;; + * ) + break + esac +done + +if [ $# -eq 0 ] ; then + printf 'missing argument: environment path\n' + exit 1 +fi + +prefix="${1%%/}" +shift + +conda_impl="${conda_impl:-conda}" +create_command="${create_command-create}" +env_activate_args="--prefix='${prefix}' ${env_activate_args-}" +env_activate_file="${env_activate_file-"${prefix}/env-activate.sh"}" +env_execute_file="${env_execute_file-"${prefix}/env-execute"}" +remove_paths_globs="$( printf '%s\n' "${remove_paths_globs-}" | sort -u )" +strip_files_globs="$( printf '%s\n' "${strip_files_globs-}" | sort -u )" +licenses_path="${licenses_path-conda-meta}" + + +set +u +eval "$( conda shell.posix activate base )" +set -u + +printf 'creating environment at %s ...\n' "${prefix}" 1>&2 +CONDA_YES=1 \ + ${conda_impl} \ + ${create_command} \ + --prefix="${prefix}" \ + "${@}" + +if [ -n "${env_activate_file}${env_execute_file}" ] ; then + printf 'generating activation script...\n' 1>&2 + activate_script="$( + eval "set -- ${env_activate_args}" + print-env-activate "${@}" + )" + if [ -n "${env_activate_file-}" ] ; then + printf 'writing activation script to %s ...\n' "${env_activate_file}" 1>&2 + printf '%s\n' \ + "${activate_script}" \ + > "${env_activate_file}" + activate_script=". '${env_activate_file}'" + fi + if [ -n "${env_execute_file-}" ] ; then + printf 'writing execution script to %s ...\n' "${env_execute_file}" 1>&2 + printf '%s\n' \ + '#! /bin/bash' \ + "${activate_script}" \ + 'exec "${@}"' \ + > "${env_execute_file}" + chmod +x "${env_execute_file}" + fi +fi + + +if [ -n "${remove_paths_globs}" ] ; then + printf 'removing paths from %s ...\n' "${prefix}" 1>&2 + ( + eval "set -- $( + printf %s "${remove_paths_globs}" \ + | sed -e "s|.*|-path '${prefix}/&'|" -e '1!s/^/-o /' \ + | tr '\n' ' ' + )" + find "${prefix}" \ + \( "${@}" \) \ + -delete + ) +fi + +if [ -n "${strip_files_globs}" ] ; then + # Ensure "strip" is available beforehand because errors are ignored later on. + strip --version > /dev/null + printf 'stripping binaries in %s ...\n' "${prefix}" 1>&2 + ( + eval "set -- $( + printf %s "${strip_files_globs}" \ + | sed -e "s|.*|-path '${prefix}/&'|" -e '1!s/^/-o /' \ + | tr '\n' ' ' + )" + # Strip binaries. (Run strip on all files; ignore errors for non-ELF files.) + # Limit open fds (ulimit -n) for strip (small number chosen arbitrarily). + # (To avoid "could not create temporary file to hold stripped copy: Too many open files") + + # Filter out the binaries currently in use by the pipeline via sed below. + skip_inode_expressions="$( + command -v -- find xargs sed strip \ + | xargs -- stat -L -c '-e /^%d,%i:/d' -- + )" + find "${prefix}" \ + -type f \ + \( "${@}" \) \ + -print0 \ + | xargs \ + -0 \ + -n 64 \ + -- \ + stat -L -c '%d,%i:%n' -- \ + | sed \ + ${skip_inode_expressions} \ + -e 's/^[^:]*://' \ + | tr \\n \\0 \ + | + xargs \ + -0 \ + -n 64 \ + -- \ + strip -- \ + 2>&1 \ + | sed '/: file format not recognized/d' \ + || true + ) +fi + + +if [ -n "${licenses_path}" ] ; then + abs_licenses_path="$( + cd "${prefix}" + mkdir -p "${licenses_path}" + cd "${licenses_path}" + pwd + )" + printf 'copying license files to %s ...\n' "${abs_licenses_path}" 1>&2 + pkgs_dirs="$( + conda config --show pkgs_dirs \ + | sed -n 's|[^/]*\(/.*\)|"\1"|p' \ + | tr '\n' ' ' + )" + ( + eval "set -- $( + find "${prefix}/conda-meta" \ + -maxdepth 1 \ + -name \*.json \ + | sed 's|.*/\(.*\)\.json|"\1"|' \ + | tr '\n' ' ' + )" + for pkg do + pkg_info="$( + eval "set -- ${pkgs_dirs}" + for pkgs_dir ; do + if [ -d "${pkgs_dir}/${pkg}/info" ] ; then + printf %s "${pkgs_dir}/${pkg}/info" + exit + fi + done + printf 'missing metadata for %s\n' "${pkg}" 1>&2 + exit 1 + )" + find "${pkg_info}" \ + -maxdepth 1 \ + \( -name LICENSE.txt -o -name licenses \) \ + -exec sh -ec ' + dest_dir="${1}" ; shift + mkdir -p "${dest_dir}" + cp -fR "${@}" "${dest_dir}/" + ' -- "${abs_licenses_path}/${pkg}" {} \+ \ + || { + printf 'failed to copy licenses for %s\n' "${pkg}" 1>&2 + exit 1 + } + done + ) +fi + +printf 'finished create-env for %s\n' "${prefix}" 1>&2 diff --git a/images/create-env/install-conda b/images/create-env/install-conda new file mode 100755 index 00000000000..7ce597bc323 --- /dev/null +++ b/images/create-env/install-conda @@ -0,0 +1,123 @@ +#! /bin/bash -eux + +requirements_file="${1}" +conda_install_prefix="${2}" + +# Install a bootstrap Miniconda installation. +miniconda_boostrap_prefix="$( pwd )/miniconda" +# Run the following in a subshell to avoid environment changes from bootstrap. +( + + # Use the base image-provided tools if they work for us: + tools='' + find -print0 -maxdepth 0 && xargs -0 true < /dev/null \ + || tools="${tools} findutils" + sed -e '' < /dev/null \ + || tools="${tools} sed" + + sh ./miniconda.sh \ + -b \ + -p "${miniconda_boostrap_prefix}" + + # Install the base Conda installation. + . "${miniconda_boostrap_prefix}/etc/profile.d/conda.sh" + + # Install conda and some additional tools: + # - tini: init program, + # - binutils, findutils: tools to strip down image/environment size, + + # Only need `strip` executable from binutils. Other binaries from the package + # and especially the "sysroot" dependency is only bloat for this container + # image. (NOTE: The binary needs libgcc-ng which is explicitly added later.) + conda create --yes \ + --prefix="${conda_install_prefix}" \ + --channel=conda-forge \ + binutils + cp -aL "${conda_install_prefix}/bin/strip" ./strip + conda run --prefix="${conda_install_prefix}" strip -- ./strip + conda remove --yes --all \ + --prefix="${conda_install_prefix}" + + conda create --yes \ + --prefix="${conda_install_prefix}" \ + --channel=conda-forge \ + \ + --file="${requirements_file}" \ + \ + tini \ + \ + libgcc-ng \ + ${tools} \ + ; + + mv \ + ./print-env-activate \ + ./create-env \ + ./strip \ + "${conda_install_prefix}/bin/" +) + +# Activate the new base environment. +activate_script="$( + "${conda_install_prefix}/bin/conda" shell.posix activate base +)" +set +u +eval "${activate_script}" +set -u +unset activate_script + +# Strip find/xargs/sed beforehand as they are excluded in the strip pipeline. +for prog in find xargs sed ; do + case "$( command -v "${prog}" )" in + "${conda_install_prefix%%/}"/* ) + strip -- "$( command -v "${prog}" )" + esac +done + +# Use --conda=: to turn the `conda create` into a no-op, but do continue to +# run strip, remove files and output the activate/execute scripts. +CONDA_PKGS_DIRS="${miniconda_boostrap_prefix}/pkgs" \ + create-env \ + --conda=: \ + --strip-files=\* \ + --remove-paths=\*.a \ + --remove-paths=\*.pyc \ + --env-activate-args=--prefix-is-base \ + "${conda_install_prefix}" + +# Remove bootstrap Miniconda files. +rm -rf "${miniconda_boostrap_prefix}" + +# Add standard Bioconda config to root's Conda config. +conda config \ + --append channels conda-forge \ + --append channels bioconda \ + ; +conda config \ + --remove channels defaults \ + 2> /dev/null \ + || true +conda config \ + --remove repodata_fns current_repodata.json \ + 2> /dev/null \ + || true +conda config \ + --prepend repodata_fns repodata.json + +# Use `always_copy` to cut links to package cache. +# (Which is esp. important if files are manipulated via --strip-files !) +conda config \ + --set always_copy true \ + --set allow_softlinks false + + +# Log information of the newly created Conda installation. +# NB: Running conda after the .pyc removal will recreate some .pyc files. +# This is intentional as it speeds up conda startup time. +conda list --name=base +conda info --all +# Make sure we have the requested conda version installed, and no mamba +conda list \ + --export '^(conda|mamba)$' \ + | sed -n 's/=[^=]*$//p' \ + | diff "${requirements_file}" - diff --git a/images/create-env/prepare.sh b/images/create-env/prepare.sh new file mode 100644 index 00000000000..d98ad01b4fd --- /dev/null +++ b/images/create-env/prepare.sh @@ -0,0 +1,39 @@ +source ../versions.sh +IMAGE_NAME="${CREATE_ENV_IMAGE_NAME}" +TAG=$BIOCONDA_IMAGE_TAG +BUILD_ARGS=() + + + +# Get the exact versions of mamba and conda that were installed in build-env. +# +# If this tag exists on quay.io (that is, this create-env is being built in +# a subsequent run), then use that. Otherwise, we assume this tag has already +# been built locally (and the GitHub Actions job dependency should reflect +# this) +if [ $(tag_exists $BUILD_ENV_IMAGE_NAME $BIOCONDA_IMAGE_TAG) ]; then + REGISTRY=quay.io/bioconda +else + REGISTRY=ghcr.io/bioconda +fi + +CONDA_VERSION=$( + podman run -t $REGISTRY/${BUILD_ENV_IMAGE_NAME}:${BIOCONDA_IMAGE_TAG} \ + bash -c "/opt/conda/bin/conda list --export '^conda$'| sed -n 's/=[^=]*$//p'" +) +# Remove trailing \r with parameter expansion +export CONDA_VERSION=${CONDA_VERSION%$'\r'} + +BUILD_ARGS+=("--build-arg=CONDA_VERSION=$CONDA_VERSION") + +# Needs busybox image to copy some items over +if [ $(tag_exists $BASE_BUSYBOX_IMAGE_NAME $BASE_TAG) ]; then + REGISTRY=quay.io/bioconda +else + REGISTRY=ghcr.io/bioconda +fi + +BUILD_ARGS+=("--build-arg=BUSYBOX_IMAGE=${REGISTRY}/${BASE_BUSYBOX_IMAGE_NAME}:${BASE_TAG}") + +# TEST_BUILD_ARGS=() +# TEST_BUILD_ARGS+=("--build-arg=BUSYBOX_IMAGE=$BUSYBOX_IMAGE") diff --git a/images/create-env/print-env-activate b/images/create-env/print-env-activate new file mode 100755 index 00000000000..fbaa4a405b2 --- /dev/null +++ b/images/create-env/print-env-activate @@ -0,0 +1,95 @@ +#! /bin/bash -eu + +for arg do + case "${arg}" in + --help ) + cat <<'end-of-help' +Usage: print-env-activate [OPTIONS]... [--] [PREFIX] +Print shell activation script contents conda creates for environment at PREFIX. + + --prefix=PREFIX Optionally pass on PREFIX path as option-argument + instead of operand. + --prefix-is-base[=yes|=no] Specify if PREFIX is a base environment and use + `PREFIX/bin/conda` to create a full base + environment activation script. (default: no) +end-of-help + exit 0 ;; + --prefix=* ) + prefix="${arg#--prefix=}" + shift ;; + --prefix-is-base=yes | --prefix-is-base ) + prefix_is_base=1 + shift ;; + --prefix-is-base=no ) + prefix_is_base=0 + shift ;; + -- ) + break ;; + -* ) + printf 'unknown option: %s\n' "${arg}" + exit 1 ;; + * ) + break + esac +done + +if [ -z "${prefix:-}" ] ; then + prefix="${1}" + shift +fi + +if [ $# -ne 0 ] ; then + printf 'excess argument: %s\n' "${@}" + exit +fi + +if [ "${prefix_is_base-}" = 1 ] ; then + conda_exe="${prefix}/bin/conda" +else + conda_exe="$( command -v conda )" +fi + +# Deactivate current active env for full `conda shell.posix activate` changes. +deactivate_script="$( + conda shell.posix deactivate +)" +if [ "${prefix_is_base-}" = 1 ] ; then + deactivate_script="$( + printf %s "${deactivate_script}" \ + | sed "s|/[^\"'=:]*/condabin:||g" + )" +fi +set +u +eval "${deactivate_script}" +set -u +unset deactivate_script + +# NOTE: The following gets a proper PS1 value from an interactive Bash which +# `conda shell posix.activate` can reuse. +# NB: Ideally, conda activate should not use the current PS1 but rather write +# out something like PS1="${CONDA_PROMPT_MODIFIER}${PS1}". +# (Also, running this in the build instead of final container might not +# reflect the actual PS1 the target container image would provide.) +PS1="$( + bash -ic 'printf %s "${PS1}"' 2>/dev/null + printf . +)" +PS1="${PS1%.}" + +activate_script="$( + export PS1 + if [ ! "${prefix_is_base-}" = 1 ] ; then + export CONDA_ENV_PROMPT= + fi + "${conda_exe}" shell.posix activate "${prefix}" +)" + +printf '%s\n' "${activate_script}" \ + | { + if [ "${prefix_is_base-}" = 1 ] ; then + cat + else + grep -vE '^export (_CE_M|_CE_CONDA|CONDA_EXE|CONDA_PYTHON_EXE)=' \ + | sed "s|/[^\"'=:]*/condabin:||g" + fi + } diff --git a/images/locale/C.utf8/LC_ADDRESS b/images/locale/C.utf8/LC_ADDRESS new file mode 100644 index 00000000000..c4b6714c7a4 Binary files /dev/null and b/images/locale/C.utf8/LC_ADDRESS differ diff --git a/images/locale/C.utf8/LC_COLLATE b/images/locale/C.utf8/LC_COLLATE new file mode 100644 index 00000000000..b36405433f1 Binary files /dev/null and b/images/locale/C.utf8/LC_COLLATE differ diff --git a/images/locale/C.utf8/LC_CTYPE b/images/locale/C.utf8/LC_CTYPE new file mode 100644 index 00000000000..cba1025364b Binary files /dev/null and b/images/locale/C.utf8/LC_CTYPE differ diff --git a/images/locale/C.utf8/LC_IDENTIFICATION b/images/locale/C.utf8/LC_IDENTIFICATION new file mode 100644 index 00000000000..fa899b0a7e1 Binary files /dev/null and b/images/locale/C.utf8/LC_IDENTIFICATION differ diff --git a/images/locale/C.utf8/LC_MEASUREMENT b/images/locale/C.utf8/LC_MEASUREMENT new file mode 100644 index 00000000000..5325e195580 Binary files /dev/null and b/images/locale/C.utf8/LC_MEASUREMENT differ diff --git a/images/locale/C.utf8/LC_MESSAGES/SYS_LC_MESSAGES b/images/locale/C.utf8/LC_MESSAGES/SYS_LC_MESSAGES new file mode 100644 index 00000000000..8843f43def7 Binary files /dev/null and b/images/locale/C.utf8/LC_MESSAGES/SYS_LC_MESSAGES differ diff --git a/images/locale/C.utf8/LC_MONETARY b/images/locale/C.utf8/LC_MONETARY new file mode 100644 index 00000000000..cecafe1b1d4 Binary files /dev/null and b/images/locale/C.utf8/LC_MONETARY differ diff --git a/images/locale/C.utf8/LC_NAME b/images/locale/C.utf8/LC_NAME new file mode 100644 index 00000000000..cafa1edd3a1 Binary files /dev/null and b/images/locale/C.utf8/LC_NAME differ diff --git a/images/locale/C.utf8/LC_NUMERIC b/images/locale/C.utf8/LC_NUMERIC new file mode 100644 index 00000000000..23ba63a16af Binary files /dev/null and b/images/locale/C.utf8/LC_NUMERIC differ diff --git a/images/locale/C.utf8/LC_PAPER b/images/locale/C.utf8/LC_PAPER new file mode 100644 index 00000000000..18cfad8afdf Binary files /dev/null and b/images/locale/C.utf8/LC_PAPER differ diff --git a/images/locale/C.utf8/LC_TELEPHONE b/images/locale/C.utf8/LC_TELEPHONE new file mode 100644 index 00000000000..1042aff9e17 Binary files /dev/null and b/images/locale/C.utf8/LC_TELEPHONE differ diff --git a/images/locale/C.utf8/LC_TIME b/images/locale/C.utf8/LC_TIME new file mode 100644 index 00000000000..5eb2a8a6efc Binary files /dev/null and b/images/locale/C.utf8/LC_TIME differ diff --git a/images/locale/Dockerfile b/images/locale/Dockerfile new file mode 100644 index 00000000000..fcc9124e9ae --- /dev/null +++ b/images/locale/Dockerfile @@ -0,0 +1,21 @@ +# Generate UTF-8 local to be used in other images + +FROM "debian:12.1-slim" +RUN apt-get update -qq \ + && \ + # Add en_US.UTF-8 locale. + printf '%s\n' 'en_US.UTF-8 UTF-8' \ + >> /etc/locale.gen \ + && \ + DEBIAN_FRONTEND=noninteractive \ + apt-get install --yes --no-install-recommends \ + locales \ + && \ + # Remove "locales" package, but keep the generated locale. + sed -i \ + 's/\s*rm .*locale-archive$/: &/' \ + /var/lib/dpkg/info/locales.prerm \ + && \ + DEBIAN_FRONTEND=noninteractive \ + apt-get remove --yes \ + locales diff --git a/images/locale/generate_locale.sh b/images/locale/generate_locale.sh new file mode 100644 index 00000000000..9b91b2bfbeb --- /dev/null +++ b/images/locale/generate_locale.sh @@ -0,0 +1,5 @@ +#!/bin/bash + +iidfile="$( mktemp )" +buildah bud --iidfile="${iidfile}" --file=Dockerfile +podman run -v $(pwd):/tmp "$( cat $iidfile )" cp -r /usr/lib/locale/C.utf8 /tmp diff --git a/images/versions.sh b/images/versions.sh new file mode 100644 index 00000000000..ea99c0b00db --- /dev/null +++ b/images/versions.sh @@ -0,0 +1,80 @@ +#!/bin/bash + +# Configures various versions to be used throughout infrastructure +ARCHS="amd64 arm64" +DEBIAN_VERSION=12.2 +BUSYBOX_VERSION=1.36.1 +BASE_DEBIAN_IMAGE_NAME="tmp-debian" +BASE_BUSYBOX_IMAGE_NAME="tmp-busybox" +BUILD_ENV_IMAGE_NAME="tmp-build-env" +CREATE_ENV_IMAGE_NAME="tmp-create-env" +BASE_TAG="0.2" + +# Inspect this repo to get the currently-checked-out version, but if +# BIOCONDA_UTILS_VERSION was set outside this script, use that instead. +BIOCONDA_UTILS_VERSION=${BIOCONDA_UTILS_VERSION:-$(git describe --tags --dirty --always)} + +# This will be used as the tag for create-env and build-env images, which +# depend on bioconda-utils +BIOCONDA_IMAGE_TAG=${BIOCONDA_UTILS_VERSION}_base${BASE_TAG} + +# FUNCTIONS -------------------------------------------------------------------- + +function tag_exists () { + # Returns 0 if the tag for the image exists on quay.io, otherwise returns 1. + # Skips "latest" tags (likely they will always be present) + # $1: image name + # $2: tags + local IMAGE_NAME="$1" + local TAGS="$2" + + response="$(curl -sL "https://quay.io/api/v1/repository/bioconda/${IMAGE_NAME}/tag/")" + + # Images can be set to expire; the jq query selects only non-expired images. + existing_tags="$( + printf %s "${response}" \ + | jq -r '.tags[]|select(.end_ts == null or .end_ts >= now)|.name' + )" \ + || { + printf %s\\n \ + 'Could not get list of image tags.' \ + 'Does the repository exist on Quay.io?' \ + 'Quay.io REST API response was:' \ + "${response}" >&2 + return 1 + } + for tag in $TAGS ; do + case "${tag}" in + "latest" ) ;; + * ) + if printf %s "${existing_tags}" | grep -qxF "${tag}" ; then + printf 'Tag %s already exists for %s on quay.io!\n' "${tag}" "${IMAGE_NAME}" >&2 + echo "exists" + fi + esac + done +} + +# Helper function to push a just-built image to GitHub Container +# Respository, which is used as a temporary storage mechanism. +function push_to_ghcr () { + podman manifest push localhost/${1}:${2} ghcr.io/bioconda/${1}:${2} +} + +# Helper function to move an image from gchr to quay.io for public use. +function move_from_ghcr_to_quay () { + local image_name=$1 + local tag=$2 + + # Locally-named manifest to which we'll add the different archs. + buildah manifest create "local_${image_name}:${tag}" + + # Expects images for archs to be built already; add them to local manifest. + for arch in $ARCHS; do + imgid=$(buildah pull --arch=$arch "ghcr.io/bioconda/${image_name}:${tag}") + buildah manifest add "local_${image_name}:${tag}" "${imgid}" + done + + # Publish + podman manifest push "local_${image_name}:${tag}" "quay.io/bioconda/${image_name}:${tag}" +} diff --git a/test/test_utils.py b/test/test_utils.py index 4ec044dd7f8..ab63850e176 100644 --- a/test/test_utils.py +++ b/test/test_utils.py @@ -39,7 +39,7 @@ # docker, once without). On OSX, only the non-docker runs. # Docker ref for build container -DOCKER_BASE_IMAGE = "quay.io/bioconda/bioconda-utils-test-env-cos7:latest" +DOCKER_BASE_IMAGE = "quay.io/bioconda/bioconda-utils-build-env-cos7:latest" SKIP_DOCKER_TESTS = sys.platform.startswith('darwin') SKIP_NOT_OSX = not sys.platform.startswith('darwin')