-
Notifications
You must be signed in to change notification settings - Fork 59
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Co-authored-by: Ruinong Tian <[email protected]>
- Loading branch information
Showing
20 changed files
with
1,194 additions
and
8 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,24 @@ | ||
# Change log: 0.13.0(cpu) | ||
|
||
## Upgrades: | ||
|
||
Package | Previous Version | Current Version | ||
---|---|--- | ||
python|3.8.18|3.11.9 | ||
ipython|8.12.2|8.26.0 | ||
jinja2|3.1.3|3.1.4 | ||
ipywidgets|7.8.0|7.8.3 | ||
numpy|1.24.4|1.26.4 | ||
pandas|2.0.3|2.2.2 | ||
boto3|1.34.36|1.34.151 | ||
aws-glue-sessions|1.0.4|1.0.6 | ||
keras|2.13.1|2.15.0 | ||
matplotlib|3.7.3|3.9.1 | ||
scipy|1.10.1|1.14.0 | ||
scikit-learn|1.3.2|1.5.1 | ||
pytorch|2.0.0|2.1.2 | ||
sagemaker-headless-execution-driver|0.0.12|0.0.13 | ||
sagemaker-python-sdk|2.206.0|2.227.0 | ||
sagemaker-studio-analytics-extension|0.0.21|0.1.2 | ||
tensorflow|2.13.1|2.15.0 | ||
torchvision|0.15.2|0.16.1 |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,22 @@ | ||
# Change log: 0.13.0(gpu) | ||
|
||
## Upgrades: | ||
|
||
Package | Previous Version | Current Version | ||
---|---|--- | ||
python|3.8.18|3.11.9 | ||
ipython|8.12.2|8.26.0 | ||
jinja2|3.1.3|3.1.4 | ||
ipywidgets|7.8.0|7.8.3 | ||
numpy|1.24.4|1.26.4 | ||
pandas|2.0.3|2.2.2 | ||
boto3|1.34.36|1.34.151 | ||
aws-glue-sessions|1.0.4|1.0.6 | ||
keras|2.13.1|2.14.0 | ||
matplotlib|3.7.3|3.9.1 | ||
scipy|1.10.1|1.14.0 | ||
scikit-learn|1.3.2|1.5.1 | ||
sagemaker-headless-execution-driver|0.0.12|0.0.13 | ||
sagemaker-python-sdk|2.206.0|2.227.0 | ||
sagemaker-studio-analytics-extension|0.0.21|0.1.2 | ||
tensorflow|2.13.1|2.14.0 |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,152 @@ | ||
ARG TAG_FOR_BASE_MICROMAMBA_IMAGE | ||
FROM mambaorg/micromamba:$TAG_FOR_BASE_MICROMAMBA_IMAGE | ||
|
||
ARG CUDA_MAJOR_MINOR_VERSION='' | ||
ARG ENV_IN_FILENAME | ||
ARG ARG_BASED_ENV_IN_FILENAME | ||
|
||
|
||
ARG NB_USER="sagemaker-user" | ||
ARG NB_UID=1000 | ||
ARG NB_GID=100 | ||
|
||
# https://www.openssl.org/source/ | ||
ARG FIPS_VALIDATED_SSL=3.0.8 | ||
|
||
ENV SAGEMAKER_LOGGING_DIR="/var/log/sagemaker/" | ||
ENV STUDIO_LOGGING_DIR="/var/log/studio/" | ||
ENV EDITOR="nano" | ||
|
||
USER root | ||
RUN usermod "--login=${NB_USER}" "--home=/home/${NB_USER}" --move-home "-u ${NB_UID}" "${MAMBA_USER}" && \ | ||
groupmod "--new-name=${NB_USER}" --non-unique "-g ${NB_GID}" "${MAMBA_USER}" && \ | ||
# Update the expected value of MAMBA_USER for the | ||
# _entrypoint.sh consistency check. | ||
echo "${NB_USER}" > "/etc/arg_mamba_user" && \ | ||
: | ||
ENV MAMBA_USER=$NB_USER | ||
ENV USER=$NB_USER | ||
|
||
RUN apt-get update && apt-get upgrade -y && \ | ||
apt-get install -y --no-install-recommends sudo gettext-base wget curl unzip git rsync build-essential openssh-client nano cron less mandoc && \ | ||
# We just install tzdata below but leave default time zone as UTC. This helps packages like Pandas to function correctly. | ||
DEBIAN_FRONTEND=noninteractive apt-get install -y --no-install-recommends tzdata krb5-user libkrb5-dev libsasl2-dev libsasl2-modules && \ | ||
chmod g+w /etc/passwd && \ | ||
echo "ALL ALL=(ALL) NOPASSWD: ALL" >> /etc/sudoers && \ | ||
touch /etc/krb5.conf.lock && chown ${NB_USER}:${MAMBA_USER} /etc/krb5.conf* && \ | ||
# Note that we do NOT run `rm -rf /var/lib/apt/lists/*` here. If we did, anyone building on top of our images will | ||
# not be able to run any `apt-get install` commands and that would hamper customizability of the images. | ||
curl "https://awscli.amazonaws.com/awscli-exe-linux-x86_64.zip" -o "awscliv2.zip" && \ | ||
unzip awscliv2.zip && \ | ||
sudo ./aws/install && \ | ||
rm -rf aws awscliv2.zip && \ | ||
: | ||
RUN echo "source /usr/local/bin/_activate_current_env.sh" | tee --append /etc/profile | ||
|
||
USER $MAMBA_USER | ||
COPY --chown=$MAMBA_USER:$MAMBA_USER $ENV_IN_FILENAME *.in /tmp/ | ||
|
||
# Make sure that $ENV_IN_FILENAME has a newline at the end before the `tee` command runs. Otherwise, nasty things | ||
# will happen. | ||
RUN if [[ -z $ARG_BASED_ENV_IN_FILENAME ]] ; \ | ||
then echo 'No ARG_BASED_ENV_IN_FILENAME passed' ; \ | ||
else envsubst < /tmp/$ARG_BASED_ENV_IN_FILENAME | tee --append /tmp/$ENV_IN_FILENAME ; \ | ||
fi | ||
|
||
ARG CONDA_OVERRIDE_CUDA=$CUDA_MAJOR_MINOR_VERSION | ||
RUN micromamba install -y --name base --file /tmp/$ENV_IN_FILENAME && \ | ||
micromamba clean --all --yes --force-pkgs-dirs && \ | ||
rm -rf /tmp/*.in | ||
|
||
|
||
ARG MAMBA_DOCKERFILE_ACTIVATE=1 | ||
# Enforce dependencies are all installed from conda-forge | ||
RUN sudo ln -s $(which python3) /usr/bin/python && \ | ||
conda config --remove channels defaults && \ | ||
micromamba config append channels conda-forge --env && \ | ||
micromamba config set channel_priority strict | ||
|
||
|
||
# Install glue kernels, and move to shared directory | ||
# Also patching base kernel so Studio background code doesn't start session silently | ||
RUN install-glue-kernels && \ | ||
SITE_PACKAGES=$(pip show aws-glue-sessions | grep Location | awk '{print $2}') && \ | ||
jupyter-kernelspec install $SITE_PACKAGES/aws_glue_interactive_sessions_kernel/glue_pyspark --user && \ | ||
jupyter-kernelspec install $SITE_PACKAGES/aws_glue_interactive_sessions_kernel/glue_spark --user && \ | ||
mv /home/sagemaker-user/.local/share/jupyter/kernels/glue_pyspark /opt/conda/share/jupyter/kernels && \ | ||
mv /home/sagemaker-user/.local/share/jupyter/kernels/glue_spark /opt/conda/share/jupyter/kernels && \ | ||
sed -i '/if not store_history and (/i\ if "sm_analytics_runtime_check" in code:\n return await self._complete_cell()\n' \ | ||
"$SITE_PACKAGES/aws_glue_interactive_sessions_kernel/glue_kernel_base/BaseKernel.py" | ||
|
||
|
||
# Patch glue kernels to use kernel wrapper | ||
COPY patch_glue_pyspark.json /opt/conda/share/jupyter/kernels/glue_pyspark/kernel.json | ||
COPY patch_glue_spark.json /opt/conda/share/jupyter/kernels/glue_spark/kernel.json | ||
|
||
USER root | ||
RUN HOME_DIR="/home/${NB_USER}/licenses" \ | ||
&& mkdir -p ${HOME_DIR} \ | ||
&& curl -o ${HOME_DIR}/oss_compliance.zip https://aws-dlinfra-utilities.s3.amazonaws.com/oss_compliance.zip \ | ||
&& unzip ${HOME_DIR}/oss_compliance.zip -d ${HOME_DIR}/ \ | ||
&& cp ${HOME_DIR}/oss_compliance/test/testOSSCompliance /usr/local/bin/testOSSCompliance \ | ||
&& chmod +x /usr/local/bin/testOSSCompliance \ | ||
&& chmod +x ${HOME_DIR}/oss_compliance/generate_oss_compliance.sh \ | ||
&& ${HOME_DIR}/oss_compliance/generate_oss_compliance.sh ${HOME_DIR} python \ | ||
&& rm -rf ${HOME_DIR}/oss_compliance* | ||
|
||
|
||
# Create logging directories for Studio Analytics extension | ||
RUN mkdir -p $SAGEMAKER_LOGGING_DIR && \ | ||
chmod a+rw $SAGEMAKER_LOGGING_DIR && \ | ||
mkdir -p ${STUDIO_LOGGING_DIR} && \ | ||
chown ${NB_USER}:${MAMBA_USER} ${STUDIO_LOGGING_DIR} | ||
|
||
|
||
USER $MAMBA_USER | ||
ENV PATH="/opt/conda/bin:/opt/conda/condabin:$PATH" | ||
WORKDIR "/home/${NB_USER}" | ||
|
||
# Install FIPS Provider for OpenSSL, on top of existing OpenSSL installation | ||
# v3.0.8 is latest FIPS validated provider, so this is the one we install | ||
# But we need to run tests against the installed version. | ||
# see https://github.com/openssl/openssl/blob/master/README-FIPS.md https://www.openssl.org/source/ | ||
RUN INSTALLED_SSL=$(micromamba list | grep openssl | tr -s ' ' | cut -d ' ' -f 3 | head -n 1) && \ | ||
# download source code for installed, and FIPS validated openssl versions | ||
curl -L https://www.openssl.org/source/openssl-$FIPS_VALIDATED_SSL.tar.gz > openssl-$FIPS_VALIDATED_SSL.tar.gz && \ | ||
curl -L https://www.openssl.org/source/openssl-$INSTALLED_SSL.tar.gz > openssl-$INSTALLED_SSL.tar.gz && \ | ||
tar -xf openssl-$FIPS_VALIDATED_SSL.tar.gz && tar -xf openssl-$INSTALLED_SSL.tar.gz && cd openssl-$FIPS_VALIDATED_SSL && \ | ||
# Configure both versions to enable FIPS and build | ||
./Configure enable-fips --prefix=/opt/conda --openssldir=/opt/conda/ssl && make && \ | ||
cd ../openssl-$INSTALLED_SSL && \ | ||
./Configure enable-fips --prefix=/opt/conda --openssldir=/opt/conda/ssl && make && \ | ||
# Copy validated provider to installed version for testing | ||
cp ../openssl-$FIPS_VALIDATED_SSL/providers/fips.so providers/. && \ | ||
cp ../openssl-$FIPS_VALIDATED_SSL/providers/fipsmodule.cnf providers/. && \ | ||
make tests && cd ../openssl-$FIPS_VALIDATED_SSL && \ | ||
# After tests pass, install FIPS provider and remove source code | ||
make install_fips && cd .. && rm -rf ./openssl-* | ||
# Create new config file with fips-enabled. Then user can override OPENSSL_CONF to enable FIPS | ||
# e.g. export OPENSSL_CONF=/opt/conda/ssl/openssl-fips.cnf | ||
RUN cp /opt/conda/ssl/openssl.cnf /opt/conda/ssl/openssl-fips.cnf && \ | ||
sed -i "s:# .include fipsmodule.cnf:.include /opt/conda/ssl/fipsmodule.cnf:" /opt/conda/ssl/openssl-fips.cnf && \ | ||
sed -i 's:# fips = fips_sect:fips = fips_sect:' /opt/conda/ssl/openssl-fips.cnf | ||
ENV OPENSSL_MODULES=/opt/conda/lib64/ossl-modules/ | ||
|
||
# Install Kerberos. | ||
# Make sure no dependency is added/updated | ||
RUN pip install "krb5>=0.5.1,<0.6" && \ | ||
pip show krb5 | grep Require | xargs -i sh -c '[ $(echo {} | cut -d: -f2 | wc -w) -eq 0 ] ' | ||
|
||
# https://stackoverflow.com/questions/122327 | ||
RUN SYSTEM_PYTHON_PATH=$(python3 -c "from __future__ import print_function;import sysconfig; print(sysconfig.get_paths().get('purelib'))") && \ | ||
# Remove SparkRKernel as it's not supported \ | ||
jupyter-kernelspec remove -f -y sparkrkernel && \ | ||
# Patch Sparkmagic lib to support Custom Certificates \ | ||
# https://github.com/jupyter-incubator/sparkmagic/pull/435/files \ | ||
cp -a ${SYSTEM_PYTHON_PATH}/sagemaker_studio_analytics_extension/patches/configuration.py ${SYSTEM_PYTHON_PATH}/sparkmagic/utils/ && \ | ||
cp -a ${SYSTEM_PYTHON_PATH}/sagemaker_studio_analytics_extension/patches/reliablehttpclient.py ${SYSTEM_PYTHON_PATH}/sparkmagic/livyclientlib/reliablehttpclient.py && \ | ||
sed -i 's= "python"= "/opt/conda/bin/python"=g' /opt/conda/share/jupyter/kernels/pysparkkernel/kernel.json /opt/conda/share/jupyter/kernels/sparkkernel/kernel.json && \ | ||
sed -i 's="Spark"="SparkMagic Spark"=g' /opt/conda/share/jupyter/kernels/sparkkernel/kernel.json && \ | ||
sed -i 's="PySpark"="SparkMagic PySpark"=g' /opt/conda/share/jupyter/kernels/pysparkkernel/kernel.json | ||
|
||
ENV SHELL=/bin/bash |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,33 @@ | ||
# Release notes: 0.13.0 | ||
Upgrade Python from 3.8 to 3.11 | ||
|
||
Package | gpu| cpu | ||
---|---|--- | ||
python|3.11.9|3.11.9 | ||
ipython|8.26.0|8.26.0 | ||
jinja2|3.1.4|3.1.4 | ||
ipywidgets|7.8.3|7.8.3 | ||
numpy|1.26.4|1.26.4 | ||
pandas|2.2.2|2.2.2 | ||
boto3|1.34.151|1.34.151 | ||
aws-glue-sessions|1.0.6|1.0.6 | ||
conda|23.11.0|23.11.0 | ||
jupyterlab|3.6.7|3.6.7 | ||
keras|2.14.0|2.15.0 | ||
matplotlib|3.9.1|3.9.1 | ||
pip|23.3.2|23.3.2 | ||
scipy|1.14.0|1.14.0 | ||
scikit-learn|1.5.1|1.5.1 | ||
py-xgboost-gpu|1.7.6| | ||
thrift_sasl|0.4.3|0.4.3 | ||
pyhive|0.7.0|0.7.0 | ||
python-gssapi|1.8.3|1.8.3 | ||
pytorch-gpu|2.0.0| | ||
sagemaker-headless-execution-driver|0.0.13|0.0.13 | ||
sagemaker-kernel-wrapper|0.0.2|0.0.2 | ||
sagemaker-python-sdk|2.227.0|2.227.0 | ||
sagemaker-studio-analytics-extension|0.1.2|0.1.2 | ||
tensorflow|2.14.0|2.15.0 | ||
torchvision|0.15.2|0.16.1 | ||
py-xgboost-cpu| |1.7.6 | ||
pytorch| |2.1.2 |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,27 @@ | ||
# This file is auto-generated. | ||
conda-forge::pytorch[version='>=2.0.0,<3.0.0'] | ||
conda-forge::tensorflow[version='>=2.13.1,<3.0.0'] | ||
conda-forge::python[version='>=3.11.0,<3.12.0'] | ||
conda-forge::pip[version='>=23.3.2,<24.0.0'] | ||
conda-forge::torchvision[version='>=0.15.2,<1.0.0'] | ||
conda-forge::numpy[version='>=1.24.4,<2.0.0'] | ||
conda-forge::pandas[version='>=2.0.3,<3.0.0'] | ||
conda-forge::scikit-learn[version='>=1.3.2,<2.0.0'] | ||
conda-forge::jinja2[version='>=3.1.3,<4.0.0'] | ||
conda-forge::matplotlib[version='>=3.7.3,<4.0.0'] | ||
conda-forge::sagemaker-headless-execution-driver[version='>=0.0.12,<1.0.0'] | ||
conda-forge::ipython[version='>=8.12.2,<9.0.0'] | ||
conda-forge::scipy[version='>=1.10.1,<2.0.0'] | ||
conda-forge::keras[version='>=2.13.1,<3.0.0'] | ||
conda-forge::py-xgboost-cpu[version='>=1.7.6,<2.0.0'] | ||
conda-forge::jupyterlab[version='>=3.6.7,<4.0.0'] | ||
conda-forge::ipywidgets[version='>=7.8.0,<8.0.0'] | ||
conda-forge::conda[version='>=23.11.0,<24.0.0'] | ||
conda-forge::boto3[version='>=1.34.36,<2.0.0'] | ||
conda-forge::sagemaker-python-sdk[version='>=2.206.0,<3.0.0'] | ||
conda-forge::sagemaker-studio-analytics-extension[version='>=0.0.21,<1.0.0'] | ||
conda-forge::aws-glue-sessions[version='>=1.0.4,<2.0.0'] | ||
conda-forge::sagemaker-kernel-wrapper[version='>=0.0.2,<1.0.0'] | ||
conda-forge::thrift_sasl[version='>=0.4.3,<1.0.0'] | ||
conda-forge::pyhive[version='>=0.7.0,<1.0.0'] | ||
conda-forge::python-gssapi[version='>=1.8.3,<2.0.0'] |
Oops, something went wrong.